Пример #1
0
 def parse_hotel(
     self, response: scrapy.http.response.html.HtmlResponse, name, text_eng, text_hr
 ):
     """Collect a hotel description in two passes and pair the results.

     First pass (``text_hr is None``): the description text is read from
     ``response`` and a follow-up request is returned for the same URL with
     ``esky.hr/hoteli`` rewritten to ``esky.com/hotels``. That request calls
     this method again, carrying the extracted text as ``text_hr``.

     Second pass (``text_hr`` set): the description text is read from
     ``response`` as the English text and compared with ``text_hr``.

     Args:
         response: Page whose ``<dd class="hotel-description">`` text is read.
         name: Hotel name, passed through unchanged to the resulting item.
         text_eng: Ignored on input; the English text is always taken from
             ``response``. Kept so existing ``cb_kwargs`` callers still work.
         text_hr: ``None`` on the first pass, otherwise the text extracted
             during the first pass.

     Returns:
         A ``scrapy.Request`` on the first pass; on the second pass a dict
         with ``name``, ``text_eng`` and ``text_hr`` (both texts stripped),
         or ``None`` when the two unstripped texts are identical.
     """
     # Both passes read the same node, so extract once up front.
     description = "".join(
         response.xpath("//dd[@class='hotel-description']//text()").extract()
     )

     if text_hr is None:
         # Use the public ``url`` attribute rather than the private getter.
         english_url = response.url.replace("esky.hr/hoteli", "esky.com/hotels")
         return scrapy.Request(
             english_url,
             callback=self.parse_hotel,
             cb_kwargs={"name": name, "text_eng": None, "text_hr": description},
         )

     # Identical texts on both pages carry no translation pair; drop them.
     if text_hr == description:
         return None

     return {
         "name": name,
         "text_eng": description.strip(),
         "text_hr": text_hr.strip(),
     }
Пример #2
0
 def parse(self, response: scrapy.http.response.html.HtmlResponse):
     """Read the hotel description and request the matching English page.

     The text under ``<dd class="hotel-description">`` is joined into one
     string. If nothing was extracted the page is skipped. Otherwise a
     request is returned for the same URL with ``esky.hr/hoteli`` rewritten
     to ``esky.com/hotels``; it is handled by ``self.parse_eng``, which
     receives the extracted text as ``text_hr``.

     Args:
         response: Page to read the description from.

     Returns:
         A ``scrapy.Request`` for the rewritten URL, or ``None`` when the
         extracted description is empty.
     """
     text_hr = "".join(
         response.xpath("//dd[@class='hotel-description']//text()").extract()
     )
     if not text_hr:
         # No description on this page, so there is nothing to pair up.
         return None

     # Use the public ``url`` attribute rather than the private getter.
     new_link = response.url.replace("esky.hr/hoteli", "esky.com/hotels")
     return scrapy.Request(
         new_link,
         callback=self.parse_eng,
         cb_kwargs={"text_hr": text_hr},
     )