Beispiel #1
0
 def parse_search_results(self):
     """Yield an ``Ad`` for every offer found in ``self.body``.

     Every ``div`` under ``self.body`` whose ``class`` contains
     ``offer_list_item`` is treated as one offer. An offer without a link
     whose ``href`` contains the offer's ``data-id`` is skipped.

     Yields:
         Ad: constructed from the offer id and ``self.url`` + the link's
         ``href``; both ``created`` and ``last_update`` are set to the
         value returned by ``__get_last_update`` for the "Online:" text.

     Raises:
         KeyError: if an offer element has no ``data-id`` attribute.
         IndexError: if an offer has no ``span`` whose text contains
             "Online:".
         AssertionError: if ``__get_last_update`` returns ``None`` for
             the "Online:" text.
     """
     offers = self.body.xpath(
         ".//div[contains(@class, 'offer_list_item')]")
     for item in offers:
         item_id = item.attrib["data-id"]
         # Pass the id as an XPath variable instead of splicing it into
         # the expression, so ids containing quotes cannot break the query.
         links = item.xpath(
             ".//a[contains(@href, $item_id)]", item_id=item_id)
         if not links:
             continue
         item_url = self.url + links[0].attrib["href"]
         item_online = item.xpath(
             ".//span[contains(text(), 'Online:')]")[0].text
         last_update = self.__get_last_update(item_online)
         if last_update is None:
             # Raised explicitly (rather than via ``assert``) so the check
             # is still enforced when Python runs with -O; the exception
             # type and message are unchanged for callers.
             raise AssertionError(
                 "Cant parse timestamp '%s'" % item_online)
         ad = Ad(item_id, item_url)
         # Here we suppose that this ad was just created
         ad.created = last_update
         ad.last_update = last_update
         yield ad