def residential(self, response):
    """Parse a residential listing page into a flat result dict.

    Reads the "label: value" list items under ``ul.review_left`` and the
    first ``ul.review_right``, the first item of the last
    ``ul.review_right``, the contact block, the description block and the
    photo list from ``response.doc``.

    Args:
        response: Fetched page; must expose ``doc`` (called with CSS
            selectors) and ``url``.

    Returns:
        dict: Listing fields keyed by their Russian labels, plus
        ``"path_screen"`` (whatever ``selen.screen_click_ufa1_`` returns
        for the page URL), ``"E-mail"`` and ``"Photo"`` (whatever
        ``Handler.url_photo`` returns for the photo ``img`` elements).
        Looked-up fields are ``None`` when their label is not present in
        the backing dict.
    """
    # NOTE(review): ``d`` and ``d2`` are defined outside this method
    # (presumably module-level dicts) and are never cleared here, so labels
    # stored while parsing an earlier page stay visible -- confirm intent.
    for selector, fields in (
        ('ul.review_left > li ', d),
        ('ul.review_right:first > li', d2),
    ):
        for item in response.doc(selector).items():
            parts = item('li').text().split(':')
            if len(parts) < 2:
                # No "label: value" separator; indexing parts[1] would
                # raise IndexError and abort the whole page.
                continue
            fields[parts[0]] = parts[1]

    # Text before the first colon of the first ``li`` in the last
    # right-hand list; stays None when that list is missing instead of
    # leaving the name unbound.
    details = None
    for block in response.doc('ul.review_right:last').items():
        details = block('li:first').text().split(":")[0]

    # First space-separated token containing "@", or None if there is none.
    contact_words = response.doc('div.rl_field_left > div:last').text().split(" ")
    email = next((word for word in contact_words if "@" in word), None)

    description = response.doc('div.detail_realty_photo > div.rl_field').text()

    # Do not wrap the lookup itself in str(): that turned a missing area
    # into the literal string 'None' and made the None check dead.
    area = d.get('Площадь\t')
    if area is not None:
        area = str(area).replace('\t', ' ')
    floor = d.get('Этаж')
    if floor is not None:
        floor = floor.replace('\t', ' ')

    return {
        "path_screen": selen.screen_click_ufa1_(response.url),
        "Срок эксплуатации": d2.get('Срок эксплуатации'),
        "Цена": d2.get('Цена'),
        "Детали": details,
        "Адрес": d.get('Расположение'),
        "Площадь": area,
        "Описание": description,
        "Ориентир": d.get('Ориентир'),
        "Район города": d.get('Район города'),
        "Тип": d.get('Тип'),
        'Серия': d.get('Серия'),
        'Комнаты': d.get('Комнаты'),
        'Этаж': floor,
        'Тип дома': d.get('Тип дома'),
        "E-mail": email,
        "Photo": Handler.url_photo(
            response.doc('div.photos-list-container > div > img').items()
        ),
    }
def land(self, response):
    """Parse a land-plot listing page into a flat result dict.

    Reads the "label: value" list items under ``ul.review_left``, the
    first and last items of the first ``ul.review_right`` (total price and
    per-unit price), the first item of the last ``ul.review_right``, the
    contact block, the description block and the photo list from
    ``response.doc``.

    Args:
        response: Fetched page; must expose ``doc`` (called with CSS
            selectors) and ``url``.

    Returns:
        dict: Listing fields keyed by their Russian labels, plus
        ``"path_screen"`` (whatever ``selen.screen_click_ufa1_`` returns
        for the page URL), ``"E-mail"`` and ``"Photo"`` (whatever
        ``Handler.url_photo`` returns for the photo ``img`` elements).
        Values that cannot be found on the page are ``None``.
    """

    def after_colon(text):
        """Return the segment between the first and second colon, or None."""
        parts = text.split(":")
        return parts[1] if len(parts) > 1 else None

    # NOTE(review): ``d`` is defined outside this method (presumably a
    # module-level dict) and is never cleared here, so labels stored while
    # parsing an earlier page stay visible -- confirm intent.
    for item in response.doc('ul.review_left > li ').items():
        parts = item('li').text().split(':')
        if len(parts) < 2:
            # No "label: value" separator; indexing parts[1] would raise
            # IndexError and abort the whole page.
            continue
        d[parts[0]] = parts[1]

    # Defaults keep the names bound when a selector matches nothing.
    total_price = None
    unit_price = None
    for block in response.doc('ul.review_right:first').items():
        total_price = after_colon(block('li:first').text())
        unit_price = after_colon(block('li:last').text())

    details = None
    for block in response.doc('ul.review_right:last').items():
        details = block('li:first').text().split(":")[0]

    # First space-separated token containing "@". Falls back to None so the
    # field is never the raw list of words, matching the sibling parsers.
    contact_words = response.doc('div.rl_field_left > div:last').text().split(" ")
    email = next((word for word in contact_words if "@" in word), None)

    description = response.doc('div.detail_realty_photo > div.rl_field').text()

    # Do not wrap the lookup itself in str(): that turned a missing area
    # into the literal string 'None' and made the None check dead.
    area = d.get('Площадь\t')
    if area is not None:
        area = str(area).replace('\t', ' ')

    return {
        "path_screen": selen.screen_click_ufa1_(response.url),
        "Цена общая": total_price,
        "Цена за сотку": unit_price,
        "Детали": details,
        "Тип": d.get('Тип'),
        "Адрес": d.get('Расположение'),
        "Площадь": area,
        "Описание": description,
        "Форма собственности": d.get('Форма собственности'),
        "Ориентир": d.get('Ориентир'),
        "E-mail": email,
        "Photo": Handler.url_photo(
            response.doc('div.photos-list-container > div > img').items()
        ),
    }
def foreign(self, response):
    """Parse a foreign-property listing page into a flat result dict.

    Reads the "label: value" list items under ``ul.review_left``, the
    first and last items of the first ``ul.review_right`` (total price and
    per-square-metre price), the contact block, the description block and
    the photo list from ``response.doc``.

    Args:
        response: Fetched page; must expose ``doc`` (called with CSS
            selectors) and ``url``.

    Returns:
        dict: Listing fields keyed by their Russian labels, plus
        ``"path_screen"`` (whatever ``selen.screen_click_ufa1_`` returns
        for the page URL), ``"E-mail"`` and ``"Photo"`` (whatever
        ``Handler.url_photo`` returns for the photo ``img`` elements).
        Values that cannot be found on the page are ``None``.
    """

    def after_colon(text):
        """Return the segment between the first and second colon, or None."""
        parts = text.split(":")
        return parts[1] if len(parts) > 1 else None

    # NOTE(review): ``d`` is defined outside this method (presumably a
    # module-level dict) and is never cleared here, so labels stored while
    # parsing an earlier page stay visible -- confirm intent.
    for item in response.doc('ul.review_left > li ').items():
        parts = item('li').text().split(':')
        if len(parts) < 2:
            # No "label: value" separator; indexing parts[1] would raise
            # IndexError and abort the whole page.
            continue
        d[parts[0]] = parts[1]

    # Defaults keep the names bound when the selector matches nothing.
    total_price = None
    unit_price = None
    for block in response.doc('ul.review_right:first').items():
        total_price = after_colon(block('li:first').text())
        unit_price = after_colon(block('li:last').text())

    # First space-separated token containing "@", or None if there is none.
    contact_words = response.doc('div.rl_field_left > div:last').text().split(" ")
    email = next((word for word in contact_words if "@" in word), None)

    description = response.doc('div.detail_realty_photo > div.rl_field').text()

    # Do not wrap the lookup itself in str(): that turned a missing area
    # into the literal string 'None'.
    area = d.get('Площадь\t')
    if area is not None:
        area = str(area).replace('\t', ' ')

    return {
        "path_screen": selen.screen_click_ufa1_(response.url),
        "Цена общая": total_price,
        "Цена за кв.м": unit_price,
        "Адрес": d.get('Расположение'),
        "Площадь": area,
        "Описание": description,
        "Район города": d.get('Район города'),
        "Тип помещения": d.get('Тип помещения'),
        "E-mail": email,
        "Photo": Handler.url_photo(
            response.doc('div.photos-list-container > div > img').items()
        ),
    }