示例#1
0
    def residential(self, response):
        """Parse a residential listing page into a flat result dict.

        Reads "key: value" rows from the left and right review lists, the
        first row of the last review list, the description block, the first
        whitespace-separated token containing "@" (used as the e-mail) and
        the photo list.

        NOTE(review): ``d`` and ``d2`` are not defined in this method; they
        are presumably dicts shared at module or class level. They are still
        written to here so that any other reader keeps working, but entries
        from earlier pages may survive into this one -- confirm and consider
        making them local.

        Args:
            response: object exposing ``doc`` (a PyQuery-style selector
                callable) and ``url``.

        Returns:
            dict keyed by the output field names; fields that are missing on
            the page are ``None``.
        """
        for item in response.doc('ul.review_left > li ').items():
            # partition() keeps everything after the first colon, so values
            # that themselves contain ":" are not truncated.
            key, sep, value = item('li').text().partition(':')
            if sep:  # rows without a colon carry no key/value pair
                d[key] = value

        for item in response.doc('ul.review_right:first > li').items():
            key, sep, value = item('li').text().partition(':')
            if sep:
                d2[key] = value

        # Stays None when the selector matches nothing, instead of leaving
        # the name unbound.
        detali = None
        for item in response.doc('ul.review_right:last').items():
            detali = item('li:first').text().split(":")[0]

        email = None
        contact_text = response.doc('div.rl_field_left > div:last').text()
        for token in contact_text.split(" "):
            if "@" in token:
                email = token
                break

        opisanie = response.doc('div.detail_realty_photo > div.rl_field').text()

        # The scraped key carries a trailing tab; look it up verbatim.
        ploshad = d.get('Площадь\t')
        if ploshad is not None:
            ploshad = str(ploshad).replace('\t', ' ')

        floor = d.get('Этаж')
        if floor is not None:
            floor = floor.replace('\t', ' ')

        return {
            "path_screen": selen.screen_click_ufa1_(response.url),
            "Срок эксплуатации": d2.get('Срок эксплуатации'),
            "Цена": d2.get('Цена'),
            "Детали": detali,
            "Адрес": d.get('Расположение'),
            "Площадь": ploshad,
            "Описание": opisanie,
            "Ориентир": d.get('Ориентир'),
            "Район города": d.get('Район города'),
            "Тип": d.get('Тип'),
            'Серия': d.get('Серия'),
            'Комнаты': d.get('Комнаты'),
            'Этаж': floor,
            'Тип дома': d.get('Тип дома'),
            "E-mail": email,
            "Photo": Handler.url_photo(
                response.doc('div.photos-list-container > div > img').items()
            ),
        }
示例#2
0
    def land(self, response):
        """Parse a land-plot listing page into a flat result dict.

        Reads "key: value" rows from the left review list, the total and
        per-unit price from the first right review list, the first row of
        the last review list, the description block, the first
        whitespace-separated token containing "@" (used as the e-mail) and
        the photo list.

        NOTE(review): ``d`` is not defined in this method; it is presumably
        a dict shared at module or class level. It is still written to here
        so that any other reader keeps working, but entries from earlier
        pages may survive into this one -- confirm and consider making it
        local.

        Args:
            response: object exposing ``doc`` (a PyQuery-style selector
                callable) and ``url``.

        Returns:
            dict keyed by the output field names; fields that are missing on
            the page are ``None``.
        """

        def after_colon(text):
            # Text following the first colon, or None when there is no colon.
            _, sep, rest = text.partition(':')
            return rest if sep else None

        for item in response.doc('ul.review_left > li ').items():
            # partition() keeps everything after the first colon, so values
            # that themselves contain ":" are not truncated.
            key, sep, value = item('li').text().partition(':')
            if sep:  # rows without a colon carry no key/value pair
                d[key] = value

        # Defaults keep the names bound when a selector matches nothing.
        price_all = None
        price = None
        for item in response.doc('ul.review_right:first').items():
            price_all = after_colon(item('li:first').text())
            price = after_colon(item('li:last').text())

        detali = None
        for item in response.doc('ul.review_right:last').items():
            detali = item('li:first').text().split(":")[0]

        # None when no token looks like an address, rather than leaking the
        # whole list of words into the result.
        email = None
        contact_text = response.doc('div.rl_field_left > div:last').text()
        for token in contact_text.split(" "):
            if "@" in token:
                email = token
                break

        opisanie = response.doc('div.detail_realty_photo > div.rl_field').text()

        # The scraped key carries a trailing tab; look it up verbatim.
        ploshad = d.get('Площадь\t')
        if ploshad is not None:
            ploshad = str(ploshad).replace('\t', ' ')

        return {
            "path_screen": selen.screen_click_ufa1_(response.url),
            "Цена общая": price_all,
            "Цена за сотку": price,
            "Детали": detali,
            "Тип": d.get('Тип'),
            "Адрес": d.get('Расположение'),
            "Площадь": ploshad,
            "Описание": opisanie,
            "Форма собственности": d.get('Форма собственности'),
            "Ориентир": d.get('Ориентир'),
            "E-mail": email,
            "Photo": Handler.url_photo(
                response.doc('div.photos-list-container > div > img').items()
            ),
        }
示例#3
0
    def foreign(self, response):
        """Parse a listing page handled by the ``foreign`` callback.

        Reads "key: value" rows from the left review list, the total and
        per-square-metre price from the first right review list, the
        description block, the first whitespace-separated token containing
        "@" (used as the e-mail) and the photo list.

        NOTE(review): ``d`` is not defined in this method; it is presumably
        a dict shared at module or class level. It is still written to here
        so that any other reader keeps working, but entries from earlier
        pages may survive into this one -- confirm and consider making it
        local.

        Args:
            response: object exposing ``doc`` (a PyQuery-style selector
                callable) and ``url``.

        Returns:
            dict keyed by the output field names; fields that are missing on
            the page are ``None``.
        """

        def after_colon(text):
            # Text following the first colon, or None when there is no colon.
            _, sep, rest = text.partition(':')
            return rest if sep else None

        for item in response.doc('ul.review_left > li ').items():
            # partition() keeps everything after the first colon, so values
            # that themselves contain ":" are not truncated.
            key, sep, value = item('li').text().partition(':')
            if sep:  # rows without a colon carry no key/value pair
                d[key] = value

        # Defaults keep the names bound when the selector matches nothing.
        price_all = None
        price = None
        for item in response.doc('ul.review_right:first').items():
            price_all = after_colon(item('li:first').text())
            price = after_colon(item('li:last').text())

        email = None
        contact_text = response.doc('div.rl_field_left > div:last').text()
        for token in contact_text.split(" "):
            if "@" in token:
                email = token
                break

        opisanie = response.doc('div.detail_realty_photo > div.rl_field').text()

        # The scraped key carries a trailing tab; look it up verbatim. A
        # missing area stays None instead of becoming the string 'None'.
        ploshad = d.get('Площадь\t')
        if ploshad is not None:
            ploshad = str(ploshad).replace('\t', ' ')

        return {
            "path_screen": selen.screen_click_ufa1_(response.url),
            "Цена общая": price_all,
            "Цена за кв.м": price,
            "Адрес": d.get('Расположение'),
            "Площадь": ploshad,
            "Описание": opisanie,
            "Район города": d.get('Район города'),
            "Тип помещения": d.get('Тип помещения'),
            "E-mail": email,
            "Photo": Handler.url_photo(
                response.doc('div.photos-list-container > div > img').items()
            ),
        }