def parse(self, response):
    """Yield one ``Images360Item`` for every entry in the response's ``list``.

    The response body is decoded as JSON. For each entry, the ``imageid``,
    ``qhimg_url`` and ``group_title`` values are copied into the item's
    ``id``, ``url`` and ``title`` fields. Entries are read with ``.get``, so
    a key missing from an entry is stored as ``None``.
    """
    result = json.loads(response.body)
    for image in result.get('list'):
        # Build a fresh item per entry. Reusing a single instance would make
        # every yielded item alias the same object, so a later iteration
        # would overwrite the fields of items already handed to the consumer.
        item = Images360Item()
        item['id'] = image.get('imageid')
        item['url'] = image.get('qhimg_url')
        item['title'] = image.get('group_title')
        yield item
def parse(self, response):
    """Yield an ``Images360Item`` for each entry of the JSON ``list`` field.

    ``response.text`` is parsed as JSON. Each entry's ``id``, ``qhimg_url``,
    ``title`` and ``qhimg_thumb`` values populate the item's ``id``, ``url``,
    ``title`` and ``thumb`` fields (read with ``.get``, so a missing key is
    stored as ``None``).
    """
    payload = json.loads(response.text)
    for entry in payload.get('list'):
        record = Images360Item()
        record['id'] = entry.get('id')
        record['url'] = entry.get('qhimg_url')
        record['title'] = entry.get('title')
        record['thumb'] = entry.get('qhimg_thumb')
        yield record
def parse(self, response):
    """Turn each entry of the JSON ``list`` field into an ``Images360Item``.

    Item fields are filled in the order ``url``, ``id``, ``title``,
    ``thumb`` from the entry keys ``qhimg_url``, ``imageid``,
    ``group_title`` and ``qhimg_thumb_url``. Keys are read with ``.get``,
    so a missing key is stored as ``None``.
    """
    # (item field, key in the JSON entry), in assignment order.
    field_sources = (
        ('url', 'qhimg_url'),
        ('id', 'imageid'),
        ('title', 'group_title'),
        ('thumb', 'qhimg_thumb_url'),
    )
    entries = json.loads(response.text).get('list')
    for entry in entries:
        record = Images360Item()
        for field, source_key in field_sources:
            record[field] = entry.get(source_key)
        yield record
def parse(self, response):
    """Yield one ``Images360Item`` per entry of the JSON ``list`` field.

    ``response.text`` is parsed as JSON and its ``list`` key is read with a
    subscript, so a payload without that key raises ``KeyError``. Each
    entry's ``imageid``, ``qhimg_thumb_url``, ``qhimg_url`` and
    ``group_title`` values are stored in the item's ``id``, ``thumb``,
    ``url`` and ``title`` fields; a key missing from an entry is stored as
    ``None``.
    """
    data = json.loads(response.text)
    for image in data['list']:
        # Create the item inside the loop. A single shared instance would be
        # mutated on every iteration, so all yielded items would end up
        # referring to the same object holding only the last entry's data.
        item = Images360Item()
        item['id'] = image.get('imageid')
        item['thumb'] = image.get('qhimg_thumb_url')
        item['url'] = image.get('qhimg_url')
        item['title'] = image.get('group_title')
        yield item
def parse(self, response):
    """Yield an ``Images360Item`` for every entry under the ``list`` key.

    All lookups use subscripts, so a payload without ``list`` or an entry
    without ``imageid``, ``qhimg_url``, ``group_title`` or
    ``qhimg_thumb_url`` raises ``KeyError``.
    """
    # (item field, key in the JSON entry), in assignment order.
    field_sources = (
        ('id', 'imageid'),
        ('url', 'qhimg_url'),
        ('title', 'group_title'),
        ('thumb', 'qhimg_thumb_url'),
    )
    payload = json.loads(response.text)
    for entry in payload['list']:
        record = Images360Item()
        for field, source_key in field_sources:
            record[field] = entry[source_key]
        yield record
def parse(self, response):
    """Yield one ``Images360Item`` per entry of the JSON ``list`` field.

    Each entry's ``id``, ``qhimg_url``, ``title`` and ``qhimg_thumb`` values
    are copied into the item's ``id``, ``url``, ``title`` and ``thumb``
    fields. Keys are read with ``.get``, so a missing key is stored as
    ``None``.
    """
    payload = json.loads(response.text)
    entries = payload.get('list')
    # The loop variable is named ``entry`` so it does not shadow the
    # builtin ``list``.
    for entry in entries:
        item = Images360Item()
        item['id'] = entry.get('id')
        item['url'] = entry.get('qhimg_url')
        item['title'] = entry.get('title')
        item['thumb'] = entry.get('qhimg_thumb')
        yield item
def parse(self, response):
    """Parse the JSON response and yield one ``Images360Item`` per image.

    The JSON text is decoded, its ``list`` field is iterated, and each
    image entry is copied into a new item: ``imageid`` -> ``id``,
    ``qhimg_url`` -> ``url``, ``group_title`` -> ``title`` and
    ``qhimg_thumb_url`` -> ``thumb``. Keys are read with ``.get``, so a
    missing key is stored as ``None``.
    """
    # Decode the JSON string into Python objects.
    decoded = json.loads(response.text)
    image_entries = decoded.get('list')
    for image_entry in image_entries:
        image_item = Images360Item()
        image_item['id'] = image_entry.get('imageid')
        image_item['url'] = image_entry.get('qhimg_url')
        image_item['title'] = image_entry.get('group_title')
        image_item['thumb'] = image_entry.get('qhimg_thumb_url')
        yield image_item
def parse(self, response):
    """Yield an ``Images360Item`` for each truthy entry of the ``list`` field.

    Falsy entries (for example ``None`` or an empty mapping) are skipped.
    For the others, the ``group_title``, ``tag`` and ``qhimg_url`` values
    are stored in item fields of the same names; a missing key is stored as
    ``None``.
    """
    payload = json.loads(response.text)
    for entry in payload.get('list'):
        if not entry:
            continue
        record = Images360Item()
        # Item field names match the JSON keys, so one name serves both sides.
        for key in ('group_title', 'tag', 'qhimg_url'):
            record[key] = entry.get(key)
        yield record
def parse_item(self, response):
    """Yield one ``Images360Item`` per entry of the JSON ``list`` field.

    ``response.text`` is parsed as JSON and a separator line is printed to
    stdout. Each entry's ``imageid``, ``qhimg_url``, ``group_title`` and
    ``qhimg_thumb_url`` values are then stored in the item's ``id``,
    ``url``, ``title`` and ``thumb`` fields. Keys are read with ``.get``,
    so a missing key is stored as ``None``.
    """
    result = json.loads(response.text)
    print('====================================================')
    for image in result.get('list'):
        # Instantiate the item per entry. Yielding one shared instance that
        # is mutated on each pass would leave every consumer holding the
        # same object, with earlier entries overwritten by later ones.
        item = Images360Item()
        item['id'] = image.get('imageid')
        item['url'] = image.get('qhimg_url')
        item['title'] = image.get('group_title')
        item['thumb'] = image.get('qhimg_thumb_url')
        yield item
def parse(self, response):
    """Yield an ``Images360Item`` per entry when ``list`` is a Python list.

    A separator line is printed to stdout first. The ``list`` key is read
    with a subscript, so a payload without it raises ``KeyError``. If the
    value is not a ``list`` instance, nothing is yielded. Otherwise each
    entry's ``imageid``, ``qhimg_url``, ``group_title`` and
    ``qhimg_thumb_url`` values fill the item's ``id``, ``url``, ``title``
    and ``thumb`` fields; a missing key is stored as ``None``.
    """
    payload = json.loads(response.text)
    print("---------------")
    entries = payload['list']
    if not isinstance(entries, list):
        return
    for entry in entries:
        record = Images360Item()
        record['id'] = entry.get('imageid')
        record['url'] = entry.get('qhimg_url')
        record['title'] = entry.get('group_title')
        record['thumb'] = entry.get('qhimg_thumb_url')
        yield record
def parse(self, response):
    """Yield one ``Images360Item`` for every element under the ``list`` key.

    The response text is JSON and is decoded with ``loads``. All lookups
    use subscripts, so a missing ``list`` key or a missing element key
    raises ``KeyError``. Note that the item's ``url`` field is filled from
    the element's ``qhimg_thumb_url`` value.
    """
    # (item field, key in the JSON element), in assignment order.
    field_sources = (
        ("id", "imageid"),
        ("title", "group_title"),
        ("tags", "tag"),
        ("height", "cover_height"),
        ("width", "cover_width"),
        ("url", "qhimg_thumb_url"),
    )
    # The text is read from ``response.text``; an original note says this
    # response has no ``content`` attribute.
    decoded = loads(response.text)
    for entry in decoded["list"]:
        record = Images360Item()
        for field, source_key in field_sources:
            record[field] = entry[source_key]
        yield record
def parse(self, response):
    """Yield an ``Images360Item`` per entry, reporting progress on stdout.

    When the JSON payload has no ``list`` value, or a falsy one, a
    "not found" message with the response URL is printed and nothing is
    yielded. Otherwise a "crawling" message is printed and each entry's
    ``imageid``, ``qhimg_url``, ``group_title`` and ``qhimg_thumb_url``
    values fill the item's ``id``, ``url``, ``title`` and ``thumb`` fields.
    ``img_paths`` is also set from ``group_title``. A key missing from an
    entry is stored as ``None``.
    """
    payload = json.loads(response.text)
    entries = payload.get('list')
    if not entries:
        print('找不到节点。。。', response.url)
        return

    print('正在爬取', response.url)
    for entry in entries:
        record = Images360Item()
        record['id'] = entry.get('imageid')
        record['url'] = entry.get('qhimg_url')
        record['title'] = entry.get('group_title')
        record['thumb'] = entry.get('qhimg_thumb_url')
        record['img_paths'] = entry.get('group_title')
        yield record