Python ProductLinkGetter示例

编程语言: Python

命名空间/包名称: DeliverySpiderProject.ProductLinkGetter

hotexamples.com的示例: 6

Python ProductLinkGetter - 已找到 6 个示例。以下是从开源项目中提取的、评分最高的 DeliverySpiderProject.ProductLinkGetter.ProductLinkGetter 真实 Python 示例。您可以为示例评分，以帮助我们提高示例质量。

常用方法

显示/隐藏

ProductLinkGetter(4)

getLink(2)

示例#1

显示文件

class RestaurantSpider(CrawlSpider):
    """Spider for domiciliosbogota.com that builds one Restaurant per listing page.

    The root page is handled by ``parseMain``, which requests every link
    matching the ``/domicilios-...`` pattern; each of those responses is turned
    into a ``Restaurant`` by ``parseRestaurants``.

    NOTE(review): CrawlSpider, Rule, LinkExtractor and Request are presumably
    the Scrapy classes of the same names -- the imports are not visible here.
    """

    name = "RestaurantSpider"
    allowed_domains = ["domiciliosbogota.com"]
    start_urls = ("http://www.domiciliosbogota.com/",)
    # Not referenced by any method of this class.
    productLinkGetter = ProductLinkGetter()
    # The pattern only matches the site root; 'parseMain' is handed to Rule as
    # its second positional argument.
    rules = [
        Rule(
            LinkExtractor(allow=r"http://www\.domiciliosbogota\.com/$"),
            'parseMain',
        ),
    ]

    def parseMain(self, response):
        """Yield a Request for every restaurant link extracted from ``response``.

        A ``RestaurantIDsGetter`` built from this response is stored on the
        spider first, because ``parseRestaurants`` reads it to resolve IDs.
        """
        self.restaurantIDsGetter = RestaurantIDsGetter(response)
        restaurantLinks = LinkExtractor(
            allow=r"http\:\/\/www\.domiciliosbogota\.com\/domicilios\-.*"
        ).extract_links(response)
        for restaurantLink in restaurantLinks:
            yield Request(restaurantLink.url, callback=self.parseRestaurants)

    def parseRestaurants(self, response):
        """Return a ``Restaurant`` filled from ``response``.

        Most fields come from a ``RestaurantSelector`` wrapping the response;
        the ID is looked up through ``self.restaurantIDsGetter`` (set by
        ``parseMain``) using the last path segment of the URL prefixed by "/".
        """
        selector = RestaurantSelector(response)
        item = Restaurant()
        item["url"] = response.url
        item["name"] = selector.getName()
        # The ID getter is keyed by "/<last URL segment>".
        idKey = "/" + response.url.split("/")[-1]
        item["id"] = self.restaurantIDsGetter.getID(idKey)
        item["deliveryTimeInMinutes"] = selector.getDeliveryTimeInMinutes()
        item["minOrderPrice"] = selector.getMinOrderPrice()
        item["deliveryCost"] = selector.getDeliveryCost()
        item["payMethods"] = selector.getPayMethods()
        item["menu"] = selector.getMenuCategories()
        item["tagCategories"] = selector.getTagCategories()
        item["averagePunctuation"] = selector.getAveragePunctuation()
        item["quantityOfComments"] = selector.getQuantityOfComments()
        return item

示例#2

显示文件

class ProductSpider(CrawlSpider):
    """Spider for domiciliosbogota.com that wraps JSON product responses in Product items.

    NOTE(review): CrawlSpider, Rule and LinkExtractor are presumably the Scrapy
    classes of the same names -- the imports are not visible here.
    """

    name = "Product"
    allowed_domains = ["domiciliosbogota.com"]
    start_urls = ["http://www.domiciliosbogota.com/"]
    productLinkGetter = ProductLinkGetter()
    rules = (
        # First rule: follow links, with no callback attached.
        Rule(LinkExtractor(allow=()), follow=True),
        # Second rule: take the "id" attribute of <li> tags, pass each value
        # through productLinkGetter.getLink, and send the resulting pages to
        # parseProduct.
        Rule(
            LinkExtractor(
                allow=(),
                canonicalize=False,
                tags="li",
                attrs=("id",),
                process_value=productLinkGetter.getLink,
            ),
            callback="parseProduct",
            follow=True,
        ),
    )

    def parseProduct(self, response):
        """Return a ``Product`` whose "product" field is the JSON-decoded response body."""
        item = Product()
        item["product"] = json.loads(response.body)
        return item

示例#3

显示文件

文件： ProductLinkGetterTest.py 项目： divisiondeariza/Deliveries

 def testReturnNoneWhenLinkIsNotNumeric(self):
     """getLink should give None for a URL ending in the non-numeric "cat-12345"."""
     nonNumericUrl = "http://www.domiciliosbogota.com/cat-12345"
     link = ProductLinkGetter().getLink(nonNumericUrl)
     self.assertEqual(None, link)

示例#4

显示文件

文件： ProductLinkGetterTest.py 项目： divisiondeariza/Deliveries

 def testGetUUrlFromProductID(self):
     """getLink should map a URL ending in "12345" to the matching product URL."""
     productIdUrl = "http://www.domiciliosbogota.com/12345"
     link = ProductLinkGetter().getLink(productIdUrl)
     self.assertEqual(
         "http://www.domiciliosbogota.com/establecimientos/producto/12345",
         link,
     )

示例#5

显示文件

文件： ProductLinkGetterTest.py 项目： divisiondeariza/Deliveries

 def testReturnNoneWhenLinkIsNotNumeric(self):
     """Check that getLink yields None when the URL's last segment is "cat-12345"."""
     candidateUrl = "http://www.domiciliosbogota.com/cat-12345"
     getter = ProductLinkGetter()
     actualLink = getter.getLink(candidateUrl)
     self.assertEqual(None, actualLink)

示例#6

显示文件

文件： ProductLinkGetterTest.py 项目： divisiondeariza/Deliveries

 def testGetUUrlFromProductID(self):
     """Check that getLink turns ".../12345" into the ".../establecimientos/producto/12345" URL."""
     sourceUrl = "http://www.domiciliosbogota.com/12345"
     wantedLink = "http://www.domiciliosbogota.com/establecimientos/producto/12345"
     getter = ProductLinkGetter()
     actualLink = getter.getLink(sourceUrl)
     self.assertEqual(wantedLink, actualLink)