예제 #1
0
    def test_parse_item_page(self):
        """Check the fields parse_item_page returns for the item-page fixture."""
        fixture = 'responses/craigslist_rentals_item_page.html'
        response = fake_response_from_file(fixture)
        # Seed an empty item in meta before parsing (presumably the spider
        # fills it in -- confirm against parse_item_page).
        response.meta['item'] = {}

        item = self.spider.parse_item_page(response)

        # (field, expected value) pairs, verified in this order.
        expectations = (
            ('latitude', 37.491212),
            ('longitude', -122.230883),
            ('bedrooms', 1),
            ('bathrooms', 1.0),
            ('building_size', 937),
            ('posting_date', u'2016-11-18T17:54:07-0800'),
        )
        for field, expected in expectations:
            self.assertEqual(expected, item[field])
예제 #2
0
    def test_parse_item_page(self):
        """Check the fields parse_item_page returns for the Hayward fixture."""
        fixture = 'responses/craigslist_rentals_hayward_5530420563.html'
        response = fake_response_from_file(fixture)
        # Seed an empty item in meta before parsing (presumably the spider
        # fills it in -- confirm against parse_item_page).
        response.meta['item'] = {}

        item = self.spider.parse_item_page(response)

        # (field, expected value) pairs, verified in this order.
        expectations = (
            ('latitude', 37.649932),
            ('longitude', -122.028772),
            ('bedrooms', 4),
            ('bathrooms', 3.0),
            ('building_size', 2650),
            ('posting_date', u'2016-04-08T20:17:38-0700'),
        )
        for field, expected in expectations:
            self.assertEqual(item[field], expected)
예제 #3
0
 def test_parse_item_page(self):
   """Verify each field parsed out of the saved Hayward item page."""
   page = fake_response_from_file(
       'responses/craigslist_rentals_hayward_5530420563.html')
   # The test starts from an empty item stored in the response meta.
   page.meta['item'] = {}

   parsed = self.spider.parse_item_page(page)

   check = self.assertEqual
   # Location.
   check(parsed['latitude'], 37.649932)
   check(parsed['longitude'], -122.028772)
   # Unit details.
   check(parsed['bedrooms'], 4)
   check(parsed['bathrooms'], 3.0)
   check(parsed['building_size'], 2650)
   # Posting timestamp, compared as the exact string.
   check(parsed['posting_date'], u'2016-04-08T20:17:38-0700')
   
   
예제 #4
0
 def test_parse(self):
   """Check every request from parse carries a populated item; expect 99."""
   listing = fake_response_from_file(
       'responses/craigslist_rentals_hayward.html')

   # Stays 0 when parse yields nothing, so the final count check still runs.
   seen = 0
   for seen, req in enumerate(self.spider.parse(listing), 1):
     scraped = req.meta['item']
     for key in ('craigslist_id', 'title', 'price', 'link'):
       self.assertIsNotNone(scraped[key])
   self.assertEqual(seen, 99)
예제 #5
0
    def test_parse(self):
        """Check each request's meta item has the core fields; expect 99."""
        required = ('craigslist_id', 'title', 'price', 'link')
        page = fake_response_from_file(
            'responses/craigslist_rentals_hayward.html')

        total = 0
        # Iterate the parse result directly rather than materializing it.
        for req in self.spider.parse(page):
            fields = req.meta['item']
            for name in required:
                self.assertIsNotNone(fields[name])
            total += 1
        self.assertEqual(total, 99)
예제 #6
0
    def test_no_bathroom(self):
        """Check the multi-family fixture yields one item with no 'bathrooms'."""
        page = fake_response_from_file(
            'responses/realtor_multi_family.html')
        listings = list(self.spider.parse(page))

        first = listings[0]
        # These fields must be present and not None.
        for field in ('address', 'city', 'state', 'zip',
                      'purchase_price', 'bedrooms'):
            self.assertIsNotNone(first[field])
        # The key must be absent altogether, not merely set to None.
        self.assertNotIn('bathrooms', first)
        self.assertIsNotNone(first['building_size'])
        self.assertEqual(len(listings), 1)
예제 #7
0
    def test_parse(self):
        """Check parse yields 99 populated requests and spot-check the first."""
        page = fake_response_from_file('responses/craigslist_rentals.html')
        requests = list(self.spider.parse(page))

        # Every request must carry an item with the core fields set.
        for req in requests:
            listing = req.meta['item']
            for key in ('craigslist_id', 'title', 'price', 'link'):
                self.assertIsNotNone(listing[key])
        self.assertEqual(len(requests), 99)

        # Exact values expected for the first listing in the fixture.
        first = requests[0].meta['item']
        self.assertEqual(
            'Huge top floor 1 bedroom apartment near downtown Redwood City!',
            first['title'])
        self.assertEqual(3703.0, first['price'])
        self.assertEqual('http://sfbay.craigslist.org/pen/apa/5883043515.html',
                         first['link'])
        self.assertEqual(5883043515, first['craigslist_id'])