Beispiel #1
0
 def test_local_crawl(self):
     """Check a 'crawl' run over the local Gutersloh fixture pages.

     Builds a GoogleMovies object starting from the first local HTML
     fixture and verifies that its JSON output equals the stored JSON
     fixture and that both fixture pages are listed in ``crawled_urls``.
     """
     starting_url = 'usher/tests/gutersloh_showtimes_test_1.html'
     # Read the expected data under a context manager so the fixture
     # file handle is closed deterministically instead of being leaked.
     with open('usher/tests/gutersloh_showtimes.json') as fixture:
         expected_output = json.load(fixture)
     googlemovies = GoogleMovies(starting_url, None, True, 'crawl')
     assert googlemovies.to_json() == expected_output
     assert googlemovies.crawled_urls == [
         'usher/tests/gutersloh_showtimes_test_1.html',
         'usher/tests/gutersloh_showtimes_test_2.html',
     ]
Beispiel #2
0
 def test_local_crawl(self):
     """Check a 'crawl' run over the local Gutersloh fixture pages.

     Builds a GoogleMovies object starting from the first local HTML
     fixture and verifies that its JSON output equals the stored JSON
     fixture and that both fixture pages are listed in ``crawled_urls``.
     """
     starting_url = 'usher/tests/gutersloh_showtimes_test_1.html'
     # Read the expected data under a context manager so the fixture
     # file handle is closed deterministically instead of being leaked.
     with open('usher/tests/gutersloh_showtimes.json') as fixture:
         expected_output = json.load(fixture)
     googlemovies = GoogleMovies(starting_url, None, True, 'crawl')
     assert googlemovies.to_json() == expected_output
     assert googlemovies.crawled_urls == [
         'usher/tests/gutersloh_showtimes_test_1.html',
         'usher/tests/gutersloh_showtimes_test_2.html',
     ]
Beispiel #3
0
 def test_crawl_with_only_one_page(self):
     """Check a 'crawl' run that starts from the single-page fixture.

     Expects exactly one entry in ``movie_results`` whose ``showtimes``
     has two items, the Hinsdale title bar, and a ``crawled_urls`` list
     containing only the starting URL.
     """
     starting_url = 'usher/tests/single_crawl_test.html'
     crawler = GoogleMovies(starting_url, None, True, 'crawl')

     theatres = crawler.movie_results
     assert len(theatres) == 1  # 1 theatre
     only_theatre = theatres[0]
     assert len(only_theatre.showtimes) == 2  # with 2 movies

     assert crawler.title_bar == 'Showtimes for Hinsdale, Mt'
     # Nothing beyond the starting page should have been visited.
     assert crawler.crawled_urls == [starting_url]
Beispiel #4
0
 def test_web_crawl(self):
     """Check a run against the http://google.com/movies URL.

     Constructs GoogleMovies with a URL and a ``near`` query parameter
     only, then checks the number of results, the title bar and the
     three URLs recorded in ``crawled_urls``.
     """
     base_url = 'http://google.com/movies'
     # NOTE(review): the query is spelled "Los Angelos" while the expected
     # title bar reads "Los Angeles, CA" -- presumably deliberate; confirm.
     query = {"near": "Los Angelos"}
     crawler = GoogleMovies(base_url, query)

     expected_urls = [
         'http://google.com/movies?near=Los+Angelos',
         'http://google.com/movies?near=Los+Angelos&start=10',
         'http://google.com/movies?near=Los+Angelos&start=20',
     ]

     assert len(crawler.movie_results) == 23
     assert crawler.title_bar == 'Showtimes for Los Angeles, CA'
     assert crawler.crawled_urls == expected_urls
Beispiel #5
0
 def test_to_json_1(self):
     """Check the first ``to_json()`` entry of a 'scrape' run on page 1.

     Compares element 0 of the JSON produced from the first local
     Gutersloh HTML fixture with element 0 of the stored JSON fixture.
     """
     url = 'usher/tests/gutersloh_showtimes_test_1.html'
     # Read the expected data under a context manager so the fixture
     # file handle is closed deterministically instead of being leaked.
     with open('usher/tests/gutersloh_showtimes.json') as fixture:
         expected_output = json.load(fixture)[0]
     googlemovies = GoogleMovies(url, None, True, 'scrape')
     assert googlemovies.to_json()[0] == expected_output
Beispiel #6
0
 def test_to_json_1(self):
     """Check the first ``to_json()`` entry of a 'scrape' run on page 1.

     Compares element 0 of the JSON produced from the first local
     Gutersloh HTML fixture with element 0 of the stored JSON fixture.
     """
     url = 'usher/tests/gutersloh_showtimes_test_1.html'
     # Read the expected data under a context manager so the fixture
     # file handle is closed deterministically instead of being leaked.
     with open('usher/tests/gutersloh_showtimes.json') as fixture:
         expected_output = json.load(fixture)[0]
     googlemovies = GoogleMovies(url, None, True, 'scrape')
     assert googlemovies.to_json()[0] == expected_output
Beispiel #7
0
 def test_next_page(self):
     """Check ``next_href`` after a 'scrape' run on the first fixture page.

     The object built from the first local Gutersloh HTML fixture is
     expected to expose the second fixture page as ``next_href``.
     """
     url = 'usher/tests/gutersloh_showtimes_test_1.html'
     # The JSON fixture is intentionally not loaded here: this test only
     # inspects next_href, so reading it would just leak a file handle and
     # tie the test to an unrelated file.
     googlemovies = GoogleMovies(url, None, True, 'scrape')
     assert googlemovies.next_href == 'usher/tests/gutersloh_showtimes_test_2.html'