Example #1
0
 def setUp(self):
     """Fill the test database from a saved snapshot and keep one row.

     Connects to the Postgres database named by ``self.temp_db_name``,
     scrapes the stored query snapshot, writes the scraped stories through
     the scraper, and stores the ``seamus`` table row with ``id=6`` on
     ``self.seamus_row`` for the tests to inspect.
     """
     snapshot_path = 'tests/snapshots/query-current-04-21-2015.xml'
     self.db = dataset.connect('postgres:///%s' % self.temp_db_name)

     scraper = SeamusScraper()
     stories = scraper.scrape_seamus(filename=snapshot_path)
     scraper.write(self.db, stories)

     seamus_table = self.db['seamus']
     self.seamus_row = seamus_table.find_one(id=6)
Example #2
0
def scrape_seamus():
    """
    Scrape the Seamus API and persist the result.

    Opens a connection to the database at ``app_config.POSTGRES_URL``,
    runs a ``SeamusScraper`` with its default arguments, and passes the
    scraped stories to the scraper's ``write`` method. Returns nothing.
    """
    connection = dataset.connect(app_config.POSTGRES_URL)
    seamus = SeamusScraper()
    scraped = seamus.scrape_seamus()
    seamus.write(connection, scraped)
Example #3
0
def scrape_seamus():
    """
    Scrape the Seamus API and write the stories to the database.

    The database connection comes from ``app_config.POSTGRES_URL``; the
    scraping and the writing are both delegated to ``SeamusScraper``.
    """
    # Connect first so the scraper has a target to write to.
    database = dataset.connect(app_config.POSTGRES_URL)

    seamus_scraper = SeamusScraper()
    seamus_stories = seamus_scraper.scrape_seamus()
    seamus_scraper.write(database, seamus_stories)
class TestScrapeSeamus(unittest.TestCase):
    """Check the story fields SeamusScraper reads from a saved query snapshot.

    Every test inspects the list produced in ``setUp`` by scraping
    ``tests/snapshots/query-current-04-21-2015.xml``.
    """

    def setUp(self):
        # Scrape the snapshot file once per test; no database is involved here.
        snapshot_path = 'tests/snapshots/query-current-04-21-2015.xml'
        self.scraper = SeamusScraper()
        self.stories = self.scraper.scrape_seamus(filename=snapshot_path)

    def test_story_id(self):
        # The story id is compared as a string, not an integer.
        first = self.stories[0]
        self.assertEqual(first.story_id, '401157787')

    def test_headline(self):
        first = self.stories[0]
        self.assertEqual(
            first.title,
            'Top Stories: Ex-Egypt Leader Sentenced; Blue Bell Recall Expands',
        )

    def test_story_date(self):
        first = self.stories[0]
        self.assertEqual(
            first.story_date,
            datetime(2015, 4, 21, 12, 40, 23),
        )

    def test_publication_date(self):
        first = self.stories[0]
        self.assertEqual(
            first.publication_date,
            datetime(2015, 4, 21, 12, 40, 0),
        )

    def test_last_modified_date(self):
        first = self.stories[0]
        self.assertEqual(
            first.last_modified_date,
            datetime(2015, 4, 21, 12, 40, 23),
        )

    def test_canonical_url(self):
        first = self.stories[0]
        self.assertEqual(
            first.canonical_url,
            'http://www.npr.org/blogs/thetwo-way/2015/04/21/401157787/top-stories-ex-egypt-leader-sentenced-blue-bell-recall-expands',
        )

    def test_has_lead_art(self):
        # Story 0 is expected to have no lead art, story 6 to have it.
        for index, expected in ((0, False), (6, True)):
            self.assertEqual(self.stories[index].has_lead_art, expected)

    def test_lead_art_provider(self):
        art_story = self.stories[6]
        self.assertEqual(art_story.lead_art_provider, 'AFP/Getty Images')

    def test_lead_art_url(self):
        art_story = self.stories[6]
        self.assertEqual(
            art_story.lead_art_url,
            'http://media.npr.org/assets/img/2015/04/21/morsi-court_wide-905d13041b11b20aea8771f3a950a7b8c1e6b5d8.jpg',
        )

    def test_lead_art_root_url(self):
        art_story = self.stories[6]
        self.assertEqual(
            art_story.lead_art_root_url,
            'http://media.npr.org/assets/img/2015/04/21/morsi-court.jpg',
        )

    def test_has_audio(self):
        # Story 0 is expected to have no audio, story 3 to have it.
        for index, expected in ((0, False), (3, True)):
            self.assertEqual(self.stories[index].has_audio, expected)

    def test_slug(self):
        first = self.stories[0]
        self.assertEqual(first.slug, 'The Two-Way')
 def setUp(self):
     """Scrape the saved query snapshot and keep the scraper and its stories."""
     snapshot_path = 'tests/snapshots/query-current-04-21-2015.xml'
     self.scraper = SeamusScraper()
     self.stories = self.scraper.scrape_seamus(filename=snapshot_path)
Example #6
0
 def setUp(self):
     """Load the snapshot stories into the test database and fetch row 6.

     The database is the Postgres database named by ``self.temp_db_name``.
     After the scraper writes the snapshot stories, the ``seamus`` table
     row with ``id=6`` is kept on ``self.seamus_row``.
     """
     db_url = 'postgres:///%s' % self.temp_db_name
     self.db = dataset.connect(db_url)

     scraper = SeamusScraper()
     snapshot_stories = scraper.scrape_seamus(
         filename='tests/snapshots/query-current-04-21-2015.xml',
     )
     scraper.write(self.db, snapshot_stories)

     self.seamus_row = self.db['seamus'].find_one(id=6)