Пример #1
0
    def test_L3_collection_11676(self):
        logger = logging.getLogger(__name__)
        requests_cache.install_cache(cachefile, backend='sqlite')
        session = requests.Session()

        aic = aiu.TroveCollection(11676, session=session, logger=logger)
        name = aic.get_collection_name()
        uri = aic.get_collection_uri()
        subject = aic.get_subject()
        archived_since = aic.get_archived_since()
        archived_until = aic.get_archived_until()
        collected_by = aic.get_collectedby()

        self.assertEqual(name,
                         "Communities - cultural, social and local web sites")
        self.assertEqual(
            uri, "https%3A%2F%2Fwebarchive.nla.gov.au%2Fcollection%2F11676")
        self.assertEqual(subject, "Business & Economy")
        self.assertEqual(archived_since, "Feb 2010")
        self.assertEqual(archived_until, "May 2020")
        self.assertEqual(
            collected_by, {
                'State Library of South Australia':
                'http://www.slsa.sa.gov.au/',
                'State Library of Western Australia':
                'http://www.slwa.wa.gov.au/',
                'State Library of Queensland': 'http://www.slq.qld.gov.au/',
                'National Library of Australia': 'http://www.nla.gov.au/',
                'State Library of Victoria': 'http://www.slv.vic.gov.au/'
            })
Пример #2
0
 def test_get_breadcrumbs_11666(self):
     logger = logging.getLogger(__name__)
     requests_cache.install_cache(cachefile, backend='sqlite')
     session = requests.Session()
     aic = aiu.TroveCollection(11666, session=session, logger=logger)
     breadcrumb_ids = aic.get_breadcrumbs()
     self.assertEqual(breadcrumb_ids, [0, 15003])
Пример #3
0
 def test_get_subcollections_11676(self):
     logger = logging.getLogger(__name__)
     requests_cache.install_cache(cachefile, backend='sqlite')
     session = requests.Session()
     aic = aiu.TroveCollection(11676, session=session, logger=logger)
     subcollection_ids = aic.get_subcollections()
     self.assertEqual(subcollection_ids, [])
Пример #4
0
 def test_list_memento_URIMs_11666(self):
     logger = logging.getLogger(__name__)
     requests_cache.install_cache(cachefile, backend='sqlite')
     session = requests.Session()
     aic = aiu.TroveCollection(11666, session=session, logger=logger)
     memento_urims = aic.list_memento_urims()
     self.assertEqual(memento_urims, [])
Пример #5
0
    def test_nonexistent_collection(self):
        logger = logging.getLogger(__name__)
        requests_cache.install_cache(cachefile, backend='sqlite')
        session = requests.Session()

        aic = aiu.TroveCollection(12345, session=session, logger=logger)
        self.assertFalse(aic.does_exist())
        session.close()
Пример #6
0
 def test_list_seed_URIs_11676(self):
     logger = logging.getLogger(__name__)
     requests_cache.install_cache(cachefile, backend='sqlite')
     session = requests.Session()
     aic = aiu.TroveCollection(11676, session=session, logger=logger)
     seed_uris = aic.list_seed_uris()
     self.assertEqual(seed_uris, [
         'http://boom09.com.au/',
         'http://www.socialinclusion.sa.gov.au/files/DiggingDeep.pdf',
         'http://kimberleydirectaction.wordpress.com/',
         'http://miningcommunities.com.au/', 'http://www.miningfm.com.au/',
         'http://www.roxbydowns.com', 'https://trackingonslow.com/'
     ])
Пример #7
0
 def test_list_memento_URIMs_11676(self):
     logger = logging.getLogger(__name__)
     requests_cache.install_cache(cachefile, backend='sqlite')
     session = requests.Session()
     aic = aiu.TroveCollection(11676, session=session, logger=logger)
     memento_urims = aic.list_memento_urims()
     self.assertEqual(memento_urims, [
         'https://webarchive.nla.gov.au/awa/20100210012123/http://pandora.nla.gov.au/pan/116281/20100210-1221/boom09.com.au/index.html',
         'https://webarchive.nla.gov.au/awa/20120803063643/http://pandora.nla.gov.au/pan/135435/20120803-1636/www.socialinclusion.sa.gov.au/files/DiggingDeep.pdf',
         'https://webarchive.nla.gov.au/awa/20140106084159/http://pandora.nla.gov.au/pan/129256/20140106-1941/kimberleydirectaction.wordpress.com/index.html',
         'https://webarchive.nla.gov.au/awa/20120904140027/http://pandora.nla.gov.au/pan/133943/20120905-0000/miningcommunities.com.au/news/index.html',
         'https://webarchive.nla.gov.au/awa/20130115130625/http://pandora.nla.gov.au/pan/136485/20130116-0006/www.miningfm.com.au/index.html',
         'https://webarchive.nla.gov.au/awa/20120604140044/http://pandora.nla.gov.au/pan/134289/20120605-0000/www.roxbydowns.com/index.html',
         'https://webarchive.nla.gov.au/awa/20150902083454/http://pandora.nla.gov.au/pan/153227/20150902-1834/trackingonslow.com/index.html'
     ])
Пример #8
0
    def test_L2_collection_11666(self):
        logger = logging.getLogger(__name__)
        requests_cache.install_cache(cachefile, backend='sqlite')
        session = requests.Session()

        aic = aiu.TroveCollection(11666, session=session, logger=logger)
        name = aic.get_collection_name()
        uri = aic.get_collection_uri()
        subject = aic.get_subject()
        archived_since = aic.get_archived_since()
        archived_until = aic.get_archived_until()

        self.assertEqual(name, "Australia's early 21st century resources boom")
        self.assertEqual(
            uri, "https%3A%2F%2Fwebarchive.nla.gov.au%2Fcollection%2F11666")
        self.assertEqual(subject, "Business & Economy")
        self.assertEqual(archived_since, "Nov 2006")
        self.assertEqual(archived_until, "Feb 2021")
Пример #9
0
    def test_collection_15003(self):
        logger = logging.getLogger(__name__)
        requests_cache.install_cache(cachefile, backend='sqlite')
        session = requests.Session()

        aic = aiu.TroveCollection(15003, session=session, logger=logger)
        name = aic.get_collection_name()
        uri = aic.get_collection_uri()
        subject = aic.get_subject()
        archived_since = aic.get_archived_since()
        archived_until = aic.get_archived_until()

        self.assertEqual(name, "Business & Economy")
        self.assertEqual(
            uri, "https%3A%2F%2Fwebarchive.nla.gov.au%2Fcollection%2F15003")
        self.assertEqual(subject, "Business & Economy")
        self.assertEqual(archived_since, "unknown")
        self.assertEqual(archived_until, "unknown")
Пример #10
0
    def test_subcollections_and_mementos_17918(self):
        logger = logging.getLogger(__name__)
        requests_cache.install_cache(cachefile, backend='sqlite')
        session = requests.Session()
        aic = aiu.TroveCollection(17918, session=session, logger=logger)
        seed_uris = aic.list_seed_uris()
        memento_urims = aic.list_memento_urims()
        subcollection_ids = aic.get_subcollections()
        breadcrumb_ids = aic.get_breadcrumbs()

        self.assertEqual(seed_uris, [
            'http://budget.liberal.org.au/',
            'http://www.budget.gov.au/2014-15/index.htm'
        ])
        self.assertEqual(memento_urims, [
            'https://webarchive.nla.gov.au/awa/20170510013313/http://pandora.nla.gov.au/pan/162677/20170510-1133/budget.liberal.org.au/index.html',
            'https://webarchive.nla.gov.au/awa/20140513231924/http://pandora.nla.gov.au/pan/126881/20140514-0919/www.budget.gov.au/2014-15/index.htm'
        ])
        self.assertEqual(breadcrumb_ids, [0, 15003, 15052])
        self.assertEqual(subcollection_ids, [17919, 17922, 17921])