def test_list_versions():
    """The first entry listed for nasa.gov carries the expected timestamp.

    ``list_versions`` is consumed as an iterator of two-item entries; only
    the first item (the datetime) of the first entry is asserted on.
    """
    entries = list_versions('nasa.gov')
    first_dt, _first_url = next(entries)
    expected = datetime(1996, 12, 31, 23, 58, 47)
    assert first_dt == expected

    # Walk through everything that is left so that an error raised while
    # producing any later entry fails this test.
    for _ in entries:
        pass
def test_list_versions_multipage():
    """Consume the complete listing for cnn.com without asserting on it."""
    # cnn.com has enough 'mementos' that the results span multiple pages,
    # so draining the listing exercises the multi-page code path.
    entries = list_versions('cnn.com')

    # Nothing is checked per entry; the test passes as long as no entry
    # triggers an error while the iterator is being exhausted.
    for _ in entries:
        pass
def test_list_versions():
    """The first version listed for nasa.gov has the expected ``date``."""
    listing = list_versions('nasa.gov')
    first = next(listing)
    expected = datetime(1996, 12, 31, 23, 58, 47)
    assert first.date == expected

    # Consume the remainder of the iterator so that an error raised while
    # producing any later entry fails this test.
    for _ in listing:
        pass
def import_ia(url, agency, site, from_date=None, to_date=None):
    """Convert every listed version of ``url`` and pass them on for import.

    Parameters
    ----------
    url
        Passed to ``ia.list_versions`` to select what gets listed.
    agency, site
        Forwarded unchanged to ``ia.timestamped_uri_to_version`` for every
        listed entry.
    from_date, to_date
        Forwarded unchanged to ``ia.list_versions``.

    Returns
    -------
    None
        The converted versions are handed to ``_add_and_monitor``.
    """
    listing = ia.list_versions(url, from_date=from_date, to_date=to_date)

    def to_version(entry):
        # Each listed entry supplies its own date, raw URL, URL and view URL;
        # agency and site come from this call's arguments.
        return ia.timestamped_uri_to_version(
            entry.date,
            entry.raw_url,
            url=entry.url,
            site=site,
            agency=agency,
            view_url=entry.view_url,
        )

    # Nothing is converted here: the generator is lazy, so the work happens
    # as the consumer pulls items from it.
    versions = (to_version(entry) for entry in listing)
    _add_and_monitor(versions)
def import_ia(url, agency, site):
    """Convert every listed version of ``url`` and post them in batches.

    Parameters
    ----------
    url
        Passed to ``ia.list_versions`` and also forwarded as ``url=`` to
        ``ia.timestamped_uri_to_version`` for every listed entry.
    agency, site
        Forwarded unchanged to ``ia.timestamped_uri_to_version``.

    Returns
    -------
    Whatever ``post_versions_batched`` returns for the converted versions.
    """
    listing = ia.list_versions(url)

    def to_version(pair):
        # Each listed entry is a two-item (datetime, URI) pair.
        timestamp, uri = pair
        return ia.timestamped_uri_to_version(
            timestamp, uri, url=url, site=site, agency=agency)

    # Lazy: the conversion only runs as items are pulled from the generator.
    converted = (to_version(pair) for pair in listing)

    # Report progress while the generator is being consumed.
    with_progress = tqdm(converted, desc='importing', unit=' versions')
    return post_versions_batched(with_progress)
def import_ia(url, *, from_date=None, to_date=None, maintainers=None,
              tags=None, skip_unchanged='resolved-response'):
    """Convert every listed version of ``url`` and pass them on for import.

    Parameters
    ----------
    url
        Passed to ``ia.list_versions`` to select what gets listed.
    from_date, to_date
        Forwarded unchanged to ``ia.list_versions``.
    maintainers, tags
        Forwarded unchanged to ``ia.timestamped_uri_to_version`` for every
        listed entry.
    skip_unchanged
        Selects how unchanged versions are skipped:

        * ``'response'`` -- ``ia.list_versions`` is called with
          ``skip_repeats=True``.
        * ``'resolved-response'`` (default) -- the converted versions are
          passed through ``_filter_unchanged_versions``.
        * any other value -- neither of the above is applied.

    Returns
    -------
    None
        The resulting versions are handed to ``_add_and_monitor``.
    """
    listing = ia.list_versions(
        url,
        from_date=from_date,
        to_date=to_date,
        skip_repeats=(skip_unchanged == 'response'),
    )

    def to_version(entry):
        # Each listed entry supplies its own date, raw URL, URL and view URL.
        return ia.timestamped_uri_to_version(
            entry.date,
            entry.raw_url,
            url=entry.url,
            maintainers=maintainers,
            tags=tags,
            view_url=entry.view_url,
        )

    # Lazy: the conversion only runs as the consumer pulls items.
    versions = (to_version(entry) for entry in listing)

    if skip_unchanged == 'resolved-response':
        versions = _filter_unchanged_versions(versions)

    _add_and_monitor(versions)