コード例 #1
0
def test_import_inputset():
    """Round-trip input-set files from every source through a Dataset.

    Each input-set file is imported, given a name and version via
    ``update``, backed up, restored from that backup and exported again.
    The backup and export artifacts are removed afterwards, even when one
    of the steps fails.
    """
    backup_path = '../test.p'
    export_path = '../test.json'

    # (input-set file, extra keyword arguments for import_inputset)
    cases = [
        # test github
        ('files/git_repo.json',
         {'registry': 'github', 'github_pat': os.getenv('GITHUB_PAT')}),
        ('files/git_repo_commit.json',
         {'registry': 'github', 'github_pat': os.getenv('GITHUB_PAT')}),
        # test npm
        ('files/name_version.json', {'registry': 'npm'}),
        # test pypi
        ('files/name_version.json', {'registry': 'pypi'}),
        # test vanilla (no registry given)
        ('files/http_url.json', {}),
    ]

    try:
        for input_file, extra_kwargs in cases:
            ds = Dataset.import_inputset(input_file,
                                         cache_dir=CACHE_DIR,
                                         debug=True,
                                         **extra_kwargs)
            ds.update(**{'name': 'test', 'version': '1.0'})
            ds.backup(backup_path)
            ds = Dataset.restore(backup_path)
            ds.export_inputset(export_path)

        # Both artifacts must have been written; previously this was only
        # checked implicitly by os.remove raising on a missing file.
        assert os.path.exists(backup_path)
        assert os.path.exists(export_path)
    finally:
        # cleanup files, without masking the original failure if a step
        # above raised before an artifact was created
        for path in (backup_path, export_path):
            if os.path.exists(path):
                os.remove(path)
コード例 #2
0
def test_load_weblist():
    """Load a web list per registry and round-trip it through a Dataset.

    For each registry the named list is loaded with ``from_type='list'``,
    trimmed with ``trim(10)``, enriched with project metadata and the
    latest versions, given a name and version via ``update``, backed up,
    restored from that backup and exported. The backup and export
    artifacts are removed afterwards, even when one of the steps fails.
    """
    backup_path = '../test.p'
    export_path = '../test.json'

    # (web list name, extra keyword arguments for load_web)
    cases = [
        # test github
        ('top1kstarred',
         {'registry': 'github', 'github_pat': os.getenv('GITHUB_PAT')}),
        # test npm
        ('allbydependents', {'registry': 'npm'}),
        # test pypi
        ('top4kyear', {'registry': 'pypi'}),
    ]

    try:
        for list_name, extra_kwargs in cases:
            ds = Dataset.load_web(list_name,
                                  from_type='list',
                                  cache_dir=CACHE_DIR,
                                  debug=True,
                                  **extra_kwargs)
            ds.trim(10)
            ds.get_projects_meta()
            ds.get_project_versions(historical='latest')
            ds.update(**{'name': 'test', 'version': '1.0'})
            ds.backup(backup_path)
            ds = Dataset.restore(backup_path)
            ds.export_inputset(export_path)

        # Both artifacts must have been written; previously this was only
        # checked implicitly by os.remove raising on a missing file.
        assert os.path.exists(backup_path)
        assert os.path.exists(export_path)
    finally:
        # cleanup files, without masking the original failure if a step
        # above raised before an artifact was created
        for path in (backup_path, export_path):
            if os.path.exists(path):
                os.remove(path)
コード例 #3
0
def restore(ctx, filepath):
    """Restores a pickled dataset file."""
    # ctx:      context object whose ``obj`` mapping holds the active
    #           dataset under the 'dataset' key.
    # filepath: path handed to Dataset.restore.
    #
    # NOTE(review): per the docstring the file is a pickle -- presumably it
    # should only ever come from a trusted source; confirm with callers.
    global TEMP_SETTINGS

    previous_ds = None

    try:
        # A plain reference is enough as a fallback: the active dataset is
        # never mutated here, it is only replaced once the restore has
        # succeeded. (A deepcopy could itself fail and would then cause the
        # handler below to overwrite the live dataset with None.)
        previous_ds = ctx.obj.get('dataset', None)

        ctx.obj['dataset'] = Dataset.restore(filepath)

        # reset the temporary api/metadata dict
        TEMP_SETTINGS = dict()

    except Exception as e:
        # Errors are reported rather than propagated.
        print_error(e, DEBUG)

        # silently put the previous dataset back (None if there was none)
        ctx.obj['dataset'] = previous_ds