Python get_datasets示例

编程语言: Python

命名空间/包名称: bibjson_util

方法/功能: get_datasets

hotexamples.com的示例: 7

Python get_datasets - 共找到 7 个示例。以下是从开源项目中提取的、最受好评的 bibjson_util.get_datasets 真实 Python 代码示例。您可以为示例评分，以帮助我们提高示例质量。

示例#1

显示文件

文件： bibjson_rdf.py 项目： opencitations/PubMed-OA-network-analysis-scripts

def process_articles(input_filename, writer, mappings):
    """Process every 'Article' dataset stored in a gzipped tar archive.

    ``input_filename`` is opened as a gzip-compressed tar file. Each
    ``(tar_info, dataset)`` pair yielded by ``get_datasets`` for the
    ``'Article'`` type has its ``'recordList'`` passed to
    ``process_article`` together with ``writer`` and ``mappings``.

    An exception raised while handling one dataset is printed to stderr
    and the remaining datasets are still processed.
    """
    # Close the archive deterministically, even if iteration raises.
    with tarfile.open(input_filename, 'r:gz') as tar:
        for tar_info, journal in get_datasets(tar, types=('Article',)):
            try:
                process_article(journal['recordList'], writer, mappings)
            except Exception:
                # Deliberate best-effort: report the traceback and carry on
                # with the next dataset.
                traceback.print_exc(file=sys.stderr)

示例#2

显示文件

文件： bibjson_rdf.py 项目： viveksck/OpenCitationsCorpus

def process_articles(input_filename, writer, mappings):
    """Run ``process_article`` over each 'Article' dataset in an archive.

    Opens ``input_filename`` as a gzip-compressed tar file and iterates the
    ``(tar_info, dataset)`` pairs that ``get_datasets`` yields for the
    ``'Article'`` type. The ``'recordList'`` of every dataset is handed to
    ``process_article`` along with ``writer`` and ``mappings``.

    A failure in one dataset is written to stderr as a traceback; it does
    not abort processing of the datasets that follow.
    """
    # The with-block guarantees the tar file handle is released on exit.
    with tarfile.open(input_filename, 'r:gz') as tar:
        for tar_info, journal in get_datasets(tar, types=('Article',)):
            try:
                process_article(journal['recordList'], writer, mappings)
            except Exception:
                # Best-effort by design: log and continue.
                traceback.print_exc(file=sys.stderr)

示例#3

显示文件

文件： error_counting.py 项目： HeinrichHartmann/OpenCitationsCorpus

# Nested mapping store: a missing key is created as an empty dict on first
# access. It is handed to majority_vote() and format_article() further down.
mappings = defaultdict(dict)

# Gzip-compressed tar archive that the main loop reads its datasets from.
tar = tarfile.open('../parsed-recent/articles-unified.bibjson.tar.gz', 'r:gz')

def format_article(article, mappings, records):
    """Render one article as a single fixed-width text row.

    The row has four columns separated by two spaces: DOI (30 characters),
    PMID (10), title (80) and a comma-separated author list (100). Every
    value is truncated to its column width and right-padded with spaces.
    Missing 'doi', 'pmid' and 'title' keys are rendered as blank columns.

    Each entry of ``article['author']`` is passed through
    ``normalize_field`` together with ``mappings`` and ``records``; the
    'name' of the result ('-' when absent) is used, with commas and
    periods stripped.
    """
    def fit(text, width):
        # Truncate first, then pad, so the column is exactly `width` wide.
        return text[:width].ljust(width)

    names = []
    for author in article.get('author', ()):
        name = normalize_field(author, mappings, records).get('name', '-')
        names.append(name.replace(',', '').replace('.', ''))
    authors = ', '.join(names)

    columns = (
        fit(article.get('doi', ''), 30),
        fit(article.get('pmid', ''), 10),
        fit(article.get('title', ''), 80),
        fit(authors, 100),
    )
    return '%30s  %10s  %80s  %100s' % columns



# For each 'Article' dataset in the archive: obtain `canonical` from
# majority_vote(), print the result of compare() for every entry of the
# id-keyed record table, then print the canonical article followed by each
# individual article as fixed-width rows.
for tar_info, dataset in get_datasets(tar, ('Article',)):
    records = dataset['recordList']

    # Collect the 'Article' records before `records` is re-bound below.
    articles = []
    for r in records:
        if r.get('type') == 'Article':
            articles.append(r)

    canonical, fields = majority_vote(records, ('Article',), mappings)

    # From here on `records` is an id -> record lookup table.
    records = {r['id']: r for r in records}

    # NOTE(review): iterating a dict yields its keys, so `record` is a record
    # id here rather than a record dict -- confirm compare() expects an id.
    for record in records:
        v = compare(canonical, record, records)
        print(v)

    print('=' * 80)
    print(format_article(canonical, mappings, records))
    print('-' * 80)
    for article in articles:
        print(format_article(article, mappings, records))

示例#4

显示文件

文件： bibjson_rdf.py 项目： opencitations/PubMed-OA-network-analysis-scripts

def process_errors(input_filename, writer, mappings):
    """Run ``process_error`` over each dataset in a gzipped tar archive.

    ``input_filename`` is opened as a gzip-compressed tar file. For every
    ``(tar_info, dataset)`` pair yielded by ``get_datasets`` the dataset's
    ``'recordList'`` is passed to ``process_error`` with ``writer`` and
    ``mappings``. Exceptions are not caught here and propagate to the caller.
    """
    # Close the archive deterministically, even if processing raises.
    with tarfile.open(input_filename, 'r:gz') as tar:
        # types=None presumably disables type filtering in get_datasets --
        # TODO confirm against bibjson_util.
        for tar_info, dataset in get_datasets(tar, types=None):
            process_error(dataset['recordList'], writer, mappings)

示例#5

显示文件

文件： bibjson_rdf.py 项目： opencitations/PubMed-OA-network-analysis-scripts

def process_citations(input_filename, writer, mappings):
    """Run ``process_citation`` over each 'Article' dataset in an archive.

    ``input_filename`` is opened as a gzip-compressed tar file. For every
    ``(tar_info, dataset)`` pair that ``get_datasets`` yields for the
    ``'Article'`` type, the dataset's ``'recordList'`` is passed to
    ``process_citation`` with ``writer`` and ``mappings``. Exceptions are
    not caught here and propagate to the caller.
    """
    # Close the archive deterministically, even if processing raises.
    with tarfile.open(input_filename, 'r:gz') as tar:
        for tar_info, journal in get_datasets(tar, types=('Article',)):
            process_citation(journal['recordList'], writer, mappings)

示例#6

显示文件

文件： bibjson_rdf.py 项目： viveksck/OpenCitationsCorpus

def process_errors(input_filename, writer, mappings):
    """Feed the record list of every dataset in an archive to ``process_error``.

    Opens ``input_filename`` as a gzip-compressed tar file, iterates the
    ``(tar_info, dataset)`` pairs produced by ``get_datasets`` and calls
    ``process_error(dataset['recordList'], writer, mappings)`` for each.
    Any exception propagates to the caller.
    """
    # The with-block guarantees the tar file handle is released on exit.
    with tarfile.open(input_filename, 'r:gz') as tar:
        # types=None presumably means "no type filter" -- TODO confirm
        # against bibjson_util.get_datasets.
        for tar_info, dataset in get_datasets(tar, types=None):
            process_error(dataset['recordList'], writer, mappings)

示例#7

显示文件

文件： bibjson_rdf.py 项目： viveksck/OpenCitationsCorpus

def process_citations(input_filename, writer, mappings):
    """Feed each 'Article' dataset's record list to ``process_citation``.

    Opens ``input_filename`` as a gzip-compressed tar file, iterates the
    ``(tar_info, dataset)`` pairs produced by ``get_datasets`` for the
    ``'Article'`` type and calls
    ``process_citation(dataset['recordList'], writer, mappings)`` for each.
    Any exception propagates to the caller.
    """
    # The with-block guarantees the tar file handle is released on exit.
    with tarfile.open(input_filename, 'r:gz') as tar:
        for tar_info, journal in get_datasets(tar, types=('Article',)):
            process_citation(journal['recordList'], writer, mappings)