Python on_search Examples

Programming Language: Python

Namespace/Package Name: entrez

Method/Function: on_search

Examples at hotexamples.com: 8

Python on_search - 8 examples found. These are the top-rated real-world Python examples of entrez.on_search extracted from open source projects. You can rate examples to help us improve their quality.

Example #1

Show file

File: acc2gi.py Project: khyox/entrez

def print_acc2gi(accessions):
    """Print the GI that goes with each of the given accession numbers.

    Each accession is tagged with ``[accn]`` and the tagged names are OR-ed
    into a single search term for the ``nucleotide`` database.  Among the
    summary lines yielded by ``entrez.on_search``, only those that contain
    the ``Name="Extra"`` item and mention at least one of the accessions are
    used: such a line is cut on ``|`` and its second and fourth pieces are
    printed as GI and accession respectively.
    """
    tagged = [acc_id + '[accn]' for acc_id in accessions]
    term = ' OR '.join(tagged)

    summary = entrez.on_search(db='nucleotide', term=term, tool='summary')
    for line in summary:
        if 'Name="Extra"' not in line:
            continue
        if not any(acc_id in line for acc_id in accessions):
            continue
        # At most four cuts: the 2nd piece is taken as the GI and the 4th as
        # the accession; the remaining pieces are ignored.
        _head, gi, _db, acc, _tail = line.split('|', 4)
        print('%18s  ->  %s' % (acc, gi))

Example #2

Show file

File: sra2runacc.py Project: vramius1017/entrez

def main():
    """Print the run accession reported for the SRA identifier given on the CLI.

    The identifier is read from the ``-s/--sra`` option and used as the
    search term against the ``sra`` database with the ``summary`` tool.  For
    every returned line that contains the ``Name="Runs"`` item, the first
    ``acc="..."`` attribute value is printed.  Lines with a "Runs" item but no
    ``acc`` attribute are skipped instead of aborting with AttributeError.
    """
    parser = argparse.ArgumentParser(description=__doc__)
    parser.add_argument('-s', '--sra', metavar='SRAid', help='SRA identifier')
    args = parser.parse_args()

    # Raw string: '\w' in a plain literal is an invalid escape sequence.
    # Compiled once because the pattern does not change between lines.
    acc_pattern = re.compile(r'acc="(?P<acc>\w+[0-9]+)"')

    for line in entrez.on_search(db='sra', term=args.sra, tool='summary'):
        if 'Name="Runs"' not in line:
            continue
        match = acc_pattern.search(line)
        if match is None:
            # "Runs" item without any acc attribute: nothing to report.
            continue
        print(match.group('acc'))

Example #3

Show file

File: acc2gi.py Project: vramius1017/entrez

def print_acc2gi(accessions):
    """Print GIs corresponding to the given accession numbers.

    The accessions are tagged with ``[accn]``, OR-ed into one search term and
    looked up in the ``nucleotide`` database with the ``summary`` tool.  For
    each returned line that contains the ``Name="Extra"`` item and mentions
    one of the accessions, the GI (digits after ``gi|``) and the versioned
    accession (after ``emb|``, ``gb|``, ``ref|`` or ``dbj|``) are extracted
    and printed as ``accession  ->  gi``.

    Lines in which either field cannot be found are skipped rather than
    raising AttributeError.

    Args:
        accessions: iterable of accession strings; it may be a one-shot
            iterator, since it is materialised before use.
    """
    # The accessions are traversed once to build the term and again for every
    # line; a one-shot iterator would be empty on the second pass.
    accessions = list(accessions)

    # Raw strings: '\|', '\w' and '\.' are invalid escapes in plain literals.
    gi_pattern = re.compile(r'gi\|([0-9]+)\|')
    acc_pattern = re.compile(
        r'((emb)|(gb)|(ref)|(dbj))\|(?P<acc>\w+\.[0-9]+)\|')

    term = ' OR '.join(a + '[accn]' for a in accessions)
    for line in entrez.on_search(db='nucleotide', term=term, tool='summary'):
        if 'Name="Extra"' in line and any(a in line for a in accessions):
            gi_match = gi_pattern.search(line)
            acc_match = acc_pattern.search(line)
            if gi_match is None or acc_match is None:
                # Line does not carry both fields in the expected form.
                continue
            print('%18s  ->  %s' % (acc_match.group('acc'),
                                    gi_match.group(1)))

Example #4

Show file

File: acc2gi.py Project: jordibc/entrez

def print_acc2gi(accessions):
    """Print GIs corresponding to the given accession numbers.

    Builds one ``nucleotide`` search term by OR-ing every accession tagged
    with ``[accn]`` and requests summaries through ``entrez.on_search``.
    Only lines that contain the ``Name="Extra"`` item and mention one of the
    accessions are inspected; from those, the GI (digits after ``gi|``) and
    the versioned accession (after ``emb|``, ``gb|``, ``ref|`` or ``dbj|``)
    are printed as ``accession  ->  gi``.

    A line missing either field is skipped instead of raising
    AttributeError.

    Args:
        accessions: iterable of accession strings; one-shot iterators are
            accepted because the values are copied into a list first.
    """
    # Copy once: the values are needed both for the search term and for the
    # per-line filter, which a one-shot iterator could not serve twice.
    accessions = list(accessions)

    # Raw strings keep the regex backslashes from being read as (invalid)
    # string escapes; compiling up front avoids repeating it per line.
    gi_pattern = re.compile(r'gi\|([0-9]+)\|')
    acc_pattern = re.compile(
        r'((emb)|(gb)|(ref)|(dbj))\|(?P<acc>\w+\.[0-9]+)\|')

    term = ' OR '.join(a + '[accn]' for a in accessions)
    for line in entrez.on_search(db='nucleotide', term=term, tool='summary'):
        if 'Name="Extra"' not in line:
            continue
        if not any(a in line for a in accessions):
            continue
        gi_match = gi_pattern.search(line)
        acc_match = acc_pattern.search(line)
        if gi_match is None or acc_match is None:
            # Cannot report a pair without both pieces.
            continue
        print('%18s  ->  %s' % (acc_match.group('acc'), gi_match.group(1)))

Example #5

Show file

File: sample_applications.py Project: khyox/entrez

def application_3():
    """Retrieving large datasets.

    Fetch all chimpanzee mRNA sequences in FASTA format (>50,000 sequences)
    and store them in the file ``chimp.fna``, one returned line per output
    line.
    """
    query = 'chimpanzee[orgn] AND biomol mrna[prop]'
    with open('chimp.fna', 'w') as fout:
        # The search is started only after the output file has been opened.
        fasta_lines = entrez.on_search(db='nucleotide', term=query,
                                       tool='fetch', rettype='fasta')
        # Each yielded line gets a newline appended before it is written.
        fout.writelines(text + '\n' for text in fasta_lines)

Example #6

Show file

def application_3():
    """Sample Application 3: Retrieving large datasets

    Save all chimpanzee mRNA sequences in FASTA format (>50,000 sequences)
    to ``chimp.fna`` and then tell the user where the results are.
    """
    query = 'chimpanzee[orgn] AND biomol mrna[prop]'
    with open('chimp.fna', 'w') as fout:
        # Issue the search once the output file is open, then copy every
        # yielded line to the file with a trailing newline.
        hits = ez.on_search(db='nucleotide', term=query, tool='fetch',
                            rettype='fasta')
        for fasta_line in hits:
            fout.write(fasta_line + '\n')
    print('The results are in file chimp.fna.')

Example #7

Show file

File: sample_applications.py Project: khyox/entrez

def application_2():
    """Converting accession numbers to data.

    Take a fixed, comma-delimited list of accession numbers, turn it into a
    single ``[accn]`` query joined with OR, and print every line that
    ``entrez.on_search`` yields for it.  The search is issued with
    ``db='nucleotide'``, ``tool='fetch'``, ``db2='protein'`` and
    ``rettype='fasta'``.
    """
    # Input: the accessions, written as one comma-delimited string.
    accs = 'NM_009417,NM_000547,NM_001003009,NM_019353'.split(',')
    tagged = [acc + '[accn]' for acc in accs]
    query = ' OR '.join(tagged)

    # Output: whatever lines the fetch returns, printed one by one.
    fetched = entrez.on_search(
        db='nucleotide',
        term=query,
        tool='fetch',
        db2='protein',
        rettype='fasta',
    )
    for fasta_line in fetched:
        print(fasta_line)

Example #8

Show file

def application_2():
    """Sample Application 2: Converting accession numbers to data

    Build an OR-ed ``[accn]`` query from a fixed, comma-delimited list of
    accession numbers and print each line that ``ez.on_search`` yields when
    fetching from ``db='nuccore'`` with ``rettype='fasta'``.
    """
    # Input: the accessions, written as one comma-delimited string.
    accs = 'NM_009417,NM_000547,NM_001003009,NM_019353'.split(',')
    tagged = [acc + '[accn]' for acc in accs]
    query = ' OR '.join(tagged)

    # Output: the fetched lines, echoed to standard output.
    fetched = ez.on_search(db='nuccore', term=query, tool='fetch',
                           rettype='fasta')
    for fasta_line in fetched:
        print(fasta_line)