Python generate_hits示例

编程语言: Python

命名空间/包名称: edl.blastm8

方法/功能: generate_hits

hotexamples.com的示例: 5

Python generate_hits - 共找到 5 个示例。以下是从开源项目中提取的、评分最高的 edl.blastm8.generate_hits 实际 Python 用法示例。您可以为示例评分，帮助我们提高示例质量。

示例#1

显示文件

文件： merge_gffs.py 项目： jmeppley/py-metagenomics

def merge_gffs(rna_gff_files, cds_gff_files, contigs_fasta_file,
               output_file_prefix):
    """
    Combine RNA and CDS annotations and write them to three output files.

    Each file in rna_gff_files is parsed with get_gff_hits. Each file in
    cds_gff_files is read with generate_hits (GFF format, sorted by
    'score'); a CDS hit is kept only when the second element of the value
    returned by its checkForOverlap() against the RNA regions is None.

    The collected hits and contigs_fasta_file are passed to
    write_annotations_to_files together with three files opened for
    writing: <output_file_prefix>.gff, .fna and .faa.
    """
    # RNA hits, keyed by the GFF file they were parsed from
    rna_hits = {}
    for rna_gff_file in rna_gff_files:
        rna_hits[rna_gff_file] = get_gff_hits(rna_gff_file)

    # CDS hits, keyed by contig
    cds_hits = {}
    for cds_gff_file in cds_gff_files:
        cds_groups = generate_hits(cds_gff_file, format=GFF, sort='score')
        for contig, hits in cds_groups:
            # regions with rRNAs on this contig
            rna_regions = get_rna_regions(rna_hits, contig)

            # keep only the CDSs that don't overlap those regions
            contig_cds = cds_hits.setdefault(contig, [])
            kept = [hit for hit in hits
                    if hit.checkForOverlap(rna_regions)[1] is None]
            contig_cds.extend(kept)

    # one dict of hits per RNA file, followed by the CDS dict
    hit_list_dicts = list(rna_hits.values()) + [cds_hits]

    # open all three outputs in a single with statement
    with open(output_file_prefix + ".gff", 'w') as gff_out, \
            open(output_file_prefix + ".fna", 'w') as fna_out, \
            open(output_file_prefix + ".faa", 'w') as faa_out:
        write_annotations_to_files(hit_list_dicts,
                                   contigs_fasta_file,
                                   gff_out,
                                   fna_out,
                                   faa_out)

示例#2

显示文件

文件： merge_gffs.py 项目： jmeppley/py-metagenomics

def get_gff_hits(hit_table_gff, **filter_args):
    """
    Load the hits from a GFF hit table into a dict of lists.

    Any keyword arguments are forwarded to generate_hits. When the caller
    does not supply them, 'sort' defaults to 'score' and 'nonoverlapping'
    defaults to True.

    Returns a dict mapping the first item of each pair yielded by
    generate_hits to a list built from the second item.
    """
    # fill in defaults without overriding anything the caller passed
    for option, default in (('sort', 'score'), ('nonoverlapping', True)):
        filter_args.setdefault(option, default)

    hits_by_key = {}
    for key, hit_iter in generate_hits(hit_table_gff,
                                       format=GFF,
                                       **filter_args):
        # materialize the hits so they can be reused later
        hits_by_key[key] = list(hit_iter)
    return hits_by_key

示例#3

显示文件

文件： merge_gffs.py 项目： Piplopp/py-metagenomics

def merge_gffs(rna_gff_files, cds_gff_files, contigs_fasta_file,
               output_file_prefix):
    """
    Merge RNA and CDS GFF annotations into .gff, .fna and .faa files.

    RNA files are parsed with get_gff_hits. CDS files are streamed through
    generate_hits (GFF format, sorted by 'score'), and only the CDS hits
    whose checkForOverlap() result has None as its second element are
    retained. Everything is then written out by write_annotations_to_files
    using contigs_fasta_file and three output files named from
    output_file_prefix.
    """
    # parse RNA GFF files (one dict of hits per file)
    rna_hits = {path: get_gff_hits(path) for path in rna_gff_files}

    # parse CDS files, grouping retained hits by contig
    cds_hits = {}
    for cds_path in cds_gff_files:
        for contig, hits in generate_hits(cds_path,
                                          format=GFF,
                                          sort='score'):
            # regions with rRNAs for this contig
            rna_regions = get_rna_regions(rna_hits, contig)

            # gather the CDSs that don't overlap, then add them in one go
            target = cds_hits.setdefault(contig, [])
            non_overlapping = []
            for hit in hits:
                if hit.checkForOverlap(rna_regions)[1] is None:
                    non_overlapping.append(hit)
            target.extend(non_overlapping)

    # the source data: RNA dicts first, CDS dict last
    hit_list_dicts = list(rna_hits.values())
    hit_list_dicts.append(cds_hits)

    # output files
    gff_path = output_file_prefix + ".gff"
    fna_path = output_file_prefix + ".fna"
    faa_path = output_file_prefix + ".faa"
    with open(gff_path, 'w') as gff_handle, \
            open(fna_path, 'w') as fna_handle, \
            open(faa_path, 'w') as faa_handle:
        write_annotations_to_files(hit_list_dicts,
                                   contigs_fasta_file,
                                   gff_handle,
                                   fna_handle,
                                   faa_handle)

示例#4

显示文件

文件： merge_gffs.py 项目： jmeppley/py-metagenomics

def get_gff_hits(hit_table_gff, **filter_args):
    """
    Read a GFF hit table and return its hits as a dict of lists.

    Extra keyword arguments are passed straight through to generate_hits.
    If the caller omits them, 'sort' is set to 'score' and 'nonoverlapping'
    is set to True.

    Each (key, hits) pair yielded by generate_hits becomes one entry, with
    the hits copied into a list.
    """
    # apply defaults only for options the caller left out
    if 'sort' not in filter_args:
        filter_args['sort'] = 'score'
    if 'nonoverlapping' not in filter_args:
        filter_args['nonoverlapping'] = True

    grouped = generate_hits(hit_table_gff, format=GFF, **filter_args)
    return dict((key, list(hits)) for key, hits in grouped)

示例#5

显示文件

文件： merge_gffs.py 项目： jmeppley/py-metagenomics

def get_gff_hits(hit_table_gff, **filter_args):
    """
    Collect the output of generate_hits for a GFF hit table into a dict.

    All keyword arguments are forwarded unchanged to generate_hits. Each
    (key, hits) pair it yields becomes one dict entry whose value is a
    list of the hits.
    """
    collected = {}
    for key, hits in generate_hits(hit_table_gff,
                                   format=GFF,
                                   **filter_args):
        collected[key] = list(hits)
    return collected