示例#1
0
def dnaseq_to_proteindb(ctx, config_file, input_fasta, translation_table,
                        num_orfs, num_orfs_complement, output_proteindb,
                        var_prefix, skip_including_all_cds, include_biotypes,
                        exclude_biotypes, biotype_str, expression_str,
                        expression_thresh):
    if input_fasta is None:
        print_help()

    pipeline_arguments = {}
    pipeline_arguments[
        EnsemblDataService.TRANSLATION_TABLE] = translation_table
    pipeline_arguments[EnsemblDataService.PROTEIN_DB_OUTPUT] = output_proteindb
    pipeline_arguments[EnsemblDataService.HEADER_VAR_PREFIX] = var_prefix
    pipeline_arguments[EnsemblDataService.EXCLUDE_BIOTYPES] = exclude_biotypes
    pipeline_arguments[
        EnsemblDataService.SKIP_INCLUDING_ALL_CDS] = skip_including_all_cds
    pipeline_arguments[EnsemblDataService.INCLUDE_BIOTYPES] = include_biotypes
    pipeline_arguments[EnsemblDataService.BIOTYPE_STR] = biotype_str
    pipeline_arguments[EnsemblDataService.NUM_ORFS] = num_orfs
    pipeline_arguments[
        EnsemblDataService.NUM_ORFS_COMPLEMENT] = num_orfs_complement
    pipeline_arguments[EnsemblDataService.EXPRESSION_STR] = expression_str
    pipeline_arguments[
        EnsemblDataService.EXPRESSION_THRESH] = expression_thresh

    ensembl_data_service = EnsemblDataService(config_file, pipeline_arguments)
    ensembl_data_service.dnaseq_to_proteindb(input_fasta)
示例#2
0
def vcf_to_proteindb(ctx, config_file, input_fasta, vcf, gene_annotations_gtf,
                     translation_table, mito_translation_table, var_prefix,
                     report_ref_seq, output_proteindb, annotation_field_name,
                     af_field, af_threshold, transcript_index,
                     consequence_index, exclude_consequences,
                     skip_including_all_cds, include_consequences,
                     ignore_filters, accepted_filters):
    if input_fasta is None or vcf is None or gene_annotations_gtf is None:
        print_help()

    pipeline_arguments = {
        EnsemblDataService.MITO_TRANSLATION_TABLE: mito_translation_table,
        EnsemblDataService.TRANSLATION_TABLE: translation_table,
        EnsemblDataService.HEADER_VAR_PREFIX: var_prefix,
        EnsemblDataService.REPORT_REFERENCE_SEQ: report_ref_seq,
        EnsemblDataService.PROTEIN_DB_OUTPUT: output_proteindb,
        EnsemblDataService.ANNOTATION_FIELD_NAME: annotation_field_name,
        EnsemblDataService.AF_FIELD: af_field,
        EnsemblDataService.AF_THRESHOLD: af_threshold,
        EnsemblDataService.TRANSCRIPT_INDEX: transcript_index,
        EnsemblDataService.CONSEQUENCE_INDEX: consequence_index,
        EnsemblDataService.EXCLUDE_CONSEQUENCES: exclude_consequences,
        EnsemblDataService.SKIP_INCLUDING_ALL_CDS: skip_including_all_cds,
        EnsemblDataService.INCLUDE_CONSEQUENCES: include_consequences,
        EnsemblDataService.IGNORE_FILTERS: ignore_filters,
        EnsemblDataService.ACCEPTED_FILTERS: accepted_filters
    }

    ensembl_data_service = EnsemblDataService(config_file, pipeline_arguments)
    ensembl_data_service.vcf_to_proteindb(vcf, input_fasta,
                                          gene_annotations_gtf)
示例#3
0
def ensembl_check(ctx, config_file, input_fasta, output, add_stop_codons, num_aa):
  if input_fasta is None:
    print_help()

  pipeline_arguments = {EnsemblDataService.PROTEIN_DB_OUTPUT: output}

  ensembl_data_service = EnsemblDataService(config_file, pipeline_arguments)
  ensembl_data_service.check_proteindb(input_fasta, add_stop_codons, num_aa)
def threeframe_translation(ctx, config_file, input_fasta, translation_table, output):
    if input_fasta is None:
        print_help()

    pipeline_arguments = {EnsemblDataService.TRANSLATION_TABLE: translation_table,
                          EnsemblDataService.PROTEIN_DB_OUTPUT: output}

    ensembl_data_service = EnsemblDataService(config_file, pipeline_arguments)
    ensembl_data_service.three_frame_translation(input_fasta)
示例#5
0
def cosmic_to_proteindb(ctx, config_file, input_mutation, input_genes, output_db, tissue_type, split_by_tissue_type):
    if input_mutation is None or input_genes is None or output_db is None:
        print_help()

    pipeline_arguments = {CancerGenomesService.CONFIG_CANCER_GENOMES_MUTATION_FILE: input_mutation,
                          CancerGenomesService.CONFIG_COMPLETE_GENES_FILE: input_genes,
                          CancerGenomesService.CONFIG_OUTPUT_FILE: output_db,
                          CancerGenomesService.TISSUE_TYPE: tissue_type,
                          CancerGenomesService.SPLIT_BY_TISSUE_TYPE: split_by_tissue_type}

    cosmic_to_proteindb_service = CancerGenomesService(config_file, pipeline_arguments)
    cosmic_to_proteindb_service.cosmic_to_proteindb()
def cosmic_to_proteindb(ctx, config_file, input_mutation, input_genes,
                        output_db, filter_column, accepted_values,
                        split_by_filter_column):
    if input_mutation is None or input_genes is None or output_db is None:
        print_help()

    pipeline_arguments = {
        CancerGenomesService.CONFIG_CANCER_GENOMES_MUTATION_FILE:
        input_mutation,
        CancerGenomesService.CONFIG_COMPLETE_GENES_FILE: input_genes,
        CancerGenomesService.CONFIG_OUTPUT_FILE: output_db,
        CancerGenomesService.FILTER_COLUMN: filter_column,
        CancerGenomesService.ACCEPTED_VALUES: accepted_values,
        CancerGenomesService.SPLIT_BY_FILTER_COLUMN: split_by_filter_column
    }

    cosmic_to_proteindb_service = CancerGenomesService(config_file,
                                                       pipeline_arguments)
    cosmic_to_proteindb_service.cosmic_to_proteindb()
示例#7
0
def vcf_to_proteindb(
        ctx, config_file, input_fasta, vep_annotated_vcf, gene_annotations_gtf,
        translation_table, mito_translation_table, var_prefix, report_ref_seq,
        output_proteindb, annotation_field_name, af_field, af_threshold,
        transcript_index, consequence_index, exclude_biotypes,
        exclude_consequences, skip_including_all_cds, include_biotypes,
        include_consequences, biotype_str, ignore_filters, accepted_filters):
    if input_fasta is None or vep_annotated_vcf is None or gene_annotations_gtf is None:
        print_help()

    pipeline_arguments = {}
    pipeline_arguments[
        EnsemblDataService.MITO_TRANSLATION_TABLE] = mito_translation_table
    pipeline_arguments[
        EnsemblDataService.TRANSLATION_TABLE] = translation_table
    pipeline_arguments[EnsemblDataService.HEADER_VAR_PREFIX] = var_prefix
    pipeline_arguments[
        EnsemblDataService.REPORT_REFERENCE_SEQ] = report_ref_seq
    pipeline_arguments[EnsemblDataService.PROTEIN_DB_OUTPUT] = output_proteindb
    pipeline_arguments[
        EnsemblDataService.ANNOTATION_FIELD_NAME] = annotation_field_name
    pipeline_arguments[EnsemblDataService.AF_FIELD] = af_field
    pipeline_arguments[EnsemblDataService.AF_THRESHOLD] = af_threshold
    pipeline_arguments[EnsemblDataService.TRANSCRIPT_INDEX] = transcript_index
    pipeline_arguments[
        EnsemblDataService.CONSEQUENCE_INDEX] = consequence_index
    pipeline_arguments[EnsemblDataService.EXCLUDE_BIOTYPES] = exclude_biotypes
    pipeline_arguments[
        EnsemblDataService.EXCLUDE_CONSEQUENCES] = exclude_consequences
    pipeline_arguments[
        EnsemblDataService.SKIP_INCLUDING_ALL_CDS] = skip_including_all_cds
    pipeline_arguments[EnsemblDataService.INCLUDE_BIOTYPES] = include_biotypes
    pipeline_arguments[
        EnsemblDataService.INCLUDE_CONSEQUENCES] = include_consequences
    pipeline_arguments[EnsemblDataService.BIOTYPE_STR] = biotype_str
    pipeline_arguments[EnsemblDataService.IGNORE_FILTERS] = ignore_filters
    pipeline_arguments[EnsemblDataService.ACCEPTED_FILTERS] = accepted_filters

    ensembl_data_service = EnsemblDataService(config_file, pipeline_arguments)
    ensembl_data_service.vcf_to_proteindb(vep_annotated_vcf, input_fasta,
                                          gene_annotations_gtf)