Python Pipeline.submit Beispiele

Programmiersprache: Python

Namespace / Paketname: CGAT

Klasse / Typ: Pipeline

Methode / Funktion: submit

Beispiele auf hotexamples.com: 21

Python Pipeline.submit – 21 Beispiele gefunden. Dies sind die am besten bewerteten Python-Beispiele für CGAT.Pipeline.submit, die aus Open-Source-Projekten extrahiert wurden. Sie können Beispiele bewerten, um die Qualität der Beispiele zu verbessern.

Häufig verwendete Methoden

Anzeigen Verbergen

snip(30)

asList(30)

run(30)

touch(30)

toTable(30)

load(30)

getTempFilename(30)

getTempFile(30)

getTempDir(23)

getParameters(14)

PipelineError(12)

submit(11)

publish_report(8)

peekParameters(6)

asDict(5)

quote(5)

warn(4)

getProjectId(3)

info(3)

isEmpty(3)

run_report(3)

substituteParameters(3)

mergeAndLoad(3)

joinStatements(2)

which(2)

checkParameter(2)

matchParameter(1)

main(1)

loadParameters(1)

isTrue(1)

getProjectName(1)

execute(1)

concatenateAndLoad(1)

checkFiles(1)

checkExecutables(1)

Beispiel #1

Datei anzeigen

Datei: pipeline_metagenomebenchmark.py Projekt: Charlie-George/cgat

def buildExpectedGenomeCoverage(infiles, outfile):
    """Build the expected coverage over the genomes in the sample.

    The expectation is based on read depth and length.  The work is
    handed to ``buildExpectedCoverageOverGenomes`` in the
    ``PipelineMetagenomeBenchmark`` module through ``P.submit``;
    ``infiles`` is forwarded unchanged and ``outfile`` is passed as
    ``outfiles``.
    """
    target_module = "PipelineMetagenomeBenchmark"
    target_function = "buildExpectedCoverageOverGenomes"
    P.submit(target_module,
             target_function,
             infiles=infiles,
             outfiles=outfile)

Beispiel #2

Datei anzeigen

Datei: pipeline_metagenomebenchmark.py Projekt: Charlie-George/cgat

def buildCoverageOverGenomes(infiles, outfile):
    """Create a file with the coverage over each simulated genome.

    Delegates to ``buildCoverageOverGenomes`` in the
    ``PipelineMetagenomeBenchmark`` module via ``P.submit``, forwarding
    ``infiles`` and passing ``outfile`` as ``outfiles``.
    """
    submit_kwargs = {"infiles": infiles, "outfiles": outfile}
    P.submit("PipelineMetagenomeBenchmark",
             "buildCoverageOverGenomes",
             **submit_kwargs)

Beispiel #3

Datei anzeigen

Datei: pipeline_metagenomebenchmark.py Projekt: lesheng/cgat

def filterContigsByCoverage(infiles, outfile):
    """Filter contigs by their average base coverage.

    Delegates to ``filterByCoverage`` in the
    ``PipelineMetagenomeBenchmark`` module via ``P.submit``, forwarding
    ``infiles`` and passing ``outfile`` as ``outfiles``.
    """
    target_module = "PipelineMetagenomeBenchmark"
    target_function = "filterByCoverage"
    P.submit(target_module, target_function,
             infiles=infiles, outfiles=outfile)

Beispiel #4

Datei anzeigen

Datei: pipeline_metagenomebenchmark.py Projekt: lesheng/cgat

def buildCoverageOverGenomes(infiles, outfile):
    """Write the coverage over each of the simulated genomes to a file.

    The computation is handed to ``buildCoverageOverGenomes`` in the
    ``PipelineMetagenomeBenchmark`` module through ``P.submit``;
    ``infiles`` is forwarded as given and ``outfile`` is passed as
    ``outfiles``.
    """
    target_module = "PipelineMetagenomeBenchmark"
    target_function = "buildCoverageOverGenomes"
    P.submit(target_module, target_function,
             infiles=infiles, outfiles=outfile)

Beispiel #5

Datei anzeigen

Datei: pipeline_idr.py Projekt: jmadzo/cgat

def findNPeaksForPooledPseudoreplicates(infiles, outfile):
    """Submit ``findNPeaks`` for the pooled pseudoreplicates.

    The threshold is read from
    ``PARAMS["idr_options_pooled_consistency_threshold"]`` and passed to
    ``P.submit`` as a single string parameter, together with ``infiles``
    and ``outfile`` (as ``outfiles``).

    The target module is ``IDR.__file__`` with its file suffix removed.
    """
    idr_thresh = PARAMS["idr_options_pooled_consistency_threshold"]

    # IDR.__file__ may name the source file (.py) or compiled bytecode
    # (.pyc).  P.snip raises ValueError when the suffix does not match, so
    # fall back to the other suffix instead of failing outright.
    try:
        module = P.snip(IDR.__file__, ".py")
    except ValueError:
        module = P.snip(IDR.__file__, ".pyc")

    P.submit(module,
             "findNPeaks",
             params=[str(idr_thresh), ],
             infiles=infiles,
             outfiles=outfile)

Beispiel #6

Datei anzeigen

Datei: pipeline_idr.py Projekt: jmadzo/cgat

def findNPeaksForIndividualReplicates(infiles, outfile):
    """Submit ``findNPeaks`` for the individual replicates.

    The threshold is read from
    ``PARAMS["idr_options_inter_replicate_threshold"]`` and passed to
    ``P.submit`` as a single string parameter, together with ``infiles``
    and ``outfile`` (as ``outfiles``).

    The target module is ``IDR.__file__`` with its file suffix removed.
    """
    idr_thresh = PARAMS["idr_options_inter_replicate_threshold"]

    # IDR.__file__ may name the source file (.py) or compiled bytecode
    # (.pyc).  P.snip raises ValueError when the suffix does not match, so
    # fall back to the other suffix instead of failing outright.
    try:
        module = P.snip(IDR.__file__, ".py")
    except ValueError:
        module = P.snip(IDR.__file__, ".pyc")

    P.submit(module,
             "findNPeaks",
             params=[str(idr_thresh), ],
             infiles=infiles,
             outfiles=outfile)

Beispiel #7

Datei anzeigen

def findNPeaksForPooledPseudoreplicates(infiles, outfile):
    """Submit ``findNPeaks`` for the pooled pseudoreplicates.

    The threshold is read from
    ``PARAMS["idr_options_pooled_consistency_threshold"]`` and passed to
    ``P.submit`` as a single string parameter, together with ``infiles``
    and ``outfile`` (as ``outfiles``).

    The target module is ``IDR.__file__`` with its file suffix removed.
    """
    idr_thresh = PARAMS["idr_options_pooled_consistency_threshold"]

    # The original only stripped ".pyc", which fails with ValueError when
    # IDR.__file__ names the ".py" source.  Accept either suffix; a path
    # ending in ".pyc" still resolves exactly as before.
    try:
        module = P.snip(IDR.__file__, ".py")
    except ValueError:
        module = P.snip(IDR.__file__, ".pyc")

    P.submit(module,
             "findNPeaks",
             params=[str(idr_thresh), ],
             infiles=infiles,
             outfiles=outfile)

Beispiel #8

Datei anzeigen

def findNPeaksForIndividualReplicates(infiles, outfile):
    """Submit ``findNPeaks`` for the individual replicates.

    The threshold is read from
    ``PARAMS["idr_options_inter_replicate_threshold"]`` and passed to
    ``P.submit`` as a single string parameter, together with ``infiles``
    and ``outfile`` (as ``outfiles``).

    The target module is ``IDR.__file__`` with its file suffix removed.
    """
    idr_thresh = PARAMS["idr_options_inter_replicate_threshold"]

    # The original only stripped ".pyc", which fails with ValueError when
    # IDR.__file__ names the ".py" source.  Accept either suffix; a path
    # ending in ".pyc" still resolves exactly as before.
    try:
        module = P.snip(IDR.__file__, ".py")
    except ValueError:
        module = P.snip(IDR.__file__, ".pyc")

    P.submit(module,
             "findNPeaks",
             params=[str(idr_thresh), ],
             infiles=infiles,
             outfiles=outfile)

Beispiel #9

Datei anzeigen

Datei: pipeline_metagenomebenchmark.py Projekt: lesheng/cgat

def buildExpectedGenomeCoverage(infiles, outfile):
    """Build the expected coverage over the genomes in the sample.

    The expectation is based on read depth and length.  Delegates to
    ``buildExpectedCoverageOverGenomes`` in the
    ``PipelineMetagenomeBenchmark`` module via ``P.submit``, forwarding
    ``infiles`` and passing ``outfile`` as ``outfiles``.
    """
    submit_kwargs = {"infiles": infiles, "outfiles": outfile}
    P.submit("PipelineMetagenomeBenchmark",
             "buildExpectedCoverageOverGenomes",
             **submit_kwargs)

Beispiel #10

Datei anzeigen

Datei: pipeline_idr.py Projekt: Charlie-George/cgat

def findNPeaksForPseudoreplicates(infiles, outfile):
    """Submit ``findNPeaks`` for the pseudoreplicates.

    The threshold is read from
    ``PARAMS["idr_options_self_consistency_threshold"]`` and passed to
    ``P.submit`` as a single string parameter.  The target module is
    ``IDR.__file__`` with ``.py`` snipped off, or with ``.pyc`` snipped
    off when snipping ``.py`` raises ``ValueError``.
    """
    threshold = PARAMS["idr_options_self_consistency_threshold"]

    try:
        target_module = P.snip(IDR.__file__, ".py")
    except ValueError:
        # Not a ".py" path; try the compiled-bytecode suffix instead.
        target_module = P.snip(IDR.__file__, ".pyc")

    submit_kwargs = {
        "params": [str(threshold)],
        "infiles": infiles,
        "outfiles": outfile,
    }
    P.submit(target_module, "findNPeaks", **submit_kwargs)

Beispiel #11

Datei anzeigen

def splitPooledBamfiles(infile, sentinel):
    """Submit ``splitBam`` for a pooled bam file, then touch the sentinel.

    The bam path is ``infile`` with ``.sentinel`` replaced by ``.bam``;
    the output stem is ``sentinel`` with ``.sentinel`` removed.  The
    string ``'2'`` is passed as the parameter argument.  The target module
    is ``IDR.__file__`` with ``.py`` (or, failing that, ``.pyc``) snipped
    off.
    """
    bam_path = P.snip(infile, ".sentinel") + ".bam"
    out_stem = P.snip(sentinel, ".sentinel")
    split_params = '2'

    try:
        target_module = P.snip(IDR.__file__, ".py")
    except ValueError:
        # Not a ".py" path; try the compiled-bytecode suffix instead.
        target_module = P.snip(IDR.__file__, ".pyc")

    P.submit(target_module,
             "splitBam",
             split_params,
             bam_path,
             out_stem)

    P.touch(sentinel)

Beispiel #12

Datei anzeigen

Datei: pipeline_idr.py Projekt: jmadzo/cgat

def splitPooledBamfiles(infile, sentinal):
    """Submit ``splitBam`` for a pooled bam file, then touch the sentinel.

    The bam path is ``infile`` with ``.sentinal`` replaced by ``.bam``;
    the output stem is ``sentinal`` with ``.sentinal`` removed.  The
    string ``'2'`` is passed as the parameter argument.

    The target module is ``IDR.__file__`` with its file suffix removed.
    """
    infile = P.snip(infile, ".sentinal") + ".bam"
    outfile = P.snip(sentinal, ".sentinal")
    params = '2'

    # IDR.__file__ may name the source file (.py) or compiled bytecode
    # (.pyc).  P.snip raises ValueError when the suffix does not match, so
    # fall back to the other suffix instead of failing outright.
    try:
        module = P.snip(IDR.__file__, ".py")
    except ValueError:
        module = P.snip(IDR.__file__, ".pyc")

    P.submit(module,
             "splitBam",
             params,
             infile,
             outfile)

    P.touch(sentinal)

Beispiel #13

Datei anzeigen

def splitPooledBamfiles(infile, sentinal):
    """Submit ``splitBam`` for a pooled bam file, then touch the sentinel.

    The bam path is ``infile`` with ``.sentinal`` replaced by ``.bam``;
    the output stem is ``sentinal`` with ``.sentinal`` removed.  The
    string ``'2'`` is passed as the parameter argument.

    The target module is ``IDR.__file__`` with its file suffix removed.
    """
    infile = P.snip(infile, ".sentinal") + ".bam"
    outfile = P.snip(sentinal, ".sentinal")
    params = '2'

    # The original only stripped ".pyc", which fails with ValueError when
    # IDR.__file__ names the ".py" source.  Accept either suffix; a path
    # ending in ".pyc" still resolves exactly as before.
    try:
        module = P.snip(IDR.__file__, ".py")
    except ValueError:
        module = P.snip(IDR.__file__, ".pyc")

    P.submit(module,
             "splitBam",
             params,
             infile,
             outfile)

    P.touch(sentinal)

Beispiel #14

Datei anzeigen

def findNPeaksForPseudoreplicates(infiles, outfile):
    """Submit ``findNPeaks`` for the pseudoreplicates.

    Reads the threshold from
    ``PARAMS["idr_options_self_consistency_threshold"]`` and hands it to
    ``P.submit`` as a one-element list of strings, along with ``infiles``
    and ``outfile`` (as ``outfiles``).  The target module is
    ``IDR.__file__`` with ``.py`` snipped off, falling back to ``.pyc``
    when snipping ``.py`` raises ``ValueError``.
    """
    threshold = PARAMS["idr_options_self_consistency_threshold"]

    try:
        target_module = P.snip(IDR.__file__, ".py")
    except ValueError:
        # Not a ".py" path; try the compiled-bytecode suffix instead.
        target_module = P.snip(IDR.__file__, ".pyc")

    threshold_params = [str(threshold)]
    P.submit(target_module, "findNPeaks",
             params=threshold_params, infiles=infiles, outfiles=outfile)

Beispiel #15

Datei anzeigen

def splitBamfiles(infile, sentinel):
    """Split the filtered bam file of a track in two.

    The original note says the split is done with pysam; here the work is
    handed to ``splitBam`` through ``P.submit``.  The bam path is
    ``infile`` with ``.sentinel`` replaced by ``.bam``, the output stem is
    ``sentinel`` with ``.sentinel`` removed, and ``'2'`` is passed as the
    parameter argument.  The sentinel is touched afterwards.
    """
    bam_path = P.snip(infile, ".sentinel") + ".bam"
    out_stem = P.snip(sentinel, ".sentinel")
    split_params = '2'

    try:
        target_module = P.snip(IDR.__file__, ".py")
    except ValueError:
        # Not a ".py" path; try the compiled-bytecode suffix instead.
        target_module = P.snip(IDR.__file__, ".pyc")

    P.submit(target_module,
             "splitBam",
             split_params,
             bam_path,
             out_stem)

    P.touch(sentinel)

Beispiel #16

Datei anzeigen

Datei: pipeline_idr.py Projekt: jmadzo/cgat

def splitBamfiles(infile, sentinal):
    """Split the filtered bam file of a track in two.

    The original note says the split is done with pysam; here the work is
    handed to ``splitBam`` through ``P.submit``.  The bam path is
    ``infile`` with ``.sentinal`` replaced by ``.bam``, the output stem is
    ``sentinal`` with ``.sentinal`` removed, and ``'2'`` is passed as the
    parameter argument.  The sentinel is touched afterwards.

    The target module is ``IDR.__file__`` with its file suffix removed.
    """
    infile = P.snip(infile, ".sentinal") + ".bam"
    outfile = P.snip(sentinal, ".sentinal")
    params = '2'

    # The original only stripped ".pyc", which fails with ValueError when
    # IDR.__file__ names the ".py" source.  Accept either suffix; a path
    # ending in ".pyc" still resolves exactly as before.
    try:
        module = P.snip(IDR.__file__, ".py")
    except ValueError:
        module = P.snip(IDR.__file__, ".pyc")

    P.submit(module,
             "splitBam",
             params,
             infile,
             outfile)

    P.touch(sentinal)

Beispiel #17

Datei anzeigen

Datei: pipeline_metagenomebenchmark.py Projekt: yangjl/cgat

def buildChimerasBasedOnReads(infile, outfile):
    """Score contigs for chimericity based on read alignments.

    This is an alternative to counting a contig as a chimera whenever it
    aligns to more than one genome.  A contig is likely to align to
    multiple genomes with high identity if the sample contains very
    similar genomes.  That is the case for our simulation, which contains
    subspecies of the same species (e.g. B. fragilis subspecies).

    A more appropriate way of assessing chimericity is to give each
    contig a chimericity score: the ratio of "good" alignments to "bad"
    alignments.  An alignment is considered "good" if it comes from the
    species from which the majority of that contig's alignments are
    derived.

    The work is handed to ``buildChimerasBasedOnReads`` in
    ``CGATPipelines.PipelineMetagenomeBenchmark`` via ``P.submit``.
    """
    submit_kwargs = {"infiles": infile, "outfiles": outfile}
    P.submit("CGATPipelines.PipelineMetagenomeBenchmark",
             "buildChimerasBasedOnReads",
             **submit_kwargs)

Beispiel #18

Datei anzeigen

Datei: pipeline_idr.py Projekt: Charlie-George/cgat

def splitPooledBamfiles(infile, sentinel):
    """Submit ``splitBam`` for a pooled bam file, then touch the sentinel.

    The bam path is ``infile`` with ``.sentinel`` replaced by ``.bam``;
    the output stem is ``sentinel`` with ``.sentinel`` removed.  ``'2'``
    is passed as the parameter argument.  The target module is
    ``IDR.__file__`` with ``.py`` snipped off, falling back to ``.pyc``
    when snipping ``.py`` raises ``ValueError``.
    """
    bam_path = P.snip(infile, ".sentinel") + ".bam"
    out_stem = P.snip(sentinel, ".sentinel")
    split_params = '2'

    try:
        target_module = P.snip(IDR.__file__, ".py")
    except ValueError:
        # Not a ".py" path; try the compiled-bytecode suffix instead.
        target_module = P.snip(IDR.__file__, ".pyc")

    P.submit(target_module, "splitBam", split_params, bam_path, out_stem)

    P.touch(sentinel)

Beispiel #19

Datei anzeigen

Datei: pipeline_metagenomebenchmark.py Projekt: lesheng/cgat

def buildChimerasBasedOnReads(infile, outfile):
    """Assess contig chimericity from read alignments.

    Counting a contig as a chimera because it aligns to more than one
    genome is problematic: a contig is likely to align to multiple genomes
    with high identity when the sample contains very similar genomes, as
    our simulation does (subspecies of the same species, e.g. B. fragilis
    subspecies).

    As an alternative, each contig is given a chimericity score, the
    ratio of "good" alignments to "bad" alignments.  An alignment is
    "good" if it is from the species from which the majority of
    alignments for that contig are derived.

    Delegates to ``buildChimerasBasedOnReads`` in
    ``CGATPipelines.PipelineMetagenomeBenchmark`` via ``P.submit``.
    """
    target_module = "CGATPipelines.PipelineMetagenomeBenchmark"
    target_function = "buildChimerasBasedOnReads"
    P.submit(target_module, target_function,
             infiles=infile, outfiles=outfile)

Beispiel #20

Datei anzeigen

def buildCoverageOverContigs(infiles, outfile):
    '''
    Build histograms of the coverage over each of the contigs.

    The first element of ``infiles`` is taken as the bam file.  It is
    first passed through ``filterBamOnPos`` (via ``P.submit``) into a
    temporary bam file; ``genomeCoverageBed -d`` is then run on that
    temporary file and its gzip-compressed output is written to
    ``outfile``.  The temporary directory is removed by the same shell
    statement.

    If ``PARAMS`` has a truthy ``coverage_scale`` entry, the number of
    mapped reads is looked up in the alignment-stats table and a
    ``-scale`` option is prepared from it.
    '''
    bam = infiles[0]
    # genomecoveragebed does not like some of the
    # output from bwa. bwa outputs some reads
    # that map off the end of contigs
    # as having a leftmost position of 0. This is
    # not ideal. Need to use temporary bam
    # files with only mapped reads - this is
    # nasty and needs changing
    tempdir = P.getTempDir(".")
    tempname = P.getTempFilename(tempdir) + ".bam"
    P.submit("CGATPipelines.PipelineMetagenomeAssembly", 
             "filterBamOnPos", 
             infiles = bam, 
             outfiles = tempname)

    # tablename where alignment stats live: the bam's directory name with
    # its last len(".dir") characters dropped, "_", the bam's basename
    # without ".bam", and the suffix "_alignment_stats".
    # NOTE(review): assumes the directory name ends in ".dir" - the slice
    # removes four characters regardless; confirm against callers.
    tablename = os.path.dirname(
        bam)[:-len(".dir")] + "_" + P.snip(os.path.basename(bam), ".bam") + "_alignment_stats"

    # hack to convert to table - add .load
    tablename = P.toTable(tablename + ".load")
    
    # connect to database
    dbh = connect()
    cc = dbh.cursor()

    # get number of reads aligned from bam2stats
    if PARAMS.get("coverage_scale"):
        # The table name is interpolated directly into the SQL text.
        scale_factor = cc.execute("""SELECT counts FROM %s
                                     WHERE category == 'reads_mapped'""" % tablename).fetchone()[0]
        # one million divided by the number of mapped reads
        scale_factor = 1 / (float(scale_factor) / 1000000)
        # NOTE(review): this option string itself contains a
        # %(scale_factor)f placeholder; whether it gets expanded depends
        # on how P.run() interpolates the statement - confirm.
        scale_options = "-scale %(scale_factor)f"
    else:
        scale_options = ""

    # NOTE(review): P.run() is called without arguments, so it presumably
    # picks up `statement` and the values for the %(...)s placeholders
    # from this function's local variables - confirm before renaming or
    # removing any local here.
    statement = '''genomeCoverageBed -ibam %(tempname)s %(scale_options)s -d | gzip > %(outfile)s;
                   rm -rf %(tempdir)s'''
    P.run()

Beispiel #21

Datei anzeigen

Datei: pipeline_metagenomebenchmark.py Projekt: yangjl/cgat

def filterContigsByCoverage(infiles, outfile):
    """Filter contigs by their average base coverage.

    The work is handed to ``filterByCoverage`` in the
    ``PipelineMetagenomeBenchmark`` module through ``P.submit``;
    ``infiles`` is forwarded unchanged and ``outfile`` is passed as
    ``outfiles``.
    """
    submit_kwargs = {"infiles": infiles, "outfiles": outfile}
    P.submit("PipelineMetagenomeBenchmark",
             "filterByCoverage",
             **submit_kwargs)