Exemple #1
0
def get_parsed_files_list(d):
    """Return the listing of ``d`` after it has been filtered.

    ``d`` is handed to ``fn.get_files`` and the resulting listing is passed
    through ``parse_files_list``; that function's result is returned as-is.
    """
    return parse_files_list(fn.get_files(d))
Exemple #2
0
inp1 = directory with maf and mod files
inp2 = Newick tree file
inp3 = output stump
'''
import os, sys, fn

# Positional command-line arguments:
#   1 -> directory that is searched for .maf files
#   2 -> tree file, resolved to an absolute path
#   3 -> prefix used for the two generated .runcc files
dir, newick, out_nm = (
    sys.argv[1],
    os.path.abspath(sys.argv[2]),
    sys.argv[3],
)


def copy_tree__write_runccs(tree, fl, m_runcc, p_runcc):
    """Copy the tree for one MAF file and queue its two phastCons commands.

    A copy of ``tree`` named ``<tree>.<maf basename without .maf>.nwk`` is
    created, then one command line is appended to each command file.

    Args:
        tree: path of the tree file to copy.
        fl: path of the MAF file; it is also the prefix of the ``.mod`` and
            ``.wig`` names that appear in the written commands.
        m_runcc: writable file object receiving the ``--estimate-trees``
            command.
        p_runcc: writable file object receiving the command whose output is
            redirected to ``<fl>.wig``.

    Raises:
        IOError / OSError: if ``tree`` cannot be copied to the new name.
    """
    import shutil  # local import: nothing else in the script needs it

    maf_label = fl.split("/")[-1].replace(".maf", "")
    new_tree = "%s.%s.nwk" % (tree, maf_label)

    # Copy in-process rather than shelling out to ``cp``: paths containing
    # spaces or shell metacharacters are handled correctly, and a failed copy
    # raises instead of being silently ignored.
    shutil.copy(tree, new_tree)

    model_command = (
        "module load PHAST;phastCons -i MAF --estimate-trees %s --no-post-probs %s %s.mod\n"
        % (new_tree, fl, fl)
    )
    m_runcc.write(model_command)

    phastCons_command = (
        "module load PHAST;phastCons -i MAF %s %s.cons.mod,%s.noncons.mod > %s.wig\n"
        % (fl, new_tree, new_tree, fl)
    )
    p_runcc.write(phastCons_command)


# Write one model-estimation command and one phastCons command for every path
# returned by fn.get_files(dir, ".maf", "tail").
files_list = fn.get_files(dir, ".maf", "tail")

# ``with`` guarantees both command files are flushed and closed even when a
# tree copy or a write fails part-way through the loop.
with open(out_nm + "-generate_models.runcc", "w") as model_runcc, \
        open(out_nm + "-run_phastCons.runcc", "w") as phastCons_runcc:
    for maf_path in files_list:
        copy_tree__write_runccs(newick, maf_path, model_runcc, phastCons_runcc)
# Usage banner; the parenthesised form prints the same text on Python 2 and 3.
print('''
inp1 = directory with .lav files
inp2 = output directory for .psl files
''')
import os, sys, fn

dir = sys.argv[1]
out_dir = os.path.abspath(sys.argv[2])

# Choose a job-script name that does not overwrite an earlier submission.
if os.path.isfile("lav2psl.sh"):
    # Count the job scripts this tool has already produced.  The previous
    # search pattern was "chain_psl", which does not match lav2psl scripts, so
    # the counter never advanced and "lav2psl_1.sh" kept being overwritten.
    # NOTE(review): assumes fn.get_files(".", pattern) lists files in the
    # current directory whose names contain the pattern -- confirm in fn.
    previous_scripts = fn.get_files(".", "lav2psl")
    qsub_name = "lav2psl_%i.sh" % (len(previous_scripts) + 1)
else:
    qsub_name = "lav2psl.sh"

files_list = fn.get_files(dir, ".lav", "tail")

# The job script is a PBS header followed by one lavToPsl call per input file.
with open(qsub_name, "w") as shell:
    shell.write('''#!/bin/bash -login
#PBS -q main
#PBS -l nodes=1:ppn=1,walltime=02:00:00,mem=1gb
''')
    for lav_path in files_list:
        lav_name = lav_path.split("/")[-1]
        if lav_name.endswith(".lav"):
            # Swap only the extension; a blanket replace("lav", "psl") would
            # also rewrite "lav" occurring elsewhere in the file name.
            psl_name = lav_name[:-len(".lav")] + ".psl"
        else:
            # Unexpected name: keep the historical substitution.
            psl_name = lav_name.replace("lav", "psl")
        shell.write("/mnt/home/lloydjo1/bin/liftOver/lavToPsl %s %s/%s\n" % (
            lav_path, out_dir, psl_name))

# Submit only after the script has been fully written and closed.
os.system("qsub %s" % qsub_name)
# Usage banner, printed on every run.
print('''
inp1 = directory with .chain files
inp2 = output name
''')
import os, sys, fn

# The output file is placed inside the (absolute) input directory and always
# carries the ".chain.sorted" suffix.
dir = os.path.abspath(sys.argv[1])
out_name = "%s/%s" % (dir, sys.argv[2])
if not out_name.endswith(".chain.sorted"):
    out_name += ".chain.sorted"

# First run uses the plain script name; later runs append a number derived
# from how many "chainMergeSort" entries fn.get_files reports in the cwd.
if os.path.isfile("chainMergeSort.sh"):
    earlier_scripts = fn.get_files(".", "chainMergeSort")
    qsub_name = "chainMergeSort_%i.sh" % (len(earlier_scripts) + 1)
else:
    qsub_name = "chainMergeSort.sh"

# PBS job: merge-sort every *.chain.sorted.merged file in ``dir`` into
# ``out_name``.
job_text = '''#!/bin/bash -login
#PBS -q main
#PBS -l nodes=1:ppn=1,walltime=01:00:00,mem=1gb
/mnt/home/lloydjo1/bin/liftOver/chainMergeSort %s/*.chain.sorted.merged > %s
''' % (dir, out_name)

with open(qsub_name, "w") as shell:
    shell.write(job_text)

os.system("qsub %s" % qsub_name)
# Usage banner, printed unconditionally on every run.
print('''
inp1 = directory with fasta files
''')
import os, sys, fn

# Directory to process, taken from the first command-line argument.
dir = sys.argv[1]


def parse_files_list(fl):
    """Return the entries of ``fl`` that are not derived/intermediate files.

    An entry is dropped when its name ends with ``lav``, ``psl``, ``nib`` or
    ``.sizes``; every other entry is kept, in its original order.

    Args:
        fl: iterable of file names or paths (strings).

    Returns:
        A new list containing the entries that were kept.
    """
    # str.endswith accepts a tuple, so one call covers all excluded endings.
    skipped_endings = ("lav", "psl", "nib", ".sizes")
    return [item for item in fl if not item.endswith(skipped_endings)]


# Run faSize on every entry of ``dir`` that passes parse_files_list, sending
# the tool's output to "<entry>.sizes".
fa_size_template = "/mnt/home/lloydjo1/bin/liftOver/faSize %s -detailed > %s.sizes"

files_list = fn.get_files(dir)
pfl = parse_files_list(files_list)
for fasta_path in pfl:
    print("Working on file: %s" % (fasta_path,))
    os.system(fa_size_template % (fasta_path, fasta_path))
# Usage banner, printed on every run.
print('''
inp1 = maf file 1
inp2 = maf file 2
inp3 = output name
''')
import os,sys,fn

# All three paths are made absolute before being written into the job script.
maf1, maf2, out_nm = (
    os.path.abspath(sys.argv[1]),
    os.path.abspath(sys.argv[2]),
    os.path.abspath(sys.argv[3]),
)

# First run uses the plain script name; later runs append a number derived
# from how many "multiz_submit" entries fn.get_files reports in the cwd.
if os.path.isfile("multiz_submit.sh"):
    earlier_scripts = fn.get_files(".", "multiz_submit")
    qsub_name = "multiz_submit%i.sh" % (len(earlier_scripts) + 1)
else:
    qsub_name = "multiz_submit.sh"

# PBS job: run multiz on the two MAF files, redirecting its output to out_nm.
job_text = '''#!/bin/bash -login
#PBS -q main
#PBS -l nodes=1:ppn=1,walltime=01:00:00,mem=1gb
/mnt/home/lloydjo1/bin/multiz-tba.012109/multiz %s %s v > %s
''' % (maf1, maf2, out_nm)

with open(qsub_name, "w") as shell:
    shell.write(job_text)

os.system("qsub %s" % qsub_name)