예제 #1
0
                writer.write(line.upper())
            else:
                writer.write(line)

original_backbone = MutableAlignment()
done = original_backbone.read_filepath(new_backbone_file)

# all query sequences
original_frag_file = (
    '/Users/gillianchu/warnow/bin/gitrepos/smirarab-sepp-17a33aa/trial/all_query.txt'
)
original_frag = MutableAlignment()
done = original_frag.read_filepath(original_frag_file)

# First build extended alignment on entire fragment set
extendedAlignment = ExtendedAlignment(original_frag.get_sequence_names())
dir = '/Users/gillianchu/warnow/bin/gitrepos/smirarab-sepp-17a33aa/trial/'

for a in [1, 2]:
    a = str(a)
    print("Working on HMM %s\n" % a)

    # query sequences
    aligned_files = glob.glob(str(dir) + 's' + str(a) + '_query.aln')
    if a == '1':
        sequence_files = glob.glob(str(dir) + 'query_x.txt')
    elif a == '2':
        sequence_files = glob.glob(str(dir) + 'query_y.txt')

    # sequences your hmm was trained on. Ensure you didn't just take the backbone alignment and
    # restrict the subset of sequences. This file must not have any gaps in it.
예제 #2
0
from sepp.scheduler import JobPool
from multiprocessing import Pool, Manager
from sepp.alignment import ExtendedAlignment
import glob

job_joiner = JoinAlignJobs
original_backbone_file = '/projects/sate8/namphuon/ultra_large/1000000/sate.fasta'
original_backbone = MutableAlignment()
done = original_backbone.read_filepath(original_backbone_file)

original_frag_file = '/projects/sate8/namphuon/ultra_large/1000000/initial.fas.100'
original_frag = MutableAlignment()
done = original_frag.read_filepath(original_frag_file)

#First build extended alignment on entire fragment set
extendedAlignment = ExtendedAlignment(original_frag.get_sequence_names())

dirs = glob.glob('/projects/sate8/namphuon/ultra_large/1000000/upp_100_10_new/temp/upp.1_HNlM/root/P_0/A_0_*/')

dirs.reverse()
for dir in dirs:
  print "Working on %s\n" % dir
  aligned_files = glob.glob('%sFC_*/hmmalign.results.*' % dir)
  sequence_files = glob.glob('%sFC_*/hmmalign.frag.*' % dir)
  base_alignment_file = glob.glob('%s/*.fasta' % dir)
  base_alignment = MutableAlignment()
  done = base_alignment.read_filepath(base_alignment_file[0])
  subbackbone = original_backbone.get_soft_sub_alignment(base_alignment.get_sequence_names())
  frags = MutableAlignment()
  sequence_names = []
  for file in sequence_files:
예제 #3
0
from sepp.problem import SeppProblem
import glob

job_joiner = JoinAlignJobs
original_backbone_file = ('/projects/sate8/namphuon/ultra_large/1000000/'
                          'sate.fasta')
original_backbone = MutableAlignment()
done = original_backbone.read_filepath(original_backbone_file)

original_frag_file = ('/projects/sate8/namphuon/ultra_large/1000000/'
                      'initial.fas.100')
original_frag = MutableAlignment()
done = original_frag.read_filepath(original_frag_file)

# First build extended alignment on entire fragment set
extendedAlignment = ExtendedAlignment(original_frag.get_sequence_names())

dirs = glob.glob('/projects/sate8/namphuon/ultra_large/1000000/upp_100_10_new/'
                 'temp/upp.1_HNlM/root/P_0/A_0_*/')

dirs.reverse()
for dir in dirs:
    print("Working on %s\n" % dir)
    aligned_files = glob.glob('%sFC_*/hmmalign.results.*' % dir)
    sequence_files = glob.glob('%sFC_*/hmmalign.frag.*' % dir)
    base_alignment_file = glob.glob('%s/*.fasta' % dir)
    base_alignment = MutableAlignment()
    done = base_alignment.read_filepath(base_alignment_file[0])
    subbackbone = original_backbone.get_soft_sub_alignment(
        base_alignment.get_sequence_names())
    frags = MutableAlignment()