Beispiel #1
0
 def test_sequence_conversion(self):
     pseq = PX.Sequence(
         type="protein",
         # id_ref=None,
         # id_source=None,
         symbol="ADHX",
         accession=PX.Accession("P81431", source="UniProtKB"),
         name="Alcohol dehydrogenase class-3",
         # location=None,
         mol_seq=PX.MolSeq(
             "TDATGKPIKCMAAIAWEAKKPLSIEEVEVAPPKSGEVRIKILHSGVCHTD"),
         uri=None,
         annotations=[
             PX.Annotation(ref="EC:1.1.1.1"),
             PX.Annotation(ref="GO:0004022")
         ],
         domain_architecture=PX.DomainArchitecture(
             length=50,
             domains=[
                 PX.ProteinDomain(*args) for args in (
                     # value, start, end, confidence
                     ("FOO", 0, 5, 7.0e-26),
                     ("BAR", 8, 13, 7.2e-117),
                     ("A-OK", 21, 34, 2.4e-06),
                     ("WD40", 40, 50, 0.3))
             ],
         ))
     srec = pseq.to_seqrecord()
     # TODO: check seqrec-specific traits (see args)
     #   Seq(letters, alphabet), id, name, description, features
     pseq2 = PX.Sequence.from_seqrecord(srec)
Beispiel #2
0
 def test_sequence_conversion(self):
     pseq = PX.Sequence(
         type='protein',
         # id_ref=None,
         # id_source=None,
         symbol='ADHX',
         accession=PX.Accession('P81431', source='UniProtKB'),
         name='Alcohol dehydrogenase class-3',
         # location=None,
         mol_seq=PX.MolSeq(
             'TDATGKPIKCMAAIAWEAKKPLSIEEVEVAPPKSGEVRIKILHSGVCHTD'),
         uri=None,
         annotations=[
             PX.Annotation(ref='EC:1.1.1.1'),
             PX.Annotation(ref='GO:0004022')
         ],
         domain_architecture=PX.DomainArchitecture(
             length=50,
             domains=[
                 PX.ProteinDomain(*args) for args in (
                     # value,   start,   end,    confidence
                     ('FOO', 0, 5, 7.0e-26),
                     ('BAR', 8, 13, 7.2e-117),
                     ('A-OK', 21, 34, 2.4e-06),
                     ('WD40', 40, 50, 0.3))
             ],
         ))
     srec = pseq.to_seqrecord()
     # TODO: check seqrec-specific traits (see args)
     #   Seq(letters, alphabet), id, name, description, features
     pseq2 = PX.Sequence.from_seqrecord(srec)
Beispiel #3
0
 def accession(self, elem):
     """Create accession object."""
     return PX.Accession(elem.text.strip(), elem.get("source"))
Beispiel #4
0
 def accession(self, elem):
     return PX.Accession(elem.text.strip(), elem.get('source'))
Beispiel #5
0
calculator = DistanceCalculator('identity')
dm = calculator.get_distance(aln)
print(dm)

constructor = DistanceTreeConstructor(calculator, 'nj')
tree = constructor.build_tree(aln)
print(tree)

scorer = ParsimonyScorer()
searcher = NNITreeSearcher(scorer)
constructor = ParsimonyTreeConstructor(searcher, tree)
pars_tree = constructor.build_tree(aln)

egfr_phy = pars_tree.as_phyloxml()

print(pars_tree)
print(egfr_phy)
print(list(pars_tree.find_elements('Inner3')))

for clade in egfr_phy.get_terminals():
    key = clade.name
    accession = PhyloXML.Accession(key, 'NCBI')
    mol_seq = PhyloXML.MolSeq(lookup[key], is_aligned=True)
    sequence = PhyloXML.Sequence(type='aa',
                                 accession=accession,
                                 mol_seq=mol_seq)
    clade.sequences.append(sequence)

Phylo.write(egfr_phy, 'egfr-family-annotated.xml', 'phyloxml')