Beispiel #1
0
 def t_gff3_iterator(self):
     """Check chunked parsing of a GFF3 file that has nested features.

     Collects every record produced by ``parse_in_parts`` with
     ``target_lines=70`` and verifies the record count and the number of
     features on the first record.
     """
     gff_parser = GFFParser()
     chunks = gff_parser.parse_in_parts(self._test_gff_file,
                                        target_lines=70)
     records = list(chunks)
     # expected to come back as one big set since there is no good place
     # to split the nested features
     assert len(records) == 6
     first_record = records[0]
     assert len(first_record.features) == 59
 def t_solid_iterator(self):
     """Check chunked parsing of a flat file that has no nested features.

     Records the feature count of every record produced by
     ``parse_in_parts`` with ``target_lines=5`` and verifies how many
     records came back and that none holds more than one feature.
     """
     gff_parser = GFFParser()
     chunks = gff_parser.parse_in_parts(self._test_gff_file, target_lines=5)
     feature_counts = [len(chunk.features) for chunk in chunks]
     assert len(feature_counts) == 112
     assert max(feature_counts) == 1
 def t_solid_iterator(self):
     """Verify iterated parsing of a flat file lacking nested features.

     Each record yielded by ``parse_in_parts`` (``target_lines=5``) has its
     feature count collected; the test then checks the total number of
     records and that the largest feature count is one.
     """
     sizes = [
         len(record.features)
         for record in GFFParser().parse_in_parts(self._test_gff_file,
                                                  target_lines=5)
     ]
     assert len(sizes) == 112
     assert max(sizes) == 1
Beispiel #4
0
def main(in_file):
    """Read a GFF file in parts and write it back out as a ``.gff3`` file.

    The output path is the input path with its extension replaced by
    ``.gff3``. The iterable returned by ``GFFParser.parse_in_parts`` (called
    with ``target_lines=25000``) is handed directly to ``GFF3Writer.write``.

    Args:
        in_file: Path of the GFF file to read.
    """
    # NOTE: when in_file already ends in ".gff3" the output path equals the
    # input path, and opening it for writing truncates the input.
    base, _ = os.path.splitext(in_file)
    out_file = "%s.gff3" % (base)
    # Context managers close both handles even if parsing or writing raises.
    with open(in_file) as in_handle, open(out_file, "w") as out_handle:
        reader = GFFParser()
        writer = GFF3Writer()
        writer.write(reader.parse_in_parts(in_handle, target_lines=25000),
                     out_handle)
 def t_gff2_iteration(self):
     """Check iterated parsing of a GFF2 file, breaking without parents.

     Collects every record produced by ``parse_in_parts`` with
     ``target_lines=15`` and verifies the record count, the types of the
     first two features of the first record, and the number of
     sub-features on its third feature.
     """
     gff_parser = GFFParser()
     records = list(gff_parser.parse_in_parts(self._wormbase_file,
                                              target_lines=15))
     assert len(records) == 4
     lead_features = records[0].features
     assert lead_features[0].type == 'region'
     assert lead_features[1].type == 'SAGE_tag'
     assert len(lead_features[2].sub_features) == 29