def t_gff3_iterator(self):
    """Check chunked parsing of a GFF3 file that contains nested features.

    Reads ``self._test_gff_file`` through ``GFFParser.parse_in_parts`` with
    ``target_lines=70`` and verifies how many records come back and how many
    features the first record holds.
    """
    chunked = GFFParser().parse_in_parts(self._test_gff_file, target_lines=70)
    records = list(chunked)
    # Original author's note: this should come back as one big set because
    # there is no good place to split the nested features.
    assert len(records) == 6
    assert len(records[0].features) == 59
def t_solid_iterator(self):
    """Check chunked parsing of a flat file without nested features.

    Reads ``self._test_gff_file`` through ``GFFParser.parse_in_parts`` with
    ``target_lines=5`` and verifies that 112 records are produced and that
    the largest record holds exactly one feature.
    """
    gff_parser = GFFParser()
    chunks = gff_parser.parse_in_parts(self._test_gff_file, target_lines=5)
    features_per_record = [len(record.features) for record in chunks]
    assert len(features_per_record) == 112
    assert max(features_per_record) == 1
def t_solid_iterator(self):
    """Check chunked parsing of a flat file without nested features.

    Reads ``self._test_gff_file`` through ``GFFParser.parse_in_parts`` with
    ``target_lines=5`` and verifies that 112 records are produced and that
    the largest record holds exactly one feature.
    """
    gff_parser = GFFParser()
    chunks = gff_parser.parse_in_parts(self._test_gff_file, target_lines=5)
    features_per_record = [len(record.features) for record in chunks]
    assert len(features_per_record) == 112
    assert max(features_per_record) == 1
def main(in_file):
    """Convert a GFF file to GFF3, writing ``<base>.gff3`` next to the input.

    The input is parsed in parts (``target_lines=25000``) by ``GFFParser`` and
    the resulting records are handed straight to ``GFF3Writer.write``.

    Args:
        in_file: Path of the GFF file to read. The output path is this path
            with its extension replaced by ``.gff3``.
    """
    base = os.path.splitext(in_file)[0]
    out_file = "%s.gff3" % (base)
    # NOTE: if in_file already ends in ".gff3", out_file is the same path and
    # opening it for writing truncates the input.
    # Context managers make sure both handles are closed even when parsing or
    # writing raises part-way through.
    with open(in_file) as in_handle:
        with open(out_file, "w") as out_handle:
            reader = GFFParser()
            writer = GFF3Writer()
            writer.write(
                reader.parse_in_parts(in_handle, target_lines=25000),
                out_handle,
            )
def t_gff2_iteration(self):
    """Check chunked parsing of a GFF2 file, breaking without parents.

    Reads ``self._wormbase_file`` through ``GFFParser.parse_in_parts`` with
    ``target_lines=15`` and verifies the record count plus the types and
    sub-feature count of the first record's leading features.
    """
    gff_parser = GFFParser()
    records = list(
        gff_parser.parse_in_parts(self._wormbase_file, target_lines=15)
    )
    assert len(records) == 4
    first_features = records[0].features
    assert first_features[0].type == 'region'
    assert first_features[1].type == 'SAGE_tag'
    assert len(first_features[2].sub_features) == 29