Python parse_data 예제들, gc_content.parse_data Python 예제들

예제 #1

0

파일 보기

파일: test_overlap.py 프로젝트: szeitlin/Rosalind

 def test_old_parser(self):
     # Only the first record is pulled from the parser; its name and
     # sequence are compared against the known first entry.
     expected_sequence = (
         'ATGGCAGTCCGAGTTCACGAACCGAATACGTTTAATAGGTAGTCGCCACCACTTAGACGGGTTCTCGCCTATAGGGAACATTAAAGGCGTGGAATTCG'
     )
     records = parse_data(self.big_data)
     first_name, first_sequence = next(records)
     self.assertEqual(first_name, 'Rosalind_3496')
     self.assertEqual(first_sequence, expected_sequence)
     # The input list is expected to be empty at this point
     # (presumably parse_data consumes its input -- confirm in parse_data).
     self.assertEqual(len(self.big_data), 0)

예제 #2

0

파일 보기

 def test_old_parser(self):
     # Check the first (name, sequence) pair that parse_data produces.
     record_iter = parse_data(self.big_data)
     label, dna = next(record_iter)
     expected_dna = 'ATGGCAGTCCGAGTTCACGAACCGAATACGTTTAATAGGTAGTCGCCACCACTTAGACGGGTTCTCGCCTATAGGGAACATTAAAGGCGTGGAATTCG'
     self.assertEqual(label, 'Rosalind_3496')
     self.assertEqual(dna, expected_dna)
     # After one record has been pulled the test expects big_data to be empty
     # (presumably the parser drains the list it is given -- TODO confirm).
     remaining = len(self.big_data)
     self.assertEqual(remaining, 0)

예제 #3

0

파일 보기

파일: test_oo_overlap.py 프로젝트: szeitlin/Rosalind

    def setUp(cls):
        # NOTE(review): the first parameter is named `cls`, but a method called
        # setUp normally receives the test instance -- confirm against the
        # enclosing class (not visible here). The name is kept unchanged.

        # Matches computed from the 3-chunk input file.
        with open('CENPA_3chunks.txt', 'r') as small_file:
            small_lines = small_file.readlines()
        small_records = list(parse_data(small_lines))
        cls.matches = compare_all_pairs_both_ways(small_records)

        # Matches computed from the 8-chunk input file.
        with open('CENPA_8chunks.txt', 'r') as large_file:
            large_lines = large_file.readlines()
        large_records = list(parse_data(large_lines))
        cls.more_matches = compare_all_pairs_both_ways(large_records)

        # Expected superstring for the 3-chunk case: first line only, stripped.
        with open('CA_superstring3_expected.txt', 'r') as expected_small:
            cls.ss = expected_small.readline().strip()

        # Expected superstring for the 8-chunk case: every line stripped and
        # concatenated into one string.
        with open('CA_superstring8_expected.txt', 'r') as expected_large:
            expected_lines = expected_large.readlines()
            cls.ss8 = ''.join(line.strip() for line in expected_lines)

예제 #4

0

파일 보기

    def setUp(cls):
        # NOTE(review): the first parameter is named `cls`, but a method called
        # setUp normally receives the test instance -- confirm against the
        # enclosing class (not visible here). The name is kept unchanged.

        # Fixture 1: pairwise matches for the 3-chunk data set.
        with open('CENPA_3chunks.txt', 'r') as chunks3:
            raw3 = chunks3.readlines()
        records3 = list(parse_data(raw3))
        cls.matches = compare_all_pairs_both_ways(records3)

        # Fixture 2: pairwise matches for the 8-chunk data set.
        with open('CENPA_8chunks.txt', 'r') as chunks8:
            raw8 = chunks8.readlines()
        records8 = list(parse_data(raw8))
        cls.more_matches = compare_all_pairs_both_ways(records8)

        # Expected result for the 3-chunk case is the stripped first line.
        with open('CA_superstring3_expected.txt', 'r') as answer3:
            cls.ss = answer3.readline().strip()

        # Expected result for the 8-chunk case spans several lines; strip each
        # one and glue them together.
        with open('CA_superstring8_expected.txt', 'r') as answer8:
            answer_lines = answer8.readlines()
            cls.ss8 = ''.join(piece.strip() for piece in answer_lines)

예제 #5

0

파일 보기

파일: overlap.py 프로젝트: szeitlin/Rosalind

def get_rescore_from_labeled(rescore, data):
    """
    Look up the labeled sequence for every name mentioned in rescore.

    This should not be needed.
    :param rescore: list of (name,name) tuples
    :param data: raw data, passed unchanged to parse_data
    :return: list of (name, sequence) tuples, one per distinct name found in
        rescore; the sequence is None for a name parse_data did not produce
    """
    # Index the parsed (name, sequence) records by name for direct lookup.
    labeled_dict = {record[0]: record[1] for record in parse_data(data)}

    losers = {}

    for pair in rescore:
        # Look names up in labeled_dict: the previous code referenced an
        # undefined name `labeled` here, which could not work.
        for name in (pair[0], pair[1]):
            losers[name] = labeled_dict.get(name)

    #convert back to tuples for rescoring
    return list(losers.items())

예제 #6

0

파일 보기

파일: test_gc_content.py 프로젝트: szeitlin/Rosalind

 def test_multiple_sequences(self):
     # parse_data is expected to hand back one (name, sequence) pair for
     # big_data, and that pair must be the Rosalind_0808 record.
     name, sequence = parse_data(self.big_data)
     self.assertEqual(name, 'Rosalind_0808')
     name, percent = gc_content(name, sequence, debug=True)
     # percent is a float: compare with a tolerance instead of exact equality.
     # places=6 matches the six decimals of the expected literal.
     self.assertAlmostEqual(percent, 60.919540, places=6)

예제 #7

0

파일 보기

파일: test_gc_content.py 프로젝트: szeitlin/Rosalind

 def test_raw_parsing_one(self):
     # Sanity-check the fixture itself: raw lines 1 and 2, stripped and
     # joined, are 87 characters long.
     raw_sequence = self.data[1].strip() + self.data[2].strip()
     self.assertEqual(len(raw_sequence), 87)
     # The parsed record must carry the expected name and the same length.
     label, parsed_sequence = parse_data(self.data)
     self.assertEqual(label, 'Rosalind_0808')
     parsed_length = len(parsed_sequence)
     self.assertEqual(parsed_length, 87)

예제 #8

0

파일 보기

파일: test_gc_content.py 프로젝트: szeitlin/Rosalind

 def test_gc_content(self):
     # Parse self.data into a (name, sequence) pair and compute its GC value.
     name, sequence = parse_data(self.data)
     name, percent = gc_content(name, sequence, debug=True)
     # percent is a float: compare with a tolerance instead of exact equality.
     # places=6 matches the six decimals of the expected literal.
     self.assertAlmostEqual(percent, 60.919540, places=6)

예제 #9

0

파일 보기

파일: test_gc_content.py 프로젝트: szeitlin/Rosalind

 def test_gc_content(self):
     # Parse self.data into a (name, sequence) pair and compute its GC value.
     name, sequence = parse_data(self.data)
     name, percent = gc_content(name, sequence, debug=True)
     # Exact equality on a float is brittle; assert agreement to the six
     # decimals that the expected literal actually specifies.
     self.assertAlmostEqual(percent, 60.919540, places=6)

예제 #10

0

파일 보기

파일: oo_overlap.py 프로젝트: szeitlin/Rosalind

        try:
            newedge = next(edges)
            listofedges.append(newedge)
        except StopIteration:
            break

    return listofedges



# Script entry point: read the 8-chunk input, find the pairwise matches,
# build a graph from them and print the resulting superstring.
if __name__=='__main__':

    with open('CENPA_8chunks.txt', 'r') as f:
        data = f.readlines()

    # parse_data output is materialized into a list before comparison
    labeled = list(parse_data(data))
    # number of matches this input is expected to produce
    expected_pairs=8

    matches = compare_all_pairs_both_ways(labeled)

    # A mismatch only prints a warning; the script carries on regardless.
    if len(matches) != expected_pairs:
        print("warning! expected {} but found {}"
              .format(expected_pairs, len(matches)))

    # Turn the matches into edges, build and sort the graph, then flatten it
    # (together with the matches) into the superstring that gets printed.
    listofedges = make_listofedges(matches)
    newgraph = Graph(listofedges)
    newgraph.sort_edges()
    superstring = newgraph.flatten_graph(matches)

    print(superstring)

예제 #11

0

파일 보기

파일: test_oo_overlap.py 프로젝트: szeitlin/Rosalind

    def setUp(cls):
        # NOTE(review): parameter is named `cls` although setUp normally
        # receives the test instance -- confirm against the enclosing class.
        # Parse the 3-chunk input once and keep the records for the tests.
        with open('CENPA_3chunks.txt', 'r') as chunk_file:
            raw_lines = chunk_file.readlines()

        records = parse_data(raw_lines)
        cls.labeled = list(records)

예제 #12

0

파일 보기

파일: test_oo_overlap.py 프로젝트: szeitlin/Rosalind

    def setUp(cls):
        # NOTE(review): parameter is named `cls` although setUp normally
        # receives the test instance -- confirm against the enclosing class.
        # Parse the 3-chunk input and store its pairwise matches.
        with open('CENPA_3chunks.txt', 'r') as chunk_file:
            raw_lines = chunk_file.readlines()

        records = list(parse_data(raw_lines))
        cls.matches = compare_all_pairs_both_ways(records)

예제 #13

0

파일 보기

                    if result[1] not in matches[result[0]]:
                        matches[result[0]].append((result[1], result[2]))

    if debug == True:
        for k, v in matches.items():
            print(k[0], [(x[0][0], x[1]) for x in v])

    return matches


# Script entry point: read the 3-chunk input, compute the pairwise matches
# (with debug output enabled) and hand them to the two output helpers.
if __name__ == '__main__':

    with open('CENPA_3chunks.txt', 'r') as f:
        data = f.readlines()

    # parse_data output is materialized into a list before comparison
    labeled = list(parse_data(data))
    # number of matches this input is expected to produce
    expected_pairs = 3

    matches = compare_all_pairs_both_ways(labeled, debug=True)

    #matches = itertools_combinations(labeled)

    # A mismatch only prints a warning; the script carries on regardless.
    if len(matches) != expected_pairs:
        print("warning! expected {} but found {}".format(
            expected_pairs, len(matches)))

    #to make a graph with Gephi:
    matches_to_graph(matches)

    #to make results file for Rosalind
    matches_to_rosalind(matches)

예제 #14

0

파일 보기

파일: test_oo_overlap.py 프로젝트: szeitlin/Rosalind

 def test_old_parser(self):
     # Exhaust the parser and check that it produced exactly 100 records.
     record_count = sum(1 for _ in parse_data(self.big_data))
     self.assertEqual(record_count, 100)

예제 #15

0

파일 보기

파일: test_gc_content.py 프로젝트: szeitlin/Rosalind

 def test_raw_parsing_one(self):
     # The fixture's raw lines 1 and 2 (stripped, concatenated) must be
     # 87 characters before any parsing happens.
     first_part = self.data[1].strip()
     second_part = self.data[2].strip()
     self.assertEqual(len(first_part + second_part), 87)
     # Parsing must yield the expected name and a sequence of equal length.
     record_name, record_sequence = parse_data(self.data)
     self.assertEqual(record_name, 'Rosalind_0808')
     self.assertEqual(len(record_sequence), 87)

예제 #16

0

파일 보기

파일: test_gc_content.py 프로젝트: szeitlin/Rosalind

 def test_multiple_sequences(self):
     # parse_data is expected to hand back one (name, sequence) pair for
     # big_data, and that pair must be the Rosalind_0808 record.
     name, sequence = parse_data(self.big_data)
     self.assertEqual(name, 'Rosalind_0808')
     name, percent = gc_content(name, sequence, debug=True)
     # Exact equality on a float is brittle; assert agreement to the six
     # decimals that the expected literal actually specifies.
     self.assertAlmostEqual(percent, 60.919540, places=6)

예제 #17

0

파일 보기

파일: test_o3_overlap.py 프로젝트: szeitlin/Rosalind

 def test_old_parser(self):
     # Every record parse_data yields is counted; 100 are expected.
     total_records = 0
     for _ in parse_data(self.big_data):
         total_records += 1
     self.assertEqual(total_records, 100)

예제 #18

0

파일 보기

    def setUp(cls):
        # NOTE(review): parameter is named `cls` although setUp normally
        # receives the test instance -- confirm against the enclosing class.
        # Load the 3-chunk file and keep its parsed records as a list.
        with open('CENPA_3chunks.txt', 'r') as source:
            source_lines = source.readlines()

        parsed_records = parse_data(source_lines)
        cls.labeled = list(parsed_records)

예제 #19

0

파일 보기

    def setUp(cls):
        # NOTE(review): parameter is named `cls` although setUp normally
        # receives the test instance -- confirm against the enclosing class.
        # Load the 3-chunk file, parse it, and store the pairwise matches.
        with open('CENPA_3chunks.txt', 'r') as source:
            source_lines = source.readlines()

        parsed_records = list(parse_data(source_lines))
        cls.matches = compare_all_pairs_both_ways(parsed_records)