예제 #1
0
def compare_mishna_to_yachin(tractate_list):
    """Compare tags in each tractate's Mishna file against its Yachin file.

    For every entry in ``tractate_list`` the Hebrew book title is obtained
    via ``Ref(tractate).he_book()``. Two file names are derived from it by
    replacing u'משנה' with u'משניות' and with u'יכין' respectively, and
    ``<name>.txt`` is opened for each (UTF-8, relative to the current
    working directory). The files are wrapped in ``TagTester`` objects
    (tags ``@44`` and ``@11``), given a shared ``segment_tag`` pattern and
    handed to ``compare_tags_to_comments`` together with a handle that
    appends to ``tag_match_up.txt``.

    If either input file cannot be opened, a ``missing file <title>`` line
    is appended to ``tag_match_up.txt`` and the tractate is skipped.

    :param tractate_list: iterable of values accepted by ``Ref``
        (presumably tractate names -- confirm against callers).
    :return: None. Results are written to ``tag_match_up.txt``.
    """
    # Same pattern is assigned to both testers for every tractate, so build
    # it once.
    seg_tag = u'@00(?:פרק |פ)([א-ת,"]{1,3})'

    for tractate in tractate_list:
        name = Ref(tractate).he_book()
        m_name = name.replace(u'משנה', u'משניות')
        y_name = name.replace(u'משנה', u'יכין')

        # The report file is reopened in append mode per tractate, as before,
        # but the `with` guarantees it is closed on the `continue` paths and
        # on any exception (the original leaked it when a file was missing).
        with codecs.open('tag_match_up.txt', 'a', 'utf-8') as output:
            try:
                m_file = codecs.open(u'{}.txt'.format(m_name), 'r', 'utf-8')
            except IOError:
                output.write(u'missing file {}\n'.format(name))
                continue

            try:
                y_file = codecs.open(u'{}.txt'.format(y_name), 'r', 'utf-8')
            except IOError:
                # The first file opened successfully; release it before
                # skipping this tractate.
                m_file.close()
                output.write(u'missing file {}\n'.format(name))
                continue

            # Both inputs are closed even if the comparison raises.
            with m_file, y_file:
                m_tag = TagTester(u'@44', m_file, name=m_name)
                y_tag = TagTester(u'@11', y_file, name=y_name)

                m_tag.segment_tag = seg_tag
                y_tag.segment_tag = seg_tag

                compare_tags_to_comments(m_tag, y_tag, output)
예제 #2
0
def compare_mishna_to_yachin(tractate_list):
    """Compare tags in each tractate's Mishna file against its Yachin file.

    For every entry in ``tractate_list`` the Hebrew book title is obtained
    via ``Ref(tractate).he_book()``. Two file names are derived from it by
    replacing u'משנה' with u'משניות' and with u'יכין' respectively, and
    ``<name>.txt`` is opened for each (UTF-8, relative to the current
    working directory). The files are wrapped in ``TagTester`` objects
    (tags ``@44`` and ``@11``), given a shared ``segment_tag`` pattern and
    handed to ``compare_tags_to_comments`` together with a handle that
    appends to ``tag_match_up.txt``.

    If either input file cannot be opened, a ``missing file <title>`` line
    is appended to ``tag_match_up.txt`` and the tractate is skipped.

    :param tractate_list: iterable of values accepted by ``Ref``
        (presumably tractate names -- confirm against callers).
    :return: None. Results are written to ``tag_match_up.txt``.
    """
    # Same pattern is assigned to both testers for every tractate, so build
    # it once.
    seg_tag = u'@00(?:פרק |פ)([א-ת,"]{1,3})'

    for tractate in tractate_list:
        name = Ref(tractate).he_book()
        m_name = name.replace(u'משנה', u'משניות')
        y_name = name.replace(u'משנה', u'יכין')

        # The report file is reopened in append mode per tractate, as before,
        # but the `with` guarantees it is closed on the `continue` paths and
        # on any exception (the original leaked it when a file was missing).
        with codecs.open('tag_match_up.txt', 'a', 'utf-8') as output:
            try:
                m_file = codecs.open(u'{}.txt'.format(m_name), 'r', 'utf-8')
            except IOError:
                output.write(u'missing file {}\n'.format(name))
                continue

            try:
                y_file = codecs.open(u'{}.txt'.format(y_name), 'r', 'utf-8')
            except IOError:
                # The first file opened successfully; release it before
                # skipping this tractate.
                m_file.close()
                output.write(u'missing file {}\n'.format(name))
                continue

            # Both inputs are closed even if the comparison raises.
            with m_file, y_file:
                m_tag = TagTester(u'@44', m_file, name=m_name)
                y_tag = TagTester(u'@11', y_file, name=y_name)

                m_tag.segment_tag = seg_tag
                y_tag.segment_tag = seg_tag

                compare_tags_to_comments(m_tag, y_tag, output)