def _align_source_target(self, un_match, un_pos, position, tgt_text, tgt_pos, align_features):
    # NOTE: this definition is shadowed by the redefinition of the same method below;
    # Python keeps only the last one.
    tgt_dic = {}  # similarity score for each (target word, position) pair
    tgt_word_pos = TMUtilsMatching.segment_2_universal(tgt_text.lower(), tgt_pos, self.tgt_lang)  # list of [word, pos] pairs
    for i in range(0, len(tgt_word_pos)):
        value_similarity = 0
        for f in align_features:
            if f == 'word_ter':  # TER between words
                value_similarity = value_similarity + TMUtilsMatching.ter_distance(un_match, tgt_word_pos[i][0])
            if f == 'posTag':  # Boolean PosTag match
                value_similarity = value_similarity + TMUtilsMatching.pos_bool(un_pos, tgt_word_pos[i][1])
            if f == 'position':  # Word position
                value_similarity = value_similarity + TMUtilsMatching.position_distance(position, i)
            # if f == 'frequency':  # frequency of pairs of words
            #     value_similarity = value_similarity + self.target_importance(un_word, tgt_word_pos[i][0], segment, best_segments)
        # Dictionary keyed by the target word and its position in the target sentence
        tgt_dic[(tgt_word_pos[i][0], i)] = value_similarity
    tgt_align = sorted(tgt_dic.items(), key=lambda item: item[1], reverse=True)[0]  # Select the highest score
    return tgt_align[0][0], tgt_align[0][1]  # Return the target word with the highest score and its position
def _align_source_target(self, un_match, un_pos, position, tgt_word_pos, align_features):  # tgt_text, tgt_pos
    related_words = []
    tgt_dic = {}  # similarity score for each (target word, position) pair
    # Keep only target words whose PoS tag matches the unmatched word or is an open class (VERB, NOUN, ADJ)
    equal_posTag = [[position_tgt, word, pos] for position_tgt, [word, pos] in list(enumerate(tgt_word_pos))
                    if pos == un_pos.strip(' ') or pos == 'VERB' or pos == 'NOUN' or pos == 'ADJ']
    # print('*************')
    # print(equal_posTag)
    if not equal_posTag:
        return None, None
    else:
        if 'glossary' in align_features:
            related_words = self.search_exact_value(un_match, 10)
        for i in range(0, len(equal_posTag)):
            value_similarity = 0
            for f in align_features:
                if f == 'word_ter':  # TER between words
                    value_similarity = value_similarity + (0.25 * TMUtilsMatching.un_match_distance(un_match, equal_posTag[i][1]))
                if f == 'posTag':  # Boolean PosTag match
                    value_similarity = value_similarity + (0.25 * TMUtilsMatching.pos_bool(un_pos, equal_posTag[i][2]))
                if f == 'position':  # Word position
                    value_similarity = value_similarity + (0.25 * TMUtilsMatching.position_distance(position, equal_posTag[i][0]))
                if f == 'glossary':  # search the word on elasticTM
                    is_related = 1 if equal_posTag[i][1] in related_words else 0
                    value_similarity = value_similarity + (0.25 * is_related)
                    # target_importance(un_word, tgt_word_pos[i][0], segment, best_segments)
            # Dictionary keyed by the target word and its position in the target sentence
            tgt_dic[(equal_posTag[i][1], equal_posTag[i][0])] = value_similarity
        tgt_align = sorted(tgt_dic.items(), key=lambda item: item[1], reverse=True)[0]  # Select the highest score
        # print(sorted(tgt_dic.items(), key=lambda item: item[1], reverse=True))  # debug output
        if tgt_align[1] > G_CONFIG.get_src_tgt_threshold():
            return tgt_align[0][0], tgt_align[0][1]
        else:
            return None, None
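
# --- Illustrative sketch (hypothetical, not part of the class) ---------------
# The method above scores every PoS-compatible target word with an equally
# weighted (0.25 each) sum of feature similarities and keeps the best-scoring
# candidate only if it clears a threshold. The helpers below are simplified
# stand-ins for TMUtilsMatching and the glossary lookup; they are assumptions
# made only to show the scoring scheme end to end.
def _demo_align_source_target(un_match, un_pos, position, tgt_word_pos, threshold=0.5):
    def word_similarity(a, b):      # stand-in for TMUtilsMatching.un_match_distance
        return 1.0 if a == b else 0.0

    def pos_match(a, b):            # stand-in for TMUtilsMatching.pos_bool
        return 1.0 if a == b else 0.0

    def position_closeness(i, j):   # stand-in for TMUtilsMatching.position_distance
        return 1.0 / (1.0 + abs(i - j))

    scores = {}
    for i, (word, pos) in enumerate(tgt_word_pos):
        if pos not in (un_pos, 'VERB', 'NOUN', 'ADJ'):  # same PoS filter as above
            continue
        scores[(word, i)] = (0.25 * word_similarity(un_match, word)
                             + 0.25 * pos_match(un_pos, pos)
                             + 0.25 * position_closeness(position, i))
    if not scores:
        return None, None
    (word, i), best = max(scores.items(), key=lambda item: item[1])
    return (word, i) if best > threshold else (None, None)

# Example: align the unmatched source word 'house' (NOUN, source position 2)
# against a PoS-tagged target segment; expected result: ('house', 2).
# print(_demo_align_source_target('house', 'NOUN', 2,
#                                 [('the', 'DET'), ('big', 'ADJ'), ('house', 'NOUN')]))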