Python create_mapping 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: utils.model_utils

메소드/함수: create_mapping

hotexamples.com에서의 예제들: 6

Python create_mapping - 6개의 예제를 찾았습니다. 오픈소스 프로젝트에서 추출한, Python utils.model_utils.create_mapping의 실제 사용 예제 중 평가가 가장 높은 것들입니다. 예제를 평가해 주시면 예제 품질 향상에 도움이 됩니다.

예제 #1

파일 보기

def augment_with_pretrained(dictionary, ext_emb_path, words):
    """
    Augment the dictionary with words that have a pretrained embedding.

    If `words` is None, every word found in the pretrained embedding file is
    added to the dictionary; otherwise only the entries of `words` (typically
    the words in the development and test sets) that can be matched to a
    pretrained embedding are added. A word matches when its exact form, its
    lowercased form, or its lowercased form with every digit replaced by '0'
    appears in the embedding file.

    Args:
        dictionary: mapping from word to count. It is modified in place;
            newly added words get a count of 0.
        ext_emb_path: path to a UTF-8 text file whose lines start with a
            word (the first whitespace-separated field of each line).
        words: iterable of candidate words, or None to add everything.

    Returns:
        A tuple `(dictionary, word_to_id, id_to_word)`, where the two
        mappings are whatever `create_mapping(dictionary)` returns.

    Raises:
        AssertionError: if `ext_emb_path` is not an existing file.
    """
    print('Loading pre-trained embeddings from {}...'.format(ext_emb_path))
    assert os.path.isfile(ext_emb_path), '{} not found'.format(ext_emb_path)

    # Collect the first field of every non-blank line. Blank lines are
    # skipped (they have no first field), and the file handle is closed
    # deterministically by the context manager.
    pretrained = set()
    with codecs.open(ext_emb_path, 'r', 'utf-8') as emb_file:
        for line in emb_file:
            fields = line.split()
            if fields:
                pretrained.add(fields[0])

    # We either add every word in the pretrained file,
    # or only words given in the `words` list to which
    # we can assign a pretrained embedding
    if words is None:
        for word in pretrained:
            if word not in dictionary:
                dictionary[word] = 0
    else:
        for word in words:
            if word in dictionary:
                continue
            lowered = word.lower()
            candidates = (word, lowered, re.sub(r'\d', '0', lowered))
            if any(form in pretrained for form in candidates):
                dictionary[word] = 0

    word_to_id, id_to_word = create_mapping(dictionary)
    return dictionary, word_to_id, id_to_word

예제 #2

파일 보기

def tag_mapping(sentences, idx=-1):
    """
    Build a tag dictionary and the tag <-> id mappings for `sentences`.

    The tag of each token is read from position `idx` of the token (the last
    field by default). The dictionary comes from `create_dico` and the two
    mappings from `create_mapping`; per the original description the result
    is ordered by frequency (that ordering is not visible in this function).

    Returns a tuple `(dico, tag_to_id, id_to_tag)`.
    """
    tag_sequences = []
    for sentence in sentences:
        tag_sequences.append([token[idx] for token in sentence])

    tag_counts = create_dico(tag_sequences)
    tag_to_id, id_to_tag = create_mapping(tag_counts)

    message = "Found {} unique named entity tags"
    print(message.format(len(tag_counts)))
    return tag_counts, tag_to_id, id_to_tag

예제 #3

파일 보기

def pos_mapping(sentences):
    """
    Build a POS-tag dictionary and the tag <-> id mappings for `sentences`.

    The POS tag is read from index 2 of every token. An extra '<UNK>' entry
    is inserted with a very large count before the mappings are created
    (presumably so it ranks first when ordered by frequency - confirm
    against `create_mapping`).

    Returns a tuple `(dico, tag_to_id, id_to_tag)`.
    """
    pos_sequences = []
    for sentence in sentences:
        pos_sequences.append([token[2] for token in sentence])

    pos_counts = create_dico(pos_sequences)
    pos_counts['<UNK>'] = 10000000
    tag_to_id, id_to_tag = create_mapping(pos_counts)

    message = "Found {} unique POS tags"
    print(message.format(len(pos_counts)))
    return pos_counts, tag_to_id, id_to_tag

예제 #4

파일 보기

def char_mapping(sentences):
    """
    Build a character dictionary and the char <-> id mappings.

    For every sentence, the strings at index 1 of its tokens are joined into
    a single string, and the list of those strings is handed to
    `create_dico`. An extra '<UNK>' entry is inserted with a very large
    count before the mappings are created (presumably so it ranks first
    when ordered by frequency - confirm against `create_mapping`).

    Returns a tuple `(dico, char_to_id, id_to_char)`.
    """
    joined_sentences = []
    for sentence in sentences:
        pieces = [token[1] for token in sentence]
        joined_sentences.append("".join(pieces))

    char_counts = create_dico(joined_sentences)
    char_counts['<UNK>'] = 10000000
    char_to_id, id_to_char = create_mapping(char_counts)

    message = "Found {} unique characters"
    print(message.format(len(char_counts)))
    return char_counts, char_to_id, id_to_char

예제 #5

파일 보기

def word_mapping(sentences, lower):
    """
    Build a word dictionary and the word <-> id mappings for `sentences`.

    The word form is read from index 1 of every token and lowercased when
    `lower` is truthy. '<UNK>' and '<PADDING>' entries are inserted with
    large fixed counts before the mappings are created (presumably to pin
    them to the top of a frequency ordering - confirm against
    `create_mapping`).

    Returns a tuple `(dico, word_to_id, id_to_word)`.
    """
    word_sequences = []
    for sentence in sentences:
        forms = []
        for token in sentence:
            form = token[1]
            forms.append(form.lower() if lower else form)
        word_sequences.append(forms)

    word_counts = create_dico(word_sequences)
    word_counts['<UNK>'] = 10000000
    word_counts['<PADDING>'] = 500000
    word_to_id, id_to_word = create_mapping(word_counts)

    # Total number of tokens across all sentences, for the summary line.
    total_tokens = sum(len(forms) for forms in word_sequences)
    print('Found {} unique words ({} in total)'.format(
        len(word_counts), total_tokens))
    return word_counts, word_to_id, id_to_word

예제 #6

파일 보기

def segment_mapping(sentences, only_i_o_tag=True):
    """
    Build a segmentation-tag dictionary and the tag <-> id mappings.

    The tag is read from index 4 of every token. When `only_i_o_tag` is
    truthy, every 'B-' occurrence in a tag is replaced by 'I-' before
    counting; otherwise tags are used unchanged.

    Returns a tuple `(dico, tag_to_id, id_to_tag)`.
    """
    segment_sequences = []
    for sentence in sentences:
        raw_tags = [token[4] for token in sentence]
        if only_i_o_tag:
            raw_tags = [tag.replace('B-', 'I-') for tag in raw_tags]
        segment_sequences.append(raw_tags)

    segment_counts = create_dico(segment_sequences)
    tag_to_id, id_to_tag = create_mapping(segment_counts)

    message = "Found {} unique segmentation tags"
    print(message.format(len(segment_counts)))
    return segment_counts, tag_to_id, id_to_tag