Exemplos de Preprocessor._line_cleanup em Python

Linguagem de programação: Python

Espaço para nome / nome do pacote: preprocess

Classe / Tipo: Preprocessor

Método / Função: _line_cleanup

Exemplos em hotexamples.com: 1

Preprocessor._line_cleanup em Python - 1 exemplo encontrado. Este é o exemplo do mundo real mais bem avaliado de preprocess.Preprocessor._line_cleanup em Python, extraído de projetos de código aberto. Você pode avaliar os exemplos para nos ajudar a melhorar a qualidade deles.

Métodos Frequentes

Exibir Ocultar

Preprocessor(30)

add(4)

execute(3)

load(3)

import_video(3)

get_vocabulary(2)

get_states(2)

get_standard_form(2)

get_representer(2)

gen_data_vec(2)

setNextPitchCorner(2)

count_lines(1)

bgsub(1)

load_data(1)

_line_cleanup(1)

lda(1)

investigate_whitelist(1)

index_list_to_word_list(1)

apply(1)

basic_preprocess(1)

get_values_all(1)

get_training_data(1)

get_train_test_data_tag(1)

get_testing_data(1)

get_target_names(1)

build_vocab(1)

convert_text_to_index(1)

build_vocabulary_and_categories(1)

get_feature_names(1)

get_data(1)

get_all_text(1)

_clean_data(1)

getSentences(1)

generateTrainData(1)

convert_index_to_text(1)

gaussian(1)

format_to_nn(1)

format_to_lines(1)

fit_on_corpus(1)

get_all_tag_idx(1)

Métodos Frequentes

Preprocessor (30)

add (4)

execute (3)

load (3)

import_video (3)

get_vocabulary (2)

get_states (2)

get_standard_form (2)

get_representer (2)

gen_data_vec (2)

Métodos Frequentes

setNextPitchCorner (2)

count_lines (1)

bgsub (1)

load_data (1)

_line_cleanup (1)

lda (1)

investigate_whitelist (1)

index_list_to_word_list (1)

apply (1)

basic_preprocess (1)

get_values_all (1)

get_training_data (1)

get_train_test_data_tag (1)

get_testing_data (1)

get_target_names (1)

build_vocab (1)

convert_text_to_index (1)

build_vocabulary_and_categories (1)

get_feature_names (1)

get_data (1)

Métodos Frequentes

get_values_all (1)

get_training_data (1)

get_train_test_data_tag (1)

get_testing_data (1)

get_target_names (1)

build_vocab (1)

convert_text_to_index (1)

build_vocabulary_and_categories (1)

get_feature_names (1)

get_data (1)

get_all_text (1)

_clean_data (1)

getSentences (1)

generateTrainData (1)

convert_index_to_text (1)

gaussian (1)

format_to_nn (1)

format_to_lines (1)

fit_on_corpus (1)

get_all_tag_idx (1)

Métodos Frequentes

get_all_text (1)

_clean_data (1)

getSentences (1)

generateTrainData (1)

convert_index_to_text (1)

gaussian (1)

format_to_nn (1)

format_to_lines (1)

fit_on_corpus (1)

get_all_tag_idx (1)

Exemplo n.º 1

0

Exibir arquivo

Arquivo: knowledge_graph.py Projeto: Vidhan/allennlp

class KnowledgeGraph(object):
    """Build an entity graph (and its adjacency matrix) from annotated text.

    The graph is a nested dict: ``graph[class_type][identifier]`` maps to a
    metadata dict with the keys ``'name'``, ``'attributes'``, ``'relation'``
    and ``'start_index'``.  ``prepare`` additionally stores the accumulated
    context string under the module-level ``CONTEXT`` key.
    """

    # Entity mention of the form ``[name(class_type[digits])]``.
    _ENTITY_PATTERN = re.compile(r"\[[a-zA-Z0-9' ]+\([a-zA-Z]+\[\d+\]\)\]")
    # Bracketed span without a class/id suffix, e.g. ``[some words]``.
    _REF_PATTERN = re.compile(r"\[[a-zA-Z0-9' ]+\]")
    # Runs of letters, digits, apostrophes and spaces inside a match.
    _WORDS_PATTERN = re.compile(r"[a-zA-Z0-9' ]+")

    def __init__(self):
        # Preprocessor is defined elsewhere in the project; only its
        # ``_line_cleanup`` method is used by this class.
        self._preprocess = Preprocessor()

    def _update_line(self, line, graph, context_so_far):
        """Merge the entities and attributes annotated in ``line`` into ``graph``.

        Args:
            line: Raw annotated line.
            graph: Nested dict updated in place.
            context_so_far: Text accumulated so far; used to record the
                position of entity names (``str.find``) and attribute words
                (``str.rfind``).  Either position is -1 when the text is not
                found.

        Every entity on the line is related to every other entity on the same
        line, and every bracketed attribute on the line is attached to every
        entity on the line.
        """
        entities = self._ENTITY_PATTERN.findall(line)

        # Remove the entity mentions first so that the remaining bracketed
        # spans are plain attribute references.
        stripped = line
        for entity in entities:
            stripped = stripped.replace(entity, '')
        refs = self._REF_PATTERN.findall(stripped)

        # Parse each mention once instead of once per entity pair.
        parsed = [
            tuple(self._WORDS_PATTERN.findall(entity)) for entity in entities
        ]
        line_attributes = [
            attr for ref in refs for attr in self._WORDS_PATTERN.findall(ref)
        ]

        for index, (name, class_type, identifier) in enumerate(parsed):
            # All known objects of this class type.
            graph_entity = graph.setdefault(class_type, {})

            # Create the metadata record the first time this id is seen.
            metadata = graph_entity.get(identifier)
            if metadata is None:
                metadata = {
                    'name': name,
                    'attributes': [],
                    'relation': {},
                    'start_index': context_so_far.find(name)
                }
                graph_entity[identifier] = metadata

            # Relate this entity to every other mention on the line
            # (compared by position, so a repeated mention still counts).
            for position, (_, other_class, other_id) in enumerate(parsed):
                if position == index:
                    continue
                related = metadata['relation'].setdefault(other_class, [])
                if other_id not in related:
                    related.append(other_id)

            # 'attributes' holds (word, position) tuples, so membership must
            # be checked on the word itself; comparing the bare word against
            # the tuples never matches and would append duplicates forever.
            known = {attr for attr, _ in metadata['attributes']}
            for attr in line_attributes:
                if attr not in known:
                    metadata['attributes'].append(
                        (attr, context_so_far.rfind(attr)))
                    known.add(attr)

    def prepare(self, path):
        """Read the file at ``path`` and return the graph built from it.

        Lines containing ``"question_"`` are skipped.  Every other line is
        passed through ``Preprocessor._line_cleanup``, terminated with ``"."``
        and appended (space separated) to the running context before the raw
        line is merged into the graph.

        Returns:
            The graph dict, with the full context stored under ``CONTEXT``.
        """
        graph = {}
        context_so_far = ""
        with open(path) as f:
            for line in f:
                if "question_" in line:
                    continue
                separator = " " if context_so_far else ""
                cleaned = self._preprocess._line_cleanup(line)
                context_so_far += separator + cleaned + "."
                self._update_line(line, graph, context_so_far)
        graph[CONTEXT] = context_so_far
        return graph

    def prepare_edges(self, graph):
        """Build an adjacency matrix for the entities stored in ``graph``.

        Node names have the form ``"<class_type>-<identifier>"``; the
        ``CONTEXT`` entry of ``graph`` is ignored.

        Returns:
            A tuple ``(nodes, edges, sorted_nodes)`` where ``sorted_nodes`` is
            the sorted list of node names, ``nodes`` maps each name to its
            index in that list, and ``edges`` is a square list of lists with
            0 on the diagonal, 1 where the row entity lists the column entity
            in its ``'relation'`` and -1 everywhere else.
        """
        sorted_nodes = sorted(
            key + "-" + elem
            for key in graph
            if key != CONTEXT
            for elem in graph[key]
        )
        nodes = {name: position for position, name in enumerate(sorted_nodes)}
        size = len(nodes)
        edges = [[-1] * size for _ in range(size)]

        # Existing debug output on stdout, kept so callers see no change.
        print(json.dumps(nodes))

        for entry, entry_index in nodes.items():
            class_type, identifier = entry.split("-")
            neighbors = graph[class_type][identifier]['relation']
            edges[entry_index][entry_index] = 0
            # dict.items() works on Python 2 and 3; iteritems() is 2-only.
            for neighbor_class, neighbor_ids in neighbors.items():
                for neighbor_id in neighbor_ids:
                    neighbor = "%s-%s" % (neighbor_class, neighbor_id)
                    edges[entry_index][nodes[neighbor]] = 1
        return nodes, edges, sorted_nodes