Ejemplo n.º 1
0
			tokens = sent.split()
			for i in range(len(tokens)):
				index -= len(tokens[i]) + 1
				if index < 0:
					for c in range(i, i + len(arg.split())):
						arg_list.append(c)
					break
		info_list.append(arg_list)
	return info_list

# Driver: open the raw sentence file, load the Dadegan training treebank and,
# for every tree, gather the token-position lists produced by positions() for
# each item yielded by dependencyExtractor.extract(). Trees for which any of
# the three slots ends up empty are skipped; the rest are passed to tag_sent().
input = codecs.open('200DadeganSents.txt', 'r', encoding='utf8')
dadegan = DadeganReader('Resources/Dadegan/train.conll')
dadegan_trees = dadegan.trees()
informations = []
# One space-joined string per sentence, keeping only the first element of
# each (word, tag) pair.
sentences = [' '.join(w for w, t in sentence) for sentence in dadegan.sents()]

for tree, chunks, sent in zip(dadegan_trees, dadegan.chunked_trees(), sentences):
	# Three parallel buckets, one per slot of the lists returned by positions().
	info_list = ([], [], [])
	for information in dependencyExtractor.extract(tree):
		temp_list = positions(information, sent)
		for i, bucket in enumerate(info_list):
			found = temp_list[i]
			# Ignore empty position lists and ones already recorded for this slot.
			if len(found) == 0 or found in bucket:
				continue
			bucket.append(found)
	# Only tag the sentence when every slot received at least one entry.
	if [] not in info_list:
		tag_sent(chunks, info_list)

"""
for line in input.readlines():