예제 #1
0
	document = Document()
	article = os.path.join(corpus, fileName)
	content = open(article, 'r').read()
	document.add(Field("text", content, Field.Store.YES, Field.Index.ANALYZED))
	writer.addDocument(document)
# Report the value of writer.numDocs() and then close the writer.
# NOTE(review): `writer` is created outside this excerpt; presumably a Lucene
# IndexWriter, in which case numDocs() is the number of indexed documents and
# close() flushes pending changes to the index -- confirm against its
# construction.
print writer.numDocs()
writer.close()

# INDEX READER
# Open a reader on `directory` and wrap it in a searcher.
# NOTE(review): `directory` is defined outside this excerpt; presumably the
# same directory the writer above wrote to -- confirm.
reader = IndexReader.open(directory)
searcher = IndexSearcher(reader)

# QUERYING FOR A QUESTION
# The parser is given "text" as its field argument, the same field name the
# documents are added under.
# NOTE(review): `analyzer` is defined outside this excerpt; presumably the
# analyzer used at indexing time -- confirm, since a mismatch would tokenize
# queries differently from the indexed content.
queryParser = QueryParser(util.Version.LUCENE_CURRENT, "text", analyzer)

'''
answers = ['A', 'B', 'C', 'D']
submissionFile = open("luceneModel.csv", "w")
writer = csv.writer(submissionFile, delimiter=',')
writer.writerow(['id', 'correctAnswer'])


# 10 - 0.3844
# 9 - 0.386
# 5 - 0.3742

with open(trainingFilePath) as trainData:
	reader = csv.reader(trainData, delimiter="\t")
	header=0
	accuracy = 0
	for row in reader: