Exemple #1
0
from Data import Data
from Lsi import fire_lsi
from Lda import fire_lda
from calcAccuracy import test_accuracy
import GensimFunctions as gen

# Load Data and parse it
# Instantiate the project's Data container, then run its two setup steps in
# order: load_statistics() followed by parse_questions().
# NOTE(review): presumably parse_questions() is what populates
# data.rawSamples, which is read later in this script -- confirm in Data.py.
data = Data()
data.load_statistics()
data.parse_questions()

# TFIDF --> Generate output file

# Testing TFIDF

# TFIDF with Synonyms --> Generate output file

# Testing TFIDF with Synonyms

# Context Topics --> Generate output file

# Testing Context Topics

# Build the gensim dictionary and corpus from the raw samples held by `data`.
dictionary, corpus = gen.create_dictionary(data.rawSamples)

# --------------------------LSI-------------------------------
# Build the LSI model together with its index.
numOfTopics = 100  # topic count handed to create_lsimodelindex
lsiModel, lsiIndex = gen.create_lsimodelindex(dictionary, corpus, numOfTopics)