def featureInsertion():
    """Announce the vector-space step and extract the classifier data.

    In this variant the bag-of-words and vector-space builder calls are
    disabled; only the progress messages of the vector-space step are
    still printed. ``DataRetrieval.extractData`` is then called twice for
    the same feature name, first with ``False`` and then with ``True`` as
    its fourth argument.

    Uses the free names ``colName``, ``classType``, ``training`` and
    ``common``, which must be defined in an enclosing or module scope.
    """
    # ------------------------------------------------------------------
    # Generating bag of words (disabled)
    # ------------------------------------------------------------------
    # if training:
    #     print("Generating bag of words")
    #     termExtractor.bagOfWordBuilder(questions, 'words' + colName, insert)
    #     print("Done")

    # ------------------------------------------------------------------
    # Inserting bag of words to vector space (builder call disabled)
    # ------------------------------------------------------------------
    # Parenthesised single-argument print emits the same text on Python 2
    # and Python 3.
    print('Inserting bag of words to vector space')
    # termExtractor.vectorSpaceBuilder(
    #     questions, colName, 'feature' + colName + '_' + classType,
    #     common, insert)
    print('Done')

    # ------------------------------------------------------------------
    # Generating data for classifier
    # ------------------------------------------------------------------
    print('Generating data for classifier')
    feature_name = 'feature' + colName + '_' + classType
    dataRetrieval = DataRetrieval()
    # Two passes over the same feature name, differing only in the
    # boolean fourth argument (False first, then True).
    dataRetrieval.extractData(feature_name, training, common, False, classType)
    dataRetrieval.extractData(feature_name, training, common, True, classType)
    print('Done')
def featureInsertion():
    """Build the features and extract the classifier data.

    Steps, in order:

    1. When ``training`` is truthy, build the bag of words via
       ``termExtractor.bagOfWordBuilder``.
    2. Insert the bag of words into the vector space via
       ``termExtractor.vectorSpaceBuilder``.
    3. Call ``DataRetrieval.extractData`` once, with ``False`` as its
       fourth argument (the companion call with ``True`` is disabled).

    Uses the free names ``training``, ``questions``, ``colName``,
    ``classType``, ``common``, ``insert`` and ``termExtractor``, which
    must be defined in an enclosing or module scope.

    NOTE(review): the original indentation was lost; the ``if training``
    guard is assumed to cover only the bag-of-words step -- confirm.
    """
    feature_name = "feature" + colName + "_" + classType

    # ------------------------------------------------------------------
    # Generating bag of words
    # ------------------------------------------------------------------
    if training:
        # Parenthesised single-argument print emits the same text on
        # Python 2 and Python 3.
        print("Generating bag of words")
        termExtractor.bagOfWordBuilder(questions, "words" + colName, insert)
        print("Done")

    # ------------------------------------------------------------------
    # Inserting bag of words to vector space
    # ------------------------------------------------------------------
    print("Inserting bag of words to vector space")
    termExtractor.vectorSpaceBuilder(
        questions, colName, feature_name, common, insert
    )
    print("Done")

    # ------------------------------------------------------------------
    # Generating data for classifier
    # ------------------------------------------------------------------
    print("Generating data for classifier")
    dataRetrieval = DataRetrieval()
    dataRetrieval.extractData(feature_name, training, common, False, classType)
    # Disabled: second extraction pass with True as the fourth argument.
    # dataRetrieval.extractData(feature_name, training, common, True, classType)
    print("Done")