예제 #1
0
파일: Main.py 프로젝트: blodstone/CCS590v2
def featureInsertion():
    """Run the classifier data extraction for the current feature name.

    Takes no arguments; reads the module-level names ``colName``,
    ``classType``, ``training`` and ``common``.

    The name ``'feature' + colName + '_' + classType`` is built once and
    passed to ``DataRetrieval.extractData`` twice: first with ``False`` and
    then with ``True`` as the fourth argument.
    NOTE(review): the meaning of that flag is defined by ``DataRetrieval``
    and is not visible here -- confirm against that class.

    Disabled steps in this version:
      * bag-of-words generation (``termExtractor.bagOfWordBuilder``, which
        used to run only when ``training`` was set);
      * vector-space insertion (``termExtractor.vectorSpaceBuilder``).
    The progress messages for the vector-space step are still printed even
    though the step itself does not run.

    Returns:
        None.
    """
    # Single-argument print(...) emits the same text on Python 2 and also
    # parses on Python 3, where the bare print statement is a SyntaxError.
    print('Inserting bag of words to vector space')
    # The vector-space insertion step is intentionally disabled here.
    print('Done')

    print('Generating data for classifier')
    dataRetrieval = DataRetrieval()
    # Build the name once so both extraction passes are guaranteed to agree.
    featureName = 'feature' + colName + '_' + classType
    dataRetrieval.extractData(featureName, training, common, False, classType)
    dataRetrieval.extractData(featureName, training, common, True, classType)
    print('Done')
예제 #2
0
def featureInsertion():
    """Build the feature data and run the classifier data extraction.

    Takes no arguments; reads the module-level names ``training``,
    ``questions``, ``colName``, ``classType``, ``common`` and ``insert``.

    Steps, in order:
      1. When ``training`` is truthy, call
         ``termExtractor.bagOfWordBuilder`` with the name
         ``"words" + colName``.
      2. Call ``termExtractor.vectorSpaceBuilder`` with the name
         ``"feature" + colName + "_" + classType``.
      3. Call ``DataRetrieval.extractData`` on that same name with ``False``
         as the fourth argument.

    A second extraction pass with ``True`` as the fourth argument is
    disabled in this version.
    NOTE(review): the meaning of that flag is defined by ``DataRetrieval``
    and is not visible here -- confirm against that class.

    Returns:
        None.
    """
    # Single-argument print(...) emits the same text on Python 2 and also
    # parses on Python 3, where the bare print statement is a SyntaxError.
    if training:
        print("Generating bag of words")
        termExtractor.bagOfWordBuilder(questions, "words" + colName, insert)
        print("Done")

    print("Inserting bag of words to vector space")
    # Build the name once so the builder and the extraction step cannot drift.
    featureName = "feature" + colName + "_" + classType
    termExtractor.vectorSpaceBuilder(questions, colName, featureName, common, insert)
    print("Done")

    print("Generating data for classifier")
    dataRetrieval = DataRetrieval()
    dataRetrieval.extractData(featureName, training, common, False, classType)
    print("Done")