예제 #1
0
def constructPredictionWithOutput(classifier,classifierIndex,xTest, testBatchIndex):
    """Predict with one classifier and write the result to its own CSV file.

    Calls ``classifier.predict_proba(xTest)`` and passes the result, together
    with ``testBatchIndex``, to ``dataReader.writePredToCsv``. The output file
    name is built from ``classifierIndex``.

    Args:
        classifier: Object exposing a ``predict_proba`` method.
        classifierIndex: Identifier shown in the progress message and embedded
            in the output file name (``out<classifierIndex>.csv``).
        xTest: Test inputs, forwarded unchanged to ``predict_proba``.
        testBatchIndex: Forwarded unchanged to ``dataReader.writePredToCsv``.

    Returns:
        None. The prediction is only handed to ``dataReader.writePredToCsv``.
    """
    # A parenthesised single-argument print produces the same output under the
    # Python 2 print statement and the Python 3 print function.
    print("Predicting with classifier {}".format(classifierIndex))

    yPred = classifier.predict_proba(xTest)

    print("Writing to csv...")
    # NOTE(review): the path is spelled with Windows separators. It is kept
    # verbatim because other code may rely on this exact name -- confirm before
    # switching to os.path.join.
    outputFileName = "data\\ensembleTraining\\out" + str(classifierIndex) + ".csv"
    dataReader.writePredToCsv(yPred, testBatchIndex, outputFileName=outputFileName)
예제 #2
0
def predictForSubmission():
    """Train a classifier, predict every test partition, and post-process.

    Steps, in order:
      1. Train via ``trainClassifierOnTrainingData``.
      2. For each partition index in ``range(utils.numberOfPartitions)``, load
         the partition with ``dataReader.getSerializedMiniTestData``, build
         the test inputs with ``constructTestData``, call ``predict_proba``
         and pass the result to ``dataReader.writePredToCsv``.
      3. Call ``dataReader.postProcessCsv`` and print the elapsed wall time.

    Returns:
        None.
    """
    allAlgorithmStartTime = time.time()

    # NOTE(review): -1 presumably means "use all training examples"; confirm
    # against trainClassifierOnTrainingData.
    numberOfTrainingExamples = -1
    classifier = trainClassifierOnTrainingData(numberOfTrainingExamples)

    # Parenthesised single-argument prints behave the same on Python 2 and
    # Python 3, and match the form already used for the final timing message.
    print("Beginning to load test data...")

    partitionNumber = utils.numberOfPartitions
    for index in range(partitionNumber):

        miniTestData = dataReader.getSerializedMiniTestData(index)

        # Only the inputs are needed for prediction; the second value returned
        # by constructTestData is not used here.
        xTest, _ = constructTestData(miniTestData)

        print("Predicting...")
        yPred = classifier.predict_proba(xTest)

        dataReader.writePredToCsv(yPred, index)

    print("Post processing...")
    dataReader.postProcessCsv()
    print("Total run time:{}".format(time.time() - allAlgorithmStartTime))