def train(self, fvects, fids):
    """
    Train using SGD. Supports cross-validation.
    This function is called by outside programs.
    """
    # You cannot set both heldout and cross-validation.
    if self.folds and self.heldoutVects:
        sys.stderr.write(
            "Cannot perform heldout and cross-validation simultaneously\n")
        sys.exit(-1)
    if self.folds == 0:
        return self.train_client(fvects, fids)
    else:
        # Distribute the training instances round-robin over the folds.
        print "Performing %d-fold cross-validation" % self.folds
        trainVects = {}
        fold = 0
        for fv in fvects:
            trainVects.setdefault(fold, []).append(fv)
            fold += 1
            if fold == self.folds:
                fold = 0
        # Train on each fold. Accumulate statistics.
        stats = {}
        statKeys = ["macro", "micro"]
        statKeys.extend(self.labels)
        for sk in statKeys:
            stats[sk] = {}
            for metric in ["precision", "recall", "F", "accuracy"]:
                stats[sk][metric] = 0
        for i in trainVects:
            print "Fold number = %d" % (i + 1)
            traindata = []
            for j in trainVects:
                if j != i:
                    traindata.extend(trainVects[j])
            self.train_client(traindata, fids)
            e = self.get_performance(trainVects[i])
            results = e.getMetrics()
            e.show(results)
            # Add the current fold's metrics to the running totals.
            for sk in statKeys:
                for metric in ["precision", "recall", "F", "accuracy"]:
                    stats[sk][metric] += results[sk][metric]
        # Print the overall results, averaged over all folds.
        print "Average Results over %d-fold cross validation" % self.folds
        for sk in statKeys:
            for metric in ["precision", "recall", "F", "accuracy"]:
                stats[sk][metric] /= float(self.folds)
        E = EVALUATOR(self.n)
        E.show(stats)
def get_performance(self, fvects):
    """
    Compute precision, recall and F-scores for fvects with the current
    weight vector, using the EVALUATOR.
    """
    E = EVALUATOR(self.n)
    pred = PREDICTOR()
    pred.loadWeights(self.w, self.bias, self.n)
    for v in fvects:
        (lbl, prob) = pred.predictVect(v)
        E.add(v.label, lbl)
    return E
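# Illustration only (not part of the original module): a minimal sketch of
# the round-robin fold split that train() uses for cross-validation.
# Instance k is assigned to fold k % folds; for each fold i the model is
# retrained on all remaining folds and scored on fold i via get_performance().
# The helper name _toy_fold_split and the toy data are hypothetical, used
# only for this example.
def _toy_fold_split(data, folds):
    split = {}
    fold = 0
    for item in data:
        # Same assignment scheme as in train() above.
        split.setdefault(fold, []).append(item)
        fold += 1
        if fold == folds:
            fold = 0
    return split

# _toy_fold_split(range(7), 3) -> {0: [0, 3, 6], 1: [1, 4], 2: [2, 5]};
# the training set for fold 0 is then folds 1 and 2 combined, and fold 0
# is held out for evaluation.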
def test_logreg(model_fname, test_fname, output_fname=None,
                prob=True, acc=True):
    """
    Predict labels for the test instances using the trained model.
    If prob is set to True, then show class probabilities.
    If acc is set to True and the test instances have labels, then we will
    report evaluation metrics for the test instances.
    If an output_fname is specified we will write the predictions to that
    file instead of writing to the terminal.
    """
    pred = PREDICTOR()
    pred.loadModel(model_fname)
    testFile = SEQUENTIAL_FILE_READER(test_fname)
    count = 0
    E = EVALUATOR(pred.n)
    if output_fname:
        output = open(output_fname, "w")
    else:
        output = sys.stdout
    for mv in testFile:
        v = mv["vect"]
        # Use a local name distinct from the prob flag to avoid shadowing it.
        (lbl, p) = pred.predictVect(v)
        if prob:
            output.write("%d\t%s\n" % (lbl, str(p)))
        else:
            output.write("%d\n" % lbl)
        # In the binary case the negative class may be labelled -1 in the
        # test file; map it to 0 to match the predictor's label set.
        if pred.n == 2 and v.label == -1:
            trueLabel = 0
        else:
            trueLabel = v.label
        if v.label is not None:
            E.add(trueLabel, lbl)
        count += 1
    testFile.close()
    if output_fname:
        output.close()
    if acc:
        result = E.getMetrics()
        E.show(result)
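# Usage sketch for test_logreg (the file names below are placeholders for
# this example, not files shipped with the project): load a trained model,
# write one "label<TAB>probability" line per test instance to
# predictions.txt, and print evaluation metrics for any labelled instances.
def demo_test_logreg():
    test_logreg("model.dat", "test.dat",
                output_fname="predictions.txt", prob=True, acc=True)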