forked from jayaram1125/NaiveBayesClassification
/
Run.py
35 lines (23 loc) · 859 Bytes
/
Run.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
#package lin567_p1
import argparse
import NaiveBayes
import io
def main():
parser = argparse.ArgumentParser(description="Parse Values.")
parser.add_argument('-arg1', 'trainPath', type= str, required=True)
parser.add_argument('-arg2', 'testPath', type= str, required=True)
parser.add_argument('-arg3', 'n', type= int, required=True)
parser.add_argument('-arg4', 'lamda', type= float, required=True)
args = parser.parse_args()
trainPath = args.trainPath
testPath = args.testPath
n = args.n
lamda = args.lamda
nbModel = NaiveBayes()
inout = io.IO()
trainSet = inout.readDocuments(trainPath,n)
testSet = inout.readDocuments(testPath,n)
nbModel.train(trainSet)
for doc in testSet:
bestLanguage = nbModel.mostLikelyLanguage(doc.text,lamda)
print( id + "|" + bestLanguage )