예제 #1
0
import sys 
import BayesDB

## Training script: feeds every non-blank line of a text file to a BayesDB
## database under a single label, then writes the database out and reports.
##
## Command-line arguments:
##   argv[1]  label passed to addDoc(); the literal 'NONE' is turned into None
##   argv[2]  path of the training file, one document per line
##   argv[3]  path handed to BayesDB.createOrLoad()
classifier = sys.argv[1].strip()
if classifier == 'NONE':
    classifier = None

docs = 0
## The with-block guarantees the training file is closed, even when
## createOrLoad() or addDoc() raises part-way through.
with open(sys.argv[2], 'r') as training_data:
    db_file = sys.argv[3]
    db = BayesDB.createOrLoad(db_file)

    for line in training_data:
        line = line.strip()

        ## assume non-trivial sanitisation done upstream
        if not line:
            ## blank (or whitespace-only) lines are not documents
            continue

        db.addDoc(line, classifier)
        docs += 1

## Single-argument parenthesised print behaves the same as the print
## statement on Python 2 and is also valid Python 3.
print('Classified %d docs as %s' % (docs, classifier))
print('Writing DB file %s ...' % db_file)
db.dump()
print('New DB state:')
## NOTE(review): describe() is presumably responsible for its own output,
## since its return value is not used here - confirm against BayesDB.
db.describe()
print('Done')
예제 #2
0
import sys
from BayesFilter import BayesFilter
import BayesDB

## Prediction script: opens the database whose path is the first
## command-line argument and prints the result of one predict() call.
db = BayesDB.createOrLoad(sys.argv[1])

## Called bayes_filter rather than filter so the builtin filter() is not
## shadowed for the rest of the module.
bayes_filter = BayesFilter(db)

## argv[2] and argv[3] are forwarded unchanged; their meaning is defined by
## BayesFilter.predict(), which is not visible here - TODO confirm.
print(bayes_filter.predict(sys.argv[2], sys.argv[3]))

예제 #3
0
import sys
from BayesFilter import BayesFilter
import BayesDB

## Inspection script: opens (or creates) the database stored under the fixed
## path 'out' and prints whatever describe() returns.
DB_PATH = 'out'
db = BayesDB.createOrLoad(DB_PATH)

## NOTE(review): if describe() prints its own report and returns None, this
## print also emits a trailing 'None' line - confirm against BayesDB.
summary = db.describe()
print(summary)

예제 #4
0
import BayesDB

## Round-trip example: build a database, store one labelled document, write
## it out, then read it back and describe it.
SAMPLE_TEXT = "offer is secret"
SAMPLE_LABEL = "spam"

## The constructor (unlike createOrLoad) always creates a new BayesDB file.
db = BayesDB.BayesDB()
db.addDoc(SAMPLE_TEXT, SAMPLE_LABEL)
db.dump()

## Called without arguments, load() looks for a file named 'BayesDB'.
db = BayesDB.load()
db.describe()