## Train a BayesDB file from a text file holding one document per line.
##
## Command line: <classifier> <training file> <db file>
##   classifier    - label passed to addDoc() for every document; the literal
##                   string 'NONE' is turned into None
##   training file - text file read line by line; lines that are empty after
##                   stripping whitespace are skipped
##   db file       - path handed to BayesDB.createOrLoad()
import sys

import BayesDB

classifier = sys.argv[1].strip()
if classifier == 'NONE':
    classifier = None
training_path = sys.argv[2]
db_file = sys.argv[3]

docs = 0
## The 'with' block guarantees the training file is closed, even when
## createOrLoad() or addDoc() raises part-way through.
with open(training_path, 'r') as training_data:
    db = BayesDB.createOrLoad(db_file)
    for line in training_data:
        line = line.strip()
        ## assume non-trivial sanitisation done upstream
        if not line:
            continue
        db.addDoc(line, classifier)
        docs += 1

## A parenthesised single-argument print behaves the same on Python 2 and 3.
print('Classified %d docs as %s' % (docs, classifier))
print('Writing DB file %s ...' % db_file)
db.dump()
print('New DB state:')
db.describe()
print('Done')
## Print the prediction of a BayesFilter built on a stored BayesDB.
##
## Command line: <db file> <arg> <arg>
##   The first argument is the path given to BayesDB.createOrLoad(); the next
##   two are forwarded unchanged to BayesFilter.predict(), whose result is
##   printed.
import sys

from BayesFilter import BayesFilter
import BayesDB

db = BayesDB.createOrLoad(sys.argv[1])
## Named 'bayes_filter' so the builtin filter() is not shadowed.
bayes_filter = BayesFilter(db)
## A parenthesised single-argument print behaves the same on Python 2 and 3.
print(bayes_filter.predict(sys.argv[2], sys.argv[3]))
## Show the state of the DB stored under the fixed name 'out'.
import sys

from BayesFilter import BayesFilter
import BayesDB

db = BayesDB.createOrLoad('out')
## describe() is called as a bare statement, the same way the training and
## example scripts call it, so its return value is not printed as well.
## NOTE(review): presumably describe() writes its report itself - confirm
## against BayesDB before relying on this.
db.describe()
## Minimal round trip: build a DB, save it, read it back and describe it.
import BayesDB

## The BayesDB constructor always creates a new BayesDB file.
new_db = BayesDB.BayesDB()
new_db.addDoc("offer is secret", "spam")
new_db.dump()

## Called without arguments, load() looks for a file called 'BayesDB'.
db = BayesDB.load()
db.describe()