コード例 #1
0
ファイル: make_db.py プロジェクト: jameshicks/markovtwitter
#!/usr/bin/env python

# Makes a database for markovtwitter from a corpus file.
# The corpus file is expected to be one sentence per line.
#
# usage: make_db.py [-h] -c corpusfile -n depth -o outfile
import argparse
from markovchain import MarkovChain

parser = argparse.ArgumentParser()
parser.add_argument('-c', '--corpus',
                    help='Name of corpus file', required=True,
                    metavar='corpusfile')
parser.add_argument('-n', '--order', help='Chain depth', 
                    type=int, required=True, default=1, metavar='depth')
parser.add_argument('-o', '--out', help='Output DB filename',
                    required=True, metavar='outfile')
args = parser.parse_args()

print 'Generating markov chain database from %s' % args.corpus

mc = MarkovChain(corpusfile=args.corpus,order=args.order)
print mc

print 'Saving database to %s' % args.out
mc.save_db(args.out)