from creator import Creator

c = Creator("dewiki")
dataset = c.create(10000, batch_size=100, fname="dewiki_10000.json.bz2")
Beispiel #2
0
import logging

from creator import Creator

logging.basicConfig(level=logging.INFO)
logging.getLogger('requests').setLevel(logging.WARNING)
logging.getLogger('urllib3').setLevel(logging.WARNING)
logger = logging.getLogger()
fh = logging.FileHandler("creator.log")
logger.addHandler(fh)
logger.info("Starting...")
c = Creator("dewiki")
dataset = c.create(start=20170101000000,
                   stop=20171231235959,
                   batch_size=50,
                   fname="test2017.json.bz2")