Exemplo n.º 1
0
 def test_db_getter(self):
     """Check that get_doc_db exposes its arguments on the returned object.

     ``db.pymongo`` is replaced with a MagicMock for the duration of the
     test and restored afterwards, so the mock does not leak into other
     tests that import ``lembrar.db``.
     """
     from lembrar import db
     real_pymongo = db.pymongo
     db.pymongo = MagicMock()
     try:
         grid = MagicMock()
         new_db = db.get_doc_db('prefix', 'ds', 'db_name', grid, 'a,b')
         # A MagicMock returns the same child for every subscript key, so
         # indexing with None matches whichever key get_doc_db used.
         assert db.pymongo.Connection()[None] == new_db.db
         assert grid == new_db.grid
         assert 'a,b' == new_db.accepted_languages
         assert 'prefix' == new_db.prefix
     finally:
         # Always undo the module-level patch, even when an assert fails.
         db.pymongo = real_pymongo
Exemplo n.º 2
0
 def test_db_getter(self):
     """Check that get_doc_db exposes its arguments on the returned object.

     ``db.pymongo`` is replaced with a MagicMock for the duration of the
     test and restored afterwards, so the mock does not leak into other
     tests that import ``lembrar.db``.
     """
     from lembrar import db
     real_pymongo = db.pymongo
     db.pymongo = MagicMock()
     try:
         grid = MagicMock()
         new_db = db.get_doc_db('prefix', 'ds', 'db_name', grid, 'a,b')
         # A MagicMock returns the same child for every subscript key, so
         # indexing with None matches whichever key get_doc_db used.
         assert db.pymongo.Connection()[None] == new_db.db
         assert grid == new_db.grid
         assert 'a,b' == new_db.accepted_languages
         assert 'prefix' == new_db.prefix
     finally:
         # Always undo the module-level patch, even when an assert fails.
         db.pymongo = real_pymongo
Exemplo n.º 3
0
def parser_task(
    docids=None,
    initial=False,
    docdb=None,
    ):
    """Call ``handle_update`` for unparsed and/or explicitly listed documents.

    Args:
        docids: optional iterable of document ids to process; ``None`` is
            treated as an empty list.
        initial: when true, every id yielded by
            ``docdb.find_unparsed(version)`` is processed first.
        docdb: document db to operate on. When ``None`` one is obtained
            from ``get_doc_db(prefix='mimetype')``.
    """
    version = '0.1'
    # Honour a caller-supplied db instead of silently replacing it.
    if docdb is None:
        docdb = get_doc_db(prefix='mimetype')
    if initial:
        for docid in docdb.find_unparsed(version):
            # Same argument list as the explicit-docids loop below; the
            # original call here omitted docdb.
            handle_update(docdb, docid, version)
    for docid in docids or []:
        handle_update(docdb, docid, version)
Exemplo n.º 4
0
def parser_task(
    docids=None,
    initial=False,
    docdb=None,
):
    """Call ``handle_update`` for unparsed and/or explicitly listed documents.

    Args:
        docids: optional iterable of document ids to process; ``None`` is
            treated as an empty list.
        initial: when true, every id yielded by
            ``docdb.find_unparsed(version)`` is processed first.
        docdb: document db to operate on. When ``None`` one is obtained
            from ``get_doc_db(prefix='mimetype')``.
    """
    version = '0.1'
    # Honour a caller-supplied db instead of silently replacing it.
    if docdb is None:
        docdb = get_doc_db(prefix='mimetype')
    if initial:
        for docid in docdb.find_unparsed(version):
            # Same argument list as the explicit-docids loop below; the
            # original call here omitted docdb.
            handle_update(docdb, docid, version)
    for docid in docids or []:
        handle_update(docdb, docid, version)
Exemplo n.º 5
0
def parser_task(
    docids=None,
    initial=False,
    docdb=None,
    tikapath=None,
    ):
    """Call ``handle_update`` for unparsed and/or explicitly listed documents.

    Args:
        docids: optional iterable of document ids to process; ``None`` is
            treated as an empty list.
        initial: when true, every id yielded by
            ``docdb.find_unparsed(version)`` is processed first.
        docdb: document db to operate on. When ``None`` one is obtained
            from ``get_doc_db(prefix='tika')``.
        tikapath: value forwarded to ``handle_update``; when falsy the
            ``tikapath`` environment variable is used (may be ``None``).
    """
    # Parenthesised form prints the same text on Python 2 and also parses
    # on Python 3.
    print("DOOINGit")
    version = '0.1'
    tikapath = tikapath or os.environ.get('tikapath')
    # Honour a caller-supplied db instead of silently replacing it.
    if docdb is None:
        docdb = get_doc_db(prefix='tika')
    if initial:
        for docid in docdb.find_unparsed(version):
            # Same argument list as the explicit-docids loop below; the
            # original call here omitted docdb.
            handle_update(docdb, docid, tikapath, version)
    for docid in docids or []:
        handle_update(docdb, docid, tikapath, version)
Exemplo n.º 6
0
def parser_task(
    docids=None,
    initial=False,
    docdb=None,
    tikapath=None,
):
    """Call ``handle_update`` for unparsed and/or explicitly listed documents.

    Args:
        docids: optional iterable of document ids to process; ``None`` is
            treated as an empty list.
        initial: when true, every id yielded by
            ``docdb.find_unparsed(version)`` is processed first.
        docdb: document db to operate on. When ``None`` one is obtained
            from ``get_doc_db(prefix='tika')``.
        tikapath: value forwarded to ``handle_update``; when falsy the
            ``tikapath`` environment variable is used (may be ``None``).
    """
    # Parenthesised form prints the same text on Python 2 and also parses
    # on Python 3.
    print("DOOINGit")
    version = '0.1'
    tikapath = tikapath or os.environ.get('tikapath')
    # Honour a caller-supplied db instead of silently replacing it.
    if docdb is None:
        docdb = get_doc_db(prefix='tika')
    if initial:
        for docid in docdb.find_unparsed(version):
            # Same argument list as the explicit-docids loop below; the
            # original call here omitted docdb.
            handle_update(docdb, docid, tikapath, version)
    for docid in docids or []:
        handle_update(docdb, docid, tikapath, version)
Exemplo n.º 7
0
def parser_task(
    docids=None,
    initial=False,
    docdb=None,
    accepted_languages=None,
    ):
    """Call ``handle_update`` for unparsed and/or explicitly listed documents.

    Args:
        docids: optional iterable of document ids to process; ``None`` is
            treated as an empty list.
        initial: when true, every id yielded by
            ``docdb.find_unparsed(version)`` is processed first.
        docdb: document db to operate on. When ``None`` one is obtained
            from ``get_doc_db(prefix='ocr')``.
        accepted_languages: value forwarded to ``handle_update``. When
            falsy it is built by splitting on ``','`` the
            ``accepted_languages`` environment variable or, failing that,
            the ``accepted_languages`` registry setting.
    """
    version = '0.1'
    if not accepted_languages:
        configured = os.environ.get('accepted_languages')
        if not configured:
            # Only consult the registry when neither the argument nor the
            # environment supplied a value.
            settings = get_current_registry().settings
            configured = settings.get('accepted_languages')
        # NOTE: as in the original, this fails on ``None.split`` when no
        # source provides a value.
        accepted_languages = configured.split(',')
    # Honour a caller-supplied db instead of silently replacing it.
    if docdb is None:
        docdb = get_doc_db(prefix='ocr')
    if initial:
        for docid in docdb.find_unparsed(version):
            # Same argument list as the explicit-docids loop below; the
            # original call here omitted docdb.
            handle_update(docdb, docid, accepted_languages, version)
    for docid in docids or []:
        handle_update(docdb, docid, accepted_languages, version)