Пример #1
0
    def upsert_document(self, index_task):
        """Insert or refresh the stored record for ``index_task['url']``.

        Args:
            index_task: Mapping with a ``'url'`` entry and a ``'document'``
                entry; the latter must provide ``'meta_data'`` and
                ``'features'``.

        The record is looked up by ``url`` and its url, url hash, host,
        meta data and features are overwritten. ``upsert=True`` is passed
        to ``update_one``, so a missing record is expected to be created
        (presumably MongoEngine queryset semantics -- confirm against the
        ``IndexDocument`` definition).
        """
        # Read every input up front, in the order the fields are written.
        url = index_task['url']
        url_hash = hash_url(url)
        host = crawlmanager.extract_hostname(url)
        meta_data = index_task['document']['meta_data']
        features = index_task['document']['features']

        matching = IndexDocument.objects(url=url)
        matching.update_one(
            upsert=True,
            set__url=url,
            set__url_hash=url_hash,
            set__host=host,
            set__meta_data=meta_data,
            set__features=features
        )
Пример #2
0
    def delete_document(self, index_task):
        """Delete the stored record(s) whose ``url`` equals ``index_task['url']``.

        Args:
            index_task: Mapping that must contain a ``'url'`` entry.
        """
        target_url = index_task['url']
        matching = IndexDocument.objects(url=target_url)
        matching.delete()