def getUnupdatedArticles():
    """
    Return the keys of the index table that are missing from the articles table.

    The articles table is read from ``Articles().json`` after calling
    ``set()``; the full table comes from ``Index()._create()``. Every key of
    the articles table is removed from the full table, and the remaining keys
    are returned. Both tables are presumably dicts keyed by document id --
    confirm against ``Articles`` and ``Index``.

    Returns:
        list: the keys left in the table returned by ``Index()._create()``
        once all keys of ``Articles().json`` have been removed from it.

    >>> getUnupdatedArticles() #doctest: +SKIP
    """
    articles = Articles()
    articles.set()
    article_table_updated = articles.json

    index = Index()
    article_table_all = index._create()

    for key in article_table_updated:
        # pop() with a default replaces the old has_key() guard:
        # dict.has_key() does not exist on Python 3, and this needs only
        # one lookup per key.
        article_table_all.pop(key, None)

    # Build a real list so the documented return type also holds on
    # Python 3, where keys() yields a view object.
    return list(article_table_all.keys())
def indexAllArticles():
    """Instantiate a fresh ``Index`` and invoke its ``create()`` method."""
    # The instance is not needed afterwards, so it is not bound to a name.
    Index().create()