"Hızlı kahverengi tilki tembel köpeğin üstünden atlar ve bunun cehenneme sikikleri", "Η γρήγορη καφέ αλεπού πηδάει πάνω από το μεσημέρι και τρέχει έξω από αυτό γιαγιάδες γιαγιαδες", #"Idź prosto i skręć w lewo/prawo Poczekaj chwilę Chodź ze mną Szukam John’a już" ] articles = [] for i, text in enumerate(texts): articles.append({"content" : text, "title" : text[:15], "id":i+1}) db = redis.Redis(host='192.168.1.3', port=6666, db=3) cp = CorpusHandler(debug=False, db=db) cp.drop() s = time.time() for a in articles: cp.index(a) print "indexing: " , time.time() - s q = QueryHandler(debug=False, db=db, use_lua=True) q2 = QueryHandler(debug=False, db=db, use_lua=False) s = time.time()
cnt = 0 l = len(text) while cnt < l: r = random.randint(400, 1200) try: data.append({"content":text[cnt:cnt+r], "title":text[cnt:cnt+random.randint(40, 130)], "id":cnt}) cnt += r except: break cp = CorpusHandler(debug=False, db=db) cp.drop() s = time.time() for a in data: try: cp.index(a) except: pass print "indexing: " , time.time() - s q = QueryHandler(debug=False, db=db, use_lua=True) q2 = QueryHandler(debug=False, db=db, use_lua=False)