def getMeme(cid, sub): path = str(os.getcwd() + "/stats/" + str(cid) + "/") os.makedirs(path, exist_ok=True) f = Path(path + "bloom.txt") print(f) filter = Bloom() if f.is_file(): file = open(f, "r") filter.getTable(file) file.close() else: file = open(f, "w+") global reddit for s in reddit.subreddit(sub).hot(): if not filter.find(str(s)) and s.is_reddit_media_domain: filter.insert(str(s)) with open(f, "w") as file: filter.writeTable(file) break request.urlretrieve(s.url, "temp.jpg") return open("temp.jpg", "rb") #getMeme(123,"dankmemes")
def simulation(): input = np.random.randint(1, 1000000, size=10000) test = np.random.randint(1, 1000000, size=1000) b = Bloom(input, 0.01) b.train_bloom() b.test_bloom(test)
def create_collection(self, genome): section_size = int(len(genome) / (self.k)) for i in range(self.k): section = genome[i * (section_size):(i + 1) * (section_size)] bloom = Bloom(1000000000, 0.3) for k in range(0, len(section) - segment_size + 1): s = section[k:k + segment_size] bloom.bloom_add(s) self.collection.append(bloom) print("Collection created successfully") self.collection = tuple(self.collection)
def post(self): bloom = memcache.get("filter") if bloom is None: bloom = Bloom(2**21, 5) value = self.request.POST["value"] value_already_included = False if value in bloom: value_already_included = True bloom.add(value) memcache.set("filter", bloom) self.redirect("/?success=" + str(not value_already_included) + "&value=" + value)
def main(): """Main function.""" bloom = Bloom(12) # Add some values to the set bloom.add("Curie") bloom.add("Laplace") # Now test some values person = "Pasteur" if (bloom.check(person)): print("%s is probably in the set." % person) else: print("%s is definitely not in the set." % person) # Test some more values person = "Curie" if (bloom.check(person)): print("%s is probably in the set." % person) else: print("%s is definitely not in the set." % person)
# rings, steps = gen_circle(rings=None, pixels_per=pixels_per, offset=0, invert=False) # layout = layout_from_rings(rings, origin=(0, 0, 0), z_diff=8) # driver = DriverSimPixel(sum(pixels_per), layout=layout) # led = LEDCircle(driver, rings=rings, maxAngleDiff=0) def shutdown(): log.debug('Force close server') driver.server.close() time.sleep(2) sys.exit() try: if isinstance(led, LEDMatrix): anim = Bloom(led, dir=True) anim.run(amt=2, fps=60) elif isinstance(led, LEDCube): # anim = cuby(led, color_list=c_list) # anim.run(amt=1, fps=8) anim = Simplex(led, freq=16, octaves=1) anim.run(amt=1, fps=30) # anim = Spectrum(led, vis_list=['Spread'], steps_per_vis=None, # bins=12, max_freq=4000, log_scale=True, auto_gain=False, gain=3) anim.run(amt=1, fps=8) elif isinstance(led, LEDCircle): anim = Diag(led, turns=1, angle=6, direction=False) anim.run(amt=6, fps=20) except Exception as e: shutdown() raise
def setUp(self): """Set up the Bloom Filter table.""" self.size = 10 self.b = Bloom(self.size)
import datetime from bloom import Bloom f = open("data/emerson_essays.txt", "r") sample = f.read() lines = sample.splitlines() mb = Bloom() false_positive = 0 new_key = 0 start_time = datetime.datetime.now() for line in lines: if not mb.Add(line): false_positive += 1 else: new_key += 1 end_time = datetime.datetime.now() print(" false_positive : %s - new_key: %s on %s " % (false_positive,new_key, len(lines))) diff = (start_time-end_time).microseconds ratio = diff / len(lines) print("{} ms for ratio: {}".format(diff,ratio)) print(" {} LEN ".format(mb.Len()))