def generate_entries(authors):
    """Create and save randomly generated entries across the date window.

    Timestamps start from START_DATE and advance by gaps drawn from
    ``random.expovariate(ENTRIES_PER_MINUTE)``, interpreted as minutes.
    Generation stops as soon as the next timestamp would reach
    ``START_DATE + NUM_DAYS`` days, so no saved entry is dated at or
    after the end of the window.

    Args:
        authors: Population each entry's author is drawn from via
            ``random.sample``; it must be non-empty if any entry is
            generated.

    Returns:
        None. Each entry is persisted through ``entry.save()``.
    """
    end_date = START_DATE + datetime.timedelta(days=NUM_DAYS)
    date = START_DATE
    itercount = 0
    while True:
        minute_delta = random.expovariate(ENTRIES_PER_MINUTE)
        date += datetime.timedelta(minutes=minute_delta)
        # Check the bound *after* advancing: testing only before the
        # increment lets the final entry land past the end of the window.
        if date >= end_date:
            break

        entry = Entry()
        entry.author = random.sample(authors, 1)[0]
        # The Gaussian draws are handed to generate_string unchanged;
        # presumably they are target lengths -- confirm against that helper.
        entry.title = generate_string(
            random.gauss(TITLE_LENGTH_MU, TITLE_LENGTH_SIGMA))
        entry.contents = generate_string(
            random.gauss(ENTRY_LENGTH_MU, ENTRY_LENGTH_SIGMA))
        entry.date = date
        entry.save()

        # Progress report every 1000 entries, starting with the first one.
        if itercount % 1000 == 0:
            print("Making entry for %s" % (str(date)))
        itercount += 1
def generate_pages():
    """Refill existing pages with random contents and return their weights.

    Each page with id 1..NUM_PAGES is fetched, has its ``contents``
    replaced with a freshly generated string, and is saved again. Pages
    are looked up rather than created, so they must already exist.

    The k-th page (counting from 0) gets a weight proportional to
    ``1 / (START_DIVISOR + k)``; the weights are normalised so that they
    sum to 1.

    Returns:
        A list of ``(page_id, probability)`` tuples in ascending id order.
    """
    weights = [1.0 / divisor
               for divisor in range(START_DIVISOR, NUM_PAGES + START_DIVISOR)]
    total = sum(weights)
    probs = [weight / total for weight in weights]

    pageids = []
    # Page ids are 1-based, hence the enumerate start value.
    for page_id, prob in enumerate(probs, 1):
        # The Gaussian draw is handed to generate_string unchanged;
        # presumably it is a target length -- confirm against that helper.
        contents = generate_string(
            random.gauss(PAGE_LENGTH_MU, PAGE_LENGTH_SIGMA))
        page = Page.objects.get(id=page_id)
        page.contents = contents
        page.save()
        pageids.append((page_id, prob))
    return pageids