Exemplo n.º 1
0
def tfidf_gender(db):
    """Generate one TF-IDF word cloud per gender bucket.

    Walks profile IDs 1..NUM_OF_PROFILES, fetches each profile's text with
    ``db.getText_byID`` and adds it to one of three documents according to
    ``isFemale``: a truthy result goes to the female document, ``None`` to
    the non-binary document, and anything else to the male document. The
    three documents are passed to ``tf_idf`` and each result is rendered by
    ``generate_tfidf_cloud`` with the mask at the same position
    (``gal_mask``, ``guy_mask``, ``none_mask``).

    Args:
        db: Database handle providing ``getText_byID``; it is also passed
            through to ``isFemale``.
    """
    female_parts = []
    male_parts = []
    nb_parts = []
    for profile_id in range(1, NUM_OF_PROFILES + 1):
        # there is an errant frenchman
        # (profile 1467 is deliberately left out of every document)
        if profile_id == 1467:
            continue
        tiptup = db.getText_byID(profile_id)
        if tiptup is None:
            continue
        # Classify once per profile so the lookup is not repeated and the
        # branch taken cannot disagree with a second call.
        is_female = isFemale(profile_id, db)
        if is_female:
            bucket = female_parts
        elif is_female is None:
            bucket = nb_parts
        else:
            bucket = male_parts
        bucket.append('\r'.join(tiptup))
    # NOTE(review): consecutive profiles are concatenated with no separator,
    # exactly as before, so the last token of one profile abuts the first
    # token of the next -- confirm that this is what tf_idf expects.
    corpus = ["".join(female_parts), "".join(male_parts), "".join(nb_parts)]
    tuple_lists = tf_idf(corpus)
    masks = [gal_mask, guy_mask, none_mask]
    # presumably tf_idf returns one result per corpus document, in order
    for scored_terms, mask in zip(tuple_lists, masks):
        generate_tfidf_cloud(scored_terms, mask)
Exemplo n.º 2
0
def t_test_gender(db, column_name):
    """Compare a profile column between female and male profiles.

    For every profile ID in 1..NUM_OF_PROFILES the profile is classified
    with ``isFemale``. Profiles whose result is neither truthy nor equal to
    ``False`` are skipped without reading the column. For the others the
    value of ``column_name`` is fetched with ``db.getColumn_byID`` and, when
    truthy, added to the matching sample. The two samples are handed to
    ``t_test_math`` (female sample first) and the returned pair is printed.

    Args:
        db: Database handle providing ``getColumn_byID``; it is also passed
            through to ``isFemale``.
        column_name: Name of the column to read for each profile.
    """
    ladies = []
    dudes = []
    for profile_id in range(1, NUM_OF_PROFILES + 1):
        gender_flag = isFemale(profile_id, db)
        if gender_flag:
            sample = ladies
        elif gender_flag == False:  # noqa: E712 -- equality kept on purpose
            sample = dudes
        else:
            # Unknown gender: contributes to neither sample.
            continue
        value = db.getColumn_byID(profile_id, column_name)
        # NOTE(review): the truthiness filter also drops falsy values such
        # as 0 or "" -- confirm those are never meaningful data points.
        if value:
            sample.append(value)
    degrees, t = t_test_math(ladies, dudes)
    print(degrees, t)