Exemplo n.º 1
0
    global strongly_subj_list
    OpinionExtractor.add_opinion_column(df, strongly_subj_list)


def create_vulgar_column(df):
    global wordlist
    dftext = df[['text']]
    result = dftext.applymap(
        lambda x: VulgarExtractor.containsVulgar(x, wordlist))
    df['isVulgar'] = result


if __name__ == "__main__":
    #    exec(open('FileReader.py').read())

    full_df_list = FileReader.get_dataframe()

    #load strongly subjective list
    strongly_subj_list = OpinionExtractor.initialize_subjectivity()

    #load vulgar words list
    wordlist = VulgarExtractor.vulgarWords(
        "./feature-extraction/vulgar-extractor/badwords.txt")

    #this loop will generate all features
    for df in full_df_list:
        create_opinion_column(df)
        create_vulgar_column(df)

    train_df = full_df_list[0]
    dev_df = full_df_list[1]