def build_features(data_file, feat_name, binning):
    """Load the reviews stored in ``data_file`` and extract features.

    ``data_file`` is resolved relative to the current directory ("./").
    The object returned by ``data_helper.get_reviews`` is forwarded as-is,
    along with ``feat_name`` and ``binning``, to
    ``get_features_category_tuples``.

    Returns:
        The ``(features_category_tuples, texts)`` pair produced by
        ``get_features_category_tuples``.
    """
    review_path = os.path.join("./", data_file)
    reviews_by_category = data_helper.get_reviews(review_path)

    # Feature extraction is delegated entirely to the helper.
    feature_tuples, raw_texts = get_features_category_tuples(
        reviews_by_category, feat_name, binning)
    return feature_tuples, raw_texts
def build_features(data_file, feat_name, save_feats=None, binning=False):
    """Read reviews from ``DATA_DIR/data_file`` and build feature tuples.

    The two collections returned by ``data_helper.get_reviews`` are keyed
    as "positive" and "negative" before being handed to
    ``features.get_features_category_tuples`` together with ``feat_name``
    and ``data_file``.

    Args:
        data_file: File name, joined onto ``DATA_DIR``.
        feat_name: Forwarded to the feature extractor.
        save_feats: When not ``None``, passed to
            ``write_features_category`` along with the built features.
        binning: Accepted but never read inside this function.

    Returns:
        The ``(features_category_tuples, texts)`` pair from the extractor.
    """
    source_path = os.path.join(DATA_DIR, data_file)
    pos_reviews, neg_reviews = data_helper.get_reviews(source_path)
    labelled_reviews = dict(positive=pos_reviews, negative=neg_reviews)

    feature_tuples, raw_texts = features.get_features_category_tuples(
        labelled_reviews, feat_name, data_file)

    # Persisting the features is optional and driven solely by save_feats.
    if save_feats is not None:
        write_features_category(feature_tuples, save_feats)

    return feature_tuples, raw_texts
Ejemplo n.º 3
0
def build_features(data_file, feat_name, save_feats=None, binning=False):
    """Build feature tuples from the reviews contained in ``data_file``.

    ``data_file`` is passed to ``data_helper.read_file`` and the result to
    ``data_helper.get_reviews``, which yields two collections that are
    labelled "positive" and "negative" here.

    Args:
        data_file: Passed unchanged to ``data_helper.read_file``.
        feat_name: Forwarded to ``get_features_category_tuples``.
        save_feats: When not ``None``, passed to
            ``write_features_category`` along with the built features.
        binning: Accepted but never read inside this function.

    Returns:
        The ``(features_category_tuples, texts)`` pair from the extractor.
    """
    pos_reviews, neg_reviews = data_helper.get_reviews(
        data_helper.read_file(data_file))

    labelled_reviews = {
        "positive": pos_reviews,
        "negative": neg_reviews,
    }
    feature_tuples, raw_texts = get_features_category_tuples(
        labelled_reviews, feat_name)

    # Nothing is written unless the caller supplied a save target.
    if save_feats is not None:
        write_features_category(feature_tuples, save_feats)

    return feature_tuples, raw_texts
Ejemplo n.º 4
0
def build_features(data_file, feat_name, binning, save_feats=None, test=False):
    """Read reviews from ``DATA_DIR/data_file`` and build feature tuples.

    Args:
        data_file: File name, joined onto ``DATA_DIR``.
        feat_name: Forwarded to ``get_features_category_tuples``.
        binning: Forwarded to ``get_features_category_tuples``.
        save_feats: When not ``None``, passed to
            ``write_features_category`` together with ``test``.
        test: When truthy, the two review collections are keyed
            "unknown" / "unknown2" instead of "positive" / "negative".

    Returns:
        The ``(features_category_tuples, texts)`` pair from the extractor.
    """
    review_groups = data_helper.get_reviews(os.path.join(DATA_DIR, data_file))
    first_group, second_group = review_groups

    # Only the dictionary keys depend on the test flag; the order of the
    # two collections is the same in both modes.
    labels = ("unknown", "unknown2") if test else ("positive", "negative")
    labelled_reviews = dict(zip(labels, (first_group, second_group)))

    feature_tuples, raw_texts = get_features_category_tuples(
        labelled_reviews, feat_name, binning)

    if save_feats is not None:
        write_features_category(feature_tuples, save_feats, test)

    return feature_tuples, raw_texts
Ejemplo n.º 5
0
def build_features(data_file, feat_name):
    """Read reviews from ``DATA_DIR/data_file`` and build feature tuples.

    The two collections returned by ``data_helper.get_reviews`` are keyed
    as "positive" and "negative" and handed to
    ``get_features_category_tuples`` together with ``feat_name``.

    Returns:
        The ``(features_category_tuples, texts)`` pair from the extractor.
    """
    source_path = os.path.join(DATA_DIR, data_file)
    pos_reviews, neg_reviews = data_helper.get_reviews(source_path)

    labelled_reviews = dict(positive=pos_reviews, negative=neg_reviews)
    feature_tuples, raw_texts = get_features_category_tuples(
        labelled_reviews, feat_name)

    return feature_tuples, raw_texts
Ejemplo n.º 6
0
def build_features(data_file, feat_name):
    """Build feature tuples for ``data_file`` and always write them out.

    Reviews are read from ``DATA_DIR/data_file``, keyed as "positive" and
    "negative", and passed to ``get_features_category_tuples``. The result
    is then handed to ``write_features_category`` under the name
    ``"<feat_name>-<split>"``, where ``<split>`` is "development" for
    "dev_examples.tsv" and "training" for "train_examples.tsv".

    Returns:
        The ``(features_category_tuples, texts)`` pair from the extractor.

    Raises:
        KeyError: If ``str(data_file)`` is neither of the two file names
            above. The lookup happens after the features have been built.
    """
    source_path = os.path.join(DATA_DIR, data_file)
    pos_reviews, neg_reviews = data_helper.get_reviews(source_path)

    labelled_reviews = {
        "positive": pos_reviews,
        "negative": neg_reviews,
    }
    feature_tuples, raw_texts = get_features_category_tuples(
        labelled_reviews, feat_name)

    # Translate the input file name into the split label used in the
    # name given to the writer.
    split_names = {
        "dev_examples.tsv": "development",
        "train_examples.tsv": "training",
    }
    output_name = "-".join((str(feat_name), split_names[str(data_file)]))
    write_features_category(feature_tuples, output_name)

    return feature_tuples, raw_texts
Ejemplo n.º 7
0
def build_features(data_file, feat_name, save_feats=None):
    """Read reviews from ``DATA_DIR/data_file`` and build feature tuples.

    When ``data_file`` equals "test.txt", the whole result of
    ``data_helper.get_reviews`` is stored under the single key
    "test data". For any other file the result is unpacked into two
    collections keyed "positive" and "negative".

    Args:
        data_file: File name, joined onto ``DATA_DIR``.
        feat_name: Forwarded to ``get_features_category_tuples``.
        save_feats: When not ``None``, passed to
            ``write_features_category`` along with the built features.

    Returns:
        The ``(features_category_tuples, texts)`` pair from the extractor.
    """
    review_path = os.path.join(DATA_DIR, data_file)

    if data_file == "test.txt":
        # The reader's result is kept as one group, without unpacking.
        labelled_reviews = {"test data": data_helper.get_reviews(review_path)}
    else:
        pos_reviews, neg_reviews = data_helper.get_reviews(review_path)
        labelled_reviews = dict(positive=pos_reviews, negative=neg_reviews)

    feature_tuples, raw_texts = get_features_category_tuples(
        labelled_reviews, feat_name)

    if save_feats is not None:
        write_features_category(feature_tuples, save_feats)

    return feature_tuples, raw_texts