Python Features.add_item Examples

Programming Language: Python

Namespace/Package Name: experiments.data

Class/Type: Features

Method/Function: add_item

Examples at hotexamples.com: 4

Python Features.add_item - 4 examples found. These are the top-rated real-world Python examples of experiments.data.Features.add_item, extracted from open source projects. You can rate the examples to help us improve their quality.

Frequently Used Methods

Show Hide

Features(3)

add_feature(3)

set_shape(3)

add_item(2)

add_title(1)

item_ids(1)

Example #1

Show file

File: data.py Project: pombredanne/lightfm-paper

def read_movie_features(titles=False, genres=False, genome_tag_threshold=1.0, tag_popularity_threshold=30):
    """
    Build a Features object from movies.dat and the genome tags.

    Each line of movies.dat is split on SEPARATOR into an item id, a title
    and a "|"-delimited genre field. Every item is registered with
    add_item() and its title is passed to add_title(); the genre and title
    features are optional.

    titles: when truthy, add a "title:" feature (lowercased title) per movie.
    genres: when truthy, add a "genre:" feature (lowercased) per genre.
    genome_tag_threshold: a genome tag is added only when its relevance is
        >= this value and its item id is in features.item_ids.
    tag_popularity_threshold: not read by the active code; it is only
        referenced by the disabled user-tag block near the end.

    Returns the Features object after set_shape() has been called on it.
    """

    features = Features()
    movies_path = os.path.join(DATA_DIR, "movies.dat")

    with open(movies_path, "r") as moviefile:
        for record in moviefile:
            iid, title, genre_field = record.split(SEPARATOR)

            features.add_item(iid)

            if genres:
                # The genre field is the last one on the line, so an entry
                # may still carry the line's newline; strip it from the name.
                for genre in genre_field.split("|"):
                    genre_name = genre.lower().replace("\n", "")
                    features.add_feature(iid, "genre:" + genre_name)

            if titles:
                features.add_feature(iid, "title:" + title.lower())

            features.add_title(iid, title)

    for iid, tag, relevance in read_genome_tags():
        # Do not include any tags for movies not in the 10M dataset
        if relevance >= genome_tag_threshold:
            if iid in features.item_ids:
                features.add_feature(iid, "genome:" + tag.lower())

    # Tags applied by users (currently disabled)
    ## for iid, tag, count in read_tags():
    ##     if count >= tag_popularity_threshold and iid in features.item_ids:
    ##         features.add_feature(iid, 'tag:' + tag)

    features.set_shape()
    return features

Example #2

Show file

def read_movie_features(titles=False,
                        genres=False,
                        genome_tag_threshold=1.0,
                        tag_popularity_threshold=30):
    """
    Read movies.dat and the genome tags into a Features object.

    A line of movies.dat is split on SEPARATOR into (item id, title, genre
    field); the genre field is further split on '|'. Each item is added
    with add_item() and its title handed to add_title().

    titles: if truthy, each movie gets a 'title:' feature built from its
        lowercased title.
    genres: if truthy, each movie gets one 'genre:' feature per genre,
        lowercased and with newline characters removed.
    genome_tag_threshold: lower bound (inclusive) on the relevance of the
        genome tags that are added as 'genome:' features.
    tag_popularity_threshold: unused by the live code; only the disabled
        user-tag block below mentions it.

    Returns the populated Features object, after calling set_shape() on it.
    """

    features = Features()

    with open(os.path.join(DATA_DIR, 'movies.dat'), 'r') as moviefile:
        for row in moviefile:
            iid, title, genre_field = row.split(SEPARATOR)
            movie_genres = genre_field.split('|')

            features.add_item(iid)

            if genres:
                for entry in movie_genres:
                    cleaned = entry.lower().replace('\n', '')
                    features.add_feature(iid, 'genre:' + cleaned)

            if titles:
                lowered_title = title.lower()
                features.add_feature(iid, 'title:' + lowered_title)

            features.add_title(iid, title)

    for iid, tag, relevance in read_genome_tags():
        # Do not include any tags for movies not in the 10M dataset
        wanted = (relevance >= genome_tag_threshold
                  and iid in features.item_ids)
        if wanted:
            features.add_feature(iid, 'genome:' + tag.lower())

    # Tags applied by users (currently disabled)
    ## for iid, tag, count in read_tags():
    ##     if count >= tag_popularity_threshold and iid in features.item_ids:
    ##         features.add_feature(iid, 'tag:' + tag)

    features.set_shape()
    return features

Example #3

Show file

File: data.py Project: doheelab/lightfm_experiment

def read_post_features(tags, post_ids, post_text):
    """
    Build a Features object from the records yielded by read_post_data().

    Only records whose parent post id is None are used (questions, not
    answers, per the original note); each of those is registered with
    add_item().

    tags: if truthy, add a 'tag:' feature for every entry in the post's tags.
    post_ids: if truthy, add a 'post_id:' feature built from the post id.
    post_text: if truthy, add a 'body:' feature for every token in the body.

    Returns the Features object after set_shape() has been called on it.
    """

    features = Features()

    for post_id, _user_id, post_tags, parent_post_id, body in read_post_data():
        # Only get features for questions, not answers.
        if parent_post_id is not None:
            continue

        features.add_item(post_id)

        if post_ids:
            features.add_feature(post_id, 'post_id:' + post_id)

        if tags:
            for post_tag in post_tags:
                features.add_feature(post_id, 'tag:' + post_tag)

        if post_text:
            for word in body:
                features.add_feature(post_id, 'body:' + word)

    features.set_shape()
    return features

Example #4

Show file

File: data.py Project: hbudyanto/lightfm-paper

def read_post_features(tags, post_ids, post_text):
    """
    Collect per-post features from read_post_data() into a Features object.

    Records with a non-None parent post id are skipped; the remaining
    records (questions rather than answers, per the original note) are
    added with add_item() and then given the optional features below.

    tags: truthy to emit one 'tag:' feature per element of the post's tags.
    post_ids: truthy to emit a 'post_id:' feature for the post itself.
    post_text: truthy to emit one 'body:' feature per element of the body.

    Returns the Features object once set_shape() has been called on it.
    """

    features = Features()

    for record in read_post_data():
        post_id, _user_id, post_tags, parent_post_id, body = record

        # Only get features for questions, not answers.
        is_question = parent_post_id is None
        if not is_question:
            continue

        features.add_item(post_id)

        if post_ids:
            id_feature = 'post_id:' + post_id
            features.add_feature(post_id, id_feature)

        if tags:
            for tag in post_tags:
                tag_feature = 'tag:' + tag
                features.add_feature(post_id, tag_feature)

        if post_text:
            for token in body:
                body_feature = 'body:' + token
                features.add_feature(post_id, body_feature)

    features.set_shape()
    return features