Exemplo n.º 1
0
    def __init__(self, populate_for_first_four_weeks):
        """Load the pickled lookup maps used by this object.

        Nine of the maps are read from pickles whose name is the map name
        followed by the suffix returned by ``get_pickle_file_suffix``; the
        topic-distribution map is read from an unsuffixed pickle.

        Args:
            populate_for_first_four_weeks: forwarded unchanged to
                ``get_pickle_file_suffix`` to choose which set of suffixed
                pickles is loaded.
        """
        # The suffix depends only on the constructor argument, so compute it
        # once instead of once per map.
        suffix = get_pickle_file_suffix(populate_for_first_four_weeks)

        self.blog_post_count_map = unpickle('blog_post_count_map' + suffix)
        self.blog_author__post_count_map = unpickle(
            'blog_author__post_count_map' + suffix)
        self.user_likes_map = unpickle('user_likes_map' + suffix)
        self.user_liked_blogs_map = unpickle('user_liked_blogs_map' + suffix)
        self.blog_liked_users_map = unpickle('blog_liked_users_map' + suffix)
        self.tag_blog_count_map = unpickle('tag_blog_count_map' + suffix)
        self.category_blog_count_map = unpickle(
            'category_blog_count_map' + suffix)
        self.tag_user_count_map = unpickle('tag_user_count_map' + suffix)
        self.category_user_count_map = unpickle(
            'category_user_count_map' + suffix)

        # Loaded without the suffix: the same pickle is used regardless of
        # populate_for_first_four_weeks.
        self.blog_topic_distribution_map = unpickle(
            'blog_topic_distribution_map')
Exemplo n.º 2
0
    def __init__(self, populate_for_first_four_weeks):
        """Load the pickled lookup maps used by this object.

        Nine of the maps come from pickles named ``<map name><suffix>``, where
        the suffix is whatever ``get_pickle_file_suffix`` returns for the
        given flag. The topic-distribution map comes from an unsuffixed
        pickle.

        Args:
            populate_for_first_four_weeks: forwarded unchanged to
                ``get_pickle_file_suffix`` to choose which set of suffixed
                pickles is loaded.
        """
        # Compute the suffix once; it is the same for every suffixed map.
        suffix = get_pickle_file_suffix(populate_for_first_four_weeks)

        def load(map_name):
            # Read the suffixed pickle that belongs to map_name.
            return unpickle(map_name + suffix)

        self.blog_post_count_map = load('blog_post_count_map')
        self.blog_author__post_count_map = load('blog_author__post_count_map')
        self.user_likes_map = load('user_likes_map')
        self.user_liked_blogs_map = load('user_liked_blogs_map')
        self.blog_liked_users_map = load('blog_liked_users_map')
        self.tag_blog_count_map = load('tag_blog_count_map')
        self.category_blog_count_map = load('category_blog_count_map')
        self.tag_user_count_map = load('tag_user_count_map')
        self.category_user_count_map = load('category_user_count_map')

        # Loaded without the suffix: the same pickle is used regardless of
        # populate_for_first_four_weeks.
        self.blog_topic_distribution_map = unpickle('blog_topic_distribution_map')
Exemplo n.º 3
0
from v2.train_feature_util import train_feature_util
from v1.test_util import load_test_users

# First day of the test period, as text and as a datetime at midnight.
test_start_date = '2012-04-30'
test_start_date__struct = datetime.strptime(
    test_start_date + ' 00:00:00', '%Y-%m-%d %H:%M:%S')

# Processing limits.
# NOTE(review): -1 presumably means "no limit" -- confirm where it is used.
lines_to_read = -1
max_post_to_compare = 2

################################################################################################################################
# Configure the root logger: "<time> : <level> : <message>" at INFO level.
logging.basicConfig(format='%(asctime)s : %(levelname)s : %(message)s',
                    level=logging.INFO)
# Named logger for this script.
logger = logging.getLogger('test_csv_generator')
################################################################################################################################
# Load the 'test_blog_post_tuples_map' pickle through the project's unpickle
# helper at import time.
# NOTE(review): presumably maps a blog to its test-period post tuples --
# confirm against the code that writes this pickle.
test_blog_post_tuples_map = unpickle('test_blog_post_tuples_map')


################################################################################################################################
def get_day_since_test_start_date(date_struct):
    """Return the 1-based day number of date_struct, clamped to 1..7.

    The day number is the count of whole days between
    test_start_date__struct and date_struct, plus one, so the start date
    itself is day 1. Anything earlier yields 1; anything from day 7 onward
    yields 7.

    Args:
        date_struct: a value that can be subtracted from
            test_start_date__struct to give an object with a ``days``
            attribute (a datetime, given how the start date is built).

    Returns:
        An int between 1 and 7 inclusive.
    """
    day_number = (date_struct - test_start_date__struct).days + 1
    # Clamp into the 1..7 range.
    return min(max(day_number, 1), 7)


################################################################################################################################
#build test CSV
Exemplo n.º 4
0
import logging
from v1.config_and_pickle import generated_loc, unpickle
from v2.train_feature_util import train_feature_util
from v1.test_util import load_test_users

# First day of the test period, as text and as a datetime at midnight.
test_start_date = "2012-04-30"
test_start_date__struct = datetime.strptime(
    test_start_date + " 00:00:00",
    "%Y-%m-%d %H:%M:%S",
)

# Processing limits.
# NOTE(review): -1 presumably means "no limit" -- confirm where it is used.
lines_to_read = -1
max_post_to_compare = 2

################################################################################################################################
# Configure the root logger: "<time> : <level> : <message>" at INFO level.
logging.basicConfig(format="%(asctime)s : %(levelname)s : %(message)s", level=logging.INFO)
# Named logger for this script.
logger = logging.getLogger("test_csv_generator")
################################################################################################################################
# Load the "test_blog_post_tuples_map" pickle through the project's unpickle
# helper at import time.
# NOTE(review): presumably maps a blog to its test-period post tuples --
# confirm against the code that writes this pickle.
test_blog_post_tuples_map = unpickle("test_blog_post_tuples_map")
################################################################################################################################
def get_day_since_test_start_date(date_struct):
    """Return the 1-based day number of date_struct, clamped to 1..7.

    The start date (test_start_date__struct) counts as day 1. Earlier dates
    also map to 1, and dates on or after the seventh day map to 7.

    Args:
        date_struct: a value that can be subtracted from
            test_start_date__struct to give an object with a ``days``
            attribute (a datetime, given how the start date is built).

    Returns:
        An int between 1 and 7 inclusive.
    """
    day_number = (date_struct - test_start_date__struct).days + 1
    # Guard clauses for the two ends of the allowed range.
    if day_number <= 1:
        return 1
    if day_number >= 7:
        return 7
    return day_number


################################################################################################################################
# build test CSV
logger.info("started building test CSV...")