def __init__(self, populate_for_first_four_weeks):
    """Load the precomputed lookup maps from their pickle files.

    Every map except ``blog_topic_distribution_map`` is read from a pickle
    whose name is the attribute name followed by the suffix returned by
    ``get_pickle_file_suffix(populate_for_first_four_weeks)``.

    Args:
        populate_for_first_four_weeks: forwarded unchanged to
            ``get_pickle_file_suffix`` to choose the pickle-name suffix
            (presumably a boolean flag -- confirm against the helper).
    """

    def load_suffixed(map_name):
        # The suffix is looked up once per map, right before unpickling.
        return unpickle(
            map_name + get_pickle_file_suffix(populate_for_first_four_weeks))

    # Blog / author post counts.
    self.blog_post_count_map = load_suffixed('blog_post_count_map')
    self.blog_author__post_count_map = load_suffixed(
        'blog_author__post_count_map')

    # Like relationships between users and blogs.
    self.user_likes_map = load_suffixed('user_likes_map')
    self.user_liked_blogs_map = load_suffixed('user_liked_blogs_map')
    self.blog_liked_users_map = load_suffixed('blog_liked_users_map')

    # Tag / category counts per blog and per user.
    self.tag_blog_count_map = load_suffixed('tag_blog_count_map')
    self.category_blog_count_map = load_suffixed('category_blog_count_map')
    self.tag_user_count_map = load_suffixed('tag_user_count_map')
    self.category_user_count_map = load_suffixed('category_user_count_map')

    # This map is stored under a fixed name, without any suffix.
    self.blog_topic_distribution_map = unpickle('blog_topic_distribution_map')
def __init__(self, populate_for_first_four_weeks):
    """Populate the instance with lookup maps read via ``unpickle``.

    Nine of the maps are stored under ``<attribute name><suffix>``, where the
    suffix comes from ``get_pickle_file_suffix(populate_for_first_four_weeks)``;
    ``blog_topic_distribution_map`` is stored under its plain name.

    Args:
        populate_for_first_four_weeks: passed straight through to
            ``get_pickle_file_suffix`` (looks like a flag selecting which
            set of pickles to read -- verify against that helper).
    """

    def read_map(base_name):
        # One suffix lookup per map, immediately followed by the unpickle.
        pickle_name = base_name + get_pickle_file_suffix(
            populate_for_first_four_weeks)
        return unpickle(pickle_name)

    # Post counts.
    self.blog_post_count_map = read_map('blog_post_count_map')
    self.blog_author__post_count_map = read_map('blog_author__post_count_map')

    # User <-> blog likes.
    self.user_likes_map = read_map('user_likes_map')
    self.user_liked_blogs_map = read_map('user_liked_blogs_map')
    self.blog_liked_users_map = read_map('blog_liked_users_map')

    # Tag and category counts.
    self.tag_blog_count_map = read_map('tag_blog_count_map')
    self.category_blog_count_map = read_map('category_blog_count_map')
    self.tag_user_count_map = read_map('tag_user_count_map')
    self.category_user_count_map = read_map('category_user_count_map')

    # Not suffixed: always read from the same pickle name.
    self.blog_topic_distribution_map = unpickle('blog_topic_distribution_map')
from v2.train_feature_util import train_feature_util
from v1.test_util import load_test_users

# Module-level settings.
lines_to_read = -1
max_post_to_compare = 2

# Test start date, kept both as text and as a parsed datetime (midnight).
test_start_date = '2012-04-30'
test_start_date__struct = datetime.strptime(
    test_start_date + ' 00:00:00',
    '%Y-%m-%d %H:%M:%S',
)

################################################################################################################################

# Logging is configured before anything is unpickled.
logging.basicConfig(
    format='%(asctime)s : %(levelname)s : %(message)s',
    level=logging.INFO,
)
logger = logging.getLogger('test_csv_generator')

################################################################################################################################

test_blog_post_tuples_map = unpickle('test_blog_post_tuples_map')

################################################################################################################################


def get_day_since_test_start_date(date_struct):
    """Return the 1-based day number of ``date_struct``, clamped to 1..7.

    The day number is the whole-day difference between ``date_struct`` and
    ``test_start_date__struct`` plus one, so a datetime less than one day
    after the start maps to 1. Values below 1 are reported as 1 and values
    above 7 as 7.
    """
    day_number = (date_struct - test_start_date__struct).days + 1
    # Clamp into the closed range [1, 7].
    return min(max(day_number, 1), 7)


################################################################################################################################

# build test CSV
import logging

from v1.config_and_pickle import generated_loc, unpickle
from v2.train_feature_util import train_feature_util
from v1.test_util import load_test_users

# Module-level settings.
lines_to_read = -1
max_post_to_compare = 2

# Test start date as text, and the same date parsed at midnight.
test_start_date = "2012-04-30"
test_start_date__struct = datetime.strptime(
    test_start_date + " 00:00:00",
    "%Y-%m-%d %H:%M:%S",
)

################################################################################################################################

# Configure logging first so later steps can report progress.
logging.basicConfig(
    format="%(asctime)s : %(levelname)s : %(message)s",
    level=logging.INFO,
)
logger = logging.getLogger("test_csv_generator")

################################################################################################################################

test_blog_post_tuples_map = unpickle("test_blog_post_tuples_map")

################################################################################################################################


def get_day_since_test_start_date(date_struct):
    """Map ``date_struct`` to a day number between 1 and 7 inclusive.

    Computes the whole-day difference from ``test_start_date__struct`` plus
    one, then limits the result: anything at or below 1 becomes 1, anything
    at or above 7 becomes 7.
    """
    days_elapsed = (date_struct - test_start_date__struct).days + 1
    # Equivalent to clamping days_elapsed into [1, 7].
    return max(1, min(days_elapsed, 7))


################################################################################################################################

# build test CSV
logger.info("started building test CSV...")