def create_user_api(userdata_file):
    """Load every data row of a CSV file into the user store.

    Opens ``userdata_file``, skips its header record and hands each
    remaining row (the list of fields produced by ``csv.reader``) to
    ``UserAPI.create_user``. A progress message and the final row count
    are printed to stdout.

    Args:
        userdata_file: Path of the CSV file to import.
    """
    api = UserAPI()
    saved = 0
    # 'rb' is the mode the Python 2 csv module asks for.
    with open(userdata_file, 'rb') as csvfile:
        user_data = csv.reader(csvfile)
        # Skip the header through the reader (not the raw file) so a quoted,
        # multi-line header is consumed as one record; the default keeps an
        # empty file from raising StopIteration.
        next(user_data, None)
        print("Storing users in MongDB... Please Wait.")
        for saved, row in enumerate(user_data, 1):
            api.create_user(row)
    # The original author noted 14,388,386 user lines for the full data set.
    print("%d users saved" % saved)
#!/usr/bin/env python
# -*- coding: utf-8 -*-

'''
This is a test for user db interactions
'''

import csv
from collections import Counter
from test_helpers import TestHelpers

# Must run before the ``lib.users`` import below.
# NOTE(review): presumably this extends sys.path so ``lib`` is importable -
# confirm against TestHelpers.
helpers = TestHelpers()
helpers.add_relative_path()

from lib.users import UserAPI

api = UserAPI()

# Look up the province of one hard-coded user id and show the result.
result = api.get_province("uHRWEYSX0")
print(result)

userdata_file = "/home/clemsos/Dev/mitras/lib/cities/usersample.csv"


def test_write_users(userdata_file):
    '''Pass every data row of a CSV file to ``api.create_user``.

    The header record is skipped; each following row is handed over as the
    list of fields produced by ``csv.reader``.

    Args:
        userdata_file: Path of the CSV file to read.
    '''
    # 'rb' is the mode the Python 2 csv module asks for.
    with open(userdata_file, 'rb') as csvfile:
        # NOTE(review): this counter is never read in the visible part of
        # the function - drop it if the function really ends here.
        i = 0
        user_data = csv.reader(csvfile)
        # Skip the header through the reader; the default keeps an empty
        # file from raising StopIteration.
        next(user_data, None)
        for row in user_data:
            api.create_user(row)
t0=time() minetweet.init_tweet_regex() locale.setlocale(locale.LC_ALL, "") nlp=NLPMiner() stoplist=[i.strip() for i in open("lib/stopwords/zh-stopwords","r")] stoplist+=[i.strip() for i in open("lib/stopwords/stopwords.txt","r")] stoplist+=["转发","微博","说 ","一个","【 ","年 ","转 ","请","" ","问题","知道","中 ","已经","现在","说","【",'"',"年","中","今天","应该","真的","月","希望","想","日","这是","太","转","支持"] # stoplist+=["事儿","中国"] api=UserAPI() words_users_time=[] def get_province(_userid): province_code= api.get_province(_userid) # print province_code try : return api.provinces[province_code] except KeyError : return 0 pass def analyze_meme(meme_name): # Init tstart=time()
#!/usr/bin/env python
# -*- coding: utf-8 -*-

# Import script: reads the user CSV and stores every row through UserAPI.

import csv
from lib.users import UserAPI

api = UserAPI()

userdata_file = "/home/clemsos/Dev/mitras/data/datazip/others/userdata.csv"
# Alternative input path (left disabled):
# userdata_file="/home/clemsos/Dev/mitras/lib/cities/usersample.csv"
# number of lines : 14,388,386 users

# 'rb' is the mode the Python 2 csv module asks for.
with open(userdata_file, 'rb') as csvfile:
    i = 0  # stays 0 when the file holds no data rows
    user_data = csv.reader(csvfile)
    # Skip the header through the reader (not the raw file) so a quoted,
    # multi-line header is consumed as one record; the default keeps an
    # empty file from raising StopIteration.
    next(user_data, None)
    print("Storing users... Please Wait.")
    for i, row in enumerate(user_data, 1):
        api.create_user(row)

print("%d users saved" % i)
# NOTE(review): csv is used below but no import of it is visible in this
# excerpt; importing it here is harmless if it is already imported above.
import csv
from collections import Counter
from lib.users import UserAPI

# variables
meme_name = "thevoice"
map_title = "Population of Sina Weibo users for The Voice"
map_desc = "Based on Sina Weibo user profiles info. Data from HKU Weiboscope."
map_credits = "by Clement Renaud - 2013"
map_units = "Volume of tweets (per 100)"

tweets_file = "/home/clemsos/Dev/mitras/results/" + meme_name + "/" + meme_name + ".csv"
# Alternative input path (left disabled):
#tweets_file="/home/clemsos/Dev/mitras/lib/cities/usersample.csv"

# get user data
api = UserAPI()

# One entry per tweet row whose province code is found in api.provinces.
user_provinces = []

# 'rb' is the mode the Python 2 csv module asks for.
with open(tweets_file, 'rb') as csvfile:
    weibo_data = csv.reader(csvfile)
    # Skip the header through the reader; the default keeps an empty file
    # from raising StopIteration.
    next(weibo_data, None)
    print("processing tweets...")
    for tweet in weibo_data:
        # The first column is passed to get_province as the user id.
        province_code = api.get_province(tweet[0])
        try:
            province = api.provinces[province_code]
        except KeyError:
            # Province code missing from api.provinces: report and move on.
            print("error")
        else:
            user_provinces.append(province)
#!/usr/bin/env python
# -*- coding: utf-8 -*-

'''
This is a test for user db interactions
'''

import csv
from collections import Counter
from test_helpers import TestHelpers

# Must run before the ``lib.users`` import below.
# NOTE(review): presumably this extends sys.path so ``lib`` is importable -
# confirm against TestHelpers.
helpers = TestHelpers()
helpers.add_relative_path()

from lib.users import UserAPI

api = UserAPI()

# Look up the province of one hard-coded user id and show the result.
result = api.get_province("uHRWEYSX0")
print(result)

userdata_file = "/home/clemsos/Dev/mitras/lib/cities/usersample.csv"


def test_write_users(userdata_file):
    '''Pass every data row of a CSV file to ``api.create_user``.

    The header record is skipped; each following row is handed over as the
    list of fields produced by ``csv.reader``.

    Args:
        userdata_file: Path of the CSV file to read.
    '''
    # 'rb' is the mode the Python 2 csv module asks for.
    with open(userdata_file, 'rb') as csvfile:
        # NOTE(review): this counter is never read in the visible part of
        # the function - drop it if the function really ends here.
        i = 0
        user_data = csv.reader(csvfile)
        # Skip the header through the reader; the default keeps an empty
        # file from raising StopIteration.
        next(user_data, None)
        for row in user_data:
            api.create_user(row)
#!/usr/bin/env python
# -*- coding: utf-8 -*-

# Import script: reads the user CSV and stores every row through UserAPI.

import csv
from lib.users import UserAPI

api = UserAPI()

userdata_file = "/home/clemsos/Dev/mitras/data/datazip/others/userdata.csv"
# Alternative input path (left disabled):
# userdata_file="/home/clemsos/Dev/mitras/lib/cities/usersample.csv"
# number of lines : 14,388,386 users

# 'rb' is the mode the Python 2 csv module asks for.
with open(userdata_file, 'rb') as csvfile:
    i = 0  # stays 0 when the file holds no data rows
    user_data = csv.reader(csvfile)
    # Skip the header through the reader (not the raw file) so a quoted,
    # multi-line header is consumed as one record; the default keeps an
    # empty file from raising StopIteration.
    next(user_data, None)
    print("Storing users... Please Wait.")
    for i, row in enumerate(user_data, 1):
        api.create_user(row)

print("%d users saved" % i)