Exemple #1
0
# -*- coding: utf-8 -*-
"""
Created on Thu Aug 15 22:13:12 2013

@author: Vasya
"""

import marginal_topics_distr as marg

agg = marg.compute_and_save('unbranded220topics',
                            r'Z:\ermunds\results\1 all 100 topics')
agg2002 = marg.compute_and_save('2002 20topics',
                                r'Z:\ermunds\results\2002 20topics')
agg2005 = marg.compute_and_save('2005 20topics',
                                r'Z:\ermunds\results\2005 20topics')
agg2009 = marg.compute_and_save('2009 20topics',
                                r'Z:\ermunds\results\2009 20topics')
agg2010 = marg.compute_and_save('2010 20topics',
                                r'Z:\ermunds\results\2010 20topics')
agg2011 = marg.compute_and_save('2011 20topics',
                                r'Z:\ermunds\results\2011 20topics')
agg2012 = marg.compute_and_save('2012 20topics',
                                r'Z:\ermunds\results\2012 20topics')
words = 'Arrogant	Authentic	Charming	Daring	Different	Distinctive	Dynamic	Friendly	Fun	Healthy	Helpful	Independent	Innovative	Intelligent	Kind	Leader	Obliging	Original	Prestigious	Progressive	Reliable	Restrained	Rugged	Simple	Social	Stylish	Traditional	Trendy	Trustworthy	Unique'.split()

import numpy as np
import os
import getLikes
import pandas as pd
import genSimLDAlib as gslib
import marginal_topics_distr as marginal

for year in range(2002,2013):
    print year
    modelDir = 'Z:\\ermunds\\results\\%d 20topics'%year
    modelName = '%d 20topics' %year
    
    marginal.compute_and_save(modelName=modelName, LDAdir=modelDir)
    topicsPs = np.genfromtxt(os.path.join(modelDir,'topics_marginal.csv'))
    
    (divs,_,_) = getLikes.get_divs (words,brands,indir=modelDir, modelName=modelName ,topics_marginal_probs=topicsPs)
    (sims,b,w) = getLikes.get_likes(words,brands,indir=modelDir, modelName=modelName )
    
    dirs = gslib.LDAdirs(modelName,modelDir)
    (dict1,_,lda)=gslib.loadStuff(dirs)  
    
    brands_df = getLikes.pruneWordsList(brands,lda)
    words_df = getLikes.pruneWordsList(words,lda)
    
    probs = getLikes.ptopic_given_word(lda,topicsPs)
    probs_df =  pd.DataFrame(probs, columns=lda.id2word.values())
    alls = pd.concat([ brands_df["IDs"] ,words_df["IDs"]])
    x = probs_df[alls]
Exemple #3
0
# -*- coding: utf-8 -*-
"""
Created on Thu Aug 15 22:13:12 2013

@author: Vasya
"""

import marginal_topics_distr as marg

agg =     marg.compute_and_save('unbranded220topics', r'Z:\ermunds\results\1 all 100 topics')
agg2002 = marg.compute_and_save('2002 20topics',r'Z:\ermunds\results\2002 20topics')
agg2005 = marg.compute_and_save('2005 20topics',r'Z:\ermunds\results\2005 20topics')
agg2009 = marg.compute_and_save('2009 20topics',r'Z:\ermunds\results\2009 20topics')
agg2010 = marg.compute_and_save('2010 20topics',r'Z:\ermunds\results\2010 20topics')
agg2011 = marg.compute_and_save('2011 20topics',r'Z:\ermunds\results\2011 20topics')
agg2012 = marg.compute_and_save('2012 20topics',r'Z:\ermunds\results\2012 20topics')
words = 'Arrogant	Authentic	Charming	Daring	Different	Distinctive	Dynamic	Friendly	Fun	Healthy	Helpful	Independent	Innovative	Intelligent	Kind	Leader	Obliging	Original	Prestigious	Progressive	Reliable	Restrained	Rugged	Simple	Social	Stylish	Traditional	Trendy	Trustworthy	Unique'.split(
)

import numpy as np
import os
import getLikes
import pandas as pd
import genSimLDAlib as gslib
import marginal_topics_distr as marginal

for year in range(2002, 2013):
    print year
    modelDir = 'Z:\\ermunds\\results\\%d 20topics' % year
    modelName = '%d 20topics' % year

    marginal.compute_and_save(modelName=modelName, LDAdir=modelDir)
    topicsPs = np.genfromtxt(os.path.join(modelDir, 'topics_marginal.csv'))

    (divs, _, _) = getLikes.get_divs(words,
                                     brands,
                                     indir=modelDir,
                                     modelName=modelName,
                                     topics_marginal_probs=topicsPs)
    (sims, b, w) = getLikes.get_likes(words,
                                      brands,
                                      indir=modelDir,
                                      modelName=modelName)

    dirs = gslib.LDAdirs(modelName, modelDir)
    (dict1, _, lda) = gslib.loadStuff(dirs)