Ejemplo n.º 1
0
def seed_tweets(query, starting_max_id, ending_max_id, count, number_of_queries):
    positive_tweets = 790178
    negative_tweets = 788437
    id_range = ending_max_id - starting_max_id
    iteration = id_range // number_of_queries
    for x in range(number_of_queries):
        twitter = Twython(APP_KEY, APP_SECRET)
        search = twitter.search(q=query, max_id=starting_max_id, count=count)
        tweets = search['statuses']
        for tweet in tweets:
            for candidate in candidate_list:
                if candidate in tweet['text']:
                    try:
                        formatted_timestamp = time.strftime('%Y-%m-%d %H:%M:%S', time.strptime(tweet['created_at'],'%a %b %d %H:%M:%S +0000 %Y'))
                        bayes_score = bayes_analysis(tweet['text'], positive_tweets, negative_tweets)
                        tweet_object = Tweet(text =tweet['text'], date=formatted_timestamp, query_string=query, candidate=candidate, score=bayes_score)
                        tweet_object.save()
                    except:
                        continue
        starting_max_id += iteration
Ejemplo n.º 2
0
# from sentiment.secret import * (pull in API credentials)

from twython import Twython
from sentiment.models import Tweet
import time
from sentiment.bayes import bayes_analysis, training_model

candidate_list = ["Trump", "Bush", "Walker", "Huckabee", "Carson", "Cruz", "Rubio", "Paul", "Christie", "Kasich"]

bayes_analysis("hello",2,1)

def seed_tweets(query, starting_max_id, ending_max_id, count, number_of_queries):
    positive_tweets = 790178
    negative_tweets = 788437
    id_range = ending_max_id - starting_max_id
    iteration = id_range // number_of_queries
    for x in range(number_of_queries):
        twitter = Twython(APP_KEY, APP_SECRET)
        search = twitter.search(q=query, max_id=starting_max_id, count=count)
        tweets = search['statuses']
        for tweet in tweets:
            for candidate in candidate_list:
                if candidate in tweet['text']:
                    try:
                        formatted_timestamp = time.strftime('%Y-%m-%d %H:%M:%S', time.strptime(tweet['created_at'],'%a %b %d %H:%M:%S +0000 %Y'))
                        bayes_score = bayes_analysis(tweet['text'], positive_tweets, negative_tweets)
                        tweet_object = Tweet(text =tweet['text'], date=formatted_timestamp, query_string=query, candidate=candidate, score=bayes_score)
                        tweet_object.save()
                    except:
                        continue