def main():
    """Print the hashtags that co-occur with a queried hashtag.

    Reads the query with ``read_in()``, walks the tweets in
    ``test_database.tweets`` whose ``entities.hashtags.text`` matches it
    (descending ``_id`` order), and records every *other* hashtag of those
    tweets on a ``Trend`` object.  It then prints ``<query> :  <count>``
    followed by one ``<hashtag> :  <ratio>`` line per related hashtag, highest
    tally first, and finally clears the ``Trend`` object.
    """
    db = MongoClient().test_database
    QUERY = read_in()
    # Loop-invariant: every hashtag is compared against the lower-cased query.
    query_key = QUERY.lower()

    first = Trend()
    first.setName(QUERY)

    # NOTE(review): QUERY is compiled as a regular expression, so it matches
    # case-insensitively as a substring and regex metacharacters in it are
    # interpreted -- confirm that this is intended for user-supplied input.
    pattern = re.compile(QUERY, re.IGNORECASE)
    cursor = db.tweets.find({"entities.hashtags.text": pattern}).sort(
        [("_id", pymongo.DESCENDING)]
    )

    # Kept as a float so the total prints as e.g. "12.0" and the ratios below
    # use true division.
    n = 0.0
    for tweet in cursor:
        for hashtag in tweet["entities"]["hashtags"]:
            # Lower-case BEFORE encoding: lower() on UTF-8 bytes only folds
            # ASCII letters, so case variants of non-ASCII hashtags would
            # otherwise be tallied as different tags.
            tag = hashtag["text"].lower().encode("utf-8")
            if tag != query_key:
                first.addToRelated(tag, 1)
        # NOTE(review): the counter is assumed to advance once per matching
        # tweet (not once per hashtag) -- confirm against the intended layout.
        n += 1

    # Single-argument print with %-formatting emits the same text as the
    # Python 2 statement form ``print a, ": ", b`` (note the two spaces).
    print("%s :  %s" % (query_key, n))

    ranked = sorted(
        first.getRelated().items(), key=operator.itemgetter(1), reverse=True
    )
    for name, count in ranked:
        print("%s :  %s" % (name, float(count) / n))

    first.clear()
def main():
    """Report hashtags that appear alongside a queried hashtag.

    The query comes from ``read_in()``.  Tweets in ``test_database.tweets``
    whose ``entities.hashtags.text`` matches the query are visited in
    descending ``_id`` order; each hashtag on them that differs from the query
    is added to a ``Trend`` object with weight 1.  Output is a header line
    ``<query> :  <count>`` followed by ``<hashtag> :  <ratio>`` lines sorted by
    descending tally.  The ``Trend`` object is cleared before returning.
    """
    db = MongoClient().test_database
    QUERY = read_in()
    # Computed once instead of once per hashtag.
    query_key = QUERY.lower()

    first = Trend()
    first.setName(QUERY)

    # NOTE(review): the query is used as a regex pattern, i.e. an unanchored,
    # case-insensitive match in which metacharacters are live -- confirm this
    # is what callers of read_in() expect.
    pattern = re.compile(QUERY, re.IGNORECASE)
    matching = db.tweets.find({"entities.hashtags.text": pattern}).sort(
        [("_id", pymongo.DESCENDING)]
    )

    # Float on purpose: it is printed via str() ("12.0") and used as a divisor.
    n = 0.0
    for tweet in matching:
        for hashtag in tweet["entities"]["hashtags"]:
            # Case-fold the text first and encode afterwards; lower() on the
            # encoded bytes leaves non-ASCII upper-case letters untouched.
            tag = hashtag["text"].lower().encode("utf-8")
            if tag != query_key:
                first.addToRelated(tag, 1)
        # NOTE(review): assumed to count tweets, one increment per tweet --
        # confirm against the intended layout.
        n += 1

    # Same bytes as the Python 2 statement ``print a, ": ", b``; the
    # single-argument call form also parses on Python 3.
    print("%s :  %s" % (query_key, n))

    by_tally = sorted(
        first.getRelated().items(), key=operator.itemgetter(1), reverse=True
    )
    for name, count in by_tally:
        print("%s :  %s" % (name, float(count) / n))

    first.clear()
import getopt


def take(n, iterable):
    """Return the first ``n`` items of ``iterable`` as a list."""
    return list(islice(iterable, n))


# Script: list the hashtags that co-occur with QUERY in test_database.tweets
# and print each one's tally divided by the tweet counter ``n``.
db = MongoClient().test_database
# Float on purpose: printed via str() ("12.0") and used as a divisor below.
n = 0.0
QUERY = "diabetes"
# Loop-invariant: every hashtag is compared against the lower-cased query.
query_key = QUERY.lower()
first = Trend()
first.setName(QUERY)

# QUERY is compiled as a regular expression, so the match is an unanchored,
# case-insensitive one.  Tweets are visited in descending ``_id`` order.
for tweet in db.tweets.find(
    {"entities.hashtags.text": re.compile(QUERY, re.IGNORECASE)}
).sort([("_id", pymongo.DESCENDING)]):
    for hashtag in tweet["entities"]["hashtags"]:
        # Lower-case BEFORE encoding: lower() on UTF-8 bytes only folds ASCII
        # letters, so case variants of non-ASCII hashtags would otherwise be
        # tallied as different tags.
        tag = hashtag["text"].lower().encode("utf-8")
        if tag != query_key:
            first.addToRelated(tag, 1)
    # NOTE(review): the counter is assumed to advance once per matching tweet
    # (not once per hashtag) -- confirm against the intended layout.
    n = n + 1

# Single-argument print with %-formatting emits the same text as the Python 2
# statement form ``print a, ": ", b`` (note the two spaces after the colon).
print("%s :  %s" % (query_key, n))

top_10 = sorted(first.getRelated().items(), key=operator.itemgetter(1), reverse=True)
for top in top_10:
    # The Python 2 print statement writes no separator after an item ending in
    # a tab, so the tab is immediately followed by the hashtag.
    print("\t%s :  %s" % (top[0], float(top[1]) / n))

first.clear()
def take(n, iterable):
    """Return the first ``n`` items of ``iterable`` as a list."""
    return list(islice(iterable, n))


# Script: tally every hashtag (other than QUERY) across all documents in
# test_database.tweets and print the most frequent ones with their tally
# divided by the tweet counter ``n``.
db = MongoClient().test_database
# Float on purpose: printed via str() ("12.0") and used as a divisor below.
n = 0.0
QUERY = 'ROOT'
# Loop-invariant: every hashtag is compared against the lower-cased query.
query_key = QUERY.lower()
# Number of related hashtags to report (previously a bare literal).
MAX_RELATED = 20
first = Trend()
first.setName(QUERY)

for tweet in db.tweets.find():
    for hashtag in tweet["entities"]["hashtags"]:
        # Lower-case BEFORE encoding: lower() on UTF-8 bytes only folds ASCII
        # letters, so case variants of non-ASCII hashtags would otherwise be
        # tallied as different tags.
        tag = hashtag["text"].lower().encode("utf-8")
        if tag != query_key:
            first.addToRelated(tag, 1)
    # NOTE(review): the counter is assumed to advance once per tweet (not once
    # per hashtag) -- confirm against the intended layout.
    n = n + 1

# Single-argument print with %-formatting emits the same text as the Python 2
# statement form ``print a, ": ", b`` (note the two spaces after the colon).
print("%s :  %s" % (query_key, n))

# Despite its name, ``top_10`` holds up to MAX_RELATED entries; the name is
# kept because it is a module-level variable of this script.
top_10 = sorted(first.getRelated().items(), key=operator.itemgetter(1), reverse=True)
top_10 = take(MAX_RELATED, top_10)
for top in top_10:
    # The Python 2 print statement writes no separator after an item ending in
    # a tab, so the tab is immediately followed by the hashtag.
    print("\t%s :  %s" % (top[0], float(top[1]) / n))

# NOTE(review): assumed to run once after the loop, not once per row.
print(len(top_10))
first.clear()