Exemplo n.º 1
0
def createAnddisplayCatHisto():
    data = bowu.getSetOfCatagoriesWithCounts(10)
    X = np.arange(len(data))
    plt.bar(X, data.values(), align='center', width=0.5)
    plt.xticks(X, data.keys())
    ymax = max(data.values()) + 1
    plt.ylim(0, ymax)
    plt.title("Number of Review per Categorys ")
    plt.xlabel("Category")
    plt.ylabel("Number of Reviews")
    plt.show()
def sentenceCount(text):
    period_split = text.split(".")
    exclamation_split = []
    [exclamation_split.extend(s.split("!")) for s in period_split]
    question_split = []
    [question_split.extend(s.split("?")) for s in exclamation_split]
    return len(question_split)-1


if __name__ == "__main__":
    stars = (1,2,3,4,5)
    number_of_reviews = 5
    word_averages = []
    sentence_averages = []
    for star in stars:
        reviews = bow.getReviews(number_of_reviews, star)
        word_average = 0
        sentence_average = 0
        for r in reviews:
            word_average += wordCount(r)
            sentence_average += sentenceCount(r)
        word_averages.append(word_average / number_of_reviews)
        sentence_averages.append(sentence_average / number_of_reviews)
    print(word_averages)
    print(sentence_averages)

    bar_width = .75

    plt.title("Average Word Count Per Review by Star Rating")
    plt.xlabel("Star Rating")
    plt.ylabel("Number of Words")