Beispiel #1
0
def Graph_Ratings(sort="UserRatings",
                  order="DESC",
                  count=10,
                  minimum_reviews=20):
    """Plot average critic rating against average user rating per film.

    Args:
        sort: Column or alias placed in the ORDER BY clause. It is
            interpolated into the SQL text as-is, so it must come from
            trusted code, never directly from user input.
        order: Sort direction placed after ``sort`` (e.g. ``"DESC"``). Also
            interpolated into the SQL text as-is.
        count: Passed to the query builder as ``limit``.
        minimum_reviews: Right-hand side of the ``COUNT(*) >`` filter given
            to the per-movie ratings sub query.

    Returns:
        A ``(plot, raw_data)`` tuple. ``plot`` is whatever ``offline.plot``
        returns for ``output_type="div"``; ``raw_data`` is the list of rows
        fetched from the database (Title, Release, AvgCriticRating,
        AvgUserRating, RatingDiff).
    """
    # sub query to get the average rating by movie from the ratings table
    sub_query = selectQueryBuilder(
        columns=['MovieID', 'AVG(Rating) AS UserRatings'],
        table='Ratings',
        group_by='MovieID',
        filter=['COUNT(*)', '>', minimum_reviews])
    query = selectQueryBuilder(
        columns=[
            'Title',
            'Release',
            'ROUND(((Rating_IMDB*10)+(Rating_RT*1)+Rating_MC)/3,2) AS AvgCriticRating',  # convert all of the ratings to a 100 point scale and average them out
            'ROUND(UserRatings*20,2) AS AvgUserRating',  # convert the user ratings to a 100 point scale
            'ABS(ROUND(((((Rating_IMDB*10)+(Rating_RT*1)+Rating_MC)/3)-(UserRatings*20)),2)) AS RatingDiff '  # just ABS(AvgCriticRating-AvgUserRating)
        ],
        table='Film',
        joins="JOIN (" + sub_query + ") ON FilmID == MovieID",
        filter=["AvgCriticRating", "IS NOT", "NULL"],
        order_by="{} {}".format(sort, order),
        limit=count)

    # Fetch everything up front so the connection can be released before
    # any plotting work happens (and is released even if the query fails).
    conn = sqlite.connect(DATABASE_NAME)
    try:
        cur = conn.cursor()
        cur.execute(query)
        raw_data = cur.fetchall()
    finally:
        conn.close()

    trace1 = PlotlyBarTrace("Average Critic Rating")
    trace2 = PlotlyBarTrace("Average User Rating")
    for row in raw_data:
        # Both traces share the same "Title (Release)" label.
        label = "{} ({})".format(row[0], row[1])

        trace1.labels.append(label)
        trace1.values.append(row[2])

        trace2.labels.append(label)
        trace2.values.append(row[3])

    data = [trace1.GetBar(), trace2.GetBar()]

    layout = go.Layout(barmode="group",
                       title="Avg Critic Rating VS Avg User Rating")

    fig = go.Figure(data=data, layout=layout)

    return offline.plot(fig,
                        show_link=False,
                        output_type="div",
                        include_plotlyjs=False), raw_data
Beispiel #2
0
def Graph_MovieRatings(title, year):
    """Plot the individual user ratings recorded for one film.

    Args:
        title: Film title matched with ``Title =`` in the Film table.
        year: Release year; matched as a prefix of ``Release`` via
            ``LIKE '<year>%'``. May be given as a string or an integer.

    Returns:
        A ``(box_plot, scatter_plot, raw_data)`` tuple. The two plots are
        whatever ``offline.plot`` returns for ``output_type="div"``;
        ``raw_data`` is the list of (UserID, Rating, Date) rows ordered by
        date descending, or ``None`` when the query returned no rows.
    """
    sub_query = selectQueryBuilder(
        columns='FilmID',
        table='Film',
        # str() so an integer year does not raise TypeError on concatenation
        filter=[['Title', "=", title], "AND",
                ['Release', 'LIKE', str(year) + '%']])
    query = selectQueryBuilder(
        columns=[
            'UserID', 'Rating', 'datetime(Timestamp, \'unixepoch\') As Date'
        ],  #https://stackoverflow.com/questions/14629347/how-to-convert-unix-epoch-time-in-sqlite
        table='Ratings',
        filter=['MovieID', '=', "(" + sub_query + ")"],
        order_by="Date DESC")

    # Read all rows first so the connection is always closed, even when the
    # query raises.
    conn = sqlite.connect(DATABASE_NAME)
    try:
        cur = conn.cursor()
        cur.execute(query)
        rows = cur.fetchall()
    finally:
        conn.close()

    boxtrace = PlotlyBoxTrace("User Ratings")
    scattertrace = PlotlyScatterTrace("User Ratings")
    for row in rows:
        boxtrace.values.append(row[1])
        scattertrace.x.append(row[2])
        scattertrace.y.append(row[1])

    box_layout = go.Layout(
        title="User Ratings for {} ({})".format(title, year))
    box_fig = go.Figure(data=[boxtrace.GetBox()], layout=box_layout)

    scatter_layout = go.Layout(
        title="User Ratings Over Time for {} ({})".format(title, year))
    scatter_fig = go.Figure(data=[scattertrace.GetScatter()],
                            layout=scatter_layout)

    box_plot = offline.plot(box_fig,
                            show_link=False,
                            output_type="div",
                            include_plotlyjs=False)
    scatter_plot = offline.plot(scatter_fig,
                                show_link=False,
                                output_type="div",
                                include_plotlyjs=False)

    # Callers receive None rather than an empty list when nothing matched.
    return box_plot, scatter_plot, (rows or None)
Beispiel #3
0
def GetMoviesByPerson(id):
    """Return the film credits recorded for one person.

    Args:
        id: Value compared against ``People.ID``.

    Returns:
        A list of (People.Name, Film.Title, Film.Release, Role.Title) rows,
        or ``None`` when the query returned no rows.
    """
    query = selectQueryBuilder(
        columns=[
            'People.Name', 'Film.Title AS Film', 'Film.Release', 'Role.Title'
        ],
        table='People',
        joins=[
            'JOIN CastByFilm ON CastByFilm.CastID = People.ID',
            'JOIN Role ON CastByFilm.RoleID = Role.ID',
            'JOIN Film ON Film.FilmID = CastByFilm.FilmID'
        ],
        filter=['People.ID', '=', id])

    # Close the connection whether or not the query succeeds.
    conn = sqlite.connect(DATABASE_NAME)
    try:
        cur = conn.cursor()
        cur.execute(query)
        data = cur.fetchall()
    finally:
        conn.close()

    return data if data else None
Beispiel #4
0
def GetReviewsByUser(id):
    """Return one user's ratings alongside each film's overall average.

    Args:
        id: Value compared against ``UserID`` in the Ratings table.

    Returns:
        ``UserReviews(rows)`` built from the fetched rows (Title, Release,
        Rating, AvgRating, Difference, NumRatings), ordered by the user's
        rating descending, or ``None`` when the query returned no rows.
    """
    query = selectQueryBuilder(
        columns=[
            'Title', 'Release', 'Ratings.Rating',
            'ROUND(AvgRating, 2) AS AvgRating',
            'ROUND(Ratings.Rating - AvgRating,2) AS Difference', 'NumRatings'
        ],
        table='Ratings',
        joins=[
            'JOIN Film ON Film.FilmID = Ratings.MovieID',
            # per-movie average rating and rating count over all users
            'JOIN (SELECT MovieID as AvgMovieID, AVG(Rating) AS AvgRating, COUNT(*) AS NumRatings FROM Ratings GROUP BY MovieID) ON AvgMovieID = Film.FilmID'
        ],
        filter=['UserID', '=', id],
        order_by='Ratings.Rating DESC')

    # Close the connection whether or not the query succeeds.
    conn = sqlite.connect(DATABASE_NAME)
    try:
        cur = conn.cursor()
        cur.execute(query)
        data = cur.fetchall()
    finally:
        conn.close()

    return UserReviews(data) if data else None
Beispiel #5
0
def Graph_Budget(sort="Budget", limit=20):
    """Plot budget and revenue bars for the films ranked highest by ``sort``.

    Args:
        sort: Column placed in the ORDER BY clause (descending) and echoed in
            the chart title. It is interpolated into the SQL text as-is, so
            it must come from trusted code.
        limit: Passed to the query builder as ``limit`` and echoed in the
            chart title.

    Returns:
        A ``(plot, raw_data)`` tuple. ``plot`` is whatever ``offline.plot``
        returns for ``output_type="div"``; ``raw_data`` is a list of
        ``[Title, Release, Budget, Revenue]`` lists in which Budget and
        Revenue have been formatted as ``$1,234`` strings.
    """
    query = selectQueryBuilder(
        columns=['Title', 'Release', 'Budget', 'Revenue'],
        table='Film',
        filter=['Budget', '>', 0],
        order_by=sort + ' DESC',
        limit=limit)

    # Read all rows first so the connection is always closed, even when the
    # query raises.
    conn = sqlite.connect(DATABASE_NAME)
    try:
        cur = conn.cursor()
        cur.execute(query)
        rows = cur.fetchall()
    finally:
        conn.close()

    trace1 = PlotlyBarTrace("Budget")
    trace2 = PlotlyBarTrace("Revenue")
    raw_data = []
    for title, release, budget, revenue in rows:
        # The traces keep the numeric values; only the table copy is
        # formatted as currency.
        trace1.values.append(budget)
        trace1.labels.append(title)
        trace2.values.append(revenue)
        trace2.labels.append(title)
        # NOTE(review): only Budget is filtered; a NULL Revenue would make
        # the format call below raise - confirm the column is always set.
        raw_data.append([
            title,
            release,
            '${:,.0f}'.format(budget),
            '${:,.0f}'.format(revenue),
        ])

    data = [trace1.GetBar(), trace2.GetBar()]

    layout = go.Layout(
        title='Top {} Movies with the Highest {}'.format(limit, sort))
    fig = go.Figure(data=data, layout=layout)
    return offline.plot(fig,
                        show_link=False,
                        output_type="div",
                        include_plotlyjs=False), raw_data
Beispiel #6
0
def Graph_BudgetPerStar():
    """Plot the films with the highest budget per average user-rating star.

    The query joins Film with a per-movie average of user ratings, filters
    on ``Budget > 100000``, orders by ``Budget / UserRating`` descending and
    takes 30 rows.

    Returns:
        A ``(plot, raw_data)`` tuple. ``plot`` is whatever ``offline.plot``
        returns for ``output_type="div"``; ``raw_data`` is a list of
        ``[Title, Release, Budget, AvgUserRating, DollarsPerStar]`` lists in
        which Budget and DollarsPerStar have been formatted as ``$1,234``
        strings.
    """
    subquery = selectQueryBuilder(
        columns=['MovieId AS RatingMovieID', 'AVG(Rating) AS UserRating'],
        table='Ratings',
        group_by='MovieID',
        filter=["COUNT(*)", ">", 30])

    query = selectQueryBuilder(
        columns=[
            'Title', 'Release', 'Budget',
            'ROUND(UserRating, 2) AS AvgUserRating',
            'ROUND(Budget/UserRating, 2) AS DollarsPerStar'
        ],
        table='Film',
        joins='JOIN (' + subquery + ') ON RatingMovieID = Film.FilmID',
        filter=['Budget', '>', 100000],
        order_by='DollarsPerStar DESC',
        limit=30)

    # Read all rows first so the connection is always closed, even when the
    # query raises.
    conn = sqlite.connect(DATABASE_NAME)
    try:
        cur = conn.cursor()
        cur.execute(query)
        rows = cur.fetchall()
    finally:
        conn.close()

    trace = PlotlyBarTrace("Dollars Per Star")
    raw_data = []
    for row in rows:
        budget_text = '${:,.0f}'.format(row[2])

        trace.values.append(row[4])
        # row[1][:4] keeps the first four characters of Release for the
        # hover text.
        trace.hovertext.append("{} ({})<br>{} for {} stars".format(
            row[0], row[1][:4], budget_text, row[3]))
        trace.labels.append(row[0])

        # The table copy shows currency strings instead of raw numbers.
        formatted = list(row)
        formatted[2] = budget_text
        formatted[4] = '${:,.0f}'.format(row[4])
        raw_data.append(formatted)

    data = [trace.GetBar()]
    layout = go.Layout(title="Dollars Spent Per Star (User Reviews)")
    fig = go.Figure(data=data, layout=layout)
    return offline.plot(fig,
                        show_link=False,
                        output_type="div",
                        include_plotlyjs=False), raw_data
Beispiel #7
0
def Graph_AAWinners(sort="wins", count=10, show_nominations=True):
    """Plot a stacked bar chart of Academy Award wins (and nominations).

    Args:
        sort: ``"noms"`` orders by nominations first, then wins; any other
            value orders by wins first, then nominations that did not win.
            The chart title follows the same rule.
        count: Passed to the query builder as ``limit`` and echoed in the
            chart title.
        show_nominations: When true, the "Nominations" trace (nominations
            that did not result in a win) is stacked on top of the "Wins"
            trace.

    Returns:
        A ``(plot, raw_data)`` tuple. ``plot`` is whatever ``offline.plot``
        returns for ``output_type="div"``; ``raw_data`` is the list of
        (Title, Release, AA_Wins, NomNotWon, BestPicture) rows.
    """
    # Decide once so the ORDER BY clause and the title can never disagree.
    by_nominations = sort == "noms"

    if by_nominations:
        order = ['AA_Nominations DESC', 'AA_Wins DESC']
    else:
        order = ['AA_Wins DESC', 'NomNotWon DESC']

    query = selectQueryBuilder(
        columns=[
            'Title', 'Release', 'AA_Wins',
            '(AA_Nominations - AA_Wins) AS NomNotWon', 'BestPicture'
        ],
        table='Film',
        order_by=order,
        limit=count)

    # Read all rows first so the connection is always closed, even when the
    # query raises.
    conn = sqlite.connect(DATABASE_NAME)
    try:
        cur = conn.cursor()
        cur.execute(query)
        raw_data = cur.fetchall()
    finally:
        conn.close()

    trace1 = PlotlyBarTrace("Wins")
    trace2 = PlotlyBarTrace("Nominations")
    for row in raw_data:
        # Both traces share the same "Title (Release)" label.
        label = "{} ({})".format(row[0], row[1])

        trace1.labels.append(label)
        trace1.values.append(row[2])

        trace2.labels.append(label)
        trace2.values.append(row[3])

    data = [trace1.GetBar()]
    if show_nominations:
        data.append(trace2.GetBar())

    if by_nominations:
        title = "Top {} films with the most Academy Award Nominations".format(
            count)
    else:
        title = "Top {} films with the most Academy Award Wins".format(count)

    layout = go.Layout(barmode='stack', title=title)

    fig = go.Figure(data=data, layout=layout)

    return offline.plot(fig,
                        show_link=False,
                        output_type="div",
                        include_plotlyjs=False), raw_data
Beispiel #8
0
def GetCastAndCrew(title, year):
    """Return the cast and crew credited on one film.

    Args:
        title: Film title matched with ``Title =`` in the Film table.
        year: Release year; matched as a prefix of ``Release`` via
            ``LIKE '<year>%'``. Converted with ``str()``, so a string or an
            integer is accepted.

    Returns:
        A list of (People.ID, People.Name, Role.Title, CreditCount) rows, or
        ``None`` when the query returned no rows. ``CreditCount`` comes from
        a LEFT JOIN, so it is NULL for people without a matching row in the
        credit-count sub query.
    """
    # credit totals per person, filtered on COUNT(*) > 1
    sub_query1 = selectQueryBuilder(
        columns=['CastID As Credit', 'COUNT(*) AS CreditCount'],
        table='CastByFilm',
        group_by='CastID',
        filter=['COUNT(*)', ">", 1])

    # resolves the (title, year) pair to a FilmID
    sub_query2 = selectQueryBuilder(
        columns='FilmID',
        table='Film',
        filter=[['Title', "=", title], "AND",
                ['Release', 'LIKE', str(year) + '%']])

    query = selectQueryBuilder(
        columns=['People.ID', 'People.Name', 'Role.Title', 'CreditCount'],
        table='CastByFilm',
        joins=[
            'JOIN People ON CastID = People.ID',
            'JOIN Role ON RoleID = Role.ID',
            'LEFT JOIN (' + sub_query1 + ') ON Credit = People.ID '
        ],
        filter=['FilmID', '=', "(" + sub_query2 + ")"],
    )

    # Close the connection whether or not the query succeeds.
    conn = sqlite.connect(DATABASE_NAME)
    try:
        cur = conn.cursor()
        cur.execute(query)
        data = cur.fetchall()
    finally:
        conn.close()

    return data if data else None