Пример #1
0
def test_movie_rating():
    """A rating of 6.3 is stored, and assigning -1 or 11 afterwards leaves it unchanged."""
    film = Movie("Star Wars The Third Gathers: Backstroke of the West", 2000)
    film.rating = 6.3
    assert film.rating == 6.3
    # After each of these assignments the previously stored rating must survive.
    for rejected in (-1, 11):
        film.rating = rejected
        assert film.rating == 6.3
Пример #2
0
 def read_csv_file(self):
     """Populate the movie, director, actor and genre datasets from the CSV file.

     The file named by ``self.__file_name`` is read with ``csv.DictReader``.
     A row whose ``Movie(title, int(year))`` construction raises ``ValueError``
     is reported with a printed message and skipped. For every other row the
     director, description, actors (with colleague links between the actors
     of the same row), genres, runtime, votes and rating are attached to the
     movie, and the movie is appended to the movie dataset unless an equal
     movie is already present.
     """
     # (attribute on Movie, CSV column, converter); handled in this order.
     numeric_columns = (
         ("runtime_minutes", 'Runtime (Minutes)', int),
         ("votes", 'Votes', int),
         ("rating", 'Rating', float),
     )

     with open(self.__file_name, mode='r', encoding='utf-8-sig') as csvfile:
         for row in csv.DictReader(csvfile):
             try:
                 movie = Movie(row['Title'], int(row['Year']))
             except ValueError:
                 print("Invalid release year")
                 continue

             director = Director(row['Director'].strip())
             cast_names = [name.strip() for name in row['Actors'].split(",")]
             genre_names = row['Genre'].split(",")

             movie.director = director
             if director not in self.__dataset_of_directors:
                 self.__dataset_of_directors.append(director)
             movie.description = row['Description'].strip()

             for cast_name in cast_names:
                 actor = Actor(cast_name)
                 # Reuse the stored actor when an equal one exists so colleague
                 # links accumulate on a single object.
                 # NOTE(review): lookups use self.dataset_of_actors while inserts
                 # use self.__dataset_of_actors - presumably the same list; confirm.
                 if actor in self.dataset_of_actors:
                     actor = self.dataset_of_actors[self.dataset_of_actors.index(actor)]
                 else:
                     self.__dataset_of_actors.append(actor)
                 for other_name in cast_names:
                     already_linked = actor.check_if_this_actor_worked_with(Actor(other_name))
                     if not already_linked and cast_name != other_name:
                         actor.add_actor_colleague(Actor(other_name))
                 movie.add_actor(actor)

             for genre_name in genre_names:
                 genre = Genre(genre_name.strip())
                 movie.add_genre(genre)
                 if genre not in self.__dataset_of_genres:
                     self.__dataset_of_genres.append(genre)

             # A ValueError while converting or assigning falls back to None.
             for attribute, column, convert in numeric_columns:
                 try:
                     setattr(movie, attribute, convert(row[column]))
                 except ValueError:
                     setattr(movie, attribute, None)

             # NOTE(review): duplicate detection relies on Movie equality between
             # separately built objects - confirm Movie defines it that way.
             if movie not in self.__dataset_of_movies:
                 self.__dataset_of_movies.append(movie)
Пример #3
0
    def read_csv_file(self):
        """Read the CSV file and fill the movie, director, actor and genre lists.

        Every row produces a ``Movie`` that is appended to ``self.__movies``
        (no duplicate check). The row's director, each actor and each genre
        are appended to their lists only when an equal entry is not already
        there.
        """
        def remember(pool, item):
            # Append `item` to `pool` unless an equal entry is already present.
            if item not in pool:
                pool.append(item)

        with open(self.__file_name, mode='r', encoding='utf-8-sig') as csvfile:
            for record in csv.DictReader(csvfile):
                movie = Movie(record['Title'], int(record['Year']))
                # NOTE(review): votes, metascore and rating are stored as the raw
                # CSV strings - confirm the Movie setters expect text.
                movie.votes = record['Votes']
                movie.metascore = record['Metascore']
                movie.rating = record['Rating']
                movie.description = record['Description']
                self.__movies.append(movie)

                remember(self.__directors, Director(record['Director']))

                # Actor names are separated by "," with an optional following space.
                for actor_name in re.split(", |,", record["Actors"]):
                    remember(self.__actors, Actor(actor_name))

                for genre_name in record['Genre'].split(","):
                    remember(self.__genres, Genre(genre_name))
Пример #4
0
def test_movies():
    """Read 'test.csv' and compare the first movie and the leading dataset entries with expected values."""
    reader = MovieFileCSVReader('test.csv')
    reader.read_csv_file()

    # Hand-built copy of the movie expected at position 0 of the loaded data.
    expected = Movie("Guardians of the Galaxy", 2014)
    expected.description = "A group of intergalactic criminals are forced to work together to stop a fanatical warrior from taking control of the universe."
    expected.runtime_minutes = 121
    expected.votes = 757074
    expected.rating = 8.1
    for genre_name in ("Action", "Adventure", "Sci-Fi"):
        expected.add_genre(Genre(genre_name))
    cast = ("Chris Pratt", "Vin Diesel", "Bradley Cooper", "Zoe Saldana")
    for actor_name in cast:
        expected.add_actor(Actor(actor_name))
    expected.director = Director("James Gunn")

    loaded = reader.dataset_of_movies[0]
    assert loaded == expected
    assert loaded.runtime_minutes == expected.runtime_minutes
    assert loaded.description == expected.description
    assert loaded.votes == expected.votes
    assert loaded.rating == expected.rating
    assert loaded.actors == expected.actors
    assert loaded.genres == expected.genres
    assert loaded.director == expected.director

    # The first four stored actors follow the cast order of the first movie.
    for position, actor_name in enumerate(cast):
        assert reader.dataset_of_actors[position] == Actor(actor_name)

    colleagues = reader.dataset_of_actors[0].actor_colleague_list
    assert repr(colleagues) == "[<Actor Vin Diesel>, <Actor Bradley Cooper>, <Actor Zoe Saldana>, <Actor Jennifer Lawrence>, <Actor Michael Sheen>, <Actor Laurence Fishburne>, <Actor Denzel Washington>, <Actor Ethan Hawke>, <Actor Vincent D'Onofrio>, <Actor Bryce Dallas Howard>, <Actor Ty Simpkins>, <Actor Judy Greer>, <Actor Will Ferrell>, <Actor Elizabeth Banks>, <Actor Will Arnett>, <Actor Jessica Chastain>, <Actor Joel Edgerton>, <Actor Mark Strong>, <Actor Channing Tatum>, <Actor Rosario Dawson>, <Actor Jenna Dewan Tatum>]"

    assert reader.dataset_of_directors[0] == Director("James Gunn")
    for position, genre_name in enumerate(("Action", "Adventure", "Sci-Fi")):
        assert reader.dataset_of_genres[position] == Genre(genre_name)
Пример #5
0
    def read_csv_file(self):
        """Load every row of the CSV file into the reader's collections.

        Numeric columns that cannot be converted fall back to a default:
        ``None`` for rank, year, runtime, revenue and metascore, and ``0``
        for rating and votes. The rating is parsed with ``float`` because
        ``int()`` raises ``ValueError`` on decimal text such as "8.1", which
        previously turned every such rating into 0.

        For each row a ``Movie`` is built and populated, then passed with the
        comma-split actor and genre names to ``self.load_actors`` and
        ``self.load_genres``. The director is added to ``self.__directors``
        and the movie appended to ``self.__movies`` when not already present.
        """
        def to_number(raw, convert, fallback=None):
            # Convert one CSV cell; use `fallback` when the text is not numeric.
            try:
                return convert(raw)
            except ValueError:
                return fallback

        with open(self.__file_name, mode='r', encoding='utf-8-sig') as csvfile:
            movie_file_reader = csv.DictReader(csvfile)

            for row in movie_file_reader:
                rank = to_number(row['Rank'], int)
                title = row['Title']
                genres = row['Genre'].split(',')
                description = row['Description']
                actors = row['Actors'].split(',')
                release_year = to_number(row['Year'], int)
                run_time = to_number(row['Runtime (Minutes)'], int)
                # float, not int: ratings are decimal text.
                rating = to_number(row['Rating'], float, 0)
                votes = to_number(row['Votes'], int, 0)
                director = Director(row['Director'])
                revenue = to_number(row['Revenue (Millions)'], float)
                metascore = to_number(row['Metascore'], int)

                mov = Movie(title, release_year)
                mov.director = director
                mov.description = description
                mov.metascore = metascore
                mov.rank = rank
                mov.runtime_minutes = run_time
                mov.rating = rating
                mov.votes = votes
                mov.revenue = revenue

                self.load_actors(mov, actors)

                if director not in self.__directors:
                    self.__directors.add(director)

                self.load_genres(mov, genres)

                if mov not in self.__movies:
                    self.__movies.append(mov)
Пример #6
0
    def _read_row(self, row: _ROW) -> Movie:
        """
        Helper method to construct a Movie from a row.

        Genres, the director and actors are passed through ``self._get_genre``,
        ``self._get_director`` and ``self._get_actor`` before being attached.
        'Revenue (Millions)' and 'Metascore' may hold 'N/A'; in that case the
        matching attribute is left unset. A parsed value of zero is stored
        like any other number.

        Raises:
            ValueError: unable to parse row: {row} (a missing column or a
                non-numeric value; the original exception is chained as the
                cause)
         """
        try:
            title = row['Title']
            genres = [
                self._get_genre(Genre(name))
                for name in row['Genre'].split(',')
            ]
            description = row['Description']
            director = self._get_director(Director(row['Director']))
            actors = [
                self._get_actor(Actor(name))
                for name in row['Actors'].split(',')
            ]
            release_year = int(row['Year'])
            runtime_minutes = int(row['Runtime (Minutes)'])
            rating = float(row['Rating'])
            votes = int(row['Votes'])
            revenue_millions = float(
                row['Revenue (Millions)']
            ) if row['Revenue (Millions)'] != 'N/A' else None
            metascore = int(
                row['Metascore']) if row['Metascore'] != 'N/A' else None
        except (KeyError, ValueError) as err:
            # Keep the single ValueError contract but preserve the root cause.
            raise ValueError(f'unable to parse row: {row}') from err

        movie = Movie(title, release_year)
        movie.genres = genres
        movie.description = description
        movie.director = director
        movie.actors = actors
        movie.runtime_minutes = runtime_minutes
        movie.rating = rating
        movie.votes = votes

        # Compare against None: a truthiness test would drop a legitimate 0.
        if revenue_millions is not None:
            movie.revenue_millions = revenue_millions

        if metascore is not None:
            movie.metascore = metascore

        return movie
    def read_csv_file(self):
        """Read the CSV file and populate the four datasets.

        Directors, genres and actors are shared: when an equal object is
        already stored in the matching dataset, that stored object is attached
        to the movie; otherwise the new object is appended and used. Metascore
        and revenue are set only when the cell is not 'N/A'. A movie is
        appended to ``self.dataset_of_movies`` unless an equal movie is
        already present.
        """
        def shared_instance(pool, candidate):
            # Return the entry of `pool` equal to `candidate`; when there is
            # none, append `candidate` and return it.
            try:
                return pool[pool.index(candidate)]
            except ValueError:
                pool.append(candidate)
                return candidate

        with open(self.__file_name, mode='r', encoding='utf-8-sig') as csvfile:
            for row in csv.DictReader(csvfile):
                film = Movie(row['Title'], int(row['Year']))
                film.description = row['Description']

                film.director = shared_instance(
                    self.dataset_of_directors, Director(row['Director']))

                film.votes = int(row['Votes'])
                film.rating = float(row['Rating'])
                film.runtime_minutes = int(row['Runtime (Minutes)'])

                metascore_text = row['Metascore']
                if metascore_text != 'N/A':
                    film.metascore = float(metascore_text)
                revenue_text = row['Revenue (Millions)']
                if revenue_text != 'N/A':
                    film.revenue = float(revenue_text)

                for genre_name in row['Genre'].split(","):
                    film.add_genre(
                        shared_instance(self.dataset_of_genres, Genre(genre_name)))

                for actor_name in row['Actors'].split(","):
                    film.add_actor(
                        shared_instance(self.dataset_of_actors, Actor(actor_name)))

                if film not in self.dataset_of_movies:
                    self.dataset_of_movies.append(film)
    def read_csv_file(self):
        """Read the CSV file into the movie, actor, director and genre datasets.

        A movie is appended to ``self.__dataset_of_movies`` when no equal movie
        is stored yet. Actors, the director and genres are added to their
        datasets when absent, and every genre is also appended to
        ``movie.genres``. Rank, rating and metascore are range-checked as
        numbers, but the value assigned is the raw CSV text.
        """
        with open(self.__file_name, mode='r', encoding='utf-8-sig') as csvfile:
            for row in csv.DictReader(csvfile):
                title, release_year = row['Title'], int(row['Year'])
                cast_field = row['Actors']
                director_name = row['Director']
                genre_field = row['Genre']

                movie = Movie(title, release_year)
                if movie not in self.__dataset_of_movies:
                    self.__dataset_of_movies.append(movie)

                for actor_name in cast_field.split(','):
                    performer = Actor(actor_name)
                    if performer not in self.__dataset_of_actors:
                        self.__dataset_of_actors.add(performer)

                film_director = Director(director_name)
                if film_director not in self.__dataset_of_directors:
                    self.__dataset_of_directors.add(film_director)

                for genre_name in genre_field.split(','):
                    # The movie and the dataset each receive their own Genre object.
                    movie.genres.append(Genre(genre_name))
                    dataset_genre = Genre(genre_name)
                    if dataset_genre not in self.__dataset_of_genres:
                        self.__dataset_of_genres.add(dataset_genre)

                # NOTE(review): the fields below are validated numerically but
                # stored as strings - confirm that is what Movie expects.
                rank_text = row['Rank']
                if int(rank_text) > 0:
                    movie.rank = rank_text

                rating_text = row['Rating']
                if 0 <= float(rating_text) <= 10:
                    movie.rating = rating_text

                movie.votes = int(row['Votes'])
                movie.revenue_millions = row['Revenue (Millions)']

                metascore_text = row['Metascore']
                try:
                    if 0 <= float(metascore_text) <= 100:
                        movie.metascore = metascore_text
                except ValueError:
                    # Non-numeric text is stored unchanged.
                    movie.metascore = metascore_text
Пример #9
0
def populated_movies(genres, directors, actors):
    """Build ten movies, 'Movie0' to 'Movie9', released in 2000 to 2009.

    Movie ``i`` uses ``genres[i]``, ``directors[i]`` and ``actors[i]``, has
    runtime ``i + 1``, rating ``float(i)`` and ``i`` votes. Even-numbered
    movies also get ``revenue_millions``; every fourth movie (0, 4, 8) gets a
    ``metascore``.

    Returns:
        The list of the ten movies in index order.
    """
    def build(number):
        # Create and populate the movie for one index.
        film = Movie(f'Movie{number}', 2000 + number)
        film.genres = [genres[number]]
        film.description = f'Description{number}'
        film.director = directors[number]
        film.actors = [actors[number]]
        film.runtime_minutes = number + 1
        film.rating = float(number)
        film.votes = number

        if number % 2 == 0:
            film.revenue_millions = float(number + 1)

        if number % 4 == 0:
            film.metascore = number * 10

        return film

    return [build(number) for number in range(10)]
Пример #10
0
 def read_csv_file(self):
     """Read the CSV file and append one populated Movie per data row.

     The first row is treated as a header and skipped. Columns are read by
     position: 0 rank (stored as ``id`` minus one), 1 title, 2 genres,
     3 description, 4 director, 5 actors, 6 release year, 7 runtime,
     8 rating, 11 metascore. Each movie is appended to
     ``self.movie_full_details``.

     The file is opened in a ``with`` block so the handle is closed even when
     a row fails to parse; it was previously never closed.
     """
     with open(self.__file_name, mode='r', encoding='utf-8-sig') as csv_file:
         rows = csv.reader(csv_file)
         next(rows, None)  # skip the header row; harmless on an empty file
         for row in rows:
             temp_movie = Movie("", "")
             temp_movie.id = int(row[0]) - 1
             temp_movie.title = row[1]
             temp_movie.genres = [Genre(genre) for genre in row[2].split(",")]
             temp_movie.description = row[3]
             temp_movie.director = Director(row[4])
             temp_movie.actors = [Actor(actor) for actor in row[5].split(",")]
             temp_movie.releaseDate = int(row[6])
             temp_movie.runtime_minutes = int(row[7])
             temp_movie.rating = float(row[8])
             # NOTE(review): metascore is stored as raw text, unlike the
             # numeric fields above - confirm this is intended.
             temp_movie.metascore = row[11]
             self.movie_full_details.append(temp_movie)
Пример #11
0
def load_movies_and_actors_genres_director(data_path: str,
                                           repo: MemoryRepository):
    """Load 'Data1000Movies.csv' from ``data_path`` into ``repo``.

    Rows come from ``read_csv_file`` and are read by position: 0 rank (used
    as the movie key), 1 title, 2 genres, 3 description, 4 director,
    5 actors, 6 year, 7 runtime, 8 rating, 9 votes, 10 revenue, 11 metascore.
    Columns 8 to 11 are skipped when they hold "N/A".

    Movies are added to the repository first. Genres, actors and directors
    are then created once per distinct name, linked to their movies in both
    directions, and added to the repository.

    Names taken from the comma-separated genre and actor cells are stripped of
    surrounding whitespace, so "A, B" and "B, A" refer to the same "B" rather
    than to "B" and " B".
    """
    movies_by_genre = dict()
    movies_by_actor = dict()
    movies_by_director = dict()

    for data_row in read_csv_file(os.path.join(data_path,
                                               'Data1000Movies.csv')):
        movie_key = int(data_row[0])

        # Group movie keys under each normalized name.
        for genre_name in data_row[2].split(","):
            movies_by_genre.setdefault(genre_name.strip(), []).append(movie_key)

        for actor_name in data_row[5].split(","):
            movies_by_actor.setdefault(actor_name.strip(), []).append(movie_key)

        movies_by_director.setdefault(data_row[4].strip(), []).append(movie_key)

        movie = Movie(data_row[1], int(data_row[6]))
        movie.rank = movie_key
        movie.description = data_row[3]
        movie.runtime_minutes = int(data_row[7])
        if data_row[8] != "N/A":
            movie.rating = float(data_row[8])
        if data_row[9] != "N/A":
            movie.votes = int(data_row[9])
        if data_row[10] != "N/A":
            movie.revenue = float(data_row[10])
        if data_row[11] != "N/A":
            movie.metascore = float(data_row[11])

        repo.add_movie(movie)

    # Movies are fetched back from the repository by the rank stored above.
    for genre_name, movie_ids in movies_by_genre.items():
        genre = Genre(genre_name)
        for movie_id in movie_ids:
            movie = repo.get_movie(movie_id)
            genre.add_movie(movie)
            movie.add_genre(genre)
        repo.add_genre(genre)

    for actor_name, movie_ids in movies_by_actor.items():
        actor = Actor(actor_name)
        for movie_id in movie_ids:
            movie = repo.get_movie(movie_id)
            actor.add_movie(movie)
            movie.add_actor(actor)
        repo.add_actor(actor)

    for director_name, movie_ids in movies_by_director.items():
        director = Director(director_name)
        for movie_id in movie_ids:
            movie = repo.get_movie(movie_id)
            director.add_movie(movie)
            movie.director = director
        repo.add_director(director)
    def read_csv_file(self):
        """Read the CSV file and fill the movie, actor, director and genre datasets.

        Every row yields a ``Movie`` that is appended to
        ``self.dataset_of_movies`` (no duplicate check). Runtime, rating, votes,
        revenue and metascore are converted and set only when the cell is not
        "N/A". Actors, the director and genres are appended to their datasets
        only when an equal entry is not already present.
        """
        with open(self.__file_name, mode='r', encoding='utf-8-sig') as csvfile:
            for row in csv.DictReader(csvfile):
                # Pull the raw cells out of the row first.
                title = row['Title']
                genres = [Genre(name) for name in row['Genre'].split(",")]
                year = int(row['Year'])
                description = row['Description']
                director = Director(row['Director'])
                actors = [Actor(name) for name in row['Actors'].split(",")]
                # (Movie attribute, raw text, converter) for the optional numbers.
                optional_numbers = (
                    ("runtime_minutes", row['Runtime (Minutes)'], int),
                    ("rating", row['Rating'], float),
                    ("votes", row['Votes'], int),
                    ("revenue", row['Revenue (Millions)'], float),
                    ("metascore", row['Metascore'], int),
                )

                # Build the movie.
                movieObj = Movie(title, year)
                for genre in genres:
                    movieObj.add_genre(genre)
                movieObj.description = description
                movieObj.director = director
                for actor in actors:
                    movieObj.add_actor(actor)
                for attribute, raw_text, convert in optional_numbers:
                    if raw_text != "N/A":
                        setattr(movieObj, attribute, convert(raw_text))

                # Record the movie and any entities not seen before.
                self.dataset_of_movies.append(movieObj)
                for actor in actors:
                    if actor not in self.dataset_of_actors:
                        self.dataset_of_actors.append(actor)
                if director not in self.dataset_of_directors:
                    self.dataset_of_directors.append(director)
                for genre in genres:
                    if genre not in self.dataset_of_genres:
                        self.dataset_of_genres.append(genre)
Пример #13
0
    def read_csv_file(self):
        """Read the CSV file and populate the movie, actor, director and genre datasets.

        Every row's ``Movie`` is appended to ``self.__dataset_of_movies`` as
        soon as it is created and then filled in. Actor and genre names are
        stripped of surrounding whitespace. Actors, directors and genres are
        added to their datasets with ``add``.
        """
        # (Movie attribute, CSV column) pairs that are copied across unconverted.
        raw_columns = (
            ("rank", "Rank"),
            ("rating", "Rating"),
            ("votes", "Votes"),
            ("revenue", "Revenue (Millions)"),
            ("metascore", "Metascore"),
        )

        with open(self.__file_name, mode='r', encoding='utf-8-sig') as csvfile:
            for row in csv.DictReader(csvfile):
                movie = Movie(row['Title'], int(row['Year']))
                self.__dataset_of_movies.append(movie)

                movie.description = row["Description"]
                movie.runtime_minutes = int(row["Runtime (Minutes)"])

                # The movie and the dataset each get their own object per name.
                for raw_name in row['Actors'].split(","):
                    actor_name = raw_name.strip()
                    movie.add_actor(Actor(actor_name))
                    self.__dataset_of_actors.add(Actor(actor_name))

                director_name = row['Director']
                movie.director = Director(director_name)
                self.__dataset_of_directors.add(Director(director_name))

                for raw_name in row['Genre'].split(","):
                    genre_name = raw_name.strip()
                    movie.add_genre(Genre(genre_name))
                    self.__dataset_of_genres.add(Genre(genre_name))

                # NOTE(review): these values are stored as raw CSV strings -
                # confirm the Movie setters accept text.
                for attribute, column in raw_columns:
                    setattr(movie, attribute, row[column])