def parse(file): films = {} with open(file) as json_file: data = json.load(json_file) for film in data['films']: movie_title = film['Name'] movie_wiki_link = film['Link'] movie = Movie(movie_wiki_link, movie_title) films[movie_title] = movie Printer.print_minus(''.join( ['PARSING: ', str(len(films)), ". ", movie_title])) if film['IMDB'] is not None: imdb_link = film['IMDB']['Link'] movie.imdb = IMDB(imdb_link, movie_title) if film['Rotten Tomatoes'] is not None: rt_link = film['Rotten Tomatoes']['Link'] movie.rotten_tomatoes = RottenTomatoes(rt_link, movie_title) if film['Metacritic'] is not None: meta_link = film['Metacritic']['Link'] movie.metacritic = Metacritic(meta_link, movie_title) if film['Box Office Mojo'] is not None: bom_link = film['Box Office Mojo']['Link'] movie.box_office_mojo = BoxOfficeMojo(bom_link) return films
def parse_tsv(file): films = {} with open(file) as tsv_file: data = csv.reader(tsv_file, delimiter="\t", quotechar='"') next(data) for film in data: movie_title = film[1] movie_wiki_link = film[2] movie = Movie(movie_wiki_link, movie_title) films[movie_title] = movie Printer.print_minus(''.join( ['PARSING: ', str(len(films)), ". ", movie_title])) imdb_link = film[3] movie.imdb = IMDB(imdb_link, movie_title) rt_link = film[5] movie.rotten_tomatoes = RottenTomatoes(rt_link, movie_title) meta_link = film[6] movie.metacritic = Metacritic(meta_link, movie_title) bom_link = film[7] movie.box_office_mojo = BoxOfficeMojo(bom_link) return films