-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathProcessingData.py
47 lines (31 loc) · 1.54 KB
/
ProcessingData.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
import csv
def _load_rows_by_title(path):
    """Read a scraped CSV once and group its data rows by their first column.

    The first row is treated as a header and skipped; blank rows are ignored.
    Rows sharing the same first-column value are kept in file order, so a
    caller iterating over a group sees them in the same order a sequential
    scan of the file would.

    Args:
        path: Location of the CSV file to read.

    Returns:
        A dict mapping the first column of each row to the list of complete
        rows that carry that value.
    """
    rows_by_title = {}
    # newline='' lets the csv module do its own newline handling.
    with open(path, newline='') as source:
        reader = csv.reader(source)
        next(reader, None)  # skip the header; tolerate a completely empty file
        for row in reader:
            if row:
                rows_by_title.setdefault(row[0], []).append(row)
    return rows_by_title


def main(scraped_dir="Scraped Data", output_dir="Input"):
    """Merge the scraped movie lists into ``movies.csv`` and ``ratings.csv``.

    Every data row of ``imdb_movie_list.csv`` gets a sequential MovieID
    starting at 1. For each movie one row is written to ``movies.csv`` and one
    "IMDb" row to ``ratings.csv``, followed by every Rotten Tomatoes row and
    then every Metacritic row whose first column equals the IMDb title exactly.

    Args:
        scraped_dir: Directory holding ``imdb_movie_list.csv``,
            ``rotten_tomatoes_movie_list.csv`` and
            ``metacritic_movie_list.csv``.
        output_dir: Existing directory that receives ``movies.csv`` and
            ``ratings.csv``.

    Raises:
        OSError: If an input file cannot be read or an output file cannot be
            created.
        IndexError: If a non-blank input row has fewer columns than are read
            from it.
    """
    # Read both auxiliary lists once up front instead of re-opening and
    # re-scanning them for every IMDb row. Doing this before the outputs are
    # opened also means a missing input does not truncate existing outputs.
    rotten_tomatoes_rows = _load_rows_by_title(
        scraped_dir + "/rotten_tomatoes_movie_list.csv")
    metacritic_rows = _load_rows_by_title(
        scraped_dir + "/metacritic_movie_list.csv")

    # NOTE(review): files are opened with the platform default encoding, as
    # before; confirm the encoding the scraper actually wrote.
    with open(output_dir + "/movies.csv", 'w', newline='') as movies_csv, \
            open(output_dir + "/ratings.csv", 'w', newline='') as ratings_csv, \
            open(scraped_dir + "/imdb_movie_list.csv", newline='') as imdb_file:
        movies_writer = csv.writer(movies_csv)
        movies_writer.writerow(["MovieID", "Title", "Year", "Genre"])
        ratings_writer = csv.writer(ratings_csv)
        ratings_writer.writerow(
            ["MovieID", "SourceSite", "Rating", "NumberOfRatings"])

        imdb_reader = csv.reader(imdb_file)
        next(imdb_reader, None)  # skip the header row
        data_rows = (row for row in imdb_reader if row)  # ignore blank lines

        for movie_id, movie in enumerate(data_rows, start=1):
            print(movie_id)  # progress output, one line per movie

            title = movie[0]
            genres = movie[3] or "(no_genres_listed)"
            # Non-ASCII characters are dropped from the stored title, while
            # matching against the other sites uses the unmodified title.
            movies_writer.writerow([
                movie_id,
                title.encode("ascii", "ignore").decode(),
                movie[1],
                genres.replace(' ', '|'),
            ])
            ratings_writer.writerow([movie_id, "IMDb", movie[2], movie[4]])

            for match in rotten_tomatoes_rows.get(title, ()):
                ratings_writer.writerow(
                    [movie_id, "RottenTomatoes", match[1], match[2]])
            for match in metacritic_rows.get(title, ()):
                ratings_writer.writerow(
                    [movie_id, "Metacritic", match[1], match[2]])


if __name__ == '__main__':
    main()