- Notifications
You must be signed in to change notification settings - Fork 46.7k
/
Copy pathget_imdb_top_250_movies_csv.py
30 lines (22 loc) · 937 Bytes
/
get_imdb_top_250_movies_csv.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
from __future__ importannotations
importcsv
importrequests
frombs4importBeautifulSoup
def get_imdb_top_250_movies(url: str = "") -> dict[str, float]:
    """Scrape an IMDb chart page and map each movie title to its rating.

    The page is fetched over HTTP and parsed with BeautifulSoup. Titles are
    read from ``<td class="titleColumn">`` cells and ratings from
    ``<td class="ratingColumn imdbRating">`` cells; the two result lists are
    paired positionally.

    Args:
        url: Address of the chart page. An empty (falsy) value selects the
            IMDb Top 250 chart URL hard-coded below.

    Returns:
        A dict mapping the anchor text of each title cell to the float value
        of the ``<strong>`` text in the matching rating cell. The dict is
        empty when the page contains no matching cells.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
    """
    url = url or "https://www.imdb.com/chart/top/?ref_=nv_mv_250"
    response = requests.get(url, timeout=10)
    # Fail loudly on an error response rather than parsing the error page,
    # which would most likely contain no chart cells and yield an empty dict.
    response.raise_for_status()
    soup = BeautifulSoup(response.text, "html.parser")
    # class_ is the documented keyword for matching on CSS class; it is
    # equivalent to the legacy form of passing a bare string as ``attrs``.
    titles = soup.find_all("td", class_="titleColumn")
    ratings = soup.find_all("td", class_="ratingColumn imdbRating")
    # zip stops at the shorter list, so an unpaired trailing cell is dropped.
    return {
        title.a.text: float(rating.strong.text)
        for title, rating in zip(titles, ratings)
    }
def write_movies(filename: str = "IMDb_Top_250_Movies.csv") -> None:
    """Write the scraped title/rating pairs to a CSV file.

    Calls ``get_imdb_top_250_movies()`` with its default URL, then writes a
    header row (``Movie title``, ``IMDb rating``) followed by one row per
    entry of the returned dict.

    Args:
        filename: Path of the CSV file to create or overwrite.
    """
    movies = get_imdb_top_250_movies()
    # newline="" leaves line-ending handling to the csv module. The explicit
    # encoding keeps titles with non-ASCII characters writable regardless of
    # the platform's default locale encoding.
    with open(filename, "w", newline="", encoding="utf-8") as out_file:
        writer = csv.writer(out_file)
        writer.writerow(["Movie title", "IMDb rating"])
        # Each (title, rating) pair from the dict becomes one CSV row.
        writer.writerows(movies.items())
if __name__ == "__main__":
    # Run only when executed as a script (not on import): scrape the chart
    # and write the CSV using write_movies' default filename.
    write_movies()