forked from pymavs-uta/web-scrapers
-
Notifications
You must be signed in to change notification settings - Fork 0
/
rotten_scrape.py
31 lines (25 loc) · 968 Bytes
/
rotten_scrape.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
import requests, os, bs4
# Scrape the Rotten Tomatoes "best horror movies by year" guide and save each
# movie's poster image into the local RT/ directory, named after the movie title.
url = 'https://editorial.rottentomatoes.com/guide/best-horror-movies-by-year-since-1920/'
OUTPUT_DIR = 'RT'
# Seconds to wait on each HTTP request; without a timeout requests can block forever.
REQUEST_TIMEOUT = 30

# Download the page. raise_for_status() aborts the script on an HTTP error status.
response = requests.get(url, timeout=REQUEST_TIMEOUT)
response.raise_for_status()
soup = bs4.BeautifulSoup(response.text, 'html.parser')

# Collect one element per movie entry on the page.
movie_list = soup.select('.countdown-item')
if not movie_list:
    print('Could not find movies.')
else:
    # Create the output directory up front so open() below cannot fail on a
    # missing folder; exist_ok keeps re-runs from raising.
    os.makedirs(OUTPUT_DIR, exist_ok=True)

for movie in movie_list:
    title_list = movie.select('.article_movie_title a')
    image_list = movie.select('.article_movie_poster img')
    # Skip entries that lack a title link or poster tag instead of crashing
    # with IndexError and losing the rest of the list.
    if not title_list or not image_list:
        print('Skipping an entry without a title or poster.')
        continue

    title = title_list[0].text
    image_url = image_list[0].get('src')
    if not image_url:
        print('Skipping {}: poster has no src attribute.'.format(title))
        continue

    # Download the image.
    image = requests.get(image_url, timeout=REQUEST_TIMEOUT)
    image.raise_for_status()

    # Drop ':' (as before) and path separators from the title: a '/' or '\'
    # would otherwise be treated as a directory boundary when the file is opened.
    for forbidden in ':/\\':
        title = title.replace(forbidden, '')

    # Save the image. The '.png' extension is applied regardless of the
    # actual image format served - NOTE(review): confirm this is intended.
    poster_name = title + '.png'
    # 'with' guarantees the file is closed even if a write fails part-way.
    with open(os.path.join(OUTPUT_DIR, poster_name), 'wb') as image_file:
        for chunk in image.iter_content(100000):
            image_file.write(chunk)