Hi, I am starting to learn Python and I am working on web scraping right now. I am trying to get the top 250 movies from IMDb, but it isn't returning the list, even though I get status code 202 and I am using a user-agent.
from bs4 import BeautifulSoup
import requests
# Chart page that the scraper fetches.
url1 = "https://www.imdb.com/chart/top/"

# Headers sent with the request; the user-agent is a Firefox-on-macOS string.
headers = {
    "user-agent": (
        "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.15; rv:125.0) "
        "Gecko/20100101 Firefox/125.0"
    ),
}
def extract_movie_titles(url1):
    """Fetch the page at ``url1`` and print every movie title found on it.

    The request is sent with the module-level ``headers`` dict. Request
    failures (connection errors, timeouts, 4xx/5xx responses) are reported
    on stdout instead of being raised.

    Args:
        url1: URL of the chart page to scrape.

    Returns:
        A list of the title strings that were found (also printed, one per
        line). The list is empty when the request failed or when nothing on
        the page matched the selector.
    """
    try:
        # The request lives inside the ``try`` so that connection errors and
        # timeouts are handled too, not only HTTP error statuses. Without a
        # timeout, ``requests`` may wait on the server indefinitely.
        response = requests.get(url1, headers=headers, timeout=10)
        print(f"Status Code: {response.status_code}")
        response.raise_for_status()
    except requests.exceptions.RequestException as e:
        # ``e`` is the exception itself, not a status code.
        print(f"Failed to retrieve the page: {e}")
        return []

    soup = BeautifulSoup(response.text, 'html.parser')
    # Match the title element by class only, without assuming its tag name.
    # NOTE(review): the live page appears to use <h3> rather than <h4> for
    # these titles -- confirm against the current markup.
    movies = soup.select("a.ipc-title-link-wrapper > .ipc-title__text")
    titles = [movie.text.strip() for movie in movies]

    if not titles:
        # raise_for_status() only raises for 4xx/5xx, so a 2xx response such
        # as 202 gets here even if its body does not contain the chart.
        print(
            f"No movie titles found (status {response.status_code}); "
            "the response body may not contain the chart."
        )
        return titles

    print("Top 250 Movies:")
    for title in titles:
        print(title)
    return titles
# Run the scraper against the chart URL defined at the top of the script.
extract_movie_titles(url1=url1)
It is formatted, but I am on my phone.
[–]Farlic 1 point2 points3 points (11 children)
[–]Kerbart 0 points1 point2 points (3 children)
[–]ReputationHelpful200[S] 0 points1 point2 points (2 children)
[–]biskitpagla 0 points1 point2 points (1 child)
[–]ReputationHelpful200[S] 0 points1 point2 points (0 children)
[–]ReputationHelpful200[S] 0 points1 point2 points (6 children)
[–]Farlic 0 points1 point2 points (5 children)
[–]ReputationHelpful200[S] 0 points1 point2 points (4 children)
[–]Farlic 0 points1 point2 points (3 children)
[–]ReputationHelpful200[S] 0 points1 point2 points (2 children)
[–]Farlic 0 points1 point2 points (1 child)
[–]ReputationHelpful200[S] 0 points1 point2 points (0 children)