# File: datamining_881/scripts/scrape.py
# Last modified: 2026-03-10 14:14:59 -04:00
#
# 33 lines, 667 B, Python

import requests
# MediaWiki Action API endpoint for English Wikipedia.
url = "https://en.wikipedia.org/w/api.php"

# Identify the client to the API with a descriptive User-Agent and contact.
headers = {
    "User-Agent": "CSE881-MovieProject/1.0 (ishaa@msu.edu)",
}

# Query for the plain-text extract of one article, following redirects.
params = {
    "action": "query",
    "format": "json",
    "titles": "Godfather",
    "prop": "extracts",
    "explaintext": True,
    "redirects": 1,
}

# Seconds to wait on connect/read. requests applies no timeout by default, so
# without this a stalled connection would block the script indefinitely.
REQUEST_TIMEOUT = 10

# How many leading characters of the raw response body are echoed for debugging.
RAW_PREVIEW_CHARS = 1000


def first_page(data):
    """Return the first page object from a decoded ``action=query`` reply.

    Args:
        data: The JSON-decoded response body (expected to be a dict).

    Returns:
        The first value of ``data["query"]["pages"]``; it is guaranteed to
        contain an ``"extract"`` key.

    Raises:
        ValueError: If the reply is not a dict, carries an ``"error"`` object,
            has no pages, or the selected page has no ``"extract"`` (for
            example because the title does not exist).
    """
    if not isinstance(data, dict):
        raise ValueError("Unexpected reply: top-level JSON value is not an object")

    if "error" in data:
        info = data["error"].get("info", "unknown error")
        raise ValueError(f"MediaWiki API error: {info}")

    pages = data.get("query", {}).get("pages")
    if not pages:
        raise ValueError("MediaWiki reply contains no pages")

    # Only one title is requested, so the first entry is the one we want.
    page = next(iter(pages.values()))
    if "extract" not in page:
        raise ValueError(f"No extract returned for page {page.get('title')!r}")
    return page


def main():
    """Fetch the configured article and print diagnostics, title and extract.

    Raises:
        requests.RequestException: On timeout, connection failure, or a
            4xx/5xx HTTP status.
        ValueError: If the body is not the expected query reply.
    """
    response = requests.get(
        url, headers=headers, params=params, timeout=REQUEST_TIMEOUT
    )

    # Print diagnostics before any validation so they are visible on failure.
    print("Status:", response.status_code)
    print("Content-Type:", response.headers.get("content-type"))
    print(f"First {RAW_PREVIEW_CHARS} chars:\n", response.text[:RAW_PREVIEW_CHARS])

    # Fail on HTTP errors instead of trying to parse an error page as JSON.
    response.raise_for_status()

    page = first_page(response.json())
    print("\nTitle:", page["title"])
    print("\nPreview:\n", page["extract"])


if __name__ == "__main__":
    main()