网络数据采集（爬虫基础）

完成课堂作业爬虫3.19
2026-03-19 21:25:46 +08:00 · 2026-03-19 20:58:44 +08:00
1 changed files with 19 additions and 0 deletions
--- a/爬虫2/爬虫课堂作业3.19.py.txt
+++ b/爬虫2/爬虫课堂作业3.19.py.txt
@@ -0,0 +1,19 @@
 import requests
 from bs4 import BeautifulSoup
 # Fetch the Douban Top 250 listing (offset 0) and print the page title,
 # every anchor's href, and the text of each `div.item` element.
 url = 'https://movie.douban.com/top250'
 params = {'start': '0', 'filter': ''}
 # NOTE(review): many sites reject the default python-requests User-Agent;
 # a browser-like one is sent here on that assumption -- confirm it is needed.
 headers = {
     'User-Agent': (
         'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
         'AppleWebKit/537.36 (KHTML, like Gecko) '
         'Chrome/120.0 Safari/537.36'
     ),
 }
 # A timeout keeps the script from hanging forever on a stalled connection.
 response = requests.get(url, params=params, headers=headers, timeout=10)
 if response.status_code != 200:
     print(f"请求失败，状态码: {response.status_code}")
     # Stop here: without a response body there is nothing to parse, and
     # continuing would fail on the undefined `html_content`.
     raise SystemExit(1)

 html_content = response.text
 print("请求成功，获取到 HTML 内容")

 soup = BeautifulSoup(html_content, 'lxml')

 # `find` returns None when the document has no <title>; guard against that
 # instead of raising AttributeError on `.string`.
 title_tag = soup.find('title')
 title = title_tag.string if title_tag is not None else None
 print("页面标题:", title)

 # Print the href of every anchor (None for anchors without an href).
 for link in soup.find_all('a'):
     print("链接地址:", link.get('href'))

 # Print the text of each element matching the `div.item` selector.
 for div in soup.select('div.item'):
     print("电影条目内容:", div.text)
Author	SHA1	Message	Date
2509165020	792d62f71a	网络数据采集（爬虫基础）	2026-03-19 21:25:46 +08:00
2509165020	7be256b0d6	完成课堂作业爬虫3.19	2026-03-19 20:58:44 +08:00