Compare commits

..

5 Commits

Author SHA1 Message Date
81c1ceb86c 上传文件至 / 2026-03-26 16:09:25 +08:00
2509165036
c28f614355 完成作业X 2026-03-24 11:35:16 +08:00
2509165036
73cf5976cb 完成作业X 2026-03-24 11:22:10 +08:00
2509165036
374b06bb6e 完成作业X 2026-03-24 10:55:03 +08:00
2509165036
5ed4959e22 完成作业X 2026-03-24 10:46:04 +08:00
5 changed files with 91 additions and 0 deletions

27
2509165012+3.26.py Normal file
View File

@@ -0,0 +1,27 @@
import requests
from bs4 import BeautifulSoup
import time
# Browser-like User-Agent sent with every request in this script.
headers = {'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.110 Safari/537.36'}

# Make five attempts: fetch the landing page, locate the first
# <img class="resize"> element, and save the file its src points to as
# image_<n>.jpg in the current working directory.
for i in range(5):
    try:
        response = requests.get('https://picsum.photos/', headers=headers, timeout=10)
        # Stop on 4xx/5xx instead of parsing an error page as if it were content.
        response.raise_for_status()
        response.encoding = 'utf-8'
        soup = BeautifulSoup(response.text, 'html.parser')
        img_tag = soup.select_one('img.resize')
        if not img_tag:
            print(f"{i+1}张:未找到图片标签,跳过")
            continue
        # A tag without a usable src would otherwise surface as a bare KeyError.
        img_src = img_tag.get('src')
        if not img_src:
            print(f"{i+1}张:图片标签缺少src,跳过")
            continue
        img_response = requests.get(img_src, headers=headers, timeout=10)
        # Without this check an HTML error body would be written out as a .jpg.
        img_response.raise_for_status()
        filename = f'image_{i+1}.jpg'
        with open(filename, 'wb') as f:
            f.write(img_response.content)
        print(f"{i+1}张:下载完成 → {filename}")
        # Pause between successful downloads to avoid hammering the server.
        time.sleep(1)
    except Exception as e:
        # Best-effort script: report the failure and move on to the next attempt.
        print(f"{i+1}张:下载失败 → {e}")

21
2509165036胡红辉.py Normal file
View File

@@ -0,0 +1,21 @@
import requests
from bs4 import BeautifulSoup
# Browser-like User-Agent sent with the request.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
}
# The query string carries start=0, so only the first page is requested.
url = 'https://www.douban.com/doulist/3936288/?start=0&sort=time&playable=0&sub_type='
# Zero-based page index used by the progress messages below; it was
# referenced but never defined, which raised NameError at runtime.
page = 0
movies = []

try:
    response = requests.get(url, headers=headers, timeout=10)
    # Treat 4xx/5xx as a failed page instead of scraping an error document.
    response.raise_for_status()
    response.encoding = 'utf-8'
    soup = BeautifulSoup(response.text, 'html.parser')

    # Collect the visible text of every anchor whose href points at a
    # /subject/ URL.
    for a in soup.find_all('a'):
        href = a.get('href', '')
        if '/subject/' not in href:
            continue
        title = a.get_text(strip=True)
        # Anchors with no text would only add empty strings to the result.
        if not title:
            continue
        # Page-labelled line replaces the bare print(title) so each title
        # is printed once.
        print(f"{page+1}页:{title}")
        movies.append(title)

    print('-----------')
    print(movies)
    print(f"1 第{page+1}页爬取完成,共{len(movies)}条数据\n")
except requests.RequestException as e:
    # Network or HTTP failure: report it instead of crashing with a traceback.
    print(f"错第{page+1}页爬取失败:{e}")

37
sh.exe.stackdump Normal file
View File

@@ -0,0 +1,37 @@
Stack trace:
Frame Function Args
0007FFFFCD30 00021006116E (000210281C30, 000210272B51, 0007FFFFCD30, 0007FFFFBA30) msys-2.0.dll+0x2116E
0007FFFFCD30 0002100469BA (000100002000, 000001F70A70, 000001F70A70, 000000000002) msys-2.0.dll+0x69BA
0007FFFFCD30 0002100469F2 (000000000002, 000800007F88, 0007FFFFCD30, 000700000008) msys-2.0.dll+0x69F2
0007FFFFCD30 00021005A029 (0007FFFFCC44, 0007FFFFCD30, 0007FFFFCC8F, 0007FFFFCC73) msys-2.0.dll+0x1A029
0007FFFFCD30 00021005A0DF (645C655C725C635C, 695C745C6E5C655C, 735C2D5C6C5C615C, 655C725C6F5C745C) msys-2.0.dll+0x1A0DF
0007FFFFCD30 000210047151 (000000000000, 000000000000, 000000000000, 000000000000) msys-2.0.dll+0x7151
0007FFFFFFF0 000210045C86 (000000000000, 000000000000, 000000000000, 000000000000) msys-2.0.dll+0x5C86
0007FFFFFFF0 000210045D34 (000000000000, 000000000000, 000000000000, 000000000000) msys-2.0.dll+0x5D34
End of stack trace
Loaded modules:
000100400000 sh.exe
000077A20000 ntdll.dll
000077800000 kernel32.dll
07FEFD8C0000 KERNELBASE.dll
000210040000 msys-2.0.dll
000077920000 USER32.dll
07FEFF9C0000 GDI32.dll
07FEFD930000 LPK.dll
07FEFF720000 USP10.dll
07FEFD940000 msvcrt.dll
07FEFF7F0000 advapi32.dll
07FEFF8D0000 sechost.dll
07FEFEEC0000 RPCRT4.dll
07FEFD410000 cryptbase.dll
07FEFF990000 IMM32.DLL
07FEFF5A0000 MSCTF.dll
07FEFB440000 netapi32.dll
07FEFB430000 netutils.dll
07FEFCF80000 srvcli.dll
07FEFB410000 wkscli.dll
07FEFB3F0000 SAMCLI.DLL
07FEFBBC0000 SAMLIB.dll
07FEFF6B0000 ws2_32.dll
07FEFFD00000 NSI.dll
07FEFCCC0000 mswsock.dll

Submodule task-2-1-data-collection added at 545a1e905e

5
text.py Normal file
View File

@@ -0,0 +1,5 @@
import requests
# Mobile Douban collection page whose HTTP status is probed below.
url = "https://m.douban.com/subject_collection/ECGRADN5Q"
# Request headers; the call below used this name without defining it,
# which raised NameError.
header = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
}
# timeout keeps the script from hanging forever on an unresponsive server.
response = requests.get(url, headers=header, params={'key': 'value'}, timeout=10)
print(response.status_code)
# NOTE(review): the XPath below was pasted in as a bare line, which is not
# valid Python. Presumably it is the element to extract later; confirm.
#   //*[@id="content"]/h1/span[1]