From da29ff0039faaabe54c7df4b842e7eaa11983848 Mon Sep 17 00:00:00 2001
From: 2509165015 <2509165015@student.edu.cn>
Date: Thu, 2 Apr 2026 15:53:53 +0800
Subject: [PATCH] =?UTF-8?q?=E6=AD=A3=E5=88=99=E8=A1=A8=E8=BE=BE=E5=BC=8F?=
 =?UTF-8?q?=EF=BC=9A=E7=88=AC=E8=99=AB=E5=86=85=E5=AE=B9=E6=8F=90=E5=8F=96?=
 =?UTF-8?q?=E5=88=A9=E5=99=A8?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 0402+2509165015.CSV  | 45 +++++++++++++++++++++++++++++++++++++++
 0402+2509165015.JSON | 46 ++++++++++++++++++++++++++++++++++++++++
 0402+2509165015.txt  | 50 ++++++++++++++++++++++++++++++++++++++++++++
 3 files changed, 141 insertions(+)
 create mode 100644 0402+2509165015.CSV
 create mode 100644 0402+2509165015.JSON
 create mode 100644 0402+2509165015.txt

diff --git a/0402+2509165015.CSV b/0402+2509165015.CSV
new file mode 100644
index 0000000..d14d4b6
--- /dev/null
+++ b/0402+2509165015.CSV
@@ -0,0 +1,45 @@
+import requests
+from bs4 import BeautifulSoup
+import csv
+import time
+
+headers = {
+    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
+}
+
+movies = []
+
+for start in range(0, 250, 25):
+    url = f"https://movie.douban.com/top250?start={start}"
+    res = requests.get(url, headers=headers)
+    soup = BeautifulSoup(res.text, "html.parser")
+    items = soup.find_all("div", class_="item")
+
+    for item in items:
+        rank = item.find("em").text
+        title = item.find("span", class_="title").text
+        rating = item.find("span", class_="rating_num").text
+        people = item.find("div", class_="star").find_all("span")[-1].text.replace("人评价", "")
+        quote = item.find("span", class_="inq").text if item.find("span", class_="inq") else "无"
+        info = item.find("p", class_="").text.strip().split("\n")
+        line1 = info[0].strip()
+        line2 = info[1].strip() if len(info) > 1 else ""
+
+        director = line1.split("导演: ")[1].split("主演: ")[0].strip() if "导演: " in line1 else "未知"
+        actor = line1.split("主演: ")[1].strip() if "主演: " in line1 else "未知"
+        parts = line2.split("/") if line2 else []
+        year = parts[0].strip() if len(parts) >= 1 else "未知"
+        area = parts[1].strip() if len(parts) >= 2 else "未知"
+        genre = parts[2].strip() if len(parts) >= 3 else "未知"
+
+        movies.append({
+            "排名": rank, "电影名": title, "评分": rating, "评价人数": people, "经典台词": quote,
+            "导演": director, "主演": actor, "年份": year, "地区": area, "类型": genre
+        })
+    time.sleep(1)
+    print(f"已爬取 {start + 25} 条")
+with open("douban_top250.csv", "w", encoding="utf-8", newline="") as f:
+    writer = csv.DictWriter(f, fieldnames=movies[0].keys())
+    writer.writeheader()
+    writer.writerows(movies)
+print("✅ CSV 导出完成")
\ No newline at end of file
diff --git a/0402+2509165015.JSON b/0402+2509165015.JSON
new file mode 100644
index 0000000..d419a03
--- /dev/null
+++ b/0402+2509165015.JSON
@@ -0,0 +1,46 @@
+import requests
+from bs4 import BeautifulSoup
+import json
+import time
+
+headers = {
+    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
+}
+
+movies = []
+
+for start in range(0, 250, 25):
+    url = f"https://movie.douban.com/top250?start={start}"
+    res = requests.get(url, headers=headers)
+    soup = BeautifulSoup(res.text, "html.parser")
+    items = soup.find_all("div", class_="item")
+
+    for item in items:
+        rank = item.find("em").text
+        title = item.find("span", class_="title").text
+        rating = item.find("span", class_="rating_num").text
+        people = item.find("div", class_="star").find_all("span")[-1].text.replace("人评价", "")
+        quote = item.find("span", class_="inq").text if item.find("span", class_="inq") else "无"
+        info = item.find("p", class_="").text.strip().split("\n")
+        line1 = info[0].strip()
+        line2 = info[1].strip() if len(info) > 1 else ""
+
+        director = line1.split("导演: ")[1].split("主演: ")[0].strip() if "导演: " in line1 else "未知"
+        actor = line1.split("主演: ")[1].strip() if "主演: " in line1 else "未知"
+        parts = line2.split("/") if line2 else []
+        year = parts[0].strip() if len(parts) >= 1 else "未知"
+        area = parts[1].strip() if len(parts) >= 2 else "未知"
+        genre = parts[2].strip() if len(parts) >= 3 else "未知"
+
+        movies.append({
+            "排名": rank, "电影名": title, "评分": rating, "评价人数": people, "经典台词": quote,
+            "导演": director, "主演": actor, "年份": year, "地区": area, "类型": genre
+        })
+
+    time.sleep(1)
+    print(f"已爬取 {start + 25} 条")
+
+with open("douban_top250.json", "w", encoding="utf-8") as f:
+    json.dump(movies, f, ensure_ascii=False, indent=2)
+
+print("✅ JSON 导出完成")
\ No newline at end of file
diff --git a/0402+2509165015.txt b/0402+2509165015.txt
new file mode 100644
index 0000000..7ca51bd
--- /dev/null
+++ b/0402+2509165015.txt
@@ -0,0 +1,50 @@
+import requests
+from bs4 import BeautifulSoup
+import time
+
+headers = {
+    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36"
+}
+
+movies = []
+
+for start in range(0, 250, 25):
+    url = f"https://movie.douban.com/top250?start={start}"
+    res = requests.get(url, headers=headers)
+    soup = BeautifulSoup(res.text, "html.parser")
+    items = soup.find_all("div", class_="item")
+
+    for item in items:
+        rank = item.find("em").text
+        title = item.find("span", class_="title").text
+        rating = item.find("span", class_="rating_num").text
+        people = item.find("div", class_="star").find_all("span")[-1].text.replace("人评价", "")
+        quote = item.find("span", class_="inq").text if item.find("span", class_="inq") else "无"
+        info = item.find("p", class_="").text.strip().split("\n")
+        line1 = info[0].strip()
+        line2 = info[1].strip() if len(info) > 1 else ""
+
+        director = line1.split("导演: ")[1].split("主演: ")[0].strip() if "导演: " in line1 else "未知"
+        actor = line1.split("主演: ")[1].strip() if "主演: " in line1 else "未知"
+        parts = line2.split("/") if line2 else []
+        year = parts[0].strip() if len(parts) >= 1 else "未知"
+        area = parts[1].strip() if len(parts) >= 2 else "未知"
+        genre = parts[2].strip() if len(parts) >= 3 else "未知"
+
+        movies.append({
+            "排名": rank, "电影名": title, "评分": rating, "评价人数": people, "经典台词": quote,
+            "导演": director, "主演": actor, "年份": year, "地区": area, "类型": genre
+        })
+
+    time.sleep(1)
+    print(f"已爬取 {start + 25} 条")
+
+with open("douban_top250.txt", "w", encoding="utf-8") as f:
+    for m in movies:
+        f.write(f"第{m['排名']}名：{m['电影名']}\n")
+        f.write(f"评分：{m['评分']} 评价人数：{m['评价人数']}\n")
+        f.write(f"导演：{m['导演']} 主演：{m['主演']}\n")
+        f.write(f"年份：{m['年份']} 地区：{m['地区']} 类型：{m['类型']}\n")
+        f.write(f"经典台词：{m['经典台词']}\n\n")
+
+print("✅ TXT 导出完成")
\ No newline at end of file