"""Fetch the Douban Top 250 page and print the first ten Chinese movie titles."""
import html
import re

HEADERS = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36'
}
URL = 'https://movie.douban.com/top250'

# Compiled once at import time; both capture the text content of a <span>.
TITLE_PATTERN = re.compile(r'<span class="title">([^<]+)</span>')
RATING_PATTERN = re.compile(r'<span class="rating_num"[^>]*>(\d+\.\d)</span>')


def fetch_page(url=URL, timeout=10):
    """Download *url* with the browser-like headers and return the body text.

    Args:
        url: Page to request.
        timeout: Seconds to wait before giving up on the server.

    Raises:
        requests.RequestException: On connection problems, timeouts, or a
            non-2xx HTTP status.
    """
    # Imported here so the parsing helpers stay importable (and testable)
    # on machines where the third-party HTTP client is not installed.
    import requests

    response = requests.get(url, headers=HEADERS, timeout=timeout)
    # Fail loudly on an error page instead of silently parsing it.
    response.raise_for_status()
    return response.text


def extract_titles(page_html):
    """Return the titles found in *page_html*, skipping '/'-prefixed ones.

    Each match is HTML-unescaped and stripped before the check, so a
    separator written as ``&nbsp;/&nbsp;`` is recognised as well as a
    literal leading ``/``.
    """
    cleaned = (
        html.unescape(raw).strip() for raw in TITLE_PATTERN.findall(page_html)
    )
    return [title for title in cleaned if title and not title.startswith('/')]


def extract_ratings(page_html):
    """Return every rating string (for example ``'9.7'``) in *page_html*."""
    return RATING_PATTERN.findall(page_html)


def main():
    """Print the first ten titles and return ``(titles, ratings)``.

    The ratings are extracted but not printed; they are returned so a caller
    can use them.
    """
    page_html = fetch_page()

    chinese_titles = extract_titles(page_html)
    print('电影名称(前10部):')
    for i, title in enumerate(chinese_titles[:10], 1):
        print(f'{i}. {title}')

    ratings = extract_ratings(page_html)
    return chinese_titles, ratings


if __name__ == '__main__':
    main()