import re
# Sample text to scrape: each movie record spans four lines
# (title in 《》, year in parentheses, rating, director).
html = '''
《流浪地球》
(2024)
8.5
导演:郭帆
《你好,李焕英》
(2024)
7.9
导演:贾玲
'''

# One pattern per field; each has exactly one capture group so that
# re.findall returns a flat list of strings.

# Title: the text between the 《 》 book-title marks.
name_pattern = r'《([^》]+)》'
# Year: four digits wrapped in ASCII parentheses.
year_pattern = r'\((\d{4})\)'
# Rating: a standalone decimal number such as 8.5.  The year has no decimal
# point, so it is never mistaken for a rating.
rating_pattern = r'\b(\d+\.\d+)\b'
# Director: the rest of the line after the "导演:" label.  Excluding line
# breaks (and '<') keeps the match from running on into the next record.
director_pattern = r'导演:([^<\r\n]+)'

names = re.findall(name_pattern, html)
years = re.findall(year_pattern, html)
ratings = re.findall(rating_pattern, html)
directors = re.findall(director_pattern, html)

# zip walks the four lists in lockstep and stops at the shortest one, so a
# record with a missing field cannot trigger an IndexError.
for name, year, rating, director in zip(names, years, ratings, directors):
    print(f"{name} | {year} | 评分:{rating} | {director}")