import re
# Sample text to scrape: each movie is four consecutive lines --
# 《title》, (year), rating, and "导演: <director>".
html = """
《流浪地球》
(2024)
8.5
导演: 郭帆
《你好,李焕英》
(2021)
7.9
导演: 贾玲
"""

# Title: whatever sits between the 《 》 book-title marks.
name_pattern = r'《([^》]+)》'
# Year: digits wrapped in ASCII parentheses.
year_pattern = r'\((\d+)\)'
# Rating: a number that is alone on its line. Anchoring with the inline
# MULTILINE flag keeps the digits inside "(2024)" from being picked up as
# ratings, which would otherwise misalign the zip() below.
rating_pattern = r'(?m)^[ \t]*(\d+(?:\.\d+)?)[ \t]*$'
# Director: text after the label, stopping at a tag start OR the end of the
# line so one match cannot swallow the following records.
director_pattern = r'导演: ([^<\n]+)'

names = re.findall(name_pattern, html)
years = re.findall(year_pattern, html)
ratings = re.findall(rating_pattern, html)
# Strip stray trailing whitespace that the character class may capture.
directors = [d.strip() for d in re.findall(director_pattern, html)]

# The four lists are parallel (one entry per movie); print one row per movie.
for name, year, rating, director in zip(names, years, ratings, directors):
    print(f"{name} {year} {rating} {director}")