1. hr_count should be computed from article_soup, not soup
This commit is contained in:
ldy 2023-08-11 19:16:03 +08:00
parent 68a755a633
commit b1eba69085

View File

@@ -252,7 +252,7 @@ def process_article(title, article_url):
# If no author table # If no author table
else: else:
match_type = 0 match_type = 0
hr_count = len(soup.find_all('hr')) hr_count = len(article_soup.find_all('hr'))
if hr_count < 3: if hr_count < 3:
pattern = r'<hr>(.*?)<hr>' pattern = r'<hr>(.*?)<hr>'
else: else: