1. Fix hr_count: count <hr> tags in article_soup instead of soup
This commit is contained in:
ldy 2023-08-11 19:16:03 +08:00
parent 68a755a633
commit b1eba69085

View File

@@ -252,7 +252,7 @@ def process_article(title, article_url):
# If no author table
else:
match_type = 0
-hr_count = len(soup.find_all('hr'))
+hr_count = len(article_soup.find_all('hr'))
if hr_count < 3:
pattern = r'<hr>(.*?)<hr>'
else: