diff --git a/01_EJDE_spider/ejde_main.py b/01_EJDE_spider/ejde_main.py index 2ea14c9..d13393f 100644 --- a/01_EJDE_spider/ejde_main.py +++ b/01_EJDE_spider/ejde_main.py @@ -252,7 +252,7 @@ def process_article(title, article_url): # If no author table else: match_type = 0 - hr_count = len(soup.find_all('hr')) + hr_count = len(article_soup.find_all('hr')) if hr_count < 3: pattern = r'