From 99aec503a78abf8edc995e2e0c46ac43ec26e3a2 Mon Sep 17 00:00:00 2001 From: JohannesBOT Date: Thu, 21 May 2026 12:37:32 +0200 Subject: [PATCH] getChapterLink --- .gitignore | 5 ++++- src/WebScrapper/OniichanyameteWebScrapper.py | 9 +++++++-- 2 files changed, 11 insertions(+), 3 deletions(-) diff --git a/.gitignore b/.gitignore index 3aae54c..abfc139 100644 --- a/.gitignore +++ b/.gitignore @@ -1,4 +1,7 @@ .idea *test*.py test.* -*.log \ No newline at end of file +*.log +.vscode +.venv +*pycache* \ No newline at end of file diff --git a/src/WebScrapper/OniichanyameteWebScrapper.py b/src/WebScrapper/OniichanyameteWebScrapper.py index e30ce7d..526e389 100644 --- a/src/WebScrapper/OniichanyameteWebScrapper.py +++ b/src/WebScrapper/OniichanyameteWebScrapper.py @@ -34,7 +34,12 @@ class OniichanyameteWebScrapper(WebScrapper): links =soup.select("p[style*='padding-left:60px'] > a") pprint(links) - + currChapterNumber = fromChapter for link in links: - chapterNumber = re.search(r'\d+', link.text).group() + tmpChapterNumber = re.search(r'\d+', link.text).group() + chapterNumber += 1 + + if tmpChapterNumber != str(currChapterNumber): + continue + yield chapterNumber, urljoin(self.baseLink, link["href"]) \ No newline at end of file