getChapterLink
This commit is contained in:
@@ -2,3 +2,6 @@
|
|||||||
*test*.py
|
*test*.py
|
||||||
test.*
|
test.*
|
||||||
*.log
|
*.log
|
||||||
|
.vscode
|
||||||
|
.venv
|
||||||
|
*pycache*
|
||||||
@@ -34,7 +34,12 @@ class OniichanyameteWebScrapper(WebScrapper):
|
|||||||
links =soup.select("p[style*='padding-left:60px'] > a")
|
links =soup.select("p[style*='padding-left:60px'] > a")
|
||||||
pprint(links)
|
pprint(links)
|
||||||
|
|
||||||
|
currChapterNumber = fromChapter
|
||||||
for link in links:
|
for link in links:
|
||||||
chapterNumber = re.search(r'\d+', link.text).group()
|
tmpChapterNumber = re.search(r'\d+', link.text).group()
|
||||||
|
chapterNumber += 1
|
||||||
|
|
||||||
|
if tmpChapterNumber != str(currChapterNumber):
|
||||||
|
continue
|
||||||
|
|
||||||
yield chapterNumber, urljoin(self.baseLink, link["href"])
|
yield chapterNumber, urljoin(self.baseLink, link["href"])
|
||||||
Reference in New Issue
Block a user