Files
mangaDownloader/manga-py-stable_1.x/manga_py/providers/webtoons_com.py
2019-12-14 22:33:14 -05:00

80 lines
2.6 KiB
Python

from manga_py.provider import Provider
from .helpers.std import Std
class WebToonsCom(Provider, Std):
__titleNo = 0
__mainUrl = ''
__next_page_urls = None
def get_archive_name(self) -> str:
i = self.re.search(r'\.com%s%s' % (
r'(?:/|%2F)[^/%]+' * 3,
r'(?:/|%2F)([^/%]+)',
), self.chapter)
return self.normal_arc_name([self.chapter_id, i.group(1)])
def get_chapter_index(self) -> str:
return self.re.search(r'\bepisode_no=(\d+)', self.chapter).group(1)
def get_main_content(self):
return self.http_get(self.__mainUrl)
def get_manga_name(self) -> str:
self.__titleNo = self._get_name(r'title_no=(\d+)')
name = self._get_name(r'\.com/([^/]+/[^/]+/[^/]+)')
self.__mainUrl = '{}/{}/list?title_no={}'.format(self.domain, name, self.__titleNo)
return self._get_name(r'\.com/[^/]+/[^/]+/([^/]+)')
def _chapters(self, content):
return self._elements('#_listUl li > a', content)
def _get_page_urls(self, content):
return self._elements('.paginate a:not([class]):not([onclick])', content)
def _get_pages_urls(self, content):
chapters = []
n = self.http().normalize_uri
for j in self._get_page_urls(content): # page-urls
_content = self.http_get(n(j.get('href')))
chapters += self._chapters(_content)
return chapters
def get_next_page_urls(self, content):
urls = self._elements('a + a.pg_next', content)
n = self.http().normalize_uri
if len(urls):
self.__next_page_urls.append(n(urls[0].get('href')))
_content = self.http().get(n(urls[0].get('href')))
self.get_next_page_urls(_content)
def get_chapters(self):
self.log('Parse chapters. Please, wait')
self.__next_page_urls = []
chapters = self._chapters(self.content)
n = self.http().normalize_uri
chapters += self._get_pages_urls(self.content) # main page paginator
self.get_next_page_urls(self.content)
for url in self.__next_page_urls:
content = self.http().get(n(url))
chapters += self._chapters(content)
chapters += self._get_pages_urls(content)
return chapters
def get_files(self):
parser = self.html_fromstring(self.chapter)
return self._images_helper(parser, '#_imageList img', 'data-url')
def get_cover(self) -> str:
img = self.html_fromstring(self.content, '#content > .detail_bg', 0)
return self.parse_background(img)
def book_meta(self) -> dict:
# todo meta
pass
main = WebToonsCom