2016-10-23 17:51:12 +02:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
|
2019-02-03 23:54:17 +01:00
|
|
|
# Copyright 2016-2019 Mike Fährmann
|
2016-10-23 17:51:12 +02:00
|
|
|
#
|
|
|
|
# This program is free software; you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License version 2 as
|
|
|
|
# published by the Free Software Foundation.
|
|
|
|
|
2019-02-03 23:54:17 +01:00
|
|
|
"""Extractors for FoOlSlide based sites"""
|
2016-10-23 17:51:12 +02:00
|
|
|
|
2019-02-11 18:38:47 +01:00
|
|
|
from .common import (
|
2019-03-07 22:55:26 +01:00
|
|
|
Extractor,
|
|
|
|
ChapterExtractor,
|
|
|
|
MangaExtractor,
|
|
|
|
SharedConfigMixin,
|
|
|
|
Message,
|
|
|
|
generate_extractors,
|
|
|
|
)
|
|
|
|
from .. import text, util
|
2017-10-21 16:42:45 +02:00
|
|
|
import base64
|
2016-10-23 17:51:12 +02:00
|
|
|
import json
|
2017-04-11 21:03:40 +02:00
|
|
|
|
|
|
|
|
2019-02-04 13:46:02 +01:00
|
|
|
class FoolslideBase(SharedConfigMixin):
    """Functionality shared by all FoOlSlide extractors"""
    basecategory = "foolslide"

    def request(self, url):
        """Send a UTF-8 decoded POST request for 'url'

        Every request carries the form field adult=true
        (presumably to get past an adult-content confirmation page;
        verify against the sites).
        """
        form = {"adult": "true"}
        return Extractor.request(
            self, url, encoding="utf-8", method="POST", data=form)

    @staticmethod
    def parse_chapter_url(url, data):
        """Add the metadata encoded in a chapter URL to 'data'

        The path after "/read/" is split on "/" and read as
        <name>/<language>/<volume>/<chapter>[/<minor>].
        'data' must already contain a "chapter_string" entry; the text
        after its first ":" becomes the chapter title.
        The same 'data' dict is modified in place and returned.
        """
        segments = url.partition("/read/")[2].rstrip("/").split("/")

        # only keep the part before the first "-" of the language segment
        code, _, _ = segments[1].partition("-")
        data["lang"] = code
        data["language"] = util.code_to_language(code)

        data["volume"] = text.parse_int(segments[2])
        data["chapter"] = text.parse_int(segments[3])

        # an optional fifth segment holds the minor chapter number
        if len(segments) >= 5:
            data["chapter_minor"] = "." + segments[4]
        else:
            data["chapter_minor"] = ""

        _, _, title = data["chapter_string"].partition(":")
        data["title"] = title.strip()
        return data
|
|
|
|
|
|
|
|
|
2019-02-11 18:38:47 +01:00
|
|
|
class FoolslideChapterExtractor(FoolslideBase, ChapterExtractor):
    """Base class for chapter extractors for FoOlSlide based sites"""
    directory_fmt = (
        "{category}", "{manga}", "{chapter_string}")
    archive_fmt = "{id}"
    pattern_fmt = r"(/read/[^/?&#]+/[a-z-]+/\d+/\d+(?:/\d+)?)"
    # selects how images() locates the JSON page list:
    # "base64", "double", or anything else for the plain "var pages" form
    decode = "default"

    def items(self):
        """Yield the version, directory and URL messages of a chapter

        One Message.Url is produced per image entry. The same metadata
        dict is updated in place and yielded for every image.

        Raises KeyError if an image entry has no "url", "filename",
        "height", "id", "size" or "width" field, and fails on the
        'imgs[0]' lookup if the page list is empty.
        """
        page = self.request(self.chapter_url).text
        data = self.metadata(page)
        imgs = self.images(page)

        data["count"] = len(imgs)
        data["chapter_id"] = text.parse_int(imgs[0]["chapter_id"])

        yield Message.Version, 1
        yield Message.Directory, data
        for data["page"], image in enumerate(imgs, 1):
            # An entry without a URL cannot be downloaded; fail with a
            # clear KeyError instead of reusing the previous image's URL
            # (or hitting an unbound local on the first entry).
            url = image.pop("url")
            # These two keys are dropped from the per-image metadata
            # independently of each other; either may be absent.
            image.pop("chapter_id", None)
            image.pop("thumb_url", None)

            for key in ("height", "id", "size", "width"):
                image[key] = text.parse_int(image[key])
            data.update(image)
            text.nameext_from_url(data["filename"], data)
            yield Message.Url, url, data

    def metadata(self, page):
        """Return the chapter metadata found in 'page' and the chapter URL

        "manga" and "chapter_string" are read from two title="..."
        attributes following the '<h1 class="tbtitle dnone">' marker
        (assumes each extr() call continues after the previous match;
        confirm against text.extract_from). The remaining fields are
        added by parse_chapter_url().
        """
        extr = text.extract_from(page)
        extr('<h1 class="tbtitle dnone">', '')
        return self.parse_chapter_url(self.chapter_url, {
            "manga"         : text.unescape(extr('title="', '"')).strip(),
            "chapter_string": text.unescape(extr('title="', '"')),
        })

    def images(self, page):
        """Return the JSON-decoded page list embedded in 'page'"""
        if self.decode == "base64":
            # the list is the base64 string given to an atob("...") call
            base64_data = text.extract(page, 'atob("', '"')[0].encode()
            data = base64.b64decode(base64_data).decode()
        elif self.decode == "double":
            # take the text between " = " and ";", passing the offset of
            # the first "[{" as the position argument of text.extract
            pos = page.find("[{")
            data = text.extract(page, " = ", ";", pos)[0]
        else:
            data = text.extract(page, "var pages = ", ";")[0]
        return json.loads(data)
|
2017-04-11 21:03:40 +02:00
|
|
|
|
|
|
|
|
2019-02-04 13:46:02 +01:00
|
|
|
class FoolslideMangaExtractor(FoolslideBase, MangaExtractor):
    """Base class for manga extractors for FoOlSlide based sites"""
    pattern_fmt = r"(/series/[^/?&#]+)"

    def chapters(self, page):
        """Return a list of (chapter-url, metadata) tuples found in 'page'

        Manga title, author and artist are read once from the page
        header and copied into the metadata of every chapter; the
        URL-derived fields are added by parse_chapter_url().
        """
        extr = text.extract_from(page)
        title = extr('<h1 class="title">', '</h1>')
        manga = text.unescape(title).strip()
        author = extr('<b>Author</b>: ', '<br')
        artist = extr('<b>Artist</b>: ', '<br')

        chapter_marker = '<div class="title"><a href="'
        found = []

        url = extr(chapter_marker, '"')
        # stop as soon as no further chapter link is returned
        while url:
            info = {
                "manga": manga,
                "author": author,
                "artist": artist,
                "chapter_string": extr('title="', '"'),
                "group": extr('title="', '"'),
            }
            found.append((url, self.parse_chapter_url(url, info)))
            url = extr(chapter_marker, '"')
        return found
|
2019-02-03 23:54:17 +01:00
|
|
|
|
|
|
|
|
|
|
|
# Per-site settings, keyed by category name.
# Each site entry holds its "root" URL, optionally a "pattern" regex and
# "extra" settings, and test URLs with their expected results under
# "test-chapter" and "test-manga".
# A test value is either one (url, results) pair or a tuple of such pairs.
EXTRACTORS = {
    "dokireader": {
        "root": "https://kobato.hologfx.com/reader",
        "test-chapter": (
            ("https://kobato.hologfx.com/reader/read/"
             "hitoribocchi_no_oo_seikatsu/en/3/34"),
            {"keyword": "6e719ac86f0c6dab89390dd7e507e678459e0dbc"},
        ),
        "test-manga": (
            ("https://kobato.hologfx.com/reader/series/"
             "boku_ha_ohimesama_ni_narenai/"),
            {
                "url": "1c1f5a7258ce4f631f5fc32be548d78a6a57990d",
                "keyword": "614d89a6045b85c822cbd3e67578ea7577dfc995",
            },
        ),
    },

    "jaiminisbox": {
        "root": "https://jaiminisbox.com/reader",
        "pattern": r"(?:www\.)?jaiminisbox\.com/reader",
        "extra": {"decode": "base64"},
        "test-chapter": (
            (
                "https://jaiminisbox.com/reader/read/uratarou/en/0/1/",
                {"keyword": "6009af77cc9c05528ab1fdda47b1ad9d4811c673"},
            ),
            (
                "https://jaiminisbox.com/reader/read/dr-stone/en/0/16/",
                {"keyword": "8607375c24b1d0db7f52d059ef5baff793aa458e"},
            ),
        ),
        "test-manga": (
            "https://jaiminisbox.com/reader/series/sora_no_kian/",
            {
                "url": "66612be177dc3b3fa1d1f537ef02f4f701b163ea",
                "keyword": "0908a4145bb03acc4210f5d01169988969f5acd1",
            },
        ),
    },

    "kireicake": {
        "root": "https://reader.kireicake.com",
        "test-chapter": (
            "https://reader.kireicake.com/read/wonderland/en/1/1/",
            {
                "url": "b2d36bc0bc67e4c461c3a4d6444a2fd339f5d07e",
                "keyword": "9f80947920a325e33aea7f5cd69ea669171903b6",
            },
        ),
        "test-manga": (
            "https://reader.kireicake.com/series/wonderland/",
            {
                "url": "d067b649af1cc88fa8c8b698fde04a10909fd169",
                "keyword": "268f43772fb239888ca5c5f6a4f65f99ffb3eefb",
            },
        ),
    },

    "powermanga": {
        "root": "https://read.powermanga.org",
        "pattern": r"read(?:er)?\.powermanga\.org",
        "test-chapter": (
            ("https://read.powermanga.org"
             "/read/one_piece_digital_colour_comics/en/0/75/"),
            {
                "url": "854c5817f8f767e1bccd05fa9d58ffb5a4b09384",
                "keyword": "a60c42f2634b7387899299d411ff494ed0ad6dbe",
            },
        ),
        "test-manga": (
            ("https://read.powermanga.org"
             "/series/one_piece_digital_colour_comics/"),
            {
                "count": ">= 1",
                "keyword": {
                    "chapter": int,
                    "chapter_minor": str,
                    "chapter_string": str,
                    "group": "PowerManga",
                    "lang": "en",
                    "language": "English",
                    "manga": "One Piece Digital Colour Comics",
                    "title": str,
                    "volume": int,
                },
            },
        ),
    },

    "sensescans": {
        "root": "http://sensescans.com/reader",
        "pattern": (
            r"(?:(?:www\.)?sensescans\.com/reader"
            r"|reader\.sensescans\.com)"
        ),
        "test-chapter": (
            (
                ("http://sensescans.com/reader/read/"
                 "magi__labyrinth_of_magic/en/37/369/"),
                {
                    "url": "a399ef037cdfbc25b09d435cc2ea1e3e454a6812",
                    "keyword": "07acd84fb18a9f1fd6dff5befe711bcca0ff9988",
                },
            ),
            (
                ("http://reader.sensescans.com/read/"
                 "magi__labyrinth_of_magic/en/37/369/"),
                {
                    "url": "a399ef037cdfbc25b09d435cc2ea1e3e454a6812",
                    "keyword": "07acd84fb18a9f1fd6dff5befe711bcca0ff9988",
                },
            ),
        ),
        "test-manga": (
            "http://sensescans.com/reader/series/hakkenden/",
            {
                "url": "2360ccb0ead0ff2f5e27b7aef7eb17b9329de2f2",
                "keyword": "4919f2bfed38e3a34dc984ec8d1dbd7a03044e23",
            },
        ),
    },

    "worldthree": {
        "root": "http://www.slide.world-three.org",
        "pattern": r"(?:www\.)?slide\.world-three\.org",
        "test-chapter": (
            (
                ("http://www.slide.world-three.org"
                 "/read/black_bullet/en/2/7/page/1"),
                {
                    "url": "be2f04f6e2d311b35188094cfd3e768583271584",
                    "keyword": "967d536a65de4d52478d5b666a1760b181eddb6e",
                },
            ),
            (
                ("http://www.slide.world-three.org"
                 "/read/idolmster_cg_shuffle/en/0/4/2/"),
                {
                    "url": "6028ea5ca282744f925dfad92eeb98509f9cc78c",
                    "keyword": "f3cfe2ad3388991f1d045c85d0fa94795a7694dc",
                },
            ),
        ),
        "test-manga": (
            "http://www.slide.world-three.org/series/black_bullet/",
            {
                "url": "5743b93512d26e6b540d90a7a5d69208b6d4a738",
                "keyword": "3a24f1088b4d7f3b798a96163f21ca251293a120",
            },
        ),
    },

    # not a site entry; presumably read by generate_extractors() - verify
    "_ckey": "chapterclass",
}
|
|
|
|
|
2019-03-07 22:55:26 +01:00
|
|
|
# Hand the site table, this module's namespace and the two base classes
# to generate_extractors().
_BASE_CLASSES = (FoolslideChapterExtractor, FoolslideMangaExtractor)
generate_extractors(EXTRACTORS, globals(), _BASE_CLASSES)
|