anime-downloader/anime_downloader/sites/anime8.py

import logging
import re

from anime_downloader.sites.anime import Anime, AnimeEpisode, SearchResult
from anime_downloader.sites import helpers

logger = logging.getLogger(__name__)


class Anime8(Anime, sitename='anime8'):
    sitename = 'anime8'

    @classmethod
    def search(cls, query):
        soup = helpers.soupify(helpers.get('https://anime8.ru/Search/', params={'s': query}).text)
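        # Each search result card is an <a> wrapping the poster; the title sits in a nested <h2>.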
        results = soup.select('div.ml-item > a')
        search_results = [
            SearchResult(
                title=i.find('h2').text,
                url=i['href'],
                meta_info={
                    'version_key_subbed': '(Sub)',
                    'version_key_dubbed': '(Dub)'
                })
            for i in results
        ]
        return search_results

    def _scrape_episodes(self):
        """
        Because of how the website is built, the only way to reach the
        episode list is by going to the last available episode, which is
        why two requests are made here.
        """
        link = helpers.soupify(helpers.get(self.url).text).select_one('div#mv-info > a')['href']
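        # Second request: that episode's page, which carries the buttons for every episode.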
        soup = helpers.soupify(helpers.get(link).text)
        eps = soup.select('a[class*="btn-eps first-ep last-ep"]')
        eps = [x.get('href') for x in eps]

        # Separate the normal episodes from the special episodes.
        correct_eps = []
        special_eps = []
        special_separator = ['-Preview', '-Special']
        for episode in eps:
            ep_text = episode.split('/')[-1].split('?')[0]  # Get the episode type from the url
            # Only "The God of High School" has a sneak peek episode, and it is broken in the first 10 seconds.
            if '-Sneak-Peak' in ep_text:
                continue
            # Special episodes go into their own list.
            if ep_text in special_separator:
                special_eps.append(episode)
            # Normal episodes go into correct_eps.
            else:
                correct_eps.append(episode)
        # If configured to do so, append all the special episodes to the end of the list.
        if self.config['include_special_eps']:
            correct_eps.extend(special_eps)
        return correct_eps

    def _scrape_metadata(self):
        soup = helpers.soupify(helpers.get(self.url))
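        # The title is only exposed as the poster thumbnail's alt text.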
        self.title = soup.select('div.thumb.mvic-thumb > img')[0]['alt']


class Anime8Episode(AnimeEpisode, sitename='anime8'):
    def _get_sources(self):
        resp = helpers.get(self.url)
        # Get the ctk token and the episode id from the page; both are needed for the post request below.
        ctk = re.search(r"ctk\s+=\s+'(.*)?';", resp.text).group(1)
        _id = re.search(r"episode_id\s*=\s*([^;]*)", resp.text).group(1)
        logger.info('ctk: {}'.format(ctk))
        logger.info('id: {}'.format(_id))
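        # Try each configured server in order until one returns a working embed.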
        for server in self.config['servers']:
            # The post request returns an embed.
            logger.info('server: {}'.format(server))
            resp = helpers.post("https://anime8.ru/ajax/anime/load_episodes_v2?s={}".format(server),
                                data={"episode_id": _id, "ctk": ctk})
            # Get the real embed url. The response JSON could be parsed directly,
            # but a regex on the raw text is probably more reliable.
            # Skip if no episode was found.
            if not resp.json().get('status'):
                continue
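            # The embed comes back as an escaped HTML snippet; stripping the backslashes leaves a clean iframe URL.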
            embed = re.search(r"iframe\s*src.*?\"([^\"]*)", resp.text).group(1).replace('\\', '')
            return [('streamx', embed)]
        return ''
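

# A minimal usage sketch (hypothetical, not part of the original module; it only
# relies on the classmethod defined above and on SearchResult's title/url fields):
#
#   from anime_downloader.sites.anime8 import Anime8
#
#   for result in Anime8.search('one piece'):
#       print(result.title, result.url)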