bazarr/libs/subliminal_patch/providers/sucha.py

216 lines
7 KiB
Python
Raw Normal View History

2020-10-01 01:39:25 +08:00
# -*- coding: utf-8 -*-
2020-10-12 03:40:07 +08:00
import io
2020-10-01 01:39:25 +08:00
import logging
import os
import zipfile
2020-10-12 03:40:07 +08:00
import rarfile
2020-10-01 01:39:25 +08:00
from requests import Session
2020-10-12 03:40:07 +08:00
from subliminal import Episode, Movie
2020-10-01 01:39:25 +08:00
from subliminal.exceptions import ServiceUnavailable
2020-10-12 03:40:07 +08:00
from subliminal.subtitle import SUBTITLE_EXTENSIONS, fix_line_ending
from subliminal_patch.exceptions import APIThrottled
2020-10-01 01:39:25 +08:00
from subliminal_patch.providers import Provider
2020-10-12 03:40:07 +08:00
from subliminal_patch.subtitle import Subtitle
from subzero.language import Language
2020-10-01 01:39:25 +08:00
logger = logging.getLogger(__name__)
server_url = "http://sapi.caretas.club/"
page_url = "https://sucha.caretas.club/"
class SuchaSubtitle(Subtitle):
provider_name = "sucha"
hash_verifiable = False
def __init__(
2020-10-12 03:40:07 +08:00
self,
language,
page_link,
filename,
guessit_dict,
download_link,
hearing_impaired,
matches,
2020-10-01 01:39:25 +08:00
):
super(SuchaSubtitle, self).__init__(
language, hearing_impaired=hearing_impaired, page_link=page_url
)
self.download_link = download_link
self.referer = page_link
2020-10-12 03:40:07 +08:00
self.guessit = guessit_dict
2020-10-01 01:39:25 +08:00
self.language = language
self.release_info = filename
self.filename = filename
self.found_matches = matches
@property
def id(self):
return self.download_link
def get_matches(self, video):
2020-10-12 03:40:07 +08:00
if (
video.release_group
and str(video.release_group).lower() in self.filename.lower()
):
self.found_matches.add("release_group")
2020-10-02 02:29:16 +08:00
2020-10-12 03:40:07 +08:00
if video.source and video.source.lower() in self.guessit["source"].lower():
2020-10-02 02:29:16 +08:00
self.found_matches.add("source")
2020-10-12 03:40:07 +08:00
if (
video.resolution
and video.resolution.lower() in self.guessit["resolution"].lower()
):
self.found_matches.add("resolution")
if (
video.audio_codec
and video.audio_codec.lower() in self.guessit["audio_codec"].lower()
):
self.found_matches.add("audio_codec")
if (
video.video_codec
and video.video_codec.lower() in self.guessit["video_codec"].lower()
):
self.found_matches.add("video_codec")
2020-10-01 01:39:25 +08:00
return self.found_matches
class SuchaProvider(Provider):
"""Sucha Provider"""
languages = {Language.fromalpha2(l) for l in ["es"]}
language_list = list(languages)
logger.debug(languages)
video_types = (Episode, Movie)
def initialize(self):
self.session = Session()
self.session.headers = {
"User-Agent": os.environ.get("SZ_USER_AGENT", "Sub-Zero/2")
}
def terminate(self):
self.session.close()
def query(self, languages, video):
movie_year = video.year if video.year else None
is_episode = True if isinstance(video, Episode) else False
imdb_id = video.imdb_id if video.imdb_id else None
language = self.language_list[0]
if is_episode:
q = {
"query": "{} S{:02}E{:02}".format(
video.series, video.season, video.episode
)
}
else:
if imdb_id:
q = {"query": imdb_id}
else:
q = {"query": video.title, "year": movie_year}
logger.debug("Searching subtitles: {}".format(q["query"]))
res = self.session.get(server_url + "search", params=q, timeout=10)
res.raise_for_status()
result = res.json()
try:
subtitles = []
for i in result["results"]:
matches = set()
2020-10-02 02:29:16 +08:00
# We use 'in' instead of '==' since Subdivx titles are
# irregular
2020-10-01 01:39:25 +08:00
if video.title.lower() in i["title"].lower():
matches.add("title")
if is_episode:
2020-10-02 02:29:16 +08:00
if q["query"].lower() in i["title"].lower():
2020-10-01 01:39:25 +08:00
matches.add("title")
matches.add("series")
2020-10-12 03:40:07 +08:00
matches.add("imdb_id")
2020-10-01 01:39:25 +08:00
matches.add("season")
matches.add("episode")
matches.add("year")
if i["year"] == video.year:
matches.add("year")
if imdb_id:
matches.add("imdb_id")
2020-10-12 03:40:07 +08:00
# We'll add release group info (if found) to the pseudo filename
# in order to show it in the manual search
filename = i["pseudo_file"]
if (
video.release_group
and str(video.release_group).lower() in i["original_description"]
):
filename = i["pseudo_file"].replace(
".es.srt", "-" + str(video.release_group) + ".es.srt"
)
2020-10-01 01:39:25 +08:00
subtitles.append(
SuchaSubtitle(
language,
i["referer"],
2020-10-12 03:40:07 +08:00
filename,
i["guessit"],
2020-10-01 01:39:25 +08:00
i["download_url"],
i["hearing_impaired"],
matches,
)
)
return subtitles
except KeyError:
logger.debug("No subtitles found")
return []
def list_subtitles(self, video, languages):
return self.query(languages, video)
def _check_response(self, response):
if response.status_code != 200:
raise ServiceUnavailable("Bad status code: " + str(response.status_code))
def _get_archive(self, content):
archive_stream = io.BytesIO(content)
if rarfile.is_rarfile(archive_stream):
logger.debug("Identified rar archive")
archive = rarfile.RarFile(archive_stream)
elif zipfile.is_zipfile(archive_stream):
logger.debug("Identified zip archive")
archive = zipfile.ZipFile(archive_stream)
else:
raise APIThrottled("Unsupported compressed format")
return archive
def get_file(self, archive):
for name in archive.namelist():
if os.path.split(name)[-1].startswith("."):
continue
if not name.lower().endswith(SUBTITLE_EXTENSIONS):
continue
if (
"[eng]" in name.lower()
or ".en." in name.lower()
or ".eng." in name.lower()
):
continue
logger.debug("Returning from archive: {}".format(name))
return archive.read(name)
raise APIThrottled("Can not find the subtitle in the compressed file")
def download_subtitle(self, subtitle):
logger.info("Downloading subtitle %r", subtitle)
response = self.session.get(
subtitle.download_link, headers={"Referer": subtitle.page_link}, timeout=10
)
response.raise_for_status()
self._check_response(response)
archive = self._get_archive(response.content)
subtitle_file = self.get_file(archive)
subtitle.content = fix_line_ending(subtitle_file)