2018-03-24 07:59:59 +08:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
import io
|
|
|
|
import logging
|
|
|
|
import re
|
|
|
|
|
|
|
|
from babelfish import Language, language_converters
|
|
|
|
from guessit import guessit
|
|
|
|
try:
|
|
|
|
from lxml import etree
|
|
|
|
except ImportError:
|
|
|
|
try:
|
|
|
|
import xml.etree.cElementTree as etree
|
|
|
|
except ImportError:
|
|
|
|
import xml.etree.ElementTree as etree
|
|
|
|
from requests import Session
|
|
|
|
from zipfile import ZipFile
|
|
|
|
|
|
|
|
from . import Provider
|
|
|
|
from .. import __short_version__
|
|
|
|
from ..exceptions import ProviderError
|
|
|
|
from ..subtitle import Subtitle, fix_line_ending, guess_matches
|
|
|
|
from ..utils import sanitize
|
|
|
|
from ..video import Episode, Movie
|
|
|
|
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
|
|
|
class PodnapisiSubtitle(Subtitle):
|
|
|
|
"""Podnapisi Subtitle."""
|
|
|
|
provider_name = 'podnapisi'
|
|
|
|
|
|
|
|
def __init__(self, language, hearing_impaired, page_link, pid, releases, title, season=None, episode=None,
|
|
|
|
year=None):
|
2018-04-23 20:36:17 +08:00
|
|
|
super(PodnapisiSubtitle, self).__init__(language, hearing_impaired=hearing_impaired, page_link=page_link)
|
2018-03-24 07:59:59 +08:00
|
|
|
self.pid = pid
|
|
|
|
self.releases = releases
|
|
|
|
self.title = title
|
|
|
|
self.season = season
|
|
|
|
self.episode = episode
|
|
|
|
self.year = year
|
|
|
|
|
|
|
|
@property
|
|
|
|
def id(self):
|
|
|
|
return self.pid
|
|
|
|
|
|
|
|
def get_matches(self, video):
|
|
|
|
matches = set()
|
|
|
|
|
|
|
|
# episode
|
|
|
|
if isinstance(video, Episode):
|
|
|
|
# series
|
2018-04-23 20:36:17 +08:00
|
|
|
if video.series and (sanitize(self.title) in (
|
|
|
|
sanitize(name) for name in [video.series] + video.alternative_series)):
|
2018-03-24 07:59:59 +08:00
|
|
|
matches.add('series')
|
|
|
|
# year
|
|
|
|
if video.original_series and self.year is None or video.year and video.year == self.year:
|
|
|
|
matches.add('year')
|
|
|
|
# season
|
|
|
|
if video.season and self.season == video.season:
|
|
|
|
matches.add('season')
|
|
|
|
# episode
|
|
|
|
if video.episode and self.episode == video.episode:
|
|
|
|
matches.add('episode')
|
|
|
|
# guess
|
|
|
|
for release in self.releases:
|
|
|
|
matches |= guess_matches(video, guessit(release, {'type': 'episode'}))
|
|
|
|
# movie
|
|
|
|
elif isinstance(video, Movie):
|
|
|
|
# title
|
2018-04-23 20:36:17 +08:00
|
|
|
if video.title and (sanitize(self.title) in (
|
|
|
|
sanitize(name) for name in [video.title] + video.alternative_titles)):
|
2018-03-24 07:59:59 +08:00
|
|
|
matches.add('title')
|
|
|
|
# year
|
|
|
|
if video.year and self.year == video.year:
|
|
|
|
matches.add('year')
|
|
|
|
# guess
|
|
|
|
for release in self.releases:
|
|
|
|
matches |= guess_matches(video, guessit(release, {'type': 'movie'}))
|
|
|
|
|
|
|
|
return matches
|
|
|
|
|
|
|
|
|
|
|
|
class PodnapisiProvider(Provider):
|
|
|
|
"""Podnapisi Provider."""
|
|
|
|
languages = ({Language('por', 'BR'), Language('srp', script='Latn')} |
|
|
|
|
{Language.fromalpha2(l) for l in language_converters['alpha2'].codes})
|
2018-04-23 20:36:17 +08:00
|
|
|
server_url = 'https://www.podnapisi.net/subtitles/'
|
|
|
|
subtitle_class = PodnapisiSubtitle
|
|
|
|
|
|
|
|
def __init__(self):
|
|
|
|
self.session = None
|
2018-03-24 07:59:59 +08:00
|
|
|
|
|
|
|
def initialize(self):
|
|
|
|
self.session = Session()
|
|
|
|
self.session.headers['User-Agent'] = 'Subliminal/%s' % __short_version__
|
|
|
|
|
|
|
|
def terminate(self):
|
|
|
|
self.session.close()
|
|
|
|
|
|
|
|
def query(self, language, keyword, season=None, episode=None, year=None):
|
|
|
|
# set parameters, see http://www.podnapisi.net/forum/viewtopic.php?f=62&t=26164#p212652
|
|
|
|
params = {'sXML': 1, 'sL': str(language), 'sK': keyword}
|
|
|
|
is_episode = False
|
|
|
|
if season and episode:
|
|
|
|
is_episode = True
|
|
|
|
params['sTS'] = season
|
|
|
|
params['sTE'] = episode
|
|
|
|
if year:
|
|
|
|
params['sY'] = year
|
|
|
|
|
|
|
|
# loop over paginated results
|
|
|
|
logger.info('Searching subtitles %r', params)
|
|
|
|
subtitles = []
|
|
|
|
pids = set()
|
|
|
|
while True:
|
|
|
|
# query the server
|
2018-04-23 20:36:17 +08:00
|
|
|
r = self.session.get(self.server_url + 'search/old', params=params, timeout=10)
|
|
|
|
r.raise_for_status()
|
|
|
|
xml = etree.fromstring(r.content)
|
2018-03-24 07:59:59 +08:00
|
|
|
|
|
|
|
# exit if no results
|
|
|
|
if not int(xml.find('pagination/results').text):
|
|
|
|
logger.debug('No subtitles found')
|
|
|
|
break
|
|
|
|
|
|
|
|
# loop over subtitles
|
|
|
|
for subtitle_xml in xml.findall('subtitle'):
|
|
|
|
# read xml elements
|
2018-04-23 20:36:17 +08:00
|
|
|
pid = subtitle_xml.find('pid').text
|
|
|
|
# ignore duplicates, see http://www.podnapisi.net/forum/viewtopic.php?f=62&t=26164&start=10#p213321
|
|
|
|
if pid in pids:
|
|
|
|
continue
|
|
|
|
|
2018-03-24 07:59:59 +08:00
|
|
|
language = Language.fromietf(subtitle_xml.find('language').text)
|
|
|
|
hearing_impaired = 'n' in (subtitle_xml.find('flags').text or '')
|
|
|
|
page_link = subtitle_xml.find('url').text
|
|
|
|
releases = []
|
|
|
|
if subtitle_xml.find('release').text:
|
|
|
|
for release in subtitle_xml.find('release').text.split():
|
|
|
|
release = re.sub(r'\.+$', '', release) # remove trailing dots
|
|
|
|
release = ''.join(filter(lambda x: ord(x) < 128, release)) # remove non-ascii characters
|
|
|
|
releases.append(release)
|
|
|
|
title = subtitle_xml.find('title').text
|
|
|
|
season = int(subtitle_xml.find('tvSeason').text)
|
|
|
|
episode = int(subtitle_xml.find('tvEpisode').text)
|
|
|
|
year = int(subtitle_xml.find('year').text)
|
|
|
|
|
|
|
|
if is_episode:
|
2018-04-23 20:36:17 +08:00
|
|
|
subtitle = self.subtitle_class(language, hearing_impaired, page_link, pid, releases, title,
|
|
|
|
season=season, episode=episode, year=year)
|
2018-03-24 07:59:59 +08:00
|
|
|
else:
|
2018-04-23 20:36:17 +08:00
|
|
|
subtitle = self.subtitle_class(language, hearing_impaired, page_link, pid, releases, title,
|
|
|
|
year=year)
|
2018-03-24 07:59:59 +08:00
|
|
|
|
|
|
|
logger.debug('Found subtitle %r', subtitle)
|
|
|
|
subtitles.append(subtitle)
|
|
|
|
pids.add(pid)
|
|
|
|
|
|
|
|
# stop on last page
|
|
|
|
if int(xml.find('pagination/current').text) >= int(xml.find('pagination/count').text):
|
|
|
|
break
|
|
|
|
|
|
|
|
# increment current page
|
|
|
|
params['page'] = int(xml.find('pagination/current').text) + 1
|
|
|
|
logger.debug('Getting page %d', params['page'])
|
|
|
|
|
|
|
|
return subtitles
|
|
|
|
|
|
|
|
def list_subtitles(self, video, languages):
|
2018-04-23 20:36:17 +08:00
|
|
|
season = episode = None
|
2018-03-24 07:59:59 +08:00
|
|
|
if isinstance(video, Episode):
|
2018-04-23 20:36:17 +08:00
|
|
|
titles = [video.series] + video.alternative_series
|
|
|
|
season = video.season
|
|
|
|
episode = video.episode
|
|
|
|
else:
|
|
|
|
titles = [video.title] + video.alternative_titles
|
|
|
|
|
|
|
|
for title in titles:
|
|
|
|
subtitles = [s for l in languages for s in
|
|
|
|
self.query(l, title, season=season, episode=episode, year=video.year)]
|
|
|
|
if subtitles:
|
|
|
|
return subtitles
|
|
|
|
|
|
|
|
return []
|
2018-03-24 07:59:59 +08:00
|
|
|
|
|
|
|
def download_subtitle(self, subtitle):
|
|
|
|
# download as a zip
|
|
|
|
logger.info('Downloading subtitle %r', subtitle)
|
|
|
|
r = self.session.get(self.server_url + subtitle.pid + '/download', params={'container': 'zip'}, timeout=10)
|
|
|
|
r.raise_for_status()
|
|
|
|
|
|
|
|
# open the zip
|
|
|
|
with ZipFile(io.BytesIO(r.content)) as zf:
|
|
|
|
if len(zf.namelist()) > 1:
|
|
|
|
raise ProviderError('More than one file to unzip')
|
|
|
|
|
|
|
|
subtitle.content = fix_line_ending(zf.read(zf.namelist()[0]))
|