mirror of
https://github.com/clinton-hall/nzbToMedia.git
synced 2025-01-24 20:03:03 -08:00
f05b09f349
Updates rarfile to 3.1 Updates stevedore to 3.5.0 Updates appdirs to 1.4.4 Updates click to 8.1.3 Updates decorator to 5.1.1 Updates dogpile.cache to 1.1.8 Updates pbr to 5.11.0 Updates pysrt to 1.1.2 Updates pytz to 2022.6 Adds importlib-metadata version 3.1.1 Adds typing-extensions version 4.1.1 Adds zipp version 3.11.0
179 lines
6.3 KiB
Python
179 lines
6.3 KiB
Python
# -*- coding: utf-8 -*-
|
|
import io
|
|
import logging
|
|
import re
|
|
|
|
from babelfish import Language, language_converters
|
|
from guessit import guessit
|
|
try:
|
|
from lxml import etree
|
|
except ImportError:
|
|
try:
|
|
import xml.etree.cElementTree as etree
|
|
except ImportError:
|
|
import xml.etree.ElementTree as etree
|
|
from requests import Session
|
|
from zipfile import ZipFile
|
|
|
|
from . import Provider
|
|
from ..exceptions import ProviderError
|
|
from ..matches import guess_matches
|
|
from ..subtitle import Subtitle, fix_line_ending
|
|
from ..video import Episode
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
class PodnapisiSubtitle(Subtitle):
|
|
"""Podnapisi Subtitle."""
|
|
provider_name = 'podnapisi'
|
|
|
|
def __init__(self, language, hearing_impaired, page_link, pid, releases, title, season=None, episode=None,
|
|
year=None):
|
|
super(PodnapisiSubtitle, self).__init__(language, hearing_impaired=hearing_impaired, page_link=page_link)
|
|
self.pid = pid
|
|
self.releases = releases
|
|
self.title = title
|
|
self.season = season
|
|
self.episode = episode
|
|
self.year = year
|
|
|
|
@property
|
|
def id(self):
|
|
return self.pid
|
|
|
|
@property
|
|
def info(self):
|
|
return ' '.join(self.releases) or self.pid
|
|
|
|
def get_matches(self, video):
|
|
matches = guess_matches(video, {
|
|
'title': self.title,
|
|
'year': self.year,
|
|
'season': self.season,
|
|
'episode': self.episode
|
|
})
|
|
|
|
video_type = 'episode' if isinstance(video, Episode) else 'movie'
|
|
for release in self.releases:
|
|
matches |= guess_matches(video, guessit(release, {'type': video_type}))
|
|
|
|
return matches
|
|
|
|
|
|
class PodnapisiProvider(Provider):
|
|
"""Podnapisi Provider."""
|
|
languages = ({Language('por', 'BR'), Language('srp', script='Latn')} |
|
|
{Language.fromalpha2(l) for l in language_converters['alpha2'].codes})
|
|
server_url = 'https://www.podnapisi.net/subtitles/'
|
|
subtitle_class = PodnapisiSubtitle
|
|
|
|
def __init__(self):
|
|
self.session = None
|
|
|
|
def initialize(self):
|
|
self.session = Session()
|
|
self.session.headers['User-Agent'] = self.user_agent
|
|
|
|
def terminate(self):
|
|
self.session.close()
|
|
|
|
def query(self, language, keyword, season=None, episode=None, year=None):
|
|
# set parameters, see http://www.podnapisi.net/forum/viewtopic.php?f=62&t=26164#p212652
|
|
params = {'sXML': 1, 'sL': str(language), 'sK': keyword}
|
|
is_episode = False
|
|
if season and episode:
|
|
is_episode = True
|
|
params['sTS'] = season
|
|
params['sTE'] = episode
|
|
if year:
|
|
params['sY'] = year
|
|
|
|
# loop over paginated results
|
|
logger.info('Searching subtitles %r', params)
|
|
subtitles = []
|
|
pids = set()
|
|
while True:
|
|
# query the server
|
|
r = self.session.get(self.server_url + 'search/old', params=params, timeout=10)
|
|
r.raise_for_status()
|
|
xml = etree.fromstring(r.content)
|
|
|
|
# exit if no results
|
|
if not int(xml.find('pagination/results').text):
|
|
logger.debug('No subtitles found')
|
|
break
|
|
|
|
# loop over subtitles
|
|
for subtitle_xml in xml.findall('subtitle'):
|
|
# read xml elements
|
|
pid = subtitle_xml.find('pid').text
|
|
# ignore duplicates, see http://www.podnapisi.net/forum/viewtopic.php?f=62&t=26164&start=10#p213321
|
|
if pid in pids:
|
|
continue
|
|
|
|
language = Language.fromietf(subtitle_xml.find('language').text)
|
|
hearing_impaired = 'n' in (subtitle_xml.find('flags').text or '')
|
|
page_link = subtitle_xml.find('url').text
|
|
releases = []
|
|
if subtitle_xml.find('release').text:
|
|
for release in subtitle_xml.find('release').text.split():
|
|
release = re.sub(r'\.+$', '', release) # remove trailing dots
|
|
release = ''.join(filter(lambda x: ord(x) < 128, release)) # remove non-ascii characters
|
|
releases.append(release)
|
|
title = subtitle_xml.find('title').text
|
|
season = int(subtitle_xml.find('tvSeason').text)
|
|
episode = int(subtitle_xml.find('tvEpisode').text)
|
|
year = int(subtitle_xml.find('year').text)
|
|
|
|
if is_episode:
|
|
subtitle = self.subtitle_class(language, hearing_impaired, page_link, pid, releases, title,
|
|
season=season, episode=episode, year=year)
|
|
else:
|
|
subtitle = self.subtitle_class(language, hearing_impaired, page_link, pid, releases, title,
|
|
year=year)
|
|
|
|
logger.debug('Found subtitle %r', subtitle)
|
|
subtitles.append(subtitle)
|
|
pids.add(pid)
|
|
|
|
# stop on last page
|
|
if int(xml.find('pagination/current').text) >= int(xml.find('pagination/count').text):
|
|
break
|
|
|
|
# increment current page
|
|
params['page'] = int(xml.find('pagination/current').text) + 1
|
|
logger.debug('Getting page %d', params['page'])
|
|
|
|
return subtitles
|
|
|
|
def list_subtitles(self, video, languages):
|
|
season = episode = None
|
|
if isinstance(video, Episode):
|
|
titles = [video.series] + video.alternative_series
|
|
season = video.season
|
|
episode = video.episode
|
|
else:
|
|
titles = [video.title] + video.alternative_titles
|
|
|
|
for title in titles:
|
|
subtitles = [s for l in languages for s in
|
|
self.query(l, title, season=season, episode=episode, year=video.year)]
|
|
if subtitles:
|
|
return subtitles
|
|
|
|
return []
|
|
|
|
def download_subtitle(self, subtitle):
|
|
# download as a zip
|
|
logger.info('Downloading subtitle %r', subtitle)
|
|
r = self.session.get(self.server_url + subtitle.pid + '/download', params={'container': 'zip'}, timeout=10)
|
|
r.raise_for_status()
|
|
|
|
# open the zip
|
|
with ZipFile(io.BytesIO(r.content)) as zf:
|
|
if len(zf.namelist()) > 1:
|
|
raise ProviderError('More than one file to unzip')
|
|
|
|
subtitle.content = fix_line_ending(zf.read(zf.namelist()[0]))
|