mirror of https://github.com/morpheus65535/bazarr
update zimuku providers
This commit is contained in:
parent
209f22c6e2
commit
3173351590
|
@ -0,0 +1,27 @@
|
||||||
|
# -*- coding: utf-8 -*-
|
||||||
|
from __future__ import absolute_import
|
||||||
|
from babelfish import LanguageReverseConverter
|
||||||
|
from subliminal.exceptions import ConfigurationError
|
||||||
|
|
||||||
|
class zimukuConverter(LanguageReverseConverter):
|
||||||
|
def __init__(self):
|
||||||
|
self.from_zimuku = { u'简体': ('zho', 'CN', None), u'繁体': ('zho', 'TW', None),
|
||||||
|
u'簡體': ('zho', 'CN', None), u'繁體': ('zho', 'TW', None),
|
||||||
|
u'英文': ('eng',),
|
||||||
|
u'chs': ('zho', 'CN', None), u'cht': ('zho', 'TW', None),
|
||||||
|
u'chn': ('zho', 'CN', None), u'twn': ('zho', 'TW', None)}
|
||||||
|
self.to_zimuku = { ('zho', 'CN', None): u'chs', ('zho', 'TW', None): u'cht',
|
||||||
|
('eng', None, None) : u'eng', ('zho', None, None): u'chs'}
|
||||||
|
self.codes = set(self.from_zimuku.keys())
|
||||||
|
|
||||||
|
def convert(self, alpha3, country=None, script=None):
|
||||||
|
if (alpha3, country, script) in self.to_zimuku:
|
||||||
|
return self.to_zimuku[(alpha3, country, script)]
|
||||||
|
|
||||||
|
raise ConfigurationError('Unsupported language for zimuku: %s, %s, %s' % (alpha3, country, script))
|
||||||
|
|
||||||
|
def reverse(self, zimuku):
|
||||||
|
if zimuku in self.from_zimuku:
|
||||||
|
return self.from_zimuku[zimuku]
|
||||||
|
|
||||||
|
raise ConfigurationError('Unsupported language code for zimuku: %s' % zimuku)
|
|
@ -637,8 +637,8 @@ def _search_external_subtitles(path, languages=None, only_one=False, scandir_gen
|
||||||
hi = any(i for i in hi_tag if i in adv_tag)
|
hi = any(i for i in hi_tag if i in adv_tag)
|
||||||
|
|
||||||
#add simplified/traditional chinese detection
|
#add simplified/traditional chinese detection
|
||||||
simplified_chinese = ["chs", "sc", "zhs", "hans","zh-hans", "gb", "简", "简中", "简体", "简体中文", "中英双语", "中日双语","中法双语"]
|
simplified_chinese = ["chs", "sc", "zhs", "hans","zh-hans", "gb", "简", "简中", "简体", "简体中文", "中英双语", "中日双语","中法双语","简体&英文"]
|
||||||
traditional_chinese = ["cht", "tc", "zht", "hant","zh-hant", "big5", "繁", "繁中", "繁体", "繁體","繁体中文", "繁體中文", "正體中文", "中英雙語", "中日雙語","中法雙語"]
|
traditional_chinese = ["cht", "tc", "zht", "hant","zh-hant", "big5", "繁", "繁中", "繁体", "繁體","繁体中文", "繁體中文", "正體中文", "中英雙語", "中日雙語","中法雙語","繁体&英文"]
|
||||||
FULL_LANGUAGE_LIST.extend(simplified_chinese)
|
FULL_LANGUAGE_LIST.extend(simplified_chinese)
|
||||||
FULL_LANGUAGE_LIST.extend(traditional_chinese)
|
FULL_LANGUAGE_LIST.extend(traditional_chinese)
|
||||||
p_root = p_root.replace('zh-TW', 'zht')
|
p_root = p_root.replace('zh-TW', 'zht')
|
||||||
|
|
|
@ -13,23 +13,30 @@ except ImportError:
|
||||||
from urllib.parse import urljoin
|
from urllib.parse import urljoin
|
||||||
|
|
||||||
import rarfile
|
import rarfile
|
||||||
|
from babelfish import language_converters
|
||||||
from subzero.language import Language
|
from subzero.language import Language
|
||||||
from guessit import guessit
|
from guessit import guessit
|
||||||
from requests import Session
|
from requests import Session
|
||||||
from six import text_type
|
from six import text_type
|
||||||
|
|
||||||
from subliminal import __short_version__
|
from subliminal import __short_version__
|
||||||
from subliminal.providers import ParserBeautifulSoup, Provider
|
from subliminal.providers import ParserBeautifulSoup
|
||||||
|
from subliminal_patch.providers import Provider
|
||||||
from subliminal.subtitle import (
|
from subliminal.subtitle import (
|
||||||
SUBTITLE_EXTENSIONS,
|
SUBTITLE_EXTENSIONS,
|
||||||
|
fix_line_ending
|
||||||
|
)
|
||||||
|
from subliminal_patch.subtitle import (
|
||||||
Subtitle,
|
Subtitle,
|
||||||
fix_line_ending,
|
guess_matches
|
||||||
guess_matches,
|
|
||||||
)
|
)
|
||||||
from subliminal.video import Episode, Movie
|
from subliminal.video import Episode, Movie
|
||||||
|
|
||||||
logger = logging.getLogger(__name__)
|
logger = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
language_converters.register('zimuku = subliminal_patch.converters.zimuku:zimukuConverter')
|
||||||
|
|
||||||
|
supported_languages = list(language_converters['zimuku'].to_zimuku.keys())
|
||||||
|
|
||||||
class ZimukuSubtitle(Subtitle):
|
class ZimukuSubtitle(Subtitle):
|
||||||
"""Zimuku Subtitle."""
|
"""Zimuku Subtitle."""
|
||||||
|
@ -77,7 +84,8 @@ class ZimukuSubtitle(Subtitle):
|
||||||
class ZimukuProvider(Provider):
|
class ZimukuProvider(Provider):
|
||||||
"""Zimuku Provider."""
|
"""Zimuku Provider."""
|
||||||
|
|
||||||
languages = {Language(l) for l in ["zho", "eng"]}
|
languages = {Language(*l) for l in supported_languages}
|
||||||
|
logger.info(str(supported_languages))
|
||||||
|
|
||||||
server_url = "http://www.zimuku.la"
|
server_url = "http://www.zimuku.la"
|
||||||
search_url = "/search?q={}"
|
search_url = "/search?q={}"
|
||||||
|
@ -114,11 +122,18 @@ class ZimukuProvider(Provider):
|
||||||
language = Language("eng")
|
language = Language("eng")
|
||||||
for img in sub.find("td", class_="tac lang").find_all("img"):
|
for img in sub.find("td", class_="tac lang").find_all("img"):
|
||||||
if (
|
if (
|
||||||
"hongkong" in img.attrs["src"]
|
"china" in img.attrs["src"]
|
||||||
or "china" in img.attrs["src"]
|
and "hongkong" in img.attrs["src"]
|
||||||
|
):
|
||||||
|
language = Language("zho").add(Language('zho', 'TW', None))
|
||||||
|
logger.debug("language:"+str(language))
|
||||||
|
elif (
|
||||||
|
"china" in img.attrs["src"]
|
||||||
or "jollyroger" in img.attrs["src"]
|
or "jollyroger" in img.attrs["src"]
|
||||||
):
|
):
|
||||||
language = Language("zho")
|
language = Language("zho")
|
||||||
|
elif "hongkong" in img.attrs["src"]:
|
||||||
|
language = Language('zho', 'TW', None)
|
||||||
break
|
break
|
||||||
sub_page_link = urljoin(self.server_url, a.attrs["href"])
|
sub_page_link = urljoin(self.server_url, a.attrs["href"])
|
||||||
backup_session = copy.deepcopy(self.session)
|
backup_session = copy.deepcopy(self.session)
|
||||||
|
@ -189,7 +204,7 @@ class ZimukuProvider(Provider):
|
||||||
new_subs = self._parse_episode_page(episode_link, subs_year)
|
new_subs = self._parse_episode_page(episode_link, subs_year)
|
||||||
subtitles += new_subs
|
subtitles += new_subs
|
||||||
|
|
||||||
# NOTE: shooter result pages are ignored due to the existence of assrt provider
|
# NOTE: shooter result pages are ignored due to the existence of zimuku provider
|
||||||
|
|
||||||
return subtitles
|
return subtitles
|
||||||
|
|
||||||
|
@ -305,15 +320,15 @@ def _get_subtitle_from_archive(archive):
|
||||||
if not subname.lower().endswith(SUBTITLE_EXTENSIONS):
|
if not subname.lower().endswith(SUBTITLE_EXTENSIONS):
|
||||||
continue
|
continue
|
||||||
|
|
||||||
# prefer ass/ssa subtitles with double languages or simplified chinese
|
# prefer ass/ssa/srt subtitles with double languages or simplified/traditional chinese
|
||||||
score = ("ass" in subname or "ssa" in subname) * 1
|
score = ("ass" in subname or "ssa" in subname or "srt" in subname) * 1
|
||||||
if "简体" in subname or "chs" in subname or ".gb." in subname:
|
if "简体" in subname or "chs" in subname or ".gb." in subname:
|
||||||
score += 2
|
score += 2
|
||||||
if "繁体" in subname or "cht" in subname or ".big5." in subname:
|
if "繁体" in subname or "cht" in subname or ".big5." in subname:
|
||||||
pass
|
|
||||||
if "chs.eng" in subname or "chs&eng" in subname:
|
|
||||||
score += 2
|
score += 2
|
||||||
if "中英" in subname or "简英" in subname or "双语" in subname or "简体&英文" in subname:
|
if "chs.eng" in subname or "chs&eng" in subname or "cht.eng" in subname or "cht&eng" in subname:
|
||||||
|
score += 2
|
||||||
|
if "中英" in subname or "简英" in subname or "繁英" in subname or "双语" in subname or "简体&英文" in subname or "繁体&英文" in subname:
|
||||||
score += 4
|
score += 4
|
||||||
logger.debug("subtitle {}, score: {}".format(subname, score))
|
logger.debug("subtitle {}, score: {}".format(subname, score))
|
||||||
if score > max_score:
|
if score > max_score:
|
||||||
|
@ -374,4 +389,4 @@ def num_to_cn(number):
|
||||||
else:
|
else:
|
||||||
part1 = "十" if number[0] == "1" else trans_map[number[0]] + "十"
|
part1 = "十" if number[0] == "1" else trans_map[number[0]] + "十"
|
||||||
part2 = trans_map[number[1]] if number[1] != "0" else ""
|
part2 = trans_map[number[1]] if number[1] != "0" else ""
|
||||||
return part1 + part2
|
return part1 + part2
|
Loading…
Reference in New Issue