|
| 1 | +# -*- coding: utf-8 -*- |
| 2 | +from __future__ import absolute_import |
| 3 | +import requests |
| 4 | +from ..utilities import log as _log |
| 5 | + |
| 6 | +import six |
| 7 | + |
| 8 | + |
# One module-wide HTTP session, created at import time; geturl() issues all
# of its requests through it.
ses = requests.Session()
| 10 | + |
# Language lookup table. Each row is a 6-tuple:
#   [0] display name  - matched exactly by get_language_info()
#   [1] numeric id (string) - not used in this module; presumably a
#       site-specific language id, TODO confirm
#   [2] short code    - returned by get_language_info() as '2et'
#   [3] three-letter code - returned by get_language_info() as '3et'
#   [4] index (string) - not used in this module; TODO confirm meaning
#   [5] integer id    - not used in this module; presumably a localized
#       string id, TODO confirm
# Rows after "Vietnamese" are alternative spellings of languages that
# already appear above; get_language_info() returns the first row whose
# name matches, so order matters only for identical names.
# NOTE(review): the "Belarusian" row carries the codes "hy"/"arm", which are
# the codes for Armenian - confirm which language this row should describe.
LANGUAGES = (
    ("Albanian", "29", "sq", "alb", "0", 30201),
    ("Arabic", "12", "ar", "ara", "1", 30202),
    ("Belarusian", "0", "hy", "arm", "2", 30203),
    ("Bosnian", "10", "bs", "bos", "3", 30204),
    ("Bulgarian", "33", "bg", "bul", "4", 30205),
    ("Catalan", "53", "ca", "cat", "5", 30206),
    ("Chinese", "17", "zh", "chi", "6", 30207),
    ("Croatian", "38", "hr", "hrv", "7", 30208),
    ("Czech", "7", "cs", "cze", "8", 30209),
    ("Danish", "24", "da", "dan", "9", 30210),
    ("Dutch", "23", "nl", "dut", "10", 30211),
    ("English", "2", "en", "eng", "11", 30212),
    ("Estonian", "20", "et", "est", "12", 30213),
    ("Persian", "52", "fa", "per", "13", 30247),
    ("Finnish", "31", "fi", "fin", "14", 30214),
    ("French", "8", "fr", "fre", "15", 30215),
    ("German", "5", "de", "ger", "16", 30216),
    ("Greek", "16", "el", "ell", "17", 30217),
    ("Hebrew", "22", "he", "heb", "18", 30218),
    ("Hindi", "42", "hi", "hin", "19", 30219),
    ("Hungarian", "15", "hu", "hun", "20", 30220),
    ("Icelandic", "6", "is", "ice", "21", 30221),
    ("Indonesian", "0", "id", "ind", "22", 30222),
    ("Italian", "9", "it", "ita", "23", 30224),
    ("Japanese", "11", "ja", "jpn", "24", 30225),
    ("Korean", "4", "ko", "kor", "25", 30226),
    ("Latvian", "21", "lv", "lav", "26", 30227),
    ("Lithuanian", "0", "lt", "lit", "27", 30228),
    ("Macedonian", "35", "mk", "mac", "28", 30229),
    ("Malay", "0", "ms", "may", "29", 30248),
    ("Norwegian", "3", "no", "nor", "30", 30230),
    ("Polish", "26", "pl", "pol", "31", 30232),
    ("Portuguese", "32", "pt", "por", "32", 30233),
    ("PortugueseBrazil", "48", "pb", "pob", "33", 30234),
    ("Romanian", "13", "ro", "rum", "34", 30235),
    ("Russian", "27", "ru", "rus", "35", 30236),
    ("Serbian", "36", "sr", "scc", "36", 30237),
    ("Slovak", "37", "sk", "slo", "37", 30238),
    ("Slovenian", "1", "sl", "slv", "38", 30239),
    ("Spanish", "28", "es", "spa", "39", 30240),
    ("Swedish", "25", "sv", "swe", "40", 30242),
    ("Thai", "0", "th", "tha", "41", 30243),
    ("Turkish", "30", "tr", "tur", "42", 30244),
    ("Ukrainian", "46", "uk", "ukr", "43", 30245),
    ("Vietnamese", "51", "vi", "vie", "44", 30246),
    ("BosnianLatin", "10", "bs", "bos", "100", 30204),
    ("Farsi", "52", "fa", "per", "13", 30247),
    ("English (US)", "2", "en", "eng", "100", 30212),
    ("English (UK)", "2", "en", "eng", "100", 30212),
    ("Portuguese (Brazilian)", "48", "pt-br", "pob", "100", 30234),
    ("Portuguese (Brazil)", "48", "pb", "pob", "33", 30234),
    ("Portuguese-BR", "48", "pb", "pob", "33", 30234),
    ("Brazilian", "48", "pb", "pob", "33", 30234),
    ("Español (Latinoamérica)", "28", "es", "spa", "100", 30240),
    ("Español (España)", "28", "es", "spa", "100", 30240),
    ("Spanish (Latin America)", "28", "es", "spa", "100", 30240),
    ("Español", "28", "es", "spa", "100", 30240),
    ("SerbianLatin", "36", "sr", "scc", "100", 30237),
    ("Spanish (Spain)", "28", "es", "spa", "100", 30240),
    ("Chinese (Traditional)", "17", "zh", "chi", "100", 30207),
    ("Chinese (Simplified)", "17", "zh", "chi", "100", 30207),
)
| 73 | + |
# Alias table consulted by get_language_info(): a name found as a key here
# is replaced by the mapped value before the LANGUAGES lookup. The keys are
# matched verbatim, so the unusual spellings ('Brazillian', 'Ukranian') are
# part of the data and must not be "corrected".
opensubtitles2_languages = {
    'Chinese BG code': 'Chinese',
    'Brazillian Portuguese': 'Portuguese (Brazil)',
    'Serbian': 'SerbianLatin',
    'Ukranian': 'Ukrainian',
    'Farsi/Persian': 'Persian',
}
| 81 | + |
| 82 | + |
def get_language_info(language):
    """Look up the codes for a language name.

    The name is first translated through ``opensubtitles2_languages`` (names
    that are not aliases are used unchanged) and then compared, exactly and
    case-sensitively, against column 0 of each ``LANGUAGES`` row.

    :param language: language name to look up.
    :return: ``{'name': ..., '2et': ..., '3et': ...}`` built from columns
        0, 2 and 3 of the first matching row, or ``None`` when no row has
        that name.
    """
    wanted = opensubtitles2_languages.get(language, language)
    matches = (
        {'name': row[0], '2et': row[2], '3et': row[3]}
        for row in LANGUAGES
        if row[0] == wanted
    )
    # The generator is lazy, so this stops at the first matching row.
    return next(matches, None)
| 90 | + |
| 91 | + |
def log(module, msg):
    """Send ``msg`` to the shared logger on behalf of ``module``.

    The message is encoded to UTF-8 before it is handed to the imported
    ``_log`` helper, so ``msg`` must provide ``.encode``.

    NOTE(review): on Python 3 this hands ``bytes`` to ``_log`` - confirm
    that the helper expects that.

    :param module: passed through unchanged as the first argument of ``_log``.
    :param msg: text to log.
    """
    payload = msg.encode('utf-8')
    _log(module, payload)
| 94 | + |
| 95 | + |
def geturl(url1, headers=None, params=None):
    """Fetch ``url1`` through the shared session and return the body as text.

    :param url1: URL to request with HTTP GET.
    :param headers: optional mapping of request headers.
    :param params: optional query-string parameters; forwarded to the
        request (they were previously accepted but silently dropped).
    :return: the response body as a native ``str`` when the status code is
        200; an empty string for any other status or for any
        ``requests`` error (connection failure, timeout, HTTP error).
    """
    try:
        # NOTE(review): verify=False turns off TLS certificate checking, so
        # responses can be spoofed by a man-in-the-middle. Kept as-is because
        # callers may rely on it; enable verification if the targets allow.
        res = ses.get(
            url1,
            headers=headers,
            params=params,
            verify=False,
            timeout=5,
        )
        print('res.status_code', res.status_code)
        if res.status_code == 200:
            # Undecodable bytes are replaced instead of raising
            # UnicodeDecodeError, which the handler below would not catch.
            return six.ensure_str(res.content, errors='replace')
        # Raises HTTPError (a RequestException) for 4xx/5xx responses and
        # returns None otherwise, so there is no value worth capturing.
        res.raise_for_status()
        print(('Download error', 'unexpected status %s' % res.status_code))
        return ''
    except requests.exceptions.RequestException as e:
        print(('Download error', str(e)))
        return ''
0 commit comments