mirror of
https://github.com/ytdl-org/youtube-dl.git
synced 2024-11-16 14:27:53 +00:00
Compare commits
2 Commits
f102e3dc4e
...
a874871801
Author | SHA1 | Date | |
---|---|---|---|
|
a874871801 | ||
|
b7c25959f0 |
@ -1,8 +1,20 @@
|
|||||||
# coding: utf-8
|
# coding: utf-8
|
||||||
from __future__ import unicode_literals
|
from __future__ import unicode_literals
|
||||||
|
|
||||||
from .compat import compat_str
|
from .compat import (
|
||||||
|
compat_str,
|
||||||
|
compat_chr,
|
||||||
|
)
|
||||||
|
|
||||||
|
# Below is included the text of icu/CaseFolding.txt retrieved from
|
||||||
|
# https://github.com/unicode-org/icu/blob/main/icu4c/source/data/unidata/CaseFolding.txt
|
||||||
|
# In case newly foldable Unicode characters are defined, paste the new version
|
||||||
|
# of the text inside the ''' marks.
|
||||||
|
# The text is expected to have only blank lines andlines with 1st character #,
|
||||||
|
# all ignored, and fold definitions like this:
|
||||||
|
# `from_hex_code; space_separated_to_hex_code_list; comment`
|
||||||
|
|
||||||
|
_map_str = '''
|
||||||
# CaseFolding-15.0.0.txt
|
# CaseFolding-15.0.0.txt
|
||||||
# Date: 2022-02-02, 23:35:35 GMT
|
# Date: 2022-02-02, 23:35:35 GMT
|
||||||
# © 2022 Unicode®, Inc.
|
# © 2022 Unicode®, Inc.
|
||||||
@ -65,7 +77,6 @@ from .compat import compat_str
|
|||||||
# have the value C for the status field, and the code point itself for the mapping field.
|
# have the value C for the status field, and the code point itself for the mapping field.
|
||||||
|
|
||||||
# =================================================================
|
# =================================================================
|
||||||
_map_str = '''
|
|
||||||
0041; C; 0061; # LATIN CAPITAL LETTER A
|
0041; C; 0061; # LATIN CAPITAL LETTER A
|
||||||
0042; C; 0062; # LATIN CAPITAL LETTER B
|
0042; C; 0062; # LATIN CAPITAL LETTER B
|
||||||
0043; C; 0063; # LATIN CAPITAL LETTER C
|
0043; C; 0063; # LATIN CAPITAL LETTER C
|
||||||
@ -1627,17 +1638,22 @@ FF3A; C; FF5A; # FULLWIDTH LATIN CAPITAL LETTER Z
|
|||||||
1E920; C; 1E942; # ADLAM CAPITAL LETTER KPO
|
1E920; C; 1E942; # ADLAM CAPITAL LETTER KPO
|
||||||
1E921; C; 1E943; # ADLAM CAPITAL LETTER SHA
|
1E921; C; 1E943; # ADLAM CAPITAL LETTER SHA
|
||||||
'''
|
'''
|
||||||
|
|
||||||
|
_parse_unichr = lambda s: compat_chr(int(s, 16))
|
||||||
|
|
||||||
_map = dict(
|
_map = dict(
|
||||||
(unichr(int(from_, 16)), ''.join((unichr(int(v, 16)) for v in to_.split(' '))))
|
(_parse_unichr(from_), ''.join(map(_parse_unichr, to_.split(' '))))
|
||||||
for from_, type_, to_, _ in (
|
for from_, type_, to_, _ in (
|
||||||
l.split('; ', 3) for l in _map_str.splitlines() if l)
|
l.split('; ', 3) for l in _map_str.splitlines() if l and not l[0] == '#')
|
||||||
if type_ in ('C', 'F'))
|
if type_ in ('C', 'F'))
|
||||||
del _map_str
|
del _map_str
|
||||||
|
|
||||||
|
|
||||||
def casefold(s):
|
def casefold(s):
|
||||||
assert isinstance(s, compat_str)
|
assert isinstance(s, compat_str)
|
||||||
return ''.join((_map.get(c, c) for c in s))
|
return ''.join((_map.get(c, c) for c in s))
|
||||||
|
|
||||||
|
|
||||||
__all__ = [
|
__all__ = [
|
||||||
casefold
|
casefold
|
||||||
]
|
]
|
||||||
|
@ -21,6 +21,19 @@ import subprocess
|
|||||||
import sys
|
import sys
|
||||||
import xml.etree.ElementTree
|
import xml.etree.ElementTree
|
||||||
|
|
||||||
|
# deal with critical unicode/str things first
|
||||||
|
try:
|
||||||
|
# Python 2
|
||||||
|
compat_str, compat_basestring, compat_chr = (
|
||||||
|
unicode, basestring, unichr
|
||||||
|
)
|
||||||
|
from .casefold import casefold as compat_casefold
|
||||||
|
except NameError:
|
||||||
|
compat_str, compat_basestring, compat_chr = (
|
||||||
|
str, str, chr
|
||||||
|
)
|
||||||
|
compat_casefold = lambda s: s.casefold()
|
||||||
|
|
||||||
try:
|
try:
|
||||||
import collections.abc as compat_collections_abc
|
import collections.abc as compat_collections_abc
|
||||||
except ImportError:
|
except ImportError:
|
||||||
@ -2373,13 +2386,6 @@ try:
|
|||||||
except ImportError:
|
except ImportError:
|
||||||
import BaseHTTPServer as compat_http_server
|
import BaseHTTPServer as compat_http_server
|
||||||
|
|
||||||
try:
|
|
||||||
compat_str = unicode # Python 2
|
|
||||||
from .casefold import casefold as compat_casefold
|
|
||||||
except NameError:
|
|
||||||
compat_str = str
|
|
||||||
compat_casefold = lambda s: s.casefold()
|
|
||||||
|
|
||||||
try:
|
try:
|
||||||
from urllib.parse import unquote_to_bytes as compat_urllib_parse_unquote_to_bytes
|
from urllib.parse import unquote_to_bytes as compat_urllib_parse_unquote_to_bytes
|
||||||
from urllib.parse import unquote as compat_urllib_parse_unquote
|
from urllib.parse import unquote as compat_urllib_parse_unquote
|
||||||
@ -2510,22 +2516,11 @@ except ImportError: # Python < 3.4
|
|||||||
|
|
||||||
return compat_urllib_response.addinfourl(io.BytesIO(data), headers, url)
|
return compat_urllib_response.addinfourl(io.BytesIO(data), headers, url)
|
||||||
|
|
||||||
try:
|
|
||||||
compat_basestring = basestring # Python 2
|
|
||||||
except NameError:
|
|
||||||
compat_basestring = str
|
|
||||||
|
|
||||||
try:
|
|
||||||
compat_chr = unichr # Python 2
|
|
||||||
except NameError:
|
|
||||||
compat_chr = chr
|
|
||||||
|
|
||||||
try:
|
try:
|
||||||
from xml.etree.ElementTree import ParseError as compat_xml_parse_error
|
from xml.etree.ElementTree import ParseError as compat_xml_parse_error
|
||||||
except ImportError: # Python 2.6
|
except ImportError: # Python 2.6
|
||||||
from xml.parsers.expat import ExpatError as compat_xml_parse_error
|
from xml.parsers.expat import ExpatError as compat_xml_parse_error
|
||||||
|
|
||||||
|
|
||||||
etree = xml.etree.ElementTree
|
etree = xml.etree.ElementTree
|
||||||
|
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user