mirror of
https://github.com/yt-dlp/yt-dlp.git
synced 2024-11-10 01:02:13 +01:00
[utils] Escape all HTML entities written in hexadecimal form
This commit is contained in:
parent
fbfcc2972b
commit
91757b0f37
2 changed files with 3 additions and 1 deletions
|
@ -200,6 +200,8 @@ def test_ordered_set(self):
|
|||
|
||||
def test_unescape_html(self):
|
||||
self.assertEqual(unescapeHTML('%20;'), '%20;')
|
||||
self.assertEqual(unescapeHTML('&#x2F;'), '/')
|
||||
self.assertEqual(unescapeHTML('&#47;'), '/')
|
||||
self.assertEqual(
|
||||
unescapeHTML('&eacute;'), 'é')
|
||||
|
||||
|
|
|
@ -348,7 +348,7 @@ def _htmlentity_transform(entity):
|
|||
if entity in compat_html_entities.name2codepoint:
|
||||
return compat_chr(compat_html_entities.name2codepoint[entity])
|
||||
|
||||
mobj = re.match(r'#(x?[0-9]+)', entity)
|
||||
mobj = re.match(r'#(x[0-9a-fA-F]+|[0-9]+)', entity)
|
||||
if mobj is not None:
|
||||
numstr = mobj.group(1)
|
||||
if numstr.startswith('x'):
|
||||
|
|
Loading…
Reference in a new issue