1
0
Fork 0
mirror of https://github.com/ytdl-org/youtube-dl.git synced 2024-06-02 10:29:28 +00:00

Fix detection of the webpage charset if it's declared using ' instead of "

For example: "<meta charset='utf-8'/>"
This commit is contained in:
Jaime Marquínez Ferrándiz 2013-08-29 11:35:15 +02:00
parent 2891932bf0
commit 0d75ae2ce3

View file

@ -150,7 +150,7 @@ class InfoExtractor(object):
if m: if m:
encoding = m.group(1) encoding = m.group(1)
else: else:
m = re.search(br'<meta[^>]+charset="?([^"]+)[ /">]', m = re.search(br'<meta[^>]+charset=[\'"]?([^\'")]+)[ /\'">]',
webpage_bytes[:1024]) webpage_bytes[:1024])
if m: if m:
encoding = m.group(1).decode('ascii') encoding = m.group(1).decode('ascii')