From 143907304908ee34bfcfe4914cda596d235291f8 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Sergey=20M=E2=80=A4?= Date: Sat, 15 Mar 2014 04:38:49 +0700 Subject: [PATCH] [generic] Add comment for unescaping webpage contents --- youtube_dl/extractor/generic.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/youtube_dl/extractor/generic.py b/youtube_dl/extractor/generic.py index a3de0ba60a..300485c7f8 100644 --- a/youtube_dl/extractor/generic.py +++ b/youtube_dl/extractor/generic.py @@ -291,6 +291,9 @@ def _real_extract(self, url): except compat_xml_parse_error: pass + # Sometimes an embedded video player is hidden behind percent encoding + # (e.g. https://github.com/rg3/youtube-dl/issues/2448) + # Unescaping the whole page allows handling those cases in a generic way webpage = compat_urllib_parse.unquote(webpage) # it's tempting to parse this further, but you would