[youtube] Fix categories and improve tags extraction

2024-11-15 11:33:30 +01:00 · 2020-06-16 03:13:39 +07:00 · 2020-06-16 03:13:39 +07:00 · dbeafce5d5
commit dbeafce5d5
parent ed604ce7bc
1 changed file with 7 additions and 3 deletions
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -2356,17 +2356,21 @@ class YoutubeIE(YoutubeBaseInfoExtractor):
        m_cat_container = self._search_regex(
            r'(?s)<h4[^>]*>\s*Category\s*</h4>\s*<ul[^>]*>(.*?)</ul>',
            video_webpage, 'categories', default=None)
+        category = None
        if m_cat_container:
            category = self._html_search_regex(
                r'(?s)<a[^<]+>(.*?)</a>', m_cat_container, 'category',
                default=None)
-            video_categories = None if category is None else [category]
+        if not category:
-        else:
+            category = try_get(
-            video_categories = None
+                microformat, lambda x: x['category'], compat_str)
+        video_categories = None if category is None else [category]
        video_tags = [
            unescapeHTML(m.group('content'))
            for m in re.finditer(self._meta_regex('og:video:tag'), video_webpage)]
+        if not video_tags:
+            video_tags = try_get(video_details, lambda x: x['keywords'], list)
        def _extract_count(count_name):
            return str_to_int(self._search_regex(