[cbs] extract smpte and vtt subtitles
authorRemita Amine <remitamine@gmail.com>
Sat, 13 Apr 2019 16:00:24 +0000 (17:00 +0100)
committerRemita Amine <remitamine@gmail.com>
Sat, 13 Apr 2019 16:02:22 +0000 (17:02 +0100)
youtube_dl/extractor/cbs.py

index 1799d63ea86ad9f9b1d7048792b52385928e20f4..376db726326302972c7c7ab33b7d362fa1360e67 100644 (file)
@@ -13,13 +13,17 @@ from ..utils import (
 
 class CBSBaseIE(ThePlatformFeedIE):
     def _parse_smil_subtitles(self, smil, namespace=None, subtitles_lang='en'):
-        closed_caption_e = find_xpath_attr(smil, self._xpath_ns('.//param', namespace), 'name', 'ClosedCaptionURL')
-        return {
-            'en': [{
-                'ext': 'ttml',
-                'url': closed_caption_e.attrib['value'],
-            }]
-        } if closed_caption_e is not None and closed_caption_e.attrib.get('value') else []
+        subtitles = {}
+        for k, ext in [('sMPTE-TTCCURL', 'tt'), ('ClosedCaptionURL', 'ttml'), ('webVTTCaptionURL', 'vtt')]:
+            cc_e = find_xpath_attr(smil, self._xpath_ns('.//param', namespace), 'name', k)
+            if cc_e is not None:
+                cc_url = cc_e.get('value')
+                if cc_url:
+                    subtitles.setdefault(subtitles_lang, []).append({
+                        'ext': ext,
+                        'url': cc_url,
+                    })
+        return subtitles
 
 
 class CBSIE(CBSBaseIE):