youtube-dl

Another place where youtube-dl lives on
git clone git://git.oshgnacknak.de/youtube-dl.git
Log | Files | Refs | README | LICENSE

laola1tv.py (9454B)


      1 # coding: utf-8
      2 from __future__ import unicode_literals
      3 
      4 import json
      5 import re
      6 
      7 from .common import InfoExtractor
      8 from ..utils import (
      9     ExtractorError,
     10     unified_strdate,
     11     urlencode_postdata,
     12     xpath_element,
     13     xpath_text,
     14     update_url_query,
     15     js_to_json,
     16 )
     17 
     18 
     19 class Laola1TvEmbedIE(InfoExtractor):
     20     IE_NAME = 'laola1tv:embed'
     21     _VALID_URL = r'https?://(?:www\.)?laola1\.tv/titanplayer\.php\?.*?\bvideoid=(?P<id>\d+)'
     22     _TESTS = [{
     23         # flashvars.premium = "false";
     24         'url': 'https://www.laola1.tv/titanplayer.php?videoid=708065&type=V&lang=en&portal=int&customer=1024',
     25         'info_dict': {
     26             'id': '708065',
     27             'ext': 'mp4',
     28             'title': 'MA Long CHN - FAN Zhendong CHN',
     29             'uploader': 'ITTF - International Table Tennis Federation',
     30             'upload_date': '20161211',
     31         },
     32     }]
     33 
     34     def _extract_token_url(self, stream_access_url, video_id, data):
     35         return self._download_json(
     36             self._proto_relative_url(stream_access_url, 'https:'), video_id,
     37             headers={
     38                 'Content-Type': 'application/json',
     39             }, data=json.dumps(data).encode())['data']['stream-access'][0]
     40 
     41     def _extract_formats(self, token_url, video_id):
     42         token_doc = self._download_xml(
     43             token_url, video_id, 'Downloading token',
     44             headers=self.geo_verification_headers())
     45 
     46         token_attrib = xpath_element(token_doc, './/token').attrib
     47 
     48         if token_attrib['status'] != '0':
     49             raise ExtractorError(
     50                 'Token error: %s' % token_attrib['comment'], expected=True)
     51 
     52         formats = self._extract_akamai_formats(
     53             '%s?hdnea=%s' % (token_attrib['url'], token_attrib['auth']),
     54             video_id)
     55         self._sort_formats(formats)
     56         return formats
     57 
     58     def _real_extract(self, url):
     59         video_id = self._match_id(url)
     60         webpage = self._download_webpage(url, video_id)
     61         flash_vars = self._search_regex(
     62             r'(?s)flashvars\s*=\s*({.+?});', webpage, 'flash vars')
     63 
     64         def get_flashvar(x, *args, **kwargs):
     65             flash_var = self._search_regex(
     66                 r'%s\s*:\s*"([^"]+)"' % x,
     67                 flash_vars, x, default=None)
     68             if not flash_var:
     69                 flash_var = self._search_regex([
     70                     r'flashvars\.%s\s*=\s*"([^"]+)"' % x,
     71                     r'%s\s*=\s*"([^"]+)"' % x],
     72                     webpage, x, *args, **kwargs)
     73             return flash_var
     74 
     75         hd_doc = self._download_xml(
     76             'http://www.laola1.tv/server/hd_video.php', video_id, query={
     77                 'play': get_flashvar('streamid'),
     78                 'partner': get_flashvar('partnerid'),
     79                 'portal': get_flashvar('portalid'),
     80                 'lang': get_flashvar('sprache'),
     81                 'v5ident': '',
     82             })
     83 
     84         _v = lambda x, **k: xpath_text(hd_doc, './/video/' + x, **k)
     85         title = _v('title', fatal=True)
     86 
     87         token_url = None
     88         premium = get_flashvar('premium', default=None)
     89         if premium:
     90             token_url = update_url_query(
     91                 _v('url', fatal=True), {
     92                     'timestamp': get_flashvar('timestamp'),
     93                     'auth': get_flashvar('auth'),
     94                 })
     95         else:
     96             data_abo = urlencode_postdata(
     97                 dict((i, v) for i, v in enumerate(_v('req_liga_abos').split(','))))
     98             stream_access_url = update_url_query(
     99                 'https://club.laola1.tv/sp/laola1/api/v3/user/session/premium/player/stream-access', {
    100                     'videoId': _v('id'),
    101                     'target': self._search_regex(r'vs_target = (\d+);', webpage, 'vs target'),
    102                     'label': _v('label'),
    103                     'area': _v('area'),
    104                 })
    105             token_url = self._extract_token_url(stream_access_url, video_id, data_abo)
    106 
    107         formats = self._extract_formats(token_url, video_id)
    108 
    109         categories_str = _v('meta_sports')
    110         categories = categories_str.split(',') if categories_str else []
    111         is_live = _v('islive') == 'true'
    112 
    113         return {
    114             'id': video_id,
    115             'title': self._live_title(title) if is_live else title,
    116             'upload_date': unified_strdate(_v('time_date')),
    117             'uploader': _v('meta_organisation'),
    118             'categories': categories,
    119             'is_live': is_live,
    120             'formats': formats,
    121         }
    122 
    123 
    124 class Laola1TvBaseIE(Laola1TvEmbedIE):
    125     def _extract_video(self, url):
    126         display_id = self._match_id(url)
    127         webpage = self._download_webpage(url, display_id)
    128 
    129         if 'Dieser Livestream ist bereits beendet.' in webpage:
    130             raise ExtractorError('This live stream has already finished.', expected=True)
    131 
    132         conf = self._parse_json(self._search_regex(
    133             r'(?s)conf\s*=\s*({.+?});', webpage, 'conf'),
    134             display_id,
    135             transform_source=lambda s: js_to_json(re.sub(r'shareurl:.+,', '', s)))
    136         video_id = conf['videoid']
    137 
    138         config = self._download_json(conf['configUrl'], video_id, query={
    139             'videoid': video_id,
    140             'partnerid': conf['partnerid'],
    141             'language': conf.get('language', ''),
    142             'portal': conf.get('portalid', ''),
    143         })
    144         error = config.get('error')
    145         if error:
    146             raise ExtractorError('%s said: %s' % (self.IE_NAME, error), expected=True)
    147 
    148         video_data = config['video']
    149         title = video_data['title']
    150         is_live = video_data.get('isLivestream') and video_data.get('isLive')
    151         meta = video_data.get('metaInformation')
    152         sports = meta.get('sports')
    153         categories = sports.split(',') if sports else []
    154 
    155         token_url = self._extract_token_url(
    156             video_data['streamAccess'], video_id,
    157             video_data['abo']['required'])
    158 
    159         formats = self._extract_formats(token_url, video_id)
    160 
    161         return {
    162             'id': video_id,
    163             'display_id': display_id,
    164             'title': self._live_title(title) if is_live else title,
    165             'description': video_data.get('description'),
    166             'thumbnail': video_data.get('image'),
    167             'categories': categories,
    168             'formats': formats,
    169             'is_live': is_live,
    170         }
    171 
    172 
    173 class Laola1TvIE(Laola1TvBaseIE):
    174     IE_NAME = 'laola1tv'
    175     _VALID_URL = r'https?://(?:www\.)?laola1\.tv/[a-z]+-[a-z]+/[^/]+/(?P<id>[^/?#&]+)'
    176 
    177     _TESTS = [{
    178         'url': 'http://www.laola1.tv/de-de/video/straubing-tigers-koelner-haie/227883.html',
    179         'info_dict': {
    180             'id': '227883',
    181             'display_id': 'straubing-tigers-koelner-haie',
    182             'ext': 'flv',
    183             'title': 'Straubing Tigers - Kölner Haie',
    184             'upload_date': '20140912',
    185             'is_live': False,
    186             'categories': ['Eishockey'],
    187         },
    188         'params': {
    189             'skip_download': True,
    190         },
    191     }, {
    192         'url': 'http://www.laola1.tv/de-de/video/straubing-tigers-koelner-haie',
    193         'info_dict': {
    194             'id': '464602',
    195             'display_id': 'straubing-tigers-koelner-haie',
    196             'ext': 'flv',
    197             'title': 'Straubing Tigers - Kölner Haie',
    198             'upload_date': '20160129',
    199             'is_live': False,
    200             'categories': ['Eishockey'],
    201         },
    202         'params': {
    203             'skip_download': True,
    204         },
    205     }, {
    206         'url': 'http://www.laola1.tv/de-de/livestream/2016-03-22-belogorie-belgorod-trentino-diatec-lde',
    207         'info_dict': {
    208             'id': '487850',
    209             'display_id': '2016-03-22-belogorie-belgorod-trentino-diatec-lde',
    210             'ext': 'flv',
    211             'title': 'Belogorie BELGOROD - TRENTINO Diatec',
    212             'upload_date': '20160322',
    213             'uploader': 'CEV - Europäischer Volleyball Verband',
    214             'is_live': True,
    215             'categories': ['Volleyball'],
    216         },
    217         'params': {
    218             'skip_download': True,
    219         },
    220         'skip': 'This live stream has already finished.',
    221     }]
    222 
    223     def _real_extract(self, url):
    224         return self._extract_video(url)
    225 
    226 
    227 class EHFTVIE(Laola1TvBaseIE):
    228     IE_NAME = 'ehftv'
    229     _VALID_URL = r'https?://(?:www\.)?ehftv\.com/[a-z]+(?:-[a-z]+)?/[^/]+/(?P<id>[^/?#&]+)'
    230 
    231     _TESTS = [{
    232         'url': 'https://www.ehftv.com/int/video/paris-saint-germain-handball-pge-vive-kielce/1166761',
    233         'info_dict': {
    234             'id': '1166761',
    235             'display_id': 'paris-saint-germain-handball-pge-vive-kielce',
    236             'ext': 'mp4',
    237             'title': 'Paris Saint-Germain Handball - PGE Vive Kielce',
    238             'is_live': False,
    239             'categories': ['Handball'],
    240         },
    241         'params': {
    242             'skip_download': True,
    243         },
    244     }]
    245 
    246     def _real_extract(self, url):
    247         return self._extract_video(url)
    248 
    249 
    250 class ITTFIE(InfoExtractor):
    251     _VALID_URL = r'https?://tv\.ittf\.com/video/[^/]+/(?P<id>\d+)'
    252     _TEST = {
    253         'url': 'https://tv.ittf.com/video/peng-wang-wei-matsudaira-kenta/951802',
    254         'only_matching': True,
    255     }
    256 
    257     def _real_extract(self, url):
    258         return self.url_result(
    259             update_url_query('https://www.laola1.tv/titanplayer.php', {
    260                 'videoid': self._match_id(url),
    261                 'type': 'V',
    262                 'lang': 'en',
    263                 'portal': 'int',
    264                 'customer': 1024,
    265             }), Laola1TvEmbedIE.ie_key())