mirror of
				https://github.com/ytdl-org/youtube-dl.git
				synced 2025-10-29 09:26:20 -07:00 
			
		
		
		
	[zattoo] Improve and simplify (closes #14676)
This commit is contained in:
		| @@ -1,84 +1,82 @@ | |||||||
| # coding: utf-8 | # coding: utf-8 | ||||||
| from __future__ import unicode_literals | from __future__ import unicode_literals | ||||||
|  |  | ||||||
| from uuid import uuid4 |  | ||||||
| import re | import re | ||||||
|  | from uuid import uuid4 | ||||||
|  |  | ||||||
| from .common import InfoExtractor | from .common import InfoExtractor | ||||||
| from ..utils import ( | from ..compat import ( | ||||||
|  |     compat_HTTPError, | ||||||
|     compat_str, |     compat_str, | ||||||
|  | ) | ||||||
|  | from ..utils import ( | ||||||
|     ExtractorError, |     ExtractorError, | ||||||
|     sanitized_Request, |     int_or_none, | ||||||
|  |     try_get, | ||||||
|     urlencode_postdata, |     urlencode_postdata, | ||||||
| ) | ) | ||||||
|  |  | ||||||
|  |  | ||||||
| class ZattooBaseIE(InfoExtractor): | class ZattooBaseIE(InfoExtractor): | ||||||
|  |  | ||||||
|     _NETRC_MACHINE = 'zattoo' |     _NETRC_MACHINE = 'zattoo' | ||||||
|     _HOST_URL = 'https://zattoo.com' |     _HOST_URL = 'https://zattoo.com' | ||||||
|  |  | ||||||
|     _power_guide_hash = None |     _power_guide_hash = None | ||||||
|  |  | ||||||
|     def _login(self, uuid, session_id): |     def _login(self): | ||||||
|         (username, password) = self._get_login_info() |         (username, password) = self._get_login_info() | ||||||
|         if not username or not password: |         if not username or not password: | ||||||
|             raise ExtractorError( |             self.raise_login_required( | ||||||
|                 'A valid %s account is needed to access this media.' % self._NETRC_MACHINE, |                 'A valid %s account is needed to access this media.' | ||||||
|                 expected=True) |                 % self._NETRC_MACHINE) | ||||||
|         login_form = { |  | ||||||
|  |         try: | ||||||
|  |             data = self._download_json( | ||||||
|  |                 '%s/zapi/v2/account/login' % self._HOST_URL, None, 'Logging in', | ||||||
|  |                 data=urlencode_postdata({ | ||||||
|                     'login': username, |                     'login': username, | ||||||
|                     'password': password, |                     'password': password, | ||||||
|             'remember': True, |                     'remember': 'true', | ||||||
|         } |                 }), headers={ | ||||||
|         request = sanitized_Request( |                     'Referer': '%s/login' % self._HOST_URL, | ||||||
|             '%s/zapi/v2/account/login' % self._HOST_URL, |                     'Content-Type': 'application/x-www-form-urlencoded; charset=UTF-8', | ||||||
|             urlencode_postdata(login_form)) |                 }) | ||||||
|         request.add_header( |         except ExtractorError as e: | ||||||
|             'Referer', '%s/login' % self._HOST_URL) |             if isinstance(e.cause, compat_HTTPError) and e.cause.code == 400: | ||||||
|         request.add_header( |                 raise ExtractorError( | ||||||
|             'Content-Type', 'application/x-www-form-urlencoded; charset=UTF-8') |                     'Unable to login: incorrect username and/or password', | ||||||
|         request.add_header( |                     expected=True) | ||||||
|             'Cookie', 'uuid=%s; beaker.session.id=%s' % (uuid, session_id)) |             raise | ||||||
|         response = self._request_webpage( |  | ||||||
|             request, None, 'Logging in') |  | ||||||
|         data = self._parse_json(response.read(), None) |  | ||||||
|         return data['session']['power_guide_hash'] |  | ||||||
|  |  | ||||||
|     def _get_app_token_and_version(self): |         self._power_guide_hash = data['session']['power_guide_hash'] | ||||||
|         host_webpage = self._download_webpage( |  | ||||||
|             self._HOST_URL, None, 'Downloading %s' % self._HOST_URL) |     def _real_initialize(self): | ||||||
|  |         webpage = self._download_webpage( | ||||||
|  |             self._HOST_URL, None, 'Downloading app token') | ||||||
|         app_token = self._html_search_regex( |         app_token = self._html_search_regex( | ||||||
|             r'<script.+window\.appToken\s*=\s*\'(.+)\'', host_webpage, 'app token') |             r'appToken\s*=\s*(["\'])(?P<token>(?:(?!\1).)+?)\1', | ||||||
|  |             webpage, 'app token', group='token') | ||||||
|         app_version = self._html_search_regex( |         app_version = self._html_search_regex( | ||||||
|             r'<!--\w+-(.+?)-', host_webpage, 'app version', default='2.8.2') |             r'<!--\w+-(.+?)-', webpage, 'app version', default='2.8.2') | ||||||
|         return app_token, app_version |  | ||||||
|  |  | ||||||
|     def _say_hello(self, uuid, app_token, app_version): |         # Will setup appropriate cookies | ||||||
|         postdata = { |         self._request_webpage( | ||||||
|  |             '%s/zapi/v2/session/hello' % self._HOST_URL, None, | ||||||
|  |             'Opening session', data=urlencode_postdata({ | ||||||
|                 'client_app_token': app_token, |                 'client_app_token': app_token, | ||||||
|             'uuid': uuid, |                 'uuid': compat_str(uuid4()), | ||||||
|                 'lang': 'en', |                 'lang': 'en', | ||||||
|                 'app_version': app_version, |                 'app_version': app_version, | ||||||
|                 'format': 'json', |                 'format': 'json', | ||||||
|         } |             })) | ||||||
|         request = sanitized_Request( |  | ||||||
|             '%s/zapi/v2/session/hello' % self._HOST_URL, |  | ||||||
|             urlencode_postdata(postdata)) |  | ||||||
|         response = self._request_webpage( |  | ||||||
|             request, None, 'Say hello') |  | ||||||
|  |  | ||||||
|         cookie = response.headers.get('Set-Cookie') |         self._login() | ||||||
|         session_id = self._search_regex( |  | ||||||
|             r'beaker\.session\.id\s*=\s*(.+?);', cookie, 'session id') |  | ||||||
|         return session_id |  | ||||||
|  |  | ||||||
|     def _extract_cid(self, video_id, channel_name): |     def _extract_cid(self, video_id, channel_name): | ||||||
|         channel_groups = self._download_json( |         channel_groups = self._download_json( | ||||||
|             '%s/zapi/v2/cached/channels/%s' % (self._HOST_URL, |             '%s/zapi/v2/cached/channels/%s' % (self._HOST_URL, | ||||||
|                                                self._power_guide_hash), |                                                self._power_guide_hash), | ||||||
|             video_id, |             video_id, 'Downloading channel list', | ||||||
|             'Downloading available channel list', |  | ||||||
|             query={'details': False})['channel_groups'] |             query={'details': False})['channel_groups'] | ||||||
|         channel_list = [] |         channel_list = [] | ||||||
|         for chgrp in channel_groups: |         for chgrp in channel_groups: | ||||||
| @@ -86,7 +84,9 @@ class ZattooBaseIE(InfoExtractor): | |||||||
|         try: |         try: | ||||||
|             return next( |             return next( | ||||||
|                 chan['cid'] for chan in channel_list |                 chan['cid'] for chan in channel_list | ||||||
|                 if chan['display_alias'] == channel_name or chan['cid'] == channel_name) |                 if chan.get('cid') and ( | ||||||
|  |                     chan.get('display_alias') == channel_name or | ||||||
|  |                     chan.get('cid') == channel_name)) | ||||||
|         except StopIteration: |         except StopIteration: | ||||||
|             raise ExtractorError('Could not extract channel id') |             raise ExtractorError('Could not extract channel id') | ||||||
|  |  | ||||||
| @@ -100,72 +100,90 @@ class ZattooBaseIE(InfoExtractor): | |||||||
|                 'complete': True |                 'complete': True | ||||||
|             }) |             }) | ||||||
|  |  | ||||||
|  |         p = data['program'] | ||||||
|  |         cid = p['cid'] | ||||||
|  |  | ||||||
|         info_dict = { |         info_dict = { | ||||||
|             'id': video_id, |             'id': video_id, | ||||||
|             'title': data['program']['title'], |             'title': p.get('title') or p['episode_title'], | ||||||
|             'description': data['program'].get('description'), |             'description': p.get('description'), | ||||||
|             'thumbnail': data['program'].get('image_url') |             'thumbnail': p.get('image_url'), | ||||||
|  |             'creator': p.get('channel_name'), | ||||||
|  |             'episode': p.get('episode_title'), | ||||||
|  |             'episode_number': int_or_none(p.get('episode_number')), | ||||||
|  |             'season_number': int_or_none(p.get('season_number')), | ||||||
|  |             'release_year': int_or_none(p.get('year')), | ||||||
|  |             'categories': try_get(p, lambda x: x['categories'], list), | ||||||
|         } |         } | ||||||
|         cid = data['program']['cid'] |  | ||||||
|         return cid, info_dict |         return cid, info_dict | ||||||
|  |  | ||||||
|     def _extract_formats(self, cid, video_id, record_id=None, is_live=False): |     def _extract_formats(self, cid, video_id, record_id=None, is_live=False): | ||||||
|         postdata = { |         postdata_common = { | ||||||
|             'stream_type': 'dash', |  | ||||||
|             'https_watch_urls': True, |             'https_watch_urls': True, | ||||||
|         } |         } | ||||||
|         if record_id: |  | ||||||
|  |         if is_live: | ||||||
|  |             postdata_common.update({'timeshift': 10800}) | ||||||
|  |             url = '%s/zapi/watch/live/%s' % (self._HOST_URL, cid) | ||||||
|  |         elif record_id: | ||||||
|             url = '%s/zapi/watch/recording/%s' % (self._HOST_URL, record_id) |             url = '%s/zapi/watch/recording/%s' % (self._HOST_URL, record_id) | ||||||
|         else: |         else: | ||||||
|             url = '%s/zapi/watch/recall/%s/%s' % (self._HOST_URL, cid, video_id) |             url = '%s/zapi/watch/recall/%s/%s' % (self._HOST_URL, cid, video_id) | ||||||
|  |  | ||||||
|         if is_live: |  | ||||||
|             postdata.update({'timeshift': 10800}) |  | ||||||
|             url = '%s/zapi/watch/live/%s' % (self._HOST_URL, cid) |  | ||||||
|  |  | ||||||
|         data = self._download_json( |  | ||||||
|             sanitized_Request(url, urlencode_postdata(postdata)), |  | ||||||
|             video_id, 'Downloading dash formats') |  | ||||||
|  |  | ||||||
|         formats = [] |         formats = [] | ||||||
|         for elem in data['stream']['watch_urls']: |         for stream_type in ('dash', 'hls', 'hls5', 'hds'): | ||||||
|             audio_channel = elem.get('audio_channel') |             postdata = postdata_common.copy() | ||||||
|             maxrate = elem.get('maxrate') |             postdata['stream_type'] = stream_type | ||||||
|             formats.extend( |  | ||||||
|                 self._extract_mpd_formats( |  | ||||||
|                     elem['url'], video_id, |  | ||||||
|                     mpd_id='dash-maxrate-%s-channel-%s' % (maxrate, audio_channel), fatal=False)) |  | ||||||
|  |  | ||||||
|         postdata.update({'stream_type': 'hls'}) |  | ||||||
|         request = sanitized_Request( |  | ||||||
|             url, urlencode_postdata(postdata)) |  | ||||||
|             data = self._download_json( |             data = self._download_json( | ||||||
|             request, video_id, 'Downloading hls formats') |                 url, video_id, 'Downloading %s formats' % stream_type.upper(), | ||||||
|         for elem in data['stream']['watch_urls']: |                 data=urlencode_postdata(postdata), fatal=False) | ||||||
|             audio_channel = elem.get('audio_channel') |             if not data: | ||||||
|             preference = None |                 continue | ||||||
|  |  | ||||||
|             # Prefer audio channel A: |             watch_urls = try_get( | ||||||
|             if audio_channel == 'A': |                 data, lambda x: x['stream']['watch_urls'], list) | ||||||
|                 preference = 1 |             if not watch_urls: | ||||||
|  |                 continue | ||||||
|             maxrate = elem.get('maxrate') |  | ||||||
|             formats.extend( |  | ||||||
|                 self._extract_m3u8_formats( |  | ||||||
|                     elem['url'], video_id, 'mp4', entry_protocol='m3u8_native', |  | ||||||
|                     preference=preference, |  | ||||||
|                     m3u8_id='hls-maxrate-%s-channel-%s' % (maxrate, audio_channel), |  | ||||||
|                     fatal=False)) |  | ||||||
|  |  | ||||||
|  |             for watch in watch_urls: | ||||||
|  |                 if not isinstance(watch, dict): | ||||||
|  |                     continue | ||||||
|  |                 watch_url = watch.get('url') | ||||||
|  |                 if not watch_url or not isinstance(watch_url, compat_str): | ||||||
|  |                     continue | ||||||
|  |                 format_id_list = [stream_type] | ||||||
|  |                 maxrate = watch.get('maxrate') | ||||||
|  |                 if maxrate: | ||||||
|  |                     format_id_list.append(compat_str(maxrate)) | ||||||
|  |                 audio_channel = watch.get('audio_channel') | ||||||
|  |                 if audio_channel: | ||||||
|  |                     format_id_list.append(compat_str(audio_channel)) | ||||||
|  |                 preference = 1 if audio_channel == 'A' else None | ||||||
|  |                 format_id = '-'.join(format_id_list) | ||||||
|  |                 if stream_type in ('dash', 'dash_widevine', 'dash_playready'): | ||||||
|  |                     this_formats = self._extract_mpd_formats( | ||||||
|  |                         watch_url, video_id, mpd_id=format_id, fatal=False) | ||||||
|  |                 elif stream_type in ('hls', 'hls5', 'hls5_fairplay'): | ||||||
|  |                     this_formats = self._extract_m3u8_formats( | ||||||
|  |                         watch_url, video_id, 'mp4', | ||||||
|  |                         entry_protocol='m3u8_native', m3u8_id=format_id, | ||||||
|  |                         fatal=False) | ||||||
|  |                 elif stream_type == 'hds': | ||||||
|  |                     this_formats = self._extract_f4m_formats( | ||||||
|  |                         watch_url, video_id, f4m_id=format_id, fatal=False) | ||||||
|  |                 elif stream_type == 'smooth_playready': | ||||||
|  |                     this_formats = self._extract_ism_formats( | ||||||
|  |                         watch_url, video_id, ism_id=format_id, fatal=False) | ||||||
|  |                 else: | ||||||
|  |                     assert False | ||||||
|  |                 for this_format in this_formats: | ||||||
|  |                     this_format['preference'] = preference | ||||||
|  |                 formats.extend(this_formats) | ||||||
|         self._sort_formats(formats) |         self._sort_formats(formats) | ||||||
|         return formats |         return formats | ||||||
|  |  | ||||||
|     def _real_initialize(self): |  | ||||||
|         uuid = compat_str(uuid4()) |  | ||||||
|         app_token, app_version = self._get_app_token_and_version() |  | ||||||
|         session_id = self._say_hello(uuid, app_token, app_version) |  | ||||||
|         self._power_guide_hash = self._login(uuid, session_id) |  | ||||||
|  |  | ||||||
|     def _extract_video(self, channel_name, video_id, record_id=None, is_live=False): |     def _extract_video(self, channel_name, video_id, record_id=None, is_live=False): | ||||||
|         if is_live: |         if is_live: | ||||||
|             cid = self._extract_cid(video_id, channel_name) |             cid = self._extract_cid(video_id, channel_name) | ||||||
| @@ -190,13 +208,27 @@ class QuicklineBaseIE(ZattooBaseIE): | |||||||
| class QuicklineIE(QuicklineBaseIE): | class QuicklineIE(QuicklineBaseIE): | ||||||
|     _VALID_URL = r'https?://(?:www\.)?mobiltv\.quickline\.com/watch/(?P<channel>[^/]+)/(?P<id>[0-9]+)' |     _VALID_URL = r'https?://(?:www\.)?mobiltv\.quickline\.com/watch/(?P<channel>[^/]+)/(?P<id>[0-9]+)' | ||||||
|  |  | ||||||
|  |     _TEST = { | ||||||
|  |         'url': 'https://mobiltv.quickline.com/watch/prosieben/130671867-maze-runner-die-auserwaehlten-in-der-brandwueste', | ||||||
|  |         'only_matching': True, | ||||||
|  |     } | ||||||
|  |  | ||||||
|     def _real_extract(self, url): |     def _real_extract(self, url): | ||||||
|         channel_name, video_id = re.match(self._VALID_URL, url).groups() |         channel_name, video_id = re.match(self._VALID_URL, url).groups() | ||||||
|         return self._extract_video(channel_name, video_id) |         return self._extract_video(channel_name, video_id) | ||||||
|  |  | ||||||
|  |  | ||||||
| class QuicklineLiveIE(QuicklineBaseIE): | class QuicklineLiveIE(QuicklineBaseIE): | ||||||
|     _VALID_URL = r'https?://(?:www\.)?mobiltv\.quickline\.com/watch/(?P<id>[^/]+)$' |     _VALID_URL = r'https?://(?:www\.)?mobiltv\.quickline\.com/watch/(?P<id>[^/]+)' | ||||||
|  |  | ||||||
|  |     _TEST = { | ||||||
|  |         'url': 'https://mobiltv.quickline.com/watch/srf1', | ||||||
|  |         'only_matching': True, | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     @classmethod | ||||||
|  |     def suitable(cls, url): | ||||||
|  |         return False if QuicklineIE.suitable(url) else super(QuicklineLiveIE, cls).suitable(url) | ||||||
|  |  | ||||||
|     def _real_extract(self, url): |     def _real_extract(self, url): | ||||||
|         channel_name = video_id = self._match_id(url) |         channel_name = video_id = self._match_id(url) | ||||||
| @@ -222,13 +254,17 @@ class ZattooIE(ZattooBaseIE): | |||||||
|  |  | ||||||
|  |  | ||||||
| class ZattooLiveIE(ZattooBaseIE): | class ZattooLiveIE(ZattooBaseIE): | ||||||
|     _VALID_URL = r'https?://(?:www\.)?zattoo\.com/watch/(?P<id>[^/]+)$' |     _VALID_URL = r'https?://(?:www\.)?zattoo\.com/watch/(?P<id>[^/]+)' | ||||||
|  |  | ||||||
|     _TEST = { |     _TEST = { | ||||||
|         'url': 'https://zattoo.com/watch/srf1', |         'url': 'https://zattoo.com/watch/srf1', | ||||||
|         'only_matching': True, |         'only_matching': True, | ||||||
|     } |     } | ||||||
|  |  | ||||||
|  |     @classmethod | ||||||
|  |     def suitable(cls, url): | ||||||
|  |         return False if ZattooIE.suitable(url) else super(ZattooLiveIE, cls).suitable(url) | ||||||
|  |  | ||||||
|     def _real_extract(self, url): |     def _real_extract(self, url): | ||||||
|         channel_name = video_id = self._match_id(url) |         channel_name = video_id = self._match_id(url) | ||||||
|         return self._extract_video(channel_name, video_id, is_live=True) |         return self._extract_video(channel_name, video_id, is_live=True) | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user