mirror of
				https://github.com/ytdl-org/youtube-dl.git
				synced 2025-10-29 09:26:20 -07:00 
			
		
		
		
	[extractor/common] Add support for dl8-* media tags (closes #27283)
This commit is contained in:
		| @@ -2513,7 +2513,8 @@ class InfoExtractor(object): | |||||||
|         # amp-video and amp-audio are very similar to their HTML5 counterparts |         # amp-video and amp-audio are very similar to their HTML5 counterparts | ||||||
|         # so we will include them right here (see |         # so we will include them right here (see | ||||||
|         # https://www.ampproject.org/docs/reference/components/amp-video) |         # https://www.ampproject.org/docs/reference/components/amp-video) | ||||||
|         _MEDIA_TAG_NAME_RE = r'(?:amp-)?(video|audio)' |         # For dl8-* tags see https://delight-vr.com/documentation/dl8-video/ | ||||||
|  |         _MEDIA_TAG_NAME_RE = r'(?:(?:amp|dl8(?:-live)?)-)?(video|audio)' | ||||||
|         media_tags = [(media_tag, media_type, '') |         media_tags = [(media_tag, media_type, '') | ||||||
|                       for media_tag, media_type |                       for media_tag, media_type | ||||||
|                       in re.findall(r'(?s)(<%s[^>]*/>)' % _MEDIA_TAG_NAME_RE, webpage)] |                       in re.findall(r'(?s)(<%s[^>]*/>)' % _MEDIA_TAG_NAME_RE, webpage)] | ||||||
|   | |||||||
| @@ -2466,7 +2466,9 @@ class GenericIE(InfoExtractor): | |||||||
|         # Sometimes embedded video player is hidden behind percent encoding |         # Sometimes embedded video player is hidden behind percent encoding | ||||||
|         # (e.g. https://github.com/ytdl-org/youtube-dl/issues/2448) |         # (e.g. https://github.com/ytdl-org/youtube-dl/issues/2448) | ||||||
|         # Unescaping the whole page allows handling those cases in a generic way |         # Unescaping the whole page allows handling those cases in a generic way | ||||||
|         webpage = compat_urllib_parse_unquote(webpage) |         # FIXME: unescaping the whole page may break URLs, commenting out for now. | ||||||
|  |         # There probably should be a second run of the generic extractor on the unescaped webpage. | ||||||
|  |         # webpage = compat_urllib_parse_unquote(webpage) | ||||||
|  |  | ||||||
|         # Unescape squarespace embeds to be detected by generic extractor, |         # Unescape squarespace embeds to be detected by generic extractor, | ||||||
|         # see https://github.com/ytdl-org/youtube-dl/issues/21294 |         # see https://github.com/ytdl-org/youtube-dl/issues/21294 | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user