yt-dlp/yt_dlp/extractor/tviplayer.py
Francisco Pombal 9ae7df9a22
[ie/tviplayer] Fix extractor (#16527)
Closes #13132
Authored by: FranciscoPombal
2026-06-18 22:05:08 +00:00

73 lines
2.9 KiB
Python

from .common import InfoExtractor
from ..utils import int_or_none, js_to_json
from ..utils.traversal import traverse_obj
class TVIPlayerIE(InfoExtractor):
_VALID_URL = r'https?://tviplayer\.iol\.pt(/programa/[\w-]+/[a-f0-9]+)?/\w+/(?P<id>\w+)'
_TESTS = [{
'url': 'https://tviplayer.iol.pt/programa/jornal-das-8/53c6b3903004dc006243d0cf/video/61c8e8b90cf2c7ea0f0f71a9',
'info_dict': {
'id': '61c8e8b90cf2c7ea0f0f71a9',
'ext': 'mp4',
'duration': 4167,
'title': 'Jornal das 8 - 26 de dezembro de 2021',
'thumbnail': 'https://img.iol.pt/image/id/61c8ee630cf2cc58e7d98d9f/',
'season_number': 8,
'season': 'Season 8',
},
}, {
# no /programa/
'url': 'https://tviplayer.iol.pt/video/62c4131c0cf2f9a86eac06bb',
'info_dict': {
'id': '62c4131c0cf2f9a86eac06bb',
'ext': 'mp4',
'title': 'David e Mickael Carreira respondem: «Qual é o próximo a ser pai?»',
'thumbnail': 'https://img.iol.pt/image/id/62c416490cf2ea367d4433fd/',
'duration': 148,
},
}, {
# episodio url
'url': 'https://tviplayer.iol.pt/programa/para-sempre/61716c360cf2365a5ed894c4/episodio/t1e187',
'info_dict': {
'id': 't1e187',
'ext': 'mp4',
'season': 'Season 1',
'title': 'Quem denunciou Pedro?',
'thumbnail': 'https://img.iol.pt/image/id/62eda30b0cf2ea367d48973b/',
'duration': 1250,
'season_number': 1,
'episode_number': 187,
'episode': 'Episode 187',
},
}]
def _real_initialize(self):
self.wms_auth_sign_token = self._download_webpage(
'https://services.iol.pt/matrix?userId=', 'wmsAuthSign',
note='Trying to get wmsAuthSign token')
def _real_extract(self, url):
video_id = self._match_id(url)
webpage = self._download_webpage(url, video_id)
json_data = self._search_json(
r'\sopts\s*=\s*\{\s*video\s*:\s*\[', webpage, 'JSON data', video_id,
transform_source=js_to_json)
formats, subtitles = self._extract_m3u8_formats_and_subtitles(
f'{json_data["videoUrl"]}?wmsAuthSign={self.wms_auth_sign_token}',
video_id, ext='mp4')
return {
'id': video_id,
'title': json_data.get('title') or self._og_search_title(webpage),
'thumbnail': json_data.get('cover') or self._og_search_thumbnail(webpage),
'duration': int_or_none(json_data.get('duration')),
'formats': formats,
'subtitles': subtitles,
'season_number': traverse_obj(
self._yield_json_ld(webpage, video_id, default=None),
(lambda _, v: v['@type'] == 'TVEpisode', 'seasonNumber', {int_or_none}, any)),
'episode_number': int_or_none(json_data.get('episodeNum')),
}