aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorCosmin Tanislav <demonsingur@gmail.com>2024-09-14 02:09:52 +0300
committerGitHub <noreply@github.com>2024-09-13 23:09:52 +0000
commitd02df303d8e49390599db9f34482697e4d1cf5b2 (patch)
tree6611aa170a304c536c7ec3f1ab0b3727ac53d4b0
parent5d0176547f16a3642cd71627126e9dfc24981e20 (diff)
[ie/RTP] Support more subpages (#10787)
Authored by: Demon000
-rw-r--r--yt_dlp/extractor/rtp.py26
1 files changed, 21 insertions, 5 deletions
diff --git a/yt_dlp/extractor/rtp.py b/yt_dlp/extractor/rtp.py
index 944e8636a..26aec2e4c 100644
--- a/yt_dlp/extractor/rtp.py
+++ b/yt_dlp/extractor/rtp.py
@@ -8,7 +8,7 @@ from ..utils import js_to_json
class RTPIE(InfoExtractor):
- _VALID_URL = r'https?://(?:www\.)?rtp\.pt/play/p(?P<program_id>[0-9]+)/(?P<id>[^/?#]+)/?'
+ _VALID_URL = r'https?://(?:www\.)?rtp\.pt/play/(?:(?:estudoemcasa|palco|zigzag)/)?p(?P<program_id>[0-9]+)/(?P<id>[^/?#]+)'
_TESTS = [{
'url': 'http://www.rtp.pt/play/p405/e174042/paixoes-cruzadas',
'md5': 'e736ce0c665e459ddb818546220b4ef8',
@@ -20,8 +20,24 @@ class RTPIE(InfoExtractor):
'thumbnail': r're:^https?://.*\.jpg',
},
}, {
+ 'url': 'https://www.rtp.pt/play/zigzag/p13166/e757904/25-curiosidades-25-de-abril',
+ 'md5': '9a81ed53f2b2197cfa7ed455b12f8ade',
+ 'info_dict': {
+ 'id': 'e757904',
+ 'ext': 'mp4',
+ 'title': '25 Curiosidades, 25 de Abril',
+ 'description': 'Estudar ou não estudar - Em cada um dos episódios descobrimos uma curiosidade acerca de como era viver em Portugal antes da revolução do 25 de abr',
+ 'thumbnail': r're:^https?://.*\.jpg',
+ },
+ }, {
'url': 'http://www.rtp.pt/play/p831/a-quimica-das-coisas',
'only_matching': True,
+ }, {
+ 'url': 'https://www.rtp.pt/play/estudoemcasa/p7776/portugues-1-ano',
+ 'only_matching': True,
+ }, {
+ 'url': 'https://www.rtp.pt/play/palco/p13785/l7nnon',
+ 'only_matching': True,
}]
_RX_OBFUSCATION = re.compile(r'''(?xs)
@@ -49,17 +65,17 @@ class RTPIE(InfoExtractor):
f, config = self._search_regex(
r'''(?sx)
- var\s+f\s*=\s*(?P<f>".*?"|{[^;]+?});\s*
+ (?:var\s+f\s*=\s*(?P<f>".*?"|{[^;]+?});\s*)?
var\s+player1\s+=\s+new\s+RTPPlayer\s*\((?P<config>{(?:(?!\*/).)+?})\);(?!\s*\*/)
''', webpage,
'player config', group=('f', 'config'))
- f = self._parse_json(
- f, video_id,
- lambda data: self.__unobfuscate(data, video_id=video_id))
config = self._parse_json(
config, video_id,
lambda data: self.__unobfuscate(data, video_id=video_id))
+ f = config['file'] if not f else self._parse_json(
+ f, video_id,
+ lambda data: self.__unobfuscate(data, video_id=video_id))
formats = []
if isinstance(f, dict):