2021-02-04 13:26:01 +05:30
|
|
|
|
from .common import InfoExtractor
|
2017-03-18 05:58:54 +07:00
|
|
|
|
from ..utils import (
|
2025-08-20 08:10:17 +09:00
|
|
|
|
clean_html,
|
|
|
|
|
|
determine_ext,
|
2021-02-04 13:26:01 +05:30
|
|
|
|
extract_attributes,
|
2017-03-18 05:58:54 +07:00
|
|
|
|
int_or_none,
|
2025-08-20 08:10:17 +09:00
|
|
|
|
parse_resolution,
|
|
|
|
|
|
str_or_none,
|
|
|
|
|
|
url_or_none,
|
2017-03-18 05:58:54 +07:00
|
|
|
|
)
|
2025-08-20 08:10:17 +09:00
|
|
|
|
from ..utils.traversal import find_elements, traverse_obj
|
|
|
|
|
|
|
2017-03-18 05:58:54 +07:00
|
|
|
|
|
2025-08-20 08:10:17 +09:00
|
|
|
|
class MedialaanBaseIE(InfoExtractor):
    # Base class holding the MyChannels API extraction routine.

    def _extract_from_mychannels_api(self, mychannels_id):
        """Return an info dict for the given MyChannels video ID.

        The embed page is downloaded first to read the ``brand_config`` JSON;
        its ``brand`` value is sent as the ``X-Mychannels-Brand`` header when
        requesting the embed API, whose response supplies streams and metadata.
        """
        embed_page = self._download_webpage(
            f'https://mychannels.video/embed/{mychannels_id}', mychannels_id)
        brand_config = self._search_json(
            r'window\.mychannels\.brand_config\s*=', embed_page, 'brand config', mychannels_id)
        api_headers = {'X-Mychannels-Brand': brand_config['brand']}
        video_data = self._download_json(
            f'https://api.mychannels.world/v1/embed/video/{mychannels_id}',
            mychannels_id, headers=api_headers)

        # Only streams whose 'url' passes url_or_none are considered
        usable_streams = traverse_obj(video_data, (
            'streams', lambda _, v: url_or_none(v['url'])))

        formats = []
        for stream in usable_streams:
            stream_url = stream['url']
            extension = determine_ext(stream_url)
            if extension != 'm3u8':
                # Direct file: the 'quality' string doubles as the format ID
                # and is also fed to parse_resolution
                quality = traverse_obj(stream, ('quality', {str}))
                formats.append({
                    'ext': extension,
                    'format_id': quality,
                    'url': stream_url,
                    **parse_resolution(quality),
                })
                continue
            # HLS manifest: extraction is non-fatal (fatal=False)
            formats.extend(self._extract_m3u8_formats(
                stream_url, mychannels_id, 'mp4', m3u8_id='hls', fatal=False))

        video_fields = traverse_obj(video_data, {
            'title': ('title', {clean_html}),
            'description': ('description', {clean_html}, filter),
            # Millisecond value scaled by 1000; negative results are dropped
            'duration': ('durationMs', {int_or_none(scale=1000)}, {lambda x: x if x >= 0 else None}),
            'genres': ('genre', 'title', {str}, filter, all, filter),
            'is_live': ('live', {bool}),
            'release_timestamp': ('publicationTimestampMs', {int_or_none(scale=1000)}),
            'tags': ('tags', ..., 'title', {str}, filter, all, filter),
            'thumbnail': ('image', 'baseUrl', {url_or_none}),
        })
        channel_fields = traverse_obj(video_data, ('channel', {
            'channel': ('title', {clean_html}),
            'channel_id': ('id', {str_or_none}),
        }))
        uploader_fields = traverse_obj(video_data, ('organisation', {
            'uploader': ('title', {clean_html}),
            'uploader_id': ('id', {str_or_none}),
        }))
        series_fields = traverse_obj(video_data, ('show', {
            'series': ('title', {clean_html}),
            'series_id': ('id', {str_or_none}),
        }))

        return {
            'id': mychannels_id,
            'formats': formats,
            **video_fields,
            **channel_fields,
            **uploader_fields,
            **series_fields,
        }
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class MedialaanIE(MedialaanBaseIE):
    # Matches three URL shapes, each ending in the numeric video ID:
    #   * (embed.)mychannels.video/embed/<id>
    #   * embed.mychannels.video/[sdk/|script/]production/<id>
    #   * /video(s)/... pages on the listed .be and .nl sites, where the ID
    #     follows a trailing "-" or "~p"
    # All literal dots in host names are escaped so that "." cannot match
    # an arbitrary character.
    _VALID_URL = r'''(?x)
                    https?://
                        (?:
                            (?:embed\.)?mychannels\.video/embed/|
                            embed\.mychannels\.video/(?:s(?:dk|cript)/)?production/|
                            (?:www\.)?(?:
                                (?:
                                    7sur7|
                                    demorgen|
                                    hln|
                                    joe|
                                    qmusic
                                )\.be|
                                (?:
                                    [abe]d|
                                    bndestem|
                                    destentor|
                                    gelderlander|
                                    pzc|
                                    tubantia|
                                    volkskrant
                                )\.nl
                            )/videos?/(?:[^/?#]+/)*[^/?&#]+(?:-|~p)
                        )
                        (?P<id>\d+)
                    '''
    _TESTS = [{
        'url': 'https://www.bndestem.nl/video/de-terugkeer-van-ally-de-aap-en-wie-vertrekt-er-nog-bij-nac~p193993',
        'info_dict': {
            'id': '193993',
            'ext': 'mp4',
            'title': 'De terugkeer van Ally de Aap en wie vertrekt er nog bij NAC?',
            'description': 'In een nieuwe Gegenpressing video bespreken Yadran Blanco en Dennis Kas het nieuws omrent NAC.',
            'duration': 238,
            'channel': 'BN DeStem',
            'channel_id': '418',
            'genres': ['Sports'],
            'release_date': '20210126',
            'release_timestamp': 1611663540,
            'series': 'Korte Reportage',
            'series_id': '972',
            'tags': 'count:2',
            'thumbnail': r're:https?://images\.mychannels\.video/imgix/.+\.(?:jpe?g|png)',
            'uploader': 'BN De Stem',
            'uploader_id': '26',
        },
    }, {
        'url': 'https://www.gelderlander.nl/video/kanalen/degelderlander~c320/series/snel-nieuws~s984/noodbevel-in-doetinchem-politie-stuurt-mensen-centrum-uit~p194093',
        'info_dict': {
            'id': '194093',
            'ext': 'mp4',
            'title': 'Noodbevel in Doetinchem: politie stuurt mensen centrum uit',
            'description': 'md5:77e85b2cb26cfff9dc1fe2b1db524001',
            'duration': 44,
            'channel': 'De Gelderlander',
            'channel_id': '320',
            'genres': ['News'],
            'release_date': '20210126',
            'release_timestamp': 1611690600,
            'series': 'Snel Nieuws',
            'series_id': '984',
            'tags': 'count:1',
            'thumbnail': r're:https?://images\.mychannels\.video/imgix/.+\.(?:jpe?g|png)',
            'uploader': 'De Gelderlander',
            'uploader_id': '25',
        },
    }, {
        'url': 'https://www.7sur7.be/videos/production/lla-tendance-tiktok-qui-enflamme-lespagne-707650',
        'info_dict': {
            'id': '707650',
            'ext': 'mp4',
            'title': 'La tendance TikTok qui enflamme l’Espagne',
            'description': 'md5:c7ec4cb733190f227fc8935899f533b5',
            'duration': 70,
            'channel': 'Lifestyle',
            'channel_id': '770',
            'genres': ['Beauty & Lifestyle'],
            'release_date': '20240906',
            'release_timestamp': 1725617330,
            'series': 'Lifestyle',
            'series_id': '1848',
            'tags': 'count:1',
            'thumbnail': r're:https?://images\.mychannels\.video/imgix/.+\.(?:jpe?g|png)',
            'uploader': '7sur7',
            'uploader_id': '67',
        },
    }, {
        'url': 'https://mychannels.video/embed/313117',
        'info_dict': {
            'id': '313117',
            'ext': 'mp4',
            'title': str,
            'description': 'md5:255e2e52f6fe8a57103d06def438f016',
            'channel': 'AD',
            'channel_id': '238',
            'genres': ['News'],
            'live_status': 'is_live',
            'release_date': '20241225',
            'release_timestamp': 1735169425,
            'series': 'Nieuws Update',
            'series_id': '3337',
            'tags': 'count:1',
            'thumbnail': r're:https?://images\.mychannels\.video/imgix/.+\.(?:jpe?g|png)',
            'uploader': 'AD',
            'uploader_id': '1',
        },
        'params': {'skip_download': 'Livestream'},
    }, {
        'url': 'https://embed.mychannels.video/sdk/production/193993',
        'only_matching': True,
    }, {
        'url': 'https://embed.mychannels.video/script/production/193993',
        'only_matching': True,
    }, {
        'url': 'https://embed.mychannels.video/production/193993',
        'only_matching': True,
    }, {
        'url': 'https://embed.mychannels.video/embed/193993',
        'only_matching': True,
    }]
    _WEBPAGE_TESTS = [{
        'url': 'https://www.demorgen.be/snelnieuws/tom-waes-promoot-alcoholtesten-op-werchter-ik-ben-de-laatste-persoon-die-met-de-vinger-moet-wijzen~b7457c0d/',
        'info_dict': {
            'id': '1576607',
            'ext': 'mp4',
            'title': 'Tom Waes blaastest',
            'channel': 'De Morgen',
            'channel_id': '352',
            'description': 'Tom Waes werkt mee aan een alcoholcampagne op Werchter',
            'duration': 62,
            'genres': ['News'],
            'release_date': '20250705',
            'release_timestamp': 1751730795,
            'series': 'Nieuwsvideo\'s',
            'series_id': '1683',
            'tags': 'count:1',
            'thumbnail': r're:https?://video-images\.persgroep\.be/aws_generated.+\.jpg',
            'uploader': 'De Morgen',
            'uploader_id': '17',
        },
        'params': {'extractor_args': {'generic': {'impersonate': ['chrome']}}},
    }]

    @classmethod
    def _extract_embed_urls(cls, url, webpage):
        """Yield MyChannels embed URLs for videos embedded in ``webpage``.

        Looks for ``<div>`` elements with ``data-mychannels-type="video"`` and
        builds one ``https://mychannels.video/embed/<id>`` URL per non-empty
        ``data-mychannels-id`` attribute value.
        """
        yield from traverse_obj(webpage, (
            {find_elements(tag='div', attr='data-mychannels-type', value='video', html=True)},
            ..., {extract_attributes}, 'data-mychannels-id', {str}, filter,
            {lambda x: f'https://mychannels.video/embed/{x}'}))

    def _real_extract(self, url):
        """Extract the video whose numeric ID is captured by ``_VALID_URL``."""
        mychannels_id = self._match_id(url)

        return self._extract_from_mychannels_api(mychannels_id)
|