yt-dlp/yt_dlp/extractor/youtube/_video.py

import base64
import binascii
import collections
import datetime as dt
import functools
import itertools
import json
import math
import os.path
import random
import re
import sys
import threading
import time
import traceback
import urllib.parse

from ._base import (
    INNERTUBE_CLIENTS,
    BadgeType,
    GvsPoTokenPolicy,
    PlayerPoTokenPolicy,
    StreamingProtocol,
    YoutubeBaseInfoExtractor,
    _PoTokenContext,
    _split_innertube_client,
    short_client_name,
)
from .pot._director import initialize_pot_director
from .pot.provider import PoTokenContext, PoTokenRequest
from ..openload import PhantomJSwrapper
from ...jsinterp import JSInterpreter, LocalNameSpace
from ...networking.exceptions import HTTPError
from ...utils import (
    NO_DEFAULT,
    ExtractorError,
    LazyList,
    bug_reports_message,
    clean_html,
    datetime_from_str,
    filesize_from_tbr,
    filter_dict,
    float_or_none,
    format_field,
    get_first,
    int_or_none,
    join_nonempty,
    js_to_json,
    mimetype2ext,
    orderedSet,
    parse_codecs,
    parse_count,
    parse_duration,
    parse_iso8601,
    parse_qs,
    qualities,
    remove_end,
    remove_start,
    smuggle_url,
    str_or_none,
    str_to_int,
    strftime_or_none,
    traverse_obj,
    try_call,
    try_get,
    unescapeHTML,
    unified_strdate,
    unsmuggle_url,
    update_url_query,
    url_or_none,
    urljoin,
    variadic,
)
from ...utils.networking import clean_headers, clean_proxies, select_proxy

# String constants that all share the `__yt_dlp_` prefix.
# NOTE(review): going by the names, these are presumably private keys that the
# extractor sets on per-client streaming-data dicts (client name, PO-token
# fetchers, Innertube context, premium flag, fetch time) — the code that uses
# them is outside this excerpt, so confirm against the usages.
STREAMING_DATA_CLIENT_NAME = '__yt_dlp_client'
STREAMING_DATA_FETCH_SUBS_PO_TOKEN = '__yt_dlp_fetch_subs_po_token'
STREAMING_DATA_FETCH_GVS_PO_TOKEN = '__yt_dlp_fetch_gvs_po_token'
STREAMING_DATA_PLAYER_TOKEN_PROVIDED = '__yt_dlp_player_token_provided'
STREAMING_DATA_INNERTUBE_CONTEXT = '__yt_dlp_innertube_context'
STREAMING_DATA_IS_PREMIUM_SUBSCRIBER = '__yt_dlp_is_premium_subscriber'
STREAMING_DATA_FETCHED_TIMESTAMP = '__yt_dlp_fetched_timestamp'

# Link to the PO Token guide on the yt-dlp wiki
PO_TOKEN_GUIDE_URL = 'https://github.com/yt-dlp/yt-dlp/wiki/PO-Token-Guide'


class YoutubeIE(YoutubeBaseInfoExtractor):
    IE_DESC = 'YouTube'
    # Verbose-mode (?x) pattern accepting full video URLs as well as bare 11-character IDs.
    #  - Group 1 (optional) is everything that precedes the ID: the scheme, one of the
    #    listed hostnames and the path/query prefix leading up to the ID
    #    (v/, embed/, e/, shorts/, live/ paths or a `v=` parameter).
    #  - The named group `id` captures the 11-character video ID.
    #  - `(?(1).+)?` permits trailing text only when group 1 matched, so a bare ID
    #    has to be followed directly by `#` or the end of the string.
    # The template goes through str.format(): `{invidious}` is replaced with the
    # `|`-joined entries of YoutubeBaseInfoExtractor._INVIDIOUS_SITES, which is why the
    # literal quantifier is written with doubled braces (`{{11}}`).
    _VALID_URL = r'''(?x)^
                     (
                         (?:https?://|//)                                    # http(s):// or protocol-independent URL
                         (?:(?:(?:(?:\w+\.)?[yY][oO][uU][tT][uU][bB][eE](?:-nocookie|kids)?\.com|
                            (?:www\.)?deturl\.com/www\.youtube\.com|
                            (?:www\.)?pwnyoutube\.com|
                            (?:www\.)?hooktube\.com|
                            (?:www\.)?yourepeat\.com|
                            tube\.majestyc\.net|
                            {invidious}|
                            youtube\.googleapis\.com)/                        # the various hostnames, with wildcard subdomains
                         (?:.*?\#/)?                                          # handle anchor (#/) redirect urls
                         (?:                                                  # the various things that can precede the ID:
                             (?:(?:v|embed|e|shorts|live)/(?!videoseries|live_stream))  # v/ or embed/ or e/ or shorts/
                             |(?:                                             # or the v= param in all its forms
                                 (?:(?:watch|movie)(?:_popup)?(?:\.php)?/?)?  # preceding watch(_popup|.php) or nothing (like /?v=xxxx)
                                 (?:\?|\#!?)                                  # the params delimiter ? or # or #!
                                 (?:.*?[&;])??                                # any other preceding param (like /?s=tuff&v=xxxx or ?s=tuff&amp;v=V36LpHqtcDY)
                                 v=
                             )
                         ))
                         |(?:
                            youtu\.be|                                        # just youtu.be/xxxx
                            vid\.plus|                                        # or vid.plus/xxxx
                            zwearz\.com/watch|                                # or zwearz.com/watch/xxxx
                            {invidious}
                         )/
                         |(?:www\.)?cleanvideosearch\.com/media/action/yt/watch\?videoId=
                         )
                     )?                                                       # all until now is optional -> you can pass the naked ID
                     (?P<id>[0-9A-Za-z_-]{{11}})                              # here is it! the YouTube video ID
                     (?(1).+)?                                                # if we found the ID, everything can follow
                     (?:\#|$)'''.format(
        invidious='|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
    )
    # Patterns that locate embedded YouTube players/links inside HTML.
    # Every pattern exposes the embedded URL through the named group `url`.
    _EMBED_REGEX = [
        # A quoted youtube(-nocookie).com/(embed|v|p)/<11-char id> URL that directly follows
        # one of: an <iframe>/<embed> `src=`, `data-video-url=`, an <object> `data=`,
        # or the opening of an `embedSWF(` / `new SWFObject(` call.
        # NB: the parenthesis after `embedSWF` has to be an escaped literal `\(`;
        # spelling it `\(?:` would instead demand a literal colon after `embedSWF`
        # and never match real `embedSWF("...")` calls.
        r'''(?x)
            (?:
                <(?:[0-9A-Za-z-]+?)?iframe[^>]+?src=|
                data-video-url=|
                <embed[^>]+?src=|
                embedSWF\(\s*|
                <object[^>]+data=|
                new\s+SWFObject\(
            )
            (["\'])
                (?P<url>(?:https?:)?//(?:www\.)?youtube(?:-nocookie)?\.com/
                (?:embed|v|p)/[0-9A-Za-z_-]{11}.*?)
            \1''',
        # Placeholder links emitted by the "lazy-load-for-videos" WordPress plugin:
        # https://wordpress.org/plugins/lazy-load-for-videos/
        r'''(?xs)
            <a\s[^>]*\bhref="(?P<url>https://www\.youtube\.com/watch\?v=[0-9A-Za-z_-]{11})"
            \s[^>]*\bclass="[^"]*\blazy-load-youtube''',
    ]
    _RETURN_TYPE = 'video'  # XXX: How to handle multifeed?

    # Regexes that each capture a player identifier in the named group `id`:
    #   1. `/s/player/<id>/player...` or `/s/player/<id>/tv-player...` paths
    #   2. `/<id>/player_ias.vflset[/<locale>]/base.js` and
    #      `/<id>/player-plasma-ias-<phone|tablet>-<xx_XX>.vflset/base.js`
    #   3. a `vfl...` token appearing before a trailing `.js`
    # NOTE(review): presumably tried in this order against the player JS URL by
    # code outside this excerpt — confirm at the point of use.
    _PLAYER_INFO_RE = (
        r'/s/player/(?P<id>[a-zA-Z0-9_-]{8,})/(?:tv-)?player',
        r'/(?P<id>[a-zA-Z0-9_-]{8,})/player(?:_ias\.vflset(?:/[a-zA-Z]{2,3}_[a-zA-Z]{2,3})?|-plasma-ias-(?:phone|tablet)-[a-z]{2}_[A-Z]{2}\.vflset)/base\.js$',
        r'\b(?P<id>vfl[a-zA-Z0-9_-]+)\b.*?\.js$',
    )
    # Static per-itag metadata: maps an itag (as a string) to the format fields known for it
    # (`ext`, `width`/`height`, `acodec`/`vcodec`, `abr`, `fps`, `container`, `format_note`).
    # 3D entries carry `preference: -20` and HLS entries `preference: -10`.
    _formats = {  # NB: Used in YoutubeWebArchiveIE and GoogleDriveIE
        '5': {'ext': 'flv', 'width': 400, 'height': 240, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
        '6': {'ext': 'flv', 'width': 450, 'height': 270, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
        '13': {'ext': '3gp', 'acodec': 'aac', 'vcodec': 'mp4v'},
        '17': {'ext': '3gp', 'width': 176, 'height': 144, 'acodec': 'aac', 'abr': 24, 'vcodec': 'mp4v'},
        '18': {'ext': 'mp4', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 96, 'vcodec': 'h264'},
        '22': {'ext': 'mp4', 'width': 1280, 'height': 720, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
        '34': {'ext': 'flv', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
        '35': {'ext': 'flv', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
        # itag 36 videos are either 320x180 (BaW_jenozKc) or 320x240 (__2ABJjxzNo), abr varies as well
        '36': {'ext': '3gp', 'width': 320, 'acodec': 'aac', 'vcodec': 'mp4v'},
        '37': {'ext': 'mp4', 'width': 1920, 'height': 1080, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
        '38': {'ext': 'mp4', 'width': 4096, 'height': 3072, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
        '43': {'ext': 'webm', 'width': 640, 'height': 360, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
        '44': {'ext': 'webm', 'width': 854, 'height': 480, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
        '45': {'ext': 'webm', 'width': 1280, 'height': 720, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
        '46': {'ext': 'webm', 'width': 1920, 'height': 1080, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
        '59': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
        '78': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},


        # 3D videos
        '82': {'ext': 'mp4', 'height': 360, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
        '83': {'ext': 'mp4', 'height': 480, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
        '84': {'ext': 'mp4', 'height': 720, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
        '85': {'ext': 'mp4', 'height': 1080, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
        '100': {'ext': 'webm', 'height': 360, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8', 'preference': -20},
        '101': {'ext': 'webm', 'height': 480, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
        '102': {'ext': 'webm', 'height': 720, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},

        # Apple HTTP Live Streaming
        '91': {'ext': 'mp4', 'height': 144, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
        '92': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
        '93': {'ext': 'mp4', 'height': 360, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
        '94': {'ext': 'mp4', 'height': 480, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
        '95': {'ext': 'mp4', 'height': 720, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
        '96': {'ext': 'mp4', 'height': 1080, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
        '132': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
        '151': {'ext': 'mp4', 'height': 72, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 24, 'vcodec': 'h264', 'preference': -10},

        # DASH mp4 video
        '133': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '134': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '135': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '136': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '137': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '138': {'ext': 'mp4', 'format_note': 'DASH video', 'vcodec': 'h264'},  # Height can vary (https://github.com/ytdl-org/youtube-dl/issues/4559)
        '160': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '212': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '264': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '298': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
        '299': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
        '266': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'h264'},

        # DASH mp4 audio
        '139': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 48, 'container': 'm4a_dash'},
        '140': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 128, 'container': 'm4a_dash'},
        '141': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 256, 'container': 'm4a_dash'},
        '256': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
        '258': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
        '325': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'dtse', 'container': 'm4a_dash'},
        '328': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'ec-3', 'container': 'm4a_dash'},

        # DASH webm video
        '167': {'ext': 'webm', 'height': 360, 'width': 640, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '168': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '169': {'ext': 'webm', 'height': 720, 'width': 1280, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '170': {'ext': 'webm', 'height': 1080, 'width': 1920, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '218': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '219': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '278': {'ext': 'webm', 'height': 144, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp9'},
        '242': {'ext': 'webm', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '243': {'ext': 'webm', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '244': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '245': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '246': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '247': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '248': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '271': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        # itag 272 videos are either 3840x2160 (e.g. RtoitU2A-3E) or 7680x4320 (sLprVF6d7Ug)
        '272': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '302': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
        '303': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
        '308': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
        '313': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '315': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},

        # DASH webm audio
        '171': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 128},
        '172': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 256},

        # DASH webm audio with opus inside
        '249': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 50},
        '250': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 70},
        '251': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 160},

        # RTMP (unnamed)
        '_rtmp': {'protocol': 'rtmp'},

        # av01 video only formats sometimes served with "unknown" codecs
        '394': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
        '395': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
        '396': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'av01.0.01M.08'},
        '397': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'av01.0.04M.08'},
        '398': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'av01.0.05M.08'},
        '399': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'av01.0.08M.08'},
        '400': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
        '401': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
    }
    # Subtitle format identifiers.
    # NOTE(review): presumably the formats offered for each subtitle track — confirm at the point of use.
    _SUBTITLE_FORMATS = ('json3', 'srv1', 'srv2', 'srv3', 'ttml', 'srt', 'vtt')
    # NOTE(review): the three tuples below look like ordered Innertube client names used by default
    # for anonymous, logged-in and Premium sessions respectively — confirm against the
    # client-selection code, which is outside this excerpt.
    _DEFAULT_CLIENTS = ('tv_simply', 'tv', 'web')
    _DEFAULT_AUTHED_CLIENTS = ('tv', 'web_safari', 'web')
    # Premium does not require POT (except for subtitles)
    _DEFAULT_PREMIUM_CLIENTS = ('tv', 'web_creator', 'web')

    # NOTE(review): presumably switches off the framework's geo-bypass handling for this extractor — confirm.
    _GEO_BYPASS = False

    IE_NAME = 'youtube'
    _TESTS = [{
        'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&t=1s&end=9',
        'info_dict': {
            'id': 'BaW_jenozKc',
            'ext': 'mp4',
            'title': 'youtube-dl test video "\'/\\ä↭𝕐',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Science & Technology'],
            'channel': 'Philipp Hagemeister',
            'channel_follower_count': int,
            'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
            'channel_url': 'https://www.youtube.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
            'comment_count': int,
            'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
            'duration': 10,
            'end_time': 9,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'playable_in_embed': True,
            'start_time': 1,
            'tags': 'count:1',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1349198244,
            'upload_date': '20121002',
            'uploader': 'Philipp Hagemeister',
            'uploader_id': '@PhilippHagemeister',
            'uploader_url': 'https://www.youtube.com/@PhilippHagemeister',
            'view_count': int,
        },
        'skip': 'Video unavailable',
    }, {
        'note': 'Embed-only video (#1746)',
        'url': '//www.YouTube.com/watch?v=yZIXLfi8CZQ',
        'info_dict': {
            'id': 'yZIXLfi8CZQ',
            'ext': 'mp4',
            'title': 'Principal Sexually Assaults A Teacher - Episode 117 - 8th June 2012',
            'age_limit': 18,
            'description': 'md5:09b78bd971f1e3e289601dfba15ca4f7',
            'upload_date': '20120608',
        },
        'skip': 'Private video',
    }, {
        'note': 'Use the first video ID in the URL',
        'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&v=yZIXLfi8CZQ',
        'info_dict': {
            'id': 'BaW_jenozKc',
            'ext': 'mp4',
            'title': 'youtube-dl test video "\'/\\ä↭𝕐',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Science & Technology'],
            'channel': 'Philipp Hagemeister',
            'channel_follower_count': int,
            'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
            'channel_url': 'https://www.youtube.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
            'comment_count': int,
            'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
            'duration': 10,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'playable_in_embed': True,
            'tags': 'count:1',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1349198244,
            'upload_date': '20121002',
            'uploader': 'Philipp Hagemeister',
            'uploader_id': '@PhilippHagemeister',
            'uploader_url': 'https://www.youtube.com/@PhilippHagemeister',
            'view_count': int,
        },
        'skip': 'Video unavailable',
    }, {
        'note': '256k DASH audio (format 141) via DASH manifest',
        'url': 'https://www.youtube.com/watch?v=a9LDPn-MO4I',
        'info_dict': {
            'id': 'a9LDPn-MO4I',
            'ext': 'm4a',
            'title': 'UHDTV TEST 8K VIDEO.mp4',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Science & Technology'],
            'channel': '8KVIDEO',
            'channel_follower_count': int,
            'channel_id': 'UC8cn-cnCZ2FnxmjfkoLGpsQ',
            'channel_url': 'https://www.youtube.com/channel/UC8cn-cnCZ2FnxmjfkoLGpsQ',
            'comment_count': int,
            'description': '',
            'duration': 60,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:8',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1349185252,
            'upload_date': '20121002',
            'uploader': '8KVIDEO',
            'uploader_id': '@8KVIDEO',
            'uploader_url': 'https://www.youtube.com/@8KVIDEO',
            'view_count': int,
        },
        'params': {
            'format': '141',
            'skip_download': True,
            'youtube_include_dash_manifest': True,
        },
        'skip': 'format 141 not served anymore',
    }, {
        # DASH manifest with encrypted signature
        'url': 'https://www.youtube.com/watch?v=IB3lcPjvWLA',
        'info_dict': {
            'id': 'IB3lcPjvWLA',
            'ext': 'm4a',
            'title': 'Afrojack, Spree Wilson - The Spark (Official Music Video) ft. Spree Wilson',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Music'],
            'channel': 'Afrojack',
            'channel_follower_count': int,
            'channel_id': 'UChuZAo1RKL85gev3Eal9_zg',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UChuZAo1RKL85gev3Eal9_zg',
            'comment_count': int,
            'description': 'md5:8f5e2b82460520b619ccac1f509d43bf',
            'duration': 244,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:19',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1381496404,
            'upload_date': '20131011',
            'uploader': 'Afrojack',
            'uploader_id': '@AfrojackVEVO',
            'uploader_url': 'https://www.youtube.com/@AfrojackVEVO',
            'view_count': int,
        },
        'params': {
            'format': '141/bestaudio[ext=m4a]',
            'skip_download': True,
            'youtube_include_dash_manifest': True,
        },
    }, {
        # Age-gated video
        # https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
        'note': 'Embed allowed age-gated video; works with web_embedded',
        'url': 'https://youtube.com/watch?v=HtVdAasjOgU',
        'info_dict': {
            'id': 'HtVdAasjOgU',
            'ext': 'mp4',
            'title': 'The Witcher 3: Wild Hunt - The Sword Of Destiny Trailer',
            'age_limit': 18,
            'availability': 'needs_auth',
            'categories': ['Gaming'],
            'channel': 'The Witcher',
            'channel_follower_count': int,
            'channel_id': 'UCzybXLxv08IApdjdN0mJhEg',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCzybXLxv08IApdjdN0mJhEg',
            'comment_count': int,
            'description': 'md5:595a43060c51c2a8cb61dd33c18e5fbd',
            'duration': 142,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:17',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1401991663,
            'upload_date': '20140605',
            'uploader': 'The Witcher',
            'uploader_id': '@thewitcher',
            'uploader_url': 'https://www.youtube.com/@thewitcher',
            'view_count': int,
        },
        'params': {'skip_download': True},
        'skip': 'Age-restricted; requires authentication',
    }, {
        'note': 'Formerly an age-gated video with embed allowed in public site',
        'url': 'https://youtube.com/watch?v=HsUATh_Nc2U',
        'info_dict': {
            'id': 'HsUATh_Nc2U',
            'ext': 'mp4',
            'title': 'Godzilla 2 (Official Video)',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Entertainment'],
            'channel': 'FlyingKitty',
            'channel_follower_count': int,
            'channel_id': 'UCYQT13AtrJC0gsM1far_zJg',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCYQT13AtrJC0gsM1far_zJg',
            'comment_count': int,
            'description': 'md5:bf77e03fcae5529475e500129b05668a',
            'duration': 177,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:2',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1586358900,
            'upload_date': '20200408',
            'uploader': 'FlyingKitty',
            'uploader_id': '@FlyingKitty900',
            'uploader_url': 'https://www.youtube.com/@FlyingKitty900',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        'note': 'Age-gated video embedable only with clientScreen=EMBED',
        'url': 'https://youtube.com/watch?v=Tq92D6wQ1mg',
        'info_dict': {
            'id': 'Tq92D6wQ1mg',
            'ext': 'mp4',
            'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
            'age_limit': 18,
            'availability': 'needs_auth',
            'categories': ['Entertainment'],
            'channel': 'Projekt Melody',
            'channel_follower_count': int,
            'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
            'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
            'comment_count': int,
            'description': 'md5:17eccca93a786d51bc67646756894066',
            'duration': 106,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:5',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1577508724,
            'upload_date': '20191228',
            'uploader': 'Projekt Melody',
            'uploader_id': '@ProjektMelody',
            'uploader_url': 'https://www.youtube.com/@ProjektMelody',
            'view_count': int,
        },
        'skip': 'Age-restricted; requires authentication',
    }, {
        'note': 'Non-age-gated non-embeddable video',
        'url': 'https://youtube.com/watch?v=MeJVWBSsPAY',
        'info_dict': {
            'id': 'MeJVWBSsPAY',
            'ext': 'mp4',
            'title': 'OOMPH! - Such Mich Find Mich (Lyrics)',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Music'],
            'channel': 'Herr Lurik',
            'channel_follower_count': int,
            'channel_id': 'UCdR3RSDPqub28LjZx0v9-aA',
            'channel_url': 'https://www.youtube.com/channel/UCdR3RSDPqub28LjZx0v9-aA',
            'description': 'md5:205c1049102a4dffa61e4831c1f16851',
            'duration': 210,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': False,
            'tags': 'count:5',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1375214517,
            'upload_date': '20130730',
            'uploader': 'Herr Lurik',
            'uploader_id': '@HerrLurik',
            'uploader_url': 'https://www.youtube.com/@HerrLurik',
            'view_count': int,
        },
    }, {
        'note': 'Non-bypassable age-gated video',
        'url': 'https://youtube.com/watch?v=Cr381pDsSsA',
        'only_matching': True,
    }, {
        # video_info is None
        # https://github.com/ytdl-org/youtube-dl/issues/4421
        # YouTube Red ad is not captured for creator
        'url': '__2ABJjxzNo',
        'info_dict': {
            'id': '__2ABJjxzNo',
            'ext': 'mp4',
            'title': 'Deadmau5 - Some Chords (HD)',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Music'],
            'channel': 'deadmau5',
            'channel_follower_count': int,
            'channel_id': 'UCYEK6xds6eo-3tr4xRdflmQ',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCYEK6xds6eo-3tr4xRdflmQ',
            'comment_count': int,
            'description': 'md5:c27e1e9e095a3d9dd99de2f0f377ba06',
            'duration': 266,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:14',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1272659179,
            'upload_date': '20100430',
            'uploader': 'deadmau5',
            'uploader_id': '@deadmau5',
            'uploader_url': 'https://www.youtube.com/@deadmau5',
            'view_count': int,
        },
        'expected_warnings': ['DASH manifest missing'],
        'params': {'skip_download': True},
    }, {
        # https://github.com/ytdl-org/youtube-dl/issues/4431
        'url': 'lqQg6PlCWgI',
        'info_dict': {
            'id': 'lqQg6PlCWgI',
            'ext': 'mp4',
            'title': 'Hockey - Women -  GER-AUS - London 2012 Olympic Games',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Sports'],
            'channel': 'Olympics',
            'channel_follower_count': int,
            'channel_id': 'UCTl3QQTvqHFjurroKxexy2Q',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCTl3QQTvqHFjurroKxexy2Q',
            'description': 'md5:04bbbf3ccceb6795947572ca36f45904',
            'duration': 6085,
            'like_count': int,
            'live_status': 'was_live',
            'media_type': 'livestream',
            'playable_in_embed': True,
            'release_date': '20120731',
            'release_timestamp': 1343767800,
            'tags': 'count:10',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1440707674,
            'upload_date': '20150827',
            'uploader': 'Olympics',
            'uploader_id': '@Olympics',
            'uploader_url': 'https://www.youtube.com/@Olympics',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # Non-square pixels
        'url': 'https://www.youtube.com/watch?v=_b-2C3KPAM0',
        'info_dict': {
            'id': '_b-2C3KPAM0',
            'ext': 'mp4',
            'title': '[A-made] 變態妍字幕版 太妍 我就是這樣的人',
            'age_limit': 0,
            'availability': 'unlisted',
            'categories': ['People & Blogs'],
            'channel': '孫ᄋᄅ',
            'channel_follower_count': int,
            'channel_id': 'UCS-xxCmRaA6BFdmgDPA_BIw',
            'channel_url': 'https://www.youtube.com/channel/UCS-xxCmRaA6BFdmgDPA_BIw',
            'comment_count': int,
            'description': 'md5:636f03cf211e7687daffe5bded88a94f',
            'duration': 85,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'stretched_ratio': 16 / 9.,
            'tags': 'count:11',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1299776999,
            'upload_date': '20110310',
            'uploader': '孫ᄋᄅ',
            'uploader_id': '@AllenMeow',
            'uploader_url': 'https://www.youtube.com/@AllenMeow',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # url_encoded_fmt_stream_map is empty string (deprecated)
        # https://github.com/ytdl-org/youtube-dl/commit/3a9fadd6dfc127ed0707b218b11ac10c654af1e2
        # https://github.com/ytdl-org/youtube-dl/commit/67299f23d8b1894120e875edf97440de87e22308
        'url': 'qEJwOuvDf7I',
        'only_matching': True,
    }, {
        # Extraction from multiple DASH manifests
        # https://github.com/ytdl-org/youtube-dl/pull/6097
        'url': 'https://www.youtube.com/watch?v=FIl7x6_3R5Y',
        'info_dict': {
            'id': 'FIl7x6_3R5Y',
            'ext': 'mp4',
            'title': '[60fps] 150614  마마무 솔라 \'Mr. 애매모호\' 라이브 직캠 @대학로 게릴라 콘서트',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['People & Blogs'],
            'channel': 'dorappi2000',
            'channel_follower_count': int,
            'channel_id': 'UCNlmrKRHLHcd2gq6LtPOTlQ',
            'channel_url': 'https://www.youtube.com/channel/UCNlmrKRHLHcd2gq6LtPOTlQ',
            'description': 'md5:116377fd2963b81ec4ce64b542173306',
            'duration': 220,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:12',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1435276932,
            'upload_date': '20150626',
            'uploader': 'dorappi2000',
            'uploader_id': '@dorappi2000',
            'uploader_url': 'https://www.youtube.com/@dorappi2000',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # DASH manifest with segment_list
        # https://github.com/ytdl-org/youtube-dl/pull/5886
        'url': 'https://www.youtube.com/embed/CsmdDsKjzN8',
        'info_dict': {
            'id': 'CsmdDsKjzN8',
            'ext': 'mp4',
            'title': 'Retransmisión XVIII Media maratón Zaragoza 2015',
            'age_limit': 0,
            'availability': 'unlisted',
            'categories': ['Sports'],
            'channel': 'Airtek | LED streaming',
            'channel_follower_count': int,
            'channel_id': 'UCzTzUmjXxxacNnL8I3m4LnQ',
            'channel_url': 'https://www.youtube.com/channel/UCzTzUmjXxxacNnL8I3m4LnQ',
            'comment_count': int,
            'description': 'md5:fcac84e6c545114766f670236fc10196',
            'duration': 4394,
            'like_count': int,
            'live_status': 'was_live',
            'media_type': 'livestream',
            'playable_in_embed': True,
            'release_date': '20150510',
            'release_timestamp': 1431241011,
            'tags': 'count:31',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1430505417,
            'upload_date': '20150501',
            'uploader': 'Airtek | LED streaming',
            'uploader_id': '@airtekledstreaming7916',
            'uploader_url': 'https://www.youtube.com/@airtekledstreaming7916',
            'view_count': int,
        },
        'params': {
            'format': '135',  # bestvideo
            'skip_download': True,
            'youtube_include_dash_manifest': True,
        },
    }, {
        # Multi-camera events (deprecated)
        # https://web.archive.org/web/20200308092705/https://support.google.com/youtube/answer/2853812
        'url': 'https://www.youtube.com/watch?v=zaPI8MvL8pg',
        'only_matching': True,
    }, {
        # Multi-camera events (deprecated)
        # https://github.com/ytdl-org/youtube-dl/issues/8536
        'url': 'https://www.youtube.com/watch?v=gVfLd0zydlo',
        'only_matching': True,
    }, {
        'url': 'https://vid.plus/FlRa-iH7PGw',
        'only_matching': True,
    }, {
        'url': 'https://zwearz.com/watch/9lWxNJF-ufM/electra-woman-dyna-girl-official-trailer-grace-helbig.html',
        'only_matching': True,
    }, {
        # Title with JS-like syntax "};"
        # https://github.com/ytdl-org/youtube-dl/issues/7468
        # Also tests cut-off URL expansion in video description
        # https://github.com/ytdl-org/youtube-dl/issues/1892
        # https://github.com/ytdl-org/youtube-dl/issues/8164
        'url': 'https://www.youtube.com/watch?v=lsguqyKfVQg',
        'info_dict': {
            'id': 'lsguqyKfVQg',
            'ext': 'mp4',
            'title': '{dark walk}; Loki/AC/Dishonored; collab w/Elflover21',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Film & Animation'],
            'channel': 'IronSoulElf',
            'channel_follower_count': int,
            'channel_id': 'UCTSRgz5jylBvFt_S7wnsqLQ',
            'channel_url': 'https://www.youtube.com/channel/UCTSRgz5jylBvFt_S7wnsqLQ',
            'comment_count': int,
            'description': 'md5:8085699c11dc3f597ce0410b0dcbb34a',
            'duration': 133,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:13',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1447959261,
            'upload_date': '20151119',
            'uploader': 'IronSoulElf',
            'uploader_id': '@IronSoulElf',
            'uploader_url': 'https://www.youtube.com/@IronSoulElf',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # Tags with '};'
        # https://github.com/ytdl-org/youtube-dl/issues/7468
        'url': 'https://www.youtube.com/watch?v=Ms7iBXnlUO8',
        'only_matching': True,
    }, {
        # Video with yt:stretch=17:0
        'url': 'https://www.youtube.com/watch?v=Q39EVAstoRM',
        'info_dict': {
            'id': 'Q39EVAstoRM',
            'ext': 'mp4',
            'title': 'Clash Of Clans#14 Dicas De Ataque Para CV 4',
            'description': 'md5:ee18a25c350637c8faff806845bddee9',
            'upload_date': '20151107',
        },
        'skip': 'This video does not exist.',
    }, {
        # Video with incomplete 'yt:stretch=16:'
        'url': 'https://www.youtube.com/watch?v=FRhJzUSJbGI',
        'only_matching': True,
    }, {
        # Video licensed under Creative Commons
        'url': 'https://www.youtube.com/watch?v=M4gD1WSo5mA',
        'info_dict': {
            'id': 'M4gD1WSo5mA',
            'ext': 'mp4',
            'title': 'William Fisher, CopyrightX: Lecture 3.2, The Subject Matter of Copyright: Drama and choreography',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Education'],
            'channel': 'The Berkman Klein Center for Internet & Society',
            'channel_follower_count': int,
            'channel_id': 'UCuLGmD72gJDBwmLw06X58SA',
            'channel_url': 'https://www.youtube.com/channel/UCuLGmD72gJDBwmLw06X58SA',
            'chapters': 'count:4',
            'description': 'md5:a677553cf0840649b731a3024aeff4cc',
            'duration': 721,
            'license': 'Creative Commons Attribution license (reuse allowed)',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:3',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1422422076,
            'upload_date': '20150128',
            'uploader': 'The Berkman Klein Center for Internet & Society',
            'uploader_id': '@BKCHarvard',
            'uploader_url': 'https://www.youtube.com/@BKCHarvard',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # https://github.com/ytdl-org/youtube-dl/commit/fd050249afce1bcc9e7f4a127069375467007b55
        'url': 'https://www.youtube.com/watch?v=eQcmzGIKrzg',
        'info_dict': {
            'id': 'eQcmzGIKrzg',
            'ext': 'mp4',
            'title': 'Democratic Socialism and Foreign Policy | Bernie Sanders',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['News & Politics'],
            'channel': 'Bernie Sanders',
            'channel_follower_count': int,
            'channel_id': 'UCH1dpzjCEiGAt8CXkryhkZg',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCH1dpzjCEiGAt8CXkryhkZg',
            'chapters': 'count:5',
            'comment_count': int,
            'description': 'md5:13a2503d7b5904ef4b223aa101628f39',
            'duration': 4060,
            'heatmap': 'count:100',
            'license': 'Creative Commons Attribution license (reuse allowed)',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:12',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1447987198,
            'upload_date': '20151120',
            'uploader': 'Bernie Sanders',
            'uploader_id': '@BernieSanders',
            'uploader_url': 'https://www.youtube.com/@BernieSanders',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        'url': 'https://www.youtube.com/watch?feature=player_embedded&amp;amp;v=V36LpHqtcDY',
        'only_matching': True,
    }, {
        # YouTube Red paid video
        # https://github.com/ytdl-org/youtube-dl/issues/10059
        'url': 'https://www.youtube.com/watch?v=i1Ko8UG-Tdo',
        'only_matching': True,
    }, {
        # Rental video preview
        # https://github.com/ytdl-org/youtube-dl/commit/fd050249afce1bcc9e7f4a127069375467007b55
        'url': 'https://www.youtube.com/watch?v=yYr8q0y5Jfg',
        'info_dict': {
            'id': 'uGpuVWrhIzE',
            'ext': 'mp4',
            'title': 'Piku - Trailer',
            'description': 'md5:c36bd60c3fd6f1954086c083c72092eb',
            'upload_date': '20150811',
            'license': 'Standard YouTube License',
        },
        'skip': 'This video is not available.',
    }, {
        # YouTube Red video with episode data
        'url': 'https://www.youtube.com/watch?v=iqKdEhx-dD4',
        'info_dict': {
            'id': 'iqKdEhx-dD4',
            'ext': 'mp4',
            'title': 'Isolation - Mind Field (Ep 1)',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Entertainment'],
            'channel': 'Vsauce',
            'channel_follower_count': int,
            'channel_id': 'UC6nSFpj9HTCZ5t-N3Rm3-HA',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UC6nSFpj9HTCZ5t-N3Rm3-HA',
            'comment_count': int,
            'description': 'md5:f540112edec5d09fc8cc752d3d4ba3cd',
            'duration': 2085,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:12',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1484761047,
            'upload_date': '20170118',
            'uploader': 'Vsauce',
            'uploader_id': '@Vsauce',
            'uploader_url': 'https://www.youtube.com/@Vsauce',
            'view_count': int,
        },
        'expected_warnings': ['Skipping DASH manifest'],
        'params': {'skip_download': True},
    }, {
        # The following content has been identified by the YouTube community
        # as inappropriate or offensive to some audiences.
        'url': 'https://www.youtube.com/watch?v=6SJNVb0GnPI',
        'info_dict': {
            'id': '6SJNVb0GnPI',
            'ext': 'mp4',
            'title': 'Race Differences in Intelligence',
            'description': 'md5:5d161533167390427a1f8ee89a1fc6f1',
            'duration': 965,
            'upload_date': '20140124',
        },
        'skip': 'This video has been removed for violating YouTube\'s policy on hate speech.',
    }, {
        # itag 212
        'url': '1t24XAntNCY',
        'only_matching': True,
    }, {
        # geo restricted to JP
        'url': 'sJL6WA-aGkQ',
        'only_matching': True,
    }, {
        'url': 'https://invidio.us/watch?v=BaW_jenozKc',
        'only_matching': True,
    }, {
        'url': 'https://redirect.invidious.io/watch?v=BaW_jenozKc',
        'only_matching': True,
    }, {
        # from https://nitter.pussthecat.org/YouTube/status/1360363141947944964#m
        'url': 'https://redirect.invidious.io/Yh0AhrY9GjA',
        'only_matching': True,
    }, {
        # DRM protected
        'url': 'https://www.youtube.com/watch?v=s7_qI6_mIXc',
        'only_matching': True,
    }, {
        # Video with unsupported adaptive stream type formats
        # https://github.com/ytdl-org/youtube-dl/commit/4fe54c128a11d394874505af75aaa5a2276aa3ba
        'url': 'https://www.youtube.com/watch?v=Z4Vy8R84T1U',
        'only_matching': True,
    }, {
        # YouTube Music auto-generated description
        # TODO: fix metadata extraction
        # https://github.com/ytdl-org/youtube-dl/issues/20599
        'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
        'info_dict': {
            'id': 'MgNrAu2pzNs',
            'ext': 'mp4',
            'title': 'Voyeur Girl',
            'age_limit': 0,
            'album': 'it\'s too much love to know my dear',
            'alt_title': 'Voyeur Girl',
            'artists': ['Stephen'],
            'availability': 'public',
            'categories': ['Music'],
            'channel': 'Stephen',  # TODO: should be 'Stephen - Topic'
            'channel_follower_count': int,
            'channel_id': 'UC-pWHpBjdGG69N9mM2auIAA',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UC-pWHpBjdGG69N9mM2auIAA',
            'comment_count': int,
            'creators': ['Stephen'],
            'description': 'md5:7ae382a65843d6df2685993e90a8628f',
            'duration': 169,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'release_date': '20190313',
            'tags': 'count:11',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1552385807,
            'track': 'Voyeur Girl',
            'upload_date': '20190312',
            'uploader': 'Stephen',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        'url': 'https://www.youtubekids.com/watch?v=3b8nCWDgZ6Q',
        'only_matching': True,
    }, {
        # invalid -> valid video id redirection
        # https://github.com/ytdl-org/youtube-dl/pull/25063
        'url': 'DJztXj2GPfl',
        'info_dict': {
            'id': 'DJztXj2GPfk',
            'ext': 'mp4',
            'title': 'Panjabi MC - Mundian To Bach Ke (The Dictator Soundtrack)',
            'description': 'md5:bf577a41da97918e94fa9798d9228825',
            'upload_date': '20090125',
            'artist': 'Panjabi MC',
            'track': 'Beware of the Boys (Mundian to Bach Ke) - Motivo Hi-Lectro Remix',
            'album': 'Beware of the Boys (Mundian To Bach Ke)',
        },
        'skip': 'Video unavailable',
    }, {
        # empty description results in an empty string
        # https://github.com/ytdl-org/youtube-dl/pull/26575
        'url': 'https://www.youtube.com/watch?v=x41yOUIvK2k',
        'info_dict': {
            'id': 'x41yOUIvK2k',
            'ext': 'mp4',
            'title': 'IMG 3456',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Pets & Animals'],
            'channel': 'l\'Or Vert asbl',
            'channel_follower_count': int,
            'channel_id': 'UCo03ZQPBW5U4UC3regpt1nw',
            'channel_url': 'https://www.youtube.com/channel/UCo03ZQPBW5U4UC3regpt1nw',
            'description': '',
            'duration': 7,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': [],
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1497343210,
            'upload_date': '20170613',
            'uploader': 'l\'Or Vert asbl',
            'uploader_id': '@ElevageOrVert',
            'uploader_url': 'https://www.youtube.com/@ElevageOrVert',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # with '};' inside yt initial data (see [1])
        # see [2] for an example with '};' inside ytInitialPlayerResponse
        # 1. https://github.com/ytdl-org/youtube-dl/issues/27093
        # 2. https://github.com/ytdl-org/youtube-dl/issues/27216
        'url': 'https://www.youtube.com/watch?v=CHqg6qOn4no',
        'info_dict': {
            'id': 'CHqg6qOn4no',
            'ext': 'mp4',
            'title': 'Part 77   Sort a list of simple types in c#',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Education'],
            'channel': 'kudvenkat',
            'channel_follower_count': int,
            'channel_id': 'UCCTVrRB5KpIiK6V2GGVsR1Q',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCCTVrRB5KpIiK6V2GGVsR1Q',
            'chapters': 'count:4',
            'comment_count': int,
            'description': 'md5:b8746fa52e10cdbf47997903f13b20dc',
            'duration': 522,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:12',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1377976349,
            'upload_date': '20130831',
            'uploader': 'kudvenkat',
            'uploader_id': '@Csharp-video-tutorialsBlogspot',
            'uploader_url': 'https://www.youtube.com/@Csharp-video-tutorialsBlogspot',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # another example of '};' in ytInitialData
        'url': 'https://www.youtube.com/watch?v=gVfgbahppCY',
        'only_matching': True,
    }, {
        'url': 'https://www.youtube.com/watch_popup?v=63RmMXCd_bQ',
        'only_matching': True,
    }, {
        # https://github.com/ytdl-org/youtube-dl/pull/28094
        'url': 'OtqTfy26tG0',
        'info_dict': {
            'id': 'OtqTfy26tG0',
            'ext': 'mp4',
            'title': 'Burn Out',
            'age_limit': 0,
            'album': 'Every Day',
            'alt_title': 'Burn Out',
            'artists': ['The Cinematic Orchestra'],
            'availability': 'public',
            'categories': ['Music'],
            'channel': 'The Cinematic Orchestra',
            'channel_follower_count': int,
            'channel_id': 'UCIzsJBIyo8hhpFm1NK0uLgw',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCIzsJBIyo8hhpFm1NK0uLgw',
            'comment_count': int,
            'creators': ['The Cinematic Orchestra'],
            'description': 'md5:fee8b19b7ba433cc2957d1c7582067ac',
            'duration': 614,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'release_date': '20020513',
            'release_year': 2023,
            'tags': 'count:3',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1416497379,
            'track': 'Burn Out',
            'upload_date': '20141120',
            'uploader': 'The Cinematic Orchestra',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # controversial video, only works with bpctr when authenticated with cookies
        'url': 'https://www.youtube.com/watch?v=nGC3D_FkCmg',
        'only_matching': True,
    }, {
        # controversial video, requires bpctr/contentCheckOk
        'url': 'https://www.youtube.com/watch?v=SZJvDhaSDnc',
        'info_dict': {
            'id': 'SZJvDhaSDnc',
            'ext': 'mp4',
            'title': 'San Diego teen commits suicide after bullying over embarrassing video',
            'age_limit': 18,
            'availability': 'needs_auth',
            'categories': ['News & Politics'],
            'channel': 'CBS Mornings',
            'channel_follower_count': int,
            'channel_id': 'UC-SJ6nODDmufqBzPBwCvYvQ',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UC-SJ6nODDmufqBzPBwCvYvQ',
            'comment_count': int,
            'description': 'md5:acde3a73d3f133fc97e837a9f76b53b7',
            'duration': 170,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:5',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1405513526,
            'upload_date': '20140716',
            'uploader': 'CBS Mornings',
            'uploader_id': '@CBSMornings',
            'uploader_url': 'https://www.youtube.com/@CBSMornings',
            'view_count': int,
        },
        'skip': 'Age-restricted; requires authentication',
    }, {
        # restricted location
        # https://github.com/ytdl-org/youtube-dl/issues/28685
        'url': 'cBvYw8_A0vQ',
        'info_dict': {
            'id': 'cBvYw8_A0vQ',
            'ext': 'mp4',
            'title': '4K Ueno Okachimachi  Street  Scenes  上野御徒町歩き',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Travel & Events'],
            'channel': 'Walk around Japan',
            'channel_follower_count': int,
            'channel_id': 'UC3o_t8PzBmXf5S9b7GLx1Mw',
            'channel_url': 'https://www.youtube.com/channel/UC3o_t8PzBmXf5S9b7GLx1Mw',
            'description': 'md5:ea770e474b7cd6722b4c95b833c03630',
            'duration': 1456,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:5',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1605884416,
            'upload_date': '20201120',
            'uploader': 'Walk around Japan',
            'uploader_id': '@walkaroundjapan7124',
            'uploader_url': 'https://www.youtube.com/@walkaroundjapan7124',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # Has multiple audio streams
        'url': 'WaOKSUlf4TM',
        'only_matching': True,
    }, {
        # Requires Premium: has format 141 when requested using YTM url
        'url': 'https://music.youtube.com/watch?v=XclachpHxis',
        'only_matching': True,
    }, {
        # multiple subtitles with same lang_code
        'url': 'https://www.youtube.com/watch?v=wsQiKKfKxug',
        'only_matching': True,
    }, {
        # Force use of the android client fallback
        'url': 'https://www.youtube.com/watch?v=YOelRv7fMxY',
        'info_dict': {
            'id': 'YOelRv7fMxY',
            'ext': '3gp',
            'title': 'DIGGING A SECRET TUNNEL Part 1',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Entertainment'],
            'channel': 'colinfurze',
            'channel_follower_count': int,
            'channel_id': 'UCp68_FLety0O-n9QU6phsgw',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCp68_FLety0O-n9QU6phsgw',
            'chapters': 'count:4',
            'comment_count': int,
            'description': 'md5:5d5991195d599b56cd0c4148907eec50',
            'duration': 596,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:6',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1624546829,
            'upload_date': '20210624',
            'uploader': 'colinfurze',
            'uploader_id': '@colinfurze',
            'uploader_url': 'https://www.youtube.com/@colinfurze',
            'view_count': int,
        },
        'params': {
            'extractor_args': {'youtube': {'player_client': ['android']}},
            'format': '17',  # 3gp format available on android
            'skip_download': True,
        },
        'skip': 'Android client broken',
    }, {
        # Skip download of additional client configs (remix client config in this case)
        'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
        'only_matching': True,
        'params': {'extractor_args': {'youtube': {'player_skip': ['configs']}}},
    }, {
        # shorts
        'url': 'https://www.youtube.com/shorts/BGQWPY4IigY',
        'only_matching': True,
    }, {
        'note': 'Storyboards',
        'url': 'https://www.youtube.com/watch?v=5KLPxDtMqe8',
        'info_dict': {
            'id': '5KLPxDtMqe8',
            'ext': 'mhtml',
            'title': 'Your Brain is Plastic',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Education'],
            'channel': 'SciShow',
            'channel_follower_count': int,
            'channel_id': 'UCZYTClx2T1of7BRZ86-8fow',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCZYTClx2T1of7BRZ86-8fow',
            'chapters': 'count:5',
            'comment_count': int,
            'description': 'md5:89cd86034bdb5466cd87c6ba206cd2bc',
            'duration': 248,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:12',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1395685455,
            'upload_date': '20140324',
            'uploader': 'SciShow',
            'uploader_id': '@SciShow',
            'uploader_url': 'https://www.youtube.com/@SciShow',
            'view_count': int,
        },
        'params': {
            'format': 'mhtml',
            'skip_download': True,
        },
    }, {
        # Ensure video upload_date is in UTC timezone (video was uploaded 1641170939)
        'url': 'https://www.youtube.com/watch?v=2NUZ8W2llS4',
        'info_dict': {
            'id': '2NUZ8W2llS4',
            'ext': 'mp4',
            'title': 'The NP that test your phone performance 🙂',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Gaming'],
            'channel': 'Leon Nguyen',
            'channel_follower_count': int,
            'channel_id': 'UCRqNBSOHgilHfAczlUmlWHA',
            'channel_url': 'https://www.youtube.com/channel/UCRqNBSOHgilHfAczlUmlWHA',
            'comment_count': int,
            'description': 'md5:144494b24d4f9dfacb97c1bbef5de84d',
            'duration': 21,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:23',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1641170939,
            'upload_date': '20220103',
            'uploader': 'Leon Nguyen',
            'uploader_id': '@LeonNguyen',
            'uploader_url': 'https://www.youtube.com/@LeonNguyen',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # Date text is for a premiered video; ensure upload_date is in UTC (published 1641172509)
        'url': 'https://www.youtube.com/watch?v=mzZzzBU6lrM',
        'info_dict': {
            'id': 'mzZzzBU6lrM',
            'ext': 'mp4',
            'title': 'I Met GeorgeNotFound In Real Life...',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Entertainment'],
            'channel': 'Quackity',
            'channel_follower_count': int,
            'channel_id': 'UC_8NknAFiyhOUaZqHR3lq3Q',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UC_8NknAFiyhOUaZqHR3lq3Q',
            'comment_count': int,
            'description': 'md5:42e72df3d4d5965903a2b9359c3ccd25',
            'duration': 955,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'release_date': '20220103',
            'release_timestamp': 1641172509,
            'tags': 'count:26',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1641172509,
            'upload_date': '20220103',
            'uploader': 'Quackity',
            'uploader_id': '@Quackity',
            'uploader_url': 'https://www.youtube.com/@Quackity',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # continuous livestream.
        # Upload date was 2022-07-12T05:12:29-07:00, while stream start is 2022-07-12T15:59:30+00:00
        'url': 'https://www.youtube.com/watch?v=jfKfPfyJRdk',
        'info_dict': {
            'id': 'jfKfPfyJRdk',
            'ext': 'mp4',
            'title': str,
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Music'],
            'channel': 'Lofi Girl',
            'channel_follower_count': int,
            'channel_id': 'UCSJ4gkVC6NrvII8umztf0Ow',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCSJ4gkVC6NrvII8umztf0Ow',
            'concurrent_view_count': int,
            'description': 'md5:48841fcfc1be6131d729fa7b4a7784cb',
            'like_count': int,
            'live_status': 'is_live',
            'media_type': 'livestream',
            'playable_in_embed': True,
            'release_date': '20220712',
            'release_timestamp': 1657641570,
            'tags': 'count:32',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1657627949,
            'upload_date': '20220712',
            'uploader': 'Lofi Girl',
            'uploader_id': '@LofiGirl',
            'uploader_url': 'https://www.youtube.com/@LofiGirl',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        'url': 'https://www.youtube.com/watch?v=tjjjtzRLHvA',
        'info_dict': {
            'id': 'tjjjtzRLHvA',
            'ext': 'mp4',
            'title': 'ハッシュタグ無し };if window.ytcsi',
            'age_limit': 0,
            'availability': 'unlisted',
            'categories': ['Music'],
            'channel': 'Lesmiscore',
            'channel_follower_count': int,
            'channel_id': 'UCdqltm_7iv1Vs6kp6Syke5A',
            'channel_url': 'https://www.youtube.com/channel/UCdqltm_7iv1Vs6kp6Syke5A',
            'description': '',
            'duration': 6,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'short',
            'playable_in_embed': True,
            'tags': [],
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1648005313,
            'upload_date': '20220323',
            'uploader': 'Lesmiscore',
            'uploader_id': '@lesmiscore',
            'uploader_url': 'https://www.youtube.com/@lesmiscore',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # Prefer primary title+description language metadata by default
        # Do not prefer translated description if primary is empty
        'url': 'https://www.youtube.com/watch?v=el3E4MbxRqQ',
        'info_dict': {
            'id': 'el3E4MbxRqQ',
            'ext': 'mp4',
            'title': 'dlp test video 2 - primary sv no desc',
            'age_limit': 0,
            'availability': 'unlisted',
            'categories': ['People & Blogs'],
            'channel': 'cole-dlp-test-acc',
            'channel_id': 'UCiu-3thuViMebBjw_5nWYrA',
            'channel_url': 'https://www.youtube.com/channel/UCiu-3thuViMebBjw_5nWYrA',
            'description': '',
            'duration': 5,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': [],
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1662677394,
            'upload_date': '20220908',
            'uploader': 'cole-dlp-test-acc',
            'uploader_id': '@coletdjnz',
            'uploader_url': 'https://www.youtube.com/@coletdjnz',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # Extractor argument: prefer translated title+description
        'url': 'https://www.youtube.com/watch?v=gHKT4uU8Zng',
        'info_dict': {
            'id': 'gHKT4uU8Zng',
            'ext': 'mp4',
            'title': 'dlp test video title primary (en-GB)',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['People & Blogs'],
            'channel': 'cole-dlp-test-acc',
            'channel_id': 'UCiu-3thuViMebBjw_5nWYrA',
            'channel_url': 'https://www.youtube.com/channel/UCiu-3thuViMebBjw_5nWYrA',
            'description': 'md5:e8c098ba19888e08554f960ffbf6f90e',
            'duration': 5,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': [],
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1659073275,
            'upload_date': '20220729',
            'uploader': 'cole-dlp-test-acc',
            'uploader_id': '@coletdjnz',
            'uploader_url': 'https://www.youtube.com/@coletdjnz',
            'view_count': int,
        },
        'params': {
            'extractor_args': {'youtube': {'lang': ['fr']}},
            'skip_download': True,
        },
        'expected_warnings': [r'Preferring "fr" translated fields'],
    }, {
        'note': '6 channel audio',
        'url': 'https://www.youtube.com/watch?v=zgdo7-RRjgo',
        'only_matching': True,
    }, {
        'note': 'Multiple HLS formats with same itag',
        'url': 'https://www.youtube.com/watch?v=kX3nB4PpJko',
        'info_dict': {
            'id': 'kX3nB4PpJko',
            'ext': 'mp4',
            'title': 'Last To Take Hand Off Jet, Keeps It!',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Entertainment'],
            'channel': 'MrBeast',
            'channel_follower_count': int,
            'channel_id': 'UCX6OQ3DkcsbYNE6H8uQQuVA',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCX6OQ3DkcsbYNE6H8uQQuVA',
            'comment_count': int,
            'description': 'md5:42731fced13eff2c48c099fbb5c1b3a0',
            'duration': 937,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': [],
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1668286800,
            'upload_date': '20221112',
            'uploader': 'MrBeast',
            'uploader_id': '@MrBeast',
            'uploader_url': 'https://www.youtube.com/@MrBeast',
            'view_count': int,
        },
        'params': {
            'extractor_args': {'youtube': {'player_client': ['ios']}},
            'format': '233-1',
            'skip_download': True,
        },
        'skip': 'PO Token Required',
    }, {
        'note': 'Audio formats with Dynamic Range Compression',
        'url': 'https://www.youtube.com/watch?v=Tq92D6wQ1mg',
        'info_dict': {
            'id': 'Tq92D6wQ1mg',
            'ext': 'webm',
            'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
            'age_limit': 18,
            'availability': 'needs_auth',
            'categories': ['Entertainment'],
            'channel': 'Projekt Melody',
            'channel_follower_count': int,
            'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
            'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
            'comment_count': int,
            'description': 'md5:17eccca93a786d51bc67646756894066',
            'duration': 106,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:5',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1577508724,
            'upload_date': '20191228',
            'uploader': 'Projekt Melody',
            'uploader_id': '@ProjektMelody',
            'uploader_url': 'https://www.youtube.com/@ProjektMelody',
            'view_count': int,
        },
        'params': {
            'extractor_args': {'youtube': {'player_client': ['tv_embedded']}},
            'format': '251-drc',
            'skip_download': True,
        },
        'skip': 'Age-restricted; requires authentication',
    }, {
        'note': 'Support /live/ URL + media type for post-live content',
        'url': 'https://www.youtube.com/live/qVv6vCqciTM',
        'info_dict': {
            'id': 'qVv6vCqciTM',
            'ext': 'mp4',
            'title': '【 #インターネット女クリスマス 】3Dで歌ってはしゃぐインターネットの女たち【月ノ美兎/名取さな】',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Entertainment'],
            'channel': 'さなちゃんねる',
            'channel_follower_count': int,
            'channel_id': 'UCIdEIHpS0TdkqRkHL5OkLtA',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCIdEIHpS0TdkqRkHL5OkLtA',
            'chapters': 'count:13',
            'comment_count': int,
            'description': 'md5:6aebf95cc4a1d731aebc01ad6cc9806d',
            'duration': 4438,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'was_live',
            'media_type': 'livestream',
            'playable_in_embed': True,
            'release_date': '20221223',
            'release_timestamp': 1671793345,
            'tags': 'count:6',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1671798112,
            'upload_date': '20221223',
            'uploader': 'さなちゃんねる',
            'uploader_id': '@sana_natori',
            'uploader_url': 'https://www.youtube.com/@sana_natori',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # Fallbacks when webpage and web client is unavailable
        'url': 'https://www.youtube.com/watch?v=wSSmNUl9Snw',
        'info_dict': {
            'id': 'wSSmNUl9Snw',
            'ext': 'webm',
            'title': 'The Computer Hack That Saved Apollo 14',
            'age_limit': 0,
            # 'availability': 'public',
            # 'categories': ['Science & Technology'],
            'channel': 'Scott Manley',
            'channel_follower_count': int,
            'channel_id': 'UCxzC4EngIsMrPmbm6Nxvb-A',
            'channel_is_verified': True,
            'channel_url': 'https://www.youtube.com/channel/UCxzC4EngIsMrPmbm6Nxvb-A',
            'chapters': 'count:2',
            'comment_count': int,
            'description': 'md5:f4bed7b200404b72a394c2f97b782c02',
            'duration': 682,
            'heatmap': 'count:100',
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:8',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1504198713,
            'upload_date': '20170831',
            'uploader': 'Scott Manley',
            'uploader_id': '@scottmanley',
            'uploader_url': 'https://www.youtube.com/@scottmanley',
            'view_count': int,
        },
        'params': {
            'extractor_args': {'youtube': {
                'player_client': ['ios'],
                'player_skip': ['webpage'],
            }},
            'skip_download': True,
        },
        'skip': 'PO Token Required',
    }, {
        # uploader_id has non-ASCII characters that are percent-encoded in YT's JSON
        # https://github.com/yt-dlp/yt-dlp/pull/11818
        'url': 'https://www.youtube.com/shorts/18NGQq7p3LY',
        'info_dict': {
            'id': '18NGQq7p3LY',
            'ext': 'mp4',
            'title': '아이브 이서 장원영 리즈 삐끼삐끼 챌린지',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['People & Blogs'],
            'channel': 'ㅇㅇ',
            'channel_follower_count': int,
            'channel_id': 'UCC25oTm2J7ZVoi5TngOHg9g',
            'channel_url': 'https://www.youtube.com/channel/UCC25oTm2J7ZVoi5TngOHg9g',
            'description': '',
            'duration': 3,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'short',
            'playable_in_embed': True,
            'tags': [],
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1724306170,
            'upload_date': '20240822',
            'uploader': 'ㅇㅇ',
            'uploader_id': '@으아-v1k',
            'uploader_url': 'https://www.youtube.com/@으아-v1k',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }]
    # Test cases whose `url` is a third-party (non-YouTube) page. Each entry lists the
    # metadata expected from extraction: a single YouTube video for most entries, a
    # playlist of 10 items for the last one. The leading comment of every entry names
    # the embed markup being exercised and links the change that introduced support.
    # NOTE(review): presumably consumed by the project's test harness — confirm.
    _WEBPAGE_TESTS = [{
        # <object>
        # https://github.com/ytdl-org/youtube-dl/pull/12696
        'url': 'http://www.improbable.com/2017/04/03/untrained-modern-youths-and-ancient-masters-in-selfie-portraits/',
        'info_dict': {
            'id': 'msN87y-iEx0',
            'ext': 'mp4',
            'title': 'Feynman: Mirrors FUN TO IMAGINE 6',
            'upload_date': '20080526',
            'description': 'md5:873c81d308b979f0e23ee7e620b312a3',
            'age_limit': 0,
            'tags': 'count:8',
            'channel_id': 'UCCeo--lls1vna5YJABWAcVA',
            'playable_in_embed': True,
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'like_count': int,
            'comment_count': int,
            'channel': 'Christopher Sykes',
            'live_status': 'not_live',
            'channel_url': 'https://www.youtube.com/channel/UCCeo--lls1vna5YJABWAcVA',
            'availability': 'public',
            'duration': 195,
            'view_count': int,
            'categories': ['Science & Technology'],
            'channel_follower_count': int,
            'uploader': 'Christopher Sykes',
            'uploader_url': 'https://www.youtube.com/@ChristopherSykesDocumentaries',
            'uploader_id': '@ChristopherSykesDocumentaries',
            'heatmap': 'count:100',
            'timestamp': 1211825920,
            'media_type': 'video',
        },
        'params': {'skip_download': True},
    }, {
        # <embed>
        # https://github.com/ytdl-org/youtube-dl/commit/2b88feedf7993c24b03e0a7ff169a548794de70c
        'url': 'https://badzine.de/news/als-marc-zwiebler-taufik-hidayat-schlug',
        'info_dict': {
            'id': 'bSVcWOq397g',
            'ext': 'mp4',
            'title': 'TAUFIK TUNJUKKAN KELASNYA !!! : Taufik Hidayat VS Marc Zwiebler Canada Open 2011',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Sports'],
            'channel': 'Badminton Addict Id',
            'channel_follower_count': int,
            'channel_id': 'UCfCpKOwQGUe2FUJzYNadQcQ',
            'channel_url': 'https://www.youtube.com/channel/UCfCpKOwQGUe2FUJzYNadQcQ',
            'comment_count': int,
            'description': 'md5:2c3737da9a575f301a8380b4d60592a8',
            'duration': 756,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:9',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1621418412,
            'upload_date': '20210519',
            'uploader': 'Badminton Addict Id',
            'uploader_id': '@badmintonaddictid8958',
            'uploader_url': 'https://www.youtube.com/@badmintonaddictid8958',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # WordPress Plugin: YouTube Video Importer
        # https://github.com/ytdl-org/youtube-dl/commit/7deef1ba6743bf11247565e63ed7e31d2e8a9382
        'url': 'https://lothype.com/2025-chino-hills-hs-snare-quad-features-wgi2025-drumline/',
        'info_dict': {
            'id': 'lC21AX_pCfA',
            'ext': 'mp4',
            'title': '2025 Chino Hills HS Snare & Quad Features! #wgi2025 #drumline',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['Music'],
            'channel': 'DrumlineAV',
            'channel_follower_count': int,
            'channel_id': 'UCqdfUdyiQOZMvW5PcTTYikQ',
            'channel_url': 'https://www.youtube.com/channel/UCqdfUdyiQOZMvW5PcTTYikQ',
            'comment_count': int,
            'description': '',
            'duration': 48,
            'like_count': int,
            'live_status': 'not_live',
            'location': 'WESTMINSTER',
            'media_type': 'short',
            'playable_in_embed': True,
            'tags': 'count:72',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1739910835,
            'upload_date': '20250218',
            'uploader': 'DrumlineAV',
            'uploader_id': '@DrumlineAV',
            'uploader_url': 'https://www.youtube.com/@DrumlineAV',
            'view_count': int,
        },
        'params': {'skip_download': True},
    }, {
        # lazyYT
        # https://github.com/ytdl-org/youtube-dl/commit/65f3a228b16c55fee959eee055767a796479270f
        'url': 'https://rabota7.ru/%D0%91%D1%83%D1%85%D0%B3%D0%B0%D0%BB%D1%82%D0%B5%D1%80',
        'info_dict': {
            'id': 'DexR8_tTSsQ',
            'ext': 'mp4',
            'title': 'Работа бухгалтером в Москве',
            'age_limit': 0,
            'availability': 'public',
            'categories': ['People & Blogs'],
            'channel': 'Работа в Москве свежие вакансии',
            'channel_follower_count': int,
            'channel_id': 'UCG3qz_gefGaMiSBvmaxN5WQ',
            'channel_url': 'https://www.youtube.com/channel/UCG3qz_gefGaMiSBvmaxN5WQ',
            'description': 'md5:b779d3d70af4efda26cf62b76808c0e3',
            'duration': 42,
            'like_count': int,
            'live_status': 'not_live',
            'media_type': 'video',
            'playable_in_embed': True,
            'tags': 'count:7',
            'thumbnail': r're:https?://i\.ytimg\.com/.+',
            'timestamp': 1496398980,
            'upload_date': '20170602',
            'uploader': 'Работа в Москве свежие вакансии',
            'uploader_id': '@РаботавМосквесвежиевакансии',
            'uploader_url': 'https://www.youtube.com/@РаботавМосквесвежиевакансии',
            'view_count': int,
        },
        'params': {
            'extractor_args': {'generic': {'impersonate': ['chrome']}},
            'skip_download': True,
        },
    }, {
        # data-video-url=
        # https://github.com/ytdl-org/youtube-dl/pull/2948
        'url': 'https://www.uca.ac.uk/',
        'info_dict': {
            'id': 'www.uca.ac',
            'title': 'UCA | Creative Arts Degrees UK | University for the Creative Arts',
            'age_limit': 0,
            'description': 'md5:179c7a06ea1ed01b94ff5d56cb18d73b',
            'thumbnail': '/media/uca-2020/hero-headers/2025-prospectus-all-2x2.jpg',
        },
        'playlist_count': 10,
        'params': {'skip_download': True},
    }]

    # Maps each name accepted by the `player_js_variant` extractor argument to the
    # player JS path that follows `/s/player/<player id>/` (see _extract_player_url)
    _PLAYER_JS_VARIANT_MAP = {
        'main': 'player_ias.vflset/en_US/base.js',
        'tcc': 'player_ias_tcc.vflset/en_US/base.js',
        'tce': 'player_ias_tce.vflset/en_US/base.js',
        'es5': 'player_es5.vflset/en_US/base.js',
        'es6': 'player_es6.vflset/en_US/base.js',
        'tv': 'tv-player-ias.vflset/tv-player-ias.js',
        'tv_es6': 'tv-player-es6.vflset/tv-player-es6.js',
        'phone': 'player-plasma-ias-phone-en_US.vflset/base.js',
        'tablet': 'player-plasma-ias-tablet-en_US.vflset/base.js',
    }
    # Reverse lookup (path -> variant name), used by _player_js_cache_key
    _INVERSE_PLAYER_JS_VARIANT_MAP = {v: k for k, v in _PLAYER_JS_VARIANT_MAP.items()}
    # NOTE(review): the two constants below are not referenced in this part of the file;
    # presumably a cache identifier for nsig functions and a placeholder input — confirm
    _NSIG_FUNC_CACHE_ID = 'nsig func'
    _DUMMY_STRING = 'dlp_wins'

    @classmethod
    def suitable(cls, url):
        """Return whether this extractor should handle `url`.

        A URL whose query string carries a non-empty `list` parameter is
        rejected here; every other URL is judged by the parent class.
        """
        # NOTE(review): this function-scope import duplicates the module-level
        # import of parse_qs — presumably deliberate; confirm before removing it
        from yt_dlp.utils import parse_qs

        list_param = parse_qs(url).get('list', [None])[0]
        return False if list_param else super().suitable(url)

    def __init__(self, *args, **kwargs):
        """Forward all arguments to the parent class and set up empty per-instance state."""
        super().__init__(*args, **kwargs)
        # Assigned in _real_initialize()
        self._pot_director = None
        # player JS cache key -> downloaded player code (see _load_player)
        self._code_cache = {}
        # cache id tuple -> cached result or stored exception (see _cached)
        self._player_cache = {}

    def _real_initialize(self):
        """Run the parent initialization, then create this instance's PO token director."""
        super()._real_initialize()
        director = initialize_pot_director(self)
        self._pot_director = director

    def _prepare_live_from_start_formats(self, formats, video_id, live_start_time, url, webpage_url, smuggled_data, is_live):
        """Attach a fragment source to every format flagged `is_from_start` (in place).

        Formats without a truthy `is_from_start` are left untouched. For each
        remaining format `is_live` is recorded, then:
          - live: `fragments` becomes a callable (a partial of
            _live_dash_fragments still awaiting its `ctx` argument) and
            `protocol` is set to 'http_dash_segments_generator'
          - not live: `fragments` becomes a LazyList over that generator called
            with an empty ctx, and the `is_from_start` key is removed
        """
        manifest_lock = threading.Lock()
        last_fetch_time = time.time()
        formats = [fmt for fmt in formats if fmt.get('is_from_start')]

        def refresh_formats(format_id, delay):
            # Re-extract the formats, but only once more than `delay` seconds
            # have elapsed since the previous extraction
            nonlocal formats, last_fetch_time, is_live
            if time.time() <= last_fetch_time + delay:
                return

            _, _, _, _, prs, player_url = self._initial_extract(
                url, smuggled_data, webpage_url, 'web', video_id)
            video_details = traverse_obj(prs, (..., 'videoDetails'), expected_type=dict)
            microformats = traverse_obj(
                prs, (..., 'microformat', 'playerMicroformatRenderer'),
                expected_type=dict)
            _, live_status, _, formats, _ = self._list_formats(video_id, microformats, video_details, prs, player_url)
            is_live = live_status == 'is_live'
            last_fetch_time = time.time()

        def mpd_feed(format_id, delay):
            """
            @returns (manifest_url, manifest_stream_number, is_live) or None
            """
            for retry in self.RetryManager(fatal=False):
                # Serialize refreshes; the refreshed state is shared by all formats
                with manifest_lock:
                    refresh_formats(format_id, delay)

                current = next((fmt for fmt in formats if fmt['format_id'] == format_id), None)
                if current:
                    # Formats from ended premieres will be missing a manifest_url
                    # See https://github.com/yt-dlp/yt-dlp/issues/8543
                    if not current.get('manifest_url'):
                        break
                    return current['manifest_url'], current['manifest_stream_number'], is_live

                # Format vanished from the refreshed list: record why and retry
                if is_live:
                    retry.error = f'Cannot find refreshed manifest for format {format_id}{bug_reports_message()}'
                else:
                    retry.error = f'{video_id}: Video is no longer live'
            return None

        for fmt in formats:
            fmt['is_live'] = is_live
            fragment_gen = functools.partial(
                self._live_dash_fragments, video_id, fmt['format_id'],
                live_start_time, mpd_feed, not is_live and fmt.copy())
            if not is_live:
                fmt['fragments'] = LazyList(fragment_gen({}))
                del fmt['is_from_start']
                continue
            fmt['fragments'] = fragment_gen
            fmt['protocol'] = 'http_dash_segments_generator'

    def _live_dash_fragments(self, video_id, format_id, live_start_time, mpd_feed, manifestless_orig_fmt, ctx):
        """Generate fragment dicts for a live-from-start DASH format.

        Each yielded dict has `url` (fragment URL built as `sq/<index>` on the
        fragment base URL) and `fragment_count` (head sequence number + 1).
        The generator ends when the stream is reported as no longer live, when
        the failure score exceeds 30, or after the first pass if
        `manifestless_orig_fmt` is given.

        @param video_id               Only used in the debug message
        @param format_id              Format to follow; passed through to mpd_feed
        @param live_start_time        Stream start in seconds (same clock as time.time()),
                                      or a falsy value if unknown
        @param mpd_feed               Callable (format_id, delay) returning
                                      (manifest_url, manifest_stream_number, is_live) or None
        @param manifestless_orig_fmt  Falsy, or a format dict whose `fragments` and
                                      `fragment_base_url` are used instead of fetching the MPD
        @param ctx                    Dict; `start` is read as the download start time and
                                      `last_error` is popped on every manifest refresh
        """
        # FETCH_SPAN: minimum number of seconds each polling iteration takes
        # MAX_DURATION: 432000 seconds = 120 hours
        FETCH_SPAN, MAX_DURATION = 5, 432000

        mpd_url, stream_number, is_live = None, None, True

        begin_index = 0
        download_start_time = ctx.get('start') or time.time()

        lack_early_segments = download_start_time - (live_start_time or download_start_time) > MAX_DURATION
        if lack_early_segments:
            self.report_warning(bug_reports_message(
                'Starting download from the last 120 hours of the live stream since '
                'YouTube does not have data before that. If you think this is wrong,'), only_once=True)

        known_idx, no_fragment_score, last_segment_url = begin_index, 0, None
        fragments, fragment_base_url = None, None
        # _extract_sequence_from_mpd() reads last_seq from this scope and returns it on
        # its failure paths. Bind it up front so that a failed first manifest fetch
        # results in a retry instead of a NameError for an unbound free variable
        last_seq = None

        def _extract_sequence_from_mpd(refresh_sequence, immediate):
            """
            @returns (should_continue, last_seq)
            """
            nonlocal mpd_url, stream_number, is_live, no_fragment_score, fragments, fragment_base_url
            # Obtain from MPD's maximum seq value
            old_mpd_url = mpd_url
            last_error = ctx.pop('last_error', None)
            # Ask for a fresh manifest after 5 seconds (instead of 18000) when requested
            # by the caller or when the last recorded error was an HTTP 403
            expire_fast = immediate or (last_error and isinstance(last_error, HTTPError) and last_error.status == 403)
            mpd_url, stream_number, is_live = (mpd_feed(format_id, 5 if expire_fast else 18000)
                                               or (mpd_url, stream_number, False))
            if not refresh_sequence:
                if expire_fast and not is_live:
                    return False, last_seq
                elif old_mpd_url == mpd_url:
                    return True, last_seq
            if manifestless_orig_fmt:
                fmt_info = manifestless_orig_fmt
            else:
                try:
                    fmts, _ = self._extract_mpd_formats_and_subtitles(
                        mpd_url, None, note=False, errnote=False, fatal=False)
                except ExtractorError:
                    fmts = None
                if not fmts:
                    no_fragment_score += 2
                    return False, last_seq
                # NOTE(review): next() has no default here; if no format carries this
                # stream number, StopIteration escapes into the generator frame
                fmt_info = next(x for x in fmts if x['manifest_stream_number'] == stream_number)
            fragments = fmt_info['fragments']
            fragment_base_url = fmt_info['fragment_base_url']
            assert fragment_base_url

            _last_seq = int(re.search(r'(?:/|^)sq/(\d+)', fragments[-1]['path']).group(1))
            return True, _last_seq

        self.write_debug(f'[{video_id}] Generating fragments for format {format_id}')
        while is_live:
            fetch_time = time.time()
            # The score grows on failed or empty polls and is reset once fragments are yielded
            if no_fragment_score > 30:
                return
            if last_segment_url:
                # Obtain from "X-Head-Seqnum" header value from each segment
                try:
                    urlh = self._request_webpage(
                        last_segment_url, None, note=False, errnote=False, fatal=False)
                except ExtractorError:
                    urlh = None
                last_seq = try_get(urlh, lambda x: int_or_none(x.headers['X-Head-Seqnum']))
                if last_seq is None:
                    no_fragment_score += 2
                    # Fall back to the MPD on the next iteration
                    last_segment_url = None
                    continue
            else:
                should_continue, last_seq = _extract_sequence_from_mpd(True, no_fragment_score > 15)
                no_fragment_score += 2
                if not should_continue:
                    continue

            if known_idx > last_seq:
                last_segment_url = None
                continue

            # From here on last_seq is the exclusive upper bound of the indices to yield
            last_seq += 1

            if begin_index < 0 and known_idx < 0:
                # skip from the start when it's negative value
                known_idx = last_seq + begin_index
            if lack_early_segments:
                # Do not go back further than MAX_DURATION worth of fragments
                known_idx = max(known_idx, last_seq - int(MAX_DURATION // fragments[-1]['duration']))
            try:
                for idx in range(known_idx, last_seq):
                    # do not update sequence here or you'll get skipped some part of it
                    should_continue, _ = _extract_sequence_from_mpd(False, False)
                    if not should_continue:
                        known_idx = idx - 1
                        # Caught right below; only used to restart the while loop
                        raise ExtractorError('breaking out of outer loop')
                    last_segment_url = urljoin(fragment_base_url, f'sq/{idx}')
                    yield {
                        'url': last_segment_url,
                        'fragment_count': last_seq,
                    }
                if known_idx == last_seq:
                    # Nothing new was available in this pass
                    no_fragment_score += 5
                else:
                    no_fragment_score = 0
                known_idx = last_seq
            except ExtractorError:
                continue

            if manifestless_orig_fmt:
                # Stop at the first iteration if running for post-live manifestless;
                # fragment count no longer increase since it starts
                break

            time.sleep(max(0, FETCH_SPAN + fetch_time - time.time()))

    def _get_player_js_version(self):
        player_js_version = self._configuration_arg('player_js_version', [''])[0] or '20348@0004de42'
        if player_js_version == 'actual':
            return None, None
        if not re.fullmatch(r'[0-9]{5,}@[0-9a-f]{8,}', player_js_version):
            self.report_warning(
                f'Invalid player JS version "{player_js_version}" specified. '
                f'It should be "actual" or in the format of STS@HASH', only_once=True)
            return None, None
        return player_js_version.split('@')

    def _extract_player_url(self, *ytcfgs, webpage=None):
        """Pick the player JS URL out of the given ytcfgs and apply the requested variant.

        The first string found under `PLAYER_JS_URL` or
        `WEB_PLAYER_CONTEXT_CONFIGS/*/jsUrl` is used. Unless the
        `player_js_variant` extractor argument is "actual" (or invalid, which
        warns), the URL is rewritten to the mapped variant path, using the
        player id override from _get_player_js_version() when there is one.
        `webpage` is accepted but not used here.

        @returns  The URL joined onto https://www.youtube.com, or None when
                  no ytcfg provides a player URL
        """
        player_url = traverse_obj(
            ytcfgs, (..., 'PLAYER_JS_URL'), (..., 'WEB_PLAYER_CONTEXT_CONFIGS', ..., 'jsUrl'),
            get_all=False, expected_type=str)
        if not player_url:
            return
        version_parts = self._get_player_js_version()
        player_id_override = version_parts[1]

        variant = self._configuration_arg('player_js_variant', [''])[0] or 'main'
        if variant not in self._PLAYER_JS_VARIANT_MAP:
            if variant != 'actual':
                self.report_warning(
                    f'Invalid player JS variant name "{variant}" requested. '
                    f'Valid choices are: {", ".join(self._PLAYER_JS_VARIANT_MAP)}', only_once=True)
            # Keep the URL exactly as YouTube provided it
            return urljoin('https://www.youtube.com', player_url)

        player_id = player_id_override or self._extract_player_info(player_url)
        forced_url = f'/s/player/{player_id}/{self._PLAYER_JS_VARIANT_MAP[variant]}'
        if forced_url != player_url:
            self.write_debug(
                f'Forcing "{variant}" player JS variant for player {player_id}\n'
                f'        original url = {player_url}', only_once=True)
        return urljoin('https://www.youtube.com', forced_url)

    def _download_player_url(self, video_id, fatal=False):
        """Build a player JS URL from the player version found in the iframe API JS.

        @returns  URL of the `player_ias.vflset/en_US/base.js` player for that
                  version, or None if the download or the version lookup
                  produced nothing
        """
        iframe_webpage = self._download_webpage_with_retries(
            'https://www.youtube.com/iframe_api',
            note='Downloading iframe API JS',
            video_id=video_id, retry_fatal=fatal)
        if not iframe_webpage:
            return None

        # The slashes around the 8-hex-digit version may be backslash-escaped
        player_version = self._search_regex(
            r'player\\?/([0-9a-fA-F]{8})\\?/', iframe_webpage, 'player version', fatal=fatal)
        if not player_version:
            return None
        return f'https://www.youtube.com/s/player/{player_version}/player_ias.vflset/en_US/base.js'

    def _player_js_cache_key(self, player_url):
        """Return the cache key for a player URL: player id joined with its JS variant.

        The variant is looked up from the URL path (after `/s/player/<id>/`)
        in _INVERSE_PLAYER_JS_VARIANT_MAP. If it cannot be determined, a debug
        message is written and a sanitized form of the path is used instead.
        """
        player_id = self._extract_player_info(player_url)
        url_path = urllib.parse.urlparse(player_url).path
        player_path = remove_start(url_path, f'/s/player/{player_id}/')

        variant = self._INVERSE_PLAYER_JS_VARIANT_MAP.get(player_path)
        if not variant:
            # No exact match: retry each known path with any run of
            # [a-zA-Z0-9_] accepted in place of "en_US"
            for known_path, variant_name in self._INVERSE_PLAYER_JS_VARIANT_MAP.items():
                pattern = re.escape(known_path).replace('en_US', r'[a-zA-Z0-9_]+')
                if re.fullmatch(pattern, player_path):
                    variant = variant_name
                    break

        if not variant:
            self.write_debug(
                f'Unable to determine player JS variant\n'
                f'        player = {player_url}', only_once=True)
            # Path without ".js", every non-alphanumeric character turned into "_"
            variant = re.sub(r'[^a-zA-Z0-9]', '_', remove_end(player_path, '.js'))
        return join_nonempty(player_id, variant)

    def _signature_cache_id(self, example_sig):
        """ Return a string representation of a signature """
        return '.'.join(str(len(part)) for part in example_sig.split('.'))

    @classmethod
    def _extract_player_info(cls, player_url):
        """Return the `id` group of the first _PLAYER_INFO_RE pattern found in player_url.

        @raises ExtractorError  if none of the patterns match
        """
        # Lazy: patterns after the first hit are never searched
        candidates = (re.search(player_re, player_url) for player_re in cls._PLAYER_INFO_RE)
        id_m = next(filter(None, candidates), None)
        if id_m is None:
            raise ExtractorError(f'Cannot identify player {player_url!r}')
        return id_m.group('id')

    def _load_player(self, video_id, player_url, fatal=True):
        player_js_key = self._player_js_cache_key(player_url)
        if player_js_key not in self._code_cache:
            code = self._download_webpage(
                player_url, video_id, fatal=fatal,
                note=f'Downloading player {player_js_key}',
                errnote=f'Download of {player_js_key} failed')
            if code:
                self._code_cache[player_js_key] = code
        return self._code_cache.get(player_js_key)

    def _extract_signature_function(self, video_id, player_url, example_sig):
        """Return a function that rearranges a signature string for this player.

        The rearrangement is kept as a list of source indices, cached under
        'youtube-sigfuncs' with an id made of the player JS cache key and the
        signature's part lengths. On a cache miss the player JS is loaded and
        its signature function is run on a probe string.
        """
        player_key = self._player_js_cache_key(player_url)
        func_id = join_nonempty(player_key, self._signature_cache_id(example_sig))
        assert os.path.basename(func_id) == func_id

        self.write_debug(f'Extracting signature function {func_id}')
        # Read from filesystem cache
        cache_spec = self.cache.load('youtube-sigfuncs', func_id, min_ver='2025.07.21')

        if not cache_spec:
            code = self._load_player(video_id, player_url)
            if code:
                sig_func = self._parse_sig_js(code, player_url)
                # The i-th probe character has code point i, so the code points
                # of the output are the source indices of each output position
                probe = ''.join(chr(i) for i in range(len(example_sig)))
                cache_spec = list(map(ord, sig_func(probe)))
                self.cache.store('youtube-sigfuncs', func_id, cache_spec)

        return lambda s: ''.join(s[i] for i in cache_spec)

    def _parse_sig_js(self, jscode, player_url):
        """Locate the signature function in the player JS and wrap it for Python use.

        @returns  A callable taking the signature string and returning the
                  result of the interpreted JS function called with it
        """
        # Examples where `sig` is funcname:
        # sig=function(a){a=a.split(""); ... ;return a.join("")};
        # ;c&&(c=sig(decodeURIComponent(c)),a.set(b,encodeURIComponent(c)));return a};
        # {var l=f,m=h.sp,n=sig(decodeURIComponent(h.s));l.set(m,encodeURIComponent(n))}
        # sig=function(J){J=J.split(""); ... ;return J.join("")};
        # ;N&&(N=sig(decodeURIComponent(N)),J.set(R,encodeURIComponent(N)));return J};
        # {var H=u,k=f.sp,v=sig(decodeURIComponent(f.s));H.set(k,encodeURIComponent(v))}
        funcname_patterns = (
            r'\b(?P<var>[a-zA-Z0-9_$]+)&&\((?P=var)=(?P<sig>[a-zA-Z0-9_$]{2,})\(decodeURIComponent\((?P=var)\)\)',
            r'(?P<sig>[a-zA-Z0-9_$]+)\s*=\s*function\(\s*(?P<arg>[a-zA-Z0-9_$]+)\s*\)\s*{\s*(?P=arg)\s*=\s*(?P=arg)\.split\(\s*""\s*\)\s*;\s*[^}]+;\s*return\s+(?P=arg)\.join\(\s*""\s*\)',
            r'(?:\b|[^a-zA-Z0-9_$])(?P<sig>[a-zA-Z0-9_$]{2,})\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\)(?:;[a-zA-Z0-9_$]{2}\.[a-zA-Z0-9_$]{2}\(a,\d+\))?',
            # Old patterns
            r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\b[a-zA-Z0-9]+\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\bm=(?P<sig>[a-zA-Z0-9$]{2,})\(decodeURIComponent\(h\.s\)\)',
            # Obsolete patterns
            r'("|\')signature\1\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\.sig\|\|(?P<sig>[a-zA-Z0-9$]+)\(',
            r'yt\.akamaized\.net/\)\s*\|\|\s*.*?\s*[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?:encodeURIComponent\s*\()?\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\bc\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
        )
        funcname = self._search_regex(
            funcname_patterns, jscode, 'Initial JS player signature function name', group='sig')

        varname, global_list = self._interpret_player_js_global_var(jscode, player_url)
        # filter_dict is applied to the single-entry mapping before it is handed
        # to the interpreter as the function's extra variables
        initial_function = JSInterpreter(jscode).extract_function(
            funcname, filter_dict({varname: global_list}))

        def run_signature_function(s):
            return initial_function([s])

        return run_signature_function

    def _cached(self, func, *cache_id):
        def inner(*args, **kwargs):
            if cache_id not in self._player_cache:
                try:
                    self._player_cache[cache_id] = func(*args, **kwargs)
                except ExtractorError as e:
                    self._player_cache[cache_id] = e
                except Exception as e:
                    self._player_cache[cache_id] = ExtractorError(traceback.format_exc(), cause=e)

            ret = self._player_cache[cache_id]
            if isinstance(ret, Exception):
                raise ret
            return ret
        return inner

    def _load_player_data_from_cache(self, name, player_url):
        cache_id = (f'youtube-{name}', self._player_js_cache_key(player_url))

        if data := self._player_cache.get(cache_id):
            return data

        data = self.cache.load(*cache_id, min_ver='2025.07.21')
        if data:
            self._player_cache[cache_id] = data

        return data

    def _store_player_data_to_cache(self, name, player_url, data):
        cache_id = (f'youtube-{name}', self._player_js_cache_key(player_url))
        if cache_id not in self._player_cache:
            self.cache.store(*cache_id, data)
            self._player_cache[cache_id] = data

    def _decrypt_signature(self, s, video_id, player_url):
        """Turn the encrypted s field into a working signature"""
        extract_sig = self._cached(
            self._extract_signature_function, 'sig', player_url, self._signature_cache_id(s))
        func = extract_sig(video_id, player_url, s)
        return func(s)

    def _decrypt_nsig(self, s, video_id, player_url):
        """Turn the encrypted n field into a working signature

        The n function code is obtained with `_extract_n_function_code` and run through
        the native JS interpreter first. If that raises `JSInterpreter.Exception`,
        the same code is executed with PhantomJS instead; if the PhantomJS wrapper
        cannot be created, the original interpreter exception is raised.

        @param s            the encrypted n value
        @param video_id     passed on to the helpers and used in log messages
        @param player_url   URL of the player JS; resolved against https://www.youtube.com
        @returns            the decrypted n value
        @raises ExtractorError  if player_url is None or the function code cannot be extracted
        """
        if player_url is None:
            raise ExtractorError('Cannot decrypt nsig without player_url')
        player_url = urljoin('https://www.youtube.com', player_url)

        try:
            jsi, _, func_code = self._extract_n_function_code(video_id, player_url)
        except ExtractorError as e:
            raise ExtractorError('Unable to extract nsig function code', cause=e)

        try:
            # The callable built from the function code is memoized per player URL
            extract_nsig = self._cached(self._extract_n_function_from_code, self._NSIG_FUNC_CACHE_ID, player_url)
            ret = extract_nsig(jsi, func_code)(s)
        except JSInterpreter.Exception as e:
            try:
                jsi = PhantomJSwrapper(self, timeout=5000)
            except ExtractorError:
                # No PhantomJS wrapper could be created: surface the native failure
                raise e
            self.report_warning(
                f'Native nsig extraction failed: Trying with PhantomJS\n'
                f'         n = {s} ; player = {player_url}', video_id)
            self.write_debug(e, only_once=True)

            # Wrap the function code in an immediately-invoked function expression
            # and read the result back from the script's console output
            args, func_body = func_code
            ret = jsi.execute(
                f'console.log(function({", ".join(args)}) {{ {func_body} }}({s!r}));',
                video_id=video_id, note='Executing signature code').strip()

        self.write_debug(f'Decrypted nsig {s} => {ret}')
        # Only cache nsig func JS code to disk if successful, and only once
        self._store_player_data_to_cache('nsig', player_url, func_code)
        return ret

    def _extract_n_function_name(self, jscode, player_url=None):
        """Find the name of the n function in the player JS

        Three strategies are tried in order:
          1. If the global array contains a string ending in '-_w8_', locate the
             `return <array>[<index>] + <arg>` statement that uses it and search
             backwards from there for the enclosing function's name
          2. Match the known call sites of the n function (see examples below)
          3. Generic search for a function returning a '..._w8_' string literal plus a variable

        @param jscode       the player JS code
        @param player_url   only used for caching the global array lookup and in log messages
        @returns            the function name. When strategy 2 matched an indexed call
                            (`narray[idx]`), this is element `idx` of that array as parsed from the JS
        """
        varname, global_list = self._interpret_player_js_global_var(jscode, player_url)
        if debug_str := traverse_obj(global_list, (lambda _, v: v.endswith('-_w8_'), any)):
            pattern = r'''(?x)
                \{\s*return\s+%s\[%d\]\s*\+\s*(?P<argname>[a-zA-Z0-9_$]+)\s*\}
            ''' % (re.escape(varname), global_list.index(debug_str))
            if match := re.search(pattern, jscode):
                # This pattern is applied to reversed text (see the slice below), hence it is
                # written backwards: 'noitcnuf' is 'function' and 'rav' is 'var' reversed,
                # and the argument name is reversed before being inserted
                pattern = r'''(?x)
                    \{\s*\)%s\(\s*
                    (?:
                        (?P<funcname_a>[a-zA-Z0-9_$]+)\s*noitcnuf\s*
                        |noitcnuf\s*=\s*(?P<funcname_b>[a-zA-Z0-9_$]+)(?:\s+rav)?
                    )[;\n]
                ''' % re.escape(match.group('argname')[::-1])
                # Search the code from the start of the match back to the beginning, reversed
                if match := re.search(pattern, jscode[match.start()::-1]):
                    a, b = match.group('funcname_a', 'funcname_b')
                    # Un-reverse the captured name
                    return (a or b)[::-1]
            self.write_debug(join_nonempty(
                'Initial search was unable to find nsig function name',
                player_url and f'        player = {player_url}', delim='\n'), only_once=True)

        # Examples (with placeholders nfunc, narray, idx):
        # *  .get("n"))&&(b=nfunc(b)
        # *  .get("n"))&&(b=narray[idx](b)
        # *  b=String.fromCharCode(110),c=a.get(b))&&c=narray[idx](c)
        # *  a.D&&(b="nn"[+a.D],c=a.get(b))&&(c=narray[idx](c),a.set(b,c),narray.length||nfunc("")
        # *  a.D&&(PL(a),b=a.j.n||null)&&(b=narray[0](b),a.set("n",b),narray.length||nfunc("")
        # *  a.D&&(b="nn"[+a.D],vL(a),c=a.j[b]||null)&&(c=narray[idx](c),a.set(b,c),narray.length||nfunc("")
        # *  J.J="";J.url="";J.Z&&(R="nn"[+J.Z],mW(J),N=J.K[R]||null)&&(N=narray[idx](N),J.set(R,N))}};
        funcname, idx = self._search_regex(
            r'''(?x)
            (?:
                \.get\("n"\)\)&&\(b=|
                (?:
                    b=String\.fromCharCode\(110\)|
                    (?P<str_idx>[a-zA-Z0-9_$.]+)&&\(b="nn"\[\+(?P=str_idx)\]
                )
                (?:
                    ,[a-zA-Z0-9_$]+\(a\))?,c=a\.
                    (?:
                        get\(b\)|
                        [a-zA-Z0-9_$]+\[b\]\|\|null
                    )\)&&\(c=|
                \b(?P<var>[a-zA-Z0-9_$]+)=
            )(?P<nfunc>[a-zA-Z0-9_$]+)(?:\[(?P<idx>\d+)\])?\([a-zA-Z]\)
            (?(var),[a-zA-Z0-9_$]+\.set\((?:"n+"|[a-zA-Z0-9_$]+)\,(?P=var)\))''',
            jscode, 'n function name', group=('nfunc', 'idx'), default=(None, None))
        if not funcname:
            self.report_warning(join_nonempty(
                'Falling back to generic n function search',
                player_url and f'         player = {player_url}', delim='\n'), only_once=True)
            return self._search_regex(
                r'''(?xs)
                ;\s*(?P<name>[a-zA-Z0-9_$]+)\s*=\s*function\([a-zA-Z0-9_$]+\)
                \s*\{(?:(?!};).)+?return\s*(?P<q>["'])[\w-]+_w8_(?P=q)\s*\+\s*[a-zA-Z0-9_$]+''',
                jscode, 'Initial JS player n function name', group='name')
        elif not idx:
            # Direct call (`nfunc(b)`): the matched identifier is the function name itself
            return funcname

        # Indexed call (`narray[idx](b)`): the matched identifier is an array of names;
        # find its definition, parse it as JSON and pick the referenced element
        return json.loads(js_to_json(self._search_regex(
            rf'var {re.escape(funcname)}\s*=\s*(\[.+?\])\s*[,;]', jscode,
            f'Initial JS player n function list ({funcname}.{idx})')))[int(idx)]

    def _interpret_player_js_global_var(self, jscode, player_url):
        """Returns tuple of: variable name string, variable value list

        Looks for the first `var NAME = ...` declaration directly after the
        "use strict" directive whose value is either a string literal followed by
        `.split(...)` or an array literal of strings, and evaluates that value
        with the JS interpreter.

        Both the regex search and the evaluation are memoized per `player_url`
        through `_cached`, so `jscode` is only inspected on the first call for a player.

        Returns (None, None) if no such declaration is found.
        """
        extract_global_var = self._cached(self._search_regex, 'js global array', player_url)
        varcode, varname, varvalue = extract_global_var(
            r'''(?x)
                (?P<q1>["\'])use\s+strict(?P=q1);\s*
                (?P<code>
                    var\s+(?P<name>[a-zA-Z0-9_$]+)\s*=\s*
                    (?P<value>
                        (?P<q2>["\'])(?:(?!(?P=q2)).|\\.)+(?P=q2)
                        \.split\((?P<q3>["\'])(?:(?!(?P=q3)).)+(?P=q3)\)
                        |\[\s*(?:(?P<q4>["\'])(?:(?!(?P=q4)).|\\.)*(?P=q4)\s*,?\s*)+\]
                    )
                )[;,]
            ''', jscode, 'global variable', group=('code', 'name', 'value'), default=(None, None, None))
        if not varcode:
            self.write_debug(join_nonempty(
                'No global array variable found in player JS',
                player_url and f'        player = {player_url}', delim='\n'), only_once=True)
            return None, None

        # Evaluate only the value expression, using an interpreter built from the declaration
        jsi = JSInterpreter(varcode)
        interpret_global_var = self._cached(jsi.interpret_expression, 'js global list', player_url)
        return varname, interpret_global_var(varvalue, LocalNameSpace(), allow_recursion=10)

    def _fixup_n_function_code(self, argnames, nsig_code, jscode, player_url):
        """Rewrite the extracted n function code so that it does not depend on the rest of the player JS

        Three fixups are applied:
          * the global array (if any) is declared at the start of the code
          * the `typeof ... === "undefined"` early-return statement is removed
          * definitions of global functions referenced by the code are prepended

        @param argnames     argument names of the n function
        @param nsig_code    body of the n function
        @param jscode       the full player JS code
        @param player_url   used for cache keys and in log messages
        @returns            tuple of (argnames, fixed code)
        """
        # Fixup global array
        varname, global_list = self._interpret_player_js_global_var(jscode, player_url)
        if varname and global_list:
            nsig_code = f'var {varname}={json.dumps(global_list)}; {nsig_code}'
        else:
            # Placeholders so that the regex below can still be built
            varname = self._DUMMY_STRING
            global_list = []

        # Fixup typeof check
        # The string 'undefined' may be referenced through the global array;
        # if its index is unknown, any numeric index is accepted
        undefined_idx = global_list.index('undefined') if 'undefined' in global_list else r'\d+'
        fixed_code = re.sub(
            fr'''(?x)
                ;\s*if\s*\(\s*typeof\s+[a-zA-Z0-9_$]+\s*===?\s*(?:
                    (["\'])undefined\1|
                    {re.escape(varname)}\[{undefined_idx}\]
                )\s*\)\s*return\s+{re.escape(argnames[0])};
            ''', ';', nsig_code)
        if fixed_code == nsig_code:
            self.write_debug(join_nonempty(
                'No typeof statement found in nsig function code',
                player_url and f'        player = {player_url}', delim='\n'), only_once=True)

        # Fixup global funcs
        # Run the code once on a dummy input; the names are afterwards read
        # from the interpreter's `_undefined_varnames`
        jsi = JSInterpreter(fixed_code)
        cache_id = (self._NSIG_FUNC_CACHE_ID, player_url)
        try:
            self._cached(
                self._extract_n_function_from_code, *cache_id)(jsi, (argnames, fixed_code))(self._DUMMY_STRING)
        except JSInterpreter.Exception:
            # Drop the memoized entry created by this failed trial run
            self._player_cache.pop(cache_id, None)

        global_funcnames = jsi._undefined_varnames
        debug_names = []
        # Pull each referenced function out of the full player JS and prepend its definition
        jsi = JSInterpreter(jscode)
        for func_name in global_funcnames:
            try:
                func_args, func_code = jsi.extract_function_code(func_name)
                fixed_code = f'var {func_name} = function({", ".join(func_args)}) {{ {func_code} }}; {fixed_code}'
                debug_names.append(func_name)
            except Exception:
                self.report_warning(join_nonempty(
                    f'Unable to extract global nsig function {func_name} from player JS',
                    player_url and f'        player = {player_url}', delim='\n'), only_once=True)

        if debug_names:
            self.write_debug(f'Extracted global nsig functions: {", ".join(debug_names)}')

        return argnames, fixed_code

    def _extract_n_function_code(self, video_id, player_url):
        """Get the n function code for a player, from cache if possible

        @returns    tuple of (JS interpreter, player info, function code)
        """
        player_id = self._extract_player_info(player_url)

        cached_code = self._load_player_data_from_cache('nsig', player_url)
        if cached_code:
            # With cached function code the player JS is not loaded at all;
            # the interpreter is created from the cached code itself
            return JSInterpreter(cached_code), player_id, cached_code

        jscode = self._load_player(video_id, player_url)
        jsi = JSInterpreter(jscode)
        func_name = self._extract_n_function_name(jscode, player_url=player_url)
        extracted = jsi.extract_function_code(func_name)

        # XXX: Work around (a) global array variable, (b) `typeof` short-circuit, (c) global functions
        fixed = self._fixup_n_function_code(*extracted, jscode, player_url)
        return jsi, player_id, fixed

    def _extract_n_function_from_code(self, jsi, func_code):
        func = jsi.extract_function_from_code(*func_code)

        def extract_nsig(s):
            try:
                ret = func([s])
            except JSInterpreter.Exception:
                raise
            except Exception as e:
                raise JSInterpreter.Exception(traceback.format_exc(), cause=e)

            if ret.startswith('enhanced_except_') or ret.endswith(s):
                raise JSInterpreter.Exception('Signature function returned an exception')
            return ret

        return extract_nsig

    def _extract_signature_timestamp(self, video_id, player_url, ytcfg=None, fatal=False):
        """
        Extract signatureTimestamp (sts)
        Required to tell API what sig/player version is in use.
        """
        player_sts_override = self._get_player_js_version()[0]
        if player_sts_override:
            return int(player_sts_override)

        if sts := traverse_obj(ytcfg, ('STS', {int_or_none})):
            return sts

        if not player_url:
            error_msg = 'Cannot extract signature timestamp without player url'
            if fatal:
                raise ExtractorError(error_msg)
            self.report_warning(error_msg)
            return None

        sts = self._load_player_data_from_cache('sts', player_url)
        if sts:
            return sts

        if code := self._load_player(video_id, player_url, fatal=fatal):
            sts = int_or_none(self._search_regex(
                r'(?:signatureTimestamp|sts)\s*:\s*(?P<sts>[0-9]{5})', code,
                'JS player signature timestamp', group='sts', fatal=fatal))
            if sts:
                self._store_player_data_to_cache('sts', player_url, sts)

        return sts

    def _mark_watched(self, video_id, player_responses):
        """Request the playback tracking URLs of the player responses to mark the video as watched

        Stops with a warning at the first tracking URL that cannot be found.
        """
        # cpn generation algorithm is reverse engineered from base.js.
        # In fact it works even with dummy cpn.
        alphabet = 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_'
        cpn = ''.join(alphabet[random.randint(0, 256) & 63] for _ in range(16))

        tracking_keys = ('videostatsPlaybackUrl', 'videostatsWatchtimeUrl')
        for is_full, key in enumerate(tracking_keys):
            label = 'fully ' if is_full else ''
            base_url = get_first(
                player_responses, ('playbackTracking', key, 'baseUrl'), expected_type=url_or_none)
            if not base_url:
                self.report_warning(f'Unable to mark {label}watched')
                return

            parts = urllib.parse.urlparse(base_url)
            query = urllib.parse.parse_qs(parts.query)

            # Reporting a position right before the end gives more consistent results
            reported_len = query.get('len') or ['1.5']
            video_length = [str(float(reported_len[0]) - 1)]

            extra = {
                'ver': ['2'],
                'cpn': [cpn],
                'cmt': video_length,
                'el': 'detailpage',  # otherwise defaults to "shorts"
            }
            if is_full:
                # these seem to mark watchtime "history" in the real world
                # they're required, so send in a single value
                extra['st'] = 0
                extra['et'] = video_length
            query.update(extra)

            tracking_url = urllib.parse.urlunparse(
                parts._replace(query=urllib.parse.urlencode(query, True)))

            self._download_webpage(
                tracking_url, video_id, f'Marking {label}watched',
                'Unable to mark watched', fatal=False)

    @classmethod
    def _extract_from_webpage(cls, url, webpage):
        """Yield results for YouTube videos referenced by a third-party webpage"""
        # Invidious Instances
        # https://github.com/yt-dlp/yt-dlp/issues/195
        # https://github.com/iv-org/invidious/pull/1730
        alternate_link = re.search(
            r'<link rel="alternate" href="(?P<url>https://www\.youtube\.com/watch\?v=[0-9A-Za-z_-]{11})"',
            webpage)
        if alternate_link is not None:
            # The page is a mirror of a single video; nothing else is looked for
            yield cls.url_result(alternate_link.group('url'), cls)
            raise cls.StopExtraction

        yield from super()._extract_from_webpage(url, webpage)

        # lazyYT YouTube embed
        lazy_ids = re.findall(r'class="lazyYT" data-youtube-id="([^"]+)"', webpage)
        for raw_id in lazy_ids:
            yield cls.url_result(unescapeHTML(raw_id), cls, raw_id)

        # Wordpress "YouTube Video Importer" plugin
        importer_matches = re.findall(r'''(?x)<div[^>]+
                class=(?P<q1>[\'"])[^\'"]*\byvii_single_video_player\b[^\'"]*(?P=q1)[^>]+
                data-video_id=(?P<q2>[\'"])([^\'"]+)(?P=q2)''', webpage)
        # Each match is a tuple of all groups; the video id is the last one
        for *_, importer_id in importer_matches:
            yield cls.url_result(importer_id, cls, importer_id)

    @classmethod
    def extract_id(cls, url):
        """Return the video ID for `url` as given by `get_temp_id`

        Raises ExtractorError if no ID can be determined.
        """
        if video_id := cls.get_temp_id(url):
            return video_id
        raise ExtractorError(f'Invalid URL: {url}')

    def _extract_chapters_from_json(self, data, duration):
        """Extract chapters from the chaptered player bar of the given data"""
        chapters_path = (
            'playerOverlays', 'playerOverlayRenderer', 'decoratedPlayerBarRenderer',
            'decoratedPlayerBarRenderer', 'playerBar', 'chapteredPlayerBarRenderer', 'chapters',
        )

        def start_seconds(chapter):
            # The start time is given in milliseconds
            start_ms = traverse_obj(chapter, ('chapterRenderer', 'timeRangeStartMillis'))
            return float_or_none(start_ms, scale=1000)

        def title_text(chapter):
            return traverse_obj(
                chapter, ('chapterRenderer', 'title', 'simpleText'), expected_type=str)

        return self._extract_chapters_helper(
            traverse_obj(data, chapters_path, expected_type=list),
            start_function=start_seconds,
            title_function=title_text,
            duration=duration)

    def _extract_chapters_from_engagement_panel(self, data, duration):
        """Extract chapters from the macro markers lists of the engagement panels

        Returns the chapters of the first list that yields any, otherwise an empty list.
        """
        content_list = traverse_obj(
            data,
            ('engagementPanels', ..., 'engagementPanelSectionListRenderer', 'content', 'macroMarkersListRenderer', 'contents'),
            expected_type=list)

        def chapter_time(chapter):
            return parse_duration(self._get_text(chapter, 'timeDescription'))

        def chapter_title(chapter):
            return self._get_text(chapter, 'title')

        for contents in content_list:
            markers = traverse_obj(contents, (..., 'macroMarkersListItemRenderer'))
            chapters = self._extract_chapters_helper(markers, chapter_time, chapter_title, duration)
            if chapters:
                return chapters
        return []

    def _extract_heatmap(self, data):
        """Extract the heatmap markers as a list of start_time/end_time/value dicts, or None"""
        def is_heatmap_mutation(_, mutation):
            markers_list = mutation['payload']['macroMarkersListEntity']['markersList']
            return markers_list['markerType'] == 'MARKER_TYPE_HEATMAP'

        def end_time_seconds(marker):
            # Start and duration are given in milliseconds
            return (int(marker['startMillis']) + int(marker['durationMillis'])) / 1000

        marker_fields = {
            'start_time': ('startMillis', {float_or_none(scale=1000)}),
            'end_time': {end_time_seconds},
            'value': ('intensityScoreNormalized', {float_or_none}),
        }
        heatmap = traverse_obj(data, (
            'frameworkUpdates', 'entityBatchUpdate', 'mutations', is_heatmap_mutation,
            'payload', 'macroMarkersListEntity', 'markersList', 'markers', ..., marker_fields))
        return heatmap or None

    def _extract_comment(self, entities, parent=None):
        """Build a comment dict from the entity payloads of a comment (new comment format)

        Returns None if the comment entity has no comment ID.
        """
        payload = get_first(entities, ('payload', 'commentEntityPayload', {dict}))
        comment_id = traverse_obj(payload, ('properties', 'commentId', {str}))
        if not comment_id:
            return None

        toolbar_state = get_first(entities, ('payload', 'engagementToolbarStateEntityPayload', {dict}))
        time_text = traverse_obj(payload, ('properties', 'publishedTime', {str})) or ''

        # Unknown (None) unless the toolbar state entity is available
        if toolbar_state is None:
            is_favorited = None
        else:
            is_favorited = toolbar_state.get('heartState') == 'TOOLBAR_HEART_STATE_HEARTED'

        comment = {
            'id': comment_id,
            'parent': parent or 'root',
        }
        comment.update(traverse_obj(payload, {
            'text': ('properties', 'content', 'content', {str}),
            'like_count': ('toolbar', 'likeCountA11y', {parse_count}),
            'author_id': ('author', 'channelId', {self.ucid_or_none}),
            'author': ('author', 'displayName', {str}),
            'author_thumbnail': ('author', 'avatarThumbnailUrl', {url_or_none}),
            'author_is_uploader': ('author', 'isCreator', {bool}),
            'author_is_verified': ('author', 'isVerified', {bool}),
            'author_url': ('author', 'channelCommand', 'innertubeCommand', (
                ('browseEndpoint', 'canonicalBaseUrl'), ('commandMetadata', 'webCommandMetadata', 'url'),
            ), {urljoin('https://www.youtube.com')}),
        }, get_all=False))
        comment['is_favorited'] = is_favorited
        # FIXME: non-standard, but we need a way of showing that it is an estimate.
        comment['_time_text'] = time_text
        comment['timestamp'] = self._parse_time_text(time_text)
        return comment

    def _extract_comment_old(self, comment_renderer, parent=None):
        """Build a comment dict from a comment renderer (old comment format)

        Returns None if the renderer has no comment ID.
        """
        comment_id = comment_renderer.get('commentId')
        if not comment_id:
            return None

        text = self._get_text(comment_renderer, 'contentText')
        like_count = self._get_count(comment_renderer, 'voteCount')
        author_id = traverse_obj(
            comment_renderer, ('authorEndpoint', 'browseEndpoint', 'browseId', {self.ucid_or_none}))
        author = self._get_text(comment_renderer, 'authorText')
        author_thumbnail = traverse_obj(
            comment_renderer, ('authorThumbnail', 'thumbnails', -1, 'url', {url_or_none}))

        # Timestamp is an estimate calculated from the current time and time_text
        time_text = self._get_text(comment_renderer, 'publishedTimeText') or ''
        timestamp = self._parse_time_text(time_text)

        author_path = traverse_obj(
            comment_renderer, ('authorEndpoint', (
                ('browseEndpoint', 'canonicalBaseUrl'), ('commandMetadata', 'webCommandMetadata', 'url'))),
            expected_type=str, get_all=False)

        info = {
            'id': comment_id,
            'text': text,
            'like_count': like_count,
            'author_id': author_id,
            'author': author,
            'author_thumbnail': author_thumbnail,
            'parent': parent or 'root',
            # FIXME: non-standard, but we need a way of showing that it is an estimate.
            '_time_text': time_text,
            'timestamp': timestamp,
            'author_url': urljoin('https://www.youtube.com', author_path),
        }

        # The remaining fields are only set when the renderer has information about them
        is_channel_owner = traverse_obj(comment_renderer, 'authorIsChannelOwner')
        if is_channel_owner is not None:
            info['author_is_uploader'] = is_channel_owner

        action_buttons = traverse_obj(
            comment_renderer, ('actionButtons', 'commentActionButtonsRenderer'), expected_type=dict)
        if action_buttons is not None:
            info['is_favorited'] = 'creatorHeart' in action_buttons

        badges = self._extract_badges([traverse_obj(comment_renderer, 'authorCommentBadge')])
        if self._has_badge(badges, BadgeType.VERIFIED):
            info['author_is_verified'] = True

        if traverse_obj(comment_renderer, 'pinnedCommentBadge'):
            info['is_pinned'] = True

        return info

    def _comment_entries(self, root_continuation_data, ytcfg, video_id, parent=None, tracker=None):
        """Generator of comment dicts for a comment section, or for a reply thread if `parent` is given

        Pages of comments are requested from the 'next' endpoint by following continuations,
        starting with the one found in `root_continuation_data`. Reply threads are handled
        by calling this method recursively with `parent` set to the ID of the parent comment.

        @param root_continuation_data   data from which the initial continuation is extracted
        @param ytcfg                    passed on for generating API headers and requests
        @param video_id                 video ID; used to generate a continuation if none is found
        @param parent                   ID of the parent comment when extracting replies
        @param tracker                  dict with counters and seen IDs, shared across recursive calls;
                                        created if not given
        @raises CommentsDisabled        if no comment was extracted for the top-level call
                                        and `root_continuation_data` carries a message
        """

        get_single_config_arg = lambda c: self._configuration_arg(c, [''])[0]

        def extract_header(contents):
            """Read the expected comment count and return the continuation for the chosen sort order"""
            _continuation = None
            for content in contents:
                comments_header_renderer = traverse_obj(content, 'commentsHeaderRenderer')
                expected_comment_count = self._get_count(
                    comments_header_renderer, 'countText', 'commentsCount')

                if expected_comment_count is not None:
                    tracker['est_total'] = expected_comment_count
                    self.to_screen(f'Downloading ~{expected_comment_count} comments')
                comment_sort_index = int(get_single_config_arg('comment_sort') != 'top')  # 1 = new, 0 = top

                sort_menu_item = try_get(
                    comments_header_renderer,
                    lambda x: x['sortMenu']['sortFilterSubMenuRenderer']['subMenuItems'][comment_sort_index], dict) or {}
                sort_continuation_ep = sort_menu_item.get('serviceEndpoint') or {}

                _continuation = self._extract_continuation_ep_data(sort_continuation_ep) or self._extract_continuation(sort_menu_item)
                if not _continuation:
                    continue

                sort_text = str_or_none(sort_menu_item.get('title'))
                if not sort_text:
                    sort_text = 'top comments' if comment_sort_index == 0 else 'newest first'
                self.to_screen(f'Sorting comments by {sort_text.lower()}')
                break
            return _continuation

        def extract_thread(contents, entity_payloads):
            """Yield the comments of one page, each followed by its replies

            A bare `yield` (None) is the signal for the caller to stop extraction.
            """
            if not parent:
                tracker['current_page_thread'] = 0
            for content in contents:
                # Limit on the number of top-level comments reached: signal stop
                if not parent and tracker['total_parent_comments'] >= max_parents:
                    yield
                comment_thread_renderer = try_get(content, lambda x: x['commentThreadRenderer'])

                # old comment format
                if not entity_payloads:
                    comment_renderer = get_first(
                        (comment_thread_renderer, content), [['commentRenderer', ('comment', 'commentRenderer')]],
                        expected_type=dict, default={})

                    comment = self._extract_comment_old(comment_renderer, parent)

                # new comment format
                else:
                    view_model = (
                        traverse_obj(comment_thread_renderer, ('commentViewModel', 'commentViewModel', {dict}))
                        or traverse_obj(content, ('commentViewModel', {dict})))
                    comment_keys = traverse_obj(view_model, (('commentKey', 'toolbarStateKey'), {str}))
                    if not comment_keys:
                        continue
                    # Select the entity payloads that belong to this comment
                    entities = traverse_obj(entity_payloads, lambda _, v: v['entityKey'] in comment_keys)
                    comment = self._extract_comment(entities, parent)
                    if comment:
                        comment['is_pinned'] = traverse_obj(view_model, ('pinnedText', {str})) is not None

                if not comment:
                    continue
                comment_id = comment['id']

                if comment.get('is_pinned'):
                    tracker['pinned_comment_ids'].add(comment_id)
                # Sometimes YouTube may break and give us infinite looping comments.
                # See: https://github.com/yt-dlp/yt-dlp/issues/6290
                if comment_id in tracker['seen_comment_ids']:
                    if comment_id in tracker['pinned_comment_ids'] and not comment.get('is_pinned'):
                        # Pinned comments may appear a second time in newest first sort
                        # See: https://github.com/yt-dlp/yt-dlp/issues/6712
                        continue
                    self.report_warning(
                        'Detected YouTube comments looping. Stopping comment extraction '
                        f'{"for this thread" if parent else ""} as we probably cannot get any more.')
                    yield
                else:
                    tracker['seen_comment_ids'].add(comment['id'])

                tracker['running_total'] += 1
                tracker['total_reply_comments' if parent else 'total_parent_comments'] += 1
                yield comment

                # Attempt to get the replies
                comment_replies_renderer = try_get(
                    comment_thread_renderer, lambda x: x['replies']['commentRepliesRenderer'], dict)

                if comment_replies_renderer:
                    tracker['current_page_thread'] += 1
                    comment_entries_iter = self._comment_entries(
                        comment_replies_renderer, ytcfg, video_id,
                        parent=comment.get('id'), tracker=tracker)
                    # Take no more replies than the per-thread limit and the remaining total reply limit allow
                    yield from itertools.islice(comment_entries_iter, min(
                        max_replies_per_thread, max(0, max_replies - tracker['total_reply_comments'])))

        # Keeps track of counts across recursive calls
        if not tracker:
            tracker = {
                'running_total': 0,
                'est_total': None,
                'current_page_thread': 0,
                'total_parent_comments': 0,
                'total_reply_comments': 0,
                'seen_comment_ids': set(),
                'pinned_comment_ids': set(),
            }

        # TODO: Deprecated
        # YouTube comments have a max depth of 2
        max_depth = int_or_none(get_single_config_arg('max_comment_depth'))
        if max_depth:
            self._downloader.deprecated_feature('[youtube] max_comment_depth extractor argument is deprecated. '
                                                'Set max replies in the max-comments extractor argument instead')
        if max_depth == 1 and parent:
            return

        # The max_comments argument holds up to four limits; values that are
        # missing or not integers fall back to sys.maxsize
        _max_comments, max_parents, max_replies, max_replies_per_thread, *_ = (
            int_or_none(p, default=sys.maxsize) for p in self._configuration_arg('max_comments') + [''] * 4)

        continuation = self._extract_continuation(root_continuation_data)

        response = None
        is_forced_continuation = False
        is_first_continuation = parent is None
        if is_first_continuation and not continuation:
            # Sometimes you can get comments by generating the continuation yourself,
            # even if YouTube initially reports them being disabled - e.g. stories comments.
            # Note: if the comment section is actually disabled, YouTube may return a response with
            # required check_get_keys missing. So we will disable that check initially in this case.
            continuation = self._build_api_continuation_query(self._generate_comment_continuation(video_id))
            is_forced_continuation = True

        continuation_items_path = (
            'onResponseReceivedEndpoints', ..., ('reloadContinuationItemsCommand', 'appendContinuationItemsAction'), 'continuationItems')
        # One iteration per requested page; ends when no further continuation is found
        for page_num in itertools.count(0):
            if not continuation:
                break
            headers = self.generate_api_headers(ytcfg=ytcfg, visitor_data=self._extract_visitor_data(response))
            comment_prog_str = f"({tracker['running_total']}/~{tracker['est_total']})"
            if page_num == 0:
                if is_first_continuation:
                    note_prefix = 'Downloading comment section API JSON'
                else:
                    note_prefix = '    Downloading comment API JSON reply thread %d %s' % (
                        tracker['current_page_thread'], comment_prog_str)
            else:
                note_prefix = '{}Downloading comment{} API JSON page {} {}'.format(
                    '       ' if parent else '', ' replies' if parent else '',
                    page_num, comment_prog_str)

            # Do a deep check for incomplete data as sometimes YouTube may return no comments for a continuation
            # Ignore check if YouTube says the comment count is 0.
            check_get_keys = None
            if not is_forced_continuation and not (tracker['est_total'] == 0 and tracker['running_total'] == 0):
                check_get_keys = [[*continuation_items_path, ..., (
                    'commentsHeaderRenderer' if is_first_continuation else ('commentThreadRenderer', 'commentViewModel', 'commentRenderer'))]]
            try:
                response = self._extract_response(
                    item_id=None, query=continuation,
                    ep='next', ytcfg=ytcfg, headers=headers, note=note_prefix,
                    check_get_keys=check_get_keys)
            except ExtractorError as e:
                # Ignore incomplete data error for replies if retries didn't work.
                # This is to allow any other parent comments and comment threads to be downloaded.
                # See: https://github.com/yt-dlp/yt-dlp/issues/4669
                if 'incomplete data' in str(e).lower() and parent:
                    if self.get_param('ignoreerrors') in (True, 'only_download'):
                        self.report_warning(
                            'Received incomplete data for a comment reply thread and retrying did not help. '
                            'Ignoring to let other comments be downloaded. Pass --no-ignore-errors to not ignore.')
                        return
                    else:
                        raise ExtractorError(
                            'Incomplete data received for comment reply thread. '
                            'Pass --ignore-errors to ignore and allow rest of comments to download.',
                            expected=True)
                raise
            is_forced_continuation = False
            continuation = None
            # Entity payloads of the new comment format; empty for the old format
            mutations = traverse_obj(response, ('frameworkUpdates', 'entityBatchUpdate', 'mutations', ..., {dict}))
            for continuation_items in traverse_obj(response, continuation_items_path, expected_type=list, default=[]):
                if is_first_continuation:
                    # The first response is only used for its header (count and sort continuation)
                    continuation = extract_header(continuation_items)
                    is_first_continuation = False
                    if continuation:
                        break
                    continue

                for entry in extract_thread(continuation_items, mutations):
                    # A None entry is the stop signal of extract_thread
                    if not entry:
                        return
                    yield entry
                continuation = self._extract_continuation({'contents': continuation_items})
                if continuation:
                    break

        # Nothing was extracted for the top-level call: report the message given by YouTube, if any
        message = self._get_text(root_continuation_data, ('contents', ..., 'messageRenderer', 'text'), max_runs=1)
        if message and not parent and tracker['running_total'] == 0:
            self.report_warning(f'Youtube said: {message}', video_id=video_id, only_once=True)
            raise self.CommentsDisabled

    @staticmethod
    def _generate_comment_continuation(video_id):
        """
        Generates initial comment section continuation token from given video id
        """
        token = f'\x12\r\x12\x0b{video_id}\x18\x062\'"\x11"\x0b{video_id}0\x00x\x020\x00B\x10comments-section'
        return base64.b64encode(token.encode()).decode()

    def _get_comments(self, ytcfg, video_id, contents, webpage):
        """
        Entry point for comment extraction.

        Returns a lazy iterator over the comment entries of the section
        identified as 'comment-item-section' in `contents`, truncated to the
        `max_comments` extractor argument when one is given.
        """
        def _real_comment_extract(contents):
            # Pick the first item section that is flagged as the comment section
            section = None
            for candidate in traverse_obj(contents, (..., 'itemSectionRenderer'), default={}):
                if candidate.get('sectionIdentifier') == 'comment-item-section':
                    section = candidate
                    break
            yield from self._comment_entries(section, ytcfg, video_id)

        limit = int_or_none(self._configuration_arg('max_comments', [''])[0])
        # A limit of None leaves the iterator unbounded
        return itertools.islice(_real_comment_extract(contents), limit)

    @staticmethod
    def _get_checkok_params():
        return {'contentCheckOk': True, 'racyCheckOk': True}

    @classmethod
    def _generate_player_context(cls, sts=None):
        context = {
            'html5Preference': 'HTML5_PREF_WANTS',
        }
        if sts is not None:
            context['signatureTimestamp'] = sts
        return {
            'playbackContext': {
                'contentPlaybackContext': context,
            },
            **cls._get_checkok_params(),
        }

    def _get_config_po_token(self, client: str, context: _PoTokenContext):
        po_token_strs = self._configuration_arg('po_token', [], ie_key=YoutubeIE, casesense=True)
        for token_str in po_token_strs:
            po_token_meta, sep, po_token = token_str.partition('+')
            if not sep:
                self.report_warning(
                    f'Invalid po_token configuration format. '
                    f'Expected "CLIENT.CONTEXT+PO_TOKEN", got "{token_str}"', only_once=True)
                continue

            po_token_client, sep, po_token_context = po_token_meta.partition('.')
            if po_token_client.lower() != client:
                continue

            if not sep:
                # TODO(future): deprecate the old format?
                self.write_debug(
                    f'po_token configuration for {client} client is missing a context; assuming GVS. '
                    'You can provide a context with the format "CLIENT.CONTEXT+PO_TOKEN"',
                    only_once=True)
                po_token_context = _PoTokenContext.GVS.value

            if po_token_context.lower() != context.value:
                continue

            # Clean and validate the PO Token. This will strip invalid characters off
            # (e.g. additional url params the user may accidentally include)
            try:
                return base64.urlsafe_b64encode(base64.urlsafe_b64decode(urllib.parse.unquote(po_token))).decode()
            except (binascii.Error, ValueError):
                self.report_warning(
                    f'Invalid po_token configuration for {client} client: '
                    f'{po_token_context} PO Token should be a base64url-encoded string.',
                    only_once=True)
                continue

    def fetch_po_token(self, client='web', context: _PoTokenContext = _PoTokenContext.GVS, ytcfg=None, visitor_data=None,
                       data_sync_id=None, session_index=None, player_url=None, video_id=None, webpage=None,
                       required=False, **kwargs):
        """
        Fetch a PO Token for a given client and context. This function will validate required parameters for a given context and client.

        A token supplied through the `po_token` extractor argument takes precedence over
        fetching one via `_fetch_po_token`.

        EXPERIMENTAL: This method is unstable and may change or be removed without notice.

        @param client: The client to fetch the PO Token for.
        @param context: The context in which the PO Token is used.
        @param ytcfg: The ytcfg for the client.
        @param visitor_data: visitor data.
        @param data_sync_id: data sync ID.
        @param session_index: session index.
        @param player_url: player URL.
        @param video_id: video ID.
        @param webpage: video webpage.
        @param required: Whether the PO Token is required (i.e. try to fetch unless policy is "never").
        @param kwargs: Additional arguments to pass down. May be more added in the future.
        @return: The fetched PO Token. None if it could not be fetched.
        """

        # TODO(future): This validation should be moved into pot framework.
        #  Some sort of middleware or validation provider perhaps?

        # The visitor data / data sync ID checks below only apply to GVS tokens
        # that are requested together with a player URL
        is_gvs_webpo = player_url and context == _PoTokenContext.GVS

        # GVS WebPO Token is bound to visitor_data / Visitor ID when logged out.
        # Must have visitor_data for it to function.
        if is_gvs_webpo and not visitor_data and not self.is_authenticated:
            self.report_warning(
                f'Unable to fetch GVS PO Token for {client} client: Missing required Visitor Data. '
                f'You may need to pass Visitor Data with --extractor-args "youtube:visitor_data=XXX"', only_once=True)
            return

        if context == _PoTokenContext.PLAYER and not video_id:
            self.report_warning(
                f'Unable to fetch Player PO Token for {client} client: Missing required Video ID')
            return

        config_po_token = self._get_config_po_token(client, context)
        if config_po_token:
            # GVS WebPO token is bound to data_sync_id / account Session ID when logged in.
            # A user-supplied token is still returned; the user is only warned.
            if is_gvs_webpo and not data_sync_id and self.is_authenticated:
                self.report_warning(
                    f'Got a GVS PO Token for {client} client, but missing Data Sync ID for account. Formats may not work. '
                    f'You may need to pass a Data Sync ID with --extractor-args "youtube:data_sync_id=XXX"')

            self.write_debug(f'{video_id}: Retrieved a {context.value} PO Token for {client} client from config')
            return config_po_token

        # Require a Data Sync ID for GVS WebPO Tokens if logged in for external fetching
        if is_gvs_webpo and not data_sync_id and self.is_authenticated:
            self.report_warning(
                f'Unable to fetch GVS PO Token for {client} client: Missing required Data Sync ID for account. '
                f'You may need to pass a Data Sync ID with --extractor-args "youtube:data_sync_id=XXX"', only_once=True)
            return

        po_token = self._fetch_po_token(
            client=client,
            context=context.value,
            ytcfg=ytcfg,
            visitor_data=visitor_data,
            data_sync_id=data_sync_id,
            session_index=session_index,
            player_url=player_url,
            video_id=video_id,
            video_webpage=webpage,
            required=required,
            **kwargs,
        )

        if po_token:
            self.write_debug(f'{video_id}: Retrieved a {context.value} PO Token for {client} client')
            return po_token

    def _fetch_po_token(self, client, **kwargs):
        context = kwargs.get('context')

        # Avoid fetching PO Tokens when not required
        fetch_pot_policy = self._configuration_arg('fetch_pot', [''], ie_key=YoutubeIE)[0]
        if fetch_pot_policy not in ('never', 'auto', 'always'):
            fetch_pot_policy = 'auto'
        if (
            fetch_pot_policy == 'never'
            or (
                fetch_pot_policy == 'auto'
                and not kwargs.get('required', False)
            )
        ):
            return None

        headers = self.get_param('http_headers').copy()
        proxies = self._downloader.proxies.copy()
        clean_headers(headers)
        clean_proxies(proxies, headers)

        innertube_host = self._select_api_hostname(None, default_client=client)

        pot_request = PoTokenRequest(
            context=PoTokenContext(context),
            innertube_context=traverse_obj(kwargs, ('ytcfg', 'INNERTUBE_CONTEXT')),
            innertube_host=innertube_host,
            internal_client_name=client,
            session_index=kwargs.get('session_index'),
            player_url=kwargs.get('player_url'),
            video_webpage=kwargs.get('video_webpage'),
            is_authenticated=self.is_authenticated,
            visitor_data=kwargs.get('visitor_data'),
            data_sync_id=kwargs.get('data_sync_id'),
            video_id=kwargs.get('video_id'),
            request_cookiejar=self._downloader.cookiejar,

            # All requests that would need to be proxied should be in the
            # context of www.youtube.com or the innertube host
            request_proxy=(
                select_proxy('https://www.youtube.com', proxies)
                or select_proxy(f'https://{innertube_host}', proxies)
            ),
            request_headers=headers,
            request_timeout=self.get_param('socket_timeout'),
            request_verify_tls=not self.get_param('nocheckcertificate'),
            request_source_address=self.get_param('source_address'),

            bypass_cache=False,
        )

        return self._pot_director.get_po_token(pot_request)

    @staticmethod
    def _is_agegated(player_response):
        """
        Tell whether a player response indicates an age-gated video.

        True when the playability status carries a `desktopLegacyAgeGateReason`,
        or when its `status` / `reason` text contains one of the known age-gate
        markers. Matching is case-insensitive, since status values are
        upper-case (e.g. 'AGE_CHECK_REQUIRED') while the markers are lower-case.
        """
        if traverse_obj(player_response, ('playabilityStatus', 'desktopLegacyAgeGateReason')):
            return True

        reasons = traverse_obj(player_response, ('playabilityStatus', ('status', 'reason')))
        AGE_GATE_REASONS = (
            'confirm your age', 'age-restricted', 'inappropriate',  # reason
            'age_verification_required', 'age_check_required',  # status
        )
        # Normalise case once per value and ignore anything that is not text
        normalized = [reason.lower() for reason in reasons if isinstance(reason, str)]
        return any(expected in reason for expected in AGE_GATE_REASONS for reason in normalized)

    @staticmethod
    def _is_unplayable(player_response):
        """Tell whether the playability status of a player response is 'UNPLAYABLE'."""
        status = traverse_obj(player_response, ('playabilityStatus', 'status'))
        return status == 'UNPLAYABLE'

    def _extract_player_response(self, client, video_id, webpage_ytcfg, player_ytcfg, player_url, initial_pr, visitor_data, data_sync_id, po_token):
        """
        Request the 'player' endpoint for `video_id` on behalf of `client`.

        The query carries the video id, optional player params (the client's
        default, overridable with the `player_params` extractor argument),
        an optional PO Token, and the playback context. The signature
        timestamp is only looked up when a `player_url` is given.

        @return: The response of the request, or None if it is empty.
        """
        api_headers = self.generate_api_headers(
            ytcfg=player_ytcfg,
            default_client=client,
            visitor_data=visitor_data,
            session_index=self._extract_session_index(webpage_ytcfg, player_ytcfg),
            # Values parsed from an explicit data sync ID win over extracted ones
            delegated_session_id=(
                self._parse_data_sync_id(data_sync_id)[0]
                or self._extract_delegated_session_id(webpage_ytcfg, initial_pr, player_ytcfg)
            ),
            user_session_id=(
                self._parse_data_sync_id(data_sync_id)[1]
                or self._extract_user_session_id(webpage_ytcfg, initial_pr, player_ytcfg)
            ),
        )

        innertube_name = _split_innertube_client(client)[0]
        fallback_params = traverse_obj(INNERTUBE_CLIENTS, (innertube_name, 'PLAYER_PARAMS', {str}))
        player_params = self._configuration_arg('player_params', [fallback_params], casesense=True)[0]

        request_body = {'videoId': video_id}
        if player_params:
            request_body['params'] = player_params
        if po_token:
            request_body['serviceIntegrityDimensions'] = {'poToken': po_token}

        sts = None
        if player_url:
            sts = self._extract_signature_timestamp(video_id, player_url, webpage_ytcfg, fatal=False)
        request_body.update(self._generate_player_context(sts))

        client_label = client.replace('_', ' ').strip()
        response = self._extract_response(
            item_id=video_id, ep='player', query=request_body,
            ytcfg=player_ytcfg, headers=api_headers, fatal=True,
            default_client=client,
            note='Downloading {} player API JSON'.format(client_label),
        )
        return response or None

    def _get_requested_clients(self, url, smuggled_data, is_premium_subscriber):
        """
        Resolve the `player_client` extractor argument into the list of clients to use.

        Each entry may be 'default' (the default set for the current session type),
        'all' (every non-underscore-prefixed client, highest priority first),
        '-NAME' (exclude NAME) or a client name. Unknown names are skipped with a
        warning. The default set is used when no client is requested explicitly.

        For authenticated sessions, 'web_music' is added for music URLs and
        clients that do not support cookies are dropped with a warning.

        @return: The requested clients, de-duplicated with order preserved.
        @raise ExtractorError: If no client is left after applying exclusions.
        """
        requested_clients = []
        excluded_clients = set()
        default_clients = (
            self._DEFAULT_PREMIUM_CLIENTS if is_premium_subscriber
            else self._DEFAULT_AUTHED_CLIENTS if self.is_authenticated
            else self._DEFAULT_CLIENTS
        )
        allowed_clients = sorted(
            (client for client in INNERTUBE_CLIENTS if client[:1] != '_'),
            key=lambda client: INNERTUBE_CLIENTS[client]['priority'], reverse=True)
        for client in self._configuration_arg('player_client'):
            if client == 'default':
                requested_clients.extend(default_clients)
            elif client == 'all':
                requested_clients.extend(allowed_clients)
            elif client.startswith('-'):
                excluded_clients.add(client[1:])
            elif client not in allowed_clients:
                self.report_warning(f'Skipping unsupported client "{client}"')
            else:
                requested_clients.append(client)
        if not requested_clients:
            requested_clients.extend(default_clients)

        # Drop every occurrence of an excluded client. A client can appear more than once
        # here (e.g. "all,web"), and removing only the first occurrence would let it survive.
        requested_clients = [
            client for client in requested_clients if client not in excluded_clients]
        if not requested_clients:
            raise ExtractorError('No player clients have been requested', expected=True)

        if self.is_authenticated:
            if (smuggled_data.get('is_music_url') or self.is_music_url(url)) and 'web_music' not in requested_clients:
                requested_clients.append('web_music')

            unsupported_clients = [
                client for client in requested_clients if not INNERTUBE_CLIENTS[client]['SUPPORTS_COOKIES']
            ]
            for client in unsupported_clients:
                self.report_warning(f'Skipping client "{client}" since it does not support cookies', only_once=True)
                requested_clients.remove(client)

        return orderedSet(requested_clients)

    def _invalid_player_response(self, pr, video_id):
        """
        Return the video id found in `pr` when it differs from `video_id`, else None.

        YouTube may return a different video player response than expected.
        See: https://github.com/TeamNewPipe/NewPipe/issues/8713
        """
        pr_id = traverse_obj(pr, ('videoDetails', 'videoId'))
        if pr_id == video_id:
            return None
        return pr_id

    def _extract_player_responses(self, clients, video_id, webpage, webpage_client, webpage_ytcfg, is_premium_subscriber):
        """
        Collect player responses for `video_id` from the given clients.

        The initial player response embedded in `webpage` (if any) is added first with
        its streaming data stripped. The clients are then processed in the order given;
        further clients may be queued while iterating when a response looks age-gated.
        Accepted responses are annotated with client details under the
        `STREAMING_DATA_*` keys for later introspection.

        @return: Tuple of (list of player responses, player URL or None).
        @raise ExtractorError: If no usable player response was obtained.
        """
        initial_pr = None
        if webpage:
            initial_pr = self._search_json(
                self._YT_INITIAL_PLAYER_RESPONSE_RE, webpage,
                f'{webpage_client} client initial player response', video_id, fatal=False)

        prs = []
        deprioritized_prs = []

        if initial_pr and not self._invalid_player_response(initial_pr, video_id):
            # Android player_response does not have microFormats which are needed for
            # extraction of some data. So we return the initial_pr with formats
            # stripped out even if not requested by the user
            # See: https://github.com/yt-dlp/yt-dlp/issues/501
            prs.append({**initial_pr, 'streamingData': None})

        all_clients = set(clients)
        # Reversed so that pop() below yields the clients in their original order,
        # and so that clients appended during the loop are processed next
        clients = clients[::-1]

        def append_client(*client_names):
            """ Append the first client name that exists but not already used """
            for client_name in client_names:
                actual_client = _split_innertube_client(client_name)[0]
                if actual_client in INNERTUBE_CLIENTS:
                    if actual_client not in all_clients:
                        clients.append(client_name)
                        all_clients.add(actual_client)
                        return

        tried_iframe_fallback = False
        # These are resolved once and then reused for all subsequent clients
        player_url = visitor_data = data_sync_id = None
        # Maps client -> video id of the mismatching player response it returned
        skipped_clients = {}
        while clients:
            # NOTE: this flag is never set to True within this method,
            # so deprioritized_prs currently always stays empty
            deprioritize_pr = False
            client, base_client, variant = _split_innertube_client(clients.pop())
            player_ytcfg = webpage_ytcfg if client == webpage_client else {}
            if 'configs' not in self._configuration_arg('player_skip') and client != webpage_client:
                player_ytcfg = self._download_ytcfg(client, video_id) or player_ytcfg

            player_url = player_url or self._extract_player_url(webpage_ytcfg, player_ytcfg, webpage=webpage)
            require_js_player = self._get_default_ytcfg(client).get('REQUIRE_JS_PLAYER')
            if 'js' in self._configuration_arg('player_skip'):
                require_js_player = False
                player_url = None

            # The fallback player URL download is attempted at most once per call
            if not player_url and not tried_iframe_fallback and require_js_player:
                player_url = self._download_player_url(video_id)
                tried_iframe_fallback = True

            pr = None
            if client == webpage_client and 'player_response' not in self._configuration_arg('webpage_skip'):
                pr = initial_pr

            visitor_data = visitor_data or self._extract_visitor_data(webpage_ytcfg, initial_pr, player_ytcfg)
            data_sync_id = data_sync_id or self._extract_data_sync_id(webpage_ytcfg, initial_pr, player_ytcfg)

            # Arguments shared by the player, GVS and subtitles PO Token fetches for this client
            fetch_po_token_args = {
                'client': client,
                'visitor_data': visitor_data,
                'video_id': video_id,
                'data_sync_id': data_sync_id if self.is_authenticated else None,
                'player_url': player_url if require_js_player else None,
                'webpage': webpage,
                'session_index': self._extract_session_index(webpage_ytcfg, player_ytcfg),
                'ytcfg': player_ytcfg or self._get_default_ytcfg(client),
            }

            # Don't need a player PO token for WEB if using player response from webpage
            player_pot_policy: PlayerPoTokenPolicy = self._get_default_ytcfg(client)['PLAYER_PO_TOKEN_POLICY']
            player_po_token = None if pr else self.fetch_po_token(
                context=_PoTokenContext.PLAYER, **fetch_po_token_args,
                required=player_pot_policy.required or player_pot_policy.recommended)

            # GVS and subtitles tokens are not fetched here; the partials are stored
            # on the response below so they can be called later
            fetch_gvs_po_token_func = functools.partial(
                self.fetch_po_token, context=_PoTokenContext.GVS, **fetch_po_token_args)

            fetch_subs_po_token_func = functools.partial(
                self.fetch_po_token, context=_PoTokenContext.SUBS, **fetch_po_token_args)

            try:
                pr = pr or self._extract_player_response(
                    client, video_id,
                    webpage_ytcfg=player_ytcfg or webpage_ytcfg,
                    player_ytcfg=player_ytcfg,
                    player_url=player_url,
                    initial_pr=initial_pr,
                    visitor_data=visitor_data,
                    data_sync_id=data_sync_id,
                    po_token=player_po_token)
            except ExtractorError as e:
                # A failing client is reported and skipped; the remaining clients are still tried
                self.report_warning(e)
                continue

            if pr_id := self._invalid_player_response(pr, video_id):
                skipped_clients[client] = pr_id
            elif pr:
                # Save client details for introspection later
                innertube_context = traverse_obj(player_ytcfg or self._get_default_ytcfg(client), 'INNERTUBE_CONTEXT')
                fetched_timestamp = int(time.time())
                sd = pr.setdefault('streamingData', {})
                sd[STREAMING_DATA_CLIENT_NAME] = client
                sd[STREAMING_DATA_FETCH_GVS_PO_TOKEN] = fetch_gvs_po_token_func
                sd[STREAMING_DATA_PLAYER_TOKEN_PROVIDED] = bool(player_po_token)
                sd[STREAMING_DATA_INNERTUBE_CONTEXT] = innertube_context
                sd[STREAMING_DATA_FETCH_SUBS_PO_TOKEN] = fetch_subs_po_token_func
                sd[STREAMING_DATA_IS_PREMIUM_SUBSCRIBER] = is_premium_subscriber
                # Each individual format also carries the client details and fetch time
                for f in traverse_obj(sd, (('formats', 'adaptiveFormats'), ..., {dict})):
                    f[STREAMING_DATA_CLIENT_NAME] = client
                    f[STREAMING_DATA_FETCH_GVS_PO_TOKEN] = fetch_gvs_po_token_func
                    f[STREAMING_DATA_IS_PREMIUM_SUBSCRIBER] = is_premium_subscriber
                    f[STREAMING_DATA_PLAYER_TOKEN_PROVIDED] = bool(player_po_token)
                    f[STREAMING_DATA_FETCHED_TIMESTAMP] = fetched_timestamp
                if deprioritize_pr:
                    deprioritized_prs.append(pr)
                else:
                    prs.append(pr)

            # web_embedded can work around age-gate and age-verification for some embeddable videos
            if self._is_agegated(pr) and variant != 'web_embedded':
                append_client(f'web_embedded.{base_client}')
            # Unauthenticated users will only get web_embedded client formats if age-gated
            if self._is_agegated(pr) and not self.is_authenticated:
                self.to_screen(
                    f'{video_id}: This video is age-restricted; some formats may be missing '
                    f'without authentication. {self._youtube_login_hint}', only_once=True)

            # EU countries require age-verification for accounts to access age-restricted videos
            # If account is not age-verified, _is_agegated() will be truthy for non-embedded clients
            embedding_is_disabled = variant == 'web_embedded' and self._is_unplayable(pr)
            if self.is_authenticated and (self._is_agegated(pr) or embedding_is_disabled):
                self.to_screen(
                    f'{video_id}: This video is age-restricted and YouTube is requiring '
                    'account age-verification; some formats may be missing', only_once=True)
                # tv_embedded can work around the age-verification requirement for embeddable videos
                # web_creator may work around age-verification for all videos but requires PO token
                append_client('tv_embedded', 'web_creator')

            status = traverse_obj(pr, ('playabilityStatus', 'status', {str}))
            if status not in ('OK', 'LIVE_STREAM_OFFLINE', 'AGE_CHECK_REQUIRED', 'AGE_VERIFICATION_REQUIRED'):
                self.write_debug(f'{video_id}: {client} player response playability status: {status}')

        prs.extend(deprioritized_prs)

        # Responses for a different video were skipped above; report them, and fail
        # with a dedicated message if they were the only responses received
        if skipped_clients:
            self.report_warning(
                f'Skipping player responses from {"/".join(skipped_clients)} clients '
                f'(got player responses for video "{"/".join(set(skipped_clients.values()))}" instead of "{video_id}")')
            if not prs:
                raise ExtractorError(
                    'All player responses are invalid. Your IP is likely being blocked by Youtube', expected=True)
        elif not prs:
            raise ExtractorError('Failed to extract any player response')
        return prs, player_url

    def _needs_live_processing(self, live_status, duration):
        if ((live_status == 'is_live' and self.get_param('live_from_start'))
                or (live_status == 'post_live' and (duration or 0) > 2 * 3600)):
            return live_status

    def _report_pot_format_skipped(self, video_id, client_name, proto):
        """
        Report that `proto` formats of a client are skipped for lack of a GVS PO Token.

        The message is only written to the debug log for default clients and
        is raised as a warning for any other client. It is reported only once.
        """
        notice = (
            f'{video_id}: {client_name} client {proto} formats require a GVS PO Token which was not provided. '
            'They will be skipped as they may yield HTTP Error 403. '
            f'You can manually pass a GVS PO Token for this client with --extractor-args "youtube:po_token={client_name}.gvs+XXX". '
            f'For more information, refer to  {PO_TOKEN_GUIDE_URL}')

        # Only raise a warning for non-default clients, to not confuse users.
        is_default_client = client_name in (*self._DEFAULT_CLIENTS, *self._DEFAULT_AUTHED_CLIENTS)
        report = self.write_debug if is_default_client else self.report_warning
        report(notice, only_once=True)

    def _report_pot_subtitles_skipped(self, video_id, client_name, msg=None):
        """
        Report that some subtitles of a client are discarded for lack of a PO Token.

        A custom `msg` replaces the default message. The message is raised as a
        warning only when subtitles are wanted and the client is not a default
        one; otherwise it is written to the debug log. It is reported only once.
        """
        if not msg:
            msg = (
                f'{video_id}: Some {client_name} client subtitles require a PO Token which was not provided. '
                'They will be discarded since they are not downloadable as-is. '
                f'You can manually pass a Subtitles PO Token for this client with '
                f'--extractor-args "youtube:po_token={client_name}.subs+XXX" . '
                f'For more information, refer to  {PO_TOKEN_GUIDE_URL}')

        subtitle_options = [
            self.get_param(option)
            for option in ('writesubtitles', 'writeautomaticsub', 'listsubtitles')]

        # Only raise a warning for non-default clients, to not confuse users.
        if any(subtitle_options) and client_name not in (*self._DEFAULT_CLIENTS, *self._DEFAULT_AUTHED_CLIENTS):
            self.report_warning(msg, only_once=True)
        else:
            self.write_debug(msg, only_once=True)

    def _extract_formats_and_subtitles(self, streaming_data, video_id, player_url, live_status, duration):
        CHUNK_SIZE = 10 << 20
        PREFERRED_LANG_VALUE = 10
        original_language = None
        itags, stream_ids = collections.defaultdict(set), []
        itag_qualities, res_qualities = {}, {0: None}
        q = qualities([
            # Normally tiny is the smallest video-only formats. But
            # audio-only formats with unknown quality may get tagged as tiny
            'tiny',
            'audio_quality_ultralow', 'audio_quality_low', 'audio_quality_medium', 'audio_quality_high',  # Audio only formats
            'small', 'medium', 'large', 'hd720', 'hd1080', 'hd1440', 'hd2160', 'hd2880', 'highres',
        ])
        streaming_formats = traverse_obj(streaming_data, (..., ('formats', 'adaptiveFormats'), ...))
        format_types = self._configuration_arg('formats')
        all_formats = 'duplicate' in format_types
        if self._configuration_arg('include_duplicate_formats'):
            all_formats = True
            self._downloader.deprecated_feature('[youtube] include_duplicate_formats extractor argument is deprecated. '
                                                'Use formats=duplicate extractor argument instead')

        def build_fragments(f):
            return LazyList({
                'url': update_url_query(f['url'], {
                    'range': f'{range_start}-{min(range_start + CHUNK_SIZE - 1, f["filesize"])}',
                }),
            } for range_start in range(0, f['filesize'], CHUNK_SIZE))

        def gvs_pot_required(policy, is_premium_subscriber, has_player_token):
            return (
                policy.required
                and not (policy.not_required_with_player_token and has_player_token)
                and not (policy.not_required_for_premium and is_premium_subscriber))

        # save pots per client to avoid fetching again
        gvs_pots = {}

        # For handling potential pre-playback required waiting period
        playback_wait = int_or_none(self._configuration_arg('playback_wait', [None])[0], default=6)

        for fmt in streaming_formats:
            client_name = fmt[STREAMING_DATA_CLIENT_NAME]
            available_at = fmt[STREAMING_DATA_FETCHED_TIMESTAMP] + playback_wait
            if fmt.get('targetDurationSec'):
                continue

            itag = str_or_none(fmt.get('itag'))
            audio_track = fmt.get('audioTrack') or {}
            stream_id = (itag, audio_track.get('id'), fmt.get('isDrc'))
            if not all_formats:
                if stream_id in stream_ids:
                    continue

            quality = fmt.get('quality')
            height = int_or_none(fmt.get('height'))
            if quality == 'tiny' or not quality:
                quality = fmt.get('audioQuality', '').lower() or quality
            # The 3gp format (17) in android client has a quality of "small",
            # but is actually worse than other formats
            if itag == '17':
                quality = 'tiny'
            if quality:
                if itag:
                    itag_qualities[itag] = quality
                if height:
                    res_qualities[height] = quality

            display_name = audio_track.get('displayName') or ''
            is_original = 'original' in display_name.lower()
            is_descriptive = 'descriptive' in display_name.lower()
            is_default = audio_track.get('audioIsDefault')
            language_code = audio_track.get('id', '').split('.')[0]
            if language_code and (is_original or (is_default and not original_language)):
                original_language = language_code

            has_drm = bool(fmt.get('drmFamilies'))

            # FORMAT_STREAM_TYPE_OTF(otf=1) requires downloading the init fragment
            # (adding `&sq=0` to the URL) and parsing emsg box to determine the
            # number of fragment that would subsequently requested with (`&sq=N`)
            if fmt.get('type') == 'FORMAT_STREAM_TYPE_OTF' and not has_drm:
                continue

            if has_drm:
                msg = f'Some {client_name} client https formats have been skipped as they are DRM protected. '
                if client_name == 'tv':
                    msg += (
                        f'{"Your account" if self.is_authenticated else "The current session"} may have '
                        f'an experiment that applies DRM to all videos on the tv client. '
                        f'See  https://github.com/yt-dlp/yt-dlp/issues/12563  for more details.'
                    )
                self.report_warning(msg, video_id, only_once=True)

            fmt_url = fmt.get('url')
            if not fmt_url:
                sc = urllib.parse.parse_qs(fmt.get('signatureCipher'))
                fmt_url = url_or_none(try_get(sc, lambda x: x['url'][0]))
                encrypted_sig = try_get(sc, lambda x: x['s'][0])
                if not all((sc, fmt_url, player_url, encrypted_sig)):
                    msg = f'Some {client_name} client https formats have been skipped as they are missing a url. '
                    if client_name in ('web', 'web_safari'):
                        msg += 'YouTube is forcing SABR streaming for this client. '
                    else:
                        msg += (
                            f'YouTube may have enabled the SABR-only or Server-Side Ad Placement experiment for '
                            f'{"your account" if self.is_authenticated else "the current session"}. '
                        )
                    msg += 'See  https://github.com/yt-dlp/yt-dlp/issues/12482  for more details'
                    self.report_warning(msg, video_id, only_once=True)
                    continue
                try:
                    fmt_url += '&{}={}'.format(
                        traverse_obj(sc, ('sp', -1)) or 'signature',
                        self._decrypt_signature(encrypted_sig, video_id, player_url),
                    )
                except ExtractorError as e:
                    self.report_warning(
                        f'Signature extraction failed: Some formats may be missing\n'
                        f'         player = {player_url}\n'
                        f'         {bug_reports_message(before="")}',
                        video_id=video_id, only_once=True)
                    self.write_debug(
                        f'{video_id}: Signature extraction failure info:\n'
                        f'         encrypted sig = {encrypted_sig}\n'
                        f'         player = {player_url}')
                    self.write_debug(e, only_once=True)
                    continue

            query = parse_qs(fmt_url)
            if query.get('n'):
                try:
                    decrypt_nsig = self._cached(self._decrypt_nsig, 'nsig', query['n'][0])
                    fmt_url = update_url_query(fmt_url, {
                        'n': decrypt_nsig(query['n'][0], video_id, player_url),
                    })
                except ExtractorError as e:
                    if player_url:
                        self.report_warning(
                            f'nsig extraction failed: Some formats may be missing\n'
                            f'         n = {query["n"][0]} ; player = {player_url}\n'
                            f'         {bug_reports_message(before="")}',
                            video_id=video_id, only_once=True)
                        self.write_debug(e, only_once=True)
                    else:
                        self.report_warning(
                            'Cannot decrypt nsig without player_url: Some formats may be missing',
                            video_id=video_id, only_once=True)
                    continue

            tbr = float_or_none(fmt.get('averageBitrate') or fmt.get('bitrate'), 1000)
            format_duration = traverse_obj(fmt, ('approxDurationMs', {float_or_none(scale=1000)}))
            # Some formats may have much smaller duration than others (possibly damaged during encoding)
            # E.g. 2-nOtRESiUc Ref: https://github.com/yt-dlp/yt-dlp/issues/2823
            # Make sure to avoid false positives with small duration differences.
            # E.g. __2ABJjxzNo, ySuUZEjARPY
            is_damaged = try_call(lambda: format_duration < duration // 2)
            if is_damaged:
                self.report_warning(
                    'Some formats are possibly damaged. They will be deprioritized', video_id, only_once=True)

            fetch_po_token_func = fmt[STREAMING_DATA_FETCH_GVS_PO_TOKEN]
            pot_policy: GvsPoTokenPolicy = self._get_default_ytcfg(client_name)['GVS_PO_TOKEN_POLICY'][StreamingProtocol.HTTPS]

            require_po_token = (
                itag not in ['18']
                and gvs_pot_required(
                    pot_policy, fmt[STREAMING_DATA_IS_PREMIUM_SUBSCRIBER],
                    fmt[STREAMING_DATA_PLAYER_TOKEN_PROVIDED]))

            po_token = (
                gvs_pots.get(client_name)
                or fetch_po_token_func(required=require_po_token or pot_policy.recommended))

            if po_token:
                fmt_url = update_url_query(fmt_url, {'pot': po_token})
                if client_name not in gvs_pots:
                    gvs_pots[client_name] = po_token

            if not po_token and require_po_token and 'missing_pot' not in self._configuration_arg('formats'):
                self._report_pot_format_skipped(video_id, client_name, 'https')
                continue

            name = fmt.get('qualityLabel') or quality.replace('audio_quality_', '') or ''
            fps = int_or_none(fmt.get('fps')) or 0
            dct = {
                'asr': int_or_none(fmt.get('audioSampleRate')),
                'filesize': int_or_none(fmt.get('contentLength')),
                'format_id': f'{itag}{"-drc" if fmt.get("isDrc") else ""}',
                'format_note': join_nonempty(
                    join_nonempty(display_name, is_default and ' (default)', delim=''),
                    name, fmt.get('isDrc') and 'DRC',
                    try_get(fmt, lambda x: x['projectionType'].replace('RECTANGULAR', '').lower()),
                    try_get(fmt, lambda x: x['spatialAudioType'].replace('SPATIAL_AUDIO_TYPE_', '').lower()),
                    is_damaged and 'DAMAGED', require_po_token and not po_token and 'MISSING POT',
                    (self.get_param('verbose') or all_formats) and short_client_name(client_name),
                    delim=', '),
                # Format 22 is likely to be damaged. See https://github.com/yt-dlp/yt-dlp/issues/3372
                'source_preference': (-5 if itag == '22' else -1) + (100 if 'Premium' in name else 0),
                'fps': fps if fps > 1 else None,  # For some formats, fps is wrongly returned as 1
                'audio_channels': fmt.get('audioChannels'),
                'height': height,
                'quality': q(quality) - bool(fmt.get('isDrc')) / 2,
                'has_drm': has_drm,
                'tbr': tbr,
                'filesize_approx': filesize_from_tbr(tbr, format_duration),
                'url': fmt_url,
                'width': int_or_none(fmt.get('width')),
                'language': join_nonempty(language_code, 'desc' if is_descriptive else '') or None,
                'language_preference': PREFERRED_LANG_VALUE if is_original else 5 if is_default else -10 if is_descriptive else -1,
                # Strictly de-prioritize damaged and 3gp formats
                'preference': -10 if is_damaged else -2 if itag == '17' else None,
            }
            mime_mobj = re.match(
                r'((?:[^/]+)/(?:[^;]+))(?:;\s*codecs="([^"]+)")?', fmt.get('mimeType') or '')
            if mime_mobj:
                dct['ext'] = mimetype2ext(mime_mobj.group(1))
                dct.update(parse_codecs(mime_mobj.group(2)))
            if itag:
                itags[itag].add(('https', dct.get('language')))
                stream_ids.append(stream_id)
            single_stream = 'none' in (dct.get('acodec'), dct.get('vcodec'))
            if single_stream and dct.get('ext'):
                dct['container'] = dct['ext'] + '_dash'

            # For handling potential pre-playback required waiting period
            if live_status not in ('is_live', 'post_live'):
                dct['available_at'] = available_at

            if (all_formats or 'dashy' in format_types) and dct['filesize']:
                yield {
                    **dct,
                    'format_id': f'{dct["format_id"]}-dashy' if all_formats else dct['format_id'],
                    'protocol': 'http_dash_segments',
                    'fragments': build_fragments(dct),
                }
            if all_formats or 'dashy' not in format_types:
                dct['downloader_options'] = {'http_chunk_size': CHUNK_SIZE}
                yield dct

        needs_live_processing = self._needs_live_processing(live_status, duration)
        skip_bad_formats = 'incomplete' not in format_types

        skip_manifests = set(self._configuration_arg('skip'))
        if (needs_live_processing == 'is_live'  # These will be filtered out by YoutubeDL anyway
                or (needs_live_processing and skip_bad_formats)):
            skip_manifests.add('hls')
        if skip_bad_formats and live_status == 'is_live' and needs_live_processing != 'is_live':
            skip_manifests.add('dash')

        def process_manifest_format(f, proto, client_name, itag, missing_pot):
            """Post-process one manifest format dict in place and decide whether to keep it.

            `f` is a format dict taken from a manifest, `proto` is the manifest
            protocol name used by the callers ('hls' or 'dash'), `client_name` is the
            client the manifest came from, `itag` is the format's itag (may be None
            for HLS when it cannot be found in the URL) and `missing_pot` tells
            whether a required PO Token could not be obtained.

            Returns False, without touching `f`, when `all_formats` is falsy and the
            same (protocol, language) pair was already recorded for this itag.
            Otherwise `f` is updated in place and True is returned.
            """
            # NOTE(review): `itags` is defined outside this view; it is used here as a
            # mapping of itag -> set of (protocol, language) pairs - confirm
            key = (proto, f.get('language'))
            if not all_formats and key in itags[itag]:
                return False

            # For handling potential pre-playback required waiting period
            if live_status not in ('is_live', 'post_live'):
                f['available_at'] = available_at

            # Give every format a numeric baseline so the adjustments below can use -=/+=
            if f.get('source_preference') is None:
                f['source_preference'] = -1

            # Deprioritize since its pre-merged m3u8 formats may have lower quality audio streams
            if client_name == 'web_safari' and proto == 'hls' and live_status != 'is_live':
                f['source_preference'] -= 1

            # Formats kept despite a missing PO Token are labelled and pushed far down
            if missing_pot:
                f['format_note'] = join_nonempty(f.get('format_note'), 'MISSING POT', delim=' ')
                f['source_preference'] -= 20

            # Record this (protocol, language) pair; it must happen before the
            # format_id decision below, which inspects the recorded protocols
            itags[itag].add(key)

            if itag and all_formats:
                f['format_id'] = f'{itag}-{proto}'
            # The itag has been recorded under a different protocol as well,
            # so the protocol is appended to keep the format_id distinct
            elif any(p != proto for p, _ in itags[itag]):
                f['format_id'] = f'{itag}-{proto}'
            elif itag:
                f['format_id'] = itag

            if original_language and f.get('language') == original_language:
                f['format_note'] = join_nonempty(f.get('format_note'), '(default)', delim=' ')
                f['language_preference'] = PREFERRED_LANG_VALUE

            # These two itags are labelled 'Premium' and strongly preferred
            if itag in ('616', '235'):
                f['format_note'] = join_nonempty(f.get('format_note'), 'Premium', delim=' ')
                f['source_preference'] += 100

            # Look up the quality by the itag part of the format_id (text before the first '-').
            # NOTE(review): `q`, `itag_qualities` and `res_qualities` are defined outside
            # this view; `q` presumably returns -1 for an unknown label - confirm
            f['quality'] = q(itag_qualities.get(try_get(f, lambda f: f['format_id'].split('-')[0]), -1))
            # Fall back to the entry of `res_qualities` whose key is closest to the format height
            if f['quality'] == -1 and f.get('height'):
                f['quality'] = q(res_qualities[min(res_qualities, key=lambda x: abs(x - f['height']))])
            if self.get_param('verbose') or all_formats:
                f['format_note'] = join_nonempty(
                    f.get('format_note'), short_client_name(client_name), delim=', ')
            # Drop fps values of 1 or below instead of reporting them
            if f.get('fps') and f['fps'] <= 1:
                del f['fps']

            # For HLS, a truthy DRM flag is downgraded to 'maybe' and the format is deprioritized
            if proto == 'hls' and f.get('has_drm'):
                f['has_drm'] = 'maybe'
                f['source_preference'] -= 5
            return True

        subtitles = {}
        for sd in streaming_data:
            client_name = sd[STREAMING_DATA_CLIENT_NAME]
            fetch_pot_func = sd[STREAMING_DATA_FETCH_GVS_PO_TOKEN]
            is_premium_subscriber = sd[STREAMING_DATA_IS_PREMIUM_SUBSCRIBER]
            has_player_token = sd[STREAMING_DATA_PLAYER_TOKEN_PROVIDED]

            hls_manifest_url = 'hls' not in skip_manifests and sd.get('hlsManifestUrl')
            if hls_manifest_url:
                pot_policy: GvsPoTokenPolicy = self._get_default_ytcfg(
                    client_name)['GVS_PO_TOKEN_POLICY'][StreamingProtocol.HLS]
                require_po_token = gvs_pot_required(pot_policy, is_premium_subscriber, has_player_token)
                po_token = gvs_pots.get(client_name, fetch_pot_func(required=require_po_token or pot_policy.recommended))
                if po_token:
                    hls_manifest_url = hls_manifest_url.rstrip('/') + f'/pot/{po_token}'
                    if client_name not in gvs_pots:
                        gvs_pots[client_name] = po_token
                if require_po_token and not po_token and 'missing_pot' not in self._configuration_arg('formats'):
                    self._report_pot_format_skipped(video_id, client_name, 'hls')
                else:
                    fmts, subs = self._extract_m3u8_formats_and_subtitles(
                        hls_manifest_url, video_id, 'mp4', fatal=False, live=live_status == 'is_live')
                    for sub in traverse_obj(subs, (..., ..., {dict})):
                        # TODO: If HLS video requires a PO Token, do the subs also require pot?
                        # Save client name for debugging
                        sub[STREAMING_DATA_CLIENT_NAME] = client_name
                    subtitles = self._merge_subtitles(subs, subtitles)
                    for f in fmts:
                        if process_manifest_format(f, 'hls', client_name, self._search_regex(
                                r'/itag/(\d+)', f['url'], 'itag', default=None), require_po_token and not po_token):
                            yield f

            dash_manifest_url = 'dash' not in skip_manifests and sd.get('dashManifestUrl')
            if dash_manifest_url:
                pot_policy: GvsPoTokenPolicy = self._get_default_ytcfg(
                    client_name)['GVS_PO_TOKEN_POLICY'][StreamingProtocol.DASH]
                require_po_token = gvs_pot_required(pot_policy, is_premium_subscriber, has_player_token)
                po_token = gvs_pots.get(client_name, fetch_pot_func(required=require_po_token or pot_policy.recommended))
                if po_token:
                    dash_manifest_url = dash_manifest_url.rstrip('/') + f'/pot/{po_token}'
                    if client_name not in gvs_pots:
                        gvs_pots[client_name] = po_token
                if require_po_token and not po_token and 'missing_pot' not in self._configuration_arg('formats'):
                    self._report_pot_format_skipped(video_id, client_name, 'dash')
                else:
                    formats, subs = self._extract_mpd_formats_and_subtitles(dash_manifest_url, video_id, fatal=False)
                    for sub in traverse_obj(subs, (..., ..., {dict})):
                        # TODO: If DASH video requires a PO Token, do the subs also require pot?
                        # Save client name for debugging
                        sub[STREAMING_DATA_CLIENT_NAME] = client_name
                    subtitles = self._merge_subtitles(subs, subtitles)  # Prioritize HLS subs over DASH
                    for f in formats:
                        if process_manifest_format(f, 'dash', client_name, f['format_id'], require_po_token and not po_token):
                            f['filesize'] = int_or_none(self._search_regex(
                                r'/clen/(\d+)', f.get('fragment_base_url') or f['url'], 'file size', default=None))
                            if needs_live_processing:
                                f['is_from_start'] = True

                            yield f
        yield subtitles

    def _extract_storyboard(self, player_responses, duration):
        """Yield one `mhtml` storyboard format dict per storyboard level.

        The storyboard spec is read from `player_responses`. It is a `|`-separated
        string whose first element is a URL template and whose remaining elements
        each describe one level as 8 `#`-separated fields. The first five fields
        are width, height, frame count, columns and rows; the last two are the
        value substituted for `$N` in the template and the `sigh` signature.

        `duration` is the video duration used to derive the frame rate and the
        per-fragment durations. When it is missing or zero nothing is yielded,
        because those values cannot be computed.

        Levels with a malformed spec are reported with a warning and skipped.
        """
        # The list is reversed so that pop() below removes the leading URL template
        spec = get_first(
            player_responses, ('storyboards', 'playerStoryboardSpecRenderer', 'spec'), default='').split('|')[::-1]
        base_url = url_or_none(urljoin('https://i.ytimg.com/', spec.pop() or None))
        if not base_url:
            return
        if not duration:
            # Both fps and the fragment durations are obtained by dividing by/with
            # the duration; dividing with None or 0 would raise inside this
            # generator and abort the whole extraction
            self.write_debug('Skipping storyboards since the video duration is unknown')
            return

        # Levels are iterated in reverse order, so `top_level - i` is the
        # position of the level in the original (un-reversed) spec
        top_level = len(spec) - 1
        for i, args in enumerate(spec):
            args = args.split('#')
            counts = list(map(int_or_none, args[:5]))
            if len(args) != 8 or not all(counts):
                self.report_warning(f'Malformed storyboard {i}: {"#".join(args)}{bug_reports_message()}')
                continue
            width, height, frame_count, cols, rows = counts
            name_template, sigh = args[6:]

            url = base_url.replace('$L', str(top_level - i)).replace('$N', name_template) + f'&sigh={sigh}'
            # Each fragment is one image sheet holding up to cols * rows frames
            fragment_count = frame_count / (cols * rows)
            fragment_duration = duration / fragment_count
            yield {
                'format_id': f'sb{i}',
                'format_note': 'storyboard',
                'ext': 'mhtml',
                'protocol': 'mhtml',
                'acodec': 'none',
                'vcodec': 'none',
                'url': url,
                'width': width,
                'height': height,
                'fps': frame_count / duration,
                'rows': rows,
                'columns': cols,
                'fragments': [{
                    'url': url.replace('$M', str(j)),
                    # The last sheet may be partially filled, so it covers only the remaining time
                    'duration': min(fragment_duration, duration - (j * fragment_duration)),
                } for j in range(math.ceil(fragment_count))],
            }

    def _download_initial_webpage(self, webpage_url, webpage_client, video_id):
        """Download the watch page for `video_id` and return it, or None if skipped.

        Nothing is downloaded when `webpage_url` is empty or when 'webpage' is
        listed in the `player_skip` extractor argument. The request carries a
        fixed query plus an optional `pp` value, taken from the `player_params`
        extractor argument or else from the `PLAYER_PARAMS` entry of
        `webpage_client`, and the User-Agent from that client's default ytcfg.
        """
        if not webpage_url or 'webpage' in self._configuration_arg('player_skip'):
            return None

        # A user-supplied value takes precedence over the client's own player params
        player_params = (
            self._configuration_arg('player_params', [None], casesense=True)[0]
            or traverse_obj(INNERTUBE_CLIENTS, (webpage_client, 'PLAYER_PARAMS', {str})))

        request_query = {'bpctr': '9999999999', 'has_verified': '1'}
        if player_params:
            request_query['pp'] = player_params

        request_headers = traverse_obj(self._get_default_ytcfg(webpage_client), {
            'User-Agent': ('INNERTUBE_CONTEXT', 'client', 'userAgent', {str}),
        })
        return self._download_webpage_with_retries(
            webpage_url, video_id, query=request_query, headers=request_headers)

    def _list_formats(self, video_id, microformats, video_details, player_responses, player_url, duration=None):
        """Determine the live status and gather the formats and subtitles of a video.

        Returns the tuple
        `(live_broadcast_details, live_status, streaming_data, formats, subtitles)`.
        `live_status` is one of 'post_live', 'is_live', 'is_upcoming', 'was_live',
        'not_live' or None when it cannot be told from the metadata.
        """
        live_broadcast_details = traverse_obj(microformats, (..., 'liveBroadcastDetails'))

        def detail(name):
            return get_first(video_details, name)

        is_live = detail('isLive')
        if is_live is None:
            # Not stated in the video details; fall back to the microformat
            is_live = get_first(live_broadcast_details, 'isLiveNow')
        live_content = detail('isLiveContent')
        is_upcoming = detail('isUpcoming')
        post_live = detail('isPostLiveDvr')

        # The checks are ordered by precedence; the first truthy flag wins
        if post_live:
            live_status = 'post_live'
        elif is_live:
            live_status = 'is_live'
        elif is_upcoming:
            live_status = 'is_upcoming'
        elif live_content:
            live_status = 'was_live'
        elif False in (is_live, live_content):
            # Only an explicit False proves that the video is not live
            live_status = 'not_live'
        else:
            live_status = None

        streaming_data = traverse_obj(player_responses, (..., 'streamingData'))
        # The generator yields every format first and the subtitles dict last
        *formats, subtitles = self._extract_formats_and_subtitles(
            streaming_data, video_id, player_url, live_status, duration)

        has_drm_free_format = any(not fmt.get('has_drm') for fmt in formats)
        if not has_drm_free_format:
            # If there are no formats that definitely don't have DRM, all have DRM
            for fmt in formats:
                fmt['has_drm'] = True

        return live_broadcast_details, live_status, streaming_data, formats, subtitles

    def _download_initial_data(self, video_id, webpage, webpage_client, webpage_ytcfg):
        """Return the initial data for `video_id`, or None if it is unavailable.

        The data embedded in `webpage` is used when it has a 'contents' entry,
        unless 'initial_data' is listed in the `webpage_skip` extractor argument.
        Otherwise it is requested from the 'next' API endpoint, unless
        'initial_data' is listed in the `player_skip` extractor argument.
        """
        use_embedded = webpage and 'initial_data' not in self._configuration_arg('webpage_skip')
        initial_data = (
            self.extract_yt_initial_data(video_id, webpage, fatal=False)
            if use_embedded else None)
        if use_embedded and not traverse_obj(initial_data, 'contents'):
            self.report_warning('Incomplete data received in embedded initial data; re-fetching using API.')
            initial_data = None

        # Usable embedded data, or the API fallback is disabled: nothing more to do
        if initial_data or 'initial_data' in self._configuration_arg('player_skip'):
            return initial_data

        api_query = {'videoId': video_id}
        api_query.update(self._get_checkok_params())
        return self._extract_response(
            item_id=video_id, ep='next', fatal=False,
            ytcfg=webpage_ytcfg, query=api_query, check_get_keys='contents',
            note='Downloading initial data API JSON', default_client=webpage_client)

    def _is_premium_subscriber(self, initial_data):
        """Tell from `initial_data` whether the logged-in account has YouTube Premium.

        Always False when not authenticated or when `initial_data` is empty.
        Otherwise the topbar logo is inspected: either its icon type is the
        Premium logo or its tooltip text mentions 'premium' (case-insensitive).
        """
        if not (self.is_authenticated and initial_data):
            return False

        logo_renderer = traverse_obj(
            initial_data, ('topbar', 'desktopTopbarRenderer', 'logo', 'topbarLogoRenderer'))
        if traverse_obj(logo_renderer, ('iconImage', 'iconType')) == 'YOUTUBE_PREMIUM_LOGO':
            return True

        tooltip = self._get_text(logo_renderer, 'tooltipText') or ''
        return 'premium' in tooltip.lower()

    def _initial_extract(self, url, smuggled_data, webpage_url, webpage_client, video_id):
        """Run the initial downloads for a video and return their results.

        Returns the tuple `(webpage, webpage_ytcfg, initial_data,
        is_premium_subscriber, player_responses, player_url)`.

        This function is also used by live-from-start refresh.
        """
        webpage = self._download_initial_webpage(webpage_url, webpage_client, video_id)

        # Fall back to the client's default ytcfg when none could be read from the webpage
        webpage_ytcfg = self.extract_ytcfg(video_id, webpage)
        if not webpage_ytcfg:
            webpage_ytcfg = self._get_default_ytcfg(webpage_client)

        initial_data = self._download_initial_data(video_id, webpage, webpage_client, webpage_ytcfg)

        is_premium_subscriber = self._is_premium_subscriber(initial_data)
        if is_premium_subscriber:
            self.write_debug('Detected YouTube Premium subscription')

        requested_clients = self._get_requested_clients(url, smuggled_data, is_premium_subscriber)
        player_responses, player_url = self._extract_player_responses(
            requested_clients, video_id, webpage, webpage_client, webpage_ytcfg, is_premium_subscriber)

        return (
            webpage, webpage_ytcfg, initial_data,
            is_premium_subscriber, player_responses, player_url,
        )

    def _real_extract(self, url):
        url, smuggled_data = unsmuggle_url(url, {})
        video_id = self._match_id(url)

        base_url = self.http_scheme() + '//www.youtube.com/'
        webpage_url = base_url + 'watch?v=' + video_id
        webpage_client = 'web'

        webpage, webpage_ytcfg, initial_data, is_premium_subscriber, player_responses, player_url = self._initial_extract(
            url, smuggled_data, webpage_url, webpage_client, video_id)

        playability_statuses = traverse_obj(
            player_responses, (..., 'playabilityStatus'), expected_type=dict)

        trailer_video_id = get_first(
            playability_statuses,
            ('errorScreen', 'playerLegacyDesktopYpcTrailerRenderer', 'trailerVideoId'),
            expected_type=str)
        if trailer_video_id:
            return self.url_result(
                trailer_video_id, self.ie_key(), trailer_video_id)

        search_meta = ((lambda x: self._html_search_meta(x, webpage, default=None))
                       if webpage else (lambda x: None))

        video_details = traverse_obj(player_responses, (..., 'videoDetails'), expected_type=dict)
        microformats = traverse_obj(
            player_responses, (..., 'microformat', 'playerMicroformatRenderer'),
            expected_type=dict)

        # Fallbacks in case player responses are missing metadata
        initial_sdcr = traverse_obj(initial_data, (
            'engagementPanels', ..., 'engagementPanelSectionListRenderer',
            'content', 'structuredDescriptionContentRenderer', {dict}, any))
        initial_description = traverse_obj(initial_sdcr, (
            'items', ..., 'expandableVideoDescriptionBodyRenderer',
            'attributedDescriptionBodyText', 'content', {str}, any))
        # videoDescriptionHeaderRenderer also has publishDate/channel/handle/ucid, but not needed
        initial_vdhr = traverse_obj(initial_sdcr, (
            'items', ..., 'videoDescriptionHeaderRenderer', {dict}, any)) or {}
        initial_video_details_renderer = traverse_obj(initial_data, (
            'playerOverlays', 'playerOverlayRenderer', 'videoDetails',
            'playerOverlayVideoDetailsRenderer', {dict})) or {}
        initial_title = (
            self._get_text(initial_vdhr, 'title')
            or self._get_text(initial_video_details_renderer, 'title'))

        translated_title = self._get_text(microformats, (..., 'title'))
        video_title = ((self._preferred_lang and translated_title)
                       or get_first(video_details, 'title')  # primary
                       or translated_title
                       or search_meta(['og:title', 'twitter:title', 'title']))
        if not video_title and initial_title:
            self.report_warning(
                'No title found in player responses; falling back to title from initial data. '
                'Other metadata may also be missing')
            video_title = initial_title
        translated_description = self._get_text(microformats, (..., 'description'))
        original_description = get_first(video_details, 'shortDescription')
        video_description = (
            (self._preferred_lang and translated_description)
            # If original description is blank, it will be an empty string.
            # Do not prefer translated description in this case.
            or original_description if original_description is not None else translated_description)
        if video_description is None:
            video_description = initial_description

        multifeed_metadata_list = get_first(
            player_responses,
            ('multicamera', 'playerLegacyMulticameraRenderer', 'metadataList'),
            expected_type=str)
        if multifeed_metadata_list and not smuggled_data.get('force_singlefeed'):
            if self.get_param('noplaylist'):
                self.to_screen(f'Downloading just video {video_id} because of --no-playlist')
            else:
                entries = []
                feed_ids = []
                for feed in multifeed_metadata_list.split(','):
                    # Unquote should take place before split on comma (,) since textual
                    # fields may contain comma as well (see
                    # https://github.com/ytdl-org/youtube-dl/issues/8536)
                    feed_data = urllib.parse.parse_qs(
                        urllib.parse.unquote_plus(feed))

                    def feed_entry(name):
                        return try_get(
                            feed_data, lambda x: x[name][0], str)

                    feed_id = feed_entry('id')
                    if not feed_id:
                        continue
                    feed_title = feed_entry('title')
                    title = video_title
                    if feed_title:
                        title += f' ({feed_title})'
                    entries.append({
                        '_type': 'url_transparent',
                        'ie_key': 'Youtube',
                        'url': smuggle_url(
                            '{}watch?v={}'.format(base_url, feed_data['id'][0]),
                            {'force_singlefeed': True}),
                        'title': title,
                    })
                    feed_ids.append(feed_id)
                self.to_screen(
                    'Downloading multifeed video ({}) - add --no-playlist to just download video {}'.format(
                        ', '.join(feed_ids), video_id))
                return self.playlist_result(
                    entries, video_id, video_title, video_description)

        duration = (int_or_none(get_first(video_details, 'lengthSeconds'))
                    or int_or_none(get_first(microformats, 'lengthSeconds'))
                    or parse_duration(search_meta('duration')) or None)

        live_broadcast_details, live_status, streaming_data, formats, automatic_captions = \
            self._list_formats(video_id, microformats, video_details, player_responses, player_url, duration)
        if live_status == 'post_live':
            self.write_debug(f'{video_id}: Video is in Post-Live Manifestless mode')

        if not formats:
            if not self.get_param('allow_unplayable_formats') and traverse_obj(streaming_data, (..., 'licenseInfos')):
                self.report_drm(video_id)
            pemr = get_first(
                playability_statuses,
                ('errorScreen', 'playerErrorMessageRenderer'), expected_type=dict) or {}
            reason = self._get_text(pemr, 'reason') or get_first(playability_statuses, 'reason')
            subreason = clean_html(self._get_text(pemr, 'subreason') or '')
            if subreason:
                if subreason.startswith('The uploader has not made this video available in your country'):
                    countries = get_first(microformats, 'availableCountries')
                    if not countries:
                        regions_allowed = search_meta('regionsAllowed')
                        countries = regions_allowed.split(',') if regions_allowed else None
                    self.raise_geo_restricted(subreason, countries, metadata_available=True)
                reason += f'. {subreason}'
            if reason:
                if 'sign in' in reason.lower():
                    reason = remove_end(reason, 'This helps protect our community. Learn more')
                    reason = f'{remove_end(reason.strip(), ".")}. {self._youtube_login_hint}'
                elif get_first(playability_statuses, ('errorScreen', 'playerCaptchaViewModel', {dict})):
                    reason += '. YouTube is requiring a captcha challenge before playback'
                elif "This content isn't available, try again later" in reason:
                    reason = (
                        f'{remove_end(reason.strip(), ".")}. {"Your account" if self.is_authenticated else "The current session"} '
                        f'has been rate-limited by YouTube for up to an hour. It is recommended to use `-t sleep` to add a delay '
                        f'between video requests to avoid exceeding the rate limit. For more information, refer to  '
                        f'https://github.com/yt-dlp/yt-dlp/wiki/Extractors#this-content-isnt-available-try-again-later'
                    )
                self.raise_no_formats(reason, expected=True)

        keywords = get_first(video_details, 'keywords', expected_type=list) or []
        if not keywords and webpage:
            keywords = [
                unescapeHTML(m.group('content'))
                for m in re.finditer(self._meta_regex('og:video:tag'), webpage)]
        for keyword in keywords:
            if keyword.startswith('yt:stretch='):
                mobj = re.search(r'(\d+)\s*:\s*(\d+)', keyword)
                if mobj:
                    # NB: float is intentional for forcing float division
                    w, h = (float(v) for v in mobj.groups())
                    if w > 0 and h > 0:
                        ratio = w / h
                        for f in formats:
                            if f.get('vcodec') != 'none':
                                f['stretched_ratio'] = ratio
                        break
        thumbnails = self._extract_thumbnails((video_details, microformats), (..., ..., 'thumbnail'))
        thumbnail_url = search_meta(['og:image', 'twitter:image'])
        if thumbnail_url:
            thumbnails.append({
                'url': thumbnail_url,
            })
        original_thumbnails = thumbnails.copy()

        # The best resolution thumbnails sometimes does not appear in the webpage
        # See: https://github.com/yt-dlp/yt-dlp/issues/340
        # List of possible thumbnails - Ref: <https://stackoverflow.com/a/20542029>
        thumbnail_names = [
            # While the *1,*2,*3 thumbnails are just below their corresponding "*default" variants
            # in resolution, these are not the custom thumbnail. So de-prioritize them
            'maxresdefault', 'hq720', 'sddefault', 'hqdefault', '0', 'mqdefault', 'default',
            'sd1', 'sd2', 'sd3', 'hq1', 'hq2', 'hq3', 'mq1', 'mq2', 'mq3', '1', '2', '3',
        ]
        n_thumbnail_names = len(thumbnail_names)
        thumbnails.extend({
            'url': 'https://i.ytimg.com/vi{webp}/{video_id}/{name}{live}.{ext}'.format(
                video_id=video_id, name=name, ext=ext,
                webp='_webp' if ext == 'webp' else '', live='_live' if live_status == 'is_live' else ''),
        } for name in thumbnail_names for ext in ('webp', 'jpg'))
        for thumb in thumbnails:
            i = next((i for i, t in enumerate(thumbnail_names) if f'/{video_id}/{t}' in thumb['url']), n_thumbnail_names)
            thumb['preference'] = (0 if '.webp' in thumb['url'] else -1) - (2 * i)
        self._remove_duplicate_formats(thumbnails)
        self._downloader._sort_thumbnails(original_thumbnails)

        category = get_first(microformats, 'category') or search_meta('genre')
        channel_id = self.ucid_or_none(str_or_none(
            get_first(video_details, 'channelId')
            or get_first(microformats, 'externalChannelId')
            or search_meta('channelId')))
        owner_profile_url = get_first(microformats, 'ownerProfileUrl')

        live_start_time = parse_iso8601(get_first(live_broadcast_details, 'startTimestamp'))
        live_end_time = parse_iso8601(get_first(live_broadcast_details, 'endTimestamp'))
        if not duration and live_end_time and live_start_time:
            duration = live_end_time - live_start_time

        needs_live_processing = self._needs_live_processing(live_status, duration)

        def is_bad_format(fmt):
            """Return True when `fmt` should be deprioritized for the current live state.

            That is the case when live processing is needed but the format is not
            marked `is_from_start`, or when the video is live, live processing is
            not 'is_live', and the format uses the 'http_dash_segments' protocol.
            Any other format yields None (falsy).
            """
            if needs_live_processing and not fmt.get('is_from_start'):
                return True

            live_without_live_processing = (
                live_status == 'is_live' and needs_live_processing != 'is_live')
            if live_without_live_processing and fmt.get('protocol') == 'http_dash_segments':
                return True

            return None

        for fmt in filter(is_bad_format, formats):
            fmt['preference'] = (fmt.get('preference') or -1) - 10
            fmt['format_note'] = join_nonempty(fmt.get('format_note'), '(Last 2 hours)', delim=' ')

        if needs_live_processing:
            self._prepare_live_from_start_formats(
                formats, video_id, live_start_time, url, webpage_url, smuggled_data, live_status == 'is_live')

        formats.extend(self._extract_storyboard(player_responses, duration))

        channel_handle = self.handle_from_url(owner_profile_url)

        info = {
            'id': video_id,
            'title': video_title,
            'formats': formats,
            'thumbnails': thumbnails,
            # The best thumbnail that we are sure exists. Prevents unnecessary
            # URL checking if the user doesn't care about getting the best possible thumbnail
            'thumbnail': traverse_obj(original_thumbnails, (-1, 'url')),
            'description': video_description,
            'channel_id': channel_id,
            'channel_url': format_field(channel_id, None, 'https://www.youtube.com/channel/%s', default=None),
            'duration': duration,
            'view_count': int_or_none(
                get_first((video_details, microformats), (..., 'viewCount'))
                or search_meta('interactionCount')),
            'average_rating': float_or_none(get_first(video_details, 'averageRating')),
            'age_limit': 18 if (
                get_first(microformats, 'isFamilySafe') is False
                or search_meta('isFamilyFriendly') == 'false'
                or search_meta('og:restrictions:age') == '18+') else 0,
            'webpage_url': webpage_url,
            'categories': [category] if category else None,
            'tags': keywords,
            'playable_in_embed': get_first(playability_statuses, 'playableInEmbed'),
            'live_status': live_status,
            'media_type': (
                'livestream' if get_first(video_details, 'isLiveContent')
                else 'short' if get_first(microformats, 'isShortsEligible')
                else 'video'),
            'release_timestamp': live_start_time,
            '_format_sort_fields': (  # source_preference is lower for potentially damaged formats
                'quality', 'res', 'fps', 'hdr:12', 'source', 'vcodec', 'channels', 'acodec', 'lang', 'proto'),
        }

        def get_lang_code(track):
            """Return the language code to use for a caption track dict.

            The track's 'vssId' is preferred: a leading '.' is removed and every
            remaining '.' is replaced with '-'. If that yields an empty string
            (including when 'vssId' is missing or falsy), the track's
            'languageCode' value is returned instead, which may be None.
            """
            vss_id = track.get('vssId') or ''
            normalized = remove_start(vss_id, '.').replace('.', '-')
            if normalized:
                return normalized
            return track.get('languageCode')

        def process_language(container, base_url, lang_code, sub_name, client_name, query):
            """Add one subtitle entry per known subtitle format to `container[lang_code]`.

            @param container    Dict mapping language codes to lists of subtitle entries;
                                the list for `lang_code` is created if absent and mutated in place
            @param base_url     Caption track URL that the per-format query is applied to
            @param lang_code    Key under which the entries are stored
            @param sub_name     Value stored as each entry's 'name'
            @param client_name  Stored on each entry under STREAMING_DATA_CLIENT_NAME
            @param query        Extra query parameters merged into every generated URL;
                                'fmt' and 'xosf' are always overridden
            """
            entries = container.setdefault(lang_code, [])
            for sub_ext in self._SUBTITLE_FORMATS:
                # xosf=1 results in undesirable text position data for vtt, json3 & srv* subtitles
                # See: https://github.com/yt-dlp/yt-dlp/issues/13654
                fmt_query = {**query, 'fmt': sub_ext, 'xosf': []}
                sub_url = urljoin('https://www.youtube.com', update_url_query(base_url, fmt_query))
                entries.append({
                    'ext': sub_ext,
                    'url': sub_url,
                    'name': sub_name,
                    'impersonate': True,
                    STREAMING_DATA_CLIENT_NAME: client_name,
                })

        subtitles = {}
        skipped_subs_clients = set()

        # Only web/mweb clients provide translationLanguages, so include initial_pr in the traversal
        translation_languages = {
            lang['languageCode']: self._get_text(lang['languageName'], max_runs=1)
            for lang in traverse_obj(player_responses, (
                ..., 'captions', 'playerCaptionsTracklistRenderer', 'translationLanguages',
                lambda _, v: v['languageCode'] and v['languageName']))
        }
        # NB: Constructing the full subtitle dictionary is slow
        get_translated_subs = 'translated_subs' not in self._configuration_arg('skip') and (
            self.get_param('writeautomaticsub', False) or self.get_param('listsubtitles'))

        # Filter out initial_pr which does not have streamingData (smuggled client context)
        prs = traverse_obj(player_responses, (
            lambda _, v: v['streamingData'] and v['captions']['playerCaptionsTracklistRenderer']))
        all_captions = traverse_obj(prs, (
            ..., 'captions', 'playerCaptionsTracklistRenderer', 'captionTracks', ..., {dict}))
        need_subs_langs = {get_lang_code(sub) for sub in all_captions if sub.get('kind') != 'asr'}
        need_caps_langs = {
            remove_start(get_lang_code(sub), 'a-')
            for sub in all_captions if sub.get('kind') == 'asr'}

        for pr in prs:
            pctr = pr['captions']['playerCaptionsTracklistRenderer']
            client_name = pr['streamingData'][STREAMING_DATA_CLIENT_NAME]
            innertube_client_name = pr['streamingData'][STREAMING_DATA_INNERTUBE_CONTEXT]['client']['clientName']
            pot_policy: GvsPoTokenPolicy = self._get_default_ytcfg(client_name)['SUBS_PO_TOKEN_POLICY']
            fetch_subs_po_token_func = pr['streamingData'][STREAMING_DATA_FETCH_SUBS_PO_TOKEN]

            pot_params = {}
            already_fetched_pot = False

            for caption_track in traverse_obj(pctr, ('captionTracks', lambda _, v: v['baseUrl'])):
                base_url = caption_track['baseUrl']
                qs = parse_qs(base_url)
                lang_code = get_lang_code(caption_track)
                requires_pot = (
                    # We can detect the experiment for now
                    any(e in traverse_obj(qs, ('exp', ...)) for e in ('xpe', 'xpv'))
                    or (pot_policy.required and not (pot_policy.not_required_for_premium and is_premium_subscriber)))

                if not already_fetched_pot:
                    already_fetched_pot = True
                    if subs_po_token := fetch_subs_po_token_func(required=requires_pot or pot_policy.recommended):
                        pot_params.update({
                            'pot': subs_po_token,
                            'potc': '1',
                            'c': innertube_client_name,
                        })

                if not pot_params and requires_pot:
                    skipped_subs_clients.add(client_name)
                    self._report_pot_subtitles_skipped(video_id, client_name)
                    break

                orig_lang = qs.get('lang', [None])[-1]
                lang_name = self._get_text(caption_track, 'name', max_runs=1)
                if caption_track.get('kind') != 'asr':
                    if not lang_code:
                        continue
                    process_language(
                        subtitles, base_url, lang_code, lang_name, client_name, pot_params)
                    if not caption_track.get('isTranslatable'):
                        continue
                for trans_code, trans_name in translation_languages.items():
                    if not trans_code:
                        continue
                    orig_trans_code = trans_code
                    if caption_track.get('kind') != 'asr' and trans_code != 'und':
                        if not get_translated_subs:
                            continue
                        trans_code += f'-{lang_code}'
                        trans_name += format_field(lang_name, None, ' from %s')
                    if lang_code == f'a-{orig_trans_code}':
                        # Set audio language based on original subtitles
                        for f in formats:
                            if f.get('acodec') != 'none' and not f.get('language'):
                                f['language'] = orig_trans_code
                        # Add an "-orig" label to the original language so that it can be distinguished.
                        # The subs are returned without "-orig" as well for compatibility
                        process_language(
                            automatic_captions, base_url, f'{trans_code}-orig',
                            f'{trans_name} (Original)', client_name, pot_params)
                    # Setting tlang=lang returns damaged subtitles.
                    process_language(
                        automatic_captions, base_url, trans_code, trans_name, client_name,
                        pot_params if orig_lang == orig_trans_code else {'tlang': trans_code, **pot_params})

            # Avoid duplication if we've already got everything we need
            need_subs_langs.difference_update(subtitles)
            need_caps_langs.difference_update(automatic_captions)
            if not (need_subs_langs or need_caps_langs):
                break

        if skipped_subs_clients and (need_subs_langs or need_caps_langs):
            self._report_pot_subtitles_skipped(video_id, True, msg=join_nonempty(
                f'{video_id}: There are missing subtitles languages because a PO token was not provided.',
                need_subs_langs and f'Subtitles for these languages are missing: {", ".join(need_subs_langs)}.',
                need_caps_langs and f'Automatic captions for {len(need_caps_langs)} languages are missing.',
                delim=' '))

        info['automatic_captions'] = automatic_captions
        info['subtitles'] = subtitles

        parsed_url = urllib.parse.urlparse(url)
        for component in [parsed_url.fragment, parsed_url.query]:
            query = urllib.parse.parse_qs(component)
            for k, v in query.items():
                for d_k, s_ks in [('start', ('start', 't')), ('end', ('end',))]:
                    d_k += '_time'
                    if d_k not in info and k in s_ks:
                        info[d_k] = parse_duration(v[0])

        # Youtube Music Auto-generated description
        if (video_description or '').strip().endswith('\nAuto-generated by YouTube.'):
            # XXX: Causes catastrophic backtracking if description has "·"
            # E.g. https://www.youtube.com/watch?v=DoPaAxMQoiI
            # Simulating atomic groups:  (?P<a>[^xy]+)x  =>  (?=(?P<a>[^xy]+))(?P=a)x
            # reduces it, but does not fully fix it. https://regex101.com/r/8Ssf2h/2
            mobj = re.search(
                r'''(?xs)
                    (?=(?P<track>[^\n·]+))(?P=track)·
                    (?=(?P<artist>[^\n]+))(?P=artist)\n+
                    (?=(?P<album>[^\n]+))(?P=album)\n
                    (?:.+?℗\s*(?P<release_year>\d{4})(?!\d))?
                    (?:.+?Released\ on\s*:\s*(?P<release_date>\d{4}-\d{2}-\d{2}))?
                    (.+?\nArtist\s*:\s*
                        (?=(?P<clean_artist>[^\n]+))(?P=clean_artist)\n
                    )?.+\nAuto-generated\ by\ YouTube\.\s*$
                ''', video_description)
            if mobj:
                release_year = mobj.group('release_year')
                release_date = mobj.group('release_date')
                if release_date:
                    release_date = release_date.replace('-', '')
                    if not release_year:
                        release_year = release_date[:4]
                info.update({
                    'album': mobj.group('album'.strip()),
                    'artists': ([a] if (a := mobj.group('clean_artist'))
                                else [a.strip() for a in mobj.group('artist').split('·')]),
                    'track': mobj.group('track').strip(),
                    'release_date': release_date,
                    'release_year': int_or_none(release_year),
                })

        COMMENTS_SECTION_IDS = ('comment-item-section', 'engagement-panel-comments-section')
        info['comment_count'] = traverse_obj(initial_data, (
            'contents', 'twoColumnWatchNextResults', 'results', 'results', 'contents', ..., 'itemSectionRenderer',
            'contents', ..., 'commentsEntryPointHeaderRenderer', 'commentCount',
        ), (
            'engagementPanels', lambda _, v: v['engagementPanelSectionListRenderer']['panelIdentifier'] in COMMENTS_SECTION_IDS,
            'engagementPanelSectionListRenderer', 'header', 'engagementPanelTitleHeaderRenderer', 'contextualInfo',
        ), expected_type=self._get_count, get_all=False)

        try:  # This will error if there is no livechat
            initial_data['contents']['twoColumnWatchNextResults']['conversationBar']['liveChatRenderer']['continuations'][0]['reloadContinuationData']['continuation']
        except (KeyError, IndexError, TypeError):
            pass
        else:
            info.setdefault('subtitles', {})['live_chat'] = [{
                # url is needed to set cookies
                'url': f'https://www.youtube.com/watch?v={video_id}&bpctr=9999999999&has_verified=1',
                'video_id': video_id,
                'ext': 'json',
                'protocol': ('youtube_live_chat' if live_status in ('is_live', 'is_upcoming')
                             else 'youtube_live_chat_replay'),
            }]

        if initial_data:
            info['chapters'] = (
                self._extract_chapters_from_json(initial_data, duration)
                or self._extract_chapters_from_engagement_panel(initial_data, duration)
                or self._extract_chapters_from_description(video_description, duration)
                or None)

            info['heatmap'] = self._extract_heatmap(initial_data)

        contents = traverse_obj(
            initial_data, ('contents', 'twoColumnWatchNextResults', 'results', 'results', 'contents'),
            expected_type=list, default=[])

        vpir = get_first(contents, 'videoPrimaryInfoRenderer')
        if vpir:
            stl = vpir.get('superTitleLink')
            if stl:
                stl = self._get_text(stl)
                if try_get(
                        vpir,
                        lambda x: x['superTitleIcon']['iconType']) == 'LOCATION_PIN':
                    info['location'] = stl
                else:
                    mobj = re.search(r'(.+?)\s*S(\d+)\s*•?\s*E(\d+)', stl)
                    if mobj:
                        info.update({
                            'series': mobj.group(1),
                            'season_number': int(mobj.group(2)),
                            'episode_number': int(mobj.group(3)),
                        })
            for tlb in (try_get(
                    vpir,
                    lambda x: x['videoActions']['menuRenderer']['topLevelButtons'],
                    list) or []):
                tbrs = variadic(
                    traverse_obj(
                        tlb, ('toggleButtonRenderer', ...),
                        ('segmentedLikeDislikeButtonRenderer', ..., 'toggleButtonRenderer')))
                for tbr in tbrs:
                    for getter, regex in [(
                            lambda x: x['defaultText']['accessibility']['accessibilityData'],
                            r'(?P<count>[\d,]+)\s*(?P<type>(?:dis)?like)'), ([
                                lambda x: x['accessibility'],
                                lambda x: x['accessibilityData']['accessibilityData'],
                            ], r'(?P<type>(?:dis)?like) this video along with (?P<count>[\d,]+) other people')]:
                        label = (try_get(tbr, getter, dict) or {}).get('label')
                        if label:
                            mobj = re.match(regex, label)
                            if mobj:
                                info[mobj.group('type') + '_count'] = str_to_int(mobj.group('count'))
                                break

            info['like_count'] = traverse_obj(vpir, (
                'videoActions', 'menuRenderer', 'topLevelButtons', ...,
                'segmentedLikeDislikeButtonViewModel', 'likeButtonViewModel', 'likeButtonViewModel',
                'toggleButtonViewModel', 'toggleButtonViewModel', 'defaultButtonViewModel',
                'buttonViewModel', 'accessibilityText', {parse_count}), get_all=False)

            vcr = traverse_obj(vpir, ('viewCount', 'videoViewCountRenderer'))
            if vcr:
                vc = self._get_count(vcr, 'viewCount')
                # Upcoming premieres with waiting count are treated as live here
                if vcr.get('isLive'):
                    info['concurrent_view_count'] = vc
                elif info.get('view_count') is None:
                    info['view_count'] = vc

        vsir = get_first(contents, 'videoSecondaryInfoRenderer')
        if vsir:
            vor = traverse_obj(vsir, ('owner', 'videoOwnerRenderer'))
            info.update({
                'channel': self._get_text(vor, 'title'),
                'channel_follower_count': self._get_count(vor, 'subscriberCountText')})

            if not channel_handle:
                channel_handle = self.handle_from_url(
                    traverse_obj(vor, (
                        ('navigationEndpoint', ('title', 'runs', ..., 'navigationEndpoint')),
                        (('commandMetadata', 'webCommandMetadata', 'url'), ('browseEndpoint', 'canonicalBaseUrl')),
                        {str}), get_all=False))

            rows = try_get(
                vsir,
                lambda x: x['metadataRowContainer']['metadataRowContainerRenderer']['rows'],
                list) or []
            multiple_songs = False
            for row in rows:
                if try_get(row, lambda x: x['metadataRowRenderer']['hasDividerLine']) is True:
                    multiple_songs = True
                    break
            for row in rows:
                mrr = row.get('metadataRowRenderer') or {}
                mrr_title = mrr.get('title')
                if not mrr_title:
                    continue
                mrr_title = self._get_text(mrr, 'title')
                mrr_contents_text = self._get_text(mrr, ('contents', 0))
                if mrr_title == 'License':
                    info['license'] = mrr_contents_text
                elif not multiple_songs:
                    if mrr_title == 'Album':
                        info['album'] = mrr_contents_text
                    elif mrr_title == 'Artist':
                        info['artists'] = [mrr_contents_text] if mrr_contents_text else None
                    elif mrr_title == 'Song':
                        info['track'] = mrr_contents_text
            owner_badges = self._extract_badges(traverse_obj(vsir, ('owner', 'videoOwnerRenderer', 'badges')))
            if self._has_badge(owner_badges, BadgeType.VERIFIED):
                info['channel_is_verified'] = True

        info.update({
            'uploader': info.get('channel'),
            'uploader_id': channel_handle,
            'uploader_url': format_field(channel_handle, None, 'https://www.youtube.com/%s', default=None),
        })

        # We only want timestamp IF it has time precision AND a timezone
        # Currently the uploadDate in microformats appears to be in US/Pacific timezone.
        timestamp = (
            parse_iso8601(get_first(microformats, 'uploadDate'), timezone=NO_DEFAULT)
            or parse_iso8601(search_meta('uploadDate'), timezone=NO_DEFAULT)
        )
        upload_date = (
            dt.datetime.fromtimestamp(timestamp, dt.timezone.utc).strftime('%Y%m%d') if timestamp else
            (
                unified_strdate(get_first(microformats, 'uploadDate'))
                or unified_strdate(search_meta('uploadDate'))
            ))

        # In the case we cannot get the timestamp:
        # The upload date for scheduled, live and past live streams / premieres in microformats
        # may be different from the stream date. Although not in UTC, we will prefer it in this case.
        # See: https://github.com/yt-dlp/yt-dlp/pull/2223#issuecomment-1008485139
        if not upload_date or (not timestamp and live_status in ('not_live', None)):
            # this should be in UTC, as configured in the cookie/client context
            upload_date = strftime_or_none(
                self._parse_time_text(self._get_text(vpir, 'dateText'))) or upload_date

        info['upload_date'] = upload_date
        info['timestamp'] = timestamp

        if upload_date and live_status not in ('is_live', 'post_live', 'is_upcoming'):
            # Newly uploaded videos' HLS formats are potentially problematic and need to be checked
            upload_datetime = datetime_from_str(upload_date).replace(tzinfo=dt.timezone.utc)
            if upload_datetime >= datetime_from_str('today-2days'):
                for fmt in info['formats']:
                    if fmt.get('protocol') == 'm3u8_native':
                        fmt['__needs_testing'] = True

        for s_k, d_k in [('artists', 'creators'), ('track', 'alt_title')]:
            v = info.get(s_k)
            if v:
                info[d_k] = v

        badges = self._extract_badges(traverse_obj(vpir, 'badges'))

        is_private = (self._has_badge(badges, BadgeType.AVAILABILITY_PRIVATE)
                      or get_first(video_details, 'isPrivate', expected_type=bool))

        info['availability'] = (
            'public' if self._has_badge(badges, BadgeType.AVAILABILITY_PUBLIC)
            else self._availability(
                is_private=is_private,
                needs_premium=(
                    self._has_badge(badges, BadgeType.AVAILABILITY_PREMIUM)
                    or False if initial_data and is_private is not None else None),
                needs_subscription=(
                    self._has_badge(badges, BadgeType.AVAILABILITY_SUBSCRIPTION)
                    or False if initial_data and is_private is not None else None),
                needs_auth=info['age_limit'] >= 18,
                is_unlisted=None if is_private is None else (
                    self._has_badge(badges, BadgeType.AVAILABILITY_UNLISTED)
                    or get_first(microformats, 'isUnlisted', expected_type=bool))))

        info['__post_extractor'] = self.extract_comments(webpage_ytcfg, video_id, contents, webpage)

        self.mark_watched(video_id, player_responses)

        return info
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 18:46:28 +12:00
+								import base64
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								import binascii
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-15 05:23:32 +05:30
+								import collections
-												[cleanup] Standardize `import datetime as dt` (#8978)

											
										
										
											2024-02-25 05:46:34 +05:30
+								import datetime as dt
-												[cleanup] Misc (#10075)

Closes #10303
Authored by: bashonly, seproDev, jucor, c-basalt

Co-authored-by: sepro <4618135+seproDev@users.noreply.github.com>
Co-authored-by: Julien Cornebise <julien@cornebise.com>
Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-07-01 17:51:27 -05:00
+								import functools
-												[youtube] Improve source code quality

											
										
										
											2013-09-22 10:37:23 +02:00
+								import itertools
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								import json
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-17 01:26:23 +05:30
+								import math
-												[youtube] Add filesystem signature cache

											
										
										
											2013-09-22 00:35:03 +02:00
+								import os.path
-												Add --mark-watched feature (Closes #5054)

											
										
										
											2016-03-01 01:01:33 +06:00
+								import random
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								import re
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								import sys
-												[cleanup] Sort imports

Using https://github.com/PyCQA/isort

    isort -m VERTICAL_HANGING_INDENT --py 36 -l 80 --rr -n --tc .

											
										
										
											2022-04-12 04:02:57 +05:30
+								import threading
-												[linter] youtube.py

											
										
										
											2021-02-04 20:27:26 +05:30
+								import time
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 14:19:30 +02:00
+								import traceback
-												[compat] Remove more functions

Removing any more will require changes to a large number of extractors

											
										
										
											2022-06-24 13:40:17 +05:30
+								import urllib.parse
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
-												[ie/youtube] Split into package (#12557)

Authored by: coletdjnz
											
										
										
											2025-03-13 17:37:33 +13:00
+								from ._base import (
 								    INNERTUBE_CLIENTS,
 								    BadgeType,
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								    GvsPoTokenPolicy,
 								    PlayerPoTokenPolicy,
 								    StreamingProtocol,
-												[ie/youtube] Split into package (#12557)

Authored by: coletdjnz
											
										
										
											2025-03-13 17:37:33 +13:00
+								    YoutubeBaseInfoExtractor,
 								    _PoTokenContext,
 								    _split_innertube_client,
 								    short_client_name,
 								)
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								from .pot._director import initialize_pot_director
 								from .pot.provider import PoTokenContext, PoTokenRequest
-												[ie/youtube] Split into package (#12557)

Authored by: coletdjnz
											
										
										
											2025-03-13 17:37:33 +13:00
+								from ..openload import PhantomJSwrapper
-												[ie/youtube] Extract global nsig helper functions (#13639)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>

											
										
										
											2025-07-05 17:03:25 -05:00
+								from ...jsinterp import JSInterpreter, LocalNameSpace
-												[ie/youtube] Split into package (#12557)

Authored by: coletdjnz
											
										
										
											2025-03-13 17:37:33 +13:00
+								from ...networking.exceptions import HTTPError
 								from ...utils import (
-												[cleanup] Sort imports

Using https://github.com/PyCQA/isort

    isort -m VERTICAL_HANGING_INDENT --py 36 -l 80 --rr -n --tc .

											
										
										
											2022-04-12 04:02:57 +05:30
+								    NO_DEFAULT,
 								    ExtractorError,
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								    LazyList,
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-17 01:26:23 +05:30
+								    bug_reports_message,
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								    clean_html,
-												[youtube] Extract comments' approximate timestamp (#221)

Authored by: colethedj
											
										
										
											2021-04-07 11:37:43 +00:00
+								    datetime_from_str,
-												[ie/youtube] Calculate more accurate `filesize`

YouTube provides slightly different duration for each format.
Calculating file-size based on this duration instead of the
video duration gives more accurate results.

Ref: https://github.com/yt-dlp/yt-dlp/issues/1400#issuecomment-2007441207

											
										
										
											2024-04-01 02:20:03 +05:30
+								    filesize_from_tbr,
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								    filter_dict,
-												[youtube] Extract average rating (closes #2362)

											
										
										
											2015-02-11 18:39:31 +01:00
+								    float_or_none,
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								    format_field,
-												[utils] Add `get_first`

											
										
										
											2022-03-09 02:24:41 +05:30
+								    get_first,
-												[youtube] Download DASH manifest

If given, download and parse the DASH manifest file, in order to get ultra-HQ formats.
Fixes #2166

											
										
										
											2014-01-19 05:47:20 +01:00
+								    int_or_none,
-												[utils] Add `join_nonempty`

											
										
										
											2021-11-06 06:35:24 +05:30
+								    join_nonempty,
-												[youtube] Fix n-sig for player e06dea74

											
										
										
											2022-02-01 08:10:19 +05:30
+								    js_to_json,
-												[youtube] Prefer info from YouTube than _formats (#8293)

											
										
										
											2016-01-25 01:02:19 +08:00
+								    mimetype2ext,
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								    orderedSet,
-												[youtube] Fix parsing codecs (closes #12091)

											
										
										
											2017-02-12 18:09:53 +07:00
+								    parse_codecs,
-												[youtube:comments] Improve comment vote count parsing (fixes #506) (#508)

Authored by: colethedj
											
										
										
											2021-07-15 11:24:42 +12:00
+								    parse_count,
-												[youtube] Extract start_time

From the 't=*' in the url.
Currently youtube-dl doesn't use the value, but it was requested for the mpv plugin.

											
										
										
											2015-07-20 21:10:28 +02:00
+								    parse_duration,
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 20:45:45 +05:30
+								    parse_iso8601,
-												[utils] Add `parse_qs`

											
										
										
											2021-08-23 00:32:00 +05:30
+								    parse_qs,
-												[formatsort] Remove forced priority of `quality`

When making `FormatSort`, I misinterpreted the purpose of `quality`

											
										
										
											2021-02-18 23:42:56 +05:30
+								    qualities,
-												[ie/youtube] Remove broken OAuth support (#11558)

Closes #11462
Authored by: bashonly
											
										
										
											2024-11-16 23:40:21 +00:00
+								    remove_end,
-												[youtube] Fix TFA (#12927)

											
										
										
											2017-05-07 04:19:11 +07:00
+								    remove_start,
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 21:30:34 +06:00
+								    smuggle_url,
-												[youtube] Add fallback metadata extraction from videoDetails (closes #18052)

											
										
										
											2018-11-03 06:26:16 +07:00
+								    str_or_none,
-												[youtube] Fix likes/dislike extraction

											
										
										
											2015-06-29 00:48:06 +06:00
+								    str_to_int,
-												[youtube:tab] Extract more metadata from feeds/channels/playlists (#1018)

Parse relative time text, extract live, upcoming status, availability and channel id from feeds/channels/playlists (where applicable). 
Closes #1883
Authored-by: coletdjnz

											
										
										
											2021-12-20 17:47:53 +13:00
+								    strftime_or_none,
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								    traverse_obj,
-												[ie/youtube] Calculate more accurate `filesize`

YouTube provides slightly different duration for each format.
Calculating file-size based on this duration instead of the
video duration gives more accurate results.

Ref: https://github.com/yt-dlp/yt-dlp/issues/1400#issuecomment-2007441207

											
										
										
											2024-04-01 02:20:03 +05:30
+								    try_call,
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 21:43:14 +07:00
+								    try_get,
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								    unescapeHTML,
 								    unified_strdate,
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 21:30:34 +06:00
+								    unsmuggle_url,
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-20 00:52:59 +05:30
+								    update_url_query,
-												[youtube] Fix mark watched (closes #18546)

											
										
										
											2018-12-16 19:35:48 +07:00
+								    url_or_none,
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-19 16:55:07 +12:00
+								    urljoin,
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								    variadic,
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								)
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								from ...utils.networking import clean_headers, clean_proxies, select_proxy
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
-												[extractor/youtube] Add client name to `format_note` when `-v` (#6254)

Authored by: Lesmiscore, pukkandan
											
										
										
											2023-03-12 02:03:23 +09:00
+								STREAMING_DATA_CLIENT_NAME = '__yt_dlp_client'
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								STREAMING_DATA_FETCH_SUBS_PO_TOKEN = '__yt_dlp_fetch_subs_po_token'
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								STREAMING_DATA_FETCH_GVS_PO_TOKEN = '__yt_dlp_fetch_gvs_po_token'
 								STREAMING_DATA_PLAYER_TOKEN_PROVIDED = '__yt_dlp_player_token_provided'
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								STREAMING_DATA_INNERTUBE_CONTEXT = '__yt_dlp_innertube_context'
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								STREAMING_DATA_IS_PREMIUM_SUBSCRIBER = '__yt_dlp_is_premium_subscriber'
-												[ie/youtube] Optimize playback wait times (#14124)

Authored by: bashonly
											
										
										
											2025-08-22 18:53:28 -05:00
+								STREAMING_DATA_FETCHED_TIMESTAMP = '__yt_dlp_fetched_timestamp'
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								PO_TOKEN_GUIDE_URL = 'https://github.com/yt-dlp/yt-dlp/wiki/PO-Token-Guide'
-												[youtube] Convert to new subtitles system

The automatic captions are stored in the 'automatic_captions' field, which is used if no normal subtitles are found for a specific language.

											
										
										
											2015-02-16 21:44:17 +01:00
+								class YoutubeIE(YoutubeBaseInfoExtractor):
-												[cleanup] Add keyword automatically to SearchIE descriptions
and some minor cleanup of docs

											
										
										
											2021-10-23 19:59:52 +05:30
+								    IE_DESC = 'YouTube'
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								    _VALID_URL = r'''(?x)^
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								                     (
-												[youtube] Don't make the url protocol optional

The generic extractor will add it.

											
										
										
											2014-09-11 21:47:25 +02:00
+								                         (?:https?://|//)                                    # http(s):// or protocol-independent URL
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-20 02:14:36 +05:30
+								                         (?:(?:(?:(?:\w+\.)?[yY][oO][uU][tT][uU][bB][eE](?:-nocookie|kids)?\.com|
 								                            (?:www\.)?deturl\.com/www\.youtube\.com|
 								                            (?:www\.)?pwnyoutube\.com|
 								                            (?:www\.)?hooktube\.com|
 								                            (?:www\.)?yourepeat\.com|
 								                            tube\.majestyc\.net|
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                            {invidious}|
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-20 02:14:36 +05:30
+								                            youtube\.googleapis\.com)/                        # the various hostnames, with wildcard subdomains
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								                         (?:.*?\#/)?                                          # handle anchor (#/) redirect urls
 								                         (?:                                                  # the various things that can precede the ID:
-												[extractor/youtube] Support `/live/` URL

											
										
										
											2023-02-03 23:47:13 +05:30
+								                             (?:(?:v|embed|e|shorts|live)/(?!videoseries|live_stream))  # v/ or embed/ or e/ or shorts/
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								                             |(?:                                             # or the v= param in all its forms
-												[youtube] Add support for yourepeat.com URLs (Closes #2397)
											
										
										
											2014-02-19 02:00:54 +07:00
+								                                 (?:(?:watch|movie)(?:_popup)?(?:\.php)?/?)?  # preceding watch(_popup|.php) or nothing (like /?v=xxxx)
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								                                 (?:\?|\#!?)                                  # the params delimiter ? or # or #!
-												[youtube] Extend _VALID_URL (Closes #7694)

											
										
										
											2015-11-29 21:01:59 +06:00
+								                                 (?:.*?[&;])??                                # any other preceding param (like /?s=tuff&v=xxxx or ?s=tuff&amp;v=V36LpHqtcDY)
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								                                 v=
 								                             )
-												[youtube] Urls like youtube.com/NASA are now interpreted as users (fixes #1069)

Video urls like http://youtube.com/BaW_jenozKc are not valid, but http://youtu.be/BaW_jenozKc is correct.

											
										
										
											2013-09-05 22:38:23 +02:00
+								                         ))
-												[youtube] Expand _VALID_URL to support vid.plus

											
										
										
											2015-08-17 02:04:13 +06:00
+								                         |(?:
 								                            youtu\.be|                                        # just youtu.be/xxxx
-												[youtube] Add support for zwearz (Closes #9062)

											
										
										
											2016-04-04 02:26:20 +06:00
+								                            vid\.plus|                                        # or vid.plus/xxxx
 								                            zwearz\.com/watch|                                # or zwearz.com/watch/xxxx
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                            {invidious}
-												[youtube] Expand _VALID_URL to support vid.plus

											
										
										
											2015-08-17 02:04:13 +06:00
+								                         )/
-												[youtube] Don't make the url protocol optional

The generic extractor will add it.

											
										
										
											2014-09-11 21:47:25 +02:00
+								                         |(?:www\.)?cleanvideosearch\.com/media/action/yt/watch\?videoId=
-												[youtube] Urls like youtube.com/NASA are now interpreted as users (fixes #1069)

Video urls like http://youtube.com/BaW_jenozKc are not valid, but http://youtu.be/BaW_jenozKc is correct.

											
										
										
											2013-09-05 22:38:23 +02:00
+								                         )
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								                     )?                                                       # all until now is optional -> you can pass the naked ID
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                     (?P<id>[0-9A-Za-z_-]{{11}})                              # here is it! the YouTube video ID
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								                     (?(1).+)?                                                # if we found the ID, everything can follow
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                     (?:\#|$)'''.format(
 								        invidious='|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
 								    )
-												[extractor/youtube] Detect `lazy-load-for-videos` embeds

Closes #4812

											
										
										
											2022-09-02 01:28:56 +05:30
+								    _EMBED_REGEX = [
 								        r'''(?x)
 								            (?:
-												[extractor/heise] Fix extractor (#5029)

Fixes https://github.com/yt-dlp/yt-dlp/issues/1520
Authored by: coletdjnz
											
										
										
											2022-09-26 00:58:06 +00:00
+								                <(?:[0-9A-Za-z-]+?)?iframe[^>]+?src=|
-												[extractor/youtube] Detect `lazy-load-for-videos` embeds

Closes #4812

											
										
										
											2022-09-02 01:28:56 +05:30
+								                data-video-url=|
 								                <embed[^>]+?src=|
 								                embedSWF\(?:\s*|
 								                <object[^>]+data=|
 								                new\s+SWFObject\(
 								            )
 								            (["\'])
 								                (?P<url>(?:https?:)?//(?:www\.)?youtube(?:-nocookie)?\.com/
 								                (?:embed|v|p)/[0-9A-Za-z_-]{11}.*?)
 								            \1''',
 								        # https://wordpress.org/plugins/lazy-load-for-videos/
 								        r'''(?xs)
 								            <a\s[^>]*\bhref="(?P<url>https://www\.youtube\.com/watch\?v=[0-9A-Za-z_-]{11})"
 								            \s[^>]*\bclass="[^"]*\blazy-load-youtube''',
 								    ]
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-16 06:27:43 +05:30
+								    _RETURN_TYPE = 'video'  # XXX: How to handle multifeed?
-												[extractor/youtube] Detect `lazy-load-for-videos` embeds

Closes #4812

											
										
										
											2022-09-02 01:28:56 +05:30
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-02 07:18:08 +07:00
+								    _PLAYER_INFO_RE = (
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 21:58:10 +01:00
+								        r'/s/player/(?P<id>[a-zA-Z0-9_-]{8,})/(?:tv-)?player',
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-11 02:52:55 +05:30
+								        r'/(?P<id>[a-zA-Z0-9_-]{8,})/player(?:_ias\.vflset(?:/[a-zA-Z]{2,3}_[a-zA-Z]{2,3})?|-plasma-ias-(?:phone|tablet)-[a-z]{2}_[A-Z]{2}\.vflset)/base\.js$',
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        r'\b(?P<id>vfl[a-zA-Z0-9_-]+)\b.*?\.js$',
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-02 07:18:08 +07:00
+								    )
-												[ie/googledrive] Fix formats extraction (#9908)

Closes #8281
Authored by: WyohKnott
											
										
										
											2024-05-13 01:05:47 +02:00
+								    _formats = {  # NB: Used in YoutubeWebArchiveIE and GoogleDriveIE
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 17:35:04 +01:00
+								        '5': {'ext': 'flv', 'width': 400, 'height': 240, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
 								        '6': {'ext': 'flv', 'width': 450, 'height': 270, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
 								        '13': {'ext': '3gp', 'acodec': 'aac', 'vcodec': 'mp4v'},
 								        '17': {'ext': '3gp', 'width': 176, 'height': 144, 'acodec': 'aac', 'abr': 24, 'vcodec': 'mp4v'},
 								        '18': {'ext': 'mp4', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 96, 'vcodec': 'h264'},
 								        '22': {'ext': 'mp4', 'width': 1280, 'height': 720, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 								        '34': {'ext': 'flv', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 								        '35': {'ext': 'flv', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
-												[youtube] Clarify itag 36 height and abr (Closes #8457)

											
										
										
											2016-02-08 01:30:57 +06:00
+								        # itag 36 videos are either 320x180 (BaW_jenozKc) or 320x240 (__2ABJjxzNo), abr varies as well
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 17:35:04 +01:00
+								        '36': {'ext': '3gp', 'width': 320, 'acodec': 'aac', 'vcodec': 'mp4v'},
 								        '37': {'ext': 'mp4', 'width': 1920, 'height': 1080, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 								        '38': {'ext': 'mp4', 'width': 4096, 'height': 3072, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 								        '43': {'ext': 'webm', 'width': 640, 'height': 360, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
 								        '44': {'ext': 'webm', 'width': 854, 'height': 480, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
 								        '45': {'ext': 'webm', 'width': 1280, 'height': 720, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
-												[youtube] added vcodec/acodec/abr for multiple itags

Should make downloading with filters more precise and easier, e.g. bestvideo[vcodec=h264]. By default a lot of codecs are specified as avc1.xxxxxx and are unique for each format, which makes them unusable for bestvideo selection.
											
										
										
											2016-01-03 04:11:19 +01:00
+								        '46': {'ext': 'webm', 'width': 1920, 'height': 1080, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 17:35:04 +01:00
+								        '59': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 								        '78': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
-												[youtube] added vcodec/acodec/abr for multiple itags

Should make downloading with filters more precise and easier, e.g. bestvideo[vcodec=h264]. By default a lot of codecs are specified as avc1.xxxxxx and are unique for each format, which makes them unusable for bestvideo selection.
											
										
										
											2016-01-03 04:11:19 +01:00
 								        # 3D videos
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 17:35:04 +01:00
+								        '82': {'ext': 'mp4', 'height': 360, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
 								        '83': {'ext': 'mp4', 'height': 480, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
 								        '84': {'ext': 'mp4', 'height': 720, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
 								        '85': {'ext': 'mp4', 'height': 1080, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
-												[youtube] added vcodec/acodec/abr for multiple itags

Should make downloading with filters more precise and easier, e.g. bestvideo[vcodec=h264]. By default a lot of codecs are specified as avc1.xxxxxx and are unique for each format, which makes them unusable for bestvideo selection.
											
										
										
											2016-01-03 04:11:19 +01:00
+								        '100': {'ext': 'webm', 'height': 360, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8', 'preference': -20},
 								        '101': {'ext': 'webm', 'height': 480, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
 								        '102': {'ext': 'webm', 'height': 720, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
-												Add YouTube DASH formats to YouTubeIE

											
										
										
											2013-08-19 18:22:25 -07:00
-												AHLS -> Apple HTTP Live Streaming

											
										
										
											2013-09-03 18:49:35 -07:00
+								        # Apple HTTP Live Streaming
-												[youtube] Added itag 91

Seen in https://www.youtube.com/watch?v=jMN4cxyhJjk

											
										
										
											2016-03-17 19:25:37 +08:00
+								        '91': {'ext': 'mp4', 'height': 144, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 17:35:04 +01:00
+								        '92': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 								        '93': {'ext': 'mp4', 'height': 360, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
 								        '94': {'ext': 'mp4', 'height': 480, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
 								        '95': {'ext': 'mp4', 'height': 720, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
 								        '96': {'ext': 'mp4', 'height': 1080, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
-												[youtube] added vcodec/acodec/abr for multiple itags

Should make downloading with filters more precise and easier, e.g. bestvideo[vcodec=h264]. By default a lot of codecs are specified as avc1.xxxxxx and are unique for each format, which makes them unusable for bestvideo selection.
											
										
										
											2016-01-03 04:11:19 +01:00
+								        '132': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 								        '151': {'ext': 'mp4', 'height': 72, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 24, 'vcodec': 'h264', 'preference': -10},
-												[youtube] Simplify format specification

											
										
										
											2013-12-24 12:34:09 +01:00
 								        # DASH mp4 video
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 22:41:48 +07:00
+								        '133': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '134': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '135': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '136': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '137': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264'},
-												Start moving to ytdl-org

											
										
										
											2019-03-09 19:14:41 +07:00
+								        '138': {'ext': 'mp4', 'format_note': 'DASH video', 'vcodec': 'h264'},  # Height can vary (https://github.com/ytdl-org/youtube-dl/issues/4559)
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 22:41:48 +07:00
+								        '160': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '212': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '264': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '298': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
 								        '299': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
 								        '266': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'h264'},
-												Add YouTube DASH formats to YouTubeIE

											
										
										
											2013-08-19 18:22:25 -07:00
-												extractor: youtube: Fix extension of dash formats.

While we are at it, separate the audio formats from the video formats.

Signed-off-by: Rogério Brito <rbrito@ime.usp.br>

											
										
										
											2013-10-18 18:53:00 -03:00
+								        # Dash mp4 audio
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 22:41:48 +07:00
+								        '139': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 48, 'container': 'm4a_dash'},
 								        '140': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 128, 'container': 'm4a_dash'},
 								        '141': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 256, 'container': 'm4a_dash'},
 								        '256': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
 								        '258': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
 								        '325': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'dtse', 'container': 'm4a_dash'},
 								        '328': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'ec-3', 'container': 'm4a_dash'},
-												Add YouTube DASH formats to YouTubeIE

											
										
										
											2013-08-19 18:22:25 -07:00
 								        # Dash webm
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 22:41:48 +07:00
+								        '167': {'ext': 'webm', 'height': 360, 'width': 640, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '168': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '169': {'ext': 'webm', 'height': 720, 'width': 1280, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '170': {'ext': 'webm', 'height': 1080, 'width': 1920, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '218': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '219': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '278': {'ext': 'webm', 'height': 144, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp9'},
 								        '242': {'ext': 'webm', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '243': {'ext': 'webm', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '244': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '245': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '246': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '247': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '248': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '271': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9'},
-												[youtube] Clarify itag 272 possible resolutions (#7699)

											
										
										
											2015-11-30 20:42:05 +06:00
+								        # itag 272 videos are either 3840x2160 (e.g. RtoitU2A-3E) or 7680x4320 (sLprVF6d7Ug)
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 22:41:48 +07:00
+								        '272': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '302': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 								        '303': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 								        '308': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 								        '313': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '315': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
-												[youtube] Simplify format specification

											
										
										
											2013-12-24 12:34:09 +01:00
 								        # Dash webm audio
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 22:41:48 +07:00
+								        '171': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 128},
 								        '172': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 256},
-												[youtube] Add a pseudo format for rtmp videos (#2123)

											
										
										
											2014-01-09 02:38:50 +01:00
-												[youtube] Add webm audio formats (Fixes #4229)

											
										
										
											2014-11-18 11:06:09 +01:00
+								        # Dash webm audio with opus inside
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 22:41:48 +07:00
+								        '249': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 50},
 								        '250': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 70},
 								        '251': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 160},
-												[youtube] Add webm audio formats (Fixes #4229)

											
										
										
											2014-11-18 11:06:09 +01:00
-												[youtube] Add a pseudo format for rtmp videos (#2123)

											
										
										
											2014-01-09 02:38:50 +01:00
+								        # RTMP (unnamed)
 								        '_rtmp': {'protocol': 'rtmp'},
-												[youtube] Hardcode codec metadata for av01 video only formats (closes #21381)

											
										
										
											2019-06-14 01:59:05 +07:00
 								        # av01 video only formats sometimes served with "unknown" codecs
-												[youtube] Add av01 itags to known formats list (#747)

Authored by: blackjack4494
											
										
										
											2021-08-22 21:59:43 +02:00
+								        '394': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
 								        '395': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
 								        '396': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'av01.0.01M.08'},
 								        '397': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'av01.0.04M.08'},
 								        '398': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'av01.0.05M.08'},
 								        '399': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'av01.0.08M.08'},
 								        '400': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
 								        '401': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
+								    }
-												[ie/youtube] Extract srt subtitles (#13411)

Closes #1734
Authored by: gamer191
											
										
										
											2025-06-07 05:32:03 +10:00
+								    _SUBTITLE_FORMATS = ('json3', 'srv1', 'srv2', 'srv3', 'ttml', 'srt', 'vtt')  # subtitle format names; NOTE(review): confirm at the use site whether the order is significant
-												[ie/youtube] Player client maintenance (#14135)

- Prioritize `tv_simply` over `tv` in default logged-out clients
- Revert `tv` client user-agent to work around 403 errors

Authored by: bashonly
											
										
										
											2025-08-23 18:45:29 -05:00
+								    _DEFAULT_CLIENTS = ('tv_simply', 'tv', 'web')  # default player clients when logged out; 'tv_simply' is prioritized over 'tv'
-												[ie/youtube] Replace `ios` with `tv_simply` in default clients (#14123)

Also:
- Add `web_safari` to default logged-in clients
- Add `web_creator` to default premium clients
- Flag `ios` HLS formats as requiring PO token

Closes #13702
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-08-22 18:49:54 -05:00
+								    _DEFAULT_AUTHED_CLIENTS = ('tv', 'web_safari', 'web')  # default player clients when logged in
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								    # Premium does not require POT (except for subtitles)
-												[ie/youtube] Replace `ios` with `tv_simply` in default clients (#14123)

Also:
- Add `web_safari` to default logged-in clients
- Add `web_creator` to default premium clients
- Flag `ios` HLS formats as requiring PO token

Closes #13702
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-08-22 18:49:54 -05:00
+								    _DEFAULT_PREMIUM_CLIENTS = ('tv', 'web_creator', 'web')  # default player clients for premium accounts
-												Add YouTube DASH formats to YouTubeIE

											
										
										
											2013-08-19 18:22:25 -07:00
-												[youtube] Raise GeoRestrictedError

											
										
										
											2017-02-26 16:51:21 +07:00
+								    _GEO_BYPASS = False  # NOTE(review): presumably turns off the generic geo-bypass so geo-restriction errors surface; confirm against the base extractor
-												[youtube] Modernize

											
										
										
											2014-09-13 07:51:06 +02:00
+								    IE_NAME = 'youtube'  # extractor name; NOTE(review): presumably the user-visible identifier, confirm against the base class
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								    _TESTS = [{
 								        'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&t=1s&end=9',
 								        'info_dict': {
 								            'id': 'BaW_jenozKc',
 								            'ext': 'mp4',
 								            'title': 'youtube-dl test video "\'/\\ä↭𝕐',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Science & Technology'],
 								            'channel': 'Philipp Hagemeister',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
 								            'channel_url': 'https://www.youtube.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
 								            'comment_count': int,
 								            'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
 								            'duration': 10,
 								            'end_time': 9,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'playable_in_embed': True,
 								            'start_time': 1,
 								            'tags': 'count:1',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1349198244,
 								            'upload_date': '20121002',
 								            'uploader': 'Philipp Hagemeister',
 								            'uploader_id': '@PhilippHagemeister',
 								            'uploader_url': 'https://www.youtube.com/@PhilippHagemeister',
 								            'view_count': int,
-												[youtube] Fix tests in 2.x

											
										
										
											2013-06-27 19:55:39 +02:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'Video unavailable',
 								    }, {
 								        'note': 'Embed-only video (#1746)',
 								        'url': '//www.YouTube.com/watch?v=yZIXLfi8CZQ',
 								        'info_dict': {
 								            'id': 'yZIXLfi8CZQ',
 								            'ext': 'mp4',
 								            'title': 'Principal Sexually Assaults A Teacher - Episode 117 - 8th June 2012',
 								            'age_limit': 18,
 								            'description': 'md5:09b78bd971f1e3e289601dfba15ca4f7',
 								            'upload_date': '20120608',
-												Suppor embed-only videos (Fixes #1746)

											
										
										
											2013-11-18 13:05:18 +01:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'Private video',
 								    }, {
 								        'note': 'Use the first video ID in the URL',
 								        'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&v=yZIXLfi8CZQ',
 								        'info_dict': {
 								            'id': 'BaW_jenozKc',
 								            'ext': 'mp4',
 								            'title': 'youtube-dl test video "\'/\\ä↭𝕐',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Science & Technology'],
 								            'channel': 'Philipp Hagemeister',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
 								            'channel_url': 'https://www.youtube.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
 								            'comment_count': int,
 								            'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
 								            'duration': 10,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'playable_in_embed': True,
 								            'tags': 'count:1',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1349198244,
 								            'upload_date': '20121002',
 								            'uploader': 'Philipp Hagemeister',
 								            'uploader_id': '@PhilippHagemeister',
 								            'uploader_url': 'https://www.youtube.com/@PhilippHagemeister',
 								            'view_count': int,
-												[youtube] Use the first v= argument in the URL

This is according to how youtube handles multiple v= values in one URL.
Before this, it was possible to make a single URL show up differently
 on youtube itself, and if you downloaded/viewed it with youtube-dl/mpv

											
										
										
											2015-08-10 20:52:38 +02:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'Video unavailable',
 								    }, {
 								        'note': '256k DASH audio (format 141) via DASH manifest',
 								        'url': 'https://www.youtube.com/watch?v=a9LDPn-MO4I',
 								        'info_dict': {
 								            'id': 'a9LDPn-MO4I',
 								            'ext': 'm4a',
 								            'title': 'UHDTV TEST 8K VIDEO.mp4',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Science & Technology'],
 								            'channel': '8KVIDEO',
 								            'channel_follower_count': int,
 								            'channel_id': 'UC8cn-cnCZ2FnxmjfkoLGpsQ',
 								            'channel_url': 'https://www.youtube.com/channel/UC8cn-cnCZ2FnxmjfkoLGpsQ',
 								            'comment_count': int,
 								            'description': '',
 								            'duration': 60,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:8',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1349185252,
 								            'upload_date': '20121002',
 								            'uploader': '8KVIDEO',
 								            'uploader_id': '@8KVIDEO',
 								            'uploader_url': 'https://www.youtube.com/@8KVIDEO',
 								            'view_count': int,
-												[youtube] Download DASH manifest

If given, download and parse the DASH manifest file, in order to get ultra-HQ formats.
Fixes #2166

											
										
										
											2014-01-19 05:47:20 +01:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'format': '141',
 								            'skip_download': True,
 								            'youtube_include_dash_manifest': True,
 								        },
 								        'skip': 'format 141 not served anymore',
 								    }, {
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-20 00:52:59 +05:30
+								        # DASH manifest with encrypted signature
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'url': 'https://www.youtube.com/watch?v=IB3lcPjvWLA',
 								        'info_dict': {
 								            'id': 'IB3lcPjvWLA',
 								            'ext': 'm4a',
 								            'title': 'Afrojack, Spree Wilson - The Spark (Official Music Video) ft. Spree Wilson',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Music'],
 								            'channel': 'Afrojack',
 								            'channel_follower_count': int,
 								            'channel_id': 'UChuZAo1RKL85gev3Eal9_zg',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UChuZAo1RKL85gev3Eal9_zg',
 								            'comment_count': int,
 								            'description': 'md5:8f5e2b82460520b619ccac1f509d43bf',
 								            'duration': 244,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:19',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1381496404,
 								            'upload_date': '20131011',
 								            'uploader': 'Afrojack',
 								            'uploader_id': '@AfrojackVEVO',
 								            'uploader_url': 'https://www.youtube.com/@AfrojackVEVO',
 								            'view_count': int,
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-20 00:52:59 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'format': '141/bestaudio[ext=m4a]',
 								            'skip_download': True,
 								            'youtube_include_dash_manifest': True,
-												[youtube] Add a normal age-gate test video

											
										
										
											2014-11-30 21:45:49 +01:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								    }, {
 								        # Age-gated video
 								        # https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
 								        'note': 'Embed allowed age-gated video; works with web_embedded',
 								        'url': 'https://youtube.com/watch?v=HtVdAasjOgU',
 								        'info_dict': {
 								            'id': 'HtVdAasjOgU',
 								            'ext': 'mp4',
 								            'title': 'The Witcher 3: Wild Hunt - The Sword Of Destiny Trailer',
 								            'age_limit': 18,
 								            'availability': 'needs_auth',
 								            'categories': ['Gaming'],
 								            'channel': 'The Witcher',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCzybXLxv08IApdjdN0mJhEg',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCzybXLxv08IApdjdN0mJhEg',
 								            'comment_count': int,
 								            'description': 'md5:595a43060c51c2a8cb61dd33c18e5fbd',
 								            'duration': 142,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:17',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1401991663,
 								            'upload_date': '20140605',
 								            'uploader': 'The Witcher',
 								            'uploader_id': '@thewitcher',
 								            'uploader_url': 'https://www.youtube.com/@thewitcher',
 								            'view_count': int,
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 19:33:59 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								        'skip': 'Age-restricted; requires authentication',
 								    }, {
 								        'note': 'Formerly an age-gated video with embed allowed in public site',
 								        'url': 'https://youtube.com/watch?v=HsUATh_Nc2U',
 								        'info_dict': {
 								            'id': 'HsUATh_Nc2U',
 								            'ext': 'mp4',
 								            'title': 'Godzilla 2 (Official Video)',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Entertainment'],
 								            'channel': 'FlyingKitty',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCYQT13AtrJC0gsM1far_zJg',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCYQT13AtrJC0gsM1far_zJg',
 								            'comment_count': int,
 								            'description': 'md5:bf77e03fcae5529475e500129b05668a',
 								            'duration': 177,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:2',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1586358900,
 								            'upload_date': '20200408',
 								            'uploader': 'FlyingKitty',
 								            'uploader_id': '@FlyingKitty900',
 								            'uploader_url': 'https://www.youtube.com/@FlyingKitty900',
 								            'view_count': int,
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 19:33:59 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        'note': 'Age-gated video embedable only with clientScreen=EMBED',
 								        'url': 'https://youtube.com/watch?v=Tq92D6wQ1mg',
 								        'info_dict': {
 								            'id': 'Tq92D6wQ1mg',
 								            'ext': 'mp4',
 								            'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
 								            'age_limit': 18,
 								            'availability': 'needs_auth',
 								            'categories': ['Entertainment'],
 								            'channel': 'Projekt Melody',
 								            'channel_follower_count': int,
 								            'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
 								            'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
 								            'comment_count': int,
 								            'description': 'md5:17eccca93a786d51bc67646756894066',
 								            'duration': 106,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:5',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1577508724,
 								            'upload_date': '20191228',
 								            'uploader': 'Projekt Melody',
 								            'uploader_id': '@ProjektMelody',
 								            'uploader_url': 'https://www.youtube.com/@ProjektMelody',
 								            'view_count': int,
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 19:33:59 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'Age-restricted; requires authentication',
 								    }, {
 								        'note': 'Non-age-gated non-embeddable video',
 								        'url': 'https://youtube.com/watch?v=MeJVWBSsPAY',
 								        'info_dict': {
 								            'id': 'MeJVWBSsPAY',
 								            'ext': 'mp4',
 								            'title': 'OOMPH! - Such Mich Find Mich (Lyrics)',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Music'],
 								            'channel': 'Herr Lurik',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCdR3RSDPqub28LjZx0v9-aA',
 								            'channel_url': 'https://www.youtube.com/channel/UCdR3RSDPqub28LjZx0v9-aA',
 								            'description': 'md5:205c1049102a4dffa61e4831c1f16851',
 								            'duration': 210,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': False,
 								            'tags': 'count:5',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1375214517,
 								            'upload_date': '20130730',
 								            'uploader': 'Herr Lurik',
 								            'uploader_id': '@HerrLurik',
 								            'uploader_url': 'https://www.youtube.com/@HerrLurik',
 								            'view_count': int,
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 19:33:59 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								    }, {
 								        'note': 'Non-bypassable age-gated video',
 								        'url': 'https://youtube.com/watch?v=Cr381pDsSsA',
 								        'only_matching': True,
 								    }, {
 								        # video_info is None
 								        # https://github.com/ytdl-org/youtube-dl/issues/4421
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-20 00:52:59 +05:30
+								        # YouTube Red ad is not captured for creator
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'url': '__2ABJjxzNo',
 								        'info_dict': {
 								            'id': '__2ABJjxzNo',
 								            'ext': 'mp4',
 								            'title': 'Deadmau5 - Some Chords (HD)',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Music'],
 								            'channel': 'deadmau5',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCYEK6xds6eo-3tr4xRdflmQ',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCYEK6xds6eo-3tr4xRdflmQ',
 								            'comment_count': int,
 								            'description': 'md5:c27e1e9e095a3d9dd99de2f0f377ba06',
 								            'duration': 266,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:14',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1272659179,
 								            'upload_date': '20100430',
 								            'uploader': 'deadmau5',
 								            'uploader_id': '@deadmau5',
 								            'uploader_url': 'https://www.youtube.com/@deadmau5',
 								            'view_count': int,
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-20 00:52:59 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'expected_warnings': ['DASH manifest missing'],
 								        'params': {'skip_download': True},
 								    }, {
 								        # https://github.com/ytdl-org/youtube-dl/issues/4431
 								        'url': 'lqQg6PlCWgI',
 								        'info_dict': {
 								            'id': 'lqQg6PlCWgI',
 								            'ext': 'mp4',
 								            'title': 'Hockey - Women -  GER-AUS - London 2012 Olympic Games',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Sports'],
 								            'channel': 'Olympics',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCTl3QQTvqHFjurroKxexy2Q',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCTl3QQTvqHFjurroKxexy2Q',
 								            'description': 'md5:04bbbf3ccceb6795947572ca36f45904',
 								            'duration': 6085,
 								            'like_count': int,
 								            'live_status': 'was_live',
 								            'media_type': 'livestream',
 								            'playable_in_embed': True,
 								            'release_date': '20120731',
 								            'release_timestamp': 1343767800,
 								            'tags': 'count:10',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1440707674,
 								            'upload_date': '20150827',
 								            'uploader': 'Olympics',
 								            'uploader_id': '@Olympics',
 								            'uploader_url': 'https://www.youtube.com/@Olympics',
 								            'view_count': int,
-												[youtube] Amend test

											
										
										
											2014-12-11 16:34:37 +01:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
-												[youtube|ffmpeg] Automatically correct video with non-square pixels (Fixes #4674)

											
										
										
											2015-01-10 05:45:51 +01:00
+								        # Non-square pixels
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'url': 'https://www.youtube.com/watch?v=_b-2C3KPAM0',
 								        'info_dict': {
 								            'id': '_b-2C3KPAM0',
 								            'ext': 'mp4',
 								            'title': '[A-made] 變態妍字幕版 太妍 我就是這樣的人',
 								            'age_limit': 0,
 								            'availability': 'unlisted',
 								            'categories': ['People & Blogs'],
 								            'channel': '孫ᄋᄅ',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCS-xxCmRaA6BFdmgDPA_BIw',
 								            'channel_url': 'https://www.youtube.com/channel/UCS-xxCmRaA6BFdmgDPA_BIw',
 								            'comment_count': int,
 								            'description': 'md5:636f03cf211e7687daffe5bded88a94f',
 								            'duration': 85,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'stretched_ratio': 16 / 9.,
 								            'tags': 'count:11',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1299776999,
 								            'upload_date': '20110310',
 								            'uploader': '孫ᄋᄅ',
 								            'uploader_id': '@AllenMeow',
 								            'uploader_url': 'https://www.youtube.com/@AllenMeow',
 								            'view_count': int,
-												[youtube] Add test for #5361

											
										
										
											2015-04-06 00:35:55 +06:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # url_encoded_fmt_stream_map is empty string (deprecated)
 								        # https://github.com/ytdl-org/youtube-dl/commit/3a9fadd6dfc127ed0707b218b11ac10c654af1e2
 								        # https://github.com/ytdl-org/youtube-dl/commit/67299f23d8b1894120e875edf97440de87e22308
 								        'url': 'qEJwOuvDf7I',
 								        'only_matching': True,
 								    }, {
 								        # Extraction from multiple DASH manifests
 								        # https://github.com/ytdl-org/youtube-dl/pull/6097
 								        'url': 'https://www.youtube.com/watch?v=FIl7x6_3R5Y',
 								        'info_dict': {
 								            'id': 'FIl7x6_3R5Y',
 								            'ext': 'mp4',
 								            'title': '[60fps] 150614  마마무 솔라 \'Mr. 애매모호\' 라이브 직캠 @대학로 게릴라 콘서트',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['People & Blogs'],
 								            'channel': 'dorappi2000',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCNlmrKRHLHcd2gq6LtPOTlQ',
 								            'channel_url': 'https://www.youtube.com/channel/UCNlmrKRHLHcd2gq6LtPOTlQ',
 								            'description': 'md5:116377fd2963b81ec4ce64b542173306',
 								            'duration': 220,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:12',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1435276932,
 								            'upload_date': '20150626',
 								            'uploader': 'dorappi2000',
 								            'uploader_id': '@dorappi2000',
 								            'uploader_url': 'https://www.youtube.com/@dorappi2000',
 								            'view_count': int,
-												Merge remote-tracking branch 'yan12125/download-dash-segments' (#5886)

											
										
										
											2015-07-20 19:34:24 +02:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
-												[youtube] Add a test for the DASH segment downloader

											
										
										
											2015-06-10 14:47:02 +08:00
+								        # DASH manifest with segment_list
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        # https://github.com/ytdl-org/youtube-dl/pull/5886
 								        'url': 'https://www.youtube.com/embed/CsmdDsKjzN8',
 								        'info_dict': {
 								            'id': 'CsmdDsKjzN8',
 								            'ext': 'mp4',
 								            'title': 'Retransmisión XVIII Media maratón Zaragoza 2015',
 								            'age_limit': 0,
 								            'availability': 'unlisted',
 								            'categories': ['Sports'],
 								            'channel': 'Airtek | LED streaming',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCzTzUmjXxxacNnL8I3m4LnQ',
 								            'channel_url': 'https://www.youtube.com/channel/UCzTzUmjXxxacNnL8I3m4LnQ',
 								            'comment_count': int,
 								            'description': 'md5:fcac84e6c545114766f670236fc10196',
 								            'duration': 4394,
 								            'like_count': int,
 								            'live_status': 'was_live',
 								            'media_type': 'livestream',
 								            'playable_in_embed': True,
 								            'release_date': '20150510',
 								            'release_timestamp': 1431241011,
 								            'tags': 'count:31',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1430505417,
 								            'upload_date': '20150501',
 								            'uploader': 'Airtek | LED streaming',
 								            'uploader_id': '@airtekledstreaming7916',
 								            'uploader_url': 'https://www.youtube.com/@airtekledstreaming7916',
 								            'view_count': int,
-												Merge remote-tracking branch 'yan12125/download-dash-segments' (#5886)

											
										
										
											2015-07-20 19:34:24 +02:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'format': '135',  # bestvideo
 								            'skip_download': True,
 								            'youtube_include_dash_manifest': True,
-												[youtube] Expand _VALID_URL to support vid.plus

											
										
										
											2015-08-17 02:04:13 +06:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								    }, {
 								        # Multi-camera events (deprecated)
 								        # https://web.archive.org/web/20200308092705/https://support.google.com/youtube/answer/2853812
 								        'url': 'https://www.youtube.com/watch?v=zaPI8MvL8pg',
 								        'only_matching': True,
 								    }, {
 								        # Multi-camera events (deprecated)
 								        # https://github.com/ytdl-org/youtube-dl/issues/8536
 								        'url': 'https://www.youtube.com/watch?v=gVfLd0zydlo',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://vid.plus/FlRa-iH7PGw',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://zwearz.com/watch/9lWxNJF-ufM/electra-woman-dyna-girl-official-trailer-grace-helbig.html',
 								        'only_matching': True,
 								    }, {
 								        # Title with JS-like syntax "};"
 								        # https://github.com/ytdl-org/youtube-dl/issues/7468
 								        # Also tests cut-off URL expansion in video description
 								        # https://github.com/ytdl-org/youtube-dl/issues/1892
 								        # https://github.com/ytdl-org/youtube-dl/issues/8164
 								        'url': 'https://www.youtube.com/watch?v=lsguqyKfVQg',
 								        'info_dict': {
 								            'id': 'lsguqyKfVQg',
 								            'ext': 'mp4',
 								            'title': '{dark walk}; Loki/AC/Dishonored; collab w/Elflover21',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Film & Animation'],
 								            'channel': 'IronSoulElf',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCTSRgz5jylBvFt_S7wnsqLQ',
 								            'channel_url': 'https://www.youtube.com/channel/UCTSRgz5jylBvFt_S7wnsqLQ',
 								            'comment_count': int,
 								            'description': 'md5:8085699c11dc3f597ce0410b0dcbb34a',
 								            'duration': 133,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:13',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1447959261,
 								            'upload_date': '20151119',
 								            'uploader': 'IronSoulElf',
 								            'uploader_id': '@IronSoulElf',
 								            'uploader_url': 'https://www.youtube.com/@IronSoulElf',
 								            'view_count': int,
-												[youtube] Add test for #8536

											
										
										
											2016-02-13 05:18:58 +06:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # Tags with '};'
 								        # https://github.com/ytdl-org/youtube-dl/issues/7468
 								        'url': 'https://www.youtube.com/watch?v=Ms7iBXnlUO8',
 								        'only_matching': True,
 								    }, {
 								        # Video with yt:stretch=17:0
 								        'url': 'https://www.youtube.com/watch?v=Q39EVAstoRM',
 								        'info_dict': {
 								            'id': 'Q39EVAstoRM',
 								            'ext': 'mp4',
 								            'title': 'Clash Of Clans#14 Dicas De Ataque Para CV 4',
 								            'description': 'md5:ee18a25c350637c8faff806845bddee9',
 								            'upload_date': '20151107',
-												[youtube] Fall back to the original regex for ytplayer.config

											
										
										
											2015-11-22 13:49:33 +01:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'This video does not exist.',
 								    }, {
 								        # Video with incomplete 'yt:stretch=16:'
 								        'url': 'https://www.youtube.com/watch?v=FRhJzUSJbGI',
 								        'only_matching': True,
 								    }, {
 								        # Video licensed under Creative Commons
 								        'url': 'https://www.youtube.com/watch?v=M4gD1WSo5mA',
 								        'info_dict': {
 								            'id': 'M4gD1WSo5mA',
 								            'ext': 'mp4',
 								            'title': 'William Fisher, CopyrightX: Lecture 3.2, The Subject Matter of Copyright: Drama and choreography',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Education'],
 								            'channel': 'The Berkman Klein Center for Internet & Society',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCuLGmD72gJDBwmLw06X58SA',
 								            'channel_url': 'https://www.youtube.com/channel/UCuLGmD72gJDBwmLw06X58SA',
 								            'chapters': 'count:4',
 								            'description': 'md5:a677553cf0840649b731a3024aeff4cc',
 								            'duration': 721,
 								            'license': 'Creative Commons Attribution license (reuse allowed)',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:3',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1422422076,
 								            'upload_date': '20150128',
 								            'uploader': 'The Berkman Klein Center for Internet & Society',
 								            'uploader_id': '@BKCHarvard',
 								            'uploader_url': 'https://www.youtube.com/@BKCHarvard',
 								            'view_count': int,
-												[youtube] Add support for zwearz (Closes #9062)

											
										
										
											2016-04-04 02:26:20 +06:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # https://github.com/ytdl-org/youtube-dl/commit/fd050249afce1bcc9e7f4a127069375467007b55
 								        'url': 'https://www.youtube.com/watch?v=eQcmzGIKrzg',
 								        'info_dict': {
 								            'id': 'eQcmzGIKrzg',
 								            'ext': 'mp4',
 								            'title': 'Democratic Socialism and Foreign Policy | Bernie Sanders',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['News & Politics'],
 								            'channel': 'Bernie Sanders',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCH1dpzjCEiGAt8CXkryhkZg',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCH1dpzjCEiGAt8CXkryhkZg',
 								            'chapters': 'count:5',
 								            'comment_count': int,
 								            'description': 'md5:13a2503d7b5904ef4b223aa101628f39',
 								            'duration': 4060,
 								            'heatmap': 'count:100',
 								            'license': 'Creative Commons Attribution license (reuse allowed)',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:12',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1447987198,
 								            'upload_date': '20151120',
 								            'uploader': 'Bernie Sanders',
 								            'uploader_id': '@BernieSanders',
 								            'uploader_url': 'https://www.youtube.com/@BernieSanders',
 								            'view_count': int,
-												[youtube] Fall back to the original regex for ytplayer.config

											
										
										
											2015-11-22 13:49:33 +01:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        'url': 'https://www.youtube.com/watch?feature=player_embedded&amp;amp;v=V36LpHqtcDY',
 								        'only_matching': True,
 								    }, {
 								        # YouTube Red paid video
 								        # https://github.com/ytdl-org/youtube-dl/issues/10059
 								        'url': 'https://www.youtube.com/watch?v=i1Ko8UG-Tdo',
 								        'only_matching': True,
 								    }, {
 								        # Rental video preview
 								        # https://github.com/ytdl-org/youtube-dl/commit/fd050249afce1bcc9e7f4a127069375467007b55
 								        'url': 'https://www.youtube.com/watch?v=yYr8q0y5Jfg',
 								        'info_dict': {
 								            'id': 'uGpuVWrhIzE',
 								            'ext': 'mp4',
 								            'title': 'Piku - Trailer',
 								            'description': 'md5:c36bd60c3fd6f1954086c083c72092eb',
 								            'upload_date': '20150811',
 								            'license': 'Standard YouTube License',
-												[youtube] Add test with '};' in tags

											
										
										
											2015-11-23 21:02:37 +06:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'This video is not available.',
 								    }, {
 								        # YouTube Red video with episode data
 								        'url': 'https://www.youtube.com/watch?v=iqKdEhx-dD4',
 								        'info_dict': {
 								            'id': 'iqKdEhx-dD4',
 								            'ext': 'mp4',
 								            'title': 'Isolation - Mind Field (Ep 1)',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Entertainment'],
 								            'channel': 'Vsauce',
 								            'channel_follower_count': int,
 								            'channel_id': 'UC6nSFpj9HTCZ5t-N3Rm3-HA',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UC6nSFpj9HTCZ5t-N3Rm3-HA',
 								            'comment_count': int,
 								            'description': 'md5:f540112edec5d09fc8cc752d3d4ba3cd',
 								            'duration': 2085,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:12',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1484761047,
 								            'upload_date': '20170118',
 								            'uploader': 'Vsauce',
 								            'uploader_id': '@Vsauce',
 								            'uploader_url': 'https://www.youtube.com/@Vsauce',
 								            'view_count': int,
-												[youtube] Ignore yt:stretch with zero width/height

											
										
										
											2015-11-28 01:07:07 +01:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'expected_warnings': ['Skipping DASH manifest'],
 								        'params': {'skip_download': True},
 								    }, {
 								        # The following content has been identified by the YouTube community
 								        # as inappropriate or offensive to some audiences.
 								        'url': 'https://www.youtube.com/watch?v=6SJNVb0GnPI',
 								        'info_dict': {
 								            'id': '6SJNVb0GnPI',
 								            'ext': 'mp4',
 								            'title': 'Race Differences in Intelligence',
 								            'description': 'md5:5d161533167390427a1f8ee89a1fc6f1',
 								            'duration': 965,
 								            'upload_date': '20140124',
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-17 08:32:33 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'This video has been removed for violating YouTube\'s policy on hate speech.',
 								    }, {
 								        # itag 212
 								        'url': '1t24XAntNCY',
 								        'only_matching': True,
 								    }, {
 								        # geo restricted to JP
 								        'url': 'sJL6WA-aGkQ',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://invidio.us/watch?v=BaW_jenozKc',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://redirect.invidious.io/watch?v=BaW_jenozKc',
 								        'only_matching': True,
 								    }, {
 								        # from https://nitter.pussthecat.org/YouTube/status/1360363141947944964#m
 								        'url': 'https://redirect.invidious.io/Yh0AhrY9GjA',
 								        'only_matching': True,
 								    }, {
 								        # DRM protected
 								        'url': 'https://www.youtube.com/watch?v=s7_qI6_mIXc',
 								        'only_matching': True,
 								    }, {
 								        # Video with unsupported adaptive stream type formats
 								        # https://github.com/ytdl-org/youtube-dl/commit/4fe54c128a11d394874505af75aaa5a2276aa3ba
 								        'url': 'https://www.youtube.com/watch?v=Z4Vy8R84T1U',
 								        'only_matching': True,
 								    }, {
 								        # YouTube Music Auto-generated description
 								        # TODO: fix metadata extraction
 								        # https://github.com/ytdl-org/youtube-dl/issues/20599
 								        'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
 								        'info_dict': {
 								            'id': 'MgNrAu2pzNs',
 								            'ext': 'mp4',
 								            'title': 'Voyeur Girl',
 								            'age_limit': 0,
 								            'album': 'it\'s too much love to know my dear',
 								            'alt_title': 'Voyeur Girl',
 								            'artists': ['Stephen'],
 								            'availability': 'public',
 								            'categories': ['Music'],
 								            'channel': 'Stephen',  # TODO: should be 'Stephen - Topic'
 								            'channel_follower_count': int,
 								            'channel_id': 'UC-pWHpBjdGG69N9mM2auIAA',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UC-pWHpBjdGG69N9mM2auIAA',
 								            'comment_count': int,
 								            'creators': ['Stephen'],
 								            'description': 'md5:7ae382a65843d6df2685993e90a8628f',
 								            'duration': 169,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'release_date': '20190313',
 								            'tags': 'count:11',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1552385807,
 								            'track': 'Voyeur Girl',
 								            'upload_date': '20190312',
 								            'uploader': 'Stephen',
 								            'view_count': int,
-												[youtube] Extract license (Closes #8725)

											
										
										
											2016-03-02 23:07:25 +06:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        'url': 'https://www.youtubekids.com/watch?v=3b8nCWDgZ6Q',
 								        'only_matching': True,
 								    }, {
 								        # invalid -> valid video id redirection
 								        # https://github.com/ytdl-org/youtube-dl/pull/25063
 								        'url': 'DJztXj2GPfl',
 								        'info_dict': {
 								            'id': 'DJztXj2GPfk',
 								            'ext': 'mp4',
 								            'title': 'Panjabi MC - Mundian To Bach Ke (The Dictator Soundtrack)',
 								            'description': 'md5:bf577a41da97918e94fa9798d9228825',
 								            'upload_date': '20090125',
 								            'artist': 'Panjabi MC',
 								            'track': 'Beware of the Boys (Mundian to Bach Ke) - Motivo Hi-Lectro Remix',
 								            'album': 'Beware of the Boys (Mundian To Bach Ke)',
-												[youtube] Extract uploader_url (Closes #8724)

											
										
										
											2016-03-02 23:49:10 +06:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'Video unavailable',
 								    }, {
 								        # empty description results in an empty string
 								        # https://github.com/ytdl-org/youtube-dl/pull/26575
 								        'url': 'https://www.youtube.com/watch?v=x41yOUIvK2k',
 								        'info_dict': {
 								            'id': 'x41yOUIvK2k',
 								            'ext': 'mp4',
 								            'title': 'IMG 3456',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Pets & Animals'],
 								            'channel': 'l\'Or Vert asbl',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCo03ZQPBW5U4UC3regpt1nw',
 								            'channel_url': 'https://www.youtube.com/channel/UCo03ZQPBW5U4UC3regpt1nw',
 								            'description': '',
 								            'duration': 7,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': [],
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1497343210,
 								            'upload_date': '20170613',
 								            'uploader': 'l\'Or Vert asbl',
 								            'uploader_id': '@ElevageOrVert',
 								            'uploader_url': 'https://www.youtube.com/@ElevageOrVert',
 								            'view_count': int,
-												[youtube] Add YouTube Red paid video reference test (#10059)

											
										
										
											2016-07-12 02:10:35 +07:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # with '};' inside yt initial data (see [1])
 								        # see [2] for an example with '};' inside ytInitialPlayerResponse
 								        # 1. https://github.com/ytdl-org/youtube-dl/issues/27093
 								        # 2. https://github.com/ytdl-org/youtube-dl/issues/27216
 								        'url': 'https://www.youtube.com/watch?v=CHqg6qOn4no',
 								        'info_dict': {
 								            'id': 'CHqg6qOn4no',
 								            'ext': 'mp4',
 								            'title': 'Part 77   Sort a list of simple types in c#',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Education'],
 								            'channel': 'kudvenkat',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCCTVrRB5KpIiK6V2GGVsR1Q',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCCTVrRB5KpIiK6V2GGVsR1Q',
 								            'chapters': 'count:4',
 								            'comment_count': int,
 								            'description': 'md5:b8746fa52e10cdbf47997903f13b20dc',
 								            'duration': 522,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:12',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1377976349,
 								            'upload_date': '20130831',
 								            'uploader': 'kudvenkat',
 								            'uploader_id': '@Csharp-video-tutorialsBlogspot',
 								            'uploader_url': 'https://www.youtube.com/@Csharp-video-tutorialsBlogspot',
 								            'view_count': int,
-												[youtube] Add support for rental videos' previews (Closes #10532)

											
										
										
											2016-09-03 01:17:15 +07:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # another example of '};' in ytInitialData
 								        'url': 'https://www.youtube.com/watch?v=gVfgbahppCY',
 								        'only_matching': True,
 								    }, {
 								        'url': 'https://www.youtube.com/watch_popup?v=63RmMXCd_bQ',
 								        'only_matching': True,
 								    }, {
 								        # https://github.com/ytdl-org/youtube-dl/pull/28094
 								        'url': 'OtqTfy26tG0',
 								        'info_dict': {
 								            'id': 'OtqTfy26tG0',
 								            'ext': 'mp4',
 								            'title': 'Burn Out',
 								            'age_limit': 0,
 								            'album': 'Every Day',
 								            'alt_title': 'Burn Out',
 								            'artists': ['The Cinematic Orchestra'],
 								            'availability': 'public',
 								            'categories': ['Music'],
 								            'channel': 'The Cinematic Orchestra',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCIzsJBIyo8hhpFm1NK0uLgw',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCIzsJBIyo8hhpFm1NK0uLgw',
 								            'comment_count': int,
 								            'creators': ['The Cinematic Orchestra'],
 								            'description': 'md5:fee8b19b7ba433cc2957d1c7582067ac',
 								            'duration': 614,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'release_date': '20020513',
 								            'release_year': 2023,
 								            'tags': 'count:3',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1416497379,
 								            'track': 'Burn Out',
 								            'upload_date': '20141120',
 								            'uploader': 'The Cinematic Orchestra',
 								            'view_count': int,
-												[youtube] Add test for itag 212 (#11575)

											
										
										
											2017-01-09 22:30:46 +07:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # controversial video, only works with bpctr when authenticated with cookies
 								        'url': 'https://www.youtube.com/watch?v=nGC3D_FkCmg',
 								        'only_matching': True,
 								    }, {
 								        # controversial video, requires bpctr/contentCheckOk
 								        'url': 'https://www.youtube.com/watch?v=SZJvDhaSDnc',
 								        'info_dict': {
 								            'id': 'SZJvDhaSDnc',
 								            'ext': 'mp4',
 								            'title': 'San Diego teen commits suicide after bullying over embarrassing video',
 								            'age_limit': 18,
 								            'availability': 'needs_auth',
 								            'categories': ['News & Politics'],
 								            'channel': 'CBS Mornings',
 								            'channel_follower_count': int,
 								            'channel_id': 'UC-SJ6nODDmufqBzPBwCvYvQ',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UC-SJ6nODDmufqBzPBwCvYvQ',
 								            'comment_count': int,
 								            'description': 'md5:acde3a73d3f133fc97e837a9f76b53b7',
 								            'duration': 170,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:5',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1405513526,
 								            'upload_date': '20140716',
 								            'uploader': 'CBS Mornings',
 								            'uploader_id': '@CBSMornings',
 								            'uploader_url': 'https://www.youtube.com/@CBSMornings',
 								            'view_count': int,
-												[youtube] Extract episode metadata (closes #9695, closes #11774)

											
										
										
											2017-01-21 18:10:32 +07:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'Age-restricted; requires authentication',
 								    }, {
 								        # restricted location
 								        # https://github.com/ytdl-org/youtube-dl/issues/28685
 								        'url': 'cBvYw8_A0vQ',
 								        'info_dict': {
 								            'id': 'cBvYw8_A0vQ',
 								            'ext': 'mp4',
 								            'title': '4K Ueno Okachimachi  Street  Scenes  上野御徒町歩き',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Travel & Events'],
 								            'channel': 'Walk around Japan',
 								            'channel_follower_count': int,
 								            'channel_id': 'UC3o_t8PzBmXf5S9b7GLx1Mw',
 								            'channel_url': 'https://www.youtube.com/channel/UC3o_t8PzBmXf5S9b7GLx1Mw',
 								            'description': 'md5:ea770e474b7cd6722b4c95b833c03630',
 								            'duration': 1456,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:5',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1605884416,
 								            'upload_date': '20201120',
 								            'uploader': 'Walk around Japan',
 								            'uploader_id': '@walkaroundjapan7124',
 								            'uploader_url': 'https://www.youtube.com/@walkaroundjapan7124',
 								            'view_count': int,
-												[youtube] Fix controversy videos extraction (closes #14027, closes #14029)

											
										
										
											2017-08-26 15:38:38 +07:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # Has multiple audio streams
 								        'url': 'WaOKSUlf4TM',
 								        'only_matching': True,
 								    }, {
 								        # Requires Premium: has format 141 when requested using YTM url
 								        'url': 'https://music.youtube.com/watch?v=XclachpHxis',
 								        'only_matching': True,
 								    }, {
 								        # multiple subtitles with same lang_code
 								        'url': 'https://www.youtube.com/watch?v=wsQiKKfKxug',
 								        'only_matching': True,
 								    }, {
 								        # Force use of the android client fallback
 								        'url': 'https://www.youtube.com/watch?v=YOelRv7fMxY',
 								        'info_dict': {
 								            'id': 'YOelRv7fMxY',
 								            'ext': '3gp',
 								            'title': 'DIGGING A SECRET TUNNEL Part 1',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Entertainment'],
 								            'channel': 'colinfurze',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCp68_FLety0O-n9QU6phsgw',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCp68_FLety0O-n9QU6phsgw',
 								            'chapters': 'count:4',
 								            'comment_count': int,
 								            'description': 'md5:5d5991195d599b56cd0c4148907eec50',
 								            'duration': 596,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:6',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1624546829,
 								            'upload_date': '20210624',
 								            'uploader': 'colinfurze',
 								            'uploader_id': '@colinfurze',
 								            'uploader_url': 'https://www.youtube.com/@colinfurze',
 								            'view_count': int,
-												[youtube] Raise GeoRestrictedError

											
										
										
											2017-02-26 16:51:21 +07:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'extractor_args': {'youtube': {'player_client': ['android']}},
 								            'format': '17',  # 3gp format available on android
 								            'skip_download': True,
-												[youtube] Raise GeoRestrictedError

											
										
										
											2017-02-26 16:51:21 +07:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'Android client broken',
 								    }, {
 								        # Skip download of additional client configs (remix client config in this case)
 								        'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
 								        'only_matching': True,
 								        'params': {'extractor_args': {'youtube': {'player_skip': ['configs']}}},
 								    }, {
 								        # shorts
 								        'url': 'https://www.youtube.com/shorts/BGQWPY4IigY',
 								        'only_matching': True,
 								    }, {
 								        'note': 'Storyboards',
 								        'url': 'https://www.youtube.com/watch?v=5KLPxDtMqe8',
 								        'info_dict': {
 								            'id': '5KLPxDtMqe8',
 								            'ext': 'mhtml',
 								            'title': 'Your Brain is Plastic',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Education'],
 								            'channel': 'SciShow',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCZYTClx2T1of7BRZ86-8fow',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCZYTClx2T1of7BRZ86-8fow',
 								            'chapters': 'count:5',
 								            'comment_count': int,
 								            'description': 'md5:89cd86034bdb5466cd87c6ba206cd2bc',
 								            'duration': 248,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:12',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1395685455,
 								            'upload_date': '20140324',
 								            'uploader': 'SciShow',
 								            'uploader_id': '@SciShow',
 								            'uploader_url': 'https://www.youtube.com/@SciShow',
 								            'view_count': int,
-												[youtube] Add support for invidio.us (closes #17613)

											
										
										
											2018-09-24 00:14:49 +07:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'format': 'mhtml',
 								            'skip_download': True,
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-20 02:14:36 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								    }, {
 								        # Ensure video upload_date is in UTC timezone (video was uploaded 1641170939)
 								        'url': 'https://www.youtube.com/watch?v=2NUZ8W2llS4',
 								        'info_dict': {
 								            'id': '2NUZ8W2llS4',
 								            'ext': 'mp4',
 								            'title': 'The NP that test your phone performance 🙂',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Gaming'],
 								            'channel': 'Leon Nguyen',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCRqNBSOHgilHfAczlUmlWHA',
 								            'channel_url': 'https://www.youtube.com/channel/UCRqNBSOHgilHfAczlUmlWHA',
 								            'comment_count': int,
 								            'description': 'md5:144494b24d4f9dfacb97c1bbef5de84d',
 								            'duration': 21,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:23',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1641170939,
 								            'upload_date': '20220103',
 								            'uploader': 'Leon Nguyen',
 								            'uploader_id': '@LeonNguyen',
 								            'uploader_url': 'https://www.youtube.com/@LeonNguyen',
 								            'view_count': int,
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-20 02:14:36 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # Date text is for a premiered video; ensure upload date is in UTC (published 1641172509)
 								        'url': 'https://www.youtube.com/watch?v=mzZzzBU6lrM',
 								        'info_dict': {
 								            'id': 'mzZzzBU6lrM',
 								            'ext': 'mp4',
 								            'title': 'I Met GeorgeNotFound In Real Life...',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Entertainment'],
 								            'channel': 'Quackity',
 								            'channel_follower_count': int,
 								            'channel_id': 'UC_8NknAFiyhOUaZqHR3lq3Q',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UC_8NknAFiyhOUaZqHR3lq3Q',
 								            'comment_count': int,
 								            'description': 'md5:42e72df3d4d5965903a2b9359c3ccd25',
 								            'duration': 955,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'release_date': '20220103',
 								            'release_timestamp': 1641172509,
 								            'tags': 'count:26',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1641172509,
 								            'upload_date': '20220103',
 								            'uploader': 'Quackity',
 								            'uploader_id': '@Quackity',
 								            'uploader_url': 'https://www.youtube.com/@Quackity',
 								            'view_count': int,
-												[youtube] Update tests and add a tests for #18804

											
										
										
											2019-01-16 02:18:27 +07:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # continuous livestream.
 								        # Upload date was 2022-07-12T05:12:29-07:00, while stream start is 2022-07-12T15:59:30+00:00
 								        'url': 'https://www.youtube.com/watch?v=jfKfPfyJRdk',
 								        'info_dict': {
 								            'id': 'jfKfPfyJRdk',
 								            'ext': 'mp4',
 								            'title': str,
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Music'],
 								            'channel': 'Lofi Girl',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCSJ4gkVC6NrvII8umztf0Ow',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCSJ4gkVC6NrvII8umztf0Ow',
 								            'concurrent_view_count': int,
 								            'description': 'md5:48841fcfc1be6131d729fa7b4a7784cb',
 								            'like_count': int,
 								            'live_status': 'is_live',
 								            'media_type': 'livestream',
 								            'playable_in_embed': True,
 								            'release_date': '20220712',
 								            'release_timestamp': 1657641570,
 								            'tags': 'count:32',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1657627949,
 								            'upload_date': '20220712',
 								            'uploader': 'Lofi Girl',
 								            'uploader_id': '@LofiGirl',
 								            'uploader_url': 'https://www.youtube.com/@LofiGirl',
 								            'view_count': int,
-												[youtube] Extract additional meta data from video description on youtube music videos

YouTube music videos often have auto-generated video descriptions that can be
utilized to extract additional information about the video. This is desirable
in order to provide the user with as much meta data as possible. This commit
adds extraction methods for the following fields for youtube music videos:
- artist (fallback extraction methods added)
- track (fallback extraction methods added)
- album (new in this commit)
- release_date (new in this commit)
- release_year (new in this commit)

4 tests have been added to test this new functionality:
- YoutubeIE tests 27, 28, 29, and 30

Resolves: #20599

											
										
										
											2019-04-22 00:26:48 -04:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        'url': 'https://www.youtube.com/watch?v=tjjjtzRLHvA',
 								        'info_dict': {
 								            'id': 'tjjjtzRLHvA',
 								            'ext': 'mp4',
 								            'title': 'ハッシュタグ無し };if window.ytcsi',
 								            'age_limit': 0,
 								            'availability': 'unlisted',
 								            'categories': ['Music'],
 								            'channel': 'Lesmiscore',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCdqltm_7iv1Vs6kp6Syke5A',
 								            'channel_url': 'https://www.youtube.com/channel/UCdqltm_7iv1Vs6kp6Syke5A',
 								            'description': '',
 								            'duration': 6,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'short',
 								            'playable_in_embed': True,
 								            'tags': [],
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1648005313,
 								            'upload_date': '20220323',
 								            'uploader': 'Lesmiscore',
 								            'uploader_id': '@lesmiscore',
 								            'uploader_url': 'https://www.youtube.com/@lesmiscore',
 								            'view_count': int,
-												[youtube] Extract additional meta data from video description on youtube music videos

YouTube music videos often have auto-generated video descriptions that can be
utilized to extract additional information about the video. This is desirable
in order to provide the user with as much meta data as possible. This commit
adds extraction methods for the following fields for youtube music videos:
- artist (fallback extraction methods added)
- track (fallback extraction methods added)
- album (new in this commit)
- release_date (new in this commit)
- release_year (new in this commit)

4 tests have been added to test this new functionality:
- YoutubeIE tests 27, 28, 29, and 30

Resolves: #20599

											
										
										
											2019-04-22 00:26:48 -04:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # Prefer primary title+description language metadata by default
 								        # Do not prefer translated description if primary is empty
 								        'url': 'https://www.youtube.com/watch?v=el3E4MbxRqQ',
 								        'info_dict': {
 								            'id': 'el3E4MbxRqQ',
 								            'ext': 'mp4',
 								            'title': 'dlp test video 2 - primary sv no desc',
 								            'age_limit': 0,
 								            'availability': 'unlisted',
 								            'categories': ['People & Blogs'],
 								            'channel': 'cole-dlp-test-acc',
 								            'channel_id': 'UCiu-3thuViMebBjw_5nWYrA',
 								            'channel_url': 'https://www.youtube.com/channel/UCiu-3thuViMebBjw_5nWYrA',
 								            'description': '',
 								            'duration': 5,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': [],
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1662677394,
 								            'upload_date': '20220908',
 								            'uploader': 'cole-dlp-test-acc',
 								            'uploader_id': '@coletdjnz',
 								            'uploader_url': 'https://www.youtube.com/@coletdjnz',
 								            'view_count': int,
-												[youtube] add support youtubekids.com(closes #23272)

											
										
										
											2019-11-30 17:51:34 +01:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # Extractor argument: prefer translated title+description
 								        'url': 'https://www.youtube.com/watch?v=gHKT4uU8Zng',
 								        'info_dict': {
 								            'id': 'gHKT4uU8Zng',
 								            'ext': 'mp4',
 								            'title': 'dlp test video title primary (en-GB)',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['People & Blogs'],
 								            'channel': 'cole-dlp-test-acc',
 								            'channel_id': 'UCiu-3thuViMebBjw_5nWYrA',
 								            'channel_url': 'https://www.youtube.com/channel/UCiu-3thuViMebBjw_5nWYrA',
 								            'description': 'md5:e8c098ba19888e08554f960ffbf6f90e',
 								            'duration': 5,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': [],
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1659073275,
 								            'upload_date': '20220729',
 								            'uploader': 'cole-dlp-test-acc',
 								            'uploader_id': '@coletdjnz',
 								            'uploader_url': 'https://www.youtube.com/@coletdjnz',
 								            'view_count': int,
-												[youtube] Fix empty description extraction (#26575) (closes #26006)


											
										
										
											2020-09-13 16:23:21 +02:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'extractor_args': {'youtube': {'lang': ['fr']}},
 								            'skip_download': True,
-												[youtube] Fix empty description extraction (#26575) (closes #26006)


											
										
										
											2020-09-13 16:23:21 +02:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'expected_warnings': [r'Preferring "fr" translated fields'],
 								    }, {
 								        'note': '6 channel audio',
 								        'url': 'https://www.youtube.com/watch?v=zgdo7-RRjgo',
 								        'only_matching': True,
 								    }, {
 								        'note': 'Multiple HLS formats with same itag',
 								        'url': 'https://www.youtube.com/watch?v=kX3nB4PpJko',
 								        'info_dict': {
 								            'id': 'kX3nB4PpJko',
 								            'ext': 'mp4',
 								            'title': 'Last To Take Hand Off Jet, Keeps It!',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Entertainment'],
 								            'channel': 'MrBeast',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCX6OQ3DkcsbYNE6H8uQQuVA',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCX6OQ3DkcsbYNE6H8uQQuVA',
 								            'comment_count': int,
 								            'description': 'md5:42731fced13eff2c48c099fbb5c1b3a0',
 								            'duration': 937,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': [],
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1668286800,
 								            'upload_date': '20221112',
 								            'uploader': 'MrBeast',
 								            'uploader_id': '@MrBeast',
 								            'uploader_url': 'https://www.youtube.com/@MrBeast',
 								            'view_count': int,
-												Updated to release 2020.11.21.1

											
										
										
											2020-11-21 20:20:42 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'extractor_args': {'youtube': {'player_client': ['ios']}},
 								            'format': '233-1',
 								            'skip_download': True,
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 17:56:37 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'PO Token Required',
 								    }, {
 								        'note': 'Audio formats with Dynamic Range Compression',
 								        'url': 'https://www.youtube.com/watch?v=Tq92D6wQ1mg',
 								        'info_dict': {
 								            'id': 'Tq92D6wQ1mg',
 								            'ext': 'webm',
 								            'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
 								            'age_limit': 18,
 								            'availability': 'needs_auth',
 								            'categories': ['Entertainment'],
 								            'channel': 'Projekt Melody',
 								            'channel_follower_count': int,
 								            'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
 								            'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
 								            'comment_count': int,
 								            'description': 'md5:17eccca93a786d51bc67646756894066',
 								            'duration': 106,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:5',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1577508724,
 								            'upload_date': '20191228',
 								            'uploader': 'Projekt Melody',
 								            'uploader_id': '@ProjektMelody',
 								            'uploader_url': 'https://www.youtube.com/@ProjektMelody',
 								            'view_count': int,
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 17:56:37 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'extractor_args': {'youtube': {'player_client': ['tv_embedded']}},
 								            'format': '251-drc',
 								            'skip_download': True,
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'Age-restricted; requires authentication',
 								    }, {
 								        'note': 'Support /live/ URL + media type for post-live content',
 								        'url': 'https://www.youtube.com/live/qVv6vCqciTM',
 								        'info_dict': {
 								            'id': 'qVv6vCqciTM',
 								            'ext': 'mp4',
 								            'title': '【 #インターネット女クリスマス 】3Dで歌ってはしゃぐインターネットの女たち【月ノ美兎/名取さな】',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Entertainment'],
 								            'channel': 'さなちゃんねる',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCIdEIHpS0TdkqRkHL5OkLtA',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCIdEIHpS0TdkqRkHL5OkLtA',
 								            'chapters': 'count:13',
 								            'comment_count': int,
 								            'description': 'md5:6aebf95cc4a1d731aebc01ad6cc9806d',
 								            'duration': 4438,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'was_live',
 								            'media_type': 'livestream',
 								            'playable_in_embed': True,
 								            'release_date': '20221223',
 								            'release_timestamp': 1671793345,
 								            'tags': 'count:6',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1671798112,
 								            'upload_date': '20221223',
 								            'uploader': 'さなちゃんねる',
 								            'uploader_id': '@sana_natori',
 								            'uploader_url': 'https://www.youtube.com/@sana_natori',
 								            'view_count': int,
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-20 02:14:36 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # Fallbacks when the webpage and web client are unavailable
 								        'url': 'https://www.youtube.com/watch?v=wSSmNUl9Snw',
 								        'info_dict': {
 								            'id': 'wSSmNUl9Snw',
 								            'ext': 'webm',
 								            'title': 'The Computer Hack That Saved Apollo 14',
 								            'age_limit': 0,
 								            # 'availability': 'public',
 								            # 'categories': ['Science & Technology'],
 								            'channel': 'Scott Manley',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCxzC4EngIsMrPmbm6Nxvb-A',
 								            'channel_is_verified': True,
 								            'channel_url': 'https://www.youtube.com/channel/UCxzC4EngIsMrPmbm6Nxvb-A',
 								            'chapters': 'count:2',
 								            'comment_count': int,
 								            'description': 'md5:f4bed7b200404b72a394c2f97b782c02',
 								            'duration': 682,
 								            'heatmap': 'count:100',
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:8',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1504198713,
 								            'upload_date': '20170831',
 								            'uploader': 'Scott Manley',
 								            'uploader_id': '@scottmanley',
 								            'uploader_url': 'https://www.youtube.com/@scottmanley',
 								            'view_count': int,
-												[youtube] Fix controversial videos when requested via API (#533)

Closes: https://github.com/yt-dlp/yt-dlp/issues/511#issuecomment-883024350
Authored by: colethedj
											
										
										
											2021-07-21 06:01:28 +12:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'extractor_args': {'youtube': {
 								                'player_client': ['ios'],
 								                'player_skip': ['webpage'],
 								            }},
 								            'skip_download': True,
-												[youtube] multiple subtitles in same language

Fixes: https://github.com/ytdl-org/youtube-dl/issues/21164
Related: #310, https://github.com/ytdl-org/youtube-dl/pull/26112

											
										
										
											2021-05-13 00:50:02 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'skip': 'PO Token Required',
 								    }, {
 								        # uploader_id has non-ASCII characters that are percent-encoded in YT's JSON
 								        # https://github.com/yt-dlp/yt-dlp/pull/11818
 								        'url': 'https://www.youtube.com/shorts/18NGQq7p3LY',
 								        'info_dict': {
 								            'id': '18NGQq7p3LY',
 								            'ext': 'mp4',
 								            'title': '아이브 이서 장원영 리즈 삐끼삐끼 챌린지',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['People & Blogs'],
 								            'channel': 'ㅇㅇ',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCC25oTm2J7ZVoi5TngOHg9g',
 								            'channel_url': 'https://www.youtube.com/channel/UCC25oTm2J7ZVoi5TngOHg9g',
 								            'description': '',
 								            'duration': 3,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'short',
 								            'playable_in_embed': True,
 								            'tags': [],
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1724306170,
 								            'upload_date': '20240822',
 								            'uploader': 'ㅇㅇ',
 								            'uploader_id': '@으아-v1k',
 								            'uploader_url': 'https://www.youtube.com/@으아-v1k',
 								            'view_count': int,
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 20:28:00 +13:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }]
 								    _WEBPAGE_TESTS = [{
 								        # <object>
 								        # https://github.com/ytdl-org/youtube-dl/pull/12696
 								        'url': 'http://www.improbable.com/2017/04/03/untrained-modern-youths-and-ancient-masters-in-selfie-portraits/',
 								        'info_dict': {
 								            'id': 'msN87y-iEx0',
 								            'ext': 'mp4',
 								            'title': 'Feynman: Mirrors FUN TO IMAGINE 6',
 								            'upload_date': '20080526',
 								            'description': 'md5:873c81d308b979f0e23ee7e620b312a3',
 								            'age_limit': 0,
 								            'tags': 'count:8',
 								            'channel_id': 'UCCeo--lls1vna5YJABWAcVA',
 								            'playable_in_embed': True,
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'like_count': int,
 								            'comment_count': int,
 								            'channel': 'Christopher Sykes',
 								            'live_status': 'not_live',
 								            'channel_url': 'https://www.youtube.com/channel/UCCeo--lls1vna5YJABWAcVA',
 								            'availability': 'public',
 								            'duration': 195,
 								            'view_count': int,
 								            'categories': ['Science & Technology'],
 								            'channel_follower_count': int,
 								            'uploader': 'Christopher Sykes',
 								            'uploader_url': 'https://www.youtube.com/@ChristopherSykesDocumentaries',
 								            'uploader_id': '@ChristopherSykesDocumentaries',
 								            'heatmap': 'count:100',
 								            'timestamp': 1211825920,
 								            'media_type': 'video',
-												[extractor/youtube] Support `/live/` URL

											
										
										
											2023-02-03 23:47:13 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # <embed>
 								        # https://github.com/ytdl-org/youtube-dl/commit/2b88feedf7993c24b03e0a7ff169a548794de70c
 								        'url': 'https://badzine.de/news/als-marc-zwiebler-taufik-hidayat-schlug',
 								        'info_dict': {
 								            'id': 'bSVcWOq397g',
 								            'ext': 'mp4',
 								            'title': 'TAUFIK TUNJUKKAN KELASNYA !!! : Taufik Hidayat VS Marc Zwiebler Canada Open 2011',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Sports'],
 								            'channel': 'Badminton Addict Id',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCfCpKOwQGUe2FUJzYNadQcQ',
 								            'channel_url': 'https://www.youtube.com/channel/UCfCpKOwQGUe2FUJzYNadQcQ',
 								            'comment_count': int,
 								            'description': 'md5:2c3737da9a575f301a8380b4d60592a8',
 								            'duration': 756,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:9',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1621418412,
 								            'upload_date': '20210519',
 								            'uploader': 'Badminton Addict Id',
 								            'uploader_id': '@badmintonaddictid8958',
 								            'uploader_url': 'https://www.youtube.com/@badmintonaddictid8958',
 								            'view_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 07:58:36 +00:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # WordPress Plugin: YouTube Video Importer
 								        # https://github.com/ytdl-org/youtube-dl/commit/7deef1ba6743bf11247565e63ed7e31d2e8a9382
 								        'url': 'https://lothype.com/2025-chino-hills-hs-snare-quad-features-wgi2025-drumline/',
 								        'info_dict': {
 								            'id': 'lC21AX_pCfA',
 								            'ext': 'mp4',
 								            'title': '2025 Chino Hills HS Snare & Quad Features! #wgi2025 #drumline',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['Music'],
 								            'channel': 'DrumlineAV',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCqdfUdyiQOZMvW5PcTTYikQ',
 								            'channel_url': 'https://www.youtube.com/channel/UCqdfUdyiQOZMvW5PcTTYikQ',
 								            'comment_count': int,
 								            'description': '',
 								            'duration': 48,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'location': 'WESTMINSTER',
 								            'media_type': 'short',
 								            'playable_in_embed': True,
 								            'tags': 'count:72',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1739910835,
 								            'upload_date': '20250218',
 								            'uploader': 'DrumlineAV',
 								            'uploader_id': '@DrumlineAV',
 								            'uploader_url': 'https://www.youtube.com/@DrumlineAV',
 								            'view_count': int,
-												[extractor/youtube] Support `/live/` URL

											
										
										
											2023-02-03 23:47:13 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {'skip_download': True},
 								    }, {
 								        # lazyYT
 								        # https://github.com/ytdl-org/youtube-dl/commit/65f3a228b16c55fee959eee055767a796479270f
 								        'url': 'https://rabota7.ru/%D0%91%D1%83%D1%85%D0%B3%D0%B0%D0%BB%D1%82%D0%B5%D1%80',
 								        'info_dict': {
 								            'id': 'DexR8_tTSsQ',
 								            'ext': 'mp4',
 								            'title': 'Работа бухгалтером в Москве',
 								            'age_limit': 0,
 								            'availability': 'public',
 								            'categories': ['People & Blogs'],
 								            'channel': 'Работа в Москве свежие вакансии',
 								            'channel_follower_count': int,
 								            'channel_id': 'UCG3qz_gefGaMiSBvmaxN5WQ',
 								            'channel_url': 'https://www.youtube.com/channel/UCG3qz_gefGaMiSBvmaxN5WQ',
 								            'description': 'md5:b779d3d70af4efda26cf62b76808c0e3',
 								            'duration': 42,
 								            'like_count': int,
 								            'live_status': 'not_live',
 								            'media_type': 'video',
 								            'playable_in_embed': True,
 								            'tags': 'count:7',
 								            'thumbnail': r're:https?://i\.ytimg\.com/.+',
 								            'timestamp': 1496398980,
 								            'upload_date': '20170602',
 								            'uploader': 'Работа в Москве свежие вакансии',
 								            'uploader_id': '@РаботавМосквесвежиевакансии',
 								            'uploader_url': 'https://www.youtube.com/@РаботавМосквесвежиевакансии',
 								            'view_count': int,
-												[ie/youtube] Fix `uploader_id` extraction (#11818)

Closes #11816
Authored by: bashonly
											
										
										
											2024-12-15 20:07:18 +00:00
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								        'params': {
 								            'extractor_args': {'generic': {'impersonate': ['chrome']}},
 								            'skip_download': True,
-												[extractor, test] Basic framework for embed tests (#4307)

and split download tests so they can be more easily run in CI

Authored by: coletdjnz

											
										
										
											2022-07-08 16:53:05 +05:30
+								        },
-												[cleanup] Move embed tests to dedicated extractors (#13782)

Authored by: doe1080
											
										
										
											2025-08-02 05:50:20 +09:00
+								    }, {
 								        # data-video-url=
 								        # https://github.com/ytdl-org/youtube-dl/pull/2948
 								        'url': 'https://www.uca.ac.uk/',
 								        'info_dict': {
 								            'id': 'www.uca.ac',
 								            'title': 'UCA | Creative Arts Degrees UK | University for the Creative Arts',
 								            'age_limit': 0,
 								            'description': 'md5:179c7a06ea1ed01b94ff5d56cb18d73b',
 								            'thumbnail': '/media/uca-2020/hero-headers/2025-prospectus-all-2x2.jpg',
 								        },
 								        'playlist_count': 10,
 								        'params': {'skip_download': True},
 								    }]
-												[extractor, test] Basic framework for embed tests (#4307)

and split download tests so they can be more easily run in CI

Authored by: coletdjnz

											
										
										
											2022-07-08 16:53:05 +05:30
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								    _PLAYER_JS_VARIANT_MAP = {
 								        'main': 'player_ias.vflset/en_US/base.js',
-												[ie/youtube] Add `tcc` player JS variant (#14134)

Authored by: bashonly
											
										
										
											2025-08-23 18:43:50 -05:00
+								        'tcc': 'player_ias_tcc.vflset/en_US/base.js',
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								        'tce': 'player_ias_tce.vflset/en_US/base.js',
-												[ie/youtube] Add `es5` and `es6` player JS variants (#14005)

Authored by: bashonly
											
										
										
											2025-08-12 18:24:31 -05:00
+								        'es5': 'player_es5.vflset/en_US/base.js',
 								        'es6': 'player_es6.vflset/en_US/base.js',
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								        'tv': 'tv-player-ias.vflset/tv-player-ias.js',
 								        'tv_es6': 'tv-player-es6.vflset/tv-player-es6.js',
 								        'phone': 'player-plasma-ias-phone-en_US.vflset/base.js',
 								        'tablet': 'player-plasma-ias-tablet-en_US.vflset/base.js',
 								    }
-												[cleanup] Misc (#12802)

Authored by: bashonly
											
										
										
											2025-03-31 16:38:21 -05:00
+								    _INVERSE_PLAYER_JS_VARIANT_MAP = {v: k for k, v in _PLAYER_JS_VARIANT_MAP.items()}
-												[ie/youtube] Extract global nsig helper functions (#13639)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>

											
										
										
											2025-07-05 17:03:25 -05:00
+								    _NSIG_FUNC_CACHE_ID = 'nsig func'
 								    _DUMMY_STRING = 'dlp_wins'
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-17 08:32:33 +05:30
+								    @classmethod
 								    def suitable(cls, url):
-												[ie/youtube] Split into package (#12557)

Authored by: coletdjnz
											
										
										
											2025-03-13 17:37:33 +13:00
+								        from yt_dlp.utils import parse_qs
-												[utils] Add `parse_qs`

											
										
										
											2021-08-23 00:32:00 +05:30
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-17 08:32:33 +05:30
+								        qs = parse_qs(url)
 								        if qs.get('list', [None])[0]:
 								            return False
-												[cleanup] Upgrade syntax

Using https://github.com/asottile/pyupgrade

1. `__future__` imports and `coding: utf-8` were removed
2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format`
3. f-strings were cherry-picked from `pyupgrade --py36-plus`

Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts

											
										
										
											2022-04-11 20:40:28 +05:30
+								        return super().suitable(url)
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-17 08:32:33 +05:30
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 14:19:30 +02:00
+								    def __init__(self, *args, **kwargs):
-												[cleanup] Upgrade syntax

Using https://github.com/asottile/pyupgrade

1. `__future__` imports and `coding: utf-8` were removed
2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format`
3. f-strings were cherry-picked from `pyupgrade --py36-plus`

Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts

											
										
										
											2022-04-11 20:40:28 +05:30
+								        super().__init__(*args, **kwargs)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        self._code_cache = {}
-												Prepare signature function caching

											
										
										
											2013-09-21 15:19:48 +02:00
+								        self._player_cache = {}
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								        self._pot_director = None
 								    def _real_initialize(self):
 								        super()._real_initialize()
 								        self._pot_director = initialize_pot_director(self)
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 14:19:30 +02:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								    def _prepare_live_from_start_formats(self, formats, video_id, live_start_time, url, webpage_url, smuggled_data, is_live):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								        lock = threading.Lock()
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 15:49:35 +05:30
+								        start_time = time.time()
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								        formats = [f for f in formats if f.get('is_from_start')]
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 15:49:35 +05:30
+								        def refetch_manifest(format_id, delay):
 								            nonlocal formats, start_time, is_live
 								            if time.time() <= start_time + delay:
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								                return
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            _, _, _, _, prs, player_url = self._initial_extract(
 								                url, smuggled_data, webpage_url, 'web', video_id)
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								            video_details = traverse_obj(prs, (..., 'videoDetails'), expected_type=dict)
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								            microformats = traverse_obj(
 								                prs, (..., 'microformat', 'playerMicroformatRenderer'),
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								                expected_type=dict)
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            _, live_status, _, formats, _ = self._list_formats(video_id, microformats, video_details, prs, player_url)
 								            is_live = live_status == 'is_live'
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 15:49:35 +05:30
+								            start_time = time.time()
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 15:49:35 +05:30
+								        def mpd_feed(format_id, delay):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								            """
 								            @returns (manifest_url, manifest_stream_number, is_live) or None
 								            """
-												[extractor/youtube] Retry manifest refresh for live-from-start (#5670)

Avoids ending download early when live stream is temporarily offline.
Best used with somewhat large `--retry-sleep extractor:` and `--extractor-retries`

Authored by: mzhou
											
										
										
											2023-01-07 04:30:42 +09:00
+								            for retry in self.RetryManager(fatal=False):
 								                with lock:
 								                    refetch_manifest(format_id, delay)
 								                f = next((f for f in formats if f['format_id'] == format_id), None)
 								                if not f:
 								                    if not is_live:
 								                        retry.error = f'{video_id}: Video is no longer live'
 								                    else:
 								                        retry.error = f'Cannot find refreshed manifest for format {format_id}{bug_reports_message()}'
 								                    continue
-												[ie/youtube] Fix `--live-from-start` support for premieres (#13079)

Closes #8543
Authored by: arabcoders
											
										
										
											2025-05-03 18:23:28 +03:00
 								                # Formats from ended premieres will be missing a manifest_url
 								                # See https://github.com/yt-dlp/yt-dlp/issues/8543
 								                if not f.get('manifest_url'):
 								                    break
-												[extractor/youtube] Retry manifest refresh for live-from-start (#5670)

Avoids ending download early when live stream is temporarily offline.
Best used with somewhat large `--retry-sleep extractor:` and `--extractor-retries`

Authored by: mzhou
											
										
										
											2023-01-07 04:30:42 +09:00
+								                return f['manifest_url'], f['manifest_stream_number'], is_live
 								            return None
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
 								        for f in formats:
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            f['is_live'] = is_live
 								            gen = functools.partial(self._live_dash_fragments, video_id, f['format_id'],
 								                                    live_start_time, mpd_feed, not is_live and f.copy())
 								            if is_live:
 								                f['fragments'] = gen
 								                f['protocol'] = 'http_dash_segments_generator'
 								            else:
 								                f['fragments'] = LazyList(gen({}))
 								                del f['is_from_start']
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								    def _live_dash_fragments(self, video_id, format_id, live_start_time, mpd_feed, manifestless_orig_fmt, ctx):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								        FETCH_SPAN, MAX_DURATION = 5, 432000
 								        mpd_url, stream_number, is_live = None, None, True
 								        begin_index = 0
 								        download_start_time = ctx.get('start') or time.time()
 								        lack_early_segments = download_start_time - (live_start_time or download_start_time) > MAX_DURATION
 								        if lack_early_segments:
 								            self.report_warning(bug_reports_message(
 								                'Starting download from the last 120 hours of the live stream since '
 								                'YouTube does not have data before that. If you think this is wrong,'), only_once=True)
 								            lack_early_segments = True
 								        known_idx, no_fragment_score, last_segment_url = begin_index, 0, None
 								        fragments, fragment_base_url = None, None
-												[downloader/fragment] Improve `--live-from-start` for YouTube livestreams (#2870)


											
										
										
											2022-02-25 02:00:46 +09:00
+								        def _extract_sequence_from_mpd(refresh_sequence, immediate):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								            nonlocal mpd_url, stream_number, is_live, no_fragment_score, fragments, fragment_base_url
 								            # Obtain from MPD's maximum seq value
 								            old_mpd_url = mpd_url
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 15:49:35 +05:30
+								            last_error = ctx.pop('last_error', None)
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 16:29:30 +01:00
+								            expire_fast = immediate or (last_error and isinstance(last_error, HTTPError) and last_error.status == 403)
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 15:49:35 +05:30
+								            mpd_url, stream_number, is_live = (mpd_feed(format_id, 5 if expire_fast else 18000)
 								                                               or (mpd_url, stream_number, False))
 								            if not refresh_sequence:
 								                if expire_fast and not is_live:
 								                    return False, last_seq
 								                elif old_mpd_url == mpd_url:
 								                    return True, last_seq
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            if manifestless_orig_fmt:
 								                fmt_info = manifestless_orig_fmt
 								            else:
 								                try:
 								                    fmts, _ = self._extract_mpd_formats_and_subtitles(
 								                        mpd_url, None, note=False, errnote=False, fatal=False)
 								                except ExtractorError:
 								                    fmts = None
 								                if not fmts:
 								                    no_fragment_score += 2
 								                    return False, last_seq
 								                fmt_info = next(x for x in fmts if x['manifest_stream_number'] == stream_number)
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								            fragments = fmt_info['fragments']
 								            fragment_base_url = fmt_info['fragment_base_url']
 								            assert fragment_base_url
 								            _last_seq = int(re.search(r'(?:/|^)sq/(\d+)', fragments[-1]['path']).group(1))
 								            return True, _last_seq
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								        self.write_debug(f'[{video_id}] Generating fragments for format {format_id}')
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								        while is_live:
 								            fetch_time = time.time()
 								            if no_fragment_score > 30:
 								                return
 								            if last_segment_url:
 								                # Obtain from "X-Head-Seqnum" header value from each segment
 								                try:
 								                    urlh = self._request_webpage(
 								                        last_segment_url, None, note=False, errnote=False, fatal=False)
 								                except ExtractorError:
 								                    urlh = None
 								                last_seq = try_get(urlh, lambda x: int_or_none(x.headers['X-Head-Seqnum']))
 								                if last_seq is None:
-												[downloader/fragment] Improve `--live-from-start` for YouTube livestreams (#2870)


											
										
										
											2022-02-25 02:00:46 +09:00
+								                    no_fragment_score += 2
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								                    last_segment_url = None
 								                    continue
 								            else:
-												[downloader/fragment] Improve `--live-from-start` for YouTube livestreams (#2870)


											
										
										
											2022-02-25 02:00:46 +09:00
+								                should_continue, last_seq = _extract_sequence_from_mpd(True, no_fragment_score > 15)
 								                no_fragment_score += 2
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 15:49:35 +05:30
+								                if not should_continue:
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								                    continue
 								            if known_idx > last_seq:
 								                last_segment_url = None
 								                continue
 								            last_seq += 1
 								            if begin_index < 0 and known_idx < 0:
 								                # skip from the start when it's negative value
 								                known_idx = last_seq + begin_index
 								            if lack_early_segments:
 								                known_idx = max(known_idx, last_seq - int(MAX_DURATION // fragments[-1]['duration']))
 								            try:
 								                for idx in range(known_idx, last_seq):
 								                    # do not update sequence here or you'll get skipped some part of it
-												[downloader/fragment] Improve `--live-from-start` for YouTube livestreams (#2870)


											
										
										
											2022-02-25 02:00:46 +09:00
+								                    should_continue, _ = _extract_sequence_from_mpd(False, False)
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 15:49:35 +05:30
+								                    if not should_continue:
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								                        known_idx = idx - 1
 								                        raise ExtractorError('breaking out of outer loop')
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                    last_segment_url = urljoin(fragment_base_url, f'sq/{idx}')
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								                    yield {
 								                        'url': last_segment_url,
-												[dash] Show fragment count with `--live-from-start` (#3493)

Authored by: flashdagger
											
										
										
											2022-06-07 14:44:08 +02:00
+								                        'fragment_count': last_seq,
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								                    }
 								                if known_idx == last_seq:
 								                    no_fragment_score += 5
 								                else:
 								                    no_fragment_score = 0
 								                known_idx = last_seq
 								            except ExtractorError:
 								                continue
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            if manifestless_orig_fmt:
 								                # Stop at the first iteration if running for post-live manifestless;
 								                # fragment count no longer increase since it starts
 								                break
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								            time.sleep(max(0, FETCH_SPAN + fetch_time - time.time()))
-												[ie/youtube] Force player `0004de42` (#14398)

Closes #14400
Authored by: seproDev
											
										
										
											2025-09-23 07:07:28 +02:00
+								    def _get_player_js_version(self):
 								        player_js_version = self._configuration_arg('player_js_version', [''])[0] or '20348@0004de42'
 								        if player_js_version == 'actual':
 								            return None, None
 								        if not re.fullmatch(r'[0-9]{5,}@[0-9a-f]{8,}', player_js_version):
 								            self.report_warning(
 								                f'Invalid player JS version "{player_js_version}" specified. '
 								                f'It should be "actual" or in the format of STS@HASH', only_once=True)
 								            return None, None
 								        return player_js_version.split('@')
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								    def _extract_player_url(self, *ytcfgs, webpage=None):
 								        player_url = traverse_obj(
 								            ytcfgs, (..., 'PLAYER_JS_URL'), (..., 'WEB_PLAYER_CONTEXT_CONFIGS', ..., 'jsUrl'),
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 16:24:43 +05:30
+								            get_all=False, expected_type=str)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        if not player_url:
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								            return
-												[ie/youtube] Force player `0004de42` (#14398)

Closes #14400
Authored by: seproDev
											
										
										
											2025-09-23 07:07:28 +02:00
+								        player_id_override = self._get_player_js_version()[1]
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
-												[ie/youtube] Default to `main` player JS variant (#14079)

Authored by: bashonly
											
										
										
											2025-08-19 14:28:15 -05:00
+								        requested_js_variant = self._configuration_arg('player_js_variant', [''])[0] or 'main'
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								        if requested_js_variant in self._PLAYER_JS_VARIANT_MAP:
-												[ie/youtube] Force player `0004de42` (#14398)

Closes #14400
Authored by: seproDev
											
										
										
											2025-09-23 07:07:28 +02:00
+								            player_id = player_id_override or self._extract_player_info(player_url)
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								            original_url = player_url
 								            player_url = f'/s/player/{player_id}/{self._PLAYER_JS_VARIANT_MAP[requested_js_variant]}'
 								            if original_url != player_url:
 								                self.write_debug(
 								                    f'Forcing "{requested_js_variant}" player JS variant for player {player_id}\n'
 								                    f'        original url = {original_url}', only_once=True)
 								        elif requested_js_variant != 'actual':
 								            self.report_warning(
 								                f'Invalid player JS variant name "{requested_js_variant}" requested. '
 								                f'Valid choices are: {", ".join(self._PLAYER_JS_VARIANT_MAP)}', only_once=True)
-												[youtube] Ensure subtitle urls are absolute (#2765)

Closes #2755

Authored by: coletdjnz
											
										
										
											2022-02-13 21:36:01 +00:00
+								        return urljoin('https://www.youtube.com', player_url)
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-30 10:07:49 +12:00
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								    def _download_player_url(self, video_id, fatal=False):
-												[ie/youtube] Retry on more critical requests (#12339)

Authored by: coletdjnz
											
										
										
											2025-02-19 13:39:51 +13:00
+								        iframe_webpage = self._download_webpage_with_retries(
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								            'https://www.youtube.com/iframe_api',
-												[ie/youtube] Retry on more critical requests (#12339)

Authored by: coletdjnz
											
										
										
											2025-02-19 13:39:51 +13:00
+								            note='Downloading iframe API JS',
 								            video_id=video_id, retry_fatal=fatal)
 								        if iframe_webpage:
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								            player_version = self._search_regex(
-												[ie/youtube] Retry on more critical requests (#12339)

Authored by: coletdjnz
											
										
										
											2025-02-19 13:39:51 +13:00
+								                r'player\\?/([0-9a-fA-F]{8})\\?/', iframe_webpage, 'player version', fatal=fatal)
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								            if player_version:
 								                return f'https://www.youtube.com/s/player/{player_version}/player_ias.vflset/en_US/base.js'
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								    def _player_js_cache_key(self, player_url):
 								        player_id = self._extract_player_info(player_url)
 								        player_path = remove_start(urllib.parse.urlparse(player_url).path, f'/s/player/{player_id}/')
-												[ie/youtube] Detect player JS variants for any locale (#13003)

Authored by: bashonly
											
										
										
											2025-04-26 17:08:34 -05:00
+								        variant = self._INVERSE_PLAYER_JS_VARIANT_MAP.get(player_path) or next((
 								            v for k, v in self._INVERSE_PLAYER_JS_VARIANT_MAP.items()
 								            if re.fullmatch(re.escape(k).replace('en_US', r'[a-zA-Z0-9_]+'), player_path)), None)
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								        if not variant:
 								            self.write_debug(
 								                f'Unable to determine player JS variant\n'
 								                f'        player = {player_url}', only_once=True)
 								            variant = re.sub(r'[^a-zA-Z0-9]', '_', remove_end(player_path, '.js'))
 								        return join_nonempty(player_id, variant)
-												[youtube] Make cache ID a tuple of lengths instead of just the whole length

											
										
										
											2014-08-02 12:21:53 +02:00
+								    def _signature_cache_id(self, example_sig):
 								        """ Return a string representation of a signature """
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 16:24:43 +05:30
+								        return '.'.join(str(len(part)) for part in example_sig.split('.'))
-												[youtube] Make cache ID a tuple of lengths instead of just the whole length

											
										
										
											2014-08-02 12:21:53 +02:00
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-02 07:18:08 +07:00
+								    @classmethod
 								    def _extract_player_info(cls, player_url):
 								        for player_re in cls._PLAYER_INFO_RE:
 								            id_m = re.search(player_re, player_url)
 								            if id_m:
 								                break
 								        else:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            raise ExtractorError(f'Cannot identify player {player_url!r}')
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        return id_m.group('id')
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-02 07:18:08 +07:00
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
+								    def _load_player(self, video_id, player_url, fatal=True):
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								        player_js_key = self._player_js_cache_key(player_url)
 								        if player_js_key not in self._code_cache:
-												[youtube] Fix non-fatal errors in fetching player

											
										
										
											2021-10-04 02:44:55 +05:30
+								            code = self._download_webpage(
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-30 10:07:49 +12:00
+								                player_url, video_id, fatal=fatal,
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								                note=f'Downloading player {player_js_key}',
 								                errnote=f'Download of {player_js_key} failed')
-												[youtube] Fix non-fatal errors in fetching player

											
										
										
											2021-10-04 02:44:55 +05:30
+								            if code:
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								                self._code_cache[player_js_key] = code
 								        return self._code_cache.get(player_js_key)
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-30 10:07:49 +12:00
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-02 07:18:08 +07:00
+								    def _extract_signature_function(self, video_id, player_url, example_sig):
-												[youtube] Add filesystem signature cache

											
										
										
											2013-09-22 00:35:03 +02:00
+								        # Read from filesystem cache
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								        func_id = join_nonempty(
 								            self._player_js_cache_key(player_url), self._signature_cache_id(example_sig))
-												[youtube] Add filesystem signature cache

											
										
										
											2013-09-22 00:35:03 +02:00
+								        assert os.path.basename(func_id) == func_id
-												[youtube] Move cache into its own module

											
										
										
											2014-09-03 12:41:05 +02:00
-												[cleanup] Misc cleanup

											
										
										
											2022-06-28 10:40:54 +05:30
+								        self.write_debug(f'Extracting signature function {func_id}')
-												[cleanup] Misc (#13595)

Closes #10853, Closes #12436, Closes #13314, Closes #13609
Authored by: seproDev, InvalidUsernameException, doe1080, hseg, bashonly, adamralph

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
Co-authored-by: InvalidUsernameException <InvalidUsernameException@users.noreply.github.com>
Co-authored-by: gesh <gesh@gesh.uni.cx>
Co-authored-by: Adam Ralph <adam@adamralph.com>
Co-authored-by: doe1080 <98906116+doe1080@users.noreply.github.com>
											
										
										
											2025-07-22 01:43:30 +02:00
+								        cache_spec, code = self.cache.load('youtube-sigfuncs', func_id, min_ver='2025.07.21'), None
-												Prepare signature function caching

											
										
										
											2013-09-21 15:19:48 +02:00
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								        if not cache_spec:
 								            code = self._load_player(video_id, player_url)
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
+								        if code:
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								            res = self._parse_sig_js(code, player_url)
-												[compat] Remove more functions

Removing any more will require changes to a large number of extractors

											
										
										
											2022-06-24 13:40:17 +05:30
+								            test_string = ''.join(map(chr, range(len(example_sig))))
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								            cache_spec = [ord(c) for c in res(test_string)]
-												[extractor, cleanup] Reduce direct use of `_downloader`

											
										
										
											2022-06-23 09:44:22 +05:30
+								            self.cache.store('youtube-sigfuncs', func_id, cache_spec)
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
 								        return lambda s: ''.join(s[i] for i in cache_spec)
-												Prepare signature function caching

											
										
										
											2013-09-21 15:19:48 +02:00
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								    def _parse_sig_js(self, jscode, player_url):
-												[ie/youtube] Fix signature function extraction (#11751)

Closes #11748
Authored by: bashonly
											
										
										
											2024-12-06 15:34:13 +00:00
+								        # Examples where `sig` is funcname:
 								        # sig=function(a){a=a.split(""); ... ;return a.join("")};
 								        # ;c&&(c=sig(decodeURIComponent(c)),a.set(b,encodeURIComponent(c)));return a};
 								        # {var l=f,m=h.sp,n=sig(decodeURIComponent(h.s));l.set(m,encodeURIComponent(n))}
 								        # sig=function(J){J=J.split(""); ... ;return J.join("")};
 								        # ;N&&(N=sig(decodeURIComponent(N)),J.set(R,encodeURIComponent(N)));return J};
 								        # {var H=u,k=f.sp,v=sig(decodeURIComponent(f.s));H.set(k,encodeURIComponent(v))}
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 14:19:30 +02:00
+								        funcname = self._search_regex(
-												[ie/youtube] Fix signature function extraction for `2f1832d2` (#11801)

Closes #11798
Authored by: bashonly
											
										
										
											2024-12-13 09:43:08 +00:00
+								            (r'\b(?P<var>[a-zA-Z0-9_$]+)&&\((?P=var)=(?P<sig>[a-zA-Z0-9_$]{2,})\(decodeURIComponent\((?P=var)\)\)',
 								             r'(?P<sig>[a-zA-Z0-9_$]+)\s*=\s*function\(\s*(?P<arg>[a-zA-Z0-9_$]+)\s*\)\s*{\s*(?P=arg)\s*=\s*(?P=arg)\.split\(\s*""\s*\)\s*;\s*[^}]+;\s*return\s+(?P=arg)\.join\(\s*""\s*\)',
 								             r'(?:\b|[^a-zA-Z0-9_$])(?P<sig>[a-zA-Z0-9_$]{2,})\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\)(?:;[a-zA-Z0-9_$]{2}\.[a-zA-Z0-9_$]{2}\(a,\d+\))?',
-												[ie/youtube] Fix signature function extraction (#11751)

Closes #11748
Authored by: bashonly
											
										
										
											2024-12-06 15:34:13 +00:00
+								             # Old patterns
 								             r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
-												[youtube] Update signature function patterns (closes #21469, closes #21476)

											
										
										
											2019-06-21 22:58:42 +07:00
+								             r'\b[a-zA-Z0-9]+\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
-												[youtube] Improve signature function detection (#641)

Authored by: PSlava (Slava <slash@i-slash.com>)
											
										
										
											2021-08-08 09:54:37 +06:00
+								             r'\bm=(?P<sig>[a-zA-Z0-9$]{2,})\(decodeURIComponent\(h\.s\)\)',
-												[youtube] Update signature function patterns (closes #21469, closes #21476)

											
										
										
											2019-06-21 22:58:42 +07:00
+								             # Obsolete patterns
-												Update to ytdl-commit-d1c6c5

[YouTube] [core] Improve platform debug log, based on yt-dlp
https://github.com/ytdl-org/youtube-dl/commit/d1c6c5c4d618fa950813c0c71aede34a5ac851e9

Except:
    * 6ed34338285f722d0da312ce0af3a15a077a3e2a [jsinterp] Add short-cut evaluation for common expression
        * There was no performance improvement when tested with https://github.com/ytdl-org/youtube-dl/issues/30641
    * e8de54bce50f6f77a4d7e8e80675f7003d5bf630 [core] Handle `/../` sequences in HTTP URLs
        * We plan to implement this differently

											
										
										
											2023-05-24 23:30:43 +05:30
+								             r'("|\')signature\1\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
-												[youtube] Fix extraction (closes #17457, closes #17464)

											
										
										
											2018-09-08 03:36:10 +07:00
+								             r'\.sig\|\|(?P<sig>[a-zA-Z0-9$]+)\(',
-												[youtube] Update signature function patterns (closes #21469, closes #21476)

											
										
										
											2019-06-21 22:58:42 +07:00
+								             r'yt\.akamaized\.net/\)\s*\|\|\s*.*?\s*[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?:encodeURIComponent\s*\()?\s*(?P<sig>[a-zA-Z0-9$]+)\(',
 								             r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
 								             r'\bc\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\('),
-												[youtube] Fix extraction for domainless player URLs

Closes #11890
Closes #11891
Closes #11892
Closes #11894
Closes #11895
Closes #11897
Closes #11900
Closes #11903
Closes #11904
Closes #11906
Closes #11907
Closes #11909
Closes #11913
Closes #11914
Closes #11915
Closes #11916
Closes #11917
Closes #11918
Closes #11919

											
										
										
											2017-01-31 22:19:29 +07:00
+								            jscode, 'Initial JS player signature function name', group='sig')
-												[youtube] Move JavaScript interpreter into its own module

											
										
										
											2014-03-30 07:02:58 +02:00
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								        varname, global_list = self._interpret_player_js_global_var(jscode, player_url)
-												[youtube] Move JavaScript interpreter into its own module

											
										
										
											2014-03-30 07:02:58 +02:00
+								        jsi = JSInterpreter(jscode)
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								        initial_function = jsi.extract_function(funcname, filter_dict({varname: global_list}))
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 14:19:30 +02:00
+								        return lambda s: initial_function([s])
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								    def _cached(self, func, *cache_id):
 								        def inner(*args, **kwargs):
 								            if cache_id not in self._player_cache:
 								                try:
 								                    self._player_cache[cache_id] = func(*args, **kwargs)
 								                except ExtractorError as e:
 								                    self._player_cache[cache_id] = e
 								                except Exception as e:
 								                    self._player_cache[cache_id] = ExtractorError(traceback.format_exc(), cause=e)
 								            ret = self._player_cache[cache_id]
 								            if isinstance(ret, Exception):
 								                raise ret
 								            return ret
 								        return inner
-												[ie/youtube] Cache signature timestamps (#13047)

Closes #12825
Authored by: bashonly
											
										
										
											2025-04-29 20:15:17 -05:00
+								    def _load_player_data_from_cache(self, name, player_url):
 								        cache_id = (f'youtube-{name}', self._player_js_cache_key(player_url))
-												[ie/youtube] Only cache nsig code on successful decoding (#12750)

Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-26 00:47:45 +01:00
-												[ie/youtube] Cache signature timestamps (#13047)

Closes #12825
Authored by: bashonly
											
										
										
											2025-04-29 20:15:17 -05:00
+								        if data := self._player_cache.get(cache_id):
 								            return data
-												[ie/youtube] Only cache nsig code on successful decoding (#12750)

Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-26 00:47:45 +01:00
-												[cleanup] Misc (#13595)

Closes #10853, Closes #12436, Closes #13314, Closes #13609
Authored by: seproDev, InvalidUsernameException, doe1080, hseg, bashonly, adamralph

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
Co-authored-by: InvalidUsernameException <InvalidUsernameException@users.noreply.github.com>
Co-authored-by: gesh <gesh@gesh.uni.cx>
Co-authored-by: Adam Ralph <adam@adamralph.com>
Co-authored-by: doe1080 <98906116+doe1080@users.noreply.github.com>
											
										
										
											2025-07-22 01:43:30 +02:00
+								        data = self.cache.load(*cache_id, min_ver='2025.07.21')
-												[ie/youtube] Cache signature timestamps (#13047)

Closes #12825
Authored by: bashonly
											
										
										
											2025-04-29 20:15:17 -05:00
+								        if data:
 								            self._player_cache[cache_id] = data
-												[ie/youtube] Only cache nsig code on successful decoding (#12750)

Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-26 00:47:45 +01:00
-												[ie/youtube] Cache signature timestamps (#13047)

Closes #12825
Authored by: bashonly
											
										
										
											2025-04-29 20:15:17 -05:00
+								        return data
-												[ie/youtube] Only cache nsig code on successful decoding (#12750)

Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-26 00:47:45 +01:00
-												[ie/youtube] Cache signature timestamps (#13047)

Closes #12825
Authored by: bashonly
											
										
										
											2025-04-29 20:15:17 -05:00
+								    def _store_player_data_to_cache(self, name, player_url, data):
 								        cache_id = (f'youtube-{name}', self._player_js_cache_key(player_url))
-												[ie/youtube] Only cache nsig code on successful decoding (#12750)

Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-26 00:47:45 +01:00
+								        if cache_id not in self._player_cache:
-												[ie/youtube] Cache signature timestamps (#13047)

Closes #12825
Authored by: bashonly
											
										
										
											2025-04-29 20:15:17 -05:00
+								            self.cache.store(*cache_id, data)
 								            self._player_cache[cache_id] = data
-												[ie/youtube] Only cache nsig code on successful decoding (#12750)

Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-26 00:47:45 +01:00
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								    def _decrypt_signature(self, s, video_id, player_url):
-												keep track of the dates and html5player versions of working YT signature algos

											
										
										
											2013-06-27 22:20:50 +02:00
+								        """Turn the encrypted s field into a working signature"""
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								        extract_sig = self._cached(
 								            self._extract_signature_function, 'sig', player_url, self._signature_cache_id(s))
 								        func = extract_sig(video_id, player_url, s)
 								        return func(s)
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
 								    def _decrypt_nsig(self, s, video_id, player_url):
 								        """Run the player's n function on the encrypted n field and return the result

 								        The function is first run natively; if that raises JSInterpreter.Exception
 								        the same function code is executed with PhantomJS instead.
 								        Raises ExtractorError if player_url is None or the function code cannot be extracted
 								        """
 								        if player_url is None:
 								            raise ExtractorError('Cannot decrypt nsig without player_url')
 								        player_url = urljoin('https://www.youtube.com', player_url)
 								        try:
 								            native_jsi, _, func_code = self._extract_n_function_code(video_id, player_url)
 								        except ExtractorError as extraction_error:
 								            raise ExtractorError('Unable to extract nsig function code', cause=extraction_error)
 								        try:
 								            cached_extractor = self._cached(
 								                self._extract_n_function_from_code, self._NSIG_FUNC_CACHE_ID, player_url)
 								            nsig_func = cached_extractor(native_jsi, func_code)
 								            decrypted = nsig_func(s)
 								        except JSInterpreter.Exception as native_error:
 								            try:
 								                phantom = PhantomJSwrapper(self, timeout=5000)
 								            except ExtractorError:
 								                # The fallback could not be set up: surface the native failure instead
 								                raise native_error
 								            self.report_warning(
 								                f'Native nsig extraction failed: Trying with PhantomJS\n'
 								                f'         n = {s} ; player = {player_url}', video_id)
 								            self.write_debug(native_error, only_once=True)
 								            arg_names, func_body = func_code
 								            script = f'console.log(function({", ".join(arg_names)}) {{ {func_body} }}({s!r}));'
 								            decrypted = phantom.execute(
 								                script, video_id=video_id, note='Executing signature code').strip()
 								        self.write_debug(f'Decrypted nsig {s} => {decrypted}')
 								        # Only cache nsig func JS code to disk if successful, and only once
 								        self._store_player_data_to_cache('nsig', player_url, func_code)
 								        return decrypted
-												[cleanup] Misc (#10623)

Authored by: bashonly
											
										
										
											2024-08-01 10:03:49 -05:00
+								    def _extract_n_function_name(self, jscode, player_url=None):
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								        varname, global_list = self._interpret_player_js_global_var(jscode, player_url)
-												[ie/youtube] nsig code improvements and cleanup (#13280)

Authored by: bashonly
											
										
										
											2025-05-26 17:54:43 -05:00
+								        if debug_str := traverse_obj(global_list, (lambda _, v: v.endswith('-_w8_'), any)):
-												[ie/youtube] Rework nsig function name extraction (#13403)

Closes #13401

Authored by: Grub4K
											
										
										
											2025-06-05 23:50:58 +02:00
+								            pattern = r'''(?x)
 								                \{\s*return\s+%s\[%d\]\s*\+\s*(?P<argname>[a-zA-Z0-9_$]+)\s*\}
 								            ''' % (re.escape(varname), global_list.index(debug_str))
 								            if match := re.search(pattern, jscode):
 								                pattern = r'''(?x)
 								                    \{\s*\)%s\(\s*
 								                    (?:
 								                        (?P<funcname_a>[a-zA-Z0-9_$]+)\s*noitcnuf\s*
 								                        |noitcnuf\s*=\s*(?P<funcname_b>[a-zA-Z0-9_$]+)(?:\s+rav)?
 								                    )[;\n]
 								                ''' % re.escape(match.group('argname')[::-1])
 								                if match := re.search(pattern, jscode[match.start()::-1]):
 								                    a, b = match.group('funcname_a', 'funcname_b')
 								                    return (a or b)[::-1]
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								            self.write_debug(join_nonempty(
 								                'Initial search was unable to find nsig function name',
 								                player_url and f'        player = {player_url}', delim='\n'), only_once=True)
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								        # Examples (with placeholders nfunc, narray, idx):
 								        # *  .get("n"))&&(b=nfunc(b)
 								        # *  .get("n"))&&(b=narray[idx](b)
 								        # *  b=String.fromCharCode(110),c=a.get(b))&&c=narray[idx](c)
 								        # *  a.D&&(b="nn"[+a.D],c=a.get(b))&&(c=narray[idx](c),a.set(b,c),narray.length||nfunc("")
 								        # *  a.D&&(PL(a),b=a.j.n||null)&&(b=narray[0](b),a.set("n",b),narray.length||nfunc("")
-												[ie/youtube] Fix `n` function name extraction for player `b12cc44b` (#10668)

Authored by: seproDev
											
										
										
											2024-08-05 22:36:11 +02:00
+								        # *  a.D&&(b="nn"[+a.D],vL(a),c=a.j[b]||null)&&(c=narray[idx](c),a.set(b,c),narray.length||nfunc("")
-												[ie/youtube] Fix `n` sig extraction for player `3bb1f723` (#11750)

Closes #11744
Authored by: bashonly
											
										
										
											2024-12-06 15:35:18 +00:00
+								        # *  J.J="";J.url="";J.Z&&(R="nn"[+J.Z],mW(J),N=J.K[R]||null)&&(N=narray[idx](N),J.set(R,N))}};
-												[test] Fix test_youtube_signature

											
										
										
											2022-08-21 00:51:03 +05:30
+								        funcname, idx = self._search_regex(
-												[ie/youtube] Fix `n` function name extraction for player `3400486c` (#10542)

Authored by: bashonly
											
										
										
											2024-07-23 16:25:49 -05:00
+								            r'''(?x)
 								            (?:
 								                \.get\("n"\)\)&&\(b=|
 								                (?:
 								                    b=String\.fromCharCode\(110\)|
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								                    (?P<str_idx>[a-zA-Z0-9_$.]+)&&\(b="nn"\[\+(?P=str_idx)\]
-												[ie/youtube] Fix `n` function name extraction for player `b12cc44b` (#10668)

Authored by: seproDev
											
										
										
											2024-08-05 22:36:11 +02:00
+								                )
 								                (?:
 								                    ,[a-zA-Z0-9_$]+\(a\))?,c=a\.
 								                    (?:
 								                        get\(b\)|
 								                        [a-zA-Z0-9_$]+\[b\]\|\|null
 								                    )\)&&\(c=|
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								                \b(?P<var>[a-zA-Z0-9_$]+)=
 								            )(?P<nfunc>[a-zA-Z0-9_$]+)(?:\[(?P<idx>\d+)\])?\([a-zA-Z]\)
-												[ie/youtube] Fix `n` sig extraction for player `3bb1f723` (#11750)

Closes #11744
Authored by: bashonly
											
										
										
											2024-12-06 15:35:18 +00:00
+								            (?(var),[a-zA-Z0-9_$]+\.set\((?:"n+"|[a-zA-Z0-9_$]+)\,(?P=var)\))''',
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								            jscode, 'n function name', group=('nfunc', 'idx'), default=(None, None))
 								        if not funcname:
-												[cleanup] Misc (#10623)

Authored by: bashonly
											
										
										
											2024-08-01 10:03:49 -05:00
+								            self.report_warning(join_nonempty(
 								                'Falling back to generic n function search',
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								                player_url and f'         player = {player_url}', delim='\n'), only_once=True)
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								            return self._search_regex(
 								                r'''(?xs)
 								                ;\s*(?P<name>[a-zA-Z0-9_$]+)\s*=\s*function\([a-zA-Z0-9_$]+\)
-												[ie/youtube] Fix `n` sig extraction for player `3bb1f723` (#11750)

Closes #11744
Authored by: bashonly
											
										
										
											2024-12-06 15:35:18 +00:00
+								                \s*\{(?:(?!};).)+?return\s*(?P<q>["'])[\w-]+_w8_(?P=q)\s*\+\s*[a-zA-Z0-9_$]+''',
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								                jscode, 'Initial JS player n function name', group='name')
 								        elif not idx:
-												[test] Fix test_youtube_signature

											
										
										
											2022-08-21 00:51:03 +05:30
+								            return funcname
 								        return json.loads(js_to_json(self._search_regex(
-												[cleanup] Misc

											
										
										
											2023-07-06 20:09:42 +05:30
+								            rf'var {re.escape(funcname)}\s*=\s*(\[.+?\])\s*[,;]', jscode,
-												[test] Fix test_youtube_signature

											
										
										
											2022-08-21 00:51:03 +05:30
+								            f'Initial JS player n function list ({funcname}.{idx})')))[int(idx)]
-												[ie/youtube] nsig code improvements and cleanup (#13280)

Authored by: bashonly
											
										
										
											2025-05-26 17:54:43 -05:00
+								    def _interpret_player_js_global_var(self, jscode, player_url):
 								        """Returns tuple of: variable name string, variable value list"""
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								        extract_global_var = self._cached(self._search_regex, 'js global array', player_url)
 								        varcode, varname, varvalue = extract_global_var(
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 21:58:10 +01:00
+								            r'''(?x)
-												[ie/youtube] Fix signature and nsig extraction for player `363db69b` (#12725)

Closes #12724
Authored by: bashonly
											
										
										
											2025-03-24 16:18:51 -05:00
+								                (?P<q1>["\'])use\s+strict(?P=q1);\s*
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 21:58:10 +01:00
+								                (?P<code>
 								                    var\s+(?P<name>[a-zA-Z0-9_$]+)\s*=\s*
-												[ie/youtube] Fix signature and nsig extraction for player `363db69b` (#12725)

Closes #12724
Authored by: bashonly
											
										
										
											2025-03-24 16:18:51 -05:00
+								                    (?P<value>
 								                        (?P<q2>["\'])(?:(?!(?P=q2)).|\\.)+(?P=q2)
 								                        \.split\((?P<q3>["\'])(?:(?!(?P=q3)).)+(?P=q3)\)
-												[ie/youtube] Fix signature and nsig extraction for player `4fcd6e4a` (#12748)

Closes #12746
Authored by: seproDev
											
										
										
											2025-03-26 00:40:58 +01:00
+								                        |\[\s*(?:(?P<q4>["\'])(?:(?!(?P=q4)).|\\.)*(?P=q4)\s*,?\s*)+\]
-												[ie/youtube] Fix signature and nsig extraction for player `363db69b` (#12725)

Closes #12724
Authored by: bashonly
											
										
										
											2025-03-24 16:18:51 -05:00
+								                    )
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 21:58:10 +01:00
+								                )[;,]
 								            ''', jscode, 'global variable', group=('code', 'name', 'value'), default=(None, None, None))
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								        if not varcode:
 								            self.write_debug(join_nonempty(
 								                'No global array variable found in player JS',
 								                player_url and f'        player = {player_url}', delim='\n'), only_once=True)
-												[ie/youtube] nsig code improvements and cleanup (#13280)

Authored by: bashonly
											
										
										
											2025-05-26 17:54:43 -05:00
+								            return None, None
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
-												[ie/youtube] nsig code improvements and cleanup (#13280)

Authored by: bashonly
											
										
										
											2025-05-26 17:54:43 -05:00
+								        jsi = JSInterpreter(varcode)
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								        interpret_global_var = self._cached(jsi.interpret_expression, 'js global list', player_url)
-												[ie/youtube] Extract global nsig helper functions (#13639)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>

											
										
										
											2025-07-05 17:03:25 -05:00
+								        return varname, interpret_global_var(varvalue, LocalNameSpace(), allow_recursion=10)
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
 								    def _fixup_n_function_code(self, argnames, nsig_code, jscode, player_url):
-												[ie/youtube] Extract global nsig helper functions (#13639)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>

											
										
										
											2025-07-05 17:03:25 -05:00
+								        # Fixup global array
-												[ie/youtube] nsig code improvements and cleanup (#13280)

Authored by: bashonly
											
										
										
											2025-05-26 17:54:43 -05:00
+								        varname, global_list = self._interpret_player_js_global_var(jscode, player_url)
 								        if varname and global_list:
 								            nsig_code = f'var {varname}={json.dumps(global_list)}; {nsig_code}'
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 21:58:10 +01:00
+								        else:
-												[ie/youtube] Extract global nsig helper functions (#13639)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>

											
										
										
											2025-07-05 17:03:25 -05:00
+								            varname = self._DUMMY_STRING
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								            global_list = []
-												[ie/youtube] Extract global nsig helper functions (#13639)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>

											
										
										
											2025-07-05 17:03:25 -05:00
+								        # Fixup typeof check
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								        undefined_idx = global_list.index('undefined') if 'undefined' in global_list else r'\d+'
 								        fixed_code = re.sub(
-												[ie/youtube] nsig code improvements and cleanup (#13280)

Authored by: bashonly
											
										
										
											2025-05-26 17:54:43 -05:00
+								            fr'''(?x)
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								                ;\s*if\s*\(\s*typeof\s+[a-zA-Z0-9_$]+\s*===?\s*(?:
 								                    (["\'])undefined\1|
 								                    {re.escape(varname)}\[{undefined_idx}\]
 								                )\s*\)\s*return\s+{re.escape(argnames[0])};
 								            ''', ';', nsig_code)
 								        if fixed_code == nsig_code:
 								            self.write_debug(join_nonempty(
 								                'No typeof statement found in nsig function code',
 								                player_url and f'        player = {player_url}', delim='\n'), only_once=True)
-												[ie/youtube] Extract global nsig helper functions (#13639)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>

											
										
										
											2025-07-05 17:03:25 -05:00
 								        # Fixup global funcs
 								        jsi = JSInterpreter(fixed_code)
 								        cache_id = (self._NSIG_FUNC_CACHE_ID, player_url)
 								        try:
 								            self._cached(
 								                self._extract_n_function_from_code, *cache_id)(jsi, (argnames, fixed_code))(self._DUMMY_STRING)
 								        except JSInterpreter.Exception:
 								            self._player_cache.pop(cache_id, None)
 								        global_funcnames = jsi._undefined_varnames
 								        debug_names = []
 								        jsi = JSInterpreter(jscode)
 								        for func_name in global_funcnames:
 								            try:
 								                func_args, func_code = jsi.extract_function_code(func_name)
 								                fixed_code = f'var {func_name} = function({", ".join(func_args)}) {{ {func_code} }}; {fixed_code}'
 								                debug_names.append(func_name)
 								            except Exception:
 								                self.report_warning(join_nonempty(
 								                    f'Unable to extract global nsig function {func_name} from player JS',
 								                    player_url and f'        player = {player_url}', delim='\n'), only_once=True)
 								        if debug_names:
 								            self.write_debug(f'Extracted global nsig functions: {", ".join(debug_names)}')
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								        return argnames, fixed_code
-												[ie/youtube] Fix `n` sig extraction for player `3bb1f723` (#11750)

Closes #11744
Authored by: bashonly
											
										
										
											2024-12-06 15:35:18 +00:00
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								    def _extract_n_function_code(self, video_id, player_url):
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
+								        player_id = self._extract_player_info(player_url)
-												[ie/youtube] Cache signature timestamps (#13047)

Closes #12825
Authored by: bashonly
											
										
										
											2025-04-29 20:15:17 -05:00
+								        func_code = self._load_player_data_from_cache('nsig', player_url)
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								        jscode = func_code or self._load_player(video_id, player_url)
 								        jsi = JSInterpreter(jscode)
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
 								        if func_code:
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								            return jsi, player_id, func_code
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
-												[cleanup] Misc (#10623)

Authored by: bashonly
											
										
										
											2024-08-01 10:03:49 -05:00
+								        func_name = self._extract_n_function_name(jscode, player_url=player_url)
-												[extractor/youtube] Fallback regex for nsig code extraction

											
										
										
											2022-09-01 13:38:25 +05:30
-												[ie/youtube] Extract global nsig helper functions (#13639)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>

											
										
										
											2025-07-05 17:03:25 -05:00
+								        # XXX: Work around (a) global array variable, (b) `typeof` short-circuit, (c) global functions
-												[ie/youtube] Make signature and nsig extraction more robust (#12761)

Authored by: bashonly, seproDev

Co-authored-by: sepro <sepro@sepr0.com>
											
										
										
											2025-03-27 17:31:01 -05:00
+								        func_code = self._fixup_n_function_code(*jsi.extract_function_code(func_name), jscode, player_url)
-												[extractor/youtube] Fallback regex for nsig code extraction

											
										
										
											2022-09-01 13:38:25 +05:30
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								        return jsi, player_id, func_code
 								    def _extract_n_function_from_code(self, jsi, func_code):
-												[jsinterp] Handle new youtube signature functions

Closes #4635

											
										
										
											2022-08-14 04:51:54 +05:30
+								        func = jsi.extract_function_from_code(*func_code)
-												[jsinterp] Fix for youtube player 1f7d5369

Closes #4635 again

											
										
										
											2022-08-18 16:38:35 +05:30
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								        def extract_nsig(s):
-												[extractor/youtube] Add fallback to phantomjs

Related #4635

											
										
										
											2022-08-18 21:35:18 +05:30
+								            try:
 								                ret = func([s])
 								            except JSInterpreter.Exception:
 								                raise
 								            except Exception as e:
 								                raise JSInterpreter.Exception(traceback.format_exc(), cause=e)
-												[ie/youtube] Raise if `n` function returns input value (#11752)

Improve a95ee6d8803fca9157adecf63732ab58bf87fd88

Authored by: bashonly
											
										
										
											2024-12-06 15:58:44 +00:00
+								            if ret.startswith('enhanced_except_') or ret.endswith(s):
-												[extractor/youtube] Add fallback to phantomjs

Related #4635

											
										
										
											2022-08-18 21:35:18 +05:30
+								                raise JSInterpreter.Exception('Signature function returned an exception')
-												[jsinterp] Fix for youtube player 1f7d5369

Closes #4635 again

											
										
										
											2022-08-18 16:38:35 +05:30
+								            return ret
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
 								        return extract_nsig
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 14:19:30 +02:00
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-30 10:07:49 +12:00
+								    def _extract_signature_timestamp(self, video_id, player_url, ytcfg=None, fatal=False):
 								        """
 								        Extract signatureTimestamp (sts)
 								        Required to tell API what sig/player version is in use.
 								        """
-												[ie/youtube] Force player `0004de42` (#14398)

Closes #14400
Authored by: seproDev
											
										
										
											2025-09-23 07:07:28 +02:00
+								        player_sts_override = self._get_player_js_version()[0]
 								        if player_sts_override:
 								            return int(player_sts_override)
-												[ie/youtube] Cache signature timestamps (#13047)

Closes #12825
Authored by: bashonly
											
										
										
											2025-04-29 20:15:17 -05:00
+								        if sts := traverse_obj(ytcfg, ('STS', {int_or_none})):
 								            return sts
 								        if not player_url:
 								            error_msg = 'Cannot extract signature timestamp without player url'
 								            if fatal:
 								                raise ExtractorError(error_msg)
 								            self.report_warning(error_msg)
 								            return None
 								        sts = self._load_player_data_from_cache('sts', player_url)
 								        if sts:
 								            return sts
 								        if code := self._load_player(video_id, player_url, fatal=fatal):
 								            sts = int_or_none(self._search_regex(
 								                r'(?:signatureTimestamp|sts)\s*:\s*(?P<sts>[0-9]{5})', code,
 								                'JS player signature timestamp', group='sts', fatal=fatal))
 								            if sts:
 								                self._store_player_data_to_cache('sts', player_url, sts)
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-30 10:07:49 +12:00
+								        return sts
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								    def _mark_watched(self, video_id, player_responses):
-												[ie/youtube] Fix `--mark-watched` support (#13222)

Closes #11532
Authored by: iednod55, brian6932

Co-authored-by: iednod55 <210167282+iednod55@users.noreply.github.com>
											
										
										
											2025-05-26 18:31:22 -04:00
+								        # cpn generation algorithm is reverse engineered from base.js.
 								        # In fact it works even with dummy cpn.
 								        CPN_ALPHABET = 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_'
 								        cpn = ''.join(CPN_ALPHABET[random.randint(0, 256) & 63] for _ in range(16))
-												[extractor/youtube] Mark videos as fully watched (#4146)

* Also fixes videos appearing as shorts in watch history

Closes #2555
Authored by: Brett824
											
										
										
											2022-06-23 19:30:17 -04:00
+								        for is_full, key in enumerate(('videostatsPlaybackUrl', 'videostatsWatchtimeUrl')):
 								            label = 'fully ' if is_full else ''
 								            url = get_first(player_responses, ('playbackTracking', key, 'baseUrl'),
 								                            expected_type=url_or_none)
 								            if not url:
 								                self.report_warning(f'Unable to mark {label}watched')
 								                return
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 16:24:43 +05:30
+								            parsed_url = urllib.parse.urlparse(url)
 								            qs = urllib.parse.parse_qs(parsed_url.query)
-												[extractor/youtube] Mark videos as fully watched (#4146)

* Also fixes videos appearing as shorts in watch history

Closes #2555
Authored by: Brett824
											
										
										
											2022-06-23 19:30:17 -04:00
 								            # # more consistent results setting it to right before the end
 								            video_length = [str(float((qs.get('len') or ['1.5'])[0]) - 1)]
 								            qs.update({
 								                'ver': ['2'],
 								                'cpn': [cpn],
 								                'cmt': video_length,
 								                'el': 'detailpage',  # otherwise defaults to "shorts"
 								            })
 								            if is_full:
 								                # these seem to mark watchtime "history" in the real world
 								                # they're required, so send in a single value
 								                qs.update({
-												[extractor/youtube] Mark videos as fully watched

Closes #2555
Authored by: bsun0000

											
										
										
											2022-10-19 00:05:54 +05:30
+								                    'st': 0,
-												[extractor/youtube] Mark videos as fully watched (#4146)

* Also fixes videos appearing as shorts in watch history

Closes #2555
Authored by: Brett824
											
										
										
											2022-06-23 19:30:17 -04:00
+								                    'et': video_length,
 								                })
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 16:24:43 +05:30
+								            url = urllib.parse.urlunparse(
 								                parsed_url._replace(query=urllib.parse.urlencode(qs, True)))
-												[extractor/youtube] Mark videos as fully watched (#4146)

* Also fixes videos appearing as shorts in watch history

Closes #2555
Authored by: Brett824
											
										
										
											2022-06-23 19:30:17 -04:00
 								            self._download_webpage(
 								                url, video_id, f'Marking {label}watched',
-												[ie/youtube] Remove broken OAuth support (#11558)

Closes #11462
Authored by: bashonly
											
										
										
											2024-11-16 23:40:21 +00:00
+								                'Unable to mark watched', fatal=False)
-												Add --mark-watched feature (Closes #5054)

											
										
										
											2016-03-01 01:01:33 +06:00
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 06:53:25 +05:30
+								    @classmethod
 								    def _extract_from_webpage(cls, url, webpage):
 								        # Invidious Instances
 								        # https://github.com/yt-dlp/yt-dlp/issues/195
 								        # https://github.com/iv-org/invidious/pull/1730
 								        mobj = re.search(
 								            r'<link rel="alternate" href="(?P<url>https://www\.youtube\.com/watch\?v=[0-9A-Za-z_-]{11})"',
 								            webpage)
 								        if mobj:
 								            yield cls.url_result(mobj.group('url'), cls)
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            raise cls.StopExtraction
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 06:53:25 +05:30
 								        yield from super()._extract_from_webpage(url, webpage)
-												[youtube] Separate methods for embeds extraction

											
										
										
											2017-09-06 00:48:37 +07:00
 								        # lazyYT YouTube embed
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 06:53:25 +05:30
+								        for id_ in re.findall(r'class="lazyYT" data-youtube-id="([^"]+)"', webpage):
 								            yield cls.url_result(unescapeHTML(id_), cls, id_)
-												[youtube] Separate methods for embeds extraction

											
										
										
											2017-09-06 00:48:37 +07:00
 								        # Wordpress "YouTube Video Importer" plugin
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-08-01 06:53:25 +05:30
+								        for m in re.findall(r'''(?x)<div[^>]+
 								                class=(?P<q1>[\'"])[^\'"]*\byvii_single_video_player\b[^\'"]*(?P=q1)[^>]+
 								                data-video_id=(?P<q2>[\'"])([^\'"]+)(?P=q2)''', webpage):
 								            yield cls.url_result(m[-1], cls, m[-1])
-												[youtube] Separate methods for embeds extraction

											
										
										
											2017-09-06 00:48:37 +07:00
-												[jadorecettepub] Add extractor (Fixes #2148)

											
										
										
											2014-02-08 19:20:11 +01:00
+								    @classmethod
 								    def extract_id(cls, url):
-												[cleanup] Misc cleanup

											
										
										
											2022-06-28 10:40:54 +05:30
+								        video_id = cls.get_temp_id(url)
 								        if not video_id:
 								            raise ExtractorError(f'Invalid URL: {url}')
 								        return video_id
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 19:58:33 +02:00
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								    def _extract_chapters_from_json(self, data, duration):
 								        chapter_list = traverse_obj(
 								            data, (
 								                'playerOverlays', 'playerOverlayRenderer', 'decoratedPlayerBarRenderer',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                'decoratedPlayerBarRenderer', 'playerBar', 'chapteredPlayerBarRenderer', 'chapters',
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								            ), expected_type=list)
-												[extractor/rutube] Extract chapters from description (#6345)

Authored by: mushbite
											
										
										
											2023-03-04 15:33:17 +02:00
+								        return self._extract_chapters_helper(
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								            chapter_list,
-												[extractor/rutube] Extract chapters from description (#6345)

Authored by: mushbite
											
										
										
											2023-03-04 15:33:17 +02:00
+								            start_function=lambda chapter: float_or_none(
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								                traverse_obj(chapter, ('chapterRenderer', 'timeRangeStartMillis')), scale=1000),
-												[extractor/rutube] Extract chapters from description (#6345)

Authored by: mushbite
											
										
										
											2023-03-04 15:33:17 +02:00
+								            title_function=lambda chapter: traverse_obj(
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								                chapter, ('chapterRenderer', 'title', 'simpleText'), expected_type=str),
 								            duration=duration)
 								    def _extract_chapters_from_engagement_panel(self, data, duration):
 								        content_list = traverse_obj(
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-20 00:52:59 +05:30
+								            data,
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								            ('engagementPanels', ..., 'engagementPanelSectionListRenderer', 'content', 'macroMarkersListRenderer', 'contents'),
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								            expected_type=list)
-												[youtube] Simplify `_get_text` early

											
										
										
											2021-07-24 06:16:46 +05:30
+								        chapter_time = lambda chapter: parse_duration(self._get_text(chapter, 'timeDescription'))
 								        chapter_title = lambda chapter: self._get_text(chapter, 'title')
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 21:29:03 +05:30
+								        return next(filter(None, (
-												[extractor/rutube] Extract chapters from description (#6345)

Authored by: mushbite
											
										
										
											2023-03-04 15:33:17 +02:00
+								            self._extract_chapters_helper(traverse_obj(contents, (..., 'macroMarkersListItemRenderer')),
 								                                          chapter_time, chapter_title, duration)
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 21:29:03 +05:30
+								            for contents in content_list)), [])
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
-												[ie/youtube] Fix `heatmap` extraction (#8299)

Closes #8189
Authored by: bashonly
											
										
										
											2023-10-06 20:00:15 -05:00
+								    def _extract_heatmap(self, data):
 								        return traverse_obj(data, (
 								            'frameworkUpdates', 'entityBatchUpdate', 'mutations',
 								            lambda _, v: v['payload']['macroMarkersListEntity']['markersList']['markerType'] == 'MARKER_TYPE_HEATMAP',
 								            'payload', 'macroMarkersListEntity', 'markersList', 'markers', ..., {
-												[cleanup] Misc (#11347)

Closes #11361
Authored by: avagordon01, bashonly, grqz, Grub4K, seproDev

Co-authored-by: Ava Gordon <avagordon01@gmail.com>
Co-authored-by: bashonly <bashonly@protonmail.com>
Co-authored-by: N/Ame <173015200+grqz@users.noreply.github.com>
Co-authored-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-11-04 01:33:21 +01:00
+								                'start_time': ('startMillis', {float_or_none(scale=1000)}),
-												[ie/youtube] Fix `heatmap` extraction (#8299)

Closes #8189
Authored by: bashonly
											
										
										
											2023-10-06 20:00:15 -05:00
+								                'end_time': {lambda x: (int(x['startMillis']) + int(x['durationMillis'])) / 1000},
 								                'value': ('intensityScoreNormalized', {float_or_none}),
 								            })) or None
-												[extractor/youtube] Extract `heatmap` data (#7100)

Closes #3888
Authored by: tntmod54321
											
										
										
											2023-05-26 08:24:39 -04:00
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 07:37:30 -07:00
+								    def _extract_comment(self, entities, parent=None):
 								        comment_entity_payload = get_first(entities, ('payload', 'commentEntityPayload', {dict}))
 								        if not (comment_id := traverse_obj(comment_entity_payload, ('properties', 'commentId', {str}))):
 								            return
 								        toolbar_entity_payload = get_first(entities, ('payload', 'engagementToolbarStateEntityPayload', {dict}))
 								        time_text = traverse_obj(comment_entity_payload, ('properties', 'publishedTime', {str})) or ''
 								        return {
 								            'id': comment_id,
 								            'parent': parent or 'root',
 								            **traverse_obj(comment_entity_payload, {
 								                'text': ('properties', 'content', 'content', {str}),
 								                'like_count': ('toolbar', 'likeCountA11y', {parse_count}),
 								                'author_id': ('author', 'channelId', {self.ucid_or_none}),
 								                'author': ('author', 'displayName', {str}),
 								                'author_thumbnail': ('author', 'avatarThumbnailUrl', {url_or_none}),
 								                'author_is_uploader': ('author', 'isCreator', {bool}),
 								                'author_is_verified': ('author', 'isVerified', {bool}),
 								                'author_url': ('author', 'channelCommand', 'innertubeCommand', (
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                    ('browseEndpoint', 'canonicalBaseUrl'), ('commandMetadata', 'webCommandMetadata', 'url'),
-												[cleanup] Misc (#11347)

Closes #11361
Authored by: avagordon01, bashonly, grqz, Grub4K, seproDev

Co-authored-by: Ava Gordon <avagordon01@gmail.com>
Co-authored-by: bashonly <bashonly@protonmail.com>
Co-authored-by: N/Ame <173015200+grqz@users.noreply.github.com>
Co-authored-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-11-04 01:33:21 +01:00
+								                ), {urljoin('https://www.youtube.com')}),
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 07:37:30 -07:00
+								            }, get_all=False),
 								            'is_favorited': (None if toolbar_entity_payload is None else
 								                             toolbar_entity_payload.get('heartState') == 'TOOLBAR_HEART_STATE_HEARTED'),
 								            '_time_text': time_text,  # FIXME: non-standard, but we need a way of showing that it is an estimate.
 								            'timestamp': self._parse_time_text(time_text),
 								        }
 								    def _extract_comment_old(self, comment_renderer, parent=None):
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								        comment_id = comment_renderer.get('commentId')
 								        if not comment_id:
 								            return
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-19 16:55:07 +12:00
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 20:43:32 +12:00
+								        info = {
 								            'id': comment_id,
 								            'text': self._get_text(comment_renderer, 'contentText'),
 								            'like_count': self._get_count(comment_renderer, 'voteCount'),
 								            'author_id': traverse_obj(comment_renderer, ('authorEndpoint', 'browseEndpoint', 'browseId', {self.ucid_or_none})),
 								            'author': self._get_text(comment_renderer, 'authorText'),
 								            'author_thumbnail': traverse_obj(comment_renderer, ('authorThumbnail', 'thumbnails', -1, 'url', {url_or_none})),
 								            'parent': parent or 'root',
 								        }
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-19 16:55:07 +12:00
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 05:16:46 +00:00
+								        # Timestamp is an estimate calculated from the current time and time_text
 								        time_text = self._get_text(comment_renderer, 'publishedTimeText') or ''
 								        timestamp = self._parse_time_text(time_text)
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 20:43:32 +12:00
+								        info.update({
 								            # FIXME: non-standard, but we need a way of showing that it is an estimate.
 								            '_time_text': time_text,
 								            'timestamp': timestamp,
 								        })
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-19 16:55:07 +12:00
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 20:43:32 +12:00
+								        info['author_url'] = urljoin(
 								            'https://www.youtube.com', traverse_obj(comment_renderer, ('authorEndpoint', (
 								                ('browseEndpoint', 'canonicalBaseUrl'), ('commandMetadata', 'webCommandMetadata', 'url'))),
 								                expected_type=str, get_all=False))
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 20:43:32 +12:00
+								        author_is_uploader = traverse_obj(comment_renderer, 'authorIsChannelOwner')
 								        if author_is_uploader is not None:
 								            info['author_is_uploader'] = author_is_uploader
 								        comment_abr = traverse_obj(
-												[extractor/youtube] Fix comments' `is_favorited` (#7390)

Authored by: bbilly1
Closes #7389
											
										
										
											2023-06-23 01:08:42 +07:00
+								            comment_renderer, ('actionButtons', 'commentActionButtonsRenderer'), expected_type=dict)
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 20:43:32 +12:00
+								        if comment_abr is not None:
 								            info['is_favorited'] = 'creatorHeart' in comment_abr
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 18:58:49 +05:30
+								        badges = self._extract_badges([traverse_obj(comment_renderer, 'authorCommentBadge')])
 								        if self._has_badge(badges, BadgeType.VERIFIED):
 								            info['author_is_verified'] = True
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 20:43:32 +12:00
 								        is_pinned = traverse_obj(comment_renderer, 'pinnedCommentBadge')
 								        if is_pinned:
 								            info['is_pinned'] = True
 								        return info
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								    def _comment_entries(self, root_continuation_data, ytcfg, video_id, parent=None, tracker=None):
 								        get_single_config_arg = lambda c: self._configuration_arg(c, [''])[0]
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
 								        def extract_header(contents):
 								            _continuation = None
 								            for content in contents:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                comments_header_renderer = traverse_obj(content, 'commentsHeaderRenderer')
-												[youtube:tab] Extract more playlist metadata (#2069)

* Add fields modified_date, modified_timestamp
* Add field playlist_count
* [youtube:tab] Extract view_count, playlist_count, modified_date

Authored by: coletdjnz, pukkandan
											
										
										
											2022-01-07 11:03:02 +00:00
+								                expected_comment_count = self._get_count(
 								                    comments_header_renderer, 'countText', 'commentsCount')
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-19 16:55:07 +12:00
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 19:08:28 +12:00
+								                if expected_comment_count is not None:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                    tracker['est_total'] = expected_comment_count
 								                    self.to_screen(f'Downloading ~{expected_comment_count} comments')
 								                comment_sort_index = int(get_single_config_arg('comment_sort') != 'top')  # 1 = new, 0 = top
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
 								                sort_menu_item = try_get(
 								                    comments_header_renderer,
 								                    lambda x: x['sortMenu']['sortFilterSubMenuRenderer']['subMenuItems'][comment_sort_index], dict) or {}
 								                sort_continuation_ep = sort_menu_item.get('serviceEndpoint') or {}
 								                _continuation = self._extract_continuation_ep_data(sort_continuation_ep) or self._extract_continuation(sort_menu_item)
 								                if not _continuation:
 								                    continue
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                sort_text = str_or_none(sort_menu_item.get('title'))
 								                if not sort_text:
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								                    sort_text = 'top comments' if comment_sort_index == 0 else 'newest first'
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                self.to_screen(f'Sorting comments by {sort_text.lower()}')
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								                break
-												[extractor] Generalize `getcomments` implementation

											
										
										
											2021-10-12 15:20:50 +05:30
+								            return _continuation
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 07:37:30 -07:00
+								        def extract_thread(contents, entity_payloads):
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								            if not parent:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                tracker['current_page_thread'] = 0
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								            for content in contents:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                if not parent and tracker['total_parent_comments'] >= max_parents:
 								                    yield
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								                comment_thread_renderer = try_get(content, lambda x: x['commentThreadRenderer'])
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 07:37:30 -07:00
+								                # old comment format
 								                if not entity_payloads:
 								                    comment_renderer = get_first(
 								                        (comment_thread_renderer, content), [['commentRenderer', ('comment', 'commentRenderer')]],
 								                        expected_type=dict, default={})
 								                    comment = self._extract_comment_old(comment_renderer, parent)
 								                # new comment format
 								                else:
 								                    view_model = (
 								                        traverse_obj(comment_thread_renderer, ('commentViewModel', 'commentViewModel', {dict}))
 								                        or traverse_obj(content, ('commentViewModel', {dict})))
 								                    comment_keys = traverse_obj(view_model, (('commentKey', 'toolbarStateKey'), {str}))
 								                    if not comment_keys:
 								                        continue
 								                    entities = traverse_obj(entity_payloads, lambda _, v: v['entityKey'] in comment_keys)
 								                    comment = self._extract_comment(entities, parent)
 								                    if comment:
 								                        comment['is_pinned'] = traverse_obj(view_model, ('pinnedText', {str})) is not None
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								                if not comment:
 								                    continue
-												[extractor/youtube] Fix comment loop detection for pinned comments (#6714)

Pinned comments may repeat a second time - this is expected.

Fixes https://github.com/yt-dlp/yt-dlp/issues/6712

Authored by: coletdjnz
											
										
										
											2023-04-06 19:44:22 +12:00
+								                comment_id = comment['id']
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 07:37:30 -07:00
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 20:43:32 +12:00
+								                if comment.get('is_pinned'):
-												[extractor/youtube] Fix comment loop detection for pinned comments (#6714)

Pinned comments may repeat a second time - this is expected.

Fixes https://github.com/yt-dlp/yt-dlp/issues/6712

Authored by: coletdjnz
											
										
										
											2023-04-06 19:44:22 +12:00
+								                    tracker['pinned_comment_ids'].add(comment_id)
-												[extractor/youtube] Detect and break on looping comments (#6301)

Fixes https://github.com/yt-dlp/yt-dlp/issues/6290

Authored by: coletdjnz
											
										
										
											2023-03-01 07:56:53 +00:00
+								                # Sometimes YouTube may break and give us infinite looping comments.
 								                # See: https://github.com/yt-dlp/yt-dlp/issues/6290
-												[extractor/youtube] Fix comment loop detection for pinned comments (#6714)

Pinned comments may repeat a second time - this is expected.

Fixes https://github.com/yt-dlp/yt-dlp/issues/6712

Authored by: coletdjnz
											
										
										
											2023-04-06 19:44:22 +12:00
+								                if comment_id in tracker['seen_comment_ids']:
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 20:43:32 +12:00
+								                    if comment_id in tracker['pinned_comment_ids'] and not comment.get('is_pinned'):
-												[extractor/youtube] Fix comment loop detection for pinned comments (#6714)

Pinned comments may repeat a second time - this is expected.

Fixes https://github.com/yt-dlp/yt-dlp/issues/6712

Authored by: coletdjnz
											
										
										
											2023-04-06 19:44:22 +12:00
+								                        # Pinned comments may appear a second time in newest first sort
 								                        # See: https://github.com/yt-dlp/yt-dlp/issues/6712
 								                        continue
-												[extractor/youtube] Ignore incomplete data for comment threads by default (#7475)

For both `--ignore-errors` and `--ignore-errors only_download`. Pass `--no-ignore-errors` to not ignore.

Closes https://github.com/yt-dlp/yt-dlp/issues/7474

Authored by: coletdjnz
											
										
										
											2023-07-03 10:47:10 +00:00
+								                    self.report_warning(
 								                        'Detected YouTube comments looping. Stopping comment extraction '
 								                        f'{"for this thread" if parent else ""} as we probably cannot get any more.')
-												[extractor/youtube] Detect and break on looping comments (#6301)

Fixes https://github.com/yt-dlp/yt-dlp/issues/6290

Authored by: coletdjnz
											
										
										
											2023-03-01 07:56:53 +00:00
+								                    yield
 								                else:
 								                    tracker['seen_comment_ids'].add(comment['id'])
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
 								                tracker['running_total'] += 1
 								                tracker['total_reply_comments' if parent else 'total_parent_comments'] += 1
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								                yield comment
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								                # Attempt to get the replies
 								                comment_replies_renderer = try_get(
 								                    comment_thread_renderer, lambda x: x['replies']['commentRepliesRenderer'], dict)
 								                if comment_replies_renderer:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                    tracker['current_page_thread'] += 1
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								                    comment_entries_iter = self._comment_entries(
-												[youtube] Cleanup authentication code (#786)

Authored by: coletdjnz
											
										
										
											2021-09-24 00:52:17 +00:00
+								                        comment_replies_renderer, ytcfg, video_id,
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                        parent=comment.get('id'), tracker=tracker)
-												[cleanup] Upgrade syntax

Using https://github.com/asottile/pyupgrade

1. `__future__` imports and `coding: utf-8` were removed
2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format`
3. f-strings were cherry-picked from `pyupgrade --py36-plus`

Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts

											
										
										
											2022-04-11 20:40:28 +05:30
+								                    yield from itertools.islice(comment_entries_iter, min(
 								                        max_replies_per_thread, max(0, max_replies - tracker['total_reply_comments'])))
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								        # Keeps track of counts across recursive calls
 								        if not tracker:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            tracker = {
 								                'running_total': 0,
 								                'est_total': None,
 								                'current_page_thread': 0,
 								                'total_parent_comments': 0,
 								                'total_reply_comments': 0,
 								                'seen_comment_ids': set(),
 								                'pinned_comment_ids': set(),
 								            }
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
 								        # TODO: Deprecated
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								        # YouTube comments have a max depth of 2
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								        max_depth = int_or_none(get_single_config_arg('max_comment_depth'))
 								        if max_depth:
-												[utils] Add `deprecation_warning`

See https://github.com/yt-dlp/yt-dlp/pull/2173#issuecomment-1097021515

											
										
										
											2022-08-30 20:58:28 +05:30
+								            self._downloader.deprecated_feature('[youtube] max_comment_depth extractor argument is deprecated. '
 								                                                'Set max replies in the max-comments extractor argument instead')
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								        if max_depth == 1 and parent:
 								            return
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
-												[cleanup] Bump ruff to 0.13.x (#14293)

Authored by: bashonly
											
										
										
											2025-09-11 10:18:01 -05:00
+								        _max_comments, max_parents, max_replies, max_replies_per_thread, *_ = (
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            int_or_none(p, default=sys.maxsize) for p in self._configuration_arg('max_comments') + [''] * 4)
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								        continuation = self._extract_continuation(root_continuation_data)
-												[youtube:comments] Fix comment section not being extracted in new layouts (#1324)

Co-authored-by: coletdjnz, pukkandan
											
										
										
											2021-10-18 15:58:42 +13:00
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								        response = None
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 18:46:28 +12:00
+								        is_forced_continuation = False
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								        is_first_continuation = parent is None
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 18:46:28 +12:00
+								        if is_first_continuation and not continuation:
 								            # Sometimes you can get comments by generating the continuation yourself,
 								            # even if YouTube initially reports them being disabled - e.g. stories comments.
 								            # Note: if the comment section is actually disabled, YouTube may return a response with
 								            # required check_get_keys missing. So we will disable that check initially in this case.
 								            continuation = self._build_api_continuation_query(self._generate_comment_continuation(video_id))
 								            is_forced_continuation = True
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 19:08:28 +12:00
+								        continuation_items_path = (
 								            'onResponseReceivedEndpoints', ..., ('reloadContinuationItemsCommand', 'appendContinuationItemsAction'), 'continuationItems')
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								        for page_num in itertools.count(0):
 								            if not continuation:
 								                break
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								            headers = self.generate_api_headers(ytcfg=ytcfg, visitor_data=self._extract_visitor_data(response))
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 19:08:28 +12:00
+								            comment_prog_str = f"({tracker['running_total']}/~{tracker['est_total']})"
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								            if page_num == 0:
 								                if is_first_continuation:
 								                    note_prefix = 'Downloading comment section API JSON'
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								                else:
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								                    note_prefix = '    Downloading comment API JSON reply thread %d %s' % (
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                        tracker['current_page_thread'], comment_prog_str)
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								            else:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                note_prefix = '{}Downloading comment{} API JSON page {} {}'.format(
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								                    '       ' if parent else '', ' replies' if parent else '',
 								                    page_num, comment_prog_str)
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 19:08:28 +12:00
 								            # Do a deep check for incomplete data as sometimes YouTube may return no comments for a continuation
 								            # Ignore check if YouTube says the comment count is 0.
 								            check_get_keys = None
 								            if not is_forced_continuation and not (tracker['est_total'] == 0 and tracker['running_total'] == 0):
 								                check_get_keys = [[*continuation_items_path, ..., (
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 07:37:30 -07:00
+								                    'commentsHeaderRenderer' if is_first_continuation else ('commentThreadRenderer', 'commentViewModel', 'commentRenderer'))]]
-												[extractor/youtube] Ignore incomplete data error for comment replies (#5490)

When --ignore-errors is used.
Closes https://github.com/yt-dlp/yt-dlp/issues/4669
Authored by: coletdjnz
											
										
										
											2022-11-10 19:35:22 +13:00
+								            try:
 								                response = self._extract_response(
 								                    item_id=None, query=continuation,
 								                    ep='next', ytcfg=ytcfg, headers=headers, note=note_prefix,
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 19:08:28 +12:00
+								                    check_get_keys=check_get_keys)
-												[extractor/youtube] Ignore incomplete data error for comment replies (#5490)

When --ignore-errors is used.
Closes https://github.com/yt-dlp/yt-dlp/issues/4669
Authored by: coletdjnz
											
										
										
											2022-11-10 19:35:22 +13:00
+								            except ExtractorError as e:
 								                # Ignore incomplete data error for replies if retries didn't work.
 								                # This is to allow any other parent comments and comment threads to be downloaded.
 								                # See: https://github.com/yt-dlp/yt-dlp/issues/4669
-												[extractor/youtube] Ignore incomplete data for comment threads by default (#7475)

For both `--ignore-errors` and `--ignore-errors only_download`. Pass `--no-ignore-errors` to not ignore.

Closes https://github.com/yt-dlp/yt-dlp/issues/7474

Authored by: coletdjnz
											
										
										
											2023-07-03 10:47:10 +00:00
+								                if 'incomplete data' in str(e).lower() and parent:
 								                    if self.get_param('ignoreerrors') in (True, 'only_download'):
 								                        self.report_warning(
 								                            'Received incomplete data for a comment reply thread and retrying did not help. '
 								                            'Ignoring to let other comments be downloaded. Pass --no-ignore-errors to not ignore.')
 								                        return
 								                    else:
 								                        raise ExtractorError(
 								                            'Incomplete data received for comment reply thread. '
 								                            'Pass --ignore-errors to ignore and allow rest of comments to download.',
 								                            expected=True)
 								                raise
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 18:46:28 +12:00
+								            is_forced_continuation = False
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								            continuation = None
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 07:37:30 -07:00
+								            mutations = traverse_obj(response, ('frameworkUpdates', 'entityBatchUpdate', 'mutations', ..., {dict}))
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 19:08:28 +12:00
+								            for continuation_items in traverse_obj(response, continuation_items_path, expected_type=list, default=[]):
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                if is_first_continuation:
 								                    continuation = extract_header(continuation_items)
 								                    is_first_continuation = False
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								                    if continuation:
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								                        break
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                    continue
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 07:37:30 -07:00
+								                for entry in extract_thread(continuation_items, mutations):
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-15 04:29:48 +00:00
+								                    if not entry:
 								                        return
 								                    yield entry
 								                continuation = self._extract_continuation({'contents': continuation_items})
 								                if continuation:
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								                    break
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 18:46:28 +12:00
+								        message = self._get_text(root_continuation_data, ('contents', ..., 'messageRenderer', 'text'), max_runs=1)
 								        if message and not parent and tracker['running_total'] == 0:
 								            self.report_warning(f'Youtube said: {message}', video_id=video_id, only_once=True)
-												[extractor/youtube] Differentiate between no and disabled comments (#5491)

`comments` and `comment_count` will be set to None, as opposed to 
an empty list and 0, respectively.

Fixes https://github.com/yt-dlp/yt-dlp/issues/5068

Authored by: coletdjnz, pukkandan
											
										
										
											2022-11-10 16:33:03 +13:00
+								            raise self.CommentsDisabled
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 18:46:28 +12:00
 								    @staticmethod
 								    def _generate_comment_continuation(video_id):
 								        """
 								        Generates initial comment section continuation token from given video id
 								        """
 								        token = f'\x12\r\x12\x0b{video_id}\x18\x062\'"\x11"\x0b{video_id}0\x00x\x020\x00B\x10comments-section'
 								        return base64.b64encode(token.encode()).decode()
-												[extractor] Generalize `getcomments` implementation

											
										
										
											2021-10-12 15:20:50 +05:30
+								    def _get_comments(self, ytcfg, video_id, contents, webpage):
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
+								        """Entry for comment extraction"""
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-12 11:18:40 +12:00
+								        def _real_comment_extract(contents):
-												[youtube:comments] Fix comment section not being extracted in new layouts (#1324)

Co-authored-by: coletdjnz, pukkandan
											
										
										
											2021-10-18 15:58:42 +13:00
+								            renderer = next((
 								                item for item in traverse_obj(contents, (..., 'itemSectionRenderer'), default={})
 								                if item.get('sectionIdentifier') == 'comment-item-section'), None)
 								            yield from self._comment_entries(renderer, ytcfg, video_id)
-												[youtube] Cleanup authentication code (#786)

Authored by: coletdjnz
											
										
										
											2021-09-24 00:52:17 +00:00
-												[extractor] Generalize `getcomments` implementation

											
										
										
											2021-10-12 15:20:50 +05:30
+								        max_comments = int_or_none(self._configuration_arg('max_comments', [''])[0])
 								        return itertools.islice(_real_comment_extract(contents), 0, max_comments)
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 22:41:11 +00:00
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-30 10:07:49 +12:00
+								    @staticmethod
-												[youtube] Cleanup authentication code (#786)

Authored by: coletdjnz
											
										
										
											2021-09-24 00:52:17 +00:00
+								    def _get_checkok_params():
 								        return {'contentCheckOk': True, 'racyCheckOk': True}
 								    @classmethod
 								    def _generate_player_context(cls, sts=None):
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-30 10:07:49 +12:00
+								        context = {
 								            'html5Preference': 'HTML5_PREF_WANTS',
 								        }
 								        if sts is not None:
 								            context['signatureTimestamp'] = sts
 								        return {
 								            'playbackContext': {
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                'contentPlaybackContext': context,
-												[youtube] Fix controversial videos when requested via API (#533)

Closes: https://github.com/yt-dlp/yt-dlp/issues/511#issuecomment-883024350
Authored by: colethedj
											
										
										
											2021-07-21 06:01:28 +12:00
+								            },
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            **cls._get_checkok_params(),
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-30 10:07:49 +12:00
+								        }
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								    def _get_config_po_token(self, client: str, context: _PoTokenContext):
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								        po_token_strs = self._configuration_arg('po_token', [], ie_key=YoutubeIE, casesense=True)
 								        for token_str in po_token_strs:
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								            po_token_meta, sep, po_token = token_str.partition('+')
 								            if not sep:
 								                self.report_warning(
 								                    f'Invalid po_token configuration format. '
 								                    f'Expected "CLIENT.CONTEXT+PO_TOKEN", got "{token_str}"', only_once=True)
 								                continue
 								            po_token_client, sep, po_token_context = po_token_meta.partition('.')
 								            if po_token_client.lower() != client:
 								                continue
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            if not sep:
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								                # TODO(future): deprecate the old format?
 								                self.write_debug(
 								                    f'po_token configuration for {client} client is missing a context; assuming GVS. '
 								                    'You can provide a context with the format "CLIENT.CONTEXT+PO_TOKEN"',
 								                    only_once=True)
 								                po_token_context = _PoTokenContext.GVS.value
 								            if po_token_context.lower() != context.value:
 								                continue
 								            # Clean and validate the PO Token. This will strip invalid characters off
 								            # (e.g. additional url params the user may accidentally include)
 								            try:
 								                return base64.urlsafe_b64encode(base64.urlsafe_b64decode(urllib.parse.unquote(po_token))).decode()
 								            except (binascii.Error, ValueError):
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                self.report_warning(
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								                    f'Invalid po_token configuration for {client} client: '
 								                    f'{po_token_context} PO Token should be a base64url-encoded string.',
 								                    only_once=True)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                continue
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								    def fetch_po_token(self, client='web', context: _PoTokenContext = _PoTokenContext.GVS, ytcfg=None, visitor_data=None,
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                       data_sync_id=None, session_index=None, player_url=None, video_id=None, webpage=None,
 								                       required=False, **kwargs):
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								        """
 								        Fetch a PO Token for a given client and context. This function will validate required parameters for a given context and client.
 								        EXPERIMENTAL: This method is unstable and may change or be removed without notice.
 								        @param client: The client to fetch the PO Token for.
 								        @param context: The context in which the PO Token is used.
 								        @param ytcfg: The ytcfg for the client.
 								        @param visitor_data: visitor data.
 								        @param data_sync_id: data sync ID.
 								        @param session_index: session index.
 								        @param player_url: player URL.
 								        @param video_id: video ID.
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								        @param webpage: video webpage.
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								        @param required: Whether the PO Token is required (i.e. try to fetch unless policy is "never").
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								        @param kwargs: Additional arguments to pass down. May be more added in the future.
 								        @return: The fetched PO Token. None if it could not be fetched.
 								        """
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								        # TODO(future): This validation should be moved into pot framework.
 								        #  Some sort of middleware or validation provider perhaps?
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								        # GVS WebPO Token is bound to visitor_data / Visitor ID when logged out.
 								        # Must have visitor_data for it to function.
 								        if player_url and context == _PoTokenContext.GVS and not visitor_data and not self.is_authenticated:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            self.report_warning(
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								                f'Unable to fetch GVS PO Token for {client} client: Missing required Visitor Data. '
-												[ie/youtube] Improve PO token logging (#14447)

Authored by: seproDev
											
										
										
											2025-09-26 20:12:16 +02:00
+								                f'You may need to pass Visitor Data with --extractor-args "youtube:visitor_data=XXX"', only_once=True)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            return
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								        if context == _PoTokenContext.PLAYER and not video_id:
 								            self.report_warning(
 								                f'Unable to fetch Player PO Token for {client} client: Missing required Video ID')
 								            return
 								        config_po_token = self._get_config_po_token(client, context)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								        if config_po_token:
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								            # GVS WebPO token is bound to data_sync_id / account Session ID when logged in.
 								            if player_url and context == _PoTokenContext.GVS and not data_sync_id and self.is_authenticated:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                self.report_warning(
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								                    f'Got a GVS PO Token for {client} client, but missing Data Sync ID for account. Formats may not work.'
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                    f'You may need to pass a Data Sync ID with --extractor-args "youtube:data_sync_id=XXX"')
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								            self.write_debug(f'{video_id}: Retrieved a {context.value} PO Token for {client} client from config')
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            return config_po_token
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								        # Require GVS WebPO Token if logged in for external fetching
 								        if player_url and context == _PoTokenContext.GVS and not data_sync_id and self.is_authenticated:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            self.report_warning(
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								                f'Unable to fetch GVS PO Token for {client} client: Missing required Data Sync ID for account. '
-												[ie/youtube] Improve PO token logging (#14447)

Authored by: seproDev
											
										
										
											2025-09-26 20:12:16 +02:00
+								                f'You may need to pass a Data Sync ID with --extractor-args "youtube:data_sync_id=XXX"', only_once=True)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            return
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								        po_token = self._fetch_po_token(
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            client=client,
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								            context=context.value,
 								            ytcfg=ytcfg,
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            visitor_data=visitor_data,
 								            data_sync_id=data_sync_id,
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								            session_index=session_index,
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            player_url=player_url,
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								            video_id=video_id,
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								            video_webpage=webpage,
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								            required=required,
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            **kwargs,
 								        )
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								        if po_token:
 								            self.write_debug(f'{video_id}: Retrieved a {context.value} PO Token for {client} client')
 								            return po_token
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								    def _fetch_po_token(self, client, **kwargs):
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								        context = kwargs.get('context')
 								        # Avoid fetching PO Tokens when not required
 								        fetch_pot_policy = self._configuration_arg('fetch_pot', [''], ie_key=YoutubeIE)[0]
 								        if fetch_pot_policy not in ('never', 'auto', 'always'):
 								            fetch_pot_policy = 'auto'
 								        if (
 								            fetch_pot_policy == 'never'
 								            or (
 								                fetch_pot_policy == 'auto'
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                and not kwargs.get('required', False)
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								            )
 								        ):
 								            return None
 								        headers = self.get_param('http_headers').copy()
 								        proxies = self._downloader.proxies.copy()
 								        clean_headers(headers)
 								        clean_proxies(proxies, headers)
 								        innertube_host = self._select_api_hostname(None, default_client=client)
 								        pot_request = PoTokenRequest(
 								            context=PoTokenContext(context),
 								            innertube_context=traverse_obj(kwargs, ('ytcfg', 'INNERTUBE_CONTEXT')),
 								            innertube_host=innertube_host,
 								            internal_client_name=client,
 								            session_index=kwargs.get('session_index'),
 								            player_url=kwargs.get('player_url'),
 								            video_webpage=kwargs.get('video_webpage'),
 								            is_authenticated=self.is_authenticated,
 								            visitor_data=kwargs.get('visitor_data'),
 								            data_sync_id=kwargs.get('data_sync_id'),
 								            video_id=kwargs.get('video_id'),
 								            request_cookiejar=self._downloader.cookiejar,
 								            # All requests that would need to be proxied should be in the
 								            # context of www.youtube.com or the innertube host
 								            request_proxy=(
 								                select_proxy('https://www.youtube.com', proxies)
 								                or select_proxy(f'https://{innertube_host}', proxies)
 								            ),
 								            request_headers=headers,
 								            request_timeout=self.get_param('socket_timeout'),
 								            request_verify_tls=not self.get_param('nocheckcertificate'),
 								            request_source_address=self.get_param('source_address'),
 								            bypass_cache=False,
 								        )
 								        return self._pot_director.get_po_token(pot_request)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 23:13:46 +02:00
+								    @staticmethod
 								    def _is_agegated(player_response):
 								        if traverse_obj(player_response, ('playabilityStatus', 'desktopLegacyAgeGateReason')):
-												[youtube] Improve age-gate detection (#577)

Authored by: colethedj

											
										
										
											2021-07-29 17:23:56 +12:00
+								            return True
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 23:13:46 +02:00
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								        reasons = traverse_obj(player_response, ('playabilityStatus', ('status', 'reason')))
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 23:13:46 +02:00
+								        AGE_GATE_REASONS = (
 								            'confirm your age', 'age-restricted', 'inappropriate',  # reason
 								            'age_verification_required', 'age_check_required',  # status
 								        )
 								        return any(expected in reason for expected in AGE_GATE_REASONS for reason in reasons)
 								    @staticmethod
 								    def _is_unplayable(player_response):
 								        return traverse_obj(player_response, ('playabilityStatus', 'status')) == 'UNPLAYABLE'
-												[youtube] Improve age-gate detection (#577)

Authored by: colethedj

											
										
										
											2021-07-29 17:23:56 +12:00
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								    def _extract_player_response(self, client, video_id, webpage_ytcfg, player_ytcfg, player_url, initial_pr, visitor_data, data_sync_id, po_token):
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        headers = self.generate_api_headers(
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            ytcfg=player_ytcfg,
 								            default_client=client,
 								            visitor_data=visitor_data,
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            session_index=self._extract_session_index(webpage_ytcfg, player_ytcfg),
-												[ie/youtube] Refactor cookie auth (#11989)

Authored by: coletdjnz
											
										
										
											2025-01-12 15:02:57 +13:00
+								            delegated_session_id=(
 								                self._parse_data_sync_id(data_sync_id)[0]
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                or self._extract_delegated_session_id(webpage_ytcfg, initial_pr, player_ytcfg)
-												[ie/youtube] Refactor cookie auth (#11989)

Authored by: coletdjnz
											
										
										
											2025-01-12 15:02:57 +13:00
+								            ),
 								            user_session_id=(
 								                self._parse_data_sync_id(data_sync_id)[1]
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                or self._extract_user_session_id(webpage_ytcfg, initial_pr, player_ytcfg)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            ),
 								        )
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-16 02:38:47 +12:00
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 18:46:28 +12:00
+								        yt_query = {
 								            'videoId': video_id,
 								        }
-												[ie/youtube] Add `player_params` extractor arg (#7719)

Authored by: coletdjnz
											
										
										
											2023-07-29 18:20:42 +12:00
-												[ie/youtube] Player client maintenance (#10573)

- Add clients: android_producer, android_testsuite, android_vr, tv, web_safari
- Remove obsolete clients: android_embedded, ios_embedded, *_embedscreen

Authored by: bashonly
											
										
										
											2024-07-30 16:27:06 -05:00
+								        default_pp = traverse_obj(
 								            INNERTUBE_CLIENTS, (_split_innertube_client(client)[0], 'PLAYER_PARAMS', {str}))
 								        if player_params := self._configuration_arg('player_params', [default_pp], casesense=True)[0]:
 								            yt_query['params'] = player_params
-												[extractor/youtube] Use device-specific user agent (#4770)

Thwart latest fingerprinting attempt (see https://github.com/iv-org/invidious/issues/3230#issuecomment-1226887639)

Authored by: coletdjnz
											
										
										
											2022-08-28 22:59:54 +00:00
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								        if po_token:
 								            yt_query['serviceIntegrityDimensions'] = {'poToken': po_token}
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								        sts = self._extract_signature_timestamp(video_id, player_url, webpage_ytcfg, fatal=False) if player_url else None
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        yt_query.update(self._generate_player_context(sts))
 								        return self._extract_response(
 								            item_id=video_id, ep='player', query=yt_query,
-												[youtube] Raise appropriate error when API pages can't be downloaded

											
										
										
											2021-08-07 12:15:58 +05:30
+								            ytcfg=player_ytcfg, headers=headers, fatal=True,
-												[youtube] simplify and de-duplicate client definitions (#577)

											
										
										
											2021-07-31 01:15:04 +05:30
+								            default_client=client,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            note='Downloading {} player API JSON'.format(client.replace('_', ' ').strip()),
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        ) or None
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								    def _get_requested_clients(self, url, smuggled_data, is_premium_subscriber):
-												[youtube] Add `player_client=all`

											
										
										
											2021-07-26 03:25:53 +05:30
+								        requested_clients = []
-												[ie/youtube] Support excluding `player_client`s in extractor-arg (#10710)

Closes #10699
Authored by: bashonly
											
										
										
											2024-08-12 04:12:46 -05:00
+								        excluded_clients = []
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								        default_clients = (
 								            self._DEFAULT_PREMIUM_CLIENTS if is_premium_subscriber
 								            else self._DEFAULT_AUTHED_CLIENTS if self.is_authenticated
 								            else self._DEFAULT_CLIENTS
 								        )
-												[youtube] simplify and de-duplicate client definitions (#577)

											
										
										
											2021-07-31 01:15:04 +05:30
+								        allowed_clients = sorted(
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            (client for client in INNERTUBE_CLIENTS if client[:1] != '_'),
-												[youtube] simplify and de-duplicate client definitions (#577)

											
										
										
											2021-07-31 01:15:04 +05:30
+								            key=lambda client: INNERTUBE_CLIENTS[client]['priority'], reverse=True)
-												[youtube] Add `player_client=all`

											
										
										
											2021-07-26 03:25:53 +05:30
+								        for client in self._configuration_arg('player_client'):
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-18 04:03:02 +12:00
+								            if client == 'default':
-												[ie/youtube] Adjust player clients for site changes (#11663)

Closes #11640
Authored by: bashonly
											
										
										
											2024-12-01 15:25:09 +00:00
+								                requested_clients.extend(default_clients)
-												[youtube] Add `player_client=all`

											
										
										
											2021-07-26 03:25:53 +05:30
+								            elif client == 'all':
 								                requested_clients.extend(allowed_clients)
-												[ie/youtube] Support excluding `player_client`s in extractor-arg (#10710)

Closes #10699
Authored by: bashonly
											
										
										
											2024-08-12 04:12:46 -05:00
+								            elif client.startswith('-'):
 								                excluded_clients.append(client[1:])
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-18 04:03:02 +12:00
+								            elif client not in allowed_clients:
-												[ie/youtube] Support excluding `player_client`s in extractor-arg (#10710)

Closes #10699
Authored by: bashonly
											
										
										
											2024-08-12 04:12:46 -05:00
+								                self.report_warning(f'Skipping unsupported client "{client}"')
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-18 04:03:02 +12:00
+								            else:
 								                requested_clients.append(client)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        if not requested_clients:
-												[ie/youtube] Adjust player clients for site changes (#11663)

Closes #11640
Authored by: bashonly
											
										
										
											2024-12-01 15:25:09 +00:00
+								            requested_clients.extend(default_clients)
-												[ie/youtube] Support excluding `player_client`s in extractor-arg (#10710)

Closes #10699
Authored by: bashonly
											
										
										
											2024-08-12 04:12:46 -05:00
+								        for excluded_client in excluded_clients:
 								            if excluded_client in requested_clients:
 								                requested_clients.remove(excluded_client)
 								        if not requested_clients:
 								            raise ExtractorError('No player clients have been requested', expected=True)
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 21:30:34 +06:00
-												[ie/youtube] Adjust player clients for site changes (#11663)

Closes #11640
Authored by: bashonly
											
										
										
											2024-12-01 15:25:09 +00:00
+								        if self.is_authenticated:
-												[ie/youtube] Restore convenience workarounds (#12181)

Authored by: bashonly
											
										
										
											2025-01-25 10:18:15 -06:00
+								            if (smuggled_data.get('is_music_url') or self.is_music_url(url)) and 'web_music' not in requested_clients:
 								                requested_clients.append('web_music')
-												[ie/youtube] Adjust player clients for site changes (#11663)

Closes #11640
Authored by: bashonly
											
										
										
											2024-12-01 15:25:09 +00:00
+								            unsupported_clients = [
 								                client for client in requested_clients if not INNERTUBE_CLIENTS[client]['SUPPORTS_COOKIES']
 								            ]
 								            for client in unsupported_clients:
 								                self.report_warning(f'Skipping client "{client}" since it does not support cookies', only_once=True)
 								                requested_clients.remove(client)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        return orderedSet(requested_clients)
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 21:30:34 +06:00
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-25 00:20:22 +01:00
+								    def _invalid_player_response(self, pr, video_id):
 								        # YouTube may return a different video player response than expected.
 								        # See: https://github.com/TeamNewPipe/NewPipe/issues/8713
 								        if (pr_id := traverse_obj(pr, ('videoDetails', 'videoId'))) != video_id:
 								            return pr_id
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								    def _extract_player_responses(self, clients, video_id, webpage, webpage_client, webpage_ytcfg, is_premium_subscriber):
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								        initial_pr = None
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        if webpage:
-												[ie/youtube] Fix initial player response usage (Bugfix for 8b8b442cb005a8d85315f301615f83fb736b967a) (#10464)

Authored by: seproDev
											
										
										
											2024-07-14 20:42:11 +02:00
+								            initial_pr = self._search_json(
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                self._YT_INITIAL_PLAYER_RESPONSE_RE, webpage,
 								                f'{webpage_client} client initial player response', video_id, fatal=False)
-												[youtube] Skip broken multifeed videos (closes #24711)

											
										
										
											2020-04-09 22:42:43 +07:00
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-25 00:20:22 +01:00
+								        prs = []
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								        deprioritized_prs = []
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-25 00:20:22 +01:00
+								        if initial_pr and not self._invalid_player_response(initial_pr, video_id):
 								            # Android player_response does not have microFormats which are needed for
 								            # extraction of some data. So we return the initial_pr with formats
 								            # stripped out even if not requested by the user
 								            # See: https://github.com/yt-dlp/yt-dlp/issues/501
 								            prs.append({**initial_pr, 'streamingData': None})
-												[youtube] Try embedded client variants before agegate

agegate variants appears to be broken, but don't remove them for the time-being

											
										
										
											2022-03-25 05:00:41 +05:30
+								        all_clients = set(clients)
-												[YouTube] Age-gate bypass implementation (#575)

* Calling the API with `clientScreen=EMBED` allows access to most age-gated videos - discovered by @ccdffddfddfdsfedeee (https://github.com/yt-dlp/yt-dlp/issues/574#issuecomment-887171136)
* Adds clients: (web/android/ios)_(embedded/agegate), mweb_embedded
* Renamed mobile_web to mweb

Closes #574

Authored by pukkandan, MinePlayersPE
											
										
										
											2021-07-27 16:40:44 +07:00
+								        clients = clients[::-1]
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 23:13:46 +02:00
-												[youtube] Try embedded client variants before agegate

agegate variants appear to be broken, but don't remove them for the time being

											
										
										
											2022-03-25 05:00:41 +05:30
+								        def append_client(*client_names):
-												[YouTube] Add new age-gate bypass (#3233)

Closes #3182
Authored by: zerodytrash, pukkandan
											
										
										
											2022-03-29 03:05:31 -07:00
+								            """ Append the first client name that exists but not already used """
-												[youtube] Try embedded client variants before agegate

agegate variants appear to be broken, but don't remove them for the time being

											
										
										
											2022-03-25 05:00:41 +05:30
+								            for client_name in client_names:
-												[YouTube] Add new age-gate bypass (#3233)

Closes #3182
Authored by: zerodytrash, pukkandan
											
										
										
											2022-03-29 03:05:31 -07:00
+								                actual_client = _split_innertube_client(client_name)[0]
 								                if actual_client in INNERTUBE_CLIENTS:
 								                    if actual_client not in all_clients:
-												[youtube] Try embedded client variants before agegate

agegate variants appear to be broken, but don't remove them for the time being

											
										
										
											2022-03-25 05:00:41 +05:30
+								                        clients.append(client_name)
-												[YouTube] Add new age-gate bypass (#3233)

Closes #3182
Authored by: zerodytrash, pukkandan
											
										
										
											2022-03-29 03:05:31 -07:00
+								                        all_clients.add(actual_client)
 								                        return
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 23:13:46 +02:00
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								        tried_iframe_fallback = False
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								        player_url = visitor_data = data_sync_id = None
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-25 00:20:22 +01:00
+								        skipped_clients = {}
-												[YouTube] Age-gate bypass implementation (#575)

* Calling the API with `clientScreen=EMBED` allows access to most age-gated videos - discovered by @ccdffddfddfdsfedeee (https://github.com/yt-dlp/yt-dlp/issues/574#issuecomment-887171136)
* Adds clients: (web/android/ios)_(embedded/agegate), mweb_embedded
* Renamed mobile_web to mweb

Closes #574

Authored by pukkandan, MinePlayersPE
											
										
										
											2021-07-27 16:40:44 +07:00
+								        while clients:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            deprioritize_pr = False
-												[YouTube] Add new age-gate bypass (#3233)

Closes #3182
Authored by: zerodytrash, pukkandan
											
										
										
											2022-03-29 03:05:31 -07:00
+								            client, base_client, variant = _split_innertube_client(clients.pop())
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            player_ytcfg = webpage_ytcfg if client == webpage_client else {}
 								            if 'configs' not in self._configuration_arg('player_skip') and client != webpage_client:
-												[youtube, cleanup] Minor refactoring

Authored by: coletdjnz, pukkandan

											
										
										
											2022-04-10 01:00:21 +05:30
+								                player_ytcfg = self._download_ytcfg(client, video_id) or player_ytcfg
-												[YouTube] Age-gate bypass implementation (#575)

* Calling the API with `clientScreen=EMBED` allows access to most age-gated videos - discovered by @ccdffddfddfdsfedeee (https://github.com/yt-dlp/yt-dlp/issues/574#issuecomment-887171136)
* Adds clients: (web/android/ios)_(embedded/agegate), mweb_embedded
* Renamed mobile_web to mweb

Closes #574

Authored by pukkandan, MinePlayersPE
											
										
										
											2021-07-27 16:40:44 +07:00
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            player_url = player_url or self._extract_player_url(webpage_ytcfg, player_ytcfg, webpage=webpage)
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								            require_js_player = self._get_default_ytcfg(client).get('REQUIRE_JS_PLAYER')
 								            if 'js' in self._configuration_arg('player_skip'):
 								                require_js_player = False
 								                player_url = None
 								            if not player_url and not tried_iframe_fallback and require_js_player:
 								                player_url = self._download_player_url(video_id)
 								                tried_iframe_fallback = True
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            pr = None
 								            if client == webpage_client and 'player_response' not in self._configuration_arg('webpage_skip'):
 								                pr = initial_pr
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            visitor_data = visitor_data or self._extract_visitor_data(webpage_ytcfg, initial_pr, player_ytcfg)
 								            data_sync_id = data_sync_id or self._extract_data_sync_id(webpage_ytcfg, initial_pr, player_ytcfg)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								            fetch_po_token_args = {
 								                'client': client,
 								                'visitor_data': visitor_data,
 								                'video_id': video_id,
 								                'data_sync_id': data_sync_id if self.is_authenticated else None,
 								                'player_url': player_url if require_js_player else None,
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								                'webpage': webpage,
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                'session_index': self._extract_session_index(webpage_ytcfg, player_ytcfg),
-												[ie/youtube] Add a PO Token Provider Framework (#12840)

https://github.com/yt-dlp/yt-dlp/tree/master/yt_dlp/extractor/youtube/pot/README.md

Authored by: coletdjnz
											
										
										
											2025-05-18 13:45:26 +12:00
+								                'ytcfg': player_ytcfg or self._get_default_ytcfg(client),
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								            }
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								            # Don't need a player PO token for WEB if using player response from webpage
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            player_pot_policy: PlayerPoTokenPolicy = self._get_default_ytcfg(client)['PLAYER_PO_TOKEN_POLICY']
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								            player_po_token = None if pr else self.fetch_po_token(
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                context=_PoTokenContext.PLAYER, **fetch_po_token_args,
 								                required=player_pot_policy.required or player_pot_policy.recommended)
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            fetch_gvs_po_token_func = functools.partial(
 								                self.fetch_po_token, context=_PoTokenContext.GVS, **fetch_po_token_args)
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								            fetch_subs_po_token_func = functools.partial(
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                self.fetch_po_token, context=_PoTokenContext.SUBS, **fetch_po_token_args)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
 								            try:
 								                pr = pr or self._extract_player_response(
 								                    client, video_id,
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                    webpage_ytcfg=player_ytcfg or webpage_ytcfg,
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                    player_ytcfg=player_ytcfg,
 								                    player_url=player_url,
 								                    initial_pr=initial_pr,
 								                    visitor_data=visitor_data,
 								                    data_sync_id=data_sync_id,
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								                    po_token=player_po_token)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            except ExtractorError as e:
 								                self.report_warning(e)
-												[youtube] Raise appropriate error when API pages can't be downloaded

											
										
										
											2021-08-07 12:15:58 +05:30
+								                continue
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-25 00:20:22 +01:00
+								            if pr_id := self._invalid_player_response(pr, video_id):
 								                skipped_clients[client] = pr_id
 								            elif pr:
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                # Save client details for introspection later
 								                innertube_context = traverse_obj(player_ytcfg or self._get_default_ytcfg(client), 'INNERTUBE_CONTEXT')
-												[ie/youtube] Optimize playback wait times (#14124)

Authored by: bashonly
											
										
										
											2025-08-22 18:53:28 -05:00
+								                fetched_timestamp = int(time.time())
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                sd = pr.setdefault('streamingData', {})
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                sd[STREAMING_DATA_CLIENT_NAME] = client
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                sd[STREAMING_DATA_FETCH_GVS_PO_TOKEN] = fetch_gvs_po_token_func
 								                sd[STREAMING_DATA_PLAYER_TOKEN_PROVIDED] = bool(player_po_token)
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                sd[STREAMING_DATA_INNERTUBE_CONTEXT] = innertube_context
 								                sd[STREAMING_DATA_FETCH_SUBS_PO_TOKEN] = fetch_subs_po_token_func
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                sd[STREAMING_DATA_IS_PREMIUM_SUBSCRIBER] = is_premium_subscriber
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-25 00:20:22 +01:00
+								                for f in traverse_obj(sd, (('formats', 'adaptiveFormats'), ..., {dict})):
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                    f[STREAMING_DATA_CLIENT_NAME] = client
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                    f[STREAMING_DATA_FETCH_GVS_PO_TOKEN] = fetch_gvs_po_token_func
 								                    f[STREAMING_DATA_IS_PREMIUM_SUBSCRIBER] = is_premium_subscriber
 								                    f[STREAMING_DATA_PLAYER_TOKEN_PROVIDED] = bool(player_po_token)
-												[ie/youtube] Optimize playback wait times (#14124)

Authored by: bashonly
											
										
										
											2025-08-22 18:53:28 -05:00
+								                    f[STREAMING_DATA_FETCHED_TIMESTAMP] = fetched_timestamp
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                if deprioritize_pr:
 								                    deprioritized_prs.append(pr)
 								                else:
 								                    prs.append(pr)
-												[YouTube] Age-gate bypass implementation (#575)

* Calling the API with `clientScreen=EMBED` allows access to most age-gated videos - discovered by @ccdffddfddfdsfedeee (https://github.com/yt-dlp/yt-dlp/issues/574#issuecomment-887171136)
* Adds clients: (web/android/ios)_(embedded/agegate), mweb_embedded
* Renamed mobile_web to mweb

Closes #574

Authored by pukkandan, MinePlayersPE
											
										
										
											2021-07-27 16:40:44 +07:00
-												[ie/youtube] Add `web_embedded` client for age-restricted videos (#13089)

Authored by: bashonly
											
										
										
											2025-05-03 15:11:40 -05:00
+								            # web_embedded can work around age-gate and age-verification for some embeddable videos
 								            if self._is_agegated(pr) and variant != 'web_embedded':
 								                append_client(f'web_embedded.{base_client}')
 								            # Unauthenticated users will only get web_embedded client formats if age-gated
 								            if self._is_agegated(pr) and not self.is_authenticated:
 								                self.to_screen(
 								                    f'{video_id}: This video is age-restricted; some formats may be missing '
 								                    f'without authentication. {self._youtube_login_hint}', only_once=True)
-												[ie/youtube] Restore convenience workarounds (#12181)

Authored by: bashonly
											
										
										
											2025-01-25 10:18:15 -06:00
+								            # EU countries require age-verification for accounts to access age-restricted videos
 								            # If account is not age-verified, _is_agegated() will be truthy for non-embedded clients
-												[ie/youtube] Add `web_embedded` client for age-restricted videos (#13089)

Authored by: bashonly
											
										
										
											2025-05-03 15:11:40 -05:00
+								            embedding_is_disabled = variant == 'web_embedded' and self._is_unplayable(pr)
 								            if self.is_authenticated and (self._is_agegated(pr) or embedding_is_disabled):
-												[ie/youtube] Restore convenience workarounds (#12181)

Authored by: bashonly
											
										
										
											2025-01-25 10:18:15 -06:00
+								                self.to_screen(
 								                    f'{video_id}: This video is age-restricted and YouTube is requiring '
 								                    'account age-verification; some formats may be missing', only_once=True)
 								                # tv_embedded can work around the age-verification requirement for embeddable videos
 								                # web_creator may work around age-verification for all videos but requires PO token
 								                append_client('tv_embedded', 'web_creator')
-												[ie/youtube] Log bad playability statuses of player responses (#13647)

Authored by: coletdjnz
											
										
										
											2025-07-09 18:29:54 +12:00
+								            status = traverse_obj(pr, ('playabilityStatus', 'status', {str}))
 								            if status not in ('OK', 'LIVE_STREAM_OFFLINE', 'AGE_CHECK_REQUIRED', 'AGE_VERIFICATION_REQUIRED'):
 								                self.write_debug(f'{video_id}: {client} player response playability status: {status}')
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								        prs.extend(deprioritized_prs)
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-25 00:20:22 +01:00
+								        if skipped_clients:
 								            self.report_warning(
 								                f'Skipping player responses from {"/".join(skipped_clients)} clients '
 								                f'(got player responses for video "{"/".join(set(skipped_clients.values()))}" instead of "{video_id}")')
 								            if not prs:
 								                raise ExtractorError(
 								                    'All player responses are invalid. Your IP is likely being blocked by Youtube', expected=True)
 								        elif not prs:
 								            raise ExtractorError('Failed to extract any player response')
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								        return prs, player_url
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								    def _needs_live_processing(self, live_status, duration):
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 16:29:30 +01:00
+								        if ((live_status == 'is_live' and self.get_param('live_from_start'))
 								                or (live_status == 'post_live' and (duration or 0) > 2 * 3600)):
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            return live_status
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-24 12:03:28 +13:00
+								    def _report_pot_format_skipped(self, video_id, client_name, proto):
 								        msg = (
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								            f'{video_id}: {client_name} client {proto} formats require a GVS PO Token which was not provided. '
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-24 12:03:28 +13:00
+								            'They will be skipped as they may yield HTTP Error 403. '
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-25 13:17:37 +13:00
+								            f'You can manually pass a GVS PO Token for this client with --extractor-args "youtube:po_token={client_name}.gvs+XXX". '
-												[ie/youtube] Replace `ios` with `tv_simply` in default clients (#14123)

Also:
- Add `web_safari` to default logged-in clients
- Add `web_creator` to default premium clients
- Flag `ios` HLS formats as requiring PO token

Closes #13702
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-08-22 18:49:54 -05:00
+								            f'For more information, refer to  {PO_TOKEN_GUIDE_URL}')
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-24 12:03:28 +13:00
 								        # Only raise a warning for non-default clients, to not confuse users.
 								        if client_name in (*self._DEFAULT_CLIENTS, *self._DEFAULT_AUTHED_CLIENTS):
 								            self.write_debug(msg, only_once=True)
 								        else:
 								            self.report_warning(msg, only_once=True)
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								    def _report_pot_subtitles_skipped(self, video_id, client_name, msg=None):
 								        msg = msg or (
 								            f'{video_id}: Some {client_name} client subtitles require a PO Token which was not provided. '
 								            'They will be discarded since they are not downloadable as-is. '
 								            f'You can manually pass a Subtitles PO Token for this client with '
 								            f'--extractor-args "youtube:po_token={client_name}.subs+XXX" . '
 								            f'For more information, refer to  {PO_TOKEN_GUIDE_URL}')
 								        subs_wanted = any((
 								            self.get_param('writesubtitles'),
 								            self.get_param('writeautomaticsub'),
 								            self.get_param('listsubtitles')))
 								        # Only raise a warning for non-default clients, to not confuse users.
 								        if not subs_wanted or client_name in (*self._DEFAULT_CLIENTS, *self._DEFAULT_AUTHED_CLIENTS):
 								            self.write_debug(msg, only_once=True)
 								        else:
 								            self.report_warning(msg, only_once=True)
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								    def _extract_formats_and_subtitles(self, streaming_data, video_id, player_url, live_status, duration):
-												Fix 2a23d92d9ec44a0168079e38bcf3d383e5c4c7bb

Closes #6517

											
										
										
											2023-03-12 14:46:09 +05:30
+								        CHUNK_SIZE = 10 << 20
-												[ie/youtube] Extract all formats from multi-language m3u8s (#9875)

Authored by: clienthax, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-06-20 22:54:53 +01:00
+								        PREFERRED_LANG_VALUE = 10
 								        original_language = None
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-15 05:23:32 +05:30
+								        itags, stream_ids = collections.defaultdict(set), []
-												[extractor/youtube] Fix bug in format sorting

											
										
										
											2022-08-21 00:56:27 +05:30
+								        itag_qualities, res_qualities = {}, {0: None}
-												[youtube] Sort audio-only formats correctly
Closes #317

											
										
										
											2021-05-18 01:11:57 +05:30
+								        q = qualities([
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-26 03:33:42 +05:30
+								            # Normally tiny is the smallest video-only format. But
 								            # audio-only formats with unknown quality may get tagged as tiny
 								            'tiny',
 								            'audio_quality_ultralow', 'audio_quality_low', 'audio_quality_medium', 'audio_quality_high',  # Audio only formats
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            'small', 'medium', 'large', 'hd720', 'hd1080', 'hd1440', 'hd2160', 'hd2880', 'highres',
-												[youtube] Sort audio-only formats correctly
Closes #317

											
										
										
											2021-05-18 01:11:57 +05:30
+								        ])
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								        streaming_formats = traverse_obj(streaming_data, (..., ('formats', 'adaptiveFormats'), ...))
-												[extractor/youtube] Add extractor-arg `formats`

Closes #7417

											
										
										
											2023-06-25 20:10:00 +05:30
+								        format_types = self._configuration_arg('formats')
 								        all_formats = 'duplicate' in format_types
 								        if self._configuration_arg('include_duplicate_formats'):
 								            all_formats = True
 								            self._downloader.deprecated_feature('[youtube] include_duplicate_formats extractor argument is deprecated. '
 								                                                'Use formats=duplicate extractor argument instead')
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-16 02:38:47 +12:00
-												Fix 2a23d92d9ec44a0168079e38bcf3d383e5c4c7bb

Closes #6517

											
										
										
											2023-03-12 14:46:09 +05:30
+								        def build_fragments(f):
 								            return LazyList({
 								                'url': update_url_query(f['url'], {
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                    'range': f'{range_start}-{min(range_start + CHUNK_SIZE - 1, f["filesize"])}',
 								                }),
-												Fix 2a23d92d9ec44a0168079e38bcf3d383e5c4c7bb

Closes #6517

											
										
										
											2023-03-12 14:46:09 +05:30
+								            } for range_start in range(0, f['filesize'], CHUNK_SIZE))
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								        def gvs_pot_required(policy, is_premium_subscriber, has_player_token):
 								            # Evaluate whether a GVS PO Token is mandatory under `policy`.
 								            # The result is truthy only if `policy.required` is set and
 								            # neither of the two exemptions below applies.
 								            return (
 								                policy.required
 								                # Exemption: the policy waives the token when a player token was provided
 								                and not (policy.not_required_with_player_token and has_player_token)
 								                # Exemption: the policy waives the token for premium subscribers
 								                and not (policy.not_required_for_premium and is_premium_subscriber))
 								        # save pots per client to avoid fetching again
 								        gvs_pots = {}
-												[ie/youtube] Optimize playback wait times (#14124)

Authored by: bashonly
											
										
										
											2025-08-22 18:53:28 -05:00
+								        # For handling potential pre-playback required waiting period
 								        playback_wait = int_or_none(self._configuration_arg('playback_wait', [None])[0], default=6)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        for fmt in streaming_formats:
-												[ie/youtube] Warn on missing formats due to SSAP (#12483)

See https://github.com/yt-dlp/yt-dlp/issues/12482

Authored by: coletdjnz
											
										
										
											2025-02-28 19:33:31 +13:00
+								            client_name = fmt[STREAMING_DATA_CLIENT_NAME]
-												[ie/youtube] Optimize playback wait times (#14124)

Authored by: bashonly
											
										
										
											2025-08-22 18:53:28 -05:00
+								            available_at = fmt[STREAMING_DATA_FETCHED_TIMESTAMP] + playback_wait
-												[youtube] Detect DRM better

Authored by: shirt-dev

											
										
										
											2022-03-27 01:28:26 -04:00
+								            if fmt.get('targetDurationSec'):
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                continue
-												check live chat replay existence

											
										
										
											2020-08-05 03:30:10 +03:00
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-11 02:52:55 +05:30
+								            itag = str_or_none(fmt.get('itag'))
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-16 02:38:47 +12:00
+								            audio_track = fmt.get('audioTrack') or {}
-												[extractor/youtube] Extract DRC formats

											
										
										
											2022-12-30 15:32:33 +05:30
+								            stream_id = (itag, audio_track.get('id'), fmt.get('isDrc'))
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 23:13:02 +05:30
+								            if not all_formats:
 								                if stream_id in stream_ids:
 								                    continue
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-16 02:38:47 +12:00
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-11 02:52:55 +05:30
+								            quality = fmt.get('quality')
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-26 03:33:42 +05:30
+								            height = int_or_none(fmt.get('height'))
-												[youtube] Sort audio-only formats correctly
Closes #317

											
										
										
											2021-05-18 01:11:57 +05:30
+								            if quality == 'tiny' or not quality:
 								                quality = fmt.get('audioQuality', '').lower() or quality
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-26 03:33:42 +05:30
+								            # The 3gp format (17) in android client has a quality of "small",
 								            # but is actually worse than other formats
 								            if itag == '17':
 								                quality = 'tiny'
 								            if quality:
 								                if itag:
 								                    itag_qualities[itag] = quality
 								                if height:
 								                    res_qualities[height] = quality
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
-												[ie/youtube] Prioritize original language over auto-dubbed audio (#11803)

Closes #11753
Authored by: bashonly
											
										
										
											2024-12-13 10:21:48 +00:00
+								            display_name = audio_track.get('displayName') or ''
 								            is_original = 'original' in display_name.lower()
 								            is_descriptive = 'descriptive' in display_name.lower()
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								            is_default = audio_track.get('audioIsDefault')
 								            language_code = audio_track.get('id', '').split('.')[0]
-												[ie/youtube] Prioritize original language over auto-dubbed audio (#11803)

Closes #11753
Authored by: bashonly
											
										
										
											2024-12-13 10:21:48 +00:00
+								            if language_code and (is_original or (is_default and not original_language)):
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								                original_language = language_code
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-16 10:28:16 +13:00
+								            has_drm = bool(fmt.get('drmFamilies'))
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-11 02:52:55 +05:30
+								            # FORMAT_STREAM_TYPE_OTF(otf=1) requires downloading the init fragment
 								            # (adding `&sq=0` to the URL) and parsing emsg box to determine the
 								            # number of fragments that would subsequently be requested with (`&sq=N`)
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-16 10:28:16 +13:00
+								            if fmt.get('type') == 'FORMAT_STREAM_TYPE_OTF' and not has_drm:
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-11 02:52:55 +05:30
+								                continue
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-16 10:28:16 +13:00
+								            if has_drm:
 								                msg = f'Some {client_name} client https formats have been skipped as they are DRM protected. '
 								                if client_name == 'tv':
 								                    msg += (
 								                        f'{"Your account" if self.is_authenticated else "The current session"} may have '
 								                        f'an experiment that applies DRM to all videos on the tv client. '
 								                        f'See  https://github.com/yt-dlp/yt-dlp/issues/12563  for more details.'
 								                    )
 								                self.report_warning(msg, video_id, only_once=True)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            fmt_url = fmt.get('url')
 								            if not fmt_url:
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 16:24:43 +05:30
+								                sc = urllib.parse.parse_qs(fmt.get('signatureCipher'))
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                fmt_url = url_or_none(try_get(sc, lambda x: x['url'][0]))
 								                encrypted_sig = try_get(sc, lambda x: x['s'][0])
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 23:44:36 +05:30
+								                if not all((sc, fmt_url, player_url, encrypted_sig)):
-												[ie/youtube] Improve warning for SABR-only/SSAP player responses (#13049)

Ref: https://github.com/yt-dlp/yt-dlp/issues/12482

Authored by: bashonly
											
										
										
											2025-04-29 20:13:35 -05:00
+								                    msg = f'Some {client_name} client https formats have been skipped as they are missing a url. '
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                    if client_name in ('web', 'web_safari'):
-												[ie/youtube] Improve warning for SABR-only/SSAP player responses (#13049)

Ref: https://github.com/yt-dlp/yt-dlp/issues/12482

Authored by: bashonly
											
										
										
											2025-04-29 20:13:35 -05:00
+								                        msg += 'YouTube is forcing SABR streaming for this client. '
 								                    else:
 								                        msg += (
 								                            f'YouTube may have enabled the SABR-only or Server-Side Ad Placement experiment for '
 								                            f'{"your account" if self.is_authenticated else "the current session"}. '
 								                        )
 								                    msg += 'See  https://github.com/yt-dlp/yt-dlp/issues/12482  for more details'
 								                    self.report_warning(msg, video_id, only_once=True)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                    continue
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 23:44:36 +05:30
+								                try:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                    fmt_url += '&{}={}'.format(
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 23:44:36 +05:30
+								                        traverse_obj(sc, ('sp', -1)) or 'signature',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                        self._decrypt_signature(encrypted_sig, video_id, player_url),
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 23:44:36 +05:30
+								                    )
 								                except ExtractorError as e:
-												[ie/youtube] Improve signature extraction debug output (#13327)

Authored by: bashonly
											
										
										
											2025-05-30 18:16:47 -05:00
+								                    self.report_warning(
 								                        f'Signature extraction failed: Some formats may be missing\n'
 								                        f'         player = {player_url}\n'
 								                        f'         {bug_reports_message(before="")}',
 								                        video_id=video_id, only_once=True)
 								                    self.write_debug(
 								                        f'{video_id}: Signature extraction failure info:\n'
 								                        f'         encrypted sig = {encrypted_sig}\n'
 								                        f'         player = {player_url}')
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 23:44:36 +05:30
+								                    self.write_debug(e, only_once=True)
-												[youtube] Show format ID in signature deobfuscation -v output

											
										
										
											2014-08-02 06:35:18 +02:00
+								                    continue
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
+								            query = parse_qs(fmt_url)
-												[youtube] Decrypt n-sig for URLs with `ratebypass`
Closes #1796

											
										
										
											2021-11-28 18:01:46 +05:30
+								            if query.get('n'):
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
+								                try:
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								                    decrypt_nsig = self._cached(self._decrypt_nsig, 'nsig', query['n'][0])
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
+								                    fmt_url = update_url_query(fmt_url, {
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                        'n': decrypt_nsig(query['n'][0], video_id, player_url),
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 21:27:41 +05:30
+								                    })
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
+								                except ExtractorError as e:
-												[docs] Improvements

* Move detailed installation instructions to https://github.com/yt-dlp/yt-dlp/wiki/Installation
* Link to wiki where applicable
* Fix some mistakes. Closes #4853, Closes #4855, Closes #4852
* Improve some error messages

											
										
										
											2022-09-07 17:35:45 +05:30
+								                    if player_url:
 								                        self.report_warning(
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 21:58:10 +01:00
+								                            f'nsig extraction failed: Some formats may be missing\n'
-												[ie/youtube] Add `player_js_variant` extractor-arg  (#12767)

- Always distinguish between different JS variants' code/functions
- Change naming scheme for nsig and sigfuncs in disk cache

Authored by: bashonly
											
										
										
											2025-03-31 14:45:48 -05:00
+								                            f'         n = {query["n"][0]} ; player = {player_url}\n'
 								                            f'         {bug_reports_message(before="")}',
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 21:58:10 +01:00
+								                            video_id=video_id, only_once=True)
-												[docs] Improvements

* Move detailed installation instructions to https://github.com/yt-dlp/yt-dlp/wiki/Installation
* Link to wiki where applicable
* Fix some mistakes. Closes #4853, Closes #4855, Closes #4852
* Improve some error messages

											
										
										
											2022-09-07 17:35:45 +05:30
+								                        self.write_debug(e, only_once=True)
 								                    else:
 								                        self.report_warning(
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								                            'Cannot decrypt nsig without player_url: Some formats may be missing',
-												[docs] Improvements

* Move detailed installation instructions to https://github.com/yt-dlp/yt-dlp/wiki/Installation
* Link to wiki where applicable
* Fix some mistakes. Closes #4853, Closes #4855, Closes #4852
* Improve some error messages

											
										
										
											2022-09-07 17:35:45 +05:30
+								                            video_id=video_id, only_once=True)
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								                    continue
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-31 09:53:58 +05:30
-												[core] Fix `filesize_approx` calculation (#9560)

Reverts 22e4dfacb61f62dfbb3eb41b31c7b69ba1059b80

Despite being documented as `Kbit/s`, the extractors/manifests were returning bitrates in SI units of kilobits/sec.

Authored by: seproDev, pukkandan
											
										
										
											2024-04-01 01:17:24 +02:00
+								            tbr = float_or_none(fmt.get('averageBitrate') or fmt.get('bitrate'), 1000)
-												[cleanup] Misc (#11347)

Closes #11361
Authored by: avagordon01, bashonly, grqz, Grub4K, seproDev

Co-authored-by: Ava Gordon <avagordon01@gmail.com>
Co-authored-by: bashonly <bashonly@protonmail.com>
Co-authored-by: N/Ame <173015200+grqz@users.noreply.github.com>
Co-authored-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-11-04 01:33:21 +01:00
+								            format_duration = traverse_obj(fmt, ('approxDurationMs', {float_or_none(scale=1000)}))
-												[youtube] De-prioritize potentially damaged formats

Closes #2823

											
										
										
											2022-02-18 19:41:37 +05:30
+								            # Some formats may have much smaller duration than others (possibly damaged during encoding)
-												[docs] Consistent use of `e.g.` (#4643)

Authored by: Lesmiscore
											
										
										
											2022-08-14 21:04:13 +09:00
+								            # E.g. 2-nOtRESiUc Ref: https://github.com/yt-dlp/yt-dlp/issues/2823
-												[youtube] Avoid false positives when detecting damaged formats

Closes #3083

											
										
										
											2022-03-16 19:46:19 +05:30
+								            # Make sure to avoid false positives with small duration differences.
-												[docs] Consistent use of `e.g.` (#4643)

Authored by: Lesmiscore
											
										
										
											2022-08-14 21:04:13 +09:00
+								            # E.g. __2ABJjxzNo, ySuUZEjARPY
-												[ie/youtube] Calculate more accurate `filesize`

YouTube provides slightly different duration for each format.
Calculating file-size based on this duration instead of the
video duration gives more accurate results.

Ref: https://github.com/yt-dlp/yt-dlp/issues/1400#issuecomment-2007441207

											
										
										
											2024-04-01 02:20:03 +05:30
+								            is_damaged = try_call(lambda: format_duration < duration // 2)
-												[cleanup, docs] Misc cleanup

Closes #2828, closes #2734, closes #2802, closes #2937

											
										
										
											2022-03-04 19:38:55 +05:30
+								            if is_damaged:
-												[cleanup] Minor fixes (See desc)

* [youtube] Fix `--youtube-skip-dash-manifest`
* [build] Use `$()` in `Makefile`. Closes #3684
* Fix bug in 385ffb467b2285e85a2a5495b90314ba1f8e0700
* Fix bug in 43d7f5a5d0c77556156a3f8caa6976d3908a1e38
* [cleanup] Remove unnecessary `utf-8` from `str.encode`/`bytes.decode`
* [utils] LazyList: Expose unnecessarily "protected" attributes
and other minor cleanup

											
										
										
											2022-05-09 17:24:28 +05:30
+								                self.report_warning(
-												[cleanup] Misc (#12802)

Authored by: bashonly
											
										
										
											2025-03-31 16:38:21 -05:00
+								                    'Some formats are possibly damaged. They will be deprioritized', video_id, only_once=True)
-												[extractor/youtube] Add client name to `format_note` when `-v` (#6254)

Authored by: Lesmiscore, pukkandan
											
										
										
											2023-03-12 02:03:23 +09:00
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            fetch_po_token_func = fmt[STREAMING_DATA_FETCH_GVS_PO_TOKEN]
 								            pot_policy: GvsPoTokenPolicy = self._get_default_ytcfg(client_name)['GVS_PO_TOKEN_POLICY'][StreamingProtocol.HTTPS]
 								            require_po_token = (
 								                itag not in ['18']
 								                and gvs_pot_required(
 								                    pot_policy, fmt[STREAMING_DATA_IS_PREMIUM_SUBSCRIBER],
 								                    fmt[STREAMING_DATA_PLAYER_TOKEN_PROVIDED]))
 								            po_token = (
 								                gvs_pots.get(client_name)
 								                or fetch_po_token_func(required=require_po_token or pot_policy.recommended))
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
 								            if po_token:
 								                fmt_url = update_url_query(fmt_url, {'pot': po_token})
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                if client_name not in gvs_pots:
 								                    gvs_pots[client_name] = po_token
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            if not po_token and require_po_token and 'missing_pot' not in self._configuration_arg('formats'):
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-24 12:03:28 +13:00
+								                self._report_pot_format_skipped(video_id, client_name, 'https')
 								                continue
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-18 04:03:02 +12:00
-												[extractor/youtube] Prioritize premium formats

Closes #7283

											
										
										
											2023-06-19 14:09:26 +05:30
+								            name = fmt.get('qualityLabel') or quality.replace('audio_quality_', '') or ''
-												[extractor/youtube] Ignore wrong fps of some formats

											
										
										
											2023-06-21 05:11:14 +05:30
+								            fps = int_or_none(fmt.get('fps')) or 0
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            dct = {
 								                'asr': int_or_none(fmt.get('audioSampleRate')),
 								                'filesize': int_or_none(fmt.get('contentLength')),
-												[extractor/youtube] Extract DRC formats

											
										
										
											2022-12-30 15:32:33 +05:30
+								                'format_id': f'{itag}{"-drc" if fmt.get("isDrc") else ""}',
-												[utils] Add `join_nonempty`

											
										
										
											2021-11-06 06:35:24 +05:30
+								                'format_note': join_nonempty(
-												[ie/youtube] Prioritize original language over auto-dubbed audio (#11803)

Closes #11753
Authored by: bashonly
											
										
										
											2024-12-13 10:21:48 +00:00
+								                    join_nonempty(display_name, is_default and ' (default)', delim=''),
-												[extractor/youtube] Prioritize premium formats

Closes #7283

											
										
										
											2023-06-19 14:09:26 +05:30
+								                    name, fmt.get('isDrc') and 'DRC',
-												[extractor/youtube] Extract more format info

											
										
										
											2022-08-08 01:36:11 +05:30
+								                    try_get(fmt, lambda x: x['projectionType'].replace('RECTANGULAR', '').lower()),
 								                    try_get(fmt, lambda x: x['spatialAudioType'].replace('SPATIAL_AUDIO_TYPE_', '').lower()),
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                    is_damaged and 'DAMAGED', require_po_token and not po_token and 'MISSING POT',
-												[ie/youtube] Fix `format_note` (Bugfix for 3a3bd00037e9908e87da4fa9f2ad772aa34dc60e) (#11028)

Authored by: bashonly
											
										
										
											2024-09-24 17:12:02 -05:00
+								                    (self.get_param('verbose') or all_formats) and short_client_name(client_name),
-												[extractor/youtube] Add client name to `format_note` when `-v` (#6254)

Authored by: Lesmiscore, pukkandan
											
										
										
											2023-03-12 02:03:23 +09:00
+								                    delim=', '),
-												[youtube] Deprioritize format 22

Reduces chance of encountering #3372

											
										
										
											2022-05-07 08:03:41 +05:30
+								                # Format 22 is likely to be damaged. See https://github.com/yt-dlp/yt-dlp/issues/3372
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								                'source_preference': (-5 if itag == '22' else -1) + (100 if 'Premium' in name else 0),
-												[extractor/youtube] Ignore wrong fps of some formats

											
										
										
											2023-06-21 05:11:14 +05:30
+								                'fps': fps if fps > 1 else None,  # For some formats, fps is wrongly returned as 1
-												[extractor/youtube] Extract more format info

											
										
										
											2022-08-08 01:36:11 +05:30
+								                'audio_channels': fmt.get('audioChannels'),
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-26 03:33:42 +05:30
+								                'height': height,
-												[extractor/youtube] Extract DRC formats

											
										
										
											2022-12-30 15:32:33 +05:30
+								                'quality': q(quality) - bool(fmt.get('isDrc')) / 2,
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-16 10:28:16 +13:00
+								                'has_drm': has_drm,
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-11 02:52:55 +05:30
+								                'tbr': tbr,
-												[ie/youtube] Calculate more accurate `filesize`

YouTube provides slightly different duration for each format.
Calculating file-size based on this duration instead of the
video duration gives more accurate results.

Ref: https://github.com/yt-dlp/yt-dlp/issues/1400#issuecomment-2007441207

											
										
										
											2024-04-01 02:20:03 +05:30
+								                'filesize_approx': filesize_from_tbr(tbr, format_duration),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                'url': fmt_url,
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-26 03:33:42 +05:30
+								                'width': int_or_none(fmt.get('width')),
-												[ie/youtube] Extract all formats from multi-language m3u8s (#9875)

Authored by: clienthax, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-06-20 22:54:53 +01:00
+								                'language': join_nonempty(language_code, 'desc' if is_descriptive else '') or None,
-												[ie/youtube] Prioritize original language over auto-dubbed audio (#11803)

Closes #11753
Authored by: bashonly
											
										
										
											2024-12-13 10:21:48 +00:00
+								                'language_preference': PREFERRED_LANG_VALUE if is_original else 5 if is_default else -10 if is_descriptive else -1,
-												[ie/youtube] Do not strictly deprioritize `missing_pot` formats (#13061)

Deprioritization was redundant; they're already hidden behind an extractor-arg

Authored by: bashonly
											
										
										
											2025-04-30 17:51:40 -05:00
+								                # Strictly de-prioritize damaged and 3gp formats
 								                'preference': -10 if is_damaged else -2 if itag == '17' else None,
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            }
-												[youtube] Fix sorting of 3gp format

											
										
										
											2021-07-08 21:41:08 +05:30
+								            mime_mobj = re.match(
 								                r'((?:[^/]+)/(?:[^;]+))(?:;\s*codecs="([^"]+)")?', fmt.get('mimeType') or '')
 								            if mime_mobj:
 								                dct['ext'] = mimetype2ext(mime_mobj.group(1))
 								                dct.update(parse_codecs(mime_mobj.group(2)))
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 23:13:02 +05:30
+								            if itag:
 								                itags[itag].add(('https', dct.get('language')))
 								                stream_ids.append(stream_id)
-												[extractor/youtube] Bypass throttling for `-f17`

and related cleanup

Thanks @AudricV for the finding

											
										
										
											2023-03-09 22:09:23 +05:30
+								            single_stream = 'none' in (dct.get('acodec'), dct.get('vcodec'))
 								            if single_stream and dct.get('ext'):
 								                dct['container'] = dct['ext'] + '_dash'
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 23:13:02 +05:30
-												[ie/youtube] Optimize playback wait times (#14124)

Authored by: bashonly
											
										
										
											2025-08-22 18:53:28 -05:00
+								            # For handling potential pre-playback required waiting period
 								            if live_status not in ('is_live', 'post_live'):
 								                dct['available_at'] = available_at
-												[extractor/youtube] Add extractor-arg `formats`

Closes #7417

											
										
										
											2023-06-25 20:10:00 +05:30
+								            if (all_formats or 'dashy' in format_types) and dct['filesize']:
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 23:13:02 +05:30
+								                yield {
 								                    **dct,
 								                    'format_id': f'{dct["format_id"]}-dashy' if all_formats else dct['format_id'],
-												[extractor/youtube] Construct dash formats with `range` query

Closes #6369

											
										
										
											2023-02-28 23:03:44 +05:30
+								                    'protocol': 'http_dash_segments',
-												Fix 2a23d92d9ec44a0168079e38bcf3d383e5c4c7bb

Closes #6517

											
										
										
											2023-03-12 14:46:09 +05:30
+								                    'fragments': build_fragments(dct),
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 23:13:02 +05:30
+								                }
-												[extractor/youtube] Add extractor-arg `formats`

Closes #7417

											
										
										
											2023-06-25 20:10:00 +05:30
+								            if all_formats or 'dashy' not in format_types:
 								                dct['downloader_options'] = {'http_chunk_size': CHUNK_SIZE}
 								                yield dct
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								        needs_live_processing = self._needs_live_processing(live_status, duration)
-												[extractor/youtube] Add extractor-arg `formats`

Closes #7417

											
										
										
											2023-06-25 20:10:00 +05:30
+								        skip_bad_formats = 'incomplete' not in format_types
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
 								        skip_manifests = set(self._configuration_arg('skip'))
-												[cleanup] Deprecate various options (#13821)

Closes #14198, Closes #12909
Authored by: seproDev
											
										
										
											2025-09-21 17:10:37 +02:00
+								        if (needs_live_processing == 'is_live'  # These will be filtered out by YoutubeDL anyway
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 16:29:30 +01:00
+								                or (needs_live_processing and skip_bad_formats)):
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            skip_manifests.add('hls')
-												[cleanup] Deprecate various options (#13821)

Closes #14198, Closes #12909
Authored by: seproDev
											
										
										
											2025-09-21 17:10:37 +02:00
+								        if skip_bad_formats and live_status == 'is_live' and needs_live_processing != 'is_live':
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            skip_manifests.add('dash')
-												Add `--extractor-args` to pass extractor-specific arguments

											
										
										
											2021-06-25 19:35:41 +05:30
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								        def process_manifest_format(f, proto, client_name, itag, missing_pot):
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-15 05:23:32 +05:30
+								            key = (proto, f.get('language'))
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 23:13:02 +05:30
+								            if not all_formats and key in itags[itag]:
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-15 05:23:32 +05:30
+								                return False
-												[ie/youtube] Optimize playback wait times (#14124)

Authored by: bashonly
											
										
										
											2025-08-22 18:53:28 -05:00
+								            # For handling potential pre-playback required waiting period
 								            if live_status not in ('is_live', 'post_live'):
 								                f['available_at'] = available_at
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								            if f.get('source_preference') is None:
 								                f['source_preference'] = -1
-												[ie/youtube] Deprioritize `web_safari` m3u8 formats (#14168)

Authored by: bashonly
											
										
										
											2025-08-27 17:31:51 -05:00
+								            # Deprioritize since its pre-merged m3u8 formats may have lower quality audio streams
 								            if client_name == 'web_safari' and proto == 'hls' and live_status != 'is_live':
 								                f['source_preference'] -= 1
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            if missing_pot:
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-24 12:03:28 +13:00
+								                f['format_note'] = join_nonempty(f.get('format_note'), 'MISSING POT', delim=' ')
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                f['source_preference'] -= 20
-												[ie/youtube] Fix DASH formats incorrectly skipped in some situations (#11910)

Closes https://github.com/yt-dlp/yt-dlp/issues/11907
Authored by: coletdjnz
											
										
										
											2024-12-26 14:19:17 +13:00
+								            itags[itag].add(key)
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 23:13:02 +05:30
+								            if itag and all_formats:
 								                f['format_id'] = f'{itag}-{proto}'
 								            elif any(p != proto for p, _ in itags[itag]):
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-15 05:23:32 +05:30
+								                f['format_id'] = f'{itag}-{proto}'
 								            elif itag:
-												[youtube] refactor itag processing

											
										
										
											2021-10-31 13:26:44 +05:30
+								                f['format_id'] = itag
-												[ie/youtube] Extract all formats from multi-language m3u8s (#9875)

Authored by: clienthax, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-06-20 22:54:53 +01:00
+								            if original_language and f.get('language') == original_language:
 								                f['format_note'] = join_nonempty(f.get('format_note'), '(default)', delim=' ')
 								                f['language_preference'] = PREFERRED_LANG_VALUE
-												[extractor/youtube] Add `ios` to default clients used

* IOS is affected neither by 403 or by nsig so helps mitigate them preemptively
* IOS also has higher bit-rate "premium" formats though they are not labeled as such

											
										
										
											2023-06-22 00:20:04 +05:30
+								            if itag in ('616', '235'):
 								                f['format_note'] = join_nonempty(f.get('format_note'), 'Premium', delim=' ')
-												[ie/youtube] Avoid false DRM detection (#7396)

Some master manifests contain a mix of DRM and non-DRM formats

											
										
										
											2023-06-23 18:16:07 +05:30
+								                f['source_preference'] += 100
-												[extractor/youtube] Add `ios` to default clients used

* IOS is affected neither by 403 or by nsig so helps mitigate them preemptively
* IOS also has higher bit-rate "premium" formats though they are not labeled as such

											
										
										
											2023-06-22 00:20:04 +05:30
-												[extractor/youtube] Fix bug in format sorting

											
										
										
											2022-08-21 00:56:27 +05:30
+								            f['quality'] = q(itag_qualities.get(try_get(f, lambda f: f['format_id'].split('-')[0]), -1))
-												[youtube] Improve format sorting for IOS formats

When no itag/resolution is available for reference, use the closest resolution

											
										
										
											2022-08-15 13:58:39 +05:30
+								            if f['quality'] == -1 and f.get('height'):
 								                f['quality'] = q(res_qualities[min(res_qualities, key=lambda x: abs(x - f['height']))])
-												[cleanup] Misc

Closes #6288, Closes #7197, Closes #7265, Closes #7353, Closes #5773
Authored by: mikf, freezboltz, pukkandan

											
										
										
											2023-06-21 09:21:20 +05:30
+								            if self.get_param('verbose') or all_formats:
-												[ie/youtube] Fix `format_note` (Bugfix for 3a3bd00037e9908e87da4fa9f2ad772aa34dc60e) (#11028)

Authored by: bashonly
											
										
										
											2024-09-24 17:12:02 -05:00
+								                f['format_note'] = join_nonempty(
 								                    f.get('format_note'), short_client_name(client_name), delim=', ')
-												[extractor/youtube] Ignore wrong fps of some formats

											
										
										
											2023-06-21 05:11:14 +05:30
+								            if f.get('fps') and f['fps'] <= 1:
 								                del f['fps']
-												[ie/youtube] Avoid false DRM detection (#7396)

Some master manifests contain a mix of DRM and non-DRM formats

											
										
										
											2023-06-23 18:16:07 +05:30
 								            if proto == 'hls' and f.get('has_drm'):
 								                f['has_drm'] = 'maybe'
 								                f['source_preference'] -= 5
-												[youtube] refactor itag processing

											
										
										
											2021-10-31 13:26:44 +05:30
+								            return True
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-26 03:33:42 +05:30
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-22 03:46:54 +05:30
+								        subtitles = {}
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        for sd in streaming_data:
-												[ie/youtube] Fix `format_note` (Bugfix for 3a3bd00037e9908e87da4fa9f2ad772aa34dc60e) (#11028)

Authored by: bashonly
											
										
										
											2024-09-24 17:12:02 -05:00
+								            client_name = sd[STREAMING_DATA_CLIENT_NAME]
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            fetch_pot_func = sd[STREAMING_DATA_FETCH_GVS_PO_TOKEN]
 								            is_premium_subscriber = sd[STREAMING_DATA_IS_PREMIUM_SUBSCRIBER]
 								            has_player_token = sd[STREAMING_DATA_PLAYER_TOKEN_PROVIDED]
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            hls_manifest_url = 'hls' not in skip_manifests and sd.get('hlsManifestUrl')
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-16 02:38:47 +12:00
+								            if hls_manifest_url:
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                pot_policy: GvsPoTokenPolicy = self._get_default_ytcfg(
 								                    client_name)['GVS_PO_TOKEN_POLICY'][StreamingProtocol.HLS]
 								                require_po_token = gvs_pot_required(pot_policy, is_premium_subscriber, has_player_token)
 								                po_token = gvs_pots.get(client_name, fetch_pot_func(required=require_po_token or pot_policy.recommended))
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                if po_token:
 								                    hls_manifest_url = hls_manifest_url.rstrip('/') + f'/pot/{po_token}'
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                    if client_name not in gvs_pots:
 								                        gvs_pots[client_name] = po_token
 								                if require_po_token and not po_token and 'missing_pot' not in self._configuration_arg('formats'):
 								                    self._report_pot_format_skipped(video_id, client_name, 'hls')
 								                else:
 								                    fmts, subs = self._extract_m3u8_formats_and_subtitles(
 								                        hls_manifest_url, video_id, 'mp4', fatal=False, live=live_status == 'is_live')
 								                    for sub in traverse_obj(subs, (..., ..., {dict})):
 								                        # TODO: If HLS video requires a PO Token, do the subs also require pot?
 								                        # Save client name for debugging
 								                        sub[STREAMING_DATA_CLIENT_NAME] = client_name
 								                    subtitles = self._merge_subtitles(subs, subtitles)
 								                    for f in fmts:
 								                        if process_manifest_format(f, 'hls', client_name, self._search_regex(
 								                                r'/itag/(\d+)', f['url'], 'itag', default=None), require_po_token and not po_token):
 								                            yield f
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            dash_manifest_url = 'dash' not in skip_manifests and sd.get('dashManifestUrl')
-												Add `--extractor-args` to pass extractor-specific arguments

											
										
										
											2021-06-25 19:35:41 +05:30
+								            if dash_manifest_url:
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                pot_policy: GvsPoTokenPolicy = self._get_default_ytcfg(
 								                    client_name)['GVS_PO_TOKEN_POLICY'][StreamingProtocol.DASH]
 								                require_po_token = gvs_pot_required(pot_policy, is_premium_subscriber, has_player_token)
 								                po_token = gvs_pots.get(client_name, fetch_pot_func(required=require_po_token or pot_policy.recommended))
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 12:51:58 +02:00
+								                if po_token:
 								                    dash_manifest_url = dash_manifest_url.rstrip('/') + f'/pot/{po_token}'
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                    if client_name not in gvs_pots:
 								                        gvs_pots[client_name] = po_token
 								                if require_po_token and not po_token and 'missing_pot' not in self._configuration_arg('formats'):
 								                    self._report_pot_format_skipped(video_id, client_name, 'dash')
 								                else:
 								                    formats, subs = self._extract_mpd_formats_and_subtitles(dash_manifest_url, video_id, fatal=False)
 								                    for sub in traverse_obj(subs, (..., ..., {dict})):
 								                        # TODO: If DASH video requires a PO Token, do the subs also require pot?
 								                        # Save client name for debugging
 								                        sub[STREAMING_DATA_CLIENT_NAME] = client_name
 								                    subtitles = self._merge_subtitles(subs, subtitles)  # Prioritize HLS subs over DASH
 								                    for f in formats:
 								                        if process_manifest_format(f, 'dash', client_name, f['format_id'], require_po_token and not po_token):
 								                            f['filesize'] = int_or_none(self._search_regex(
 								                                r'/clen/(\d+)', f.get('fragment_base_url') or f['url'], 'file size', default=None))
 								                            if needs_live_processing:
 								                                f['is_from_start'] = True
 								                            yield f
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-22 03:46:54 +05:30
+								        yield subtitles
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-17 01:26:23 +05:30
+								    def _extract_storyboard(self, player_responses, duration):
 								        spec = get_first(
 								            player_responses, ('storyboards', 'playerStoryboardSpecRenderer', 'spec'), default='').split('|')[::-1]
-												[youtube] Make invalid storyboard URL non-fatal

Closes #2382

											
										
										
											2022-01-19 18:09:52 +05:30
+								        base_url = url_or_none(urljoin('https://i.ytimg.com/', spec.pop() or None))
 								        if not base_url:
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-17 01:26:23 +05:30
+								            return
 								        L = len(spec) - 1
 								        for i, args in enumerate(spec):
 								            args = args.split('#')
 								            counts = list(map(int_or_none, args[:5]))
 								            if len(args) != 8 or not all(counts):
 								                self.report_warning(f'Malformed storyboard {i}: {"#".join(args)}{bug_reports_message()}')
 								                continue
 								            width, height, frame_count, cols, rows = counts
 								            N, sigh = args[6:]
 								            url = base_url.replace('$L', str(L - i)).replace('$N', N) + f'&sigh={sigh}'
 								            fragment_count = frame_count / (cols * rows)
 								            fragment_duration = duration / fragment_count
 								            yield {
 								                'format_id': f'sb{i}',
 								                'format_note': 'storyboard',
 								                'ext': 'mhtml',
 								                'protocol': 'mhtml',
 								                'acodec': 'none',
 								                'vcodec': 'none',
 								                'url': url,
 								                'width': width,
 								                'height': height,
-												[extractor/youtube] More metadata for storyboards (#4334)

Authored by: ftk
											
										
										
											2022-07-12 15:16:45 +00:00
+								                'fps': frame_count / duration,
 								                'rows': rows,
 								                'columns': cols,
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-17 01:26:23 +05:30
+								                'fragments': [{
-												[downloader/mhtml] Fix fragments with absolute urls (#3044)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:03:40 +13:00
+								                    'url': url.replace('$M', str(j)),
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-17 01:26:23 +05:30
+								                    'duration': min(fragment_duration, duration - (j * fragment_duration)),
 								                } for j in range(math.ceil(fragment_count))],
 								            }
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								    def _download_initial_webpage(self, webpage_url, webpage_client, video_id):
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 07:26:41 +00:00
+								        webpage = None
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								        if webpage_url and 'webpage' not in self._configuration_arg('player_skip'):
-												[extractor/youtube] Use device-specific user agent (#4770)

Thwart latest fingerprinting attempt (see https://github.com/iv-org/invidious/issues/3230#issuecomment-1226887639)

Authored by: coletdjnz
											
										
										
											2022-08-28 22:59:54 +00:00
+								            query = {'bpctr': '9999999999', 'has_verified': '1'}
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            pp = (
 								                self._configuration_arg('player_params', [None], casesense=True)[0]
 								                or traverse_obj(INNERTUBE_CLIENTS, (webpage_client, 'PLAYER_PARAMS', {str}))
 								            )
-												[ie/youtube] Add `player_params` extractor arg (#7719)

Authored by: coletdjnz
											
										
										
											2023-07-29 18:20:42 +12:00
+								            if pp:
 								                query['pp'] = pp
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            webpage = self._download_webpage_with_retries(
 								                webpage_url, video_id, query=query,
 								                headers=traverse_obj(self._get_default_ytcfg(webpage_client), {
 								                    'User-Agent': ('INNERTUBE_CONTEXT', 'client', 'userAgent', {str}),
 								                }))
 								        return webpage
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
-												[youtube] Avoid false positives when detecting damaged formats

Closes #3083

											
										
										
											2022-03-16 19:46:19 +05:30
+								    def _list_formats(self, video_id, microformats, video_details, player_responses, player_url, duration=None):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								        live_broadcast_details = traverse_obj(microformats, (..., 'liveBroadcastDetails'))
 								        is_live = get_first(video_details, 'isLive')
 								        if is_live is None:
 								            is_live = get_first(live_broadcast_details, 'isLiveNow')
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								        live_content = get_first(video_details, 'isLiveContent')
 								        is_upcoming = get_first(video_details, 'isUpcoming')
 								        post_live = get_first(video_details, 'isPostLiveDvr')
 								        live_status = ('post_live' if post_live
 								                       else 'is_live' if is_live
 								                       else 'is_upcoming' if is_upcoming
-												[extractor/youtube] Fix live_status

Bug in 4d37720a0c5f1c9c4768ea20b0f943277f55bc12

											
										
										
											2022-10-14 07:41:53 +05:30
+								                       else 'was_live' if live_content
 								                       else 'not_live' if False in (is_live, live_content)
 								                       else None)
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								        streaming_data = traverse_obj(player_responses, (..., 'streamingData'))
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								        *formats, subtitles = self._extract_formats_and_subtitles(streaming_data, video_id, player_url, live_status, duration)
-												[ie/youtube] Avoid false DRM detection (#7396)

Some master manifests contain a mix of DRM and non-DRM formats

											
										
										
											2023-06-23 18:16:07 +05:30
+								        if all(f.get('has_drm') for f in formats):
 								            # If there are no formats that definitely don't have DRM, all have DRM
 								            for f in formats:
 								                f['has_drm'] = True
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								        return live_broadcast_details, live_status, streaming_data, formats, subtitles
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								    def _download_initial_data(self, video_id, webpage, webpage_client, webpage_ytcfg):
 								        # Obtain the "initial data" for the video, first from the downloaded webpage
 								        # and, failing that, from the `next` API endpoint.
 								        # Returns the initial data; the result may be None when both sources are
 								        # skipped or produce nothing.
 								        initial_data = None
 								        # The embedded data is only read when a webpage is available and the
 								        # `webpage_skip` configuration arg does not contain 'initial_data'
 								        if webpage and 'initial_data' not in self._configuration_arg('webpage_skip'):
 								            initial_data = self.extract_yt_initial_data(video_id, webpage, fatal=False)
 								            # Embedded data without 'contents' is discarded (with a warning) so that
 								            # the API request below gets a chance to run
 								            if not traverse_obj(initial_data, 'contents'):
 								                self.report_warning('Incomplete data received in embedded initial data; re-fetching using API.')
 								                initial_data = None
 								        # API fallback; not attempted when the `player_skip` configuration arg
 								        # contains 'initial_data'
 								        if not initial_data and 'initial_data' not in self._configuration_arg('player_skip'):
 								            query = {'videoId': video_id}
 								            query.update(self._get_checkok_params())
 								            # NOTE(review): fatal=False presumably makes a failed request return
 								            # a falsy value instead of raising - confirm in _extract_response
 								            initial_data = self._extract_response(
 								                item_id=video_id, ep='next', fatal=False,
 								                ytcfg=webpage_ytcfg, query=query, check_get_keys='contents',
 								                note='Downloading initial data API JSON', default_client=webpage_client)
 								        return initial_data
 								    def _is_premium_subscriber(self, initial_data):
 								        # Report whether `initial_data` indicates a YouTube Premium subscription.
 								        # Always False when the session is not authenticated or there is no initial data.
 								        if not self.is_authenticated or not initial_data:
 								            return False
 								        # The decision is based on the logo renderer of the desktop top bar
 								        tlr = traverse_obj(
 								            initial_data, ('topbar', 'desktopTopbarRenderer', 'logo', 'topbarLogoRenderer'))
 								        # Premium if the logo icon type is 'YOUTUBE_PREMIUM_LOGO', or if the logo's
 								        # tooltip text contains 'premium' (compared after lowercasing)
 								        return (
 								            traverse_obj(tlr, ('iconImage', 'iconType')) == 'YOUTUBE_PREMIUM_LOGO'
 								            or 'premium' in (self._get_text(tlr, 'tooltipText') or '').lower()
 								        )
 								    def _initial_extract(self, url, smuggled_data, webpage_url, webpage_client, video_id):
 								        # Run the initial extraction steps in order: webpage, ytcfg, initial data,
 								        # Premium detection and player responses.
 								        # Returns the tuple (webpage, webpage_ytcfg, initial_data,
 								        # is_premium_subscriber, player_responses, player_url).
 								        # This function is also used by live-from-start refresh
 								        webpage = self._download_initial_webpage(webpage_url, webpage_client, video_id)
 								        # Fall back to the default ytcfg of the webpage client when extract_ytcfg
 								        # returns nothing usable for the webpage
 								        webpage_ytcfg = self.extract_ytcfg(video_id, webpage) or self._get_default_ytcfg(webpage_client)
 								        initial_data = self._download_initial_data(video_id, webpage, webpage_client, webpage_ytcfg)
 								        is_premium_subscriber = self._is_premium_subscriber(initial_data)
 								        if is_premium_subscriber:
 								            self.write_debug('Detected YouTube Premium subscription')
 								        # The Premium flag is passed both to the client selection and to the
 								        # player response extraction
 								        player_responses, player_url = self._extract_player_responses(
 								            self._get_requested_clients(url, smuggled_data, is_premium_subscriber),
 								            video_id, webpage, webpage_client, webpage_ytcfg, is_premium_subscriber)
 								        return webpage, webpage_ytcfg, initial_data, is_premium_subscriber, player_responses, player_url
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								    def _real_extract(self, url):
 								        url, smuggled_data = unsmuggle_url(url, {})
 								        video_id = self._match_id(url)
 								        base_url = self.http_scheme() + '//www.youtube.com/'
 								        webpage_url = base_url + 'watch?v=' + video_id
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								        webpage_client = 'web'
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								        webpage, webpage_ytcfg, initial_data, is_premium_subscriber, player_responses, player_url = self._initial_extract(
 								            url, smuggled_data, webpage_url, webpage_client, video_id)
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        playability_statuses = traverse_obj(
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								            player_responses, (..., 'playabilityStatus'), expected_type=dict)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
 								        trailer_video_id = get_first(
 								            playability_statuses,
 								            ('errorScreen', 'playerLegacyDesktopYpcTrailerRenderer', 'trailerVideoId'),
 								            expected_type=str)
 								        if trailer_video_id:
 								            return self.url_result(
 								                trailer_video_id, self.ie_key(), trailer_video_id)
 								        search_meta = ((lambda x: self._html_search_meta(x, webpage, default=None))
 								                       if webpage else (lambda x: None))
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								        video_details = traverse_obj(player_responses, (..., 'videoDetails'), expected_type=dict)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        microformats = traverse_obj(
 								            player_responses, (..., 'microformat', 'playerMicroformatRenderer'),
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								            expected_type=dict)
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 05:16:46 +00:00
-												[ie/youtube] Extract title and description from initial data (#14078)

Closes #13604
Authored by: bashonly
											
										
										
											2025-08-19 14:27:17 -05:00
+								        # Fallbacks in case player responses are missing metadata
 								        initial_sdcr = traverse_obj(initial_data, (
 								            'engagementPanels', ..., 'engagementPanelSectionListRenderer',
 								            'content', 'structuredDescriptionContentRenderer', {dict}, any))
 								        initial_description = traverse_obj(initial_sdcr, (
 								            'items', ..., 'expandableVideoDescriptionBodyRenderer',
 								            'attributedDescriptionBodyText', 'content', {str}, any))
 								        # videoDescriptionHeaderRenderer also has publishDate/channel/handle/ucid, but not needed
 								        initial_vdhr = traverse_obj(initial_sdcr, (
 								            'items', ..., 'videoDescriptionHeaderRenderer', {dict}, any)) or {}
 								        initial_video_details_renderer = traverse_obj(initial_data, (
 								            'playerOverlays', 'playerOverlayRenderer', 'videoDetails',
 								            'playerOverlayVideoDetailsRenderer', {dict})) or {}
 								        initial_title = (
 								            self._get_text(initial_vdhr, 'title')
 								            or self._get_text(initial_video_details_renderer, 'title'))
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 05:16:46 +00:00
+								        translated_title = self._get_text(microformats, (..., 'title'))
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 16:29:30 +01:00
+								        video_title = ((self._preferred_lang and translated_title)
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 05:16:46 +00:00
+								                       or get_first(video_details, 'title')  # primary
 								                       or translated_title
 								                       or search_meta(['og:title', 'twitter:title', 'title']))
-												[ie/youtube] Extract title and description from initial data (#14078)

Closes #13604
Authored by: bashonly
											
										
										
											2025-08-19 14:27:17 -05:00
+								        if not video_title and initial_title:
 								            self.report_warning(
 								                'No title found in player responses; falling back to title from initial data. '
 								                'Other metadata may also be missing')
 								            video_title = initial_title
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 05:16:46 +00:00
+								        translated_description = self._get_text(microformats, (..., 'description'))
 								        original_description = get_first(video_details, 'shortDescription')
 								        video_description = (
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 16:29:30 +01:00
+								            (self._preferred_lang and translated_description)
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 05:16:46 +00:00
+								            # If original description is blank, it will be an empty string.
 								            # Do not prefer translated description in this case.
 								            or original_description if original_description is not None else translated_description)
-												[ie/youtube] Extract title and description from initial data (#14078)

Closes #13604
Authored by: bashonly
											
										
										
											2025-08-19 14:27:17 -05:00
+								        if video_description is None:
 								            video_description = initial_description
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 16:27:34 +05:30
+								        multifeed_metadata_list = get_first(
 								            player_responses,
 								            ('multicamera', 'playerLegacyMulticameraRenderer', 'metadataList'),
 								            expected_type=str)
 								        if multifeed_metadata_list and not smuggled_data.get('force_singlefeed'):
 								            if self.get_param('noplaylist'):
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                self.to_screen(f'Downloading just video {video_id} because of --no-playlist')
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 16:27:34 +05:30
+								            else:
 								                entries = []
 								                feed_ids = []
 								                for feed in multifeed_metadata_list.split(','):
 								                    # Unquote should take place before split on comma (,) since textual
 								                    # fields may contain comma as well (see
 								                    # https://github.com/ytdl-org/youtube-dl/issues/8536)
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 16:24:43 +05:30
+								                    feed_data = urllib.parse.parse_qs(
-												[compat] Remove more functions

Removing any more will require changes to a large number of extractors

											
										
										
											2022-06-24 13:40:17 +05:30
+								                        urllib.parse.unquote_plus(feed))
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 16:27:34 +05:30
 								                    def feed_entry(name):
 								                        return try_get(
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 16:24:43 +05:30
+								                            feed_data, lambda x: x[name][0], str)
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 16:27:34 +05:30
 								                    feed_id = feed_entry('id')
 								                    if not feed_id:
 								                        continue
 								                    feed_title = feed_entry('title')
 								                    title = video_title
 								                    if feed_title:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                        title += f' ({feed_title})'
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 16:27:34 +05:30
+								                    entries.append({
 								                        '_type': 'url_transparent',
 								                        'ie_key': 'Youtube',
 								                        'url': smuggle_url(
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                            '{}watch?v={}'.format(base_url, feed_data['id'][0]),
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 16:27:34 +05:30
+								                            {'force_singlefeed': True}),
 								                        'title': title,
 								                    })
 								                    feed_ids.append(feed_id)
 								                self.to_screen(
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                    'Downloading multifeed video ({}) - add --no-playlist to just download video {}'.format(
 								                        ', '.join(feed_ids), video_id))
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 16:27:34 +05:30
+								                return self.playlist_result(
 								                    entries, video_id, video_title, video_description)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
-												[extractor/youtube] Fix `duration` for premieres (#5382)

Closes #5378
Authored by: nosoop
											
										
										
											2022-10-28 11:30:33 -07:00
+								        duration = (int_or_none(get_first(video_details, 'lengthSeconds'))
 								                    or int_or_none(get_first(microformats, 'lengthSeconds'))
 								                    or parse_duration(search_meta('duration')) or None)
-												[youtube] Avoid false positives when detecting damaged formats

Closes #3083

											
										
										
											2022-03-16 19:46:19 +05:30
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								        live_broadcast_details, live_status, streaming_data, formats, automatic_captions = \
 								            self._list_formats(video_id, microformats, video_details, player_responses, player_url, duration)
 								        if live_status == 'post_live':
 								            self.write_debug(f'{video_id}: Video is in Post-Live Manifestless mode')
-												[youtube] Quick extraction tempfix (closes #22367, closes #22163)

											
										
										
											2019-09-11 22:44:47 +07:00
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        if not formats:
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								            if not self.get_param('allow_unplayable_formats') and traverse_obj(streaming_data, (..., 'licenseInfos')):
-												[extractor] Better error message for DRM (#729)

Closes #636
											
										
										
											2021-08-23 01:38:38 +05:30
+								                self.report_drm(video_id)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								            pemr = get_first(
 								                playability_statuses,
 								                ('errorScreen', 'playerErrorMessageRenderer'), expected_type=dict) or {}
 								            reason = self._get_text(pemr, 'reason') or get_first(playability_statuses, 'reason')
 								            subreason = clean_html(self._get_text(pemr, 'subreason') or '')
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            if subreason:
-												[ie/youtube] Fix geo-restriction error handling (#13217)

Authored by: yozel
											
										
										
											2025-05-20 23:39:27 +02:00
+								                if subreason.startswith('The uploader has not made this video available in your country'):
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								                    countries = get_first(microformats, 'availableCountries')
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                    if not countries:
 								                        regions_allowed = search_meta('regionsAllowed')
 								                        countries = regions_allowed.split(',') if regions_allowed else None
-												Add option `--ignore-no-formats-error`
* Ignores the "no video format" and similar errors
* Experimental - Some extractors may still throw these errors

											
										
										
											2021-04-17 05:39:58 +05:30
+								                    self.raise_geo_restricted(subreason, countries, metadata_available=True)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								                reason += f'. {subreason}'
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            if reason:
-												[ie/youtube] Remove broken OAuth support (#11558)

Closes #11462
Authored by: bashonly
											
										
										
											2024-11-16 23:40:21 +00:00
+								                if 'sign in' in reason.lower():
 								                    reason = remove_end(reason, 'This helps protect our community. Learn more')
 								                    reason = f'{remove_end(reason.strip(), ".")}. {self._youtube_login_hint}'
-												[ie/youtube] Add warning on video captcha challenge (#12939)

Authored by: coletdjnz
											
										
										
											2025-04-18 11:40:39 +12:00
+								                elif get_first(playability_statuses, ('errorScreen', 'playerCaptchaViewModel', {dict})):
 								                    reason += '. YouTube is requiring a captcha challenge before playback'
-												[ie/youtube] Add context to video request rate limit error (#12958)

Related: https://github.com/yt-dlp/yt-dlp/issues/11426

Authored by: coletdjnz
											
										
										
											2025-04-25 16:11:07 +12:00
+								                elif "This content isn't available, try again later" in reason:
 								                    reason = (
 								                        f'{remove_end(reason.strip(), ".")}. {"Your account" if self.is_authenticated else "The current session"} '
 								                        f'has been rate-limited by YouTube for up to an hour. It is recommended to use `-t sleep` to add a delay '
 								                        f'between video requests to avoid exceeding the rate limit. For more information, refer to  '
 								                        f'https://github.com/yt-dlp/yt-dlp/wiki/Extractors#this-content-isnt-available-try-again-later'
 								                    )
-												Add option `--ignore-no-formats-error`
* Ignores the "no video format" and similar errors
* Experimental - Some extractors may still throw these errors

											
										
										
											2021-04-17 05:39:58 +05:30
+								                self.raise_no_formats(reason, expected=True)
-												[youtube] Quick extraction tempfix (closes #22367, closes #22163)

											
										
										
											2019-09-11 22:44:47 +07:00
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        keywords = get_first(video_details, 'keywords', expected_type=list) or []
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        if not keywords and webpage:
 								            keywords = [
 								                unescapeHTML(m.group('content'))
 								                for m in re.finditer(self._meta_regex('og:video:tag'), webpage)]
 								        for keyword in keywords:
 								            if keyword.startswith('yt:stretch='):
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-17 08:32:33 +05:30
+								                mobj = re.search(r'(\d+)\s*:\s*(\d+)', keyword)
 								                if mobj:
 								                    # NB: float is intentional for forcing float division
 								                    w, h = (float(v) for v in mobj.groups())
 								                    if w > 0 and h > 0:
 								                        ratio = w / h
 								                        for f in formats:
 								                            if f.get('vcodec') != 'none':
 								                                f['stretched_ratio'] = ratio
 								                        break
-												[youtube:tab] Extract video thumbnails from playlist (#2096)

closes #1184
Co-Authored-by: coletdjnz, pukkandan
											
										
										
											2021-12-24 03:42:02 +00:00
+								        thumbnails = self._extract_thumbnails((video_details, microformats), (..., ..., 'thumbnail'))
-												[youtube] Always extract `maxresdefault` thumbnail
Fixes: https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-05-18 19:15:11 +05:30
+								        thumbnail_url = search_meta(['og:image', 'twitter:image'])
 								        if thumbnail_url:
 								            thumbnails.append({
 								                'url': thumbnail_url,
 								            })
-												[youtube] Populate `thumbnail` with the best "known" thumbnail
Closes #402, Related: https://github.com/yt-dlp/yt-dlp/issues/340#issuecomment-950290624

											
										
										
											2021-10-24 14:55:28 +05:30
+								        original_thumbnails = thumbnails.copy()
-												[youtube] Extract more thumbnails

* The thumbnail URLs are hard-coded and their actual existence is tested lazily
* Added option `--no-check-formats` to not test them

Closes #340, Related: #402, #337, https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-07-15 22:49:59 +05:30
+								        # The best resolution thumbnails sometimes do not appear in the webpage
-												[youtube] De-prioritize auto-generated thumbnails

Closes #3112

											
										
										
											2022-04-29 00:31:34 +05:30
+								        # See: https://github.com/yt-dlp/yt-dlp/issues/340
-												[youtube] Extract even more thumbnails and reduce testing

* Also fix bug where `_test_url` was being ignored

Ref: https://stackoverflow.com/a/20542029
Related: #340

											
										
										
											2021-07-20 03:40:35 +05:30
+								        # List of possible thumbnails - Ref: <https://stackoverflow.com/a/20542029>
-												Do not verify thumbnail URLs by default

Partially reverts cca80fe6110653582e8c8a8d06490b4028ffd755 and 0ba692acc8feffd46b6e1085fb4a2849b685945c

Unless `--check-formats` is specified, this causes yt-dlp to return incorrect thumbnail urls.
See https://github.com/yt-dlp/yt-dlp/issues/340#issuecomment-877909966, #402

But the overhead in general use is not worth it

Closes #694, #725

											
										
										
											2021-10-18 15:23:42 +05:30
+								        thumbnail_names = [
-												[cleanup] Fix some typos (#4194)

Authored by: crazymoose77756
											
										
										
											2022-06-26 20:50:06 -04:00
+								            # While the *1,*2,*3 thumbnails are just below their corresponding "*default" variants
-												[youtube] De-prioritize auto-generated thumbnails

Closes #3112

											
										
										
											2022-04-29 00:31:34 +05:30
+								            # in resolution, these are not the custom thumbnail. So de-prioritize them
 								            'maxresdefault', 'hq720', 'sddefault', 'hqdefault', '0', 'mqdefault', 'default',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            'sd1', 'sd2', 'sd3', 'hq1', 'hq2', 'hq3', 'mq1', 'mq2', 'mq3', '1', '2', '3',
-												[youtube] Extract even more thumbnails and reduce testing

* Also fix bug where `_test_url` was being ignored

Ref: https://stackoverflow.com/a/20542029
Related: #340

											
										
										
											2021-07-20 03:40:35 +05:30
+								        ]
 								        n_thumbnail_names = len(thumbnail_names)
-												[youtube] Extract more thumbnails

* The thumbnail URLs are hard-coded and their actual existence is tested lazily
* Added option `--no-check-formats` to not test them

Closes #340, Related: #402, #337, https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-07-15 22:49:59 +05:30
+								        thumbnails.extend({
 								            'url': 'https://i.ytimg.com/vi{webp}/{video_id}/{name}{live}.{ext}'.format(
 								                video_id=video_id, name=name, ext=ext,
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								                webp='_webp' if ext == 'webp' else '', live='_live' if live_status == 'is_live' else ''),
-												[youtube] Extract even more thumbnails and reduce testing

* Also fix bug where `_test_url` was being ignored

Ref: https://stackoverflow.com/a/20542029
Related: #340

											
										
										
											2021-07-20 03:40:35 +05:30
+								        } for name in thumbnail_names for ext in ('webp', 'jpg'))
-												[youtube] Extract more thumbnails

* The thumbnail URLs are hard-coded and their actual existence is tested lazily
* Added option `--no-check-formats` to not test them

Closes #340, Related: #402, #337, https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-07-15 22:49:59 +05:30
+								        for thumb in thumbnails:
-												[youtube] Extract even more thumbnails and reduce testing

* Also fix bug where `_test_url` was being ignored

Ref: https://stackoverflow.com/a/20542029
Related: #340

											
										
										
											2021-07-20 03:40:35 +05:30
+								            i = next((i for i, t in enumerate(thumbnail_names) if f'/{video_id}/{t}' in thumb['url']), n_thumbnail_names)
-												[youtube] Extract more thumbnails

* The thumbnail URLs are hard-coded and their actual existence is tested lazily
* Added option `--no-check-formats` to not test them

Closes #340, Related: #402, #337, https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-07-15 22:49:59 +05:30
+								            thumb['preference'] = (0 if '.webp' in thumb['url'] else -1) - (2 * i)
-												[youtube] Always extract `maxresdefault` thumbnail
Fixes: https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-05-18 19:15:11 +05:30
+								        self._remove_duplicate_formats(thumbnails)
-												[youtube] Populate `thumbnail` with the best "known" thumbnail
Closes #402, Related: https://github.com/yt-dlp/yt-dlp/issues/340#issuecomment-950290624

											
										
										
											2021-10-24 14:55:28 +05:30
+								        self._downloader._sort_thumbnails(original_thumbnails)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 20:45:45 +05:30
+								        category = get_first(microformats, 'category') or search_meta('genre')
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 07:58:36 +00:00
+								        channel_id = self.ucid_or_none(str_or_none(
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 20:45:45 +05:30
+								            get_first(video_details, 'channelId')
 								            or get_first(microformats, 'externalChannelId')
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 07:58:36 +00:00
+								            or search_meta('channelId')))
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 20:45:45 +05:30
+								        owner_profile_url = get_first(microformats, 'ownerProfileUrl')
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								        live_start_time = parse_iso8601(get_first(live_broadcast_details, 'startTimestamp'))
 								        live_end_time = parse_iso8601(get_first(live_broadcast_details, 'endTimestamp'))
 								        if not duration and live_end_time and live_start_time:
 								            duration = live_end_time - live_start_time
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								        needs_live_processing = self._needs_live_processing(live_status, duration)
 								        def is_bad_format(fmt):
 								            # Predicate for the filter() loop that follows: formats matched here get their
 								            # preference lowered by 10 and a '(Last 2 hours)' format note appended.
 								            # Returns True on a match; otherwise falls through and returns None (falsy).
 								            # Reads `needs_live_processing` and `live_status` from the enclosing scope.

 								            # Case 1: live processing is needed, but this format is not marked `is_from_start`
 								            if needs_live_processing and not fmt.get('is_from_start'):
 								                return True
 								            # Case 2: the video is currently live, `needs_live_processing` is anything other
 								            # than 'is_live', and the format uses the 'http_dash_segments' protocol
 								            elif (live_status == 'is_live' and needs_live_processing != 'is_live'
 								                    and fmt.get('protocol') == 'http_dash_segments'):
 								                return True
 								        for fmt in filter(is_bad_format, formats):
 								            fmt['preference'] = (fmt.get('preference') or -1) - 10
-												[extractor/youtube] Process `post_live` over 2 hours

											
										
										
											2023-06-26 07:25:47 +05:30
+								            fmt['format_note'] = join_nonempty(fmt.get('format_note'), '(Last 2 hours)', delim=' ')
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
 								        if needs_live_processing:
 								            self._prepare_live_from_start_formats(
 								                formats, video_id, live_start_time, url, webpage_url, smuggled_data, live_status == 'is_live')
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 20:45:45 +05:30
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-17 01:26:23 +05:30
+								        formats.extend(self._extract_storyboard(player_responses, duration))
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 07:58:36 +00:00
+								        channel_handle = self.handle_from_url(owner_profile_url)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        info = {
 								            'id': video_id,
-												[extractor] Standardize `_live_title`

											
										
										
											2021-12-15 21:30:46 +05:30
+								            'title': video_title,
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            'formats': formats,
 								            'thumbnails': thumbnails,
-												[youtube] Populate `thumbnail` with the best "known" thumbnail
Closes #402, Related: https://github.com/yt-dlp/yt-dlp/issues/340#issuecomment-950290624

											
										
										
											2021-10-24 14:55:28 +05:30
+								            # The best thumbnail that we are sure exists. Prevents unnecessary
 								            # URL checking if the user doesn't care about getting the best possible thumbnail
 								            'thumbnail': traverse_obj(original_thumbnails, (-1, 'url')),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            'description': video_description,
 								            'channel_id': channel_id,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 07:58:36 +00:00
+								            'channel_url': format_field(channel_id, None, 'https://www.youtube.com/channel/%s', default=None),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            'duration': duration,
 								            'view_count': int_or_none(
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								                get_first((video_details, microformats), (..., 'viewCount'))
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                or search_meta('interactionCount')),
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								            'average_rating': float_or_none(get_first(video_details, 'averageRating')),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            'age_limit': 18 if (
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								                get_first(microformats, 'isFamilySafe') is False
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                or search_meta('isFamilyFriendly') == 'false'
 								                or search_meta('og:restrictions:age') == '18+') else 0,
 								            'webpage_url': webpage_url,
 								            'categories': [category] if category else None,
 								            'tags': keywords,
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								            'playable_in_embed': get_first(playability_statuses, 'playableInEmbed'),
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								            'live_status': live_status,
-												[ie/youtube] Extract `media_type` for all videos (#13136)

Authored by: bashonly
											
										
										
											2025-05-10 17:33:57 -05:00
+								            'media_type': (
 								                'livestream' if get_first(video_details, 'isLiveContent')
 								                else 'short' if get_first(microformats, 'isShortsEligible')
 								                else 'video'),
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 15:06:46 +09:00
+								            'release_timestamp': live_start_time,
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								            '_format_sort_fields': (  # source_preference is lower for potentially damaged formats
-												[core] Prioritize AV1 (#11153)

Authored by: seproDev
											
										
										
											2024-11-03 20:39:10 +01:00
+								                'quality', 'res', 'fps', 'hdr:12', 'source', 'vcodec', 'channels', 'acodec', 'lang', 'proto'),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        }
-												[youtube] Fix thumbnails extraction and remove uploader id extraction warning (closes #25676)

											
										
										
											2020-06-16 02:29:04 +07:00
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								        def get_lang_code(track):
 								            # Prefer the track's `vssId` with its leading '.' removed and any remaining '.'
 								            # replaced by '-'; if that is missing or empty, fall back to `languageCode`
 								            return (remove_start(track.get('vssId') or '', '.').replace('.', '-')
 								                    or track.get('languageCode'))
 								        def process_language(container, base_url, lang_code, sub_name, client_name, query):
 								            lang_subs = container.setdefault(lang_code, [])
 								            for fmt in self._SUBTITLE_FORMATS:
-												[ie/youtube] Fix subtitles extraction (#13659)

Fixes regression introduced in 2ba5391cd68ed4f2415c827d2cecbcbc75ace10b

Closes #13654
Authored by: bashonly
											
										
										
											2025-07-06 17:07:21 -05:00
+								                # xosf=1 results in undesirable text position data for vtt, json3 & srv* subtitles
 								                # See: https://github.com/yt-dlp/yt-dlp/issues/13654
 								                query = {**query, 'fmt': fmt, 'xosf': []}
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                lang_subs.append({
 								                    'ext': fmt,
 								                    'url': urljoin('https://www.youtube.com', update_url_query(base_url, query)),
 								                    'name': sub_name,
-												[ie/youtube] Use impersonation for downloading subtitles (#13786)

Closes #13770
Authored by: bashonly
											
										
										
											2025-07-20 18:22:04 -05:00
+								                    'impersonate': True,
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                    STREAMING_DATA_CLIENT_NAME: client_name,
 								                })
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-22 03:46:54 +05:30
+								        subtitles = {}
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								        skipped_subs_clients = set()
-												[ie/youtube] Fix automatic captions for some client combinations (#13268)

Fix 32ed5f107c6c641958d1cd2752e130de4db55a13

Authored by: bashonly
											
										
										
											2025-05-22 17:41:31 -05:00
+								        # Only web/mweb clients provide translationLanguages, so include initial_pr in the traversal
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								        translation_languages = {
-												[ie/youtube] Fix automatic captions for some client combinations (#13268)

Fix 32ed5f107c6c641958d1cd2752e130de4db55a13

Authored by: bashonly
											
										
										
											2025-05-22 17:41:31 -05:00
+								            lang['languageCode']: self._get_text(lang['languageName'], max_runs=1)
 								            for lang in traverse_obj(player_responses, (
 								                ..., 'captions', 'playerCaptionsTracklistRenderer', 'translationLanguages',
 								                lambda _, v: v['languageCode'] and v['languageName']))
 								        }
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								        # NB: Constructing the full subtitle dictionary is slow
 								        get_translated_subs = 'translated_subs' not in self._configuration_arg('skip') and (
 								            self.get_param('writeautomaticsub', False) or self.get_param('listsubtitles'))
-												[ie/youtube] Fix automatic captions for some client combinations (#13268)

Fix 32ed5f107c6c641958d1cd2752e130de4db55a13

Authored by: bashonly
											
										
										
											2025-05-22 17:41:31 -05:00
+								        # Filter out initial_pr which does not have streamingData (smuggled client context)
 								        prs = traverse_obj(player_responses, (
 								            lambda _, v: v['streamingData'] and v['captions']['playerCaptionsTracklistRenderer']))
 								        all_captions = traverse_obj(prs, (
 								            ..., 'captions', 'playerCaptionsTracklistRenderer', 'captionTracks', ..., {dict}))
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								        need_subs_langs = {get_lang_code(sub) for sub in all_captions if sub.get('kind') != 'asr'}
 								        need_caps_langs = {
 								            remove_start(get_lang_code(sub), 'a-')
 								            for sub in all_captions if sub.get('kind') == 'asr'}
 								        for pr in prs:
 								            pctr = pr['captions']['playerCaptionsTracklistRenderer']
 								            client_name = pr['streamingData'][STREAMING_DATA_CLIENT_NAME]
 								            innertube_client_name = pr['streamingData'][STREAMING_DATA_INNERTUBE_CONTEXT]['client']['clientName']
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								            pot_policy: GvsPoTokenPolicy = self._get_default_ytcfg(client_name)['SUBS_PO_TOKEN_POLICY']
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								            fetch_subs_po_token_func = pr['streamingData'][STREAMING_DATA_FETCH_SUBS_PO_TOKEN]
 								            pot_params = {}
 								            already_fetched_pot = False
 								            for caption_track in traverse_obj(pctr, ('captionTracks', lambda _, v: v['baseUrl'])):
 								                base_url = caption_track['baseUrl']
 								                qs = parse_qs(base_url)
 								                lang_code = get_lang_code(caption_track)
 								                requires_pot = (
 								                    # We can detect the experiment for now
 								                    any(e in traverse_obj(qs, ('exp', ...)) for e in ('xpe', 'xpv'))
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                    or (pot_policy.required and not (pot_policy.not_required_for_premium and is_premium_subscriber)))
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
 								                if not already_fetched_pot:
 								                    already_fetched_pot = True
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								                    if subs_po_token := fetch_subs_po_token_func(required=requires_pot or pot_policy.recommended):
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                        pot_params.update({
 								                            'pot': subs_po_token,
 								                            'potc': '1',
 								                            'c': innertube_client_name,
 								                        })
 								                if not pot_params and requires_pot:
 								                    skipped_subs_clients.add(client_name)
 								                    self._report_pot_subtitles_skipped(video_id, client_name)
 								                    break
-												[youtube] Move metadata extraction after video availability check

											
										
										
											2018-06-03 02:08:38 +07:00
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                orig_lang = qs.get('lang', [None])[-1]
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 12:03:56 +05:30
+								                lang_name = self._get_text(caption_track, 'name', max_runs=1)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                if caption_track.get('kind') != 'asr':
 								                    if not lang_code:
 								                        continue
 								                    process_language(
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                        subtitles, base_url, lang_code, lang_name, client_name, pot_params)
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 12:03:56 +05:30
+								                    if not caption_track.get('isTranslatable'):
 								                        continue
-												[youtube] Fix subtitles only being extracted from the first client
Closes #547

											
										
										
											2021-07-23 09:37:15 +05:30
+								                for trans_code, trans_name in translation_languages.items():
 								                    if not trans_code:
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                        continue
-												[youtube] Fix auto-translated automatic captions

d49669acad71f640ffd8b78f0ea7911ae1f67720 only covered ASR

Closes #2956

											
										
										
											2022-03-27 14:06:26 +05:30
+								                    orig_trans_code = trans_code
-												[extractor/youtube] Subtitles cannot be translated to `und`


Closes #5674

											
										
										
											2022-11-30 05:17:45 +05:30
+								                    if caption_track.get('kind') != 'asr' and trans_code != 'und':
-												[extractor/youtube] Parse translated subtitles only when requested

Closes #4274

											
										
										
											2022-07-18 04:19:43 +05:30
+								                        if not get_translated_subs:
-												[youtube] Add extractor-arg to skip auto-translated subs

											
										
										
											2022-03-27 14:04:20 +05:30
+								                            continue
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 12:03:56 +05:30
+								                        trans_code += f'-{lang_code}'
-												[cleanup, utils] Don't use kwargs for `format_field`

											
										
										
											2022-06-18 07:30:12 +05:30
+								                        trans_name += format_field(lang_name, None, ' from %s')
-												[youtube] Fix auto-translated automatic captions

d49669acad71f640ffd8b78f0ea7911ae1f67720 only covered ASR

Closes #2956

											
										
										
											2022-03-27 14:06:26 +05:30
+								                    if lang_code == f'a-{orig_trans_code}':
-												[extractor/youtube] Determine audio language using automatic captions

											
										
										
											2023-06-14 19:08:46 +05:30
+								                        # Set audio language based on original subtitles
 								                        for f in formats:
 								                            if f.get('acodec') != 'none' and not f.get('language'):
 								                                f['language'] = orig_trans_code
 								                        # Add an "-orig" label to the original language so that it can be distinguished.
 								                        # The subs are returned without "-orig" as well for compatibility
-												[youtube] Label original auto-subs

Closes #2655

											
										
										
											2022-02-12 01:50:25 +05:30
+								                        process_language(
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                            automatic_captions, base_url, f'{trans_code}-orig',
 								                            f'{trans_name} (Original)', client_name, pot_params)
-												[youtube] Fix automatic captions

Closes #2956

											
										
										
											2022-03-05 09:38:03 +05:30
+								                    # Setting tlang=lang returns damaged subtitles.
-												[ie/youtube] Add PO token support for subtitles (#13234)

Closes #13075
Authored by: bashonly, coletdjnz

Co-authored-by: coletdjnz <coletdjnz@protonmail.com>
											
										
										
											2025-05-22 04:13:42 -05:00
+								                    process_language(
 								                        automatic_captions, base_url, trans_code, trans_name, client_name,
 								                        pot_params if orig_lang == orig_trans_code else {'tlang': trans_code, **pot_params})
 								            # Avoid duplication if we've already got everything we need
 								            need_subs_langs.difference_update(subtitles)
 								            need_caps_langs.difference_update(automatic_captions)
 								            if not (need_subs_langs or need_caps_langs):
 								                break
 								        if skipped_subs_clients and (need_subs_langs or need_caps_langs):
 								            self._report_pot_subtitles_skipped(video_id, True, msg=join_nonempty(
 								                f'{video_id}: There are missing subtitles languages because a PO token was not provided.',
 								                need_subs_langs and f'Subtitles for these languages are missing: {", ".join(need_subs_langs)}.',
 								                need_caps_langs and f'Automatic captions for {len(need_caps_langs)} languages are missing.',
 								                delim=' '))
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-22 03:46:54 +05:30
 								        info['automatic_captions'] = automatic_captions
 								        info['subtitles'] = subtitles
-												[youtube] Move metadata extraction after video availability check

											
										
										
											2018-06-03 02:08:38 +07:00
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 16:24:43 +05:30
+								        parsed_url = urllib.parse.urlparse(url)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        for component in [parsed_url.fragment, parsed_url.query]:
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 16:24:43 +05:30
+								            query = urllib.parse.parse_qs(component)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            for k, v in query.items():
 								                for d_k, s_ks in [('start', ('start', 't')), ('end', ('end',))]:
 								                    d_k += '_time'
 								                    if d_k not in info and k in s_ks:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								                        info[d_k] = parse_duration(v[0])
-												[youtube] improve Youtube Music Auto-generated description parsing(closes #20742)

											
										
										
											2019-04-27 09:16:17 +01:00
 								        # Youtube Music Auto-generated description
-												[extractor/youtube] Improve description parsing performance (#7315)

* The parsing is skipped when not needed
* The regex is improved by simulating atomic groups with lookaheads

Authored by: pukkandan, berkanteber
											
										
										
											2023-06-22 10:27:54 +03:00
+								        if (video_description or '').strip().endswith('\nAuto-generated by YouTube.'):
 								            # XXX: Causes catastrophic backtracking if description has "·"
 								            # E.g. https://www.youtube.com/watch?v=DoPaAxMQoiI
 								            # Simulating atomic groups:  (?P<a>[^xy]+)x  =>  (?=(?P<a>[^xy]+))(?P=a)x
 								            # reduces it, but does not fully fix it. https://regex101.com/r/8Ssf2h/2
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 21:29:03 +05:30
+								            mobj = re.search(
 								                r'''(?xs)
-												[extractor/youtube] Improve description parsing performance (#7315)

* The parsing is skipped when not needed
* The regex is improved by simulating atomic groups with lookaheads

Authored by: pukkandan, berkanteber
											
										
										
											2023-06-22 10:27:54 +03:00
+								                    (?=(?P<track>[^\n·]+))(?P=track)·
 								                    (?=(?P<artist>[^\n]+))(?P=artist)\n+
 								                    (?=(?P<album>[^\n]+))(?P=album)\n
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 21:29:03 +05:30
+								                    (?:.+?℗\s*(?P<release_year>\d{4})(?!\d))?
-												[ie/youtube] Fix `release_date` extraction (#11759)

Authored by: MutantPiggieGolem1
											
										
										
											2024-12-12 05:46:52 -08:00
+								                    (?:.+?Released\ on\s*:\s*(?P<release_date>\d{4}-\d{2}-\d{2}))?
-												[extractor/youtube] Improve description parsing performance (#7315)

* The parsing is skipped when not needed
* The regex is improved by simulating atomic groups with lookaheads

Authored by: pukkandan, berkanteber
											
										
										
											2023-06-22 10:27:54 +03:00
+								                    (.+?\nArtist\s*:\s*
 								                        (?=(?P<clean_artist>[^\n]+))(?P=clean_artist)\n
 								                    )?.+\nAuto-generated\ by\ YouTube\.\s*$
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 21:29:03 +05:30
+								                ''', video_description)
-												[youtube] improve Youtube Music Auto-generated description parsing(closes #20742)

											
										
										
											2019-04-27 09:16:17 +01:00
+								            if mobj:
 								                release_year = mobj.group('release_year')
 								                release_date = mobj.group('release_date')
 								                if release_date:
 								                    release_date = release_date.replace('-', '')
 								                    if not release_year:
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                        release_year = release_date[:4]
 								                info.update({
 								                    'album': mobj.group('album'.strip()),
-												[ie] Migrate commonly plural fields to lists (#8917)

Authored by: llistochek, pukkandan
Related: #3944
											
										
										
											2024-02-20 07:19:24 +00:00
+								                    'artists': ([a] if (a := mobj.group('clean_artist'))
 								                                else [a.strip() for a in mobj.group('artist').split('·')]),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                    'track': mobj.group('track').strip(),
 								                    'release_date': release_date,
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-11 02:52:55 +05:30
+								                    'release_year': int_or_none(release_year),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                })
-												[youtube] Move metadata extraction after video availability check

											
										
										
											2018-06-03 02:08:38 +07:00
-												[ie/youtube] Fix `comment_count` extraction (#11274)

Authored by: bashonly
											
										
										
											2024-10-19 21:40:20 +00:00
+								        COMMENTS_SECTION_IDS = ('comment-item-section', 'engagement-panel-comments-section')
-												[youtube] Extract `comment_count` from webpage

Closes #4091

											
										
										
											2022-06-17 12:00:55 +05:30
+								        info['comment_count'] = traverse_obj(initial_data, (
 								            'contents', 'twoColumnWatchNextResults', 'results', 'results', 'contents', ..., 'itemSectionRenderer',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            'contents', ..., 'commentsEntryPointHeaderRenderer', 'commentCount',
-												[youtube] Extract `comment_count` from webpage

Closes #4091

											
										
										
											2022-06-17 12:00:55 +05:30
+								        ), (
-												[ie/youtube] Fix `comment_count` extraction (#11274)

Authored by: bashonly
											
										
										
											2024-10-19 21:40:20 +00:00
+								            'engagementPanels', lambda _, v: v['engagementPanelSectionListRenderer']['panelIdentifier'] in COMMENTS_SECTION_IDS,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-12 01:09:58 +02:00
+								            'engagementPanelSectionListRenderer', 'header', 'engagementPanelTitleHeaderRenderer', 'contextualInfo',
-												[extractor/youtube] Fix parsing `comment_count` (#6523)

Closes #5849
Authored by: nick-cd
											
										
										
											2023-03-14 19:21:14 -04:00
+								        ), expected_type=self._get_count, get_all=False)
-												[youtube] Extract `comment_count` from webpage

Closes #4091

											
										
										
											2022-06-17 12:00:55 +05:30
-												[cleanup] Misc cleanup and refactor (#2173)

											
										
										
											2022-04-18 02:28:28 +05:30
+								        try:  # This will error if there is no livechat
-												[youtube_live_chat] Support ongoing live chat (#422)

Authored by: siikamiika
											
										
										
											2021-06-23 03:12:39 +03:00
+								            initial_data['contents']['twoColumnWatchNextResults']['conversationBar']['liveChatRenderer']['continuations'][0]['reloadContinuationData']['continuation']
-												[cleanup] Misc cleanup and refactor (#2173)

											
										
										
											2022-04-18 02:28:28 +05:30
+								        except (KeyError, IndexError, TypeError):
 								            pass
 								        else:
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 12:03:56 +05:30
+								            info.setdefault('subtitles', {})['live_chat'] = [{
-												[extractor/youtube] Fix live chat for videos with content warning

Fixes #4051
Authored by: coletdjnz

											
										
										
											2022-06-12 17:56:50 +12:00
+								                # url is needed to set cookies
 								                'url': f'https://www.youtube.com/watch?v={video_id}&bpctr=9999999999&has_verified=1',
-												[youtube_live_chat] Support ongoing live chat (#422)

Authored by: siikamiika
											
										
										
											2021-06-23 03:12:39 +03:00
+								                'video_id': video_id,
 								                'ext': 'json',
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-04 11:48:31 +09:00
+								                'protocol': ('youtube_live_chat' if live_status in ('is_live', 'is_upcoming')
 								                             else 'youtube_live_chat_replay'),
-												[youtube_live_chat] Support ongoing live chat (#422)

Authored by: siikamiika
											
										
										
											2021-06-23 03:12:39 +03:00
+								            }]
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
 								        if initial_data:
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								            info['chapters'] = (
 								                self._extract_chapters_from_json(initial_data, duration)
 								                or self._extract_chapters_from_engagement_panel(initial_data, duration)
-												[extractor/youtube] Bring back `_extract_chapters_from_description`

Closes #3886

											
										
										
											2022-05-29 01:00:41 +05:30
+								                or self._extract_chapters_from_description(video_description, duration)
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-20 05:32:41 +05:30
+								                or None)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
-												[ie/youtube] Fix `heatmap` extraction (#8299)

Closes #8189
Authored by: bashonly
											
										
										
											2023-10-06 20:00:15 -05:00
+								            info['heatmap'] = self._extract_heatmap(initial_data)
-												[extractor/youtube] Extract `heatmap` data (#7100)

Closes #3888
Authored by: tntmod54321
											
										
										
											2023-05-26 08:24:39 -04:00
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:02:44 +13:00
+								        contents = traverse_obj(
 								            initial_data, ('contents', 'twoColumnWatchNextResults', 'results', 'results', 'contents'),
 								            expected_type=list, default=[])
 								        vpir = get_first(contents, 'videoPrimaryInfoRenderer')
 								        if vpir:
 								            stl = vpir.get('superTitleLink')
 								            if stl:
 								                stl = self._get_text(stl)
 								                if try_get(
 								                        vpir,
 								                        lambda x: x['superTitleIcon']['iconType']) == 'LOCATION_PIN':
 								                    info['location'] = stl
 								                else:
-												[youtube] Fix episode metadata extraction

											
										
										
											2022-04-15 16:22:03 +12:00
+								                    mobj = re.search(r'(.+?)\s*S(\d+)\s*•?\s*E(\d+)', stl)
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:02:44 +13:00
+								                    if mobj:
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                        info.update({
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:02:44 +13:00
+								                            'series': mobj.group(1),
 								                            'season_number': int(mobj.group(2)),
 								                            'episode_number': int(mobj.group(3)),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								                        })
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:02:44 +13:00
+								            for tlb in (try_get(
 								                    vpir,
 								                    lambda x: x['videoActions']['menuRenderer']['topLevelButtons'],
 								                    list) or []):
-												[extractor/youtube] Fix video like count extraction

Support new combined button layout
Authored by: coletdjnz

											
										
										
											2022-09-09 12:34:39 +12:00
+								                tbrs = variadic(
 								                    traverse_obj(
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-10 03:56:26 +05:30
+								                        tlb, ('toggleButtonRenderer', ...),
 								                        ('segmentedLikeDislikeButtonRenderer', ..., 'toggleButtonRenderer')))
-												[extractor/youtube] Fix video like count extraction

Support new combined button layout
Authored by: coletdjnz

											
										
										
											2022-09-09 12:34:39 +12:00
+								                for tbr in tbrs:
 								                    for getter, regex in [(
 								                            lambda x: x['defaultText']['accessibility']['accessibilityData'],
 								                            r'(?P<count>[\d,]+)\s*(?P<type>(?:dis)?like)'), ([
 								                                lambda x: x['accessibility'],
 								                                lambda x: x['accessibilityData']['accessibilityData'],
 								                            ], r'(?P<type>(?:dis)?like) this video along with (?P<count>[\d,]+) other people')]:
 								                        label = (try_get(tbr, getter, dict) or {}).get('label')
 								                        if label:
 								                            mobj = re.match(regex, label)
 								                            if mobj:
 								                                info[mobj.group('type') + '_count'] = str_to_int(mobj.group('count'))
 								                                break
-												[ie/youtube] Fix `like_count` extraction (#8763)

Closes #8759
Authored by: Ganesh910
											
										
										
											2023-12-13 12:34:12 +05:30
 								            info['like_count'] = traverse_obj(vpir, (
 								                'videoActions', 'menuRenderer', 'topLevelButtons', ...,
 								                'segmentedLikeDislikeButtonViewModel', 'likeButtonViewModel', 'likeButtonViewModel',
 								                'toggleButtonViewModel', 'toggleButtonViewModel', 'defaultButtonViewModel',
 								                'buttonViewModel', 'accessibilityText', {parse_count}), get_all=False)
-												[extractor/youtube] Extract concurrent view count for livestreams (#5152)

Adds new field `concurrent_view_count`
Closes https://github.com/yt-dlp/yt-dlp/issues/4843

Authored by: coletdjnz
											
										
										
											2022-10-07 20:00:40 +13:00
+								            vcr = traverse_obj(vpir, ('viewCount', 'videoViewCountRenderer'))
 								            if vcr:
 								                vc = self._get_count(vcr, 'viewCount')
 								                # Upcoming premieres with waiting count are treated as live here
 								                if vcr.get('isLive'):
 								                    info['concurrent_view_count'] = vc
 								                elif info.get('view_count') is None:
 								                    info['view_count'] = vc
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:02:44 +13:00
+								        vsir = get_first(contents, 'videoSecondaryInfoRenderer')
 								        if vsir:
 								            vor = traverse_obj(vsir, ('owner', 'videoOwnerRenderer'))
 								            info.update({
 								                'channel': self._get_text(vor, 'title'),
 								                'channel_follower_count': self._get_count(vor, 'subscriberCountText')})
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 07:58:36 +00:00
+								            if not channel_handle:
 								                channel_handle = self.handle_from_url(
 								                    traverse_obj(vor, (
 								                        ('navigationEndpoint', ('title', 'runs', ..., 'navigationEndpoint')),
 								                        (('commandMetadata', 'webCommandMetadata', 'url'), ('browseEndpoint', 'canonicalBaseUrl')),
 								                        {str}), get_all=False))
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:02:44 +13:00
+								            rows = try_get(
 								                vsir,
 								                lambda x: x['metadataRowContainer']['metadataRowContainerRenderer']['rows'],
 								                list) or []
 								            multiple_songs = False
 								            for row in rows:
 								                if try_get(row, lambda x: x['metadataRowRenderer']['hasDividerLine']) is True:
 								                    multiple_songs = True
 								                    break
 								            for row in rows:
 								                mrr = row.get('metadataRowRenderer') or {}
 								                mrr_title = mrr.get('title')
 								                if not mrr_title:
 								                    continue
 								                mrr_title = self._get_text(mrr, 'title')
 								                mrr_contents_text = self._get_text(mrr, ('contents', 0))
 								                if mrr_title == 'License':
 								                    info['license'] = mrr_contents_text
 								                elif not multiple_songs:
 								                    if mrr_title == 'Album':
 								                        info['album'] = mrr_contents_text
 								                    elif mrr_title == 'Artist':
-												[ie] Migrate commonly plural fields to lists (#8917)

Authored by: llistochek, pukkandan
Related: #3944
											
										
										
											2024-02-20 07:19:24 +00:00
+								                        info['artists'] = [mrr_contents_text] if mrr_contents_text else None
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:02:44 +13:00
+								                    elif mrr_title == 'Song':
 								                        info['track'] = mrr_contents_text
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 19:50:05 +12:00
+								            owner_badges = self._extract_badges(traverse_obj(vsir, ('owner', 'videoOwnerRenderer', 'badges')))
 								            if self._has_badge(owner_badges, BadgeType.VERIFIED):
 								                info['channel_is_verified'] = True
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 07:58:36 +00:00
+								        info.update({
 								            'uploader': info.get('channel'),
 								            'uploader_id': channel_handle,
 								            'uploader_url': format_field(channel_handle, None, 'https://www.youtube.com/%s', default=None),
 								        })
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-27 09:13:12 +12:00
 								        # We only want timestamp IF it has time precision AND a timezone
 								        # Currently the uploadDate in microformats appears to be in US/Pacific timezone.
 								        timestamp = (
 								            parse_iso8601(get_first(microformats, 'uploadDate'), timezone=NO_DEFAULT)
 								            or parse_iso8601(search_meta('uploadDate'), timezone=NO_DEFAULT)
 								        )
 								        upload_date = (
 								            dt.datetime.fromtimestamp(timestamp, dt.timezone.utc).strftime('%Y%m%d') if timestamp else
 								            (
 								                unified_strdate(get_first(microformats, 'uploadDate'))
 								                or unified_strdate(search_meta('uploadDate'))
 								            ))
 								        # In the case we cannot get the timestamp:
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:02:44 +13:00
+								        # The upload date for scheduled, live and past live streams / premieres in microformats
 								        # may be different from the stream date. Although not in UTC, we will prefer it in this case.
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 20:28:00 +13:00
+								        # See: https://github.com/yt-dlp/yt-dlp/pull/2223#issuecomment-1008485139
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-27 09:13:12 +12:00
+								        if not upload_date or (not timestamp and live_status in ('not_live', None)):
 								            # this should be in UTC, as configured in the cookie/client context
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See the README or the error message for the list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 05:16:46 +00:00
+								            upload_date = strftime_or_none(
-												[cleanup] Misc

Closes #6288, Closes #7197, Closes #7265, Closes #7353, Closes #5773
Authored by: mikf, freezboltz, pukkandan

											
										
										
											2023-06-21 09:21:20 +05:30
+								                self._parse_time_text(self._get_text(vpir, 'dateText'))) or upload_date
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-27 09:13:12 +12:00
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-14 11:02:44 +13:00
+								        info['upload_date'] = upload_date
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-27 09:13:12 +12:00
+								        info['timestamp'] = timestamp
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 20:28:00 +13:00
-												[ie/youtube] Check newly uploaded iOS HLS formats (#8336)

Closes #7747
Authored by: bashonly
											
										
										
											2023-10-28 03:02:13 -05:00
+								        if upload_date and live_status not in ('is_live', 'post_live', 'is_upcoming'):
 								            # Newly uploaded videos' HLS formats are potentially problematic and need to be checked
-												[cleanup] Standardize `import datetime as dt` (#8978)

											
										
										
											2024-02-25 05:46:34 +05:30
+								            upload_datetime = datetime_from_str(upload_date).replace(tzinfo=dt.timezone.utc)
-												[ie/youtube] Improve detection of faulty HLS formats (#8646)

Closes #7747
Authored by: bashonly
											
										
										
											2023-11-25 20:21:29 -06:00
+								            if upload_datetime >= datetime_from_str('today-2days'):
-												[ie/youtube] Check newly uploaded iOS HLS formats (#8336)

Closes #7747
Authored by: bashonly
											
										
										
											2023-10-28 03:02:13 -05:00
+								                for fmt in info['formats']:
 								                    if fmt.get('protocol') == 'm3u8_native':
 								                        fmt['__needs_testing'] = True
-												[ie] Migrate commonly plural fields to lists (#8917)

Authored by: llistochek, pukkandan
Related: #3944
											
										
										
											2024-02-20 07:19:24 +00:00
+								        for s_k, d_k in [('artists', 'creators'), ('track', 'alt_title')]:
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								            v = info.get(s_k)
 								            if v:
 								                info[d_k] = v
-												[youtube] Added 'subscriber_count' to extraction

											
										
										
											2020-09-15 17:16:58 +02:00
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 18:58:49 +05:30
+								        badges = self._extract_badges(traverse_obj(vpir, 'badges'))
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See the README or the error message for the list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 05:16:46 +00:00
 								        is_private = (self._has_badge(badges, BadgeType.AVAILABILITY_PRIVATE)
 								                      or get_first(video_details, 'isPrivate', expected_type=bool))
 								        info['availability'] = (
 								            'public' if self._has_badge(badges, BadgeType.AVAILABILITY_PUBLIC)
 								            else self._availability(
 								                is_private=is_private,
 								                needs_premium=(
 								                    self._has_badge(badges, BadgeType.AVAILABILITY_PREMIUM)
 								                    or False if initial_data and is_private is not None else None),
 								                needs_subscription=(
 								                    self._has_badge(badges, BadgeType.AVAILABILITY_SUBSCRIPTION)
 								                    or False if initial_data and is_private is not None else None),
 								                needs_auth=info['age_limit'] >= 18,
 								                is_unlisted=None if is_private is None else (
 								                    self._has_badge(badges, BadgeType.AVAILABILITY_UNLISTED)
 								                    or get_first(microformats, 'isUnlisted', expected_type=bool))))
-												[youtube] Show if video is `private`, `unlisted` etc in new field `availability` (#188)
Closes: #185, https://github.com/ytdl-org/youtube-dl/issues/25631

Authored by: colethedj, pukkandan

											
										
										
											2021-03-21 21:23:34 +00:00
-												[ie/youtube] Do not require PO Token for premium accounts (#13640)

Authored by: coletdjnz
											
										
										
											2025-07-11 18:54:01 +12:00
+								        info['__post_extractor'] = self.extract_comments(webpage_ytcfg, video_id, contents, webpage)
-												[YoutubeIE] Externalize format selection

											
										
										
											2013-12-18 03:30:55 +01:00
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-21 09:22:34 +05:30
+								        self.mark_watched(video_id, player_responses)
-												Add --mark-watched feature (Closes #5054)

											
										
										
											2016-03-01 01:01:33 +06:00
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 20:07:17 +05:30
+								        return info