# yt-dlp/yt_dlp/extractor/youtube/_video.py

import base64
import binascii
import collections
import datetime as dt
import functools
import itertools
import json
import math
import os.path
import random
import re
import sys
import threading
import time
import traceback
import urllib.parse

from ._base import (
    INNERTUBE_CLIENTS,
    BadgeType,
    YoutubeBaseInfoExtractor,
    _PoTokenContext,
    _split_innertube_client,
    short_client_name,
)
from ..openload import PhantomJSwrapper
from ...jsinterp import JSInterpreter
from ...networking.exceptions import HTTPError
from ...utils import (
    NO_DEFAULT,
    ExtractorError,
    LazyList,
    bug_reports_message,
    clean_html,
    datetime_from_str,
    filesize_from_tbr,
    float_or_none,
    format_field,
    get_first,
    int_or_none,
    join_nonempty,
    js_to_json,
    mimetype2ext,
    orderedSet,
    parse_codecs,
    parse_count,
    parse_duration,
    parse_iso8601,
    parse_qs,
    qualities,
    remove_end,
    remove_start,
    smuggle_url,
    str_or_none,
    str_to_int,
    strftime_or_none,
    traverse_obj,
    try_call,
    try_get,
    unescapeHTML,
    unified_strdate,
    unsmuggle_url,
    update_url_query,
    url_or_none,
    urljoin,
    variadic,
)

# Names carrying a `__yt_dlp_` prefix.
# NOTE(review): presumably used as extra keys attached to streaming data to record the
# originating client and its initial PO token - confirm against the use sites, which are
# not visible in this part of the file.
STREAMING_DATA_CLIENT_NAME = '__yt_dlp_client'
STREAMING_DATA_INITIAL_PO_TOKEN = '__yt_dlp_po_token'
# Link to the PO Token guide on the yt-dlp wiki.
PO_TOKEN_GUIDE_URL = 'https://github.com/yt-dlp/yt-dlp/wiki/PO-Token-Guide'


class YoutubeIE(YoutubeBaseInfoExtractor):
    IE_DESC = 'YouTube'
    # Verbose-mode (?x) pattern matching either a bare 11-character video ID or a URL
    # that leads up to one. The ID is captured in the named group `id`.
    #   * Group 1 (the whole scheme/host/path prefix) is optional, so a naked ID matches.
    #   * The conditional `(?(1).+)?` only permits trailing text after the ID when that
    #     prefix was actually present.
    #   * The literal goes through str.format(): `{invidious}` is replaced with the
    #     `|`-joined entries of YoutubeBaseInfoExtractor._INVIDIOUS_SITES, which is why
    #     the `{11}` quantifier has to be written with doubled braces (`{{11}}`).
    _VALID_URL = r'''(?x)^
                     (
                         (?:https?://|//)                                    # http(s):// or protocol-independent URL
                         (?:(?:(?:(?:\w+\.)?[yY][oO][uU][tT][uU][bB][eE](?:-nocookie|kids)?\.com|
                            (?:www\.)?deturl\.com/www\.youtube\.com|
                            (?:www\.)?pwnyoutube\.com|
                            (?:www\.)?hooktube\.com|
                            (?:www\.)?yourepeat\.com|
                            tube\.majestyc\.net|
                            {invidious}|
                            youtube\.googleapis\.com)/                        # the various hostnames, with wildcard subdomains
                         (?:.*?\#/)?                                          # handle anchor (#/) redirect urls
                         (?:                                                  # the various things that can precede the ID:
                             (?:(?:v|embed|e|shorts|live)/(?!videoseries|live_stream))  # v/ or embed/ or e/ or shorts/
                             |(?:                                             # or the v= param in all its forms
                                 (?:(?:watch|movie)(?:_popup)?(?:\.php)?/?)?  # preceding watch(_popup|.php) or nothing (like /?v=xxxx)
                                 (?:\?|\#!?)                                  # the params delimiter ? or # or #!
                                 (?:.*?[&;])??                                # any other preceding param (like /?s=tuff&v=xxxx or ?s=tuff&amp;v=V36LpHqtcDY)
                                 v=
                             )
                         ))
                         |(?:
                            youtu\.be|                                        # just youtu.be/xxxx
                            vid\.plus|                                        # or vid.plus/xxxx
                            zwearz\.com/watch|                                # or zwearz.com/watch/xxxx
                            {invidious}
                         )/
                         |(?:www\.)?cleanvideosearch\.com/media/action/yt/watch\?videoId=
                         )
                     )?                                                       # all until now is optional -> you can pass the naked ID
                     (?P<id>[0-9A-Za-z_-]{{11}})                              # here is it! the YouTube video ID
                     (?(1).+)?                                                # if we found the ID, everything can follow
                     (?:\#|$)'''.format(
        invidious='|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
    )
    # Patterns for locating YouTube embeds inside HTML markup; each one captures the
    # embedded address in the named group `url`.
    _EMBED_REGEX = [
        # A quoted youtube.com / youtube-nocookie.com address under /embed/, /v/ or /p/
        # followed by 11 ID characters, introduced by one of the listed attribute/call
        # prefixes. The backreference `\1` requires the closing quote to match the opening one.
        # NOTE(review): `embedSWF\(?:\s*` parses as "embedSWF", an optional "(", a literal ":"
        # and optional whitespace - not as a non-capturing group. Possibly `embedSWF\(\s*`
        # was intended; confirm before changing, since it alters what gets matched.
        r'''(?x)
            (?:
                <(?:[0-9A-Za-z-]+?)?iframe[^>]+?src=|
                data-video-url=|
                <embed[^>]+?src=|
                embedSWF\(?:\s*|
                <object[^>]+data=|
                new\s+SWFObject\(
            )
            (["\'])
                (?P<url>(?:https?:)?//(?:www\.)?youtube(?:-nocookie)?\.com/
                (?:embed|v|p)/[0-9A-Za-z_-]{11}.*?)
            \1''',
        # https://wordpress.org/plugins/lazy-load-for-videos/
        # Matches an <a> tag whose href is a https://www.youtube.com/watch?v=<11-char ID> link
        # and whose class attribute contains a word starting with "lazy-load-youtube".
        r'''(?xs)
            <a\s[^>]*\bhref="(?P<url>https://www\.youtube\.com/watch\?v=[0-9A-Za-z_-]{11})"
            \s[^>]*\bclass="[^"]*\blazy-load-youtube''',
    ]
    _RETURN_TYPE = 'video'  # XXX: How to handle multifeed?

    # Alternative patterns for player JavaScript paths; each captures the player
    # identifier in the named group `id`.
    # NOTE(review): presumably tried in the listed order by the player-ID lookup -
    # confirm against the caller, which is outside this part of the file.
    _PLAYER_INFO_RE = (
        r'/s/player/(?P<id>[a-zA-Z0-9_-]{8,})/(?:tv-)?player',
        r'/(?P<id>[a-zA-Z0-9_-]{8,})/player(?:_ias\.vflset(?:/[a-zA-Z]{2,3}_[a-zA-Z]{2,3})?|-plasma-ias-(?:phone|tablet)-[a-z]{2}_[A-Z]{2}\.vflset)/base\.js$',
        r'\b(?P<id>vfl[a-zA-Z0-9_-]+)\b.*?\.js$',
    )
    # Static table of known format properties, keyed by itag (as a string).
    # Each entry lists only the fields that are fixed for that itag ('ext', 'width'/'height',
    # 'acodec'/'vcodec', 'abr', 'fps', 'container', 'format_note', ...); fields that vary
    # between videos are left out (see the notes on itags 36, 138 and 272 below).
    # 3D and HLS entries additionally carry a negative 'preference' (-20 and -10 respectively).
    _formats = {  # NB: Used in YoutubeWebArchiveIE and GoogleDriveIE
        '5': {'ext': 'flv', 'width': 400, 'height': 240, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
        '6': {'ext': 'flv', 'width': 450, 'height': 270, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
        '13': {'ext': '3gp', 'acodec': 'aac', 'vcodec': 'mp4v'},
        '17': {'ext': '3gp', 'width': 176, 'height': 144, 'acodec': 'aac', 'abr': 24, 'vcodec': 'mp4v'},
        '18': {'ext': 'mp4', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 96, 'vcodec': 'h264'},
        '22': {'ext': 'mp4', 'width': 1280, 'height': 720, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
        '34': {'ext': 'flv', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
        '35': {'ext': 'flv', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
        # itag 36 videos are either 320x180 (BaW_jenozKc) or 320x240 (__2ABJjxzNo), abr varies as well
        '36': {'ext': '3gp', 'width': 320, 'acodec': 'aac', 'vcodec': 'mp4v'},
        '37': {'ext': 'mp4', 'width': 1920, 'height': 1080, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
        '38': {'ext': 'mp4', 'width': 4096, 'height': 3072, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
        '43': {'ext': 'webm', 'width': 640, 'height': 360, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
        '44': {'ext': 'webm', 'width': 854, 'height': 480, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
        '45': {'ext': 'webm', 'width': 1280, 'height': 720, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
        '46': {'ext': 'webm', 'width': 1920, 'height': 1080, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
        '59': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
        '78': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},


        # 3D videos
        '82': {'ext': 'mp4', 'height': 360, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
        '83': {'ext': 'mp4', 'height': 480, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
        '84': {'ext': 'mp4', 'height': 720, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
        '85': {'ext': 'mp4', 'height': 1080, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
        '100': {'ext': 'webm', 'height': 360, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8', 'preference': -20},
        '101': {'ext': 'webm', 'height': 480, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
        '102': {'ext': 'webm', 'height': 720, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},

        # Apple HTTP Live Streaming
        '91': {'ext': 'mp4', 'height': 144, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
        '92': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
        '93': {'ext': 'mp4', 'height': 360, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
        '94': {'ext': 'mp4', 'height': 480, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
        '95': {'ext': 'mp4', 'height': 720, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
        '96': {'ext': 'mp4', 'height': 1080, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
        '132': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
        '151': {'ext': 'mp4', 'height': 72, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 24, 'vcodec': 'h264', 'preference': -10},

        # DASH mp4 video
        '133': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '134': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '135': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '136': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '137': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '138': {'ext': 'mp4', 'format_note': 'DASH video', 'vcodec': 'h264'},  # Height can vary (https://github.com/ytdl-org/youtube-dl/issues/4559)
        '160': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '212': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '264': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'h264'},
        '298': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
        '299': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
        '266': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'h264'},

        # Dash mp4 audio
        '139': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 48, 'container': 'm4a_dash'},
        '140': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 128, 'container': 'm4a_dash'},
        '141': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 256, 'container': 'm4a_dash'},
        '256': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
        '258': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
        '325': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'dtse', 'container': 'm4a_dash'},
        '328': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'ec-3', 'container': 'm4a_dash'},

        # Dash webm
        '167': {'ext': 'webm', 'height': 360, 'width': 640, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '168': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '169': {'ext': 'webm', 'height': 720, 'width': 1280, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '170': {'ext': 'webm', 'height': 1080, 'width': 1920, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '218': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '219': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
        '278': {'ext': 'webm', 'height': 144, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp9'},
        '242': {'ext': 'webm', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '243': {'ext': 'webm', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '244': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '245': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '246': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '247': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '248': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '271': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        # itag 272 videos are either 3840x2160 (e.g. RtoitU2A-3E) or 7680x4320 (sLprVF6d7Ug)
        '272': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '302': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
        '303': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
        '308': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
        '313': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
        '315': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},

        # Dash webm audio
        '171': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 128},
        '172': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 256},

        # Dash webm audio with opus inside
        '249': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 50},
        '250': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 70},
        '251': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 160},

        # RTMP (unnamed)
        '_rtmp': {'protocol': 'rtmp'},

        # av01 video only formats sometimes served with "unknown" codecs
        '394': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
        '395': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
        '396': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'av01.0.01M.08'},
        '397': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'av01.0.04M.08'},
        '398': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'av01.0.05M.08'},
        '399': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'av01.0.08M.08'},
        '400': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
        '401': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
    }
    # Subtitle format identifiers.
    # NOTE(review): presumably the formats offered for each caption track - confirm at the use site.
    _SUBTITLE_FORMATS = ('json3', 'srv1', 'srv2', 'srv3', 'ttml', 'vtt')
    # Client names for the general and the authenticated case.
    # NOTE(review): presumably names of INNERTUBE_CLIENTS entries tried by default when the
    # user does not pick clients explicitly - confirm against the client-selection code.
    _DEFAULT_CLIENTS = ('tv', 'ios', 'web')
    _DEFAULT_AUTHED_CLIENTS = ('tv', 'web')

    # NOTE(review): presumably overrides the base extractor's geo-bypass default - confirm
    # against the base class, which is not shown here.
    _GEO_BYPASS = False

    IE_NAME = 'youtube'
    _TESTS = [
        {
            'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&t=1s&end=9',
            'info_dict': {
                'id': 'BaW_jenozKc',
                'ext': 'mp4',
                'title': 'youtube-dl test video "\'/\\ä↭𝕐',
                'channel': 'Philipp Hagemeister',
                'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
                'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
                'upload_date': '20121002',
                'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
                'categories': ['Science & Technology'],
                'tags': ['youtube-dl'],
                'duration': 10,
                'view_count': int,
                'like_count': int,
                'availability': 'public',
                'playable_in_embed': True,
                'thumbnail': 'https://i.ytimg.com/vi/BaW_jenozKc/maxresdefault.jpg',
                'live_status': 'not_live',
                'age_limit': 0,
                'start_time': 1,
                'end_time': 9,
                'comment_count': int,
                'channel_follower_count': int,
                'uploader': 'Philipp Hagemeister',
                'uploader_url': 'https://www.youtube.com/@PhilippHagemeister',
                'uploader_id': '@PhilippHagemeister',
                'heatmap': 'count:100',
                'timestamp': 1349198244,
            },
        },
        {
            'url': '//www.YouTube.com/watch?v=yZIXLfi8CZQ',
            'note': 'Embed-only video (#1746)',
            'info_dict': {
                'id': 'yZIXLfi8CZQ',
                'ext': 'mp4',
                'upload_date': '20120608',
                'title': 'Principal Sexually Assaults A Teacher - Episode 117 - 8th June 2012',
                'description': 'md5:09b78bd971f1e3e289601dfba15ca4f7',
                'age_limit': 18,
            },
            'skip': 'Private video',
        },
        {
            'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&v=yZIXLfi8CZQ',
            'note': 'Use the first video ID in the URL',
            'info_dict': {
                'id': 'BaW_jenozKc',
                'ext': 'mp4',
                'title': 'youtube-dl test video "\'/\\ä↭𝕐',
                'channel': 'Philipp Hagemeister',
                'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
                'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
                'upload_date': '20121002',
                'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
                'categories': ['Science & Technology'],
                'tags': ['youtube-dl'],
                'duration': 10,
                'view_count': int,
                'like_count': int,
                'availability': 'public',
                'playable_in_embed': True,
                'thumbnail': 'https://i.ytimg.com/vi/BaW_jenozKc/maxresdefault.jpg',
                'live_status': 'not_live',
                'age_limit': 0,
                'comment_count': int,
                'channel_follower_count': int,
                'uploader': 'Philipp Hagemeister',
                'uploader_url': 'https://www.youtube.com/@PhilippHagemeister',
                'uploader_id': '@PhilippHagemeister',
                'heatmap': 'count:100',
                'timestamp': 1349198244,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            'url': 'https://www.youtube.com/watch?v=a9LDPn-MO4I',
            'note': '256k DASH audio (format 141) via DASH manifest',
            'info_dict': {
                'id': 'a9LDPn-MO4I',
                'ext': 'm4a',
                'upload_date': '20121002',
                'description': '',
                'title': 'UHDTV TEST 8K VIDEO.mp4',
            },
            'params': {
                'youtube_include_dash_manifest': True,
                'format': '141',
            },
            'skip': 'format 141 not served anymore',
        },
        # DASH manifest with encrypted signature
        {
            'url': 'https://www.youtube.com/watch?v=IB3lcPjvWLA',
            'info_dict': {
                'id': 'IB3lcPjvWLA',
                'ext': 'm4a',
                'title': 'Afrojack, Spree Wilson - The Spark (Official Music Video) ft. Spree Wilson',
                'description': 'md5:8f5e2b82460520b619ccac1f509d43bf',
                'duration': 244,
                'upload_date': '20131011',
                'abr': 129.495,
                'like_count': int,
                'channel_id': 'UChuZAo1RKL85gev3Eal9_zg',
                'playable_in_embed': True,
                'channel_url': 'https://www.youtube.com/channel/UChuZAo1RKL85gev3Eal9_zg',
                'view_count': int,
                'track': 'The Spark',
                'live_status': 'not_live',
                'thumbnail': 'https://i.ytimg.com/vi_webp/IB3lcPjvWLA/maxresdefault.webp',
                'channel': 'Afrojack',
                'tags': 'count:19',
                'availability': 'public',
                'categories': ['Music'],
                'age_limit': 0,
                'alt_title': 'The Spark',
                'channel_follower_count': int,
                'uploader': 'Afrojack',
                'uploader_url': 'https://www.youtube.com/@Afrojack',
                'uploader_id': '@Afrojack',
            },
            'params': {
                'youtube_include_dash_manifest': True,
                'format': '141/bestaudio[ext=m4a]',
            },
        },
        # Age-gate videos. See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
        {
            'note': 'Embed allowed age-gate video; works with web_embedded',
            'url': 'https://youtube.com/watch?v=HtVdAasjOgU',
            'info_dict': {
                'id': 'HtVdAasjOgU',
                'ext': 'mp4',
                'title': 'The Witcher 3: Wild Hunt - The Sword Of Destiny Trailer',
                'description': r're:(?s).{100,}About the Game\n.*?The Witcher 3: Wild Hunt.{100,}',
                'duration': 142,
                'upload_date': '20140605',
                'age_limit': 18,
                'categories': ['Gaming'],
                'thumbnail': 'https://i.ytimg.com/vi_webp/HtVdAasjOgU/maxresdefault.webp',
                'availability': 'needs_auth',
                'channel_url': 'https://www.youtube.com/channel/UCzybXLxv08IApdjdN0mJhEg',
                'like_count': int,
                'channel': 'The Witcher',
                'live_status': 'not_live',
                'tags': 'count:17',
                'channel_id': 'UCzybXLxv08IApdjdN0mJhEg',
                'playable_in_embed': True,
                'view_count': int,
                'channel_follower_count': int,
                'uploader': 'The Witcher',
                'uploader_url': 'https://www.youtube.com/@thewitcher',
                'uploader_id': '@thewitcher',
                'comment_count': int,
                'channel_is_verified': True,
                'heatmap': 'count:100',
                'timestamp': 1401991663,
            },
        },
        {
            'note': 'Age-gate video with embed allowed in public site',
            'url': 'https://youtube.com/watch?v=HsUATh_Nc2U',
            'info_dict': {
                'id': 'HsUATh_Nc2U',
                'ext': 'mp4',
                'title': 'Godzilla 2 (Official Video)',
                'description': 'md5:bf77e03fcae5529475e500129b05668a',
                'upload_date': '20200408',
                'age_limit': 18,
                'availability': 'needs_auth',
                'channel_id': 'UCYQT13AtrJC0gsM1far_zJg',
                'channel': 'FlyingKitty',
                'channel_url': 'https://www.youtube.com/channel/UCYQT13AtrJC0gsM1far_zJg',
                'view_count': int,
                'categories': ['Entertainment'],
                'live_status': 'not_live',
                'tags': ['Flyingkitty', 'godzilla 2'],
                'thumbnail': 'https://i.ytimg.com/vi/HsUATh_Nc2U/maxresdefault.jpg',
                'like_count': int,
                'duration': 177,
                'playable_in_embed': True,
                'channel_follower_count': int,
                'uploader': 'FlyingKitty',
                'uploader_url': 'https://www.youtube.com/@FlyingKitty900',
                'uploader_id': '@FlyingKitty900',
                'comment_count': int,
                'channel_is_verified': True,
            },
            'skip': 'Age-restricted; requires authentication',
        },
        {
            'note': 'Age-gate video embedable only with clientScreen=EMBED',
            'url': 'https://youtube.com/watch?v=Tq92D6wQ1mg',
            'info_dict': {
                'id': 'Tq92D6wQ1mg',
                'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
                'ext': 'mp4',
                'upload_date': '20191228',
                'description': 'md5:17eccca93a786d51bc67646756894066',
                'age_limit': 18,
                'like_count': int,
                'availability': 'needs_auth',
                'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
                'view_count': int,
                'thumbnail': 'https://i.ytimg.com/vi_webp/Tq92D6wQ1mg/sddefault.webp',
                'channel': 'Projekt Melody',
                'live_status': 'not_live',
                'tags': ['mmd', 'dance', 'mikumikudance', 'kpop', 'vtuber'],
                'playable_in_embed': True,
                'categories': ['Entertainment'],
                'duration': 106,
                'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
                'comment_count': int,
                'channel_follower_count': int,
                'uploader': 'Projekt Melody',
                'uploader_url': 'https://www.youtube.com/@ProjektMelody',
                'uploader_id': '@ProjektMelody',
                'timestamp': 1577508724,
            },
            'skip': 'Age-restricted; requires authentication',
        },
        {
            'note': 'Non-Agegated non-embeddable video',
            'url': 'https://youtube.com/watch?v=MeJVWBSsPAY',
            'info_dict': {
                'id': 'MeJVWBSsPAY',
                'ext': 'mp4',
                'title': 'OOMPH! - Such Mich Find Mich (Lyrics)',
                'description': 'Fan Video. Music & Lyrics by OOMPH!.',
                'upload_date': '20130730',
                'track': 'Such mich find mich',
                'age_limit': 0,
                'tags': ['oomph', 'such mich find mich', 'lyrics', 'german industrial', 'musica industrial'],
                'like_count': int,
                'playable_in_embed': False,
                'creator': 'OOMPH!',
                'thumbnail': 'https://i.ytimg.com/vi/MeJVWBSsPAY/sddefault.jpg',
                'view_count': int,
                'alt_title': 'Such mich find mich',
                'duration': 210,
                'channel': 'Herr Lurik',
                'channel_id': 'UCdR3RSDPqub28LjZx0v9-aA',
                'categories': ['Music'],
                'availability': 'public',
                'channel_url': 'https://www.youtube.com/channel/UCdR3RSDPqub28LjZx0v9-aA',
                'live_status': 'not_live',
                'artist': 'OOMPH!',
                'channel_follower_count': int,
                'uploader': 'Herr Lurik',
                'uploader_url': 'https://www.youtube.com/@HerrLurik',
                'uploader_id': '@HerrLurik',
            },
        },
        {
            'note': 'Non-bypassable age-gated video',
            'url': 'https://youtube.com/watch?v=Cr381pDsSsA',
            'only_matching': True,
        },
        # video_info is None (https://github.com/ytdl-org/youtube-dl/issues/4421)
        # YouTube Red ad is not captured for creator
        {
            'url': '__2ABJjxzNo',
            'info_dict': {
                'id': '__2ABJjxzNo',
                'ext': 'mp4',
                'duration': 266,
                'upload_date': '20100430',
                'creator': 'deadmau5',
                'description': 'md5:6cbcd3a92ce1bc676fc4d6ab4ace2336',
                'title': 'Deadmau5 - Some Chords (HD)',
                'alt_title': 'Some Chords',
                'availability': 'public',
                'tags': 'count:14',
                'channel_id': 'UCYEK6xds6eo-3tr4xRdflmQ',
                'view_count': int,
                'live_status': 'not_live',
                'channel': 'deadmau5',
                'thumbnail': 'https://i.ytimg.com/vi_webp/__2ABJjxzNo/maxresdefault.webp',
                'like_count': int,
                'track': 'Some Chords',
                'artist': 'deadmau5',
                'playable_in_embed': True,
                'age_limit': 0,
                'channel_url': 'https://www.youtube.com/channel/UCYEK6xds6eo-3tr4xRdflmQ',
                'categories': ['Music'],
                'album': 'Some Chords',
                'channel_follower_count': int,
                'uploader': 'deadmau5',
                'uploader_url': 'https://www.youtube.com/@deadmau5',
                'uploader_id': '@deadmau5',
            },
            'expected_warnings': [
                'DASH manifest missing',
            ],
        },
        # Olympics (https://github.com/ytdl-org/youtube-dl/issues/4431)
        {
            'url': 'lqQg6PlCWgI',
            'info_dict': {
                'id': 'lqQg6PlCWgI',
                'ext': 'mp4',
                'duration': 6085,
                'upload_date': '20150827',
                'description': 'md5:04bbbf3ccceb6795947572ca36f45904',
                'title': 'Hockey - Women -  GER-AUS - London 2012 Olympic Games',
                'like_count': int,
                'release_timestamp': 1343767800,
                'playable_in_embed': True,
                'categories': ['Sports'],
                'release_date': '20120731',
                'channel': 'Olympics',
                'tags': ['Hockey', '2012-07-31', '31 July 2012', 'Riverbank Arena', 'Session', 'Olympics', 'Olympic Games', 'London 2012', '2012 Summer Olympics', 'Summer Games'],
                'channel_id': 'UCTl3QQTvqHFjurroKxexy2Q',
                'thumbnail': 'https://i.ytimg.com/vi/lqQg6PlCWgI/maxresdefault.jpg',
                'age_limit': 0,
                'availability': 'public',
                'live_status': 'was_live',
                'view_count': int,
                'channel_url': 'https://www.youtube.com/channel/UCTl3QQTvqHFjurroKxexy2Q',
                'channel_follower_count': int,
                'uploader': 'Olympics',
                'uploader_url': 'https://www.youtube.com/@Olympics',
                'uploader_id': '@Olympics',
                'channel_is_verified': True,
                'timestamp': 1440707674,
            },
            'params': {
                'skip_download': 'requires avconv',
            },
        },
        # Non-square pixels
        {
            'url': 'https://www.youtube.com/watch?v=_b-2C3KPAM0',
            'info_dict': {
                'id': '_b-2C3KPAM0',
                'ext': 'mp4',
                'stretched_ratio': 16 / 9.,
                'duration': 85,
                'upload_date': '20110310',
                'description': 'made by Wacom from Korea | 字幕&加油添醋 by TY\'s Allen | 感謝heylisa00cavey1001同學熱情提供梗及翻譯',
                'title': '[A-made] 變態妍字幕版 太妍 我就是這樣的人',
                'playable_in_embed': True,
                'channel': '孫ᄋᄅ',
                'age_limit': 0,
                'tags': 'count:11',
                'channel_url': 'https://www.youtube.com/channel/UCS-xxCmRaA6BFdmgDPA_BIw',
                'channel_id': 'UCS-xxCmRaA6BFdmgDPA_BIw',
                'thumbnail': 'https://i.ytimg.com/vi/_b-2C3KPAM0/maxresdefault.jpg',
                'view_count': int,
                'categories': ['People & Blogs'],
                'like_count': int,
                'live_status': 'not_live',
                'availability': 'unlisted',
                'comment_count': int,
                'channel_follower_count': int,
                'uploader': '孫ᄋᄅ',
                'uploader_url': 'https://www.youtube.com/@AllenMeow',
                'uploader_id': '@AllenMeow',
                'timestamp': 1299776999,
            },
        },
        # url_encoded_fmt_stream_map is empty string
        {
            'url': 'qEJwOuvDf7I',
            'info_dict': {
                'id': 'qEJwOuvDf7I',
                'ext': 'webm',
                'title': 'Обсуждение судебной практики по выборам 14 сентября 2014 года в Санкт-Петербурге',
                'description': '',
                'upload_date': '20150404',
            },
            'params': {
                'skip_download': 'requires avconv',
            },
            'skip': 'This live event has ended.',
        },
        # Extraction from multiple DASH manifests (https://github.com/ytdl-org/youtube-dl/pull/6097)
        {
            'url': 'https://www.youtube.com/watch?v=FIl7x6_3R5Y',
            'info_dict': {
                'id': 'FIl7x6_3R5Y',
                'ext': 'webm',
                'title': 'md5:7b81415841e02ecd4313668cde88737a',
                'description': 'md5:116377fd2963b81ec4ce64b542173306',
                'duration': 220,
                'upload_date': '20150625',
                'formats': 'mincount:31',
            },
            'skip': 'not actual anymore',
        },
        # DASH manifest with segment_list
        {
            'url': 'https://www.youtube.com/embed/CsmdDsKjzN8',
            'md5': '8ce563a1d667b599d21064e982ab9e31',
            'info_dict': {
                'id': 'CsmdDsKjzN8',
                'ext': 'mp4',
                'upload_date': '20150501',  # According to '<meta itemprop="datePublished"', but in other places it's 20150510
                'description': 'Retransmisión en directo de la XVIII media maratón de Zaragoza.',
                'title': 'Retransmisión XVIII Media maratón Zaragoza 2015',
            },
            'params': {
                'youtube_include_dash_manifest': True,
                'format': '135',  # bestvideo
            },
            'skip': 'This live event has ended.',
        },
        {
            # Multifeed videos (multiple cameras), URL can be of any Camera
            # TODO: fix multifeed titles
            'url': 'https://www.youtube.com/watch?v=zaPI8MvL8pg',
            'info_dict': {
                'id': 'zaPI8MvL8pg',
                'title': 'Terraria 1.2 Live Stream | Let\'s Play - Part 04',
                'description': 'md5:563ccbc698b39298481ca3c571169519',
            },
            'playlist': [{
                'info_dict': {
                    'id': 'j5yGuxZ8lLU',
                    'ext': 'mp4',
                    'title': 'Terraria 1.2 Live Stream | Let\'s Play - Part 04 (Chris)',
                    'description': 'md5:563ccbc698b39298481ca3c571169519',
                    'duration': 10120,
                    'channel_follower_count': int,
                    'channel_url': 'https://www.youtube.com/channel/UCN2XePorRokPB9TEgRZpddg',
                    'availability': 'public',
                    'playable_in_embed': True,
                    'upload_date': '20131105',
                    'categories': ['Gaming'],
                    'live_status': 'was_live',
                    'tags': 'count:24',
                    'release_timestamp': 1383701910,
                    'thumbnail': 'https://i.ytimg.com/vi/j5yGuxZ8lLU/maxresdefault.jpg',
                    'comment_count': int,
                    'age_limit': 0,
                    'like_count': int,
                    'channel_id': 'UCN2XePorRokPB9TEgRZpddg',
                    'channel': 'WiiLikeToPlay',
                    'view_count': int,
                    'release_date': '20131106',
                    'uploader': 'WiiLikeToPlay',
                    'uploader_id': '@WLTP',
                    'uploader_url': 'https://www.youtube.com/@WLTP',
                },
            }, {
                'info_dict': {
                    'id': 'zaPI8MvL8pg',
                    'ext': 'mp4',
                    'title': 'Terraria 1.2 Live Stream | Let\'s Play - Part 04 (Tyson)',
                    'availability': 'public',
                    'channel_url': 'https://www.youtube.com/channel/UCN2XePorRokPB9TEgRZpddg',
                    'channel': 'WiiLikeToPlay',
                    'channel_follower_count': int,
                    'description': 'md5:563ccbc698b39298481ca3c571169519',
                    'duration': 10108,
                    'age_limit': 0,
                    'like_count': int,
                    'tags': 'count:24',
                    'channel_id': 'UCN2XePorRokPB9TEgRZpddg',
                    'release_timestamp': 1383701915,
                    'comment_count': int,
                    'upload_date': '20131105',
                    'thumbnail': 'https://i.ytimg.com/vi/zaPI8MvL8pg/maxresdefault.jpg',
                    'release_date': '20131106',
                    'playable_in_embed': True,
                    'live_status': 'was_live',
                    'categories': ['Gaming'],
                    'view_count': int,
                    'uploader': 'WiiLikeToPlay',
                    'uploader_id': '@WLTP',
                    'uploader_url': 'https://www.youtube.com/@WLTP',
                },
            }, {
                'info_dict': {
                    'id': 'R7r3vfO7Hao',
                    'ext': 'mp4',
                    'title': 'Terraria 1.2 Live Stream | Let\'s Play - Part 04 (Spencer)',
                    'thumbnail': 'https://i.ytimg.com/vi/R7r3vfO7Hao/maxresdefault.jpg',
                    'channel_id': 'UCN2XePorRokPB9TEgRZpddg',
                    'like_count': int,
                    'availability': 'public',
                    'playable_in_embed': True,
                    'upload_date': '20131105',
                    'description': 'md5:563ccbc698b39298481ca3c571169519',
                    'channel_follower_count': int,
                    'tags': 'count:24',
                    'release_date': '20131106',
                    'comment_count': int,
                    'channel_url': 'https://www.youtube.com/channel/UCN2XePorRokPB9TEgRZpddg',
                    'channel': 'WiiLikeToPlay',
                    'categories': ['Gaming'],
                    'release_timestamp': 1383701914,
                    'live_status': 'was_live',
                    'age_limit': 0,
                    'duration': 10128,
                    'view_count': int,
                    'uploader': 'WiiLikeToPlay',
                    'uploader_id': '@WLTP',
                    'uploader_url': 'https://www.youtube.com/@WLTP',
                },
            }],
            'params': {'skip_download': True},
            'skip': 'Not multifeed anymore',
        },
        {
            # Multifeed video with comma in title (see https://github.com/ytdl-org/youtube-dl/issues/8536)
            'url': 'https://www.youtube.com/watch?v=gVfLd0zydlo',
            'info_dict': {
                'id': 'gVfLd0zydlo',
                'title': 'DevConf.cz 2016 Day 2 Workshops 1 14:00 - 15:30',
            },
            'playlist_count': 2,
            'skip': 'Not multifeed anymore',
        },
        {
            'url': 'https://vid.plus/FlRa-iH7PGw',
            'only_matching': True,
        },
        {
            'url': 'https://zwearz.com/watch/9lWxNJF-ufM/electra-woman-dyna-girl-official-trailer-grace-helbig.html',
            'only_matching': True,
        },
        {
            # Title with JS-like syntax "};" (see https://github.com/ytdl-org/youtube-dl/issues/7468)
            # Also tests cut-off URL expansion in video description (see
            # https://github.com/ytdl-org/youtube-dl/issues/1892,
            # https://github.com/ytdl-org/youtube-dl/issues/8164)
            'url': 'https://www.youtube.com/watch?v=lsguqyKfVQg',
            'info_dict': {
                'id': 'lsguqyKfVQg',
                'ext': 'mp4',
                'title': '{dark walk}; Loki/AC/Dishonored; collab w/Elflover21',
                'alt_title': 'Dark Walk',
                'description': 'md5:8085699c11dc3f597ce0410b0dcbb34a',
                'duration': 133,
                'upload_date': '20151119',
                'creator': 'Todd Haberman;\nDaniel Law Heath and Aaron Kaplan',
                'track': 'Dark Walk',
                'artist': 'Todd Haberman;\nDaniel Law Heath and Aaron Kaplan',
                'album': 'Position Music - Production Music Vol. 143 - Dark Walk',
                'thumbnail': 'https://i.ytimg.com/vi_webp/lsguqyKfVQg/maxresdefault.webp',
                'categories': ['Film & Animation'],
                'view_count': int,
                'live_status': 'not_live',
                'channel_url': 'https://www.youtube.com/channel/UCTSRgz5jylBvFt_S7wnsqLQ',
                'channel_id': 'UCTSRgz5jylBvFt_S7wnsqLQ',
                'tags': 'count:13',
                'availability': 'public',
                'channel': 'IronSoulElf',
                'playable_in_embed': True,
                'like_count': int,
                'age_limit': 0,
                'channel_follower_count': int,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # Tags with '};' (see https://github.com/ytdl-org/youtube-dl/issues/7468)
            'url': 'https://www.youtube.com/watch?v=Ms7iBXnlUO8',
            'only_matching': True,
        },
        {
            # Video with yt:stretch=17:0
            'url': 'https://www.youtube.com/watch?v=Q39EVAstoRM',
            'info_dict': {
                'id': 'Q39EVAstoRM',
                'ext': 'mp4',
                'title': 'Clash Of Clans#14 Dicas De Ataque Para CV 4',
                'description': 'md5:ee18a25c350637c8faff806845bddee9',
                'upload_date': '20151107',
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'This video does not exist.',
        },
        {
            # Video with incomplete 'yt:stretch=16:'
            'url': 'https://www.youtube.com/watch?v=FRhJzUSJbGI',
            'only_matching': True,
        },
        {
            # Video licensed under Creative Commons
            'url': 'https://www.youtube.com/watch?v=M4gD1WSo5mA',
            'info_dict': {
                'id': 'M4gD1WSo5mA',
                'ext': 'mp4',
                'title': 'md5:e41008789470fc2533a3252216f1c1d1',
                'description': 'md5:a677553cf0840649b731a3024aeff4cc',
                'duration': 721,
                'upload_date': '20150128',
                'license': 'Creative Commons Attribution license (reuse allowed)',
                'channel_id': 'UCuLGmD72gJDBwmLw06X58SA',
                'channel_url': 'https://www.youtube.com/channel/UCuLGmD72gJDBwmLw06X58SA',
                'like_count': int,
                'age_limit': 0,
                'tags': ['Copyright (Legal Subject)', 'Law (Industry)', 'William W. Fisher (Author)'],
                'channel': 'The Berkman Klein Center for Internet & Society',
                'availability': 'public',
                'view_count': int,
                'categories': ['Education'],
                'thumbnail': 'https://i.ytimg.com/vi_webp/M4gD1WSo5mA/maxresdefault.webp',
                'live_status': 'not_live',
                'playable_in_embed': True,
                'channel_follower_count': int,
                'chapters': list,
                'uploader': 'The Berkman Klein Center for Internet & Society',
                'uploader_id': '@BKCHarvard',
                'uploader_url': 'https://www.youtube.com/@BKCHarvard',
                'timestamp': 1422422076,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            'url': 'https://www.youtube.com/watch?v=eQcmzGIKrzg',
            'info_dict': {
                'id': 'eQcmzGIKrzg',
                'ext': 'mp4',
                'title': 'Democratic Socialism and Foreign Policy | Bernie Sanders',
                'description': 'md5:13a2503d7b5904ef4b223aa101628f39',
                'duration': 4060,
                'upload_date': '20151120',
                'license': 'Creative Commons Attribution license (reuse allowed)',
                'playable_in_embed': True,
                'tags': 'count:12',
                'like_count': int,
                'channel_id': 'UCH1dpzjCEiGAt8CXkryhkZg',
                'age_limit': 0,
                'availability': 'public',
                'categories': ['News & Politics'],
                'channel': 'Bernie Sanders',
                'thumbnail': 'https://i.ytimg.com/vi_webp/eQcmzGIKrzg/maxresdefault.webp',
                'view_count': int,
                'live_status': 'not_live',
                'channel_url': 'https://www.youtube.com/channel/UCH1dpzjCEiGAt8CXkryhkZg',
                'comment_count': int,
                'channel_follower_count': int,
                'chapters': list,
                'uploader': 'Bernie Sanders',
                'uploader_url': 'https://www.youtube.com/@BernieSanders',
                'uploader_id': '@BernieSanders',
                'channel_is_verified': True,
                'heatmap': 'count:100',
                'timestamp': 1447987198,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            'url': 'https://www.youtube.com/watch?feature=player_embedded&amp;amp;v=V36LpHqtcDY',
            'only_matching': True,
        },
        {
            # YouTube Red paid video (https://github.com/ytdl-org/youtube-dl/issues/10059)
            'url': 'https://www.youtube.com/watch?v=i1Ko8UG-Tdo',
            'only_matching': True,
        },
        {
            # Rental video preview
            'url': 'https://www.youtube.com/watch?v=yYr8q0y5Jfg',
            'info_dict': {
                'id': 'uGpuVWrhIzE',
                'ext': 'mp4',
                'title': 'Piku - Trailer',
                'description': 'md5:c36bd60c3fd6f1954086c083c72092eb',
                'upload_date': '20150811',
                'license': 'Standard YouTube License',
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'This video is not available.',
        },
        {
            # YouTube Red video with episode data
            'url': 'https://www.youtube.com/watch?v=iqKdEhx-dD4',
            'info_dict': {
                'id': 'iqKdEhx-dD4',
                'ext': 'mp4',
                'title': 'Isolation - Mind Field (Ep 1)',
                'description': 'md5:f540112edec5d09fc8cc752d3d4ba3cd',
                'duration': 2085,
                'upload_date': '20170118',
                'series': 'Mind Field',
                'season_number': 1,
                'episode_number': 1,
                'thumbnail': 'https://i.ytimg.com/vi_webp/iqKdEhx-dD4/maxresdefault.webp',
                'tags': 'count:12',
                'view_count': int,
                'availability': 'public',
                'age_limit': 0,
                'channel': 'Vsauce',
                'episode': 'Episode 1',
                'categories': ['Entertainment'],
                'season': 'Season 1',
                'channel_id': 'UC6nSFpj9HTCZ5t-N3Rm3-HA',
                'channel_url': 'https://www.youtube.com/channel/UC6nSFpj9HTCZ5t-N3Rm3-HA',
                'like_count': int,
                'playable_in_embed': True,
                'live_status': 'not_live',
                'channel_follower_count': int,
                'uploader': 'Vsauce',
                'uploader_url': 'https://www.youtube.com/@Vsauce',
                'uploader_id': '@Vsauce',
                'comment_count': int,
                'channel_is_verified': True,
                'timestamp': 1484761047,
            },
            'params': {
                'skip_download': True,
            },
            'expected_warnings': [
                'Skipping DASH manifest',
            ],
        },
        {
            # The following content has been identified by the YouTube community
            # as inappropriate or offensive to some audiences.
            'url': 'https://www.youtube.com/watch?v=6SJNVb0GnPI',
            'info_dict': {
                'id': '6SJNVb0GnPI',
                'ext': 'mp4',
                'title': 'Race Differences in Intelligence',
                'description': 'md5:5d161533167390427a1f8ee89a1fc6f1',
                'duration': 965,
                'upload_date': '20140124',
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'This video has been removed for violating YouTube\'s policy on hate speech.',
        },
        {
            # itag 212
            'url': '1t24XAntNCY',
            'only_matching': True,
        },
        {
            # geo restricted to JP
            'url': 'sJL6WA-aGkQ',
            'only_matching': True,
        },
        {
            'url': 'https://invidio.us/watch?v=BaW_jenozKc',
            'only_matching': True,
        },
        {
            'url': 'https://redirect.invidious.io/watch?v=BaW_jenozKc',
            'only_matching': True,
        },
        {
            # from https://nitter.pussthecat.org/YouTube/status/1360363141947944964#m
            'url': 'https://redirect.invidious.io/Yh0AhrY9GjA',
            'only_matching': True,
        },
        {
            # DRM protected
            'url': 'https://www.youtube.com/watch?v=s7_qI6_mIXc',
            'only_matching': True,
        },
        {
            # Video with unsupported adaptive stream type formats
            'url': 'https://www.youtube.com/watch?v=Z4Vy8R84T1U',
            'info_dict': {
                'id': 'Z4Vy8R84T1U',
                'ext': 'mp4',
                'title': 'saman SMAN 53 Jakarta(Sancety) opening COFFEE4th at SMAN 53 Jakarta',
                'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
                'duration': 433,
                'upload_date': '20130923',
                'formats': 'maxcount:10',
            },
            'params': {
                'skip_download': True,
                'youtube_include_dash_manifest': False,
            },
            'skip': 'not actual anymore',
        },
        {
            # YouTube Music auto-generated description
            # TODO: fix metadata extraction
            'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
            'info_dict': {
                'id': 'MgNrAu2pzNs',
                'ext': 'mp4',
                'title': 'Voyeur Girl',
                'description': 'md5:7ae382a65843d6df2685993e90a8628f',
                'upload_date': '20190312',
                'artists': ['Stephen'],
                'creators': ['Stephen'],
                'track': 'Voyeur Girl',
                'album': 'it\'s too much love to know my dear',
                'release_date': '20190313',
                'alt_title': 'Voyeur Girl',
                'view_count': int,
                'playable_in_embed': True,
                'like_count': int,
                'categories': ['Music'],
                'channel_url': 'https://www.youtube.com/channel/UC-pWHpBjdGG69N9mM2auIAA',
                'channel': 'Stephen',  # TODO: should be "Stephen - Topic"
                'uploader': 'Stephen',
                'availability': 'public',
                'duration': 169,
                'thumbnail': 'https://i.ytimg.com/vi_webp/MgNrAu2pzNs/maxresdefault.webp',
                'age_limit': 0,
                'channel_id': 'UC-pWHpBjdGG69N9mM2auIAA',
                'tags': 'count:11',
                'live_status': 'not_live',
                'channel_follower_count': int,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            'url': 'https://www.youtubekids.com/watch?v=3b8nCWDgZ6Q',
            'only_matching': True,
        },
        {
            # invalid -> valid video id redirection
            'url': 'DJztXj2GPfl',
            'info_dict': {
                'id': 'DJztXj2GPfk',
                'ext': 'mp4',
                'title': 'Panjabi MC - Mundian To Bach Ke (The Dictator Soundtrack)',
                'description': 'md5:bf577a41da97918e94fa9798d9228825',
                'upload_date': '20090125',
                'artist': 'Panjabi MC',
                'track': 'Beware of the Boys (Mundian to Bach Ke) - Motivo Hi-Lectro Remix',
                'album': 'Beware of the Boys (Mundian To Bach Ke)',
            },
            'params': {
                'skip_download': True,
            },
            'skip': 'Video unavailable',
        },
        {
            # empty description results in an empty string
            'url': 'https://www.youtube.com/watch?v=x41yOUIvK2k',
            'info_dict': {
                'id': 'x41yOUIvK2k',
                'ext': 'mp4',
                'title': 'IMG 3456',
                'description': '',
                'upload_date': '20170613',
                'view_count': int,
                'thumbnail': 'https://i.ytimg.com/vi_webp/x41yOUIvK2k/maxresdefault.webp',
                'like_count': int,
                'channel_id': 'UCo03ZQPBW5U4UC3regpt1nw',
                'tags': [],
                'channel_url': 'https://www.youtube.com/channel/UCo03ZQPBW5U4UC3regpt1nw',
                'availability': 'public',
                'age_limit': 0,
                'categories': ['Pets & Animals'],
                'duration': 7,
                'playable_in_embed': True,
                'live_status': 'not_live',
                'channel': 'l\'Or Vert asbl',
                'channel_follower_count': int,
                'uploader': 'l\'Or Vert asbl',
                'uploader_url': 'https://www.youtube.com/@ElevageOrVert',
                'uploader_id': '@ElevageOrVert',
                'timestamp': 1497343210,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # with '};' inside yt initial data (see [1])
            # see [2] for an example with '};' inside ytInitialPlayerResponse
            # 1. https://github.com/ytdl-org/youtube-dl/issues/27093
            # 2. https://github.com/ytdl-org/youtube-dl/issues/27216
            'url': 'https://www.youtube.com/watch?v=CHqg6qOn4no',
            'info_dict': {
                'id': 'CHqg6qOn4no',
                'ext': 'mp4',
                'title': 'Part 77   Sort a list of simple types in c#',
                'description': 'md5:b8746fa52e10cdbf47997903f13b20dc',
                'upload_date': '20130831',
                'channel_id': 'UCCTVrRB5KpIiK6V2GGVsR1Q',
                'like_count': int,
                'channel_url': 'https://www.youtube.com/channel/UCCTVrRB5KpIiK6V2GGVsR1Q',
                'live_status': 'not_live',
                'categories': ['Education'],
                'availability': 'public',
                'thumbnail': 'https://i.ytimg.com/vi/CHqg6qOn4no/sddefault.jpg',
                'tags': 'count:12',
                'playable_in_embed': True,
                'age_limit': 0,
                'view_count': int,
                'duration': 522,
                'channel': 'kudvenkat',
                'comment_count': int,
                'channel_follower_count': int,
                'chapters': list,
                'uploader': 'kudvenkat',
                'uploader_url': 'https://www.youtube.com/@Csharp-video-tutorialsBlogspot',
                'uploader_id': '@Csharp-video-tutorialsBlogspot',
                'channel_is_verified': True,
                'heatmap': 'count:100',
                'timestamp': 1377976349,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # another example of '};' in ytInitialData
            'url': 'https://www.youtube.com/watch?v=gVfgbahppCY',
            'only_matching': True,
        },
        {
            'url': 'https://www.youtube.com/watch_popup?v=63RmMXCd_bQ',
            'only_matching': True,
        },
        {
            # https://github.com/ytdl-org/youtube-dl/pull/28094
            'url': 'OtqTfy26tG0',
            'info_dict': {
                'id': 'OtqTfy26tG0',
                'ext': 'mp4',
                'title': 'Burn Out',
                'description': 'md5:8d07b84dcbcbfb34bc12a56d968b6131',
                'upload_date': '20141120',
                'artist': 'The Cinematic Orchestra',
                'track': 'Burn Out',
                'album': 'Every Day',
                'like_count': int,
                'live_status': 'not_live',
                'alt_title': 'Burn Out',
                'duration': 614,
                'age_limit': 0,
                'view_count': int,
                'channel_url': 'https://www.youtube.com/channel/UCIzsJBIyo8hhpFm1NK0uLgw',
                'creator': 'The Cinematic Orchestra',
                'channel': 'The Cinematic Orchestra',
                'tags': ['The Cinematic Orchestra', 'Every Day', 'Burn Out'],
                'channel_id': 'UCIzsJBIyo8hhpFm1NK0uLgw',
                'availability': 'public',
                'thumbnail': 'https://i.ytimg.com/vi/OtqTfy26tG0/maxresdefault.jpg',
                'categories': ['Music'],
                'playable_in_embed': True,
                'channel_follower_count': int,
                'uploader': 'The Cinematic Orchestra',
                'comment_count': int,
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            # controversial video, only works with bpctr when authenticated with cookies
            'url': 'https://www.youtube.com/watch?v=nGC3D_FkCmg',
            'only_matching': True,
        },
        {
            # controversial video, requires bpctr/contentCheckOk
            'url': 'https://www.youtube.com/watch?v=SZJvDhaSDnc',
            'info_dict': {
                'id': 'SZJvDhaSDnc',
                'ext': 'mp4',
                'title': 'San Diego teen commits suicide after bullying over embarrassing video',
                'channel_id': 'UC-SJ6nODDmufqBzPBwCvYvQ',
                'upload_date': '20140716',
                'description': 'md5:acde3a73d3f133fc97e837a9f76b53b7',
                'duration': 170,
                'categories': ['News & Politics'],
                'view_count': int,
                'channel': 'CBS Mornings',
                'tags': ['suicide', 'bullying', 'video', 'cbs', 'news'],
                'thumbnail': 'https://i.ytimg.com/vi/SZJvDhaSDnc/hqdefault.jpg',
                'age_limit': 18,
                'availability': 'needs_auth',
                'channel_url': 'https://www.youtube.com/channel/UC-SJ6nODDmufqBzPBwCvYvQ',
                'like_count': int,
                'live_status': 'not_live',
                'playable_in_embed': True,
                'channel_follower_count': int,
                'uploader': 'CBS Mornings',
                'uploader_url': 'https://www.youtube.com/@CBSMornings',
                'uploader_id': '@CBSMornings',
                'comment_count': int,
                'channel_is_verified': True,
                'timestamp': 1405513526,
            },
            'skip': 'Age-restricted; requires authentication',
        },
        {
            # restricted location, https://github.com/ytdl-org/youtube-dl/issues/28685
            'url': 'cBvYw8_A0vQ',
            'info_dict': {
                'id': 'cBvYw8_A0vQ',
                'ext': 'mp4',
                'title': '4K Ueno Okachimachi  Street  Scenes  上野御徒町歩き',
                'description': 'md5:ea770e474b7cd6722b4c95b833c03630',
                'upload_date': '20201120',
                'duration': 1456,
                'categories': ['Travel & Events'],
                'channel_id': 'UC3o_t8PzBmXf5S9b7GLx1Mw',
                'view_count': int,
                'channel': 'Walk around Japan',
                'tags': ['Ueno Tokyo', 'Okachimachi Tokyo', 'Ameyoko Street', 'Tokyo attraction', 'Travel in Tokyo'],
                'thumbnail': 'https://i.ytimg.com/vi/cBvYw8_A0vQ/hqdefault.jpg',
                'age_limit': 0,
                'availability': 'public',
                'channel_url': 'https://www.youtube.com/channel/UC3o_t8PzBmXf5S9b7GLx1Mw',
                'live_status': 'not_live',
                'playable_in_embed': True,
                'channel_follower_count': int,
                'uploader': 'Walk around Japan',
                'uploader_url': 'https://www.youtube.com/@walkaroundjapan7124',
                'uploader_id': '@walkaroundjapan7124',
                'timestamp': 1605884416,
            },
            'params': {
                'skip_download': True,
            },
        }, {
            # Has multiple audio streams
            'url': 'WaOKSUlf4TM',
            'only_matching': True,
        }, {
            # Requires Premium: has format 141 when requested using a YouTube Music URL
            'url': 'https://music.youtube.com/watch?v=XclachpHxis',
            'only_matching': True,
        }, {
            # multiple subtitles with same lang_code
            'url': 'https://www.youtube.com/watch?v=wsQiKKfKxug',
            'only_matching': True,
        }, {
            # Force use of the android client fallback
            'url': 'https://www.youtube.com/watch?v=YOelRv7fMxY',
            'info_dict': {
                'id': 'YOelRv7fMxY',
                'title': 'DIGGING A SECRET TUNNEL Part 1',
                'ext': '3gp',
                'upload_date': '20210624',
                'channel_id': 'UCp68_FLety0O-n9QU6phsgw',
                'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCp68_FLety0O-n9QU6phsgw',
                'description': 'md5:5d5991195d599b56cd0c4148907eec50',
                'duration': 596,
                'categories': ['Entertainment'],
                'view_count': int,
                'channel': 'colinfurze',
                'tags': ['Colin', 'furze', 'Terry', 'tunnel', 'underground', 'bunker'],
                'thumbnail': 'https://i.ytimg.com/vi/YOelRv7fMxY/maxresdefault.jpg',
                'age_limit': 0,
                'availability': 'public',
                'like_count': int,
                'live_status': 'not_live',
                'playable_in_embed': True,
                'channel_follower_count': int,
                'chapters': list,
                'uploader': 'colinfurze',
                'uploader_url': 'https://www.youtube.com/@colinfurze',
                'uploader_id': '@colinfurze',
                'comment_count': int,
                'channel_is_verified': True,
                'heatmap': 'count:100',
            },
            'params': {
                'format': '17',  # 3gp format available on android
                'extractor_args': {'youtube': {'player_client': ['android']}},
            },
            'skip': 'android client broken',
        },
        {
            # Skip download of additional client configs (remix client config in this case)
            'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
            'only_matching': True,
            'params': {
                'extractor_args': {'youtube': {'player_skip': ['configs']}},
            },
        }, {
            # shorts
            'url': 'https://www.youtube.com/shorts/BGQWPY4IigY',
            'only_matching': True,
        }, {
            'note': 'Storyboards',
            'url': 'https://www.youtube.com/watch?v=5KLPxDtMqe8',
            'info_dict': {
                'id': '5KLPxDtMqe8',
                'ext': 'mhtml',
                'format_id': 'sb0',
                'title': 'Your Brain is Plastic',
                'description': 'md5:89cd86034bdb5466cd87c6ba206cd2bc',
                'upload_date': '20140324',
                'like_count': int,
                'channel_id': 'UCZYTClx2T1of7BRZ86-8fow',
                'channel_url': 'https://www.youtube.com/channel/UCZYTClx2T1of7BRZ86-8fow',
                'view_count': int,
                'thumbnail': 'https://i.ytimg.com/vi/5KLPxDtMqe8/maxresdefault.jpg',
                'playable_in_embed': True,
                'tags': 'count:12',
                'availability': 'public',
                'channel': 'SciShow',
                'live_status': 'not_live',
                'duration': 248,
                'categories': ['Education'],
                'age_limit': 0,
                'channel_follower_count': int,
                'chapters': list,
                'uploader': 'SciShow',
                'uploader_url': 'https://www.youtube.com/@SciShow',
                'uploader_id': '@SciShow',
                'comment_count': int,
                'channel_is_verified': True,
                'heatmap': 'count:100',
                'timestamp': 1395685455,
            }, 'params': {'format': 'mhtml', 'skip_download': True},
        }, {
            # Ensure video upload_date is in UTC timezone (video was uploaded 1641170939)
            'url': 'https://www.youtube.com/watch?v=2NUZ8W2llS4',
            'info_dict': {
                'id': '2NUZ8W2llS4',
                'ext': 'mp4',
                'title': 'The NP that test your phone performance 🙂',
                'description': 'md5:144494b24d4f9dfacb97c1bbef5de84d',
                'channel_id': 'UCRqNBSOHgilHfAczlUmlWHA',
                'channel_url': 'https://www.youtube.com/channel/UCRqNBSOHgilHfAczlUmlWHA',
                'duration': 21,
                'view_count': int,
                'age_limit': 0,
                'categories': ['Gaming'],
                'tags': 'count:23',
                'playable_in_embed': True,
                'live_status': 'not_live',
                'upload_date': '20220103',
                'like_count': int,
                'availability': 'public',
                'channel': 'Leon Nguyen',
                'thumbnail': 'https://i.ytimg.com/vi_webp/2NUZ8W2llS4/maxresdefault.webp',
                'comment_count': int,
                'channel_follower_count': int,
                'uploader': 'Leon Nguyen',
                'uploader_url': 'https://www.youtube.com/@LeonNguyen',
                'uploader_id': '@LeonNguyen',
                'heatmap': 'count:100',
                'timestamp': 1641170939,
            },
        }, {
            # date text is premiered video, ensure upload date in UTC (published 1641172509)
            'url': 'https://www.youtube.com/watch?v=mzZzzBU6lrM',
            'info_dict': {
                'id': 'mzZzzBU6lrM',
                'ext': 'mp4',
                'title': 'I Met GeorgeNotFound In Real Life...',
                'description': 'md5:978296ec9783a031738b684d4ebf302d',
                'channel_id': 'UC_8NknAFiyhOUaZqHR3lq3Q',
                'channel_url': 'https://www.youtube.com/channel/UC_8NknAFiyhOUaZqHR3lq3Q',
                'duration': 955,
                'view_count': int,
                'age_limit': 0,
                'categories': ['Entertainment'],
                'tags': 'count:26',
                'playable_in_embed': True,
                'live_status': 'not_live',
                'release_timestamp': 1641172509,
                'release_date': '20220103',
                'upload_date': '20220103',
                'like_count': int,
                'availability': 'public',
                'channel': 'Quackity',
                'thumbnail': 'https://i.ytimg.com/vi/mzZzzBU6lrM/maxresdefault.jpg',
                'channel_follower_count': int,
                'uploader': 'Quackity',
                'uploader_id': '@Quackity',
                'uploader_url': 'https://www.youtube.com/@Quackity',
                'comment_count': int,
                'channel_is_verified': True,
                'heatmap': 'count:100',
                'timestamp': 1641172509,
            },
        },
        {   # continuous livestream.
            # Upload date was 2022-07-12T05:12:29-07:00, while stream start is 2022-07-12T15:59:30+00:00
            'url': 'https://www.youtube.com/watch?v=jfKfPfyJRdk',
            'info_dict': {
                'id': 'jfKfPfyJRdk',
                'ext': 'mp4',
                'channel_id': 'UCSJ4gkVC6NrvII8umztf0Ow',
                'like_count': int,
                'uploader': 'Lofi Girl',
                'categories': ['Music'],
                'concurrent_view_count': int,
                'playable_in_embed': True,
                'timestamp': 1657627949,
                'release_date': '20220712',
                'channel_url': 'https://www.youtube.com/channel/UCSJ4gkVC6NrvII8umztf0Ow',
                'description': 'md5:452d5c82f72bb7e62a4e0297c3f01c23',
                'age_limit': 0,
                'thumbnail': 'https://i.ytimg.com/vi/jfKfPfyJRdk/maxresdefault.jpg',
                'release_timestamp': 1657641570,
                'uploader_url': 'https://www.youtube.com/@LofiGirl',
                'channel_follower_count': int,
                'channel_is_verified': True,
                'title': r're:^lofi hip hop radio 📚 beats to relax/study to',
                'view_count': int,
                'live_status': 'is_live',
                'media_type': 'livestream',
                'tags': 'count:32',
                'channel': 'Lofi Girl',
                'availability': 'public',
                'upload_date': '20220712',
                'uploader_id': '@LofiGirl',
            },
            'params': {'skip_download': True},
        }, {
            'url': 'https://www.youtube.com/watch?v=tjjjtzRLHvA',
            'info_dict': {
                'id': 'tjjjtzRLHvA',
                'ext': 'mp4',
                'title': 'ハッシュタグ無し };if window.ytcsi',
                'upload_date': '20220323',
                'like_count': int,
                'availability': 'unlisted',
                'channel': 'Lesmiscore',
                'thumbnail': r're:^https?://.*\.jpg',
                'age_limit': 0,
                'categories': ['Music'],
                'view_count': int,
                'description': '',
                'channel_url': 'https://www.youtube.com/channel/UCdqltm_7iv1Vs6kp6Syke5A',
                'channel_id': 'UCdqltm_7iv1Vs6kp6Syke5A',
                'live_status': 'not_live',
                'playable_in_embed': True,
                'channel_follower_count': int,
                'duration': 6,
                'tags': [],
                'uploader_id': '@lesmiscore',
                'uploader': 'Lesmiscore',
                'uploader_url': 'https://www.youtube.com/@lesmiscore',
                'timestamp': 1648005313,
            },
        }, {
            # Prefer primary title+description language metadata by default
            # Do not prefer translated description if primary is empty
            'url': 'https://www.youtube.com/watch?v=el3E4MbxRqQ',
            'info_dict': {
                'id': 'el3E4MbxRqQ',
                'ext': 'mp4',
                'title': 'dlp test video 2 - primary sv no desc',
                'description': '',
                'channel': 'cole-dlp-test-acc',
                'tags': [],
                'view_count': int,
                'channel_url': 'https://www.youtube.com/channel/UCiu-3thuViMebBjw_5nWYrA',
                'like_count': int,
                'playable_in_embed': True,
                'availability': 'unlisted',
                'thumbnail': r're:^https?://.*\.jpg',
                'age_limit': 0,
                'duration': 5,
                'live_status': 'not_live',
                'upload_date': '20220908',
                'categories': ['People & Blogs'],
                'channel_id': 'UCiu-3thuViMebBjw_5nWYrA',
                'uploader_url': 'https://www.youtube.com/@coletdjnz',
                'uploader_id': '@coletdjnz',
                'uploader': 'cole-dlp-test-acc',
                'timestamp': 1662677394,
            },
            'params': {'skip_download': True},
        }, {
            # Extractor argument: prefer translated title+description
            'url': 'https://www.youtube.com/watch?v=gHKT4uU8Zng',
            'info_dict': {
                'id': 'gHKT4uU8Zng',
                'ext': 'mp4',
                'channel': 'cole-dlp-test-acc',
                'tags': [],
                'duration': 5,
                'live_status': 'not_live',
                'channel_id': 'UCiu-3thuViMebBjw_5nWYrA',
                'upload_date': '20220729',
                'view_count': int,
                'categories': ['People & Blogs'],
                'thumbnail': r're:^https?://.*\.jpg',
                'title': 'dlp test video title translated (fr)',
                'availability': 'public',
                'age_limit': 0,
                'description': 'dlp test video description translated (fr)',
                'playable_in_embed': True,
                'channel_url': 'https://www.youtube.com/channel/UCiu-3thuViMebBjw_5nWYrA',
                'uploader_url': 'https://www.youtube.com/@coletdjnz',
                'uploader_id': '@coletdjnz',
                'uploader': 'cole-dlp-test-acc',
                'timestamp': 1659073275,
                'like_count': int,
            },
            'params': {'skip_download': True, 'extractor_args': {'youtube': {'lang': ['fr']}}},
            'expected_warnings': [r'Preferring "fr" translated fields'],
        }, {
            'note': '6 channel audio',
            'url': 'https://www.youtube.com/watch?v=zgdo7-RRjgo',
            'only_matching': True,
        }, {
            'note': 'Multiple HLS formats with same itag',
            'url': 'https://www.youtube.com/watch?v=kX3nB4PpJko',
            'info_dict': {
                'id': 'kX3nB4PpJko',
                'ext': 'mp4',
                'categories': ['Entertainment'],
                'description': 'md5:e8031ff6e426cdb6a77670c9b81f6fa6',
                'live_status': 'not_live',
                'duration': 937,
                'channel_follower_count': int,
                'thumbnail': 'https://i.ytimg.com/vi_webp/kX3nB4PpJko/maxresdefault.webp',
                'title': 'Last To Take Hand Off Jet, Keeps It!',
                'channel': 'MrBeast',
                'playable_in_embed': True,
                'view_count': int,
                'upload_date': '20221112',
                'channel_url': 'https://www.youtube.com/channel/UCX6OQ3DkcsbYNE6H8uQQuVA',
                'age_limit': 0,
                'availability': 'public',
                'channel_id': 'UCX6OQ3DkcsbYNE6H8uQQuVA',
                'like_count': int,
                'tags': [],
                'uploader': 'MrBeast',
                'uploader_url': 'https://www.youtube.com/@MrBeast',
                'uploader_id': '@MrBeast',
                'comment_count': int,
                'channel_is_verified': True,
                'heatmap': 'count:100',
            },
            'params': {'extractor_args': {'youtube': {'player_client': ['ios']}}, 'format': '233-1'},
        }, {
            'note': 'Audio formats with Dynamic Range Compression',
            'url': 'https://www.youtube.com/watch?v=Tq92D6wQ1mg',
            'info_dict': {
                'id': 'Tq92D6wQ1mg',
                'ext': 'webm',
                'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
                'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
                'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
                'channel_follower_count': int,
                'description': 'md5:17eccca93a786d51bc67646756894066',
                'upload_date': '20191228',
                'tags': ['mmd', 'dance', 'mikumikudance', 'kpop', 'vtuber'],
                'playable_in_embed': True,
                'like_count': int,
                'categories': ['Entertainment'],
                'thumbnail': 'https://i.ytimg.com/vi/Tq92D6wQ1mg/sddefault.jpg',
                'age_limit': 18,
                'channel': 'Projekt Melody',
                'view_count': int,
                'availability': 'needs_auth',
                'comment_count': int,
                'live_status': 'not_live',
                'duration': 106,
                'uploader': 'Projekt Melody',
                'uploader_id': '@ProjektMelody',
                'uploader_url': 'https://www.youtube.com/@ProjektMelody',
                'timestamp': 1577508724,
            },
            'params': {'extractor_args': {'youtube': {'player_client': ['tv_embedded']}}, 'format': '251-drc'},
            'skip': 'Age-restricted; requires authentication',
        },
        {
            'note': 'Support /live/ URL + media type for post-live content',
            'url': 'https://www.youtube.com/live/qVv6vCqciTM',
            'info_dict': {
                'id': 'qVv6vCqciTM',
                'ext': 'mp4',
                'age_limit': 0,
                'comment_count': int,
                'chapters': 'count:13',
                'upload_date': '20221223',
                'thumbnail': 'https://i.ytimg.com/vi/qVv6vCqciTM/maxresdefault.jpg',
                'channel_url': 'https://www.youtube.com/channel/UCIdEIHpS0TdkqRkHL5OkLtA',
                'like_count': int,
                'release_date': '20221223',
                'tags': ['Vtuber', '月ノ美兎', '名取さな', 'にじさんじ', 'クリスマス', '3D配信'],
                'title': '【 #インターネット女クリスマス 】3Dで歌ってはしゃぐインターネットの女たち【月ノ美兎/名取さな】',
                'view_count': int,
                'playable_in_embed': True,
                'duration': 4438,
                'availability': 'public',
                'channel_follower_count': int,
                'channel_id': 'UCIdEIHpS0TdkqRkHL5OkLtA',
                'categories': ['Entertainment'],
                'live_status': 'was_live',
                'media_type': 'livestream',
                'release_timestamp': 1671793345,
                'channel': 'さなちゃんねる',
                'description': 'md5:6aebf95cc4a1d731aebc01ad6cc9806d',
                'uploader': 'さなちゃんねる',
                'uploader_url': 'https://www.youtube.com/@sana_natori',
                'uploader_id': '@sana_natori',
                'channel_is_verified': True,
                'heatmap': 'count:100',
                'timestamp': 1671798112,
            },
        },
        {
            # Fallbacks when webpage and web client is unavailable
            'url': 'https://www.youtube.com/watch?v=wSSmNUl9Snw',
            'info_dict': {
                'id': 'wSSmNUl9Snw',
                'ext': 'mp4',
                # 'categories': ['Science & Technology'],
                'view_count': int,
                'chapters': 'count:2',
                'channel': 'Scott Manley',
                'like_count': int,
                'age_limit': 0,
                # 'availability': 'public',
                'channel_follower_count': int,
                'live_status': 'not_live',
                'upload_date': '20170831',
                'duration': 682,
                'tags': 'count:8',
                'uploader_url': 'https://www.youtube.com/@scottmanley',
                'description': 'md5:f4bed7b200404b72a394c2f97b782c02',
                'uploader': 'Scott Manley',
                'uploader_id': '@scottmanley',
                'title': 'The Computer Hack That Saved Apollo 14',
                'channel_id': 'UCxzC4EngIsMrPmbm6Nxvb-A',
                'thumbnail': r're:^https?://.*\.webp',
                'channel_url': 'https://www.youtube.com/channel/UCxzC4EngIsMrPmbm6Nxvb-A',
                'playable_in_embed': True,
                'comment_count': int,
                'channel_is_verified': True,
                'heatmap': 'count:100',
            },
            'params': {
                'extractor_args': {'youtube': {'player_client': ['ios'], 'player_skip': ['webpage']}},
            },
        },
        {
            # uploader_id has non-ASCII characters that are percent-encoded in YT's JSON
            'url': 'https://www.youtube.com/shorts/18NGQq7p3LY',
            'info_dict': {
                'id': '18NGQq7p3LY',
                'ext': 'mp4',
                'title': '아이브 이서 장원영 리즈 삐끼삐끼 챌린지',
                'description': '',
                'uploader': 'ㅇㅇ',
                'uploader_id': '@으아-v1k',
                'uploader_url': 'https://www.youtube.com/@으아-v1k',
                'channel': 'ㅇㅇ',
                'channel_id': 'UCC25oTm2J7ZVoi5TngOHg9g',
                'channel_url': 'https://www.youtube.com/channel/UCC25oTm2J7ZVoi5TngOHg9g',
                'thumbnail': r're:https?://.+/.+\.jpg',
                'playable_in_embed': True,
                'age_limit': 0,
                'duration': 3,
                'timestamp': 1724306170,
                'upload_date': '20240822',
                'availability': 'public',
                'live_status': 'not_live',
                'view_count': int,
                'like_count': int,
                'channel_follower_count': int,
                'categories': ['People & Blogs'],
                'tags': [],
            },
        },
    ]

    # Test cases whose 'url' is a page on another site that embeds a YouTube video;
    # 'info_dict' holds the metadata expected for the embedded video.
    # NOTE(review): presumably consumed by the shared extractor test harness -- confirm.
    _WEBPAGE_TESTS = [
        # YouTube <object> embed
        {
            'url': 'http://www.improbable.com/2017/04/03/untrained-modern-youths-and-ancient-masters-in-selfie-portraits/',
            # NOTE(review): same digest as the 'description' md5 below -- confirm it is
            # really meant as the file checksum ('skip_download' is set in 'params')
            'md5': '873c81d308b979f0e23ee7e620b312a3',
            'info_dict': {
                'id': 'msN87y-iEx0',
                'ext': 'mp4',
                'title': 'Feynman: Mirrors FUN TO IMAGINE 6',
                'upload_date': '20080526',
                'description': 'md5:873c81d308b979f0e23ee7e620b312a3',
                'age_limit': 0,
                'tags': ['feynman', 'mirror', 'science', 'physics', 'imagination', 'fun', 'cool', 'puzzle'],
                'channel_id': 'UCCeo--lls1vna5YJABWAcVA',
                'playable_in_embed': True,
                'thumbnail': 'https://i.ytimg.com/vi/msN87y-iEx0/hqdefault.jpg',
                'like_count': int,
                'comment_count': int,
                'channel': 'Christopher Sykes',
                'live_status': 'not_live',
                'channel_url': 'https://www.youtube.com/channel/UCCeo--lls1vna5YJABWAcVA',
                'availability': 'public',
                'duration': 195,
                'view_count': int,
                'categories': ['Science & Technology'],
                'channel_follower_count': int,
                'uploader': 'Christopher Sykes',
                'uploader_url': 'https://www.youtube.com/@ChristopherSykesDocumentaries',
                'uploader_id': '@ChristopherSykesDocumentaries',
                'heatmap': 'count:100',
                'timestamp': 1211825920,
            },
            'params': {
                'skip_download': True,
            },
        },
    ]

    @classmethod
    def suitable(cls, url):
        """Return whether this extractor should handle *url*.

        URLs whose query string carries a non-empty ``list`` parameter are
        rejected here; every other URL is decided by the parent class.
        """
        # NOTE(review): this import is function-local even though the module also
        # imports parse_qs at the top; presumably the method has to stay
        # self-contained -- confirm before hoisting it.
        from yt_dlp.utils import parse_qs

        list_values = parse_qs(url).get('list', [None])
        if list_values[0]:
            return False
        return super().suitable(url)

    def __init__(self, *args, **kwargs):
        """Initialise the parent extractor and create empty per-instance caches."""
        super().__init__(*args, **kwargs)
        # _code_cache:   player id -> downloaded player JS (filled by _load_player)
        # _player_cache: cache-id tuple -> memoised value (used by _cached and
        #                _load_nsig_code_from_cache)
        self._code_cache, self._player_cache = {}, {}

    def _prepare_live_from_start_formats(self, formats, video_id, live_start_time, url, webpage_url, smuggled_data, is_live):
        """
        Attach fragment sources to the formats flagged with 'is_from_start'.

        The matching format dicts are modified in place; nothing is returned.
        When is_live is true, 'fragments' is set to a callable that produces the
        fragment generator and 'protocol' to 'http_dash_segments_generator'.
        Otherwise 'fragments' becomes a LazyList over the generator and the
        'is_from_start' key is removed.
        """
        # Serialises manifest refreshes requested through mpd_feed()
        lock = threading.Lock()
        # Time of the last (re)fetch; refetch_manifest() compares against it
        start_time = time.time()
        # Rebinds the local name only; the dicts are the caller's objects
        formats = [f for f in formats if f.get('is_from_start')]

        def refetch_manifest(format_id, delay):
            # Re-download the player responses and re-list the formats, but only
            # once more than `delay` seconds have passed since the last fetch.
            # format_id is accepted but not used here.
            nonlocal formats, start_time, is_live
            if time.time() <= start_time + delay:
                return

            _, _, prs, player_url = self._download_player_responses(url, smuggled_data, video_id, webpage_url)
            video_details = traverse_obj(prs, (..., 'videoDetails'), expected_type=dict)
            microformats = traverse_obj(
                prs, (..., 'microformat', 'playerMicroformatRenderer'),
                expected_type=dict)
            # Replaces the shared `formats` list and live flag seen by mpd_feed()
            _, live_status, _, formats, _ = self._list_formats(video_id, microformats, video_details, prs, player_url)
            is_live = live_status == 'is_live'
            start_time = time.time()

        def mpd_feed(format_id, delay):
            """
            @returns (manifest_url, manifest_stream_number, is_live) or None
            """
            for retry in self.RetryManager(fatal=False):
                with lock:
                    refetch_manifest(format_id, delay)

                # Look the format up in the (possibly refreshed) list
                f = next((f for f in formats if f['format_id'] == format_id), None)
                if not f:
                    # Record why this attempt failed and let the RetryManager decide
                    if not is_live:
                        retry.error = f'{video_id}: Video is no longer live'
                    else:
                        retry.error = f'Cannot find refreshed manifest for format {format_id}{bug_reports_message()}'
                    continue
                return f['manifest_url'], f['manifest_stream_number'], is_live
            return None

        for f in formats:
            f['is_live'] = is_live
            # Last bound argument is False while live, else a copy of the format
            # (received by _live_dash_fragments as manifestless_orig_fmt)
            gen = functools.partial(self._live_dash_fragments, video_id, f['format_id'],
                                    live_start_time, mpd_feed, not is_live and f.copy())
            if is_live:
                # The partial still needs its ctx argument; it is stored uncalled
                f['fragments'] = gen
                f['protocol'] = 'http_dash_segments_generator'
            else:
                # Call with an empty ctx and wrap the generator lazily
                f['fragments'] = LazyList(gen({}))
                del f['is_from_start']

    def _live_dash_fragments(self, video_id, format_id, live_start_time, mpd_feed, manifestless_orig_fmt, ctx):
        FETCH_SPAN, MAX_DURATION = 5, 432000

        mpd_url, stream_number, is_live = None, None, True

        begin_index = 0
        download_start_time = ctx.get('start') or time.time()

        lack_early_segments = download_start_time - (live_start_time or download_start_time) > MAX_DURATION
        if lack_early_segments:
            self.report_warning(bug_reports_message(
                'Starting download from the last 120 hours of the live stream since '
                'YouTube does not have data before that. If you think this is wrong,'), only_once=True)
            lack_early_segments = True

        known_idx, no_fragment_score, last_segment_url = begin_index, 0, None
        fragments, fragment_base_url = None, None

        def _extract_sequence_from_mpd(refresh_sequence, immediate):
            nonlocal mpd_url, stream_number, is_live, no_fragment_score, fragments, fragment_base_url
            # Obtain from MPD's maximum seq value
            old_mpd_url = mpd_url
            last_error = ctx.pop('last_error', None)
            expire_fast = immediate or (last_error and isinstance(last_error, HTTPError) and last_error.status == 403)
            mpd_url, stream_number, is_live = (mpd_feed(format_id, 5 if expire_fast else 18000)
                                               or (mpd_url, stream_number, False))
            if not refresh_sequence:
                if expire_fast and not is_live:
                    return False, last_seq
                elif old_mpd_url == mpd_url:
                    return True, last_seq
            if manifestless_orig_fmt:
                fmt_info = manifestless_orig_fmt
            else:
                try:
                    fmts, _ = self._extract_mpd_formats_and_subtitles(
                        mpd_url, None, note=False, errnote=False, fatal=False)
                except ExtractorError:
                    fmts = None
                if not fmts:
                    no_fragment_score += 2
                    return False, last_seq
                fmt_info = next(x for x in fmts if x['manifest_stream_number'] == stream_number)
            fragments = fmt_info['fragments']
            fragment_base_url = fmt_info['fragment_base_url']
            assert fragment_base_url

            _last_seq = int(re.search(r'(?:/|^)sq/(\d+)', fragments[-1]['path']).group(1))
            return True, _last_seq

        self.write_debug(f'[{video_id}] Generating fragments for format {format_id}')
        while is_live:
            fetch_time = time.time()
            if no_fragment_score > 30:
                return
            if last_segment_url:
                # Obtain from "X-Head-Seqnum" header value from each segment
                try:
                    urlh = self._request_webpage(
                        last_segment_url, None, note=False, errnote=False, fatal=False)
                except ExtractorError:
                    urlh = None
                last_seq = try_get(urlh, lambda x: int_or_none(x.headers['X-Head-Seqnum']))
                if last_seq is None:
                    no_fragment_score += 2
                    last_segment_url = None
                    continue
            else:
                should_continue, last_seq = _extract_sequence_from_mpd(True, no_fragment_score > 15)
                no_fragment_score += 2
                if not should_continue:
                    continue

            if known_idx > last_seq:
                last_segment_url = None
                continue

            last_seq += 1

            if begin_index < 0 and known_idx < 0:
                # skip from the start when it's negative value
                known_idx = last_seq + begin_index
            if lack_early_segments:
                known_idx = max(known_idx, last_seq - int(MAX_DURATION // fragments[-1]['duration']))
            try:
                for idx in range(known_idx, last_seq):
                    # do not update sequence here or you'll get skipped some part of it
                    should_continue, _ = _extract_sequence_from_mpd(False, False)
                    if not should_continue:
                        known_idx = idx - 1
                        raise ExtractorError('breaking out of outer loop')
                    last_segment_url = urljoin(fragment_base_url, f'sq/{idx}')
                    yield {
                        'url': last_segment_url,
                        'fragment_count': last_seq,
                    }
                if known_idx == last_seq:
                    no_fragment_score += 5
                else:
                    no_fragment_score = 0
                known_idx = last_seq
            except ExtractorError:
                continue

            if manifestless_orig_fmt:
                # Stop at the first iteration if running for post-live manifestless;
                # fragment count no longer increase since it starts
                break

            time.sleep(max(0, FETCH_SPAN + fetch_time - time.time()))

    def _extract_player_url(self, *ytcfgs, webpage=None):
        """
        Look up the player JS URL in the given ytcfg dicts.

        Checks 'PLAYER_JS_URL' and then 'WEB_PLAYER_CONTEXT_CONFIGS' -> * -> 'jsUrl'.
        `webpage` is accepted but not used by this method.

        @returns the URL joined onto https://www.youtube.com, or None if not found
        """
        js_location = traverse_obj(
            ytcfgs, (..., 'PLAYER_JS_URL'), (..., 'WEB_PLAYER_CONTEXT_CONFIGS', ..., 'jsUrl'),
            get_all=False, expected_type=str)
        if js_location:
            return urljoin('https://www.youtube.com', js_location)
        return None

    def _download_player_url(self, video_id, fatal=False):
        iframe_webpage = self._download_webpage_with_retries(
            'https://www.youtube.com/iframe_api',
            note='Downloading iframe API JS',
            video_id=video_id, retry_fatal=fatal)

        if iframe_webpage:
            player_version = self._search_regex(
                r'player\\?/([0-9a-fA-F]{8})\\?/', iframe_webpage, 'player version', fatal=fatal)
            if player_version:
                return f'https://www.youtube.com/s/player/{player_version}/player_ias.vflset/en_US/base.js'

    def _signature_cache_id(self, example_sig):
        """ Return a string representation of a signature """
        return '.'.join(str(len(part)) for part in example_sig.split('.'))

    @classmethod
    def _extract_player_info(cls, player_url):
        """
        Extract the player id from a player URL.

        Each pattern in cls._PLAYER_INFO_RE is searched in turn and the 'id'
        group of the first match is returned.

        @raises ExtractorError if no pattern matches
        """
        candidates = (re.search(pattern, player_url) for pattern in cls._PLAYER_INFO_RE)
        # The generator is lazy, so searching stops at the first successful match
        first_match = next(filter(None, candidates), None)
        if first_match is None:
            raise ExtractorError(f'Cannot identify player {player_url!r}')
        return first_match.group('id')

    def _load_player(self, video_id, player_url, fatal=True):
        player_id = self._extract_player_info(player_url)
        if player_id not in self._code_cache:
            code = self._download_webpage(
                player_url, video_id, fatal=fatal,
                note='Downloading player ' + player_id,
                errnote=f'Download of {player_url} failed')
            if code:
                self._code_cache[player_id] = code
        return self._code_cache.get(player_id)

    def _extract_signature_function(self, video_id, player_url, example_sig):
        player_id = self._extract_player_info(player_url)

        # Read from filesystem cache
        func_id = f'js_{player_id}_{self._signature_cache_id(example_sig)}'
        assert os.path.basename(func_id) == func_id

        self.write_debug(f'Extracting signature function {func_id}')
        cache_spec, code = self.cache.load('youtube-sigfuncs', func_id), None

        if not cache_spec:
            code = self._load_player(video_id, player_url)
        if code:
            res = self._parse_sig_js(code)
            test_string = ''.join(map(chr, range(len(example_sig))))
            cache_spec = [ord(c) for c in res(test_string)]
            self.cache.store('youtube-sigfuncs', func_id, cache_spec)

        return lambda s: ''.join(s[i] for i in cache_spec)

    def _print_sig_code(self, func, example_sig):
        if not self.get_param('youtube_print_sig_code'):
            return

        def gen_sig_code(idxs):
            def _genslice(start, end, step):
                starts = '' if start == 0 else str(start)
                ends = (':%d' % (end + step)) if end + step >= 0 else ':'
                steps = '' if step == 1 else (':%d' % step)
                return f's[{starts}{ends}{steps}]'

            step = None
            # Quelch pyflakes warnings - start will be set when step is set
            start = '(Never used)'
            for i, prev in zip(idxs[1:], idxs[:-1]):
                if step is not None:
                    if i - prev == step:
                        continue
                    yield _genslice(start, prev, step)
                    step = None
                    continue
                if i - prev in [-1, 1]:
                    step = i - prev
                    start = prev
                    continue
                else:
                    yield 's[%d]' % prev
            if step is None:
                yield 's[%d]' % i
            else:
                yield _genslice(start, i, step)

        test_string = ''.join(map(chr, range(len(example_sig))))
        cache_res = func(test_string)
        cache_spec = [ord(c) for c in cache_res]
        expr_code = ' + '.join(gen_sig_code(cache_spec))
        signature_id_tuple = '({})'.format(', '.join(str(len(p)) for p in example_sig.split('.')))
        code = (f'if tuple(len(p) for p in s.split(\'.\')) == {signature_id_tuple}:\n'
                f'    return {expr_code}\n')
        self.to_screen('Extracted signature function:\n' + code)

    def _parse_sig_js(self, jscode):
        """
        Locate the signature function in the player JS and make it callable.

        @param jscode  player JavaScript source
        @returns callable taking a signature string and returning the result of
                 the interpreted JS function
        """
        # Patterns whose `sig` group captures the signature function's name.
        # Examples where `sig` is funcname:
        # sig=function(a){a=a.split(""); ... ;return a.join("")};
        # ;c&&(c=sig(decodeURIComponent(c)),a.set(b,encodeURIComponent(c)));return a};
        # {var l=f,m=h.sp,n=sig(decodeURIComponent(h.s));l.set(m,encodeURIComponent(n))}
        # sig=function(J){J=J.split(""); ... ;return J.join("")};
        # ;N&&(N=sig(decodeURIComponent(N)),J.set(R,encodeURIComponent(N)));return J};
        # {var H=u,k=f.sp,v=sig(decodeURIComponent(f.s));H.set(k,encodeURIComponent(v))}
        sig_name_patterns = (
            r'\b(?P<var>[a-zA-Z0-9_$]+)&&\((?P=var)=(?P<sig>[a-zA-Z0-9_$]{2,})\(decodeURIComponent\((?P=var)\)\)',
            r'(?P<sig>[a-zA-Z0-9_$]+)\s*=\s*function\(\s*(?P<arg>[a-zA-Z0-9_$]+)\s*\)\s*{\s*(?P=arg)\s*=\s*(?P=arg)\.split\(\s*""\s*\)\s*;\s*[^}]+;\s*return\s+(?P=arg)\.join\(\s*""\s*\)',
            r'(?:\b|[^a-zA-Z0-9_$])(?P<sig>[a-zA-Z0-9_$]{2,})\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\)(?:;[a-zA-Z0-9_$]{2}\.[a-zA-Z0-9_$]{2}\(a,\d+\))?',
            # Old patterns
            r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\b[a-zA-Z0-9]+\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\bm=(?P<sig>[a-zA-Z0-9$]{2,})\(decodeURIComponent\(h\.s\)\)',
            # Obsolete patterns
            r'("|\')signature\1\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\.sig\|\|(?P<sig>[a-zA-Z0-9$]+)\(',
            r'yt\.akamaized\.net/\)\s*\|\|\s*.*?\s*[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?:encodeURIComponent\s*\()?\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
            r'\bc\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
        )
        funcname = self._search_regex(
            sig_name_patterns, jscode, 'Initial JS player signature function name', group='sig')

        jsi = JSInterpreter(jscode)
        _, varname, value = self._extract_player_js_global_var(jscode)
        # If the player declares a global variable, evaluate it once and hand it
        # to the extracted function under its original name
        global_var_map = {}
        if varname:
            global_var_map[varname] = jsi.interpret_expression(value, {}, allow_recursion=100)
        initial_function = jsi.extract_function(funcname, global_var_map)

        # The extracted function takes its arguments as a list
        return lambda s: initial_function([s])

    def _cached(self, func, *cache_id):
        def inner(*args, **kwargs):
            if cache_id not in self._player_cache:
                try:
                    self._player_cache[cache_id] = func(*args, **kwargs)
                except ExtractorError as e:
                    self._player_cache[cache_id] = e
                except Exception as e:
                    self._player_cache[cache_id] = ExtractorError(traceback.format_exc(), cause=e)

            ret = self._player_cache[cache_id]
            if isinstance(ret, Exception):
                raise ret
            return ret
        return inner

    def _load_nsig_code_from_cache(self, player_id):
        cache_id = ('nsig code', player_id)

        if func_code := self._player_cache.get(cache_id):
            return func_code

        func_code = self.cache.load('youtube-nsig', player_id, min_ver='2025.03.26')
        if func_code:
            self._player_cache[cache_id] = func_code

        return func_code

    def _store_nsig_code_to_cache(self, player_id, func_code):
        cache_id = ('nsig code', player_id)
        if cache_id not in self._player_cache:
            self.cache.store('youtube-nsig', player_id, func_code)
            self._player_cache[cache_id] = func_code

    def _decrypt_signature(self, s, video_id, player_url):
        """Turn the encrypted s field into a working signature"""
        # The extracted function is memoized per player URL and signature cache id
        sig_cache_id = self._signature_cache_id(s)
        cached_extractor = self._cached(
            self._extract_signature_function, 'sig', player_url, sig_cache_id)
        sig_func = cached_extractor(video_id, player_url, s)
        self._print_sig_code(sig_func, s)
        return sig_func(s)

    def _decrypt_nsig(self, s, video_id, player_url):
        """Turn the encrypted n field into a working signature

        The n function code is obtained for the player, run through the native
        JS interpreter and, if that raises JSInterpreter.Exception, re-run with
        PhantomJS when a PhantomJSwrapper can be created.

        @param s: The encrypted n value.
        @param video_id: Video ID, used for requests and log messages.
        @param player_url: Player JS URL; resolved against https://www.youtube.com.
        @returns: The decrypted n value.
        @raises ExtractorError: If player_url is None or the n function code
                                cannot be extracted.
        """
        if player_url is None:
            raise ExtractorError('Cannot decrypt nsig without player_url')
        player_url = urljoin('https://www.youtube.com', player_url)

        try:
            jsi, player_id, func_code = self._extract_n_function_code(video_id, player_url)
        except ExtractorError as e:
            raise ExtractorError('Unable to extract nsig function code', cause=e)
        if self.get_param('youtube_print_sig_code'):
            # func_code is (argument names, function body); only the body is printed
            self.to_screen(f'Extracted nsig function from {player_id}:\n{func_code[1]}\n')

        try:
            # The built Python function is memoized per player URL
            extract_nsig = self._cached(self._extract_n_function_from_code, 'nsig func', player_url)
            ret = extract_nsig(jsi, func_code)(s)
        except JSInterpreter.Exception as e:
            try:
                jsi = PhantomJSwrapper(self, timeout=5000)
            except ExtractorError:
                # No PhantomJS fallback possible: surface the interpreter error
                raise e
            self.report_warning(
                f'Native nsig extraction failed: Trying with PhantomJS\n'
                f'         n = {s} ; player = {player_url}', video_id)
            self.write_debug(e, only_once=True)

            # Rebuild the function as an immediately-invoked JS expression
            # and read its result from the printed output
            args, func_body = func_code
            ret = jsi.execute(
                f'console.log(function({", ".join(args)}) {{ {func_body} }}({s!r}));',
                video_id=video_id, note='Executing signature code').strip()

        self.write_debug(f'Decrypted nsig {s} => {ret}')
        # Only cache nsig func JS code to disk if successful, and only once
        self._store_nsig_code_to_cache(player_id, func_code)
        return ret

    def _extract_n_function_name(self, jscode, player_url=None):
        """Find the name of the n parameter transform function in the player JS.

        The primary pattern captures either a plain function name or an
        `array[idx]` reference. When it yields no name, a generic search for a
        function returning a string containing `_w8_` is used instead.

        @param jscode: Player JS source.
        @param player_url: Only used in the fallback warning message.
        @returns: The name of the n function.
        """
        # Examples (with placeholders nfunc, narray, idx):
        # *  .get("n"))&&(b=nfunc(b)
        # *  .get("n"))&&(b=narray[idx](b)
        # *  b=String.fromCharCode(110),c=a.get(b))&&c=narray[idx](c)
        # *  a.D&&(b="nn"[+a.D],c=a.get(b))&&(c=narray[idx](c),a.set(b,c),narray.length||nfunc("")
        # *  a.D&&(PL(a),b=a.j.n||null)&&(b=narray[0](b),a.set("n",b),narray.length||nfunc("")
        # *  a.D&&(b="nn"[+a.D],vL(a),c=a.j[b]||null)&&(c=narray[idx](c),a.set(b,c),narray.length||nfunc("")
        # *  J.J="";J.url="";J.Z&&(R="nn"[+J.Z],mW(J),N=J.K[R]||null)&&(N=narray[idx](N),J.set(R,N))}};
        funcname, idx = self._search_regex(
            r'''(?x)
            (?:
                \.get\("n"\)\)&&\(b=|
                (?:
                    b=String\.fromCharCode\(110\)|
                    (?P<str_idx>[a-zA-Z0-9_$.]+)&&\(b="nn"\[\+(?P=str_idx)\]
                )
                (?:
                    ,[a-zA-Z0-9_$]+\(a\))?,c=a\.
                    (?:
                        get\(b\)|
                        [a-zA-Z0-9_$]+\[b\]\|\|null
                    )\)&&\(c=|
                \b(?P<var>[a-zA-Z0-9_$]+)=
            )(?P<nfunc>[a-zA-Z0-9_$]+)(?:\[(?P<idx>\d+)\])?\([a-zA-Z]\)
            (?(var),[a-zA-Z0-9_$]+\.set\((?:"n+"|[a-zA-Z0-9_$]+)\,(?P=var)\))''',
            jscode, 'n function name', group=('nfunc', 'idx'), default=(None, None))
        if not funcname:
            # Primary pattern found nothing: warn and use the generic search
            self.report_warning(join_nonempty(
                'Falling back to generic n function search',
                player_url and f'         player = {player_url}', delim='\n'))
            return self._search_regex(
                r'''(?xs)
                ;\s*(?P<name>[a-zA-Z0-9_$]+)\s*=\s*function\([a-zA-Z0-9_$]+\)
                \s*\{(?:(?!};).)+?return\s*(?P<q>["'])[\w-]+_w8_(?P=q)\s*\+\s*[a-zA-Z0-9_$]+''',
                jscode, 'Initial JS player n function name', group='name')
        elif not idx:
            # Plain `nfunc(x)` call: the captured name is the function itself
            return funcname

        # `narray[idx](x)` call: read the array literal assigned to `var narray`
        # and take the element at idx as the function name
        return json.loads(js_to_json(self._search_regex(
            rf'var {re.escape(funcname)}\s*=\s*(\[.+?\])\s*[,;]', jscode,
            f'Initial JS player n function list ({funcname}.{idx})')))[int(idx)]

    def _extract_player_js_global_var(self, jscode):
        """Returns tuple of strings: variable assignment code, variable name, variable value code

        The pattern looks for a `var NAME = VALUE` statement directly after the
        "use strict" directive, where VALUE is either a quoted string followed
        by `.split("...")` or an array literal of quoted strings.
        (None, None, None) is passed as the default for when nothing matches.
        """
        return self._search_regex(
            r'''(?x)
                (?P<q1>["\'])use\s+strict(?P=q1);\s*
                (?P<code>
                    var\s+(?P<name>[a-zA-Z0-9_$]+)\s*=\s*
                    (?P<value>
                        (?P<q2>["\'])(?:(?!(?P=q2)).|\\.)+(?P=q2)
                        \.split\((?P<q3>["\'])(?:(?!(?P=q3)).)+(?P=q3)\)
                        |\[\s*(?:(?P<q4>["\'])(?:(?!(?P=q4)).|\\.)*(?P=q4)\s*,?\s*)+\]
                    )
                )[;,]
            ''', jscode, 'global variable', group=('code', 'name', 'value'), default=(None, None, None))

    def _fixup_n_function_code(self, argnames, code, full_code):
        global_var, varname, _ = self._extract_player_js_global_var(full_code)
        if global_var:
            self.write_debug(f'Prepending n function code with global array variable "{varname}"')
            code = global_var + '; ' + code
        else:
            self.write_debug('No global array variable found in player JS')
        return argnames, re.sub(
            rf';\s*if\s*\(\s*typeof\s+[a-zA-Z0-9_$]+\s*===?\s*(?:(["\'])undefined\1|{varname}\[\d+\])\s*\)\s*return\s+{argnames[0]};',
            ';', code)

    def _extract_n_function_code(self, video_id, player_url):
        """Return (JS interpreter, player id, n function code) for a player.

        Cached function code is used when available; otherwise the player JS
        is loaded, the n function located and its code extracted and fixed up.
        """
        player_id = self._extract_player_info(player_url)

        cached_code = self._load_nsig_code_from_cache(player_id)
        if cached_code:
            # On a cache hit the interpreter is created from the cached code itself
            return JSInterpreter(cached_code), player_id, cached_code

        player_js = self._load_player(video_id, player_url)
        interpreter = JSInterpreter(player_js)
        n_func_name = self._extract_n_function_name(player_js, player_url=player_url)

        # XXX: Workaround for the global array variable and lack of `typeof` implementation
        argnames, raw_code = interpreter.extract_function_code(n_func_name)
        fixed_code = self._fixup_n_function_code(argnames, raw_code, player_js)

        return interpreter, player_id, fixed_code

    def _extract_n_function_from_code(self, jsi, func_code):
        """Build a Python callable that runs the n function on a single value.

        The callable raises JSInterpreter.Exception when the interpreter fails
        for any reason, or when the result looks like a failure marker (starts
        with 'enhanced_except_' or ends with the input).
        """
        n_function = jsi.extract_function_from_code(*func_code)

        def extract_nsig(s):
            try:
                result = n_function([s])
            except Exception as err:
                # Interpreter errors pass through untouched; anything else is
                # wrapped so callers only need to handle one exception type
                if isinstance(err, JSInterpreter.Exception):
                    raise
                raise JSInterpreter.Exception(traceback.format_exc(), cause=err)

            looks_failed = result.startswith('enhanced_except_') or result.endswith(s)
            if looks_failed:
                raise JSInterpreter.Exception('Signature function returned an exception')
            return result

        return extract_nsig

    def _extract_signature_timestamp(self, video_id, player_url, ytcfg=None, fatal=False):
        """
        Extract signatureTimestamp (sts)
        Required to tell API what sig/player version is in use.

        The 'STS' value of ytcfg is used when present and non-zero; otherwise
        the player JS is loaded and searched for a five digit timestamp.
        Without a player_url this raises ExtractorError if fatal, else warns
        and returns None.
        """
        sts = int_or_none(ytcfg.get('STS')) if isinstance(ytcfg, dict) else None
        if sts:
            return sts

        # Attempt to extract from player
        if player_url is None:
            error_msg = 'Cannot extract signature timestamp without player_url.'
            if fatal:
                raise ExtractorError(error_msg)
            self.report_warning(error_msg)
            return None

        code = self._load_player(video_id, player_url, fatal=fatal)
        if not code:
            # No player code to search: hand back what ytcfg provided
            return sts

        return int_or_none(self._search_regex(
            r'(?:signatureTimestamp|sts)\s*:\s*(?P<sts>[0-9]{5})', code,
            'JS player signature timestamp', group='sts', fatal=fatal))

    def _mark_watched(self, video_id, player_responses):
        """Request the playback tracking URLs so the video gets marked as watched.

        Two URLs from the player responses are requested in turn: the playback
        URL, then the watchtime URL ("fully" watched). If either URL is
        missing, a warning is reported and the remaining work is skipped.
        Download failures are non-fatal.

        @param video_id: Video ID, used for the request notes.
        @param player_responses: Player responses searched for
                                 playbackTracking -> <key> -> baseUrl.
        """
        # cpn generation algorithm is reverse engineered from base.js.
        # In fact it works even with dummy cpn.
        CPN_ALPHABET = 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_'

        for is_full, key in enumerate(('videostatsPlaybackUrl', 'videostatsWatchtimeUrl')):
            label = 'fully ' if is_full else ''
            url = get_first(player_responses, ('playbackTracking', key, 'baseUrl'),
                            expected_type=url_or_none)
            if not url:
                self.report_warning(f'Unable to mark {label}watched')
                return
            parsed_url = urllib.parse.urlparse(url)
            qs = urllib.parse.parse_qs(parsed_url.query)

            # Each of the 16 characters is drawn uniformly from the alphabet
            cpn = ''.join(random.choices(CPN_ALPHABET, k=16))

            # more consistent results setting it to right before the end
            video_length = [str(float((qs.get('len') or ['1.5'])[0]) - 1)]

            qs.update({
                'ver': ['2'],
                'cpn': [cpn],
                'cmt': video_length,
                'el': 'detailpage',  # otherwise defaults to "shorts"
            })

            if is_full:
                # these seem to mark watchtime "history" in the real world
                # they're required, so send in a single value
                qs.update({
                    'st': 0,
                    'et': video_length,
                })

            url = urllib.parse.urlunparse(
                parsed_url._replace(query=urllib.parse.urlencode(qs, True)))

            self._download_webpage(
                url, video_id, f'Marking {label}watched',
                'Unable to mark watched', fatal=False)

    @classmethod
    def _extract_from_webpage(cls, url, webpage):
        """Yield url results for YouTube videos referenced by a third-party webpage.

        A canonical YouTube link (as emitted by Invidious instances) takes
        priority and stops extraction; otherwise the inherited embed detection
        runs, followed by lazyYT and "YouTube Video Importer" embeds.
        """
        # Invidious Instances
        # https://github.com/yt-dlp/yt-dlp/issues/195
        # https://github.com/iv-org/invidious/pull/1730
        alternate_link = re.search(
            r'<link rel="alternate" href="(?P<url>https://www\.youtube\.com/watch\?v=[0-9A-Za-z_-]{11})"',
            webpage)
        if alternate_link is not None:
            yield cls.url_result(alternate_link.group('url'), cls)
            raise cls.StopExtraction

        yield from super()._extract_from_webpage(url, webpage)

        # lazyYT YouTube embed
        lazyyt_ids = re.findall(r'class="lazyYT" data-youtube-id="([^"]+)"', webpage)
        for raw_id in lazyyt_ids:
            yield cls.url_result(unescapeHTML(raw_id), cls, raw_id)

        # Wordpress "YouTube Video Importer" plugin
        importer_matches = re.findall(r'''(?x)<div[^>]+
                class=(?P<q1>[\'"])[^\'"]*\byvii_single_video_player\b[^\'"]*(?P=q1)[^>]+
                data-video_id=(?P<q2>[\'"])([^\'"]+)(?P=q2)''', webpage)
        # Each match is (q1, q2, video id); only the id is of interest
        for _, _, embedded_id in importer_matches:
            yield cls.url_result(embedded_id, cls, embedded_id)

    @classmethod
    def extract_id(cls, url):
        """Return the video id for `url`; raise ExtractorError if none can be determined."""
        video_id = cls.get_temp_id(url)
        if video_id:
            return video_id
        raise ExtractorError(f'Invalid URL: {url}')

    def _extract_chapters_from_json(self, data, duration):
        """Extract chapters from the chaptered player bar in `data`.

        Start times are read from `timeRangeStartMillis` (converted to
        seconds) and titles from the chapter renderer's simple text.
        """
        chapters_path = (
            'playerOverlays', 'playerOverlayRenderer', 'decoratedPlayerBarRenderer',
            'decoratedPlayerBarRenderer', 'playerBar', 'chapteredPlayerBarRenderer', 'chapters',
        )

        def start_seconds(chapter):
            start_millis = traverse_obj(chapter, ('chapterRenderer', 'timeRangeStartMillis'))
            return float_or_none(start_millis, scale=1000)

        def chapter_title(chapter):
            return traverse_obj(
                chapter, ('chapterRenderer', 'title', 'simpleText'), expected_type=str)

        chapter_list = traverse_obj(data, chapters_path, expected_type=list)
        return self._extract_chapters_helper(
            chapter_list,
            start_function=start_seconds,
            title_function=chapter_title,
            duration=duration)

    def _extract_chapters_from_engagement_panel(self, data, duration):
        """Extract chapters from the macro markers lists of the engagement panels.

        Returns the chapters of the first markers list that produces any, or
        an empty list when none does.
        """
        markers_lists = traverse_obj(
            data,
            ('engagementPanels', ..., 'engagementPanelSectionListRenderer', 'content', 'macroMarkersListRenderer', 'contents'),
            expected_type=list)

        def chapter_time(chapter):
            return parse_duration(self._get_text(chapter, 'timeDescription'))

        def chapter_title(chapter):
            return self._get_text(chapter, 'title')

        for contents in markers_lists:
            markers = traverse_obj(contents, (..., 'macroMarkersListItemRenderer'))
            chapters = self._extract_chapters_helper(
                markers, chapter_time, chapter_title, duration)
            if chapters:
                return chapters
        return []

    def _extract_heatmap(self, data):
        """Extract heatmap markers as dicts with start_time, end_time and value.

        Times are converted from milliseconds to seconds. Returns None when no
        heatmap markers are found.
        """
        def is_heatmap_mutation(_, mutation):
            markers_list = mutation['payload']['macroMarkersListEntity']['markersList']
            return markers_list['markerType'] == 'MARKER_TYPE_HEATMAP'

        def end_seconds(marker):
            return (int(marker['startMillis']) + int(marker['durationMillis'])) / 1000

        marker_fields = {
            'start_time': ('startMillis', {float_or_none(scale=1000)}),
            'end_time': {end_seconds},
            'value': ('intensityScoreNormalized', {float_or_none}),
        }
        heatmap = traverse_obj(data, (
            'frameworkUpdates', 'entityBatchUpdate', 'mutations', is_heatmap_mutation,
            'payload', 'macroMarkersListEntity', 'markersList', 'markers', ..., marker_fields))
        return heatmap or None

    def _extract_comment(self, entities, parent=None):
        """Build a comment dict from entity payloads (new comment format).

        @param entities: Entity mutations belonging to one comment; the comment
                         payload and the toolbar state payload are looked up
                         among them.
        @param parent: Id of the parent comment; 'root' is used when falsy.
        @returns: The comment dict, or None when no comment id is found.
        """
        payload = get_first(entities, ('payload', 'commentEntityPayload', {dict}))
        comment_id = traverse_obj(payload, ('properties', 'commentId', {str}))
        if not comment_id:
            return

        toolbar_state = get_first(entities, ('payload', 'engagementToolbarStateEntityPayload', {dict}))
        time_text = traverse_obj(payload, ('properties', 'publishedTime', {str})) or ''

        comment = {
            'id': comment_id,
            'parent': parent or 'root',
        }
        comment.update(traverse_obj(payload, {
            'text': ('properties', 'content', 'content', {str}),
            'like_count': ('toolbar', 'likeCountA11y', {parse_count}),
            'author_id': ('author', 'channelId', {self.ucid_or_none}),
            'author': ('author', 'displayName', {str}),
            'author_thumbnail': ('author', 'avatarThumbnailUrl', {url_or_none}),
            'author_is_uploader': ('author', 'isCreator', {bool}),
            'author_is_verified': ('author', 'isVerified', {bool}),
            'author_url': ('author', 'channelCommand', 'innertubeCommand', (
                ('browseEndpoint', 'canonicalBaseUrl'), ('commandMetadata', 'webCommandMetadata', 'url'),
            ), {urljoin('https://www.youtube.com')}),
        }, get_all=False))

        # Unknown (None) when there is no toolbar state for this comment
        if toolbar_state is None:
            comment['is_favorited'] = None
        else:
            comment['is_favorited'] = toolbar_state.get('heartState') == 'TOOLBAR_HEART_STATE_HEARTED'

        # FIXME: non-standard, but we need a way of showing that it is an estimate.
        comment['_time_text'] = time_text
        comment['timestamp'] = self._parse_time_text(time_text)
        return comment

    def _extract_comment_old(self, comment_renderer, parent=None):
        """Build a comment dict from a comment renderer (old comment format).

        @param comment_renderer: The commentRenderer dict.
        @param parent: Id of the parent comment; 'root' is used when falsy.
        @returns: The comment dict, or None when the renderer has no commentId.
        """
        comment_id = comment_renderer.get('commentId')
        if not comment_id:
            return

        # Timestamp is an estimate calculated from the current time and time_text
        time_text = self._get_text(comment_renderer, 'publishedTimeText') or ''

        author_url_path = traverse_obj(comment_renderer, ('authorEndpoint', (
            ('browseEndpoint', 'canonicalBaseUrl'), ('commandMetadata', 'webCommandMetadata', 'url'))),
            expected_type=str, get_all=False)

        info = {
            'id': comment_id,
            'text': self._get_text(comment_renderer, 'contentText'),
            'like_count': self._get_count(comment_renderer, 'voteCount'),
            'author_id': traverse_obj(comment_renderer, ('authorEndpoint', 'browseEndpoint', 'browseId', {self.ucid_or_none})),
            'author': self._get_text(comment_renderer, 'authorText'),
            'author_thumbnail': traverse_obj(comment_renderer, ('authorThumbnail', 'thumbnails', -1, 'url', {url_or_none})),
            'parent': parent or 'root',
            # FIXME: non-standard, but we need a way of showing that it is an estimate.
            '_time_text': time_text,
            'timestamp': self._parse_time_text(time_text),
            'author_url': urljoin('https://www.youtube.com', author_url_path),
        }

        # The remaining fields are only set when the renderer provides them
        is_channel_owner = traverse_obj(comment_renderer, 'authorIsChannelOwner')
        if is_channel_owner is not None:
            info['author_is_uploader'] = is_channel_owner

        action_buttons = traverse_obj(
            comment_renderer, ('actionButtons', 'commentActionButtonsRenderer'), expected_type=dict)
        if action_buttons is not None:
            info['is_favorited'] = 'creatorHeart' in action_buttons

        author_badges = self._extract_badges([traverse_obj(comment_renderer, 'authorCommentBadge')])
        if self._has_badge(author_badges, BadgeType.VERIFIED):
            info['author_is_verified'] = True

        if traverse_obj(comment_renderer, 'pinnedCommentBadge'):
            info['is_pinned'] = True

        return info

    def _comment_entries(self, root_continuation_data, ytcfg, video_id, parent=None, tracker=None):
        """
        Generator yielding comment dicts for a comment section or a reply thread.

        Pages through the 'next' API endpoint, starting from the continuation found in
        root_continuation_data, and calls itself for the reply thread of each comment.

        @param root_continuation_data: Renderer the initial continuation is extracted from.
        @param ytcfg: Passed on to header generation and the API requests.
        @param video_id: Used to generate a continuation when none is found, and for warnings.
        @param parent: Id of the parent comment when extracting replies; None for the top level.
        @param tracker: Dict of counters and seen ids shared across recursive calls;
                        created here when falsy.
        @raises CommentsDisabled: For the top level, when the root data carries a message
                                  and no comments were extracted.
        """

        get_single_config_arg = lambda c: self._configuration_arg(c, [''])[0]

        def extract_header(contents):
            # Records the estimated comment count in the tracker and returns the
            # continuation of the requested sort order (or None if not found)
            _continuation = None
            for content in contents:
                comments_header_renderer = traverse_obj(content, 'commentsHeaderRenderer')
                expected_comment_count = self._get_count(
                    comments_header_renderer, 'countText', 'commentsCount')

                if expected_comment_count is not None:
                    tracker['est_total'] = expected_comment_count
                    self.to_screen(f'Downloading ~{expected_comment_count} comments')
                comment_sort_index = int(get_single_config_arg('comment_sort') != 'top')  # 1 = new, 0 = top

                sort_menu_item = try_get(
                    comments_header_renderer,
                    lambda x: x['sortMenu']['sortFilterSubMenuRenderer']['subMenuItems'][comment_sort_index], dict) or {}
                sort_continuation_ep = sort_menu_item.get('serviceEndpoint') or {}

                _continuation = self._extract_continuation_ep_data(sort_continuation_ep) or self._extract_continuation(sort_menu_item)
                if not _continuation:
                    continue

                sort_text = str_or_none(sort_menu_item.get('title'))
                if not sort_text:
                    sort_text = 'top comments' if comment_sort_index == 0 else 'newest first'
                self.to_screen(f'Sorting comments by {sort_text.lower()}')
                break
            return _continuation

        def extract_thread(contents, entity_payloads):
            # Yields comment dicts (and, recursively, their replies).
            # A bare `yield` (None) is a sentinel: the consuming loop below
            # stops the whole extraction when it receives a falsy entry
            if not parent:
                tracker['current_page_thread'] = 0
            for content in contents:
                if not parent and tracker['total_parent_comments'] >= max_parents:
                    yield
                comment_thread_renderer = try_get(content, lambda x: x['commentThreadRenderer'])

                # old comment format
                if not entity_payloads:
                    comment_renderer = get_first(
                        (comment_thread_renderer, content), [['commentRenderer', ('comment', 'commentRenderer')]],
                        expected_type=dict, default={})

                    comment = self._extract_comment_old(comment_renderer, parent)

                # new comment format
                else:
                    view_model = (
                        traverse_obj(comment_thread_renderer, ('commentViewModel', 'commentViewModel', {dict}))
                        or traverse_obj(content, ('commentViewModel', {dict})))
                    comment_keys = traverse_obj(view_model, (('commentKey', 'toolbarStateKey'), {str}))
                    if not comment_keys:
                        continue
                    # Select the entity mutations referenced by this comment's keys
                    entities = traverse_obj(entity_payloads, lambda _, v: v['entityKey'] in comment_keys)
                    comment = self._extract_comment(entities, parent)
                    if comment:
                        comment['is_pinned'] = traverse_obj(view_model, ('pinnedText', {str})) is not None

                if not comment:
                    continue
                comment_id = comment['id']

                if comment.get('is_pinned'):
                    tracker['pinned_comment_ids'].add(comment_id)
                # Sometimes YouTube may break and give us infinite looping comments.
                # See: https://github.com/yt-dlp/yt-dlp/issues/6290
                if comment_id in tracker['seen_comment_ids']:
                    if comment_id in tracker['pinned_comment_ids'] and not comment.get('is_pinned'):
                        # Pinned comments may appear a second time in newest first sort
                        # See: https://github.com/yt-dlp/yt-dlp/issues/6712
                        continue
                    self.report_warning(
                        'Detected YouTube comments looping. Stopping comment extraction '
                        f'{"for this thread" if parent else ""} as we probably cannot get any more.')
                    yield
                else:
                    tracker['seen_comment_ids'].add(comment['id'])

                tracker['running_total'] += 1
                tracker['total_reply_comments' if parent else 'total_parent_comments'] += 1
                yield comment

                # Attempt to get the replies
                comment_replies_renderer = try_get(
                    comment_thread_renderer, lambda x: x['replies']['commentRepliesRenderer'], dict)

                if comment_replies_renderer:
                    tracker['current_page_thread'] += 1
                    comment_entries_iter = self._comment_entries(
                        comment_replies_renderer, ytcfg, video_id,
                        parent=comment.get('id'), tracker=tracker)
                    # Cap replies by both the per-thread limit and what is left of the overall reply limit
                    yield from itertools.islice(comment_entries_iter, min(
                        max_replies_per_thread, max(0, max_replies - tracker['total_reply_comments'])))

        # Keeps track of counts across recursive calls
        if not tracker:
            tracker = {
                'running_total': 0,
                'est_total': None,
                'current_page_thread': 0,
                'total_parent_comments': 0,
                'total_reply_comments': 0,
                'seen_comment_ids': set(),
                'pinned_comment_ids': set(),
            }

        # TODO: Deprecated
        # YouTube comments have a max depth of 2
        max_depth = int_or_none(get_single_config_arg('max_comment_depth'))
        if max_depth:
            self._downloader.deprecated_feature('[youtube] max_comment_depth extractor argument is deprecated. '
                                                'Set max replies in the max-comments extractor argument instead')
        if max_depth == 1 and parent:
            return

        # Up to four limits are read from the max_comments argument; missing or
        # non-integer values become sys.maxsize. max_comments itself is not
        # referenced again within this function
        max_comments, max_parents, max_replies, max_replies_per_thread, *_ = (
            int_or_none(p, default=sys.maxsize) for p in self._configuration_arg('max_comments') + [''] * 4)

        continuation = self._extract_continuation(root_continuation_data)

        response = None
        is_forced_continuation = False
        is_first_continuation = parent is None
        if is_first_continuation and not continuation:
            # Sometimes you can get comments by generating the continuation yourself,
            # even if YouTube initially reports them being disabled - e.g. stories comments.
            # Note: if the comment section is actually disabled, YouTube may return a response with
            # required check_get_keys missing. So we will disable that check initially in this case.
            continuation = self._build_api_continuation_query(self._generate_comment_continuation(video_id))
            is_forced_continuation = True

        continuation_items_path = (
            'onResponseReceivedEndpoints', ..., ('reloadContinuationItemsCommand', 'appendContinuationItemsAction'), 'continuationItems')
        # One iteration per API page; ends when no further continuation is found
        for page_num in itertools.count(0):
            if not continuation:
                break
            headers = self.generate_api_headers(ytcfg=ytcfg, visitor_data=self._extract_visitor_data(response))
            comment_prog_str = f"({tracker['running_total']}/~{tracker['est_total']})"
            if page_num == 0:
                if is_first_continuation:
                    note_prefix = 'Downloading comment section API JSON'
                else:
                    note_prefix = '    Downloading comment API JSON reply thread %d %s' % (
                        tracker['current_page_thread'], comment_prog_str)
            else:
                note_prefix = '{}Downloading comment{} API JSON page {} {}'.format(
                    '       ' if parent else '', ' replies' if parent else '',
                    page_num, comment_prog_str)

            # Do a deep check for incomplete data as sometimes YouTube may return no comments for a continuation
            # Ignore check if YouTube says the comment count is 0.
            check_get_keys = None
            if not is_forced_continuation and not (tracker['est_total'] == 0 and tracker['running_total'] == 0):
                check_get_keys = [[*continuation_items_path, ..., (
                    'commentsHeaderRenderer' if is_first_continuation else ('commentThreadRenderer', 'commentViewModel', 'commentRenderer'))]]
            try:
                response = self._extract_response(
                    item_id=None, query=continuation,
                    ep='next', ytcfg=ytcfg, headers=headers, note=note_prefix,
                    check_get_keys=check_get_keys)
            except ExtractorError as e:
                # Ignore incomplete data error for replies if retries didn't work.
                # This is to allow any other parent comments and comment threads to be downloaded.
                # See: https://github.com/yt-dlp/yt-dlp/issues/4669
                if 'incomplete data' in str(e).lower() and parent:
                    if self.get_param('ignoreerrors') in (True, 'only_download'):
                        self.report_warning(
                            'Received incomplete data for a comment reply thread and retrying did not help. '
                            'Ignoring to let other comments be downloaded. Pass --no-ignore-errors to not ignore.')
                        return
                    else:
                        raise ExtractorError(
                            'Incomplete data received for comment reply thread. '
                            'Pass --ignore-errors to ignore and allow rest of comments to download.',
                            expected=True)
                raise
            is_forced_continuation = False
            continuation = None
            # Entity mutations carry the comment payloads of the new comment format
            mutations = traverse_obj(response, ('frameworkUpdates', 'entityBatchUpdate', 'mutations', ..., {dict}))
            for continuation_items in traverse_obj(response, continuation_items_path, expected_type=list, default=[]):
                if is_first_continuation:
                    # The first response of the top level only provides the header;
                    # comments are fetched with the sort continuation it yields
                    continuation = extract_header(continuation_items)
                    is_first_continuation = False
                    if continuation:
                        break
                    continue

                for entry in extract_thread(continuation_items, mutations):
                    # A falsy entry is the stop sentinel from extract_thread
                    if not entry:
                        return
                    yield entry
                continuation = self._extract_continuation({'contents': continuation_items})
                if continuation:
                    break

        message = self._get_text(root_continuation_data, ('contents', ..., 'messageRenderer', 'text'), max_runs=1)
        if message and not parent and tracker['running_total'] == 0:
            self.report_warning(f'Youtube said: {message}', video_id=video_id, only_once=True)
            raise self.CommentsDisabled

    @staticmethod
    def _generate_comment_continuation(video_id):
        """
        Generates initial comment section continuation token from given video id
        """
        token = f'\x12\r\x12\x0b{video_id}\x18\x062\'"\x11"\x0b{video_id}0\x00x\x020\x00B\x10comments-section'
        return base64.b64encode(token.encode()).decode()

    def _get_comments(self, ytcfg, video_id, contents, webpage):
        """Entry for comment extraction"""
        def _real_comment_extract(contents):
            # Use the first item section identified as the comment section (None if absent)
            comment_section = None
            for item in traverse_obj(contents, (..., 'itemSectionRenderer'), default={}):
                if item.get('sectionIdentifier') == 'comment-item-section':
                    comment_section = item
                    break
            yield from self._comment_entries(comment_section, ytcfg, video_id)

        # The first max_comments value caps the total number of comments yielded
        total_limit = int_or_none(self._configuration_arg('max_comments', [''])[0])
        return itertools.islice(_real_comment_extract(contents), 0, total_limit)

    @staticmethod
    def _get_checkok_params():
        return {'contentCheckOk': True, 'racyCheckOk': True}

    @classmethod
    def _generate_player_context(cls, sts=None):
        context = {
            'html5Preference': 'HTML5_PREF_WANTS',
        }
        if sts is not None:
            context['signatureTimestamp'] = sts
        return {
            'playbackContext': {
                'contentPlaybackContext': context,
            },
            **cls._get_checkok_params(),
        }

    def _get_config_po_token(self, client: str, context: _PoTokenContext):
        """Return the user-configured PO Token for the given client and context.

        Entries of the po_token extractor argument have the form
        "CLIENT.CONTEXT+PO_TOKEN"; an entry without a context is treated as GVS.
        The first matching entry that is valid base64url is returned in
        normalized form. Returns None when no entry matches.
        """
        configured_entries = self._configuration_arg('po_token', [], ie_key=YoutubeIE, casesense=True)
        for entry in configured_entries:
            entry_meta, plus, raw_token = entry.partition('+')
            if not plus:
                self.report_warning(
                    f'Invalid po_token configuration format. '
                    f'Expected "CLIENT.CONTEXT+PO_TOKEN", got "{entry}"', only_once=True)
                continue

            entry_client, dot, entry_context = entry_meta.partition('.')
            if entry_client.lower() != client:
                continue

            if not dot:
                # TODO(future): deprecate the old format?
                self.write_debug(
                    f'po_token configuration for {client} client is missing a context; assuming GVS. '
                    'You can provide a context with the format "CLIENT.CONTEXT+PO_TOKEN"',
                    only_once=True)
                entry_context = _PoTokenContext.GVS.value

            if entry_context.lower() != context.value:
                continue

            # Clean and validate the PO Token. This will strip invalid characters off
            # (e.g. additional url params the user may accidentally include)
            try:
                token_bytes = base64.urlsafe_b64decode(urllib.parse.unquote(raw_token))
                return base64.urlsafe_b64encode(token_bytes).decode()
            except (binascii.Error, ValueError):
                self.report_warning(
                    f'Invalid po_token configuration for {client} client: '
                    f'{entry_context} PO Token should be a base64url-encoded string.',
                    only_once=True)

    def fetch_po_token(self, client='web', context=_PoTokenContext.GVS, ytcfg=None, visitor_data=None,
                       data_sync_id=None, session_index=None, player_url=None, video_id=None, **kwargs):
        """
        Fetch a PO Token for a given client and context. This function will validate required parameters for a given context and client.

        A token from the `po_token` extractor argument takes precedence; the
        external fetcher (`_fetch_po_token`) is only consulted when none is configured.

        EXPERIMENTAL: This method is unstable and may change or be removed without notice.

        @param client: The client to fetch the PO Token for.
        @param context: The context in which the PO Token is used.
        @param ytcfg: The ytcfg for the client.
        @param visitor_data: visitor data.
        @param data_sync_id: data sync ID.
        @param session_index: session index.
        @param player_url: player URL.
        @param video_id: video ID.
        @param kwargs: Additional arguments to pass down. May be more added in the future.
        @return: The fetched PO Token. None if it could not be fetched.
        """

        # The visitor data / data sync ID requirements below are only enforced
        # for GVS tokens requested together with a player URL
        is_gvs_with_player = bool(player_url) and context == _PoTokenContext.GVS

        # GVS WebPO Token is bound to visitor_data / Visitor ID when logged out.
        # Must have visitor_data for it to function.
        if is_gvs_with_player and not visitor_data and not self.is_authenticated:
            self.report_warning(
                f'Unable to fetch GVS PO Token for {client} client: Missing required Visitor Data. '
                'You may need to pass Visitor Data with --extractor-args "youtube:visitor_data=XXX"')
            return None

        if context == _PoTokenContext.PLAYER and not video_id:
            self.report_warning(
                f'Unable to fetch Player PO Token for {client} client: Missing required Video ID')
            return None

        config_po_token = self._get_config_po_token(client, context)

        # GVS WebPO token is bound to data_sync_id / account Session ID when logged in.
        missing_data_sync_id = is_gvs_with_player and not data_sync_id and self.is_authenticated

        if config_po_token:
            # A configured token is still returned; the user is only warned that it may not work
            if missing_data_sync_id:
                self.report_warning(
                    f'Got a GVS PO Token for {client} client, but missing Data Sync ID for account. Formats may not work. '
                    'You may need to pass a Data Sync ID with --extractor-args "youtube:data_sync_id=XXX"')

            return config_po_token

        # Require GVS WebPO Token if logged in for external fetching
        if missing_data_sync_id:
            self.report_warning(
                f'Unable to fetch GVS PO Token for {client} client: Missing required Data Sync ID for account. '
                'You may need to pass a Data Sync ID with --extractor-args "youtube:data_sync_id=XXX"')
            return None

        return self._fetch_po_token(
            client=client,
            context=context.value,
            ytcfg=ytcfg,
            visitor_data=visitor_data,
            data_sync_id=data_sync_id,
            session_index=session_index,
            player_url=player_url,
            video_id=video_id,
            **kwargs,
        )

    def _fetch_po_token(self, client, **kwargs):
        """(Unstable) External PO Token fetch stub"""

    @staticmethod
    def _is_agegated(player_response):
        """
        Tell whether a player response indicates an age-gated video.

        True if the playability status carries a `desktopLegacyAgeGateReason`,
        or if its `status` / `reason` text contains one of the known age-gate
        markers (compared case-insensitively).
        """
        if traverse_obj(player_response, ('playabilityStatus', 'desktopLegacyAgeGateReason')):
            return True

        AGE_GATE_REASONS = (
            'confirm your age', 'age-restricted', 'inappropriate',  # reason
            'age_verification_required', 'age_check_required',  # status
        )
        # The markers are lower-case while status values are upper-case identifiers
        # (cf. 'UNPLAYABLE'), so normalize case before matching. Non-string values
        # are dropped since they cannot be substring-matched.
        reasons = [
            reason.lower() for reason in traverse_obj(
                player_response, ('playabilityStatus', ('status', 'reason'), {str}))
        ]
        return any(expected in reason for expected in AGE_GATE_REASONS for reason in reasons)

    @staticmethod
    def _is_unplayable(player_response):
        """Tell whether the playability status of the player response is 'UNPLAYABLE'."""
        status = traverse_obj(player_response, ('playabilityStatus', 'status'))
        return status == 'UNPLAYABLE'

    def _extract_player_response(self, client, video_id, master_ytcfg, player_ytcfg, player_url, initial_pr, visitor_data, data_sync_id, po_token):
        """
        Request the player API response of `video_id` for a single client.

        Session ids parsed from `data_sync_id` take precedence over the ones
        extracted from the ytcfgs / initial player response. Player params come
        from the `player_params` extractor argument, defaulting to the client's
        PLAYER_PARAMS. `po_token`, when given, is sent as the request's
        service integrity dimension. The signature timestamp is only looked up
        when a player URL is available.

        @return: the API response, or None if it is empty.
        """
        session_index = self._extract_session_index(master_ytcfg, player_ytcfg)

        delegated_session_id = self._parse_data_sync_id(data_sync_id)[0]
        if not delegated_session_id:
            delegated_session_id = self._extract_delegated_session_id(master_ytcfg, initial_pr, player_ytcfg)

        user_session_id = self._parse_data_sync_id(data_sync_id)[1]
        if not user_session_id:
            user_session_id = self._extract_user_session_id(master_ytcfg, initial_pr, player_ytcfg)

        api_headers = self.generate_api_headers(
            ytcfg=player_ytcfg,
            default_client=client,
            visitor_data=visitor_data,
            session_index=session_index,
            delegated_session_id=delegated_session_id,
            user_session_id=user_session_id,
        )

        request_query = {'videoId': video_id}

        base_client_name = _split_innertube_client(client)[0]
        default_player_params = traverse_obj(INNERTUBE_CLIENTS, (base_client_name, 'PLAYER_PARAMS', {str}))
        player_params = self._configuration_arg('player_params', [default_player_params], casesense=True)[0]
        if player_params:
            request_query['params'] = player_params

        if po_token:
            request_query['serviceIntegrityDimensions'] = {'poToken': po_token}

        signature_timestamp = None
        if player_url:
            signature_timestamp = self._extract_signature_timestamp(video_id, player_url, master_ytcfg, fatal=False)
        request_query.update(self._generate_player_context(signature_timestamp))

        readable_client = client.replace('_', ' ').strip()
        response = self._extract_response(
            item_id=video_id, ep='player', query=request_query,
            ytcfg=player_ytcfg, headers=api_headers, fatal=True,
            default_client=client,
            note=f'Downloading {readable_client} player API JSON',
        )
        return response or None

    def _get_requested_clients(self, url, smuggled_data):
        """
        Resolve the `player_client` extractor argument into the clients to use.

        Each value may be a client name, 'default' (the default clients for the
        current authentication state), 'all' (every non-underscore-prefixed
        client, highest priority first) or '-NAME' to exclude a client.
        Unknown names are skipped with a warning. If nothing was requested,
        the default clients are used.

        When authenticated, 'web_music' is added for music URLs and clients
        that do not support cookies are dropped with a warning.

        @param url: the URL being extracted; checked with is_music_url().
        @param smuggled_data: smuggled data dict; its 'is_music_url' key is consulted.
        @return: the requested clients, de-duplicated with order preserved.
        @raises ExtractorError: if the exclusions leave no client.
        """
        requested_clients = []
        excluded_clients = []
        default_clients = self._DEFAULT_AUTHED_CLIENTS if self.is_authenticated else self._DEFAULT_CLIENTS
        allowed_clients = sorted(
            (client for client in INNERTUBE_CLIENTS if client[:1] != '_'),
            key=lambda client: INNERTUBE_CLIENTS[client]['priority'], reverse=True)
        for client in self._configuration_arg('player_client'):
            if client == 'default':
                requested_clients.extend(default_clients)
            elif client == 'all':
                requested_clients.extend(allowed_clients)
            elif client.startswith('-'):
                excluded_clients.append(client[1:])
            elif client not in allowed_clients:
                self.report_warning(f'Skipping unsupported client "{client}"')
            else:
                requested_clients.append(client)
        if not requested_clients:
            requested_clients.extend(default_clients)

        # Drop EVERY occurrence of an excluded client. The same client can have been
        # added more than once (e.g. via both 'all' and 'default'), and list.remove()
        # would only drop the first one, letting the client survive the exclusion
        requested_clients = [client for client in requested_clients if client not in excluded_clients]
        if not requested_clients:
            raise ExtractorError('No player clients have been requested', expected=True)

        if self.is_authenticated:
            if (smuggled_data.get('is_music_url') or self.is_music_url(url)) and 'web_music' not in requested_clients:
                requested_clients.append('web_music')

            # Collected up front so the list is not modified while being iterated
            unsupported_clients = [
                client for client in requested_clients if not INNERTUBE_CLIENTS[client]['SUPPORTS_COOKIES']
            ]
            for client in unsupported_clients:
                self.report_warning(f'Skipping client "{client}" since it does not support cookies', only_once=True)
                requested_clients.remove(client)

        return orderedSet(requested_clients)

    def _invalid_player_response(self, pr, video_id):
        """
        Return the video id found in the player response if it differs from
        `video_id`; otherwise return None.
        """
        # YouTube may return a different video player response than expected.
        # See: https://github.com/TeamNewPipe/NewPipe/issues/8713
        response_video_id = traverse_obj(pr, ('videoDetails', 'videoId'))
        if response_video_id == video_id:
            return None
        return response_video_id

    def _extract_player_responses(self, clients, video_id, webpage, master_ytcfg, smuggled_data):
        """
        Collect the player responses for `video_id` from each of the given clients.

        @param clients: client names to query, in order of preference.
        @param video_id: the video ID the responses must belong to.
        @param webpage: the downloaded webpage, if any; searched for the initial
                        player response and the player URL.
        @param master_ytcfg: ytcfg used as-is for the 'web' client and as a fallback elsewhere.
        @param smuggled_data: not used by this method.
        @return: tuple (player responses, player URL). Responses of clients that
                 lack a required PO Token are placed last.
        @raises ExtractorError: if no player response could be obtained, or all
                                of them were for a different video.
        """
        initial_pr = None
        if webpage:
            initial_pr = self._search_json(
                self._YT_INITIAL_PLAYER_RESPONSE_RE, webpage, 'initial player response', video_id, fatal=False)

        prs = []
        deprioritized_prs = []

        if initial_pr and not self._invalid_player_response(initial_pr, video_id):
            # Android player_response does not have microFormats which are needed for
            # extraction of some data. So we return the initial_pr with formats
            # stripped out even if not requested by the user
            # See: https://github.com/yt-dlp/yt-dlp/issues/501
            prs.append({**initial_pr, 'streamingData': None})

        all_clients = set(clients)
        # Reversed so that pop() below takes the clients in their original order,
        # and a client added by append_client() is the next one to be processed
        clients = clients[::-1]

        def append_client(*client_names):
            """ Append the first client name that exists but not already used """
            for client_name in client_names:
                actual_client = _split_innertube_client(client_name)[0]
                if actual_client in INNERTUBE_CLIENTS:
                    if actual_client not in all_clients:
                        clients.append(client_name)
                        all_clients.add(actual_client)
                        return

        tried_iframe_fallback = False
        # These are resolved once and then reused for the remaining clients
        player_url = visitor_data = data_sync_id = None
        # Maps client -> video id of the (wrong) player response it returned
        skipped_clients = {}
        while clients:
            deprioritize_pr = False
            client, base_client, variant = _split_innertube_client(clients.pop())
            player_ytcfg = master_ytcfg if client == 'web' else {}
            if 'configs' not in self._configuration_arg('player_skip') and client != 'web':
                player_ytcfg = self._download_ytcfg(client, video_id) or player_ytcfg

            player_url = player_url or self._extract_player_url(master_ytcfg, player_ytcfg, webpage=webpage)
            require_js_player = self._get_default_ytcfg(client).get('REQUIRE_JS_PLAYER')
            if 'js' in self._configuration_arg('player_skip'):
                require_js_player = False
                player_url = None

            # The fallback download of the player URL is attempted at most once
            if not player_url and not tried_iframe_fallback and require_js_player:
                player_url = self._download_player_url(video_id)
                tried_iframe_fallback = True

            visitor_data = visitor_data or self._extract_visitor_data(master_ytcfg, initial_pr, player_ytcfg)
            data_sync_id = data_sync_id or self._extract_data_sync_id(master_ytcfg, initial_pr, player_ytcfg)

            fetch_po_token_args = {
                'client': client,
                'visitor_data': visitor_data,
                'video_id': video_id,
                'data_sync_id': data_sync_id if self.is_authenticated else None,
                'player_url': player_url if require_js_player else None,
                'session_index': self._extract_session_index(master_ytcfg, player_ytcfg),
                'ytcfg': player_ytcfg,
            }

            player_po_token = self.fetch_po_token(
                context=_PoTokenContext.PLAYER, **fetch_po_token_args)

            gvs_po_token = self.fetch_po_token(
                context=_PoTokenContext.GVS, **fetch_po_token_args)

            required_pot_contexts = self._get_default_ytcfg(client)['PO_TOKEN_REQUIRED_CONTEXTS']

            if (
                not player_po_token
                and _PoTokenContext.PLAYER in required_pot_contexts
            ):
                # TODO: may need to skip player response request. Unsure yet..
                self.report_warning(
                    f'No Player PO Token provided for {client} client, '
                    f'which may be required for working {client} formats. This client will be deprioritized. '
                    f'You can manually pass a Player PO Token for this client with --extractor-args "youtube:po_token={client}.player+XXX". '
                    f'For more information, refer to {PO_TOKEN_GUIDE_URL} .', only_once=True)
                deprioritize_pr = True

            if (
                not gvs_po_token
                and _PoTokenContext.GVS in required_pot_contexts
                and 'missing_pot' in self._configuration_arg('formats')
            ):
                # note: warning with help message is provided later during format processing
                self.report_warning(
                    f'No GVS PO Token provided for {client} client, '
                    f'which may be required for working {client} formats. This client will be deprioritized',
                    only_once=True)
                deprioritize_pr = True

            # The initial player response is reused for the web client when available
            pr = initial_pr if client == 'web' else None
            try:
                pr = pr or self._extract_player_response(
                    client, video_id,
                    master_ytcfg=player_ytcfg or master_ytcfg,
                    player_ytcfg=player_ytcfg,
                    player_url=player_url,
                    initial_pr=initial_pr,
                    visitor_data=visitor_data,
                    data_sync_id=data_sync_id,
                    po_token=player_po_token)
            except ExtractorError as e:
                # A failing client is reported and skipped; the others are still tried
                self.report_warning(e)
                continue

            if pr_id := self._invalid_player_response(pr, video_id):
                skipped_clients[client] = pr_id
            elif pr:
                # Save client name for introspection later
                sd = traverse_obj(pr, ('streamingData', {dict})) or {}
                sd[STREAMING_DATA_CLIENT_NAME] = client
                sd[STREAMING_DATA_INITIAL_PO_TOKEN] = gvs_po_token
                for f in traverse_obj(sd, (('formats', 'adaptiveFormats'), ..., {dict})):
                    f[STREAMING_DATA_CLIENT_NAME] = client
                    f[STREAMING_DATA_INITIAL_PO_TOKEN] = gvs_po_token
                if deprioritize_pr:
                    deprioritized_prs.append(pr)
                else:
                    prs.append(pr)

            # EU countries require age-verification for accounts to access age-restricted videos
            # If account is not age-verified, _is_agegated() will be truthy for non-embedded clients
            if self.is_authenticated and self._is_agegated(pr):
                self.to_screen(
                    f'{video_id}: This video is age-restricted and YouTube is requiring '
                    'account age-verification; some formats may be missing', only_once=True)
                # tv_embedded can work around the age-verification requirement for embeddable videos
                # web_creator may work around age-verification for all videos but requires PO token
                append_client('tv_embedded', 'web_creator')

        prs.extend(deprioritized_prs)

        if skipped_clients:
            self.report_warning(
                f'Skipping player responses from {"/".join(skipped_clients)} clients '
                f'(got player responses for video "{"/".join(set(skipped_clients.values()))}" instead of "{video_id}")')
            if not prs:
                raise ExtractorError(
                    'All player responses are invalid. Your IP is likely being blocked by Youtube', expected=True)
        elif not prs:
            raise ExtractorError('Failed to extract any player response')
        return prs, player_url

    def _needs_live_processing(self, live_status, duration):
        if ((live_status == 'is_live' and self.get_param('live_from_start'))
                or (live_status == 'post_live' and (duration or 0) > 2 * 3600)):
            return live_status

    def _report_pot_format_skipped(self, video_id, client_name, proto):
        """
        Report that the `proto` formats of a client are skipped for lack of a GVS PO Token.

        The message is only written to the debug log for clients that are among
        the default clients, and raised as a warning for any other client.
        """
        message = ''.join((
            f'{video_id}: {client_name} client {proto} formats require a GVS PO Token which was not provided. ',
            'They will be skipped as they may yield HTTP Error 403. ',
            f'You can manually pass a GVS PO Token for this client with --extractor-args "youtube:po_token={client_name}.gvs+XXX". ',
            f'For more information, refer to  {PO_TOKEN_GUIDE_URL} . ',
            'To enable these broken formats anyway, pass --extractor-args "youtube:formats=missing_pot"',
        ))

        # Only raise a warning for non-default clients, to not confuse users.
        # iOS HLS formats still work without PO Token, so we don't need to warn about them.
        is_default_client = client_name in (*self._DEFAULT_CLIENTS, *self._DEFAULT_AUTHED_CLIENTS)
        report = self.write_debug if is_default_client else self.report_warning
        report(message, only_once=True)

    def _extract_formats_and_subtitles(self, streaming_data, video_id, player_url, live_status, duration):
        CHUNK_SIZE = 10 << 20
        PREFERRED_LANG_VALUE = 10
        original_language = None
        itags, stream_ids = collections.defaultdict(set), []
        itag_qualities, res_qualities = {}, {0: None}
        q = qualities([
            # Normally tiny is the smallest video-only formats. But
            # audio-only formats with unknown quality may get tagged as tiny
            'tiny',
            'audio_quality_ultralow', 'audio_quality_low', 'audio_quality_medium', 'audio_quality_high',  # Audio only formats
            'small', 'medium', 'large', 'hd720', 'hd1080', 'hd1440', 'hd2160', 'hd2880', 'highres',
        ])
        streaming_formats = traverse_obj(streaming_data, (..., ('formats', 'adaptiveFormats'), ...))
        format_types = self._configuration_arg('formats')
        all_formats = 'duplicate' in format_types
        if self._configuration_arg('include_duplicate_formats'):
            all_formats = True
            self._downloader.deprecated_feature('[youtube] include_duplicate_formats extractor argument is deprecated. '
                                                'Use formats=duplicate extractor argument instead')

        def build_fragments(f):
            return LazyList({
                'url': update_url_query(f['url'], {
                    'range': f'{range_start}-{min(range_start + CHUNK_SIZE - 1, f["filesize"])}',
                }),
            } for range_start in range(0, f['filesize'], CHUNK_SIZE))

        for fmt in streaming_formats:
            client_name = fmt[STREAMING_DATA_CLIENT_NAME]
            if fmt.get('targetDurationSec'):
                continue

            itag = str_or_none(fmt.get('itag'))
            audio_track = fmt.get('audioTrack') or {}
            stream_id = (itag, audio_track.get('id'), fmt.get('isDrc'))
            if not all_formats:
                if stream_id in stream_ids:
                    continue

            quality = fmt.get('quality')
            height = int_or_none(fmt.get('height'))
            if quality == 'tiny' or not quality:
                quality = fmt.get('audioQuality', '').lower() or quality
            # The 3gp format (17) in android client has a quality of "small",
            # but is actually worse than other formats
            if itag == '17':
                quality = 'tiny'
            if quality:
                if itag:
                    itag_qualities[itag] = quality
                if height:
                    res_qualities[height] = quality

            display_name = audio_track.get('displayName') or ''
            is_original = 'original' in display_name.lower()
            is_descriptive = 'descriptive' in display_name.lower()
            is_default = audio_track.get('audioIsDefault')
            language_code = audio_track.get('id', '').split('.')[0]
            if language_code and (is_original or (is_default and not original_language)):
                original_language = language_code

            has_drm = bool(fmt.get('drmFamilies'))

            # FORMAT_STREAM_TYPE_OTF(otf=1) requires downloading the init fragment
            # (adding `&sq=0` to the URL) and parsing emsg box to determine the
            # number of fragment that would subsequently requested with (`&sq=N`)
            if fmt.get('type') == 'FORMAT_STREAM_TYPE_OTF' and not has_drm:
                continue

            if has_drm:
                msg = f'Some {client_name} client https formats have been skipped as they are DRM protected. '
                if client_name == 'tv':
                    msg += (
                        f'{"Your account" if self.is_authenticated else "The current session"} may have '
                        f'an experiment that applies DRM to all videos on the tv client. '
                        f'See  https://github.com/yt-dlp/yt-dlp/issues/12563  for more details.'
                    )
                self.report_warning(msg, video_id, only_once=True)

            fmt_url = fmt.get('url')
            if not fmt_url:
                sc = urllib.parse.parse_qs(fmt.get('signatureCipher'))
                fmt_url = url_or_none(try_get(sc, lambda x: x['url'][0]))
                encrypted_sig = try_get(sc, lambda x: x['s'][0])
                if not all((sc, fmt_url, player_url, encrypted_sig)):
                    self.report_warning(
                        f'Some {client_name} client https formats have been skipped as they are missing a url. '
                        f'{"Your account" if self.is_authenticated else "The current session"} may have '
                        f'the SSAP (server-side ads) experiment which interferes with yt-dlp. '
                        f'Please see  https://github.com/yt-dlp/yt-dlp/issues/12482  for more details.',
                        video_id, only_once=True)
                    continue
                try:
                    fmt_url += '&{}={}'.format(
                        traverse_obj(sc, ('sp', -1)) or 'signature',
                        self._decrypt_signature(encrypted_sig, video_id, player_url),
                    )
                except ExtractorError as e:
                    self.report_warning('Signature extraction failed: Some formats may be missing',
                                        video_id=video_id, only_once=True)
                    self.write_debug(e, only_once=True)
                    continue

            query = parse_qs(fmt_url)
            if query.get('n'):
                try:
                    decrypt_nsig = self._cached(self._decrypt_nsig, 'nsig', query['n'][0])
                    fmt_url = update_url_query(fmt_url, {
                        'n': decrypt_nsig(query['n'][0], video_id, player_url),
                    })
                except ExtractorError as e:
                    if player_url:
                        self.report_warning(
                            f'nsig extraction failed: Some formats may be missing\n'
                            f'         n = {query["n"][0]} ; player = {player_url}',
                            video_id=video_id, only_once=True)
                        self.write_debug(e, only_once=True)
                    else:
                        self.report_warning(
                            'Cannot decrypt nsig without player_url: Some formats may be missing',
                            video_id=video_id, only_once=True)
                    continue

            tbr = float_or_none(fmt.get('averageBitrate') or fmt.get('bitrate'), 1000)
            format_duration = traverse_obj(fmt, ('approxDurationMs', {float_or_none(scale=1000)}))
            # Some formats may have much smaller duration than others (possibly damaged during encoding)
            # E.g. 2-nOtRESiUc Ref: https://github.com/yt-dlp/yt-dlp/issues/2823
            # Make sure to avoid false positives with small duration differences.
            # E.g. __2ABJjxzNo, ySuUZEjARPY
            is_damaged = try_call(lambda: format_duration < duration // 2)
            if is_damaged:
                self.report_warning(
                    f'{video_id}: Some formats are possibly damaged. They will be deprioritized', only_once=True)

            po_token = fmt.get(STREAMING_DATA_INITIAL_PO_TOKEN)

            if po_token:
                fmt_url = update_url_query(fmt_url, {'pot': po_token})

            # Clients that require PO Token return videoplayback URLs that may return 403
            require_po_token = (
                not po_token
                and _PoTokenContext.GVS in self._get_default_ytcfg(client_name)['PO_TOKEN_REQUIRED_CONTEXTS']
                and itag not in ['18'])  # these formats do not require PO Token

            if require_po_token and 'missing_pot' not in self._configuration_arg('formats'):
                self._report_pot_format_skipped(video_id, client_name, 'https')
                continue

            name = fmt.get('qualityLabel') or quality.replace('audio_quality_', '') or ''
            fps = int_or_none(fmt.get('fps')) or 0
            dct = {
                'asr': int_or_none(fmt.get('audioSampleRate')),
                'filesize': int_or_none(fmt.get('contentLength')),
                'format_id': f'{itag}{"-drc" if fmt.get("isDrc") else ""}',
                'format_note': join_nonempty(
                    join_nonempty(display_name, is_default and ' (default)', delim=''),
                    name, fmt.get('isDrc') and 'DRC',
                    try_get(fmt, lambda x: x['projectionType'].replace('RECTANGULAR', '').lower()),
                    try_get(fmt, lambda x: x['spatialAudioType'].replace('SPATIAL_AUDIO_TYPE_', '').lower()),
                    is_damaged and 'DAMAGED', require_po_token and 'MISSING POT',
                    (self.get_param('verbose') or all_formats) and short_client_name(client_name),
                    delim=', '),
                # Format 22 is likely to be damaged. See https://github.com/yt-dlp/yt-dlp/issues/3372
                'source_preference': (-5 if itag == '22' else -1) + (100 if 'Premium' in name else 0),
                'fps': fps if fps > 1 else None,  # For some formats, fps is wrongly returned as 1
                'audio_channels': fmt.get('audioChannels'),
                'height': height,
                'quality': q(quality) - bool(fmt.get('isDrc')) / 2,
                'has_drm': has_drm,
                'tbr': tbr,
                'filesize_approx': filesize_from_tbr(tbr, format_duration),
                'url': fmt_url,
                'width': int_or_none(fmt.get('width')),
                'language': join_nonempty(language_code, 'desc' if is_descriptive else '') or None,
                'language_preference': PREFERRED_LANG_VALUE if is_original else 5 if is_default else -10 if is_descriptive else -1,
                # Strictly de-prioritize broken, damaged and 3gp formats
                'preference': -20 if require_po_token else -10 if is_damaged else -2 if itag == '17' else None,
            }
            mime_mobj = re.match(
                r'((?:[^/]+)/(?:[^;]+))(?:;\s*codecs="([^"]+)")?', fmt.get('mimeType') or '')
            if mime_mobj:
                dct['ext'] = mimetype2ext(mime_mobj.group(1))
                dct.update(parse_codecs(mime_mobj.group(2)))
            if itag:
                itags[itag].add(('https', dct.get('language')))
                stream_ids.append(stream_id)
            single_stream = 'none' in (dct.get('acodec'), dct.get('vcodec'))
            if single_stream and dct.get('ext'):
                dct['container'] = dct['ext'] + '_dash'

            if (all_formats or 'dashy' in format_types) and dct['filesize']:
                yield {
                    **dct,
                    'format_id': f'{dct["format_id"]}-dashy' if all_formats else dct['format_id'],
                    'protocol': 'http_dash_segments',
                    'fragments': build_fragments(dct),
                }
            if all_formats or 'dashy' not in format_types:
                dct['downloader_options'] = {'http_chunk_size': CHUNK_SIZE}
                yield dct

        needs_live_processing = self._needs_live_processing(live_status, duration)
        skip_bad_formats = 'incomplete' not in format_types
        if self._configuration_arg('include_incomplete_formats'):
            skip_bad_formats = False
            self._downloader.deprecated_feature('[youtube] include_incomplete_formats extractor argument is deprecated. '
                                                'Use formats=incomplete extractor argument instead')

        skip_manifests = set(self._configuration_arg('skip'))
        if (not self.get_param('youtube_include_hls_manifest', True)
                or needs_live_processing == 'is_live'  # These will be filtered out by YoutubeDL anyway
                or (needs_live_processing and skip_bad_formats)):
            skip_manifests.add('hls')

        if not self.get_param('youtube_include_dash_manifest', True):
            skip_manifests.add('dash')
        if self._configuration_arg('include_live_dash'):
            self._downloader.deprecated_feature('[youtube] include_live_dash extractor argument is deprecated. '
                                                'Use formats=incomplete extractor argument instead')
        elif skip_bad_formats and live_status == 'is_live' and needs_live_processing != 'is_live':
            skip_manifests.add('dash')

        def process_manifest_format(f, proto, client_name, itag, po_token):
            """Post-process one manifest format dict in place and decide whether to keep it.

            @param f            format dict parsed from an HLS/DASH manifest; mutated in place
            @param proto        manifest protocol label; the visible callers pass 'hls' or 'dash'
            @param client_name  client name stored alongside the streaming data the manifest came from
            @param itag         itag of the format (taken from the URL for HLS, from 'format_id' for DASH);
                                may be None when the HLS URL contains no itag
            @param po_token     PO Token stored alongside the streaming data, if any
            @returns            True if the caller should yield the format, False if it must be dropped

            NOTE(review): itags, all_formats, q, itag_qualities, res_qualities, original_language,
            PREFERRED_LANG_VALUE and video_id come from the enclosing scope, which is not shown here.
            """
            # A format is identified per itag by (protocol, language); unless all formats
            # were requested, a repeated combination is dropped.
            # NOTE(review): itags is indexed before anything is added to it, so it is
            # presumably a defaultdict(set) - confirm in the enclosing function
            key = (proto, f.get('language'))
            if not all_formats and key in itags[itag]:
                return False

            # Give source_preference a numeric default so the adjustments below can use -= / +=
            if f.get('source_preference') is None:
                f['source_preference'] = -1

            # Clients that require PO Token return videoplayback URLs that may return 403
            # hls does not currently require PO Token
            if (
                not po_token
                and _PoTokenContext.GVS in self._get_default_ytcfg(client_name)['PO_TOKEN_REQUIRED_CONTEXTS']
                and proto != 'hls'
            ):
                # Without the "missing_pot" value in the "formats" extractor argument the format
                # is reported and skipped; with it, the format is kept but labelled and deprioritized
                if 'missing_pot' not in self._configuration_arg('formats'):
                    self._report_pot_format_skipped(video_id, client_name, proto)
                    return False
                f['format_note'] = join_nonempty(f.get('format_note'), 'MISSING POT', delim=' ')
                f['source_preference'] -= 20

            # Only formats that survived the checks above are recorded as seen
            itags[itag].add(key)

            # The protocol suffix is added to the format ID when all formats were requested,
            # or when this itag has been recorded under a different protocol as well
            if itag and all_formats:
                f['format_id'] = f'{itag}-{proto}'
            elif any(p != proto for p, _ in itags[itag]):
                f['format_id'] = f'{itag}-{proto}'
            elif itag:
                f['format_id'] = itag

            # Mark and prefer the track whose language matches the original language
            if original_language and f.get('language') == original_language:
                f['format_note'] = join_nonempty(f.get('format_note'), '(default)', delim=' ')
                f['language_preference'] = PREFERRED_LANG_VALUE

            # These two itags are labelled "Premium" and strongly preferred
            if itag in ('616', '235'):
                f['format_note'] = join_nonempty(f.get('format_note'), 'Premium', delim=' ')
                f['source_preference'] += 100

            # Quality is looked up by the itag part of the format ID (the text before the first "-");
            # if that yields -1 and a height is known, the closest entry of res_qualities is used instead
            f['quality'] = q(itag_qualities.get(try_get(f, lambda f: f['format_id'].split('-')[0]), -1))
            if f['quality'] == -1 and f.get('height'):
                f['quality'] = q(res_qualities[min(res_qualities, key=lambda x: abs(x - f['height']))])
            # Show which client supplied the format in verbose mode or when listing all formats
            if self.get_param('verbose') or all_formats:
                f['format_note'] = join_nonempty(
                    f.get('format_note'), short_client_name(client_name), delim=', ')
            # Frame rates of 1 or below are discarded (presumably not a real frame rate - TODO confirm)
            if f.get('fps') and f['fps'] <= 1:
                del f['fps']

            # For HLS a DRM flag is downgraded to 'maybe' and the format is slightly deprioritized
            if proto == 'hls' and f.get('has_drm'):
                f['has_drm'] = 'maybe'
                f['source_preference'] -= 5
            return True

        subtitles = {}
        for sd in streaming_data:
            client_name = sd[STREAMING_DATA_CLIENT_NAME]
            po_token = sd.get(STREAMING_DATA_INITIAL_PO_TOKEN)
            hls_manifest_url = 'hls' not in skip_manifests and sd.get('hlsManifestUrl')
            if hls_manifest_url:
                if po_token:
                    hls_manifest_url = hls_manifest_url.rstrip('/') + f'/pot/{po_token}'
                fmts, subs = self._extract_m3u8_formats_and_subtitles(
                    hls_manifest_url, video_id, 'mp4', fatal=False, live=live_status == 'is_live')
                subtitles = self._merge_subtitles(subs, subtitles)
                for f in fmts:
                    if process_manifest_format(f, 'hls', client_name, self._search_regex(
                            r'/itag/(\d+)', f['url'], 'itag', default=None), po_token):
                        yield f

            dash_manifest_url = 'dash' not in skip_manifests and sd.get('dashManifestUrl')
            if dash_manifest_url:
                if po_token:
                    dash_manifest_url = dash_manifest_url.rstrip('/') + f'/pot/{po_token}'
                formats, subs = self._extract_mpd_formats_and_subtitles(dash_manifest_url, video_id, fatal=False)
                subtitles = self._merge_subtitles(subs, subtitles)  # Prioritize HLS subs over DASH
                for f in formats:
                    if process_manifest_format(f, 'dash', client_name, f['format_id'], po_token):
                        f['filesize'] = int_or_none(self._search_regex(
                            r'/clen/(\d+)', f.get('fragment_base_url') or f['url'], 'file size', default=None))
                        if needs_live_processing:
                            f['is_from_start'] = True

                        yield f
        yield subtitles

    def _extract_storyboard(self, player_responses, duration):
        """Yield an mhtml "storyboard" format dict for each level of the storyboard spec.

        The spec is read from the first player response that provides
        storyboards.playerStoryboardSpecRenderer.spec. It is a '|'-separated string whose
        first field is the URL template and whose remaining fields each describe one
        storyboard level as 8 '#'-separated values.

        @param player_responses  player response dicts to search for the spec
        @param duration          video duration in seconds. When it is None or 0 the formats
                                 are still yielded, but 'fps' is None and the fragments carry
                                 no 'duration' (previously this raised TypeError/ZeroDivisionError)
        """
        spec = get_first(
            player_responses, ('storyboards', 'playerStoryboardSpecRenderer', 'spec'), default='').split('|')[::-1]
        # The list is reversed, so the URL template (first field of the spec) is popped off the end
        base_url = url_or_none(urljoin('https://i.ytimg.com/', spec.pop() or None))
        if not base_url:
            return
        L = len(spec) - 1
        for i, args in enumerate(spec):
            args = args.split('#')
            counts = list(map(int_or_none, args[:5]))
            # All five leading values must be non-zero integers; this also protects the divisions below
            if len(args) != 8 or not all(counts):
                self.report_warning(f'Malformed storyboard {i}: {"#".join(args)}{bug_reports_message()}')
                continue
            width, height, frame_count, cols, rows = counts
            N, sigh = args[6:]

            # i runs over the reversed list, so L - i is the level's position in the original spec
            url = base_url.replace('$L', str(L - i)).replace('$N', N) + f'&sigh={sigh}'
            # Each fragment is one image holding a cols x rows grid of frames
            fragment_count = frame_count / (cols * rows)
            if duration:
                fps = frame_count / duration
                fragment_duration = duration / fragment_count
            else:
                # Unknown duration: timing cannot be derived, but the images are still usable
                fps = fragment_duration = None

            fragments = []
            for j in range(math.ceil(fragment_count)):
                fragment = {'url': url.replace('$M', str(j))}
                if fragment_duration is not None:
                    # The last fragment may be only partially filled, so cap it at the remaining time
                    fragment['duration'] = min(fragment_duration, duration - (j * fragment_duration))
                fragments.append(fragment)

            yield {
                'format_id': f'sb{i}',
                'format_note': 'storyboard',
                'ext': 'mhtml',
                'protocol': 'mhtml',
                'acodec': 'none',
                'vcodec': 'none',
                'url': url,
                'width': width,
                'height': height,
                'fps': fps,
                'rows': rows,
                'columns': cols,
                'fragments': fragments,
            }

    def _download_player_responses(self, url, smuggled_data, video_id, webpage_url):
        webpage = None
        if 'webpage' not in self._configuration_arg('player_skip'):
            query = {'bpctr': '9999999999', 'has_verified': '1'}
            pp = self._configuration_arg('player_params', [None], casesense=True)[0]
            if pp:
                query['pp'] = pp
            webpage = self._download_webpage_with_retries(webpage_url, video_id, query=query)

        master_ytcfg = self.extract_ytcfg(video_id, webpage) or self._get_default_ytcfg()

        player_responses, player_url = self._extract_player_responses(
            self._get_requested_clients(url, smuggled_data),
            video_id, webpage, master_ytcfg, smuggled_data)

        return webpage, master_ytcfg, player_responses, player_url

    def _list_formats(self, video_id, microformats, video_details, player_responses, player_url, duration=None):
        """Work out the live status of a video and extract its formats.

        @returns  tuple of (live_broadcast_details, live_status, streaming_data, formats, subtitles),
                  where subtitles is the final item yielded by _extract_formats_and_subtitles
                  and formats is everything yielded before it
        """
        def detail(key):
            return get_first(video_details, key)

        live_broadcast_details = traverse_obj(microformats, (..., 'liveBroadcastDetails'))

        is_live = detail('isLive')
        if is_live is None:
            # Fall back to the microformat data when videoDetails does not say
            is_live = get_first(live_broadcast_details, 'isLiveNow')
        live_content = detail('isLiveContent')
        is_upcoming = detail('isUpcoming')
        post_live = detail('isPostLiveDvr')

        # The checks are ordered by precedence: the first matching state wins
        if post_live:
            live_status = 'post_live'
        elif is_live:
            live_status = 'is_live'
        elif is_upcoming:
            live_status = 'is_upcoming'
        elif live_content:
            live_status = 'was_live'
        elif False in (is_live, live_content):
            # At least one flag was explicitly reported as false
            live_status = 'not_live'
        else:
            live_status = None

        streaming_data = traverse_obj(player_responses, (..., 'streamingData'))
        *formats, subtitles = self._extract_formats_and_subtitles(
            streaming_data, video_id, player_url, live_status, duration)

        # If there are no formats that definitely don't have DRM, all have DRM
        if not any(not fmt.get('has_drm') for fmt in formats):
            for fmt in formats:
                fmt['has_drm'] = True

        return live_broadcast_details, live_status, streaming_data, formats, subtitles

    def _real_extract(self, url):
        url, smuggled_data = unsmuggle_url(url, {})
        video_id = self._match_id(url)

        base_url = self.http_scheme() + '//www.youtube.com/'
        webpage_url = base_url + 'watch?v=' + video_id

        webpage, master_ytcfg, player_responses, player_url = self._download_player_responses(url, smuggled_data, video_id, webpage_url)

        playability_statuses = traverse_obj(
            player_responses, (..., 'playabilityStatus'), expected_type=dict)

        trailer_video_id = get_first(
            playability_statuses,
            ('errorScreen', 'playerLegacyDesktopYpcTrailerRenderer', 'trailerVideoId'),
            expected_type=str)
        if trailer_video_id:
            return self.url_result(
                trailer_video_id, self.ie_key(), trailer_video_id)

        search_meta = ((lambda x: self._html_search_meta(x, webpage, default=None))
                       if webpage else (lambda x: None))

        video_details = traverse_obj(player_responses, (..., 'videoDetails'), expected_type=dict)
        microformats = traverse_obj(
            player_responses, (..., 'microformat', 'playerMicroformatRenderer'),
            expected_type=dict)

        translated_title = self._get_text(microformats, (..., 'title'))
        video_title = ((self._preferred_lang and translated_title)
                       or get_first(video_details, 'title')  # primary
                       or translated_title
                       or search_meta(['og:title', 'twitter:title', 'title']))
        translated_description = self._get_text(microformats, (..., 'description'))
        original_description = get_first(video_details, 'shortDescription')
        video_description = (
            (self._preferred_lang and translated_description)
            # If original description is blank, it will be an empty string.
            # Do not prefer translated description in this case.
            or original_description if original_description is not None else translated_description)

        multifeed_metadata_list = get_first(
            player_responses,
            ('multicamera', 'playerLegacyMulticameraRenderer', 'metadataList'),
            expected_type=str)
        if multifeed_metadata_list and not smuggled_data.get('force_singlefeed'):
            if self.get_param('noplaylist'):
                self.to_screen(f'Downloading just video {video_id} because of --no-playlist')
            else:
                entries = []
                feed_ids = []
                for feed in multifeed_metadata_list.split(','):
                    # Unquote should take place before split on comma (,) since textual
                    # fields may contain comma as well (see
                    # https://github.com/ytdl-org/youtube-dl/issues/8536)
                    feed_data = urllib.parse.parse_qs(
                        urllib.parse.unquote_plus(feed))

                    def feed_entry(name):
                        # First value of the given field in the parsed feed data, if it is a string
                        def first_value(data):
                            return data[name][0]

                        return try_get(feed_data, first_value, str)

                    feed_id = feed_entry('id')
                    if not feed_id:
                        continue
                    feed_title = feed_entry('title')
                    title = video_title
                    if feed_title:
                        title += f' ({feed_title})'
                    entries.append({
                        '_type': 'url_transparent',
                        'ie_key': 'Youtube',
                        'url': smuggle_url(
                            '{}watch?v={}'.format(base_url, feed_data['id'][0]),
                            {'force_singlefeed': True}),
                        'title': title,
                    })
                    feed_ids.append(feed_id)
                self.to_screen(
                    'Downloading multifeed video ({}) - add --no-playlist to just download video {}'.format(
                        ', '.join(feed_ids), video_id))
                return self.playlist_result(
                    entries, video_id, video_title, video_description)

        duration = (int_or_none(get_first(video_details, 'lengthSeconds'))
                    or int_or_none(get_first(microformats, 'lengthSeconds'))
                    or parse_duration(search_meta('duration')) or None)

        live_broadcast_details, live_status, streaming_data, formats, automatic_captions = \
            self._list_formats(video_id, microformats, video_details, player_responses, player_url, duration)
        if live_status == 'post_live':
            self.write_debug(f'{video_id}: Video is in Post-Live Manifestless mode')

        if not formats:
            if not self.get_param('allow_unplayable_formats') and traverse_obj(streaming_data, (..., 'licenseInfos')):
                self.report_drm(video_id)
            pemr = get_first(
                playability_statuses,
                ('errorScreen', 'playerErrorMessageRenderer'), expected_type=dict) or {}
            reason = self._get_text(pemr, 'reason') or get_first(playability_statuses, 'reason')
            subreason = clean_html(self._get_text(pemr, 'subreason') or '')
            if subreason:
                if subreason == 'The uploader has not made this video available in your country.':
                    countries = get_first(microformats, 'availableCountries')
                    if not countries:
                        regions_allowed = search_meta('regionsAllowed')
                        countries = regions_allowed.split(',') if regions_allowed else None
                    self.raise_geo_restricted(subreason, countries, metadata_available=True)
                reason += f'. {subreason}'
            if reason:
                if 'sign in' in reason.lower():
                    reason = remove_end(reason, 'This helps protect our community. Learn more')
                    reason = f'{remove_end(reason.strip(), ".")}. {self._youtube_login_hint}'
                self.raise_no_formats(reason, expected=True)

        keywords = get_first(video_details, 'keywords', expected_type=list) or []
        if not keywords and webpage:
            keywords = [
                unescapeHTML(m.group('content'))
                for m in re.finditer(self._meta_regex('og:video:tag'), webpage)]
        for keyword in keywords:
            if keyword.startswith('yt:stretch='):
                mobj = re.search(r'(\d+)\s*:\s*(\d+)', keyword)
                if mobj:
                    # NB: float is intentional for forcing float division
                    w, h = (float(v) for v in mobj.groups())
                    if w > 0 and h > 0:
                        ratio = w / h
                        for f in formats:
                            if f.get('vcodec') != 'none':
                                f['stretched_ratio'] = ratio
                        break
        thumbnails = self._extract_thumbnails((video_details, microformats), (..., ..., 'thumbnail'))
        thumbnail_url = search_meta(['og:image', 'twitter:image'])
        if thumbnail_url:
            thumbnails.append({
                'url': thumbnail_url,
            })
        original_thumbnails = thumbnails.copy()

        # The best resolution thumbnails sometimes do not appear in the webpage
        # See: https://github.com/yt-dlp/yt-dlp/issues/340
        # List of possible thumbnails - Ref: <https://stackoverflow.com/a/20542029>
        thumbnail_names = [
            # While the *1,*2,*3 thumbnails are just below their corresponding "*default" variants
            # in resolution, these are not the custom thumbnail. So de-prioritize them
            'maxresdefault', 'hq720', 'sddefault', 'hqdefault', '0', 'mqdefault', 'default',
            'sd1', 'sd2', 'sd3', 'hq1', 'hq2', 'hq3', 'mq1', 'mq2', 'mq3', '1', '2', '3',
        ]
        n_thumbnail_names = len(thumbnail_names)
        thumbnails.extend({
            'url': 'https://i.ytimg.com/vi{webp}/{video_id}/{name}{live}.{ext}'.format(
                video_id=video_id, name=name, ext=ext,
                webp='_webp' if ext == 'webp' else '', live='_live' if live_status == 'is_live' else ''),
        } for name in thumbnail_names for ext in ('webp', 'jpg'))
        for thumb in thumbnails:
            i = next((i for i, t in enumerate(thumbnail_names) if f'/{video_id}/{t}' in thumb['url']), n_thumbnail_names)
            thumb['preference'] = (0 if '.webp' in thumb['url'] else -1) - (2 * i)
        self._remove_duplicate_formats(thumbnails)
        self._downloader._sort_thumbnails(original_thumbnails)

        category = get_first(microformats, 'category') or search_meta('genre')
        channel_id = self.ucid_or_none(str_or_none(
            get_first(video_details, 'channelId')
            or get_first(microformats, 'externalChannelId')
            or search_meta('channelId')))
        owner_profile_url = get_first(microformats, 'ownerProfileUrl')

        live_start_time = parse_iso8601(get_first(live_broadcast_details, 'startTimestamp'))
        live_end_time = parse_iso8601(get_first(live_broadcast_details, 'endTimestamp'))
        if not duration and live_end_time and live_start_time:
            duration = live_end_time - live_start_time

        needs_live_processing = self._needs_live_processing(live_status, duration)

        def is_bad_format(fmt):
            # Returns True for formats that should be deprioritized, None otherwise
            if needs_live_processing and not fmt.get('is_from_start'):
                # Live-from-start processing is needed but this format does not start from the beginning
                return True
            if live_status != 'is_live' or needs_live_processing == 'is_live':
                return None
            if fmt.get('protocol') == 'http_dash_segments':
                # DASH format of an ongoing live stream that is not processed from the start
                return True
            return None

        for fmt in filter(is_bad_format, formats):
            fmt['preference'] = (fmt.get('preference') or -1) - 10
            fmt['format_note'] = join_nonempty(fmt.get('format_note'), '(Last 2 hours)', delim=' ')

        if needs_live_processing:
            self._prepare_live_from_start_formats(
                formats, video_id, live_start_time, url, webpage_url, smuggled_data, live_status == 'is_live')

        formats.extend(self._extract_storyboard(player_responses, duration))

        channel_handle = self.handle_from_url(owner_profile_url)

        info = {
            'id': video_id,
            'title': video_title,
            'formats': formats,
            'thumbnails': thumbnails,
            # The best thumbnail that we are sure exists. Prevents unnecessary
            # URL checking if the user doesn't care about getting the best possible thumbnail
            'thumbnail': traverse_obj(original_thumbnails, (-1, 'url')),
            'description': video_description,
            'channel_id': channel_id,
            'channel_url': format_field(channel_id, None, 'https://www.youtube.com/channel/%s', default=None),
            'duration': duration,
            'view_count': int_or_none(
                get_first((video_details, microformats), (..., 'viewCount'))
                or search_meta('interactionCount')),
            'average_rating': float_or_none(get_first(video_details, 'averageRating')),
            'age_limit': 18 if (
                get_first(microformats, 'isFamilySafe') is False
                or search_meta('isFamilyFriendly') == 'false'
                or search_meta('og:restrictions:age') == '18+') else 0,
            'webpage_url': webpage_url,
            'categories': [category] if category else None,
            'tags': keywords,
            'playable_in_embed': get_first(playability_statuses, 'playableInEmbed'),
            'live_status': live_status,
            'media_type': 'livestream' if get_first(video_details, 'isLiveContent') else None,
            'release_timestamp': live_start_time,
            '_format_sort_fields': (  # source_preference is lower for potentially damaged formats
                'quality', 'res', 'fps', 'hdr:12', 'source', 'vcodec', 'channels', 'acodec', 'lang', 'proto'),
        }

        subtitles = {}
        pctr = traverse_obj(player_responses, (..., 'captions', 'playerCaptionsTracklistRenderer'), expected_type=dict)
        if pctr:
            def get_lang_code(track):
                # Prefer the vssId (leading "." removed, remaining "." turned into "-");
                # fall back to the plain language code when it is missing or empty
                vss_id = remove_start(track.get('vssId') or '', '.')
                return vss_id.replace('.', '-') or track.get('languageCode')

            # Converted into dicts to remove duplicates
            captions = {
                get_lang_code(sub): sub
                for sub in traverse_obj(pctr, (..., 'captionTracks', ...))}
            translation_languages = {
                lang.get('languageCode'): self._get_text(lang.get('languageName'), max_runs=1)
                for lang in traverse_obj(pctr, (..., 'translationLanguages', ...))}

            def process_language(container, base_url, lang_code, sub_name, query):
                """Append one subtitle entry per format in _SUBTITLE_FORMATS to container[lang_code].

                @param container  dict mapping language codes to lists of subtitle entries; updated in place
                @param base_url   caption track URL that the query parameters are applied to
                @param lang_code  key under which the entries are stored
                @param sub_name   human-readable name stored in each entry
                @param query      extra URL query parameters; not modified
                """
                lang_subs = container.setdefault(lang_code, [])
                for fmt in self._SUBTITLE_FORMATS:
                    # Build a fresh query for each format so the caller's dict is never mutated
                    fmt_query = {**query, 'fmt': fmt}
                    lang_subs.append({
                        'ext': fmt,
                        'url': urljoin('https://www.youtube.com', update_url_query(base_url, fmt_query)),
                        'name': sub_name,
                    })

            # NB: Constructing the full subtitle dictionary is slow
            get_translated_subs = 'translated_subs' not in self._configuration_arg('skip') and (
                self.get_param('writeautomaticsub', False) or self.get_param('listsubtitles'))
            for lang_code, caption_track in captions.items():
                base_url = caption_track.get('baseUrl')
                orig_lang = parse_qs(base_url).get('lang', [None])[-1]
                if not base_url:
                    continue
                lang_name = self._get_text(caption_track, 'name', max_runs=1)
                if caption_track.get('kind') != 'asr':
                    if not lang_code:
                        continue
                    process_language(
                        subtitles, base_url, lang_code, lang_name, {})
                    if not caption_track.get('isTranslatable'):
                        continue
                for trans_code, trans_name in translation_languages.items():
                    if not trans_code:
                        continue
                    orig_trans_code = trans_code
                    if caption_track.get('kind') != 'asr' and trans_code != 'und':
                        if not get_translated_subs:
                            continue
                        trans_code += f'-{lang_code}'
                        trans_name += format_field(lang_name, None, ' from %s')
                    if lang_code == f'a-{orig_trans_code}':
                        # Set audio language based on original subtitles
                        for f in formats:
                            if f.get('acodec') != 'none' and not f.get('language'):
                                f['language'] = orig_trans_code
                        # Add an "-orig" label to the original language so that it can be distinguished.
                        # The subs are returned without "-orig" as well for compatibility
                        process_language(
                            automatic_captions, base_url, f'{trans_code}-orig', f'{trans_name} (Original)', {})
                    # Setting tlang=lang returns damaged subtitles.
                    process_language(automatic_captions, base_url, trans_code, trans_name,
                                     {} if orig_lang == orig_trans_code else {'tlang': trans_code})

        info['automatic_captions'] = automatic_captions
        info['subtitles'] = subtitles

        parsed_url = urllib.parse.urlparse(url)
        for component in [parsed_url.fragment, parsed_url.query]:
            query = urllib.parse.parse_qs(component)
            for k, v in query.items():
                for d_k, s_ks in [('start', ('start', 't')), ('end', ('end',))]:
                    d_k += '_time'
                    if d_k not in info and k in s_ks:
                        info[d_k] = parse_duration(v[0])

        # Youtube Music Auto-generated description
        if (video_description or '').strip().endswith('\nAuto-generated by YouTube.'):
            # XXX: Causes catastrophic backtracking if description has "·"
            # E.g. https://www.youtube.com/watch?v=DoPaAxMQoiI
            # Simulating atomic groups:  (?P<a>[^xy]+)x  =>  (?=(?P<a>[^xy]+))(?P=a)x
            # reduces it, but does not fully fix it. https://regex101.com/r/8Ssf2h/2
            mobj = re.search(
                r'''(?xs)
                    (?=(?P<track>[^\n·]+))(?P=track)·
                    (?=(?P<artist>[^\n]+))(?P=artist)\n+
                    (?=(?P<album>[^\n]+))(?P=album)\n
                    (?:.+?℗\s*(?P<release_year>\d{4})(?!\d))?
                    (?:.+?Released\ on\s*:\s*(?P<release_date>\d{4}-\d{2}-\d{2}))?
                    (.+?\nArtist\s*:\s*
                        (?=(?P<clean_artist>[^\n]+))(?P=clean_artist)\n
                    )?.+\nAuto-generated\ by\ YouTube\.\s*$
                ''', video_description)
            if mobj:
                release_year = mobj.group('release_year')
                release_date = mobj.group('release_date')
                if release_date:
                    release_date = release_date.replace('-', '')
                    if not release_year:
                        release_year = release_date[:4]
                info.update({
                    'album': mobj.group('album'.strip()),
                    'artists': ([a] if (a := mobj.group('clean_artist'))
                                else [a.strip() for a in mobj.group('artist').split('·')]),
                    'track': mobj.group('track').strip(),
                    'release_date': release_date,
                    'release_year': int_or_none(release_year),
                })

        initial_data = None
        if webpage:
            initial_data = self.extract_yt_initial_data(video_id, webpage, fatal=False)
            if not traverse_obj(initial_data, 'contents'):
                self.report_warning('Incomplete data received in embedded initial data; re-fetching using API.')
                initial_data = None
        if not initial_data:
            query = {'videoId': video_id}
            query.update(self._get_checkok_params())
            initial_data = self._extract_response(
                item_id=video_id, ep='next', fatal=False,
                ytcfg=master_ytcfg, query=query, check_get_keys='contents',
                headers=self.generate_api_headers(ytcfg=master_ytcfg),
                note='Downloading initial data API JSON')

        COMMENTS_SECTION_IDS = ('comment-item-section', 'engagement-panel-comments-section')
        info['comment_count'] = traverse_obj(initial_data, (
            'contents', 'twoColumnWatchNextResults', 'results', 'results', 'contents', ..., 'itemSectionRenderer',
            'contents', ..., 'commentsEntryPointHeaderRenderer', 'commentCount',
        ), (
            'engagementPanels', lambda _, v: v['engagementPanelSectionListRenderer']['panelIdentifier'] in COMMENTS_SECTION_IDS,
            'engagementPanelSectionListRenderer', 'header', 'engagementPanelTitleHeaderRenderer', 'contextualInfo',
        ), expected_type=self._get_count, get_all=False)

        try:  # This will error if there is no livechat
            initial_data['contents']['twoColumnWatchNextResults']['conversationBar']['liveChatRenderer']['continuations'][0]['reloadContinuationData']['continuation']
        except (KeyError, IndexError, TypeError):
            pass
        else:
            info.setdefault('subtitles', {})['live_chat'] = [{
                # url is needed to set cookies
                'url': f'https://www.youtube.com/watch?v={video_id}&bpctr=9999999999&has_verified=1',
                'video_id': video_id,
                'ext': 'json',
                'protocol': ('youtube_live_chat' if live_status in ('is_live', 'is_upcoming')
                             else 'youtube_live_chat_replay'),
            }]

        if initial_data:
            info['chapters'] = (
                self._extract_chapters_from_json(initial_data, duration)
                or self._extract_chapters_from_engagement_panel(initial_data, duration)
                or self._extract_chapters_from_description(video_description, duration)
                or None)

            info['heatmap'] = self._extract_heatmap(initial_data)

        contents = traverse_obj(
            initial_data, ('contents', 'twoColumnWatchNextResults', 'results', 'results', 'contents'),
            expected_type=list, default=[])

        vpir = get_first(contents, 'videoPrimaryInfoRenderer')
        if vpir:
            stl = vpir.get('superTitleLink')
            if stl:
                stl = self._get_text(stl)
                if try_get(
                        vpir,
                        lambda x: x['superTitleIcon']['iconType']) == 'LOCATION_PIN':
                    info['location'] = stl
                else:
                    mobj = re.search(r'(.+?)\s*S(\d+)\s*•?\s*E(\d+)', stl)
                    if mobj:
                        info.update({
                            'series': mobj.group(1),
                            'season_number': int(mobj.group(2)),
                            'episode_number': int(mobj.group(3)),
                        })
            for tlb in (try_get(
                    vpir,
                    lambda x: x['videoActions']['menuRenderer']['topLevelButtons'],
                    list) or []):
                tbrs = variadic(
                    traverse_obj(
                        tlb, ('toggleButtonRenderer', ...),
                        ('segmentedLikeDislikeButtonRenderer', ..., 'toggleButtonRenderer')))
                for tbr in tbrs:
                    for getter, regex in [(
                            lambda x: x['defaultText']['accessibility']['accessibilityData'],
                            r'(?P<count>[\d,]+)\s*(?P<type>(?:dis)?like)'), ([
                                lambda x: x['accessibility'],
                                lambda x: x['accessibilityData']['accessibilityData'],
                            ], r'(?P<type>(?:dis)?like) this video along with (?P<count>[\d,]+) other people')]:
                        label = (try_get(tbr, getter, dict) or {}).get('label')
                        if label:
                            mobj = re.match(regex, label)
                            if mobj:
                                info[mobj.group('type') + '_count'] = str_to_int(mobj.group('count'))
                                break

            info['like_count'] = traverse_obj(vpir, (
                'videoActions', 'menuRenderer', 'topLevelButtons', ...,
                'segmentedLikeDislikeButtonViewModel', 'likeButtonViewModel', 'likeButtonViewModel',
                'toggleButtonViewModel', 'toggleButtonViewModel', 'defaultButtonViewModel',
                'buttonViewModel', 'accessibilityText', {parse_count}), get_all=False)

            vcr = traverse_obj(vpir, ('viewCount', 'videoViewCountRenderer'))
            if vcr:
                vc = self._get_count(vcr, 'viewCount')
                # Upcoming premieres with waiting count are treated as live here
                if vcr.get('isLive'):
                    info['concurrent_view_count'] = vc
                elif info.get('view_count') is None:
                    info['view_count'] = vc

        vsir = get_first(contents, 'videoSecondaryInfoRenderer')
        if vsir:
            vor = traverse_obj(vsir, ('owner', 'videoOwnerRenderer'))
            info.update({
                'channel': self._get_text(vor, 'title'),
                'channel_follower_count': self._get_count(vor, 'subscriberCountText')})

            if not channel_handle:
                channel_handle = self.handle_from_url(
                    traverse_obj(vor, (
                        ('navigationEndpoint', ('title', 'runs', ..., 'navigationEndpoint')),
                        (('commandMetadata', 'webCommandMetadata', 'url'), ('browseEndpoint', 'canonicalBaseUrl')),
                        {str}), get_all=False))

            rows = try_get(
                vsir,
                lambda x: x['metadataRowContainer']['metadataRowContainerRenderer']['rows'],
                list) or []
            multiple_songs = False
            for row in rows:
                if try_get(row, lambda x: x['metadataRowRenderer']['hasDividerLine']) is True:
                    multiple_songs = True
                    break
            for row in rows:
                mrr = row.get('metadataRowRenderer') or {}
                mrr_title = mrr.get('title')
                if not mrr_title:
                    continue
                mrr_title = self._get_text(mrr, 'title')
                mrr_contents_text = self._get_text(mrr, ('contents', 0))
                if mrr_title == 'License':
                    info['license'] = mrr_contents_text
                elif not multiple_songs:
                    if mrr_title == 'Album':
                        info['album'] = mrr_contents_text
                    elif mrr_title == 'Artist':
                        info['artists'] = [mrr_contents_text] if mrr_contents_text else None
                    elif mrr_title == 'Song':
                        info['track'] = mrr_contents_text
            owner_badges = self._extract_badges(traverse_obj(vsir, ('owner', 'videoOwnerRenderer', 'badges')))
            if self._has_badge(owner_badges, BadgeType.VERIFIED):
                info['channel_is_verified'] = True

        info.update({
            'uploader': info.get('channel'),
            'uploader_id': channel_handle,
            'uploader_url': format_field(channel_handle, None, 'https://www.youtube.com/%s', default=None),
        })

        # We only want timestamp IF it has time precision AND a timezone
        # Currently the uploadDate in microformats appears to be in US/Pacific timezone.
        timestamp = (
            parse_iso8601(get_first(microformats, 'uploadDate'), timezone=NO_DEFAULT)
            or parse_iso8601(search_meta('uploadDate'), timezone=NO_DEFAULT)
        )
        upload_date = (
            dt.datetime.fromtimestamp(timestamp, dt.timezone.utc).strftime('%Y%m%d') if timestamp else
            (
                unified_strdate(get_first(microformats, 'uploadDate'))
                or unified_strdate(search_meta('uploadDate'))
            ))

        # In the case we cannot get the timestamp:
        # The upload date for scheduled, live and past live streams / premieres in microformats
        # may be different from the stream date. Although not in UTC, we will prefer it in this case.
        # See: https://github.com/yt-dlp/yt-dlp/pull/2223#issuecomment-1008485139
        if not upload_date or (not timestamp and live_status in ('not_live', None)):
            # this should be in UTC, as configured in the cookie/client context
            upload_date = strftime_or_none(
                self._parse_time_text(self._get_text(vpir, 'dateText'))) or upload_date

        info['upload_date'] = upload_date
        info['timestamp'] = timestamp

        if upload_date and live_status not in ('is_live', 'post_live', 'is_upcoming'):
            # Newly uploaded videos' HLS formats are potentially problematic and need to be checked
            upload_datetime = datetime_from_str(upload_date).replace(tzinfo=dt.timezone.utc)
            if upload_datetime >= datetime_from_str('today-2days'):
                for fmt in info['formats']:
                    if fmt.get('protocol') == 'm3u8_native':
                        fmt['__needs_testing'] = True

        for s_k, d_k in [('artists', 'creators'), ('track', 'alt_title')]:
            v = info.get(s_k)
            if v:
                info[d_k] = v

        badges = self._extract_badges(traverse_obj(vpir, 'badges'))

        is_private = (self._has_badge(badges, BadgeType.AVAILABILITY_PRIVATE)
                      or get_first(video_details, 'isPrivate', expected_type=bool))

        info['availability'] = (
            'public' if self._has_badge(badges, BadgeType.AVAILABILITY_PUBLIC)
            else self._availability(
                is_private=is_private,
                needs_premium=(
                    self._has_badge(badges, BadgeType.AVAILABILITY_PREMIUM)
                    or False if initial_data and is_private is not None else None),
                needs_subscription=(
                    self._has_badge(badges, BadgeType.AVAILABILITY_SUBSCRIPTION)
                    or False if initial_data and is_private is not None else None),
                needs_auth=info['age_limit'] >= 18,
                is_unlisted=None if is_private is None else (
                    self._has_badge(badges, BadgeType.AVAILABILITY_UNLISTED)
                    or get_first(microformats, 'isUnlisted', expected_type=bool))))

        info['__post_extractor'] = self.extract_comments(master_ytcfg, video_id, contents, webpage)

        self.mark_watched(video_id, player_responses)

        return info
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 01:46:28 -05:00
+								import base64
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								import binascii
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-14 17:53:32 -06:00
+								import collections
-												[cleanup] Standardize `import datetime as dt` (#8978)

											
										
										
											2024-02-24 18:16:34 -06:00
+								import datetime as dt
-												[cleanup] Misc (#10075)

Closes #10303
Authored by: bashonly, seproDev, jucor, c-basalt

Co-authored-by: sepro <4618135+seproDev@users.noreply.github.com>
Co-authored-by: Julien Cornebise <julien@cornebise.com>
Co-authored-by: c-basalt <117849907+c-basalt@users.noreply.github.com>
											
										
										
											2024-07-01 17:51:27 -05:00
+								import functools
-												[youtube] Improve source code quality

											
										
										
											2013-09-22 03:37:23 -05:00
+								import itertools
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								import json
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-16 13:56:23 -06:00
+								import math
-												[youtube] Add filesystem signature cache

											
										
										
											2013-09-21 17:35:03 -05:00
+								import os.path
-												Add --mark-watched feature (Closes #5054)

											
										
										
											2016-02-29 13:01:33 -06:00
+								import random
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								import re
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								import sys
-												[cleanup] Sort imports

Using https://github.com/PyCQA/isort

    isort -m VERTICAL_HANGING_INDENT --py 36 -l 80 --rr -n --tc .

											
										
										
											2022-04-11 17:32:57 -05:00
+								import threading
-												[linter] youtube.py

											
										
										
											2021-02-04 08:57:26 -06:00
+								import time
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 07:19:30 -05:00
+								import traceback
-												[compat] Remove more functions

Removing any more will require changes to a large number of extractors

											
										
										
											2022-06-24 03:10:17 -05:00
+								import urllib.parse
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
-												[ie/youtube] Split into package (#12557)

Authored by: coletdjnz
											
										
										
											2025-03-12 23:37:33 -05:00
+								from ._base import (
 								    INNERTUBE_CLIENTS,
 								    BadgeType,
 								    YoutubeBaseInfoExtractor,
 								    _PoTokenContext,
 								    _split_innertube_client,
 								    short_client_name,
 								)
 								from ..openload import PhantomJSwrapper
 								from ...jsinterp import JSInterpreter
 								from ...networking.exceptions import HTTPError
 								from ...utils import (
-												[cleanup] Sort imports

Using https://github.com/PyCQA/isort

    isort -m VERTICAL_HANGING_INDENT --py 36 -l 80 --rr -n --tc .

											
										
										
											2022-04-11 17:32:57 -05:00
+								    NO_DEFAULT,
 								    ExtractorError,
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								    LazyList,
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-16 13:56:23 -06:00
+								    bug_reports_message,
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								    clean_html,
-												[youtube] Extract comments' approximate timestamp (#221)

Authored by: colethedj
											
										
										
											2021-04-07 06:37:43 -05:00
+								    datetime_from_str,
-												[ie/youtube] Calculate more accurate `filesize`

YouTube provides slightly different duration for each format.
Calculating file-size based on this duration instead of the
video duration gives more accurate results.

Ref: https://github.com/yt-dlp/yt-dlp/issues/1400#issuecomment-2007441207

											
										
										
											2024-03-31 15:50:03 -05:00
+								    filesize_from_tbr,
-												[youtube] Extract average rating (closes #2362)

											
										
										
											2015-02-11 11:39:31 -06:00
+								    float_or_none,
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								    format_field,
-												[utils] Add `get_first`

											
										
										
											2022-03-08 14:54:41 -06:00
+								    get_first,
-												[youtube] Download DASH manifest

If given, download and parse the DASH manifest file, in order to get ultra-HQ formats.
Fixes #2166

											
										
										
											2014-01-18 22:47:20 -06:00
+								    int_or_none,
-												[utils] Add `join_nonempty`

											
										
										
											2021-11-05 20:05:24 -05:00
+								    join_nonempty,
-												[youtube] Fix n-sig for player e06dea74

											
										
										
											2022-01-31 20:40:19 -06:00
+								    js_to_json,
-												[youtube] Prefer info from YouTube than _formats (#8293)

											
										
										
											2016-01-24 11:02:19 -06:00
+								    mimetype2ext,
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								    orderedSet,
-												[youtube] Fix parsing codecs (closes #12091)

											
										
										
											2017-02-12 05:09:53 -06:00
+								    parse_codecs,
-												[youtube:comments] Improve comment vote count parsing (fixes #506) (#508)

Authored by: colethedj
											
										
										
											2021-07-14 18:24:42 -05:00
+								    parse_count,
-												[youtube] Extract start_time

From the 't=*' in the url.
Currently youtube-dl doesn't use the value, but it was requested for the mpv plugin.

											
										
										
											2015-07-20 14:10:28 -05:00
+								    parse_duration,
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 10:15:45 -05:00
+								    parse_iso8601,
-												[utils] Add `parse_qs`

											
										
										
											2021-08-22 14:02:00 -05:00
+								    parse_qs,
-												[formatsort] Remove forced priority of `quality`

When making `FormatSort`, I misinterpreted the purpose of `quality`

											
										
										
											2021-02-18 12:12:56 -06:00
+								    qualities,
-												[ie/youtube] Remove broken OAuth support (#11558)

Closes #11462
Authored by: bashonly
											
										
										
											2024-11-16 17:40:21 -06:00
+								    remove_end,
-												[youtube] Fix TFA (#12927)

											
										
										
											2017-05-06 16:19:11 -05:00
+								    remove_start,
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								    smuggle_url,
-												[youtube] Add fallback metadata extraction from videoDetails (closes #18052)

											
										
										
											2018-11-02 18:26:16 -05:00
+								    str_or_none,
-												[youtube] Fix likes/dislike extraction

											
										
										
											2015-06-28 13:48:06 -05:00
+								    str_to_int,
-												[youtube:tab] Extract more metadata from feeds/channels/playlists (#1018)

Parse relative time text, extract live, upcoming status, availability and channel id from feeds/channels/playlists (where applicable). 
Closes #1883
Authored-by: coletdjnz

											
										
										
											2021-12-19 22:47:53 -06:00
+								    strftime_or_none,
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								    traverse_obj,
-												[ie/youtube] Calculate more accurate `filesize`

YouTube provides slightly different duration for each format.
Calculating file-size based on this duration instead of the
video duration gives more accurate results.

Ref: https://github.com/yt-dlp/yt-dlp/issues/1400#issuecomment-2007441207

											
										
										
											2024-03-31 15:50:03 -05:00
+								    try_call,
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								    try_get,
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								    unescapeHTML,
 								    unified_strdate,
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								    unsmuggle_url,
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 13:22:59 -06:00
+								    update_url_query,
-												[youtube] Fix mark watched (closes #18546)

											
										
										
											2018-12-16 06:35:48 -06:00
+								    url_or_none,
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-18 23:55:07 -05:00
+								    urljoin,
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								    variadic,
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								)
-												[extractor/youtube] Add client name to `format_note` when `-v` (#6254)

Authored by: Lesmiscore, pukkandan
											
										
										
											2023-03-11 11:03:23 -06:00
+								STREAMING_DATA_CLIENT_NAME = '__yt_dlp_client'
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								STREAMING_DATA_INITIAL_PO_TOKEN = '__yt_dlp_po_token'
 								PO_TOKEN_GUIDE_URL = 'https://github.com/yt-dlp/yt-dlp/wiki/PO-Token-Guide'
-												[youtube] Convert to new subtitles system

The automatic captions are stored in the 'automatic_captions' field, which is used if no normal subtitles are found for a specific language.

											
										
										
											2015-02-16 14:44:17 -06:00
+								class YoutubeIE(YoutubeBaseInfoExtractor):
-												[cleanup] Add keyword automatically to SearchIE descriptions
and some minor cleanup of docs

											
										
										
											2021-10-23 09:29:52 -05:00
+								    IE_DESC = 'YouTube'
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								    _VALID_URL = r'''(?x)^
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								                     (
-												[youtube] Don't make the url protocol optional

The generic extractor will add it.

											
										
										
											2014-09-11 14:47:25 -05:00
+								                         (?:https?://|//)                                    # http(s):// or protocol-independent URL
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 14:44:36 -06:00
+								                         (?:(?:(?:(?:\w+\.)?[yY][oO][uU][tT][uU][bB][eE](?:-nocookie|kids)?\.com|
 								                            (?:www\.)?deturl\.com/www\.youtube\.com|
 								                            (?:www\.)?pwnyoutube\.com|
 								                            (?:www\.)?hooktube\.com|
 								                            (?:www\.)?yourepeat\.com|
 								                            tube\.majestyc\.net|
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                            {invidious}|
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 14:44:36 -06:00
+								                            youtube\.googleapis\.com)/                        # the various hostnames, with wildcard subdomains
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								                         (?:.*?\#/)?                                          # handle anchor (#/) redirect urls
 								                         (?:                                                  # the various things that can precede the ID:
-												[extractor/youtube] Support `/live/` URL

											
										
										
											2023-02-03 12:17:13 -06:00
+								                             (?:(?:v|embed|e|shorts|live)/(?!videoseries|live_stream))  # v/ or embed/ or e/ or shorts/
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								                             |(?:                                             # or the v= param in all its forms
-												[youtube] Add support for yourepeat.com URLs (Closes #2397)
											
										
										
											2014-02-18 13:00:54 -06:00
+								                                 (?:(?:watch|movie)(?:_popup)?(?:\.php)?/?)?  # preceding watch(_popup|.php) or nothing (like /?v=xxxx)
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								                                 (?:\?|\#!?)                                  # the params delimiter ? or # or #!
-												[youtube] Extend _VALID_URL (Closes #7694)

											
										
										
											2015-11-29 09:01:59 -06:00
+								                                 (?:.*?[&;])??                                # any other preceding param (like /?s=tuff&v=xxxx or ?s=tuff&amp;v=V36LpHqtcDY)
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								                                 v=
 								                             )
-												[youtube] Urls like youtube.com/NASA are now interpreted as users (fixes #1069)

Video urls like http://youtube.com/BaW_jenozKc are not valid, but http://youtu.be/BaW_jenozKc is correct.

											
										
										
											2013-09-05 15:38:23 -05:00
+								                         ))
-												[youtube] Expand _VALID_URL to support vid.plus

											
										
										
											2015-08-16 15:04:13 -05:00
+								                         |(?:
 								                            youtu\.be|                                        # just youtu.be/xxxx
-												[youtube] Add support for zwearz (Closes #9062)

											
										
										
											2016-04-03 15:26:20 -05:00
+								                            vid\.plus|                                        # or vid.plus/xxxx
 								                            zwearz\.com/watch|                                # or zwearz.com/watch/xxxx
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                            {invidious}
-												[youtube] Expand _VALID_URL to support vid.plus

											
										
										
											2015-08-16 15:04:13 -05:00
+								                         )/
-												[youtube] Don't make the url protocol optional

The generic extractor will add it.

											
										
										
											2014-09-11 14:47:25 -05:00
+								                         |(?:www\.)?cleanvideosearch\.com/media/action/yt/watch\?videoId=
-												[youtube] Urls like youtube.com/NASA are now interpreted as users (fixes #1069)

Video urls like http://youtube.com/BaW_jenozKc are not valid, but http://youtu.be/BaW_jenozKc is correct.

											
										
										
											2013-09-05 15:38:23 -05:00
+								                         )
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								                     )?                                                       # all until now is optional -> you can pass the naked ID
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                     (?P<id>[0-9A-Za-z_-]{{11}})                              # here is it! the YouTube video ID
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								                     (?(1).+)?                                                # if we found the ID, everything can follow
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                     (?:\#|$)'''.format(
 								        invidious='|'.join(YoutubeBaseInfoExtractor._INVIDIOUS_SITES),
 								    )
-												[extractor/youtube] Detect `lazy-load-for-videos` embeds

Closes #4812

											
										
										
											2022-09-01 14:58:56 -05:00
+								    _EMBED_REGEX = [
 								        r'''(?x)
 								            (?:
-												[extractor/heise] Fix extractor (#5029)

Fixes https://github.com/yt-dlp/yt-dlp/issues/1520
Authored by: coletdjnz
											
										
										
											2022-09-25 19:58:06 -05:00
+								                <(?:[0-9A-Za-z-]+?)?iframe[^>]+?src=|
-												[extractor/youtube] Detect `lazy-load-for-videos` embeds

Closes #4812

											
										
										
											2022-09-01 14:58:56 -05:00
+								                data-video-url=|
 								                <embed[^>]+?src=|
 								                embedSWF\(?:\s*|
 								                <object[^>]+data=|
 								                new\s+SWFObject\(
 								            )
 								            (["\'])
 								                (?P<url>(?:https?:)?//(?:www\.)?youtube(?:-nocookie)?\.com/
 								                (?:embed|v|p)/[0-9A-Za-z_-]{11}.*?)
 								            \1''',
 								        # https://wordpress.org/plugins/lazy-load-for-videos/
 								        r'''(?xs)
 								            <a\s[^>]*\bhref="(?P<url>https://www\.youtube\.com/watch\?v=[0-9A-Za-z_-]{11})"
 								            \s[^>]*\bclass="[^"]*\blazy-load-youtube''',
 								    ]
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								    _RETURN_TYPE = 'video'  # XXX: How to handle multifeed?
-												[extractor/youtube] Detect `lazy-load-for-videos` embeds

Closes #4812

											
										
										
											2022-09-01 14:58:56 -05:00
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-01 19:18:08 -05:00
+								    _PLAYER_INFO_RE = (
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 15:58:10 -05:00
+								        r'/s/player/(?P<id>[a-zA-Z0-9_-]{8,})/(?:tv-)?player',
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								        r'/(?P<id>[a-zA-Z0-9_-]{8,})/player(?:_ias\.vflset(?:/[a-zA-Z]{2,3}_[a-zA-Z]{2,3})?|-plasma-ias-(?:phone|tablet)-[a-z]{2}_[A-Z]{2}\.vflset)/base\.js$',
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        r'\b(?P<id>vfl[a-zA-Z0-9_-]+)\b.*?\.js$',
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-01 19:18:08 -05:00
+								    )
-												[ie/googledrive] Fix formats extraction (#9908)

Closes #8281
Authored by: WyohKnott
											
										
										
											2024-05-12 18:05:47 -05:00
+								    _formats = {  # NB: Used in YoutubeWebArchiveIE and GoogleDriveIE
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 10:35:04 -06:00
+								        '5': {'ext': 'flv', 'width': 400, 'height': 240, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
 								        '6': {'ext': 'flv', 'width': 450, 'height': 270, 'acodec': 'mp3', 'abr': 64, 'vcodec': 'h263'},
 								        '13': {'ext': '3gp', 'acodec': 'aac', 'vcodec': 'mp4v'},
 								        '17': {'ext': '3gp', 'width': 176, 'height': 144, 'acodec': 'aac', 'abr': 24, 'vcodec': 'mp4v'},
 								        '18': {'ext': 'mp4', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 96, 'vcodec': 'h264'},
 								        '22': {'ext': 'mp4', 'width': 1280, 'height': 720, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 								        '34': {'ext': 'flv', 'width': 640, 'height': 360, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 								        '35': {'ext': 'flv', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
-												[youtube] Clarify itag 36 height and abr (Closes #8457)

											
										
										
											2016-02-07 13:30:57 -06:00
+								        # itag 36 videos are either 320x180 (BaW_jenozKc) or 320x240 (__2ABJjxzNo), abr varies as well
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 10:35:04 -06:00
+								        '36': {'ext': '3gp', 'width': 320, 'acodec': 'aac', 'vcodec': 'mp4v'},
 								        '37': {'ext': 'mp4', 'width': 1920, 'height': 1080, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 								        '38': {'ext': 'mp4', 'width': 4096, 'height': 3072, 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264'},
 								        '43': {'ext': 'webm', 'width': 640, 'height': 360, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
 								        '44': {'ext': 'webm', 'width': 854, 'height': 480, 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8'},
 								        '45': {'ext': 'webm', 'width': 1280, 'height': 720, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
-												[youtube] added vcodec/acodec/abr for multiple itags

Should make downloading with filters more precise and easier, ie. bestvideo[vcodec=h264]. By default a lot of codecs are specified as avc1.xxxxxx and unique for each format, which makes them unusable for bestvideo selection.
											
										
										
											2016-01-02 21:11:19 -06:00
+								        '46': {'ext': 'webm', 'width': 1920, 'height': 1080, 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8'},
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 10:35:04 -06:00
+								        '59': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
 								        '78': {'ext': 'mp4', 'width': 854, 'height': 480, 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264'},
-												[youtube] added vcodec/acodec/abr for multiple itags

Should make downloading with filters more precise and easier, ie. bestvideo[vcodec=h264]. By default a lot of codecs are specified as avc1.xxxxxx and unique for each format, which makes them unusable for bestvideo selection.
											
										
										
											2016-01-02 21:11:19 -06:00
 								        # 3D videos
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 10:35:04 -06:00
+								        '82': {'ext': 'mp4', 'height': 360, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
 								        '83': {'ext': 'mp4', 'height': 480, 'format_note': '3D', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -20},
 								        '84': {'ext': 'mp4', 'height': 720, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
 								        '85': {'ext': 'mp4', 'height': 1080, 'format_note': '3D', 'acodec': 'aac', 'abr': 192, 'vcodec': 'h264', 'preference': -20},
-												[youtube] added vcodec/acodec/abr for multiple itags

Should make downloading with filters more precise and easier, e.g. bestvideo[vcodec=h264]. By default, a lot of codecs are specified as avc1.xxxxxx and unique for each format, which makes them unusable for bestvideo selection.
											
										
										
											2016-01-02 21:11:19 -06:00
+								        '100': {'ext': 'webm', 'height': 360, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 128, 'vcodec': 'vp8', 'preference': -20},
 								        '101': {'ext': 'webm', 'height': 480, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
 								        '102': {'ext': 'webm', 'height': 720, 'format_note': '3D', 'acodec': 'vorbis', 'abr': 192, 'vcodec': 'vp8', 'preference': -20},
-												Add YouTube DASH formats to YouTubeIE

											
										
										
											2013-08-19 20:22:25 -05:00
-												AHLS -> Apple HTTP Live Streaming

											
										
										
											2013-09-03 20:49:35 -05:00
+								        # Apple HTTP Live Streaming
-												[youtube] Added itag 91

Seen in https://www.youtube.com/watch?v=jMN4cxyhJjk

											
										
										
											2016-03-17 06:25:37 -05:00
+								        '91': {'ext': 'mp4', 'height': 144, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
-												Revert "[youtube] add tbr to _formats extracted from watch_as3.swf"

This reverts commit 4a5ba28a87a1a1632e58a1de404eb1fa268118a3.

											
										
										
											2016-03-02 10:35:04 -06:00
+								        '92': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 								        '93': {'ext': 'mp4', 'height': 360, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
 								        '94': {'ext': 'mp4', 'height': 480, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 128, 'vcodec': 'h264', 'preference': -10},
 								        '95': {'ext': 'mp4', 'height': 720, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
 								        '96': {'ext': 'mp4', 'height': 1080, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 256, 'vcodec': 'h264', 'preference': -10},
-												[youtube] added vcodec/acodec/abr for multiple itags

Should make downloading with filters more precise and easier, e.g. bestvideo[vcodec=h264]. By default, a lot of codecs are specified as avc1.xxxxxx and unique for each format, which makes them unusable for bestvideo selection.
											
										
										
											2016-01-02 21:11:19 -06:00
+								        '132': {'ext': 'mp4', 'height': 240, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 48, 'vcodec': 'h264', 'preference': -10},
 								        '151': {'ext': 'mp4', 'height': 72, 'format_note': 'HLS', 'acodec': 'aac', 'abr': 24, 'vcodec': 'h264', 'preference': -10},
-												[youtube] Simplify format specification

											
										
										
											2013-12-24 05:34:09 -06:00
 								        # DASH mp4 video
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 10:41:48 -05:00
+								        '133': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '134': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '135': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '136': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '137': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264'},
-												Start moving to ytdl-org

											
										
										
											2019-03-09 06:14:41 -06:00
+								        '138': {'ext': 'mp4', 'format_note': 'DASH video', 'vcodec': 'h264'},  # Height can vary (https://github.com/ytdl-org/youtube-dl/issues/4559)
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 10:41:48 -05:00
+								        '160': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '212': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '264': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'h264'},
 								        '298': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
 								        '299': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'h264', 'fps': 60},
 								        '266': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'h264'},
-												Add YouTube DASH formats to YouTubeIE

											
										
										
											2013-08-19 20:22:25 -05:00
-												extractor: youtube: Fix extension of dash formats.

While we are at it, separate the audio formats from the video formats.

Signed-off-by: Rogério Brito <rbrito@ime.usp.br>

											
										
										
											2013-10-18 16:53:00 -05:00
+								        # Dash mp4 audio
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 10:41:48 -05:00
+								        '139': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 48, 'container': 'm4a_dash'},
 								        '140': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 128, 'container': 'm4a_dash'},
 								        '141': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'abr': 256, 'container': 'm4a_dash'},
 								        '256': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
 								        '258': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'aac', 'container': 'm4a_dash'},
 								        '325': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'dtse', 'container': 'm4a_dash'},
 								        '328': {'ext': 'm4a', 'format_note': 'DASH audio', 'acodec': 'ec-3', 'container': 'm4a_dash'},
-												Add YouTube DASH formats to YouTubeIE

											
										
										
											2013-08-19 20:22:25 -05:00
 								        # Dash webm
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 10:41:48 -05:00
+								        '167': {'ext': 'webm', 'height': 360, 'width': 640, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '168': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '169': {'ext': 'webm', 'height': 720, 'width': 1280, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '170': {'ext': 'webm', 'height': 1080, 'width': 1920, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '218': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '219': {'ext': 'webm', 'height': 480, 'width': 854, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp8'},
 								        '278': {'ext': 'webm', 'height': 144, 'format_note': 'DASH video', 'container': 'webm', 'vcodec': 'vp9'},
 								        '242': {'ext': 'webm', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '243': {'ext': 'webm', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '244': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '245': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '246': {'ext': 'webm', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '247': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '248': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '271': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9'},
-												[youtube] Clarify itag 272 possible resolutions (#7699)

											
										
										
											2015-11-30 08:42:05 -06:00
+								        # itag 272 videos are either 3840x2160 (e.g. RtoitU2A-3E) or 7680x4320 (sLprVF6d7Ug)
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 10:41:48 -05:00
+								        '272': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '302': {'ext': 'webm', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 								        '303': {'ext': 'webm', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 								        '308': {'ext': 'webm', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
 								        '313': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9'},
 								        '315': {'ext': 'webm', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'vp9', 'fps': 60},
-												[youtube] Simplify format specification

											
										
										
											2013-12-24 05:34:09 -06:00
 								        # Dash webm audio
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 10:41:48 -05:00
+								        '171': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 128},
 								        '172': {'ext': 'webm', 'acodec': 'vorbis', 'format_note': 'DASH audio', 'abr': 256},
-												[youtube] Add a pseudo format for rtmp videos (#2123)

											
										
										
											2014-01-08 19:38:50 -06:00
-												[youtube] Add webm audio formats (Fixes #4229)

											
										
										
											2014-11-18 04:06:09 -06:00
+								        # Dash webm audio with opus inside
-												[youtube] Remove explicit preference for audio-only and video-only formats
In order not to break sorting when new formats appear

											
										
										
											2017-04-11 10:41:48 -05:00
+								        '249': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 50},
 								        '250': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 70},
 								        '251': {'ext': 'webm', 'format_note': 'DASH audio', 'acodec': 'opus', 'abr': 160},
-												[youtube] Add webm audio formats (Fixes #4229)

											
										
										
											2014-11-18 04:06:09 -06:00
-												[youtube] Add a pseudo format for rtmp videos (#2123)

											
										
										
											2014-01-08 19:38:50 -06:00
+								        # RTMP (unnamed)
 								        '_rtmp': {'protocol': 'rtmp'},
-												[youtube] Hardcode codec metadata for av01 video only formats (closes #21381)

											
										
										
											2019-06-13 13:59:05 -05:00
 								        # av01 video only formats sometimes served with "unknown" codecs
-												[youtube] Add av01 itags to known formats list (#747)

Authored by: blackjack4494
											
										
										
											2021-08-22 14:59:43 -05:00
+								        '394': {'ext': 'mp4', 'height': 144, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
 								        '395': {'ext': 'mp4', 'height': 240, 'format_note': 'DASH video', 'vcodec': 'av01.0.00M.08'},
 								        '396': {'ext': 'mp4', 'height': 360, 'format_note': 'DASH video', 'vcodec': 'av01.0.01M.08'},
 								        '397': {'ext': 'mp4', 'height': 480, 'format_note': 'DASH video', 'vcodec': 'av01.0.04M.08'},
 								        '398': {'ext': 'mp4', 'height': 720, 'format_note': 'DASH video', 'vcodec': 'av01.0.05M.08'},
 								        '399': {'ext': 'mp4', 'height': 1080, 'format_note': 'DASH video', 'vcodec': 'av01.0.08M.08'},
 								        '400': {'ext': 'mp4', 'height': 1440, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
 								        '401': {'ext': 'mp4', 'height': 2160, 'format_note': 'DASH video', 'vcodec': 'av01.0.12M.08'},
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
+								    }
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 06:26:37 -06:00
+								    _SUBTITLE_FORMATS = ('json3', 'srv1', 'srv2', 'srv3', 'ttml', 'vtt')
-												[ie/youtube] Do not use `web_creator` as a default client (#12087)

Closes #12085
Authored by: bashonly
											
										
										
											2025-01-15 12:21:56 -06:00
+								    _DEFAULT_CLIENTS = ('tv', 'ios', 'web')
 								    _DEFAULT_AUTHED_CLIENTS = ('tv', 'web')
-												Add YouTube DASH formats to YouTubeIE

											
										
										
											2013-08-19 20:22:25 -05:00
-												[youtube] Raise GeoRestrictedError

											
										
										
											2017-02-26 03:51:21 -06:00
+								    _GEO_BYPASS = False
-												[youtube] Modernize

											
										
										
											2014-09-13 00:51:06 -05:00
+								    IE_NAME = 'youtube'
-												Allow _TESTS attribute for IEs with multiple tests

This also improves the numbering of duplicate tests

											
										
										
											2013-06-27 12:13:11 -05:00
+								    _TESTS = [
 								        {
-												[youtube] Change test URLs from http to https

											
										
										
											2016-09-17 09:48:20 -05:00
+								            'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&t=1s&end=9',
-												[youtube] Modernize

											
										
										
											2014-09-24 02:49:53 -05:00
+								            'info_dict': {
 								                'id': 'BaW_jenozKc',
 								                'ext': 'mp4',
-												renaming issues resolved


											
										
										
											2020-09-02 15:37:35 -05:00
+								                'title': 'youtube-dl test video "\'/\\ä↭𝕐',
-												[test/download] Add more fields

											
										
										
											2021-12-14 16:02:40 -06:00
+								                'channel': 'Philipp Hagemeister',
-												[youtube] Extract channel meta fields (closes #9676, closes #12939)

											
										
										
											2018-09-14 13:24:26 -05:00
+								                'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
 								                'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
-												[youtube] Modernize

											
										
										
											2014-09-24 02:49:53 -05:00
+								                'upload_date': '20121002',
-												[test/download] Add more fields

											
										
										
											2021-12-14 16:02:40 -06:00
+								                'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
-												[youtube] Modernize

											
										
										
											2014-09-24 02:49:53 -05:00
+								                'categories': ['Science & Technology'],
-												renaming issues resolved


											
										
										
											2020-09-02 15:37:35 -05:00
+								                'tags': ['youtube-dl'],
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 10,
-												[youtube] Add fallback metadata extraction from videoDetails (closes #18052)

											
										
										
											2018-11-02 18:26:16 -05:00
+								                'view_count': int,
-												[youtube] Test for like_count and dislike_count (#3633)

											
										
										
											2014-08-31 11:10:05 -05:00
+								                'like_count': int,
-												[test/download] Add more fields

											
										
										
											2021-12-14 16:02:40 -06:00
+								                'availability': 'public',
 								                'playable_in_embed': True,
 								                'thumbnail': 'https://i.ytimg.com/vi/BaW_jenozKc/maxresdefault.jpg',
 								                'live_status': 'not_live',
 								                'age_limit': 0,
-												[youtube] Extract start_time

From the 't=*' in the url.
Currently youtube-dl doesn't use the value, but it was requested for the mpv plugin.

											
										
										
											2015-07-20 14:10:28 -05:00
+								                'start_time': 1,
-												[youtube] Extract end_time

											
										
										
											2015-07-23 06:20:21 -05:00
+								                'end_time': 9,
-												[extractor/youtube, cleanup] Fix tests (#4293)

Authored by: sheerluck
											
										
										
											2022-07-07 16:20:02 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Philipp Hagemeister',
 								                'uploader_url': 'https://www.youtube.com/@PhilippHagemeister',
 								                'uploader_id': '@PhilippHagemeister',
-												[extractor/youtube] Extract `heatmap` data (#7100)

Closes #3888
Authored by: tntmod54321
											
										
										
											2023-05-26 07:24:39 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1349198244,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            },
-												[youtube] Fix tests in 2.x

											
										
										
											2013-06-27 12:55:39 -05:00
+								        },
-												Support embed-only videos (Fixes #1746)

											
										
										
											2013-11-18 06:05:18 -06:00
+								        {
-												[youtube] Modernize

											
										
										
											2014-09-24 02:49:53 -05:00
+								            'url': '//www.YouTube.com/watch?v=yZIXLfi8CZQ',
 								            'note': 'Embed-only video (#1746)',
 								            'info_dict': {
 								                'id': 'yZIXLfi8CZQ',
 								                'ext': 'mp4',
 								                'upload_date': '20120608',
 								                'title': 'Principal Sexually Assaults A Teacher - Episode 117 - 8th June 2012',
 								                'description': 'md5:09b78bd971f1e3e289601dfba15ca4f7',
-												[youtube] Fix test

											
										
										
											2015-11-23 09:35:23 -06:00
+								                'age_limit': 18,
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            },
 								            'skip': 'Private video',
-												Support embed-only videos (Fixes #1746)

											
										
										
											2013-11-18 06:05:18 -06:00
+								        },
-												[youtube] Use the first v= argument in the URL

This is according to how youtube handles multiple v= values in one URL.
Before this, it was possible to make a single URL show up differently
 on youtube itself, and if you downloaded/viewed it with youtube-dl/mpv

											
										
										
											2015-08-10 13:52:38 -05:00
+								        {
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 13:22:59 -06:00
+								            'url': 'https://www.youtube.com/watch?v=BaW_jenozKc&v=yZIXLfi8CZQ',
-												[youtube] Use the first v= argument in the URL

This is according to how youtube handles multiple v= values in one URL.
Before this, it was possible to make a single URL show up differently
 on youtube itself, and if you downloaded/viewed it with youtube-dl/mpv

											
										
										
											2015-08-10 13:52:38 -05:00
+								            'note': 'Use the first video ID in the URL',
 								            'info_dict': {
 								                'id': 'BaW_jenozKc',
 								                'ext': 'mp4',
-												renaming issues resolved


											
										
										
											2020-09-02 15:37:35 -05:00
+								                'title': 'youtube-dl test video "\'/\\ä↭𝕐',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'channel': 'Philipp Hagemeister',
 								                'channel_id': 'UCLqxVugv74EIW3VWh2NOa3Q',
 								                'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCLqxVugv74EIW3VWh2NOa3Q',
-												[youtube] Use the first v= argument in the URL

This is according to how youtube handles multiple v= values in one URL.
Before this, it was possible to make a single URL show up differently
 on youtube itself, and if you downloaded/viewed it with youtube-dl/mpv

											
										
										
											2015-08-10 13:52:38 -05:00
+								                'upload_date': '20121002',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'description': 'md5:8fb536f4877b8a7455c2ec23794dbc22',
-												[youtube] Use the first v= argument in the URL

This is according to how youtube handles multiple v= values in one URL.
Before this, it was possible to make a single URL show up differently
 on youtube itself, and if you downloaded/viewed it with youtube-dl/mpv

											
										
										
											2015-08-10 13:52:38 -05:00
+								                'categories': ['Science & Technology'],
-												renaming issues resolved


											
										
										
											2020-09-02 15:37:35 -05:00
+								                'tags': ['youtube-dl'],
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 10,
-												[youtube] Add fallback metadata extraction from videoDetails (closes #18052)

											
										
										
											2018-11-02 18:26:16 -05:00
+								                'view_count': int,
-												[youtube] Use the first v= argument in the URL

This is according to how youtube handles multiple v= values in one URL.
Before this, it was possible to make a single URL show up differently
 on youtube itself, and if you downloaded/viewed it with youtube-dl/mpv

											
										
										
											2015-08-10 13:52:38 -05:00
+								                'like_count': int,
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'availability': 'public',
 								                'playable_in_embed': True,
 								                'thumbnail': 'https://i.ytimg.com/vi/BaW_jenozKc/maxresdefault.jpg',
 								                'live_status': 'not_live',
 								                'age_limit': 0,
-												[extractor/youtube, cleanup] Fix tests (#4293)

Authored by: sheerluck
											
										
										
											2022-07-07 16:20:02 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Philipp Hagemeister',
 								                'uploader_url': 'https://www.youtube.com/@PhilippHagemeister',
 								                'uploader_id': '@PhilippHagemeister',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1349198244,
-												[youtube] Skip download for multiple v= test

											
										
										
											2015-08-10 14:22:06 -05:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[youtube] Use the first v= argument in the URL

This is according to how youtube handles multiple v= values in one URL.
Before this, it was possible to make a single URL show up differently
 on youtube itself, and if you downloaded/viewed it with youtube-dl/mpv

											
										
										
											2015-08-10 13:52:38 -05:00
+								        },
-												[youtube] Download DASH manifest

If given, download and parse the DASH manifest file, in order to get ultra-HQ formats.
Fixes #2166

											
										
										
											2014-01-18 22:47:20 -06:00
+								        {
-												[youtube] Change test URLs from http to https

											
										
										
											2016-09-17 09:48:20 -05:00
+								            'url': 'https://www.youtube.com/watch?v=a9LDPn-MO4I',
-												[youtube] Modernize

											
										
										
											2014-09-24 02:49:53 -05:00
+								            'note': '256k DASH audio (format 141) via DASH manifest',
 								            'info_dict': {
 								                'id': 'a9LDPn-MO4I',
 								                'ext': 'm4a',
 								                'upload_date': '20121002',
 								                'description': '',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                'title': 'UHDTV TEST 8K VIDEO.mp4',
-												[youtube] Make DASH manifest download conditional for now

DASH download fails on many videos (all with encrypted signatures? not sure yet), for example 07FYdnEawAQ, with a 403.

											
										
										
											2014-01-22 14:56:37 -06:00
+								            },
-												[youtube] Modernize

											
										
										
											2014-09-24 02:49:53 -05:00
+								            'params': {
 								                'youtube_include_dash_manifest': True,
 								                'format': '141',
-												[youtube] Make DASH manifest download conditional for now

DASH download fails on many videos (all with encrypted signatures? not sure yet), for example 07FYdnEawAQ, with a 403.

											
										
										
											2014-01-22 14:56:37 -06:00
+								            },
-												[youtube] Fix 141 format tests

											
										
										
											2016-06-24 10:27:55 -05:00
+								            'skip': 'format 141 not served anymore',
-												[youtube] Download DASH manifest

If given, download and parse the DASH manifest file, in order to get ultra-HQ formats.
Fixes #2166

											
										
										
											2014-01-18 22:47:20 -06:00
+								        },
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 13:22:59 -06:00
+								        # DASH manifest with encrypted signature
 								        {
 								            'url': 'https://www.youtube.com/watch?v=IB3lcPjvWLA',
 								            'info_dict': {
 								                'id': 'IB3lcPjvWLA',
 								                'ext': 'm4a',
 								                'title': 'Afrojack, Spree Wilson - The Spark (Official Music Video) ft. Spree Wilson',
 								                'description': 'md5:8f5e2b82460520b619ccac1f509d43bf',
 								                'duration': 244,
 								                'upload_date': '20131011',
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								                'abr': 129.495,
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'like_count': int,
 								                'channel_id': 'UChuZAo1RKL85gev3Eal9_zg',
 								                'playable_in_embed': True,
 								                'channel_url': 'https://www.youtube.com/channel/UChuZAo1RKL85gev3Eal9_zg',
 								                'view_count': int,
 								                'track': 'The Spark',
 								                'live_status': 'not_live',
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/IB3lcPjvWLA/maxresdefault.webp',
 								                'channel': 'Afrojack',
 								                'tags': 'count:19',
 								                'availability': 'public',
 								                'categories': ['Music'],
 								                'age_limit': 0,
 								                'alt_title': 'The Spark',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Afrojack',
 								                'uploader_url': 'https://www.youtube.com/@Afrojack',
 								                'uploader_id': '@Afrojack',
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 13:22:59 -06:00
+								            },
 								            'params': {
 								                'youtube_include_dash_manifest': True,
 								                'format': '141/bestaudio[ext=m4a]',
 								            },
 								        },
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 09:03:59 -05:00
+								        # Age-gate videos. See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
-												[youtube] Add a normal age-gate test video

											
										
										
											2014-11-30 14:45:49 -06:00
+								        {
-												[ie/youtube] Add age-gate workaround for some embeddable videos (#11821)

Closes #11296
Authored by: bashonly
											
										
										
											2024-12-15 14:09:48 -06:00
+								            'note': 'Embed allowed age-gate video; works with web_embedded',
-												[youtube] Change test URLs from http to https

											
										
										
											2016-09-17 09:48:20 -05:00
+								            'url': 'https://youtube.com/watch?v=HtVdAasjOgU',
-												[youtube] Add a normal age-gate test video

											
										
										
											2014-11-30 14:45:49 -06:00
+								            'info_dict': {
 								                'id': 'HtVdAasjOgU',
 								                'ext': 'mp4',
 								                'title': 'The Witcher 3: Wild Hunt - The Sword Of Destiny Trailer',
-												Fix "invalid escape sequences" error on Python 3.6

											
										
										
											2017-01-02 06:08:07 -06:00
+								                'description': r're:(?s).{100,}About the Game\n.*?The Witcher 3: Wild Hunt.{100,}',
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 142,
-												[youtube] Add a normal age-gate test video

											
										
										
											2014-11-30 14:45:49 -06:00
+								                'upload_date': '20140605',
-												[youtube] Add age limit to tests

											
										
										
											2015-08-10 14:24:53 -05:00
+								                'age_limit': 18,
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'categories': ['Gaming'],
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/HtVdAasjOgU/maxresdefault.webp',
 								                'availability': 'needs_auth',
 								                'channel_url': 'https://www.youtube.com/channel/UCzybXLxv08IApdjdN0mJhEg',
 								                'like_count': int,
 								                'channel': 'The Witcher',
 								                'live_status': 'not_live',
 								                'tags': 'count:17',
 								                'channel_id': 'UCzybXLxv08IApdjdN0mJhEg',
 								                'playable_in_embed': True,
 								                'view_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'The Witcher',
 								                'uploader_url': 'https://www.youtube.com/@thewitcher',
 								                'uploader_id': '@thewitcher',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1401991663,
-												[youtube] Add a normal age-gate test video

											
										
										
											2014-11-30 14:45:49 -06:00
+								            },
 								        },
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 09:03:59 -05:00
+								        {
 								            'note': 'Age-gate video with embed allowed in public site',
 								            'url': 'https://youtube.com/watch?v=HsUATh_Nc2U',
 								            'info_dict': {
 								                'id': 'HsUATh_Nc2U',
 								                'ext': 'mp4',
 								                'title': 'Godzilla 2 (Official Video)',
 								                'description': 'md5:bf77e03fcae5529475e500129b05668a',
 								                'upload_date': '20200408',
 								                'age_limit': 18,
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'availability': 'needs_auth',
 								                'channel_id': 'UCYQT13AtrJC0gsM1far_zJg',
 								                'channel': 'FlyingKitty',
 								                'channel_url': 'https://www.youtube.com/channel/UCYQT13AtrJC0gsM1far_zJg',
 								                'view_count': int,
 								                'categories': ['Entertainment'],
 								                'live_status': 'not_live',
 								                'tags': ['Flyingkitty', 'godzilla 2'],
 								                'thumbnail': 'https://i.ytimg.com/vi/HsUATh_Nc2U/maxresdefault.jpg',
 								                'like_count': int,
 								                'duration': 177,
 								                'playable_in_embed': True,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'FlyingKitty',
 								                'uploader_url': 'https://www.youtube.com/@FlyingKitty900',
 								                'uploader_id': '@FlyingKitty900',
-												[extractor/youtube] Extract `heatmap` data (#7100)

Closes #3888
Authored by: tntmod54321
											
										
										
											2023-05-26 07:24:39 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 09:03:59 -05:00
+								            },
-												[ie/youtube] Remove broken age-restriction workaround (#11297)

Closes #11296
Authored by: bashonly

											
										
										
											2024-10-20 17:25:29 -05:00
+								            'skip': 'Age-restricted; requires authentication',
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 09:03:59 -05:00
+								        },
 								        {
 								            'note': 'Age-gate video embedable only with clientScreen=EMBED',
 								            'url': 'https://youtube.com/watch?v=Tq92D6wQ1mg',
 								            'info_dict': {
 								                'id': 'Tq92D6wQ1mg',
 								                'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
-												[youtube] Misc cleanup (#577)

Authored by: pukkandan, colethedj

											
										
										
											2021-07-30 14:43:26 -05:00
+								                'ext': 'mp4',
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								                'upload_date': '20191228',
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 09:03:59 -05:00
+								                'description': 'md5:17eccca93a786d51bc67646756894066',
 								                'age_limit': 18,
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'like_count': int,
 								                'availability': 'needs_auth',
 								                'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
 								                'view_count': int,
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/Tq92D6wQ1mg/sddefault.webp',
 								                'channel': 'Projekt Melody',
 								                'live_status': 'not_live',
 								                'tags': ['mmd', 'dance', 'mikumikudance', 'kpop', 'vtuber'],
 								                'playable_in_embed': True,
 								                'categories': ['Entertainment'],
 								                'duration': 106,
 								                'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
-												[extractor/youtube, cleanup] Fix tests (#4293)

Authored by: sheerluck
											
										
										
											2022-07-07 16:20:02 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Projekt Melody',
 								                'uploader_url': 'https://www.youtube.com/@ProjektMelody',
 								                'uploader_id': '@ProjektMelody',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1577508724,
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 09:03:59 -05:00
+								            },
-												[ie/youtube] Remove broken age-restriction workaround (#11297)

Closes #11296
Authored by: bashonly

											
										
										
											2024-10-20 17:25:29 -05:00
+								            'skip': 'Age-restricted; requires authentication',
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 09:03:59 -05:00
+								        },
 								        {
 								            'note': 'Non-Agegated non-embeddable video',
 								            'url': 'https://youtube.com/watch?v=MeJVWBSsPAY',
 								            'info_dict': {
 								                'id': 'MeJVWBSsPAY',
 								                'ext': 'mp4',
 								                'title': 'OOMPH! - Such Mich Find Mich (Lyrics)',
 								                'description': 'Fan Video. Music & Lyrics by OOMPH!.',
 								                'upload_date': '20130730',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'track': 'Such mich find mich',
 								                'age_limit': 0,
 								                'tags': ['oomph', 'such mich find mich', 'lyrics', 'german industrial', 'musica industrial'],
 								                'like_count': int,
 								                'playable_in_embed': False,
 								                'creator': 'OOMPH!',
 								                'thumbnail': 'https://i.ytimg.com/vi/MeJVWBSsPAY/sddefault.jpg',
 								                'view_count': int,
 								                'alt_title': 'Such mich find mich',
 								                'duration': 210,
 								                'channel': 'Herr Lurik',
 								                'channel_id': 'UCdR3RSDPqub28LjZx0v9-aA',
 								                'categories': ['Music'],
 								                'availability': 'public',
 								                'channel_url': 'https://www.youtube.com/channel/UCdR3RSDPqub28LjZx0v9-aA',
 								                'live_status': 'not_live',
 								                'artist': 'OOMPH!',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Herr Lurik',
 								                'uploader_url': 'https://www.youtube.com/@HerrLurik',
 								                'uploader_id': '@HerrLurik',
-												[youtube] Add `thirdParty` to agegate clients (#577)
* This allows more videos like `tf2U5Vyj0oU` to become embeddable
    See https://github.com/yt-dlp/yt-dlp/pull/575#issuecomment-888837000
* Also added tests for all types of age-gate

Closes #581

											
										
										
											2021-07-27 09:03:59 -05:00
+								            },
 								        },
 								        {
 								            'note': 'Non-bypassable age-gated video',
 								            'url': 'https://youtube.com/watch?v=Cr381pDsSsA',
 								            'only_matching': True,
 								        },
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 13:22:59 -06:00
+								        # video_info is None (https://github.com/ytdl-org/youtube-dl/issues/4421)
 								        # YouTube Red ad is not captured for creator
 								        {
 								            'url': '__2ABJjxzNo',
 								            'info_dict': {
 								                'id': '__2ABJjxzNo',
 								                'ext': 'mp4',
 								                'duration': 266,
 								                'upload_date': '20100430',
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                'creator': 'deadmau5',
 								                'description': 'md5:6cbcd3a92ce1bc676fc4d6ab4ace2336',
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 13:22:59 -06:00
+								                'title': 'Deadmau5 - Some Chords (HD)',
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                'alt_title': 'Some Chords',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'availability': 'public',
 								                'tags': 'count:14',
 								                'channel_id': 'UCYEK6xds6eo-3tr4xRdflmQ',
 								                'view_count': int,
 								                'live_status': 'not_live',
 								                'channel': 'deadmau5',
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/__2ABJjxzNo/maxresdefault.webp',
 								                'like_count': int,
 								                'track': 'Some Chords',
 								                'artist': 'deadmau5',
 								                'playable_in_embed': True,
 								                'age_limit': 0,
 								                'channel_url': 'https://www.youtube.com/channel/UCYEK6xds6eo-3tr4xRdflmQ',
 								                'categories': ['Music'],
 								                'album': 'Some Chords',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'deadmau5',
 								                'uploader_url': 'https://www.youtube.com/@deadmau5',
 								                'uploader_id': '@deadmau5',
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 13:22:59 -06:00
+								            },
 								            'expected_warnings': [
 								                'DASH manifest missing',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            ],
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 13:22:59 -06:00
+								        },
-												Start moving to ytdl-org

											
										
										
											2019-03-09 06:14:41 -06:00
+								        # Olympics (https://github.com/ytdl-org/youtube-dl/issues/4431)
-												[youtube] Add test case for #4431

											
										
										
											2014-12-11 09:28:07 -06:00
+								        {
 								            'url': 'lqQg6PlCWgI',
 								            'info_dict': {
 								                'id': 'lqQg6PlCWgI',
 								                'ext': 'mp4',
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 6085,
-												[youtube] Fix test

											
										
										
											2015-11-23 09:37:21 -06:00
+								                'upload_date': '20150827',
-												[extractor/youtube, cleanup] Fix tests (#4293)

Authored by: sheerluck
											
										
										
											2022-07-07 16:20:02 -05:00
+								                'description': 'md5:04bbbf3ccceb6795947572ca36f45904',
-												[youtube] Amend test

											
										
										
											2014-12-11 09:34:37 -06:00
+								                'title': 'Hockey - Women -  GER-AUS - London 2012 Olympic Games',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'like_count': int,
 								                'release_timestamp': 1343767800,
 								                'playable_in_embed': True,
 								                'categories': ['Sports'],
 								                'release_date': '20120731',
 								                'channel': 'Olympics',
 								                'tags': ['Hockey', '2012-07-31', '31 July 2012', 'Riverbank Arena', 'Session', 'Olympics', 'Olympic Games', 'London 2012', '2012 Summer Olympics', 'Summer Games'],
 								                'channel_id': 'UCTl3QQTvqHFjurroKxexy2Q',
 								                'thumbnail': 'https://i.ytimg.com/vi/lqQg6PlCWgI/maxresdefault.jpg',
 								                'age_limit': 0,
 								                'availability': 'public',
 								                'live_status': 'was_live',
 								                'view_count': int,
 								                'channel_url': 'https://www.youtube.com/channel/UCTl3QQTvqHFjurroKxexy2Q',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Olympics',
 								                'uploader_url': 'https://www.youtube.com/@Olympics',
 								                'uploader_id': '@Olympics',
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1440707674,
-												[youtube] Amend test

											
										
										
											2014-12-11 09:34:37 -06:00
+								            },
 								            'params': {
 								                'skip_download': 'requires avconv',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            },
-												[youtube] Amend test

											
										
										
											2014-12-11 09:34:37 -06:00
+								        },
-												[youtube|ffmpeg] Automatically correct video with non-square pixels (Fixes #4674)

											
										
										
											2015-01-09 22:45:51 -06:00
+								        # Non-square pixels
 								        {
 								            'url': 'https://www.youtube.com/watch?v=_b-2C3KPAM0',
 								            'info_dict': {
 								                'id': '_b-2C3KPAM0',
 								                'ext': 'mp4',
 								                'stretched_ratio': 16 / 9.,
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 85,
-												[youtube|ffmpeg] Automatically correct video with non-square pixels (Fixes #4674)

											
										
										
											2015-01-09 22:45:51 -06:00
+								                'upload_date': '20110310',
 								                'description': 'made by Wacom from Korea | 字幕&加油添醋 by TY\'s Allen | 感謝heylisa00cavey1001同學熱情提供梗及翻譯',
 								                'title': '[A-made] 變態妍字幕版 太妍 我就是這樣的人',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'playable_in_embed': True,
 								                'channel': '孫ᄋᄅ',
 								                'age_limit': 0,
 								                'tags': 'count:11',
 								                'channel_url': 'https://www.youtube.com/channel/UCS-xxCmRaA6BFdmgDPA_BIw',
 								                'channel_id': 'UCS-xxCmRaA6BFdmgDPA_BIw',
 								                'thumbnail': 'https://i.ytimg.com/vi/_b-2C3KPAM0/maxresdefault.jpg',
 								                'view_count': int,
 								                'categories': ['People & Blogs'],
 								                'like_count': int,
 								                'live_status': 'not_live',
 								                'availability': 'unlisted',
-												[extractor/youtube, cleanup] Fix tests (#4293)

Authored by: sheerluck
											
										
										
											2022-07-07 16:20:02 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': '孫ᄋᄅ',
 								                'uploader_url': 'https://www.youtube.com/@AllenMeow',
 								                'uploader_id': '@AllenMeow',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1299776999,
-												[youtube|ffmpeg] Automatically correct video with non-square pixels (Fixes #4674)

											
										
										
											2015-01-09 22:45:51 -06:00
+								            },
-												[youtube] Add test for #5361

											
										
										
											2015-04-05 13:35:55 -05:00
+								        },
 								        # url_encoded_fmt_stream_map is empty string
 								        {
 								            'url': 'qEJwOuvDf7I',
 								            'info_dict': {
 								                'id': 'qEJwOuvDf7I',
-												[youtube] Update tests

											
										
										
											2015-08-12 10:27:58 -05:00
+								                'ext': 'webm',
-												[youtube] Add test for #5361

											
										
										
											2015-04-05 13:35:55 -05:00
+								                'title': 'Обсуждение судебной практики по выборам 14 сентября 2014 года в Санкт-Петербурге',
 								                'description': '',
 								                'upload_date': '20150404',
 								            },
 								            'params': {
 								                'skip_download': 'requires avconv',
-												[youtube] Skip test

											
										
										
											2016-01-19 08:56:04 -06:00
+								            },
 								            'skip': 'This live event has ended.',
-												[youtube] Add test for #5361

											
										
										
											2015-04-05 13:35:55 -05:00
+								        },
-												Start moving to ytdl-org

											
										
										
											2019-03-09 06:14:41 -06:00
+								        # Extraction from multiple DASH manifests (https://github.com/ytdl-org/youtube-dl/pull/6097)
-												[youtube] Add test for #6093

											
										
										
											2015-06-27 03:55:46 -05:00
+								        {
 								            'url': 'https://www.youtube.com/watch?v=FIl7x6_3R5Y',
 								            'info_dict': {
 								                'id': 'FIl7x6_3R5Y',
-												[youtube] Update tests

											
										
										
											2018-06-02 14:23:45 -05:00
+								                'ext': 'webm',
-												[youtube] Add test for #6093

											
										
										
											2015-06-27 03:55:46 -05:00
+								                'title': 'md5:7b81415841e02ecd4313668cde88737a',
 								                'description': 'md5:116377fd2963b81ec4ce64b542173306',
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 220,
-												[youtube] Add test for #6093

											
										
										
											2015-06-27 03:55:46 -05:00
+								                'upload_date': '20150625',
-												[youtube] Update tests

											
										
										
											2018-06-02 14:23:45 -05:00
+								                'formats': 'mincount:31',
-												[youtube] Add test for #6093

											
										
										
											2015-06-27 03:55:46 -05:00
+								            },
-												[youtube] Update tests

											
										
										
											2018-06-02 14:23:45 -05:00
+								            'skip': 'not actual anymore',
-												Merge remote-tracking branch 'yan12125/download-dash-segments' (#5886)

											
										
										
											2015-07-20 12:34:24 -05:00
+								        },
-												[youtube] Add a test for the DASH segment downloader

											
										
										
											2015-06-10 01:47:02 -05:00
+								        # DASH manifest with segment_list
 								        {
 								            'url': 'https://www.youtube.com/embed/CsmdDsKjzN8',
 								            'md5': '8ce563a1d667b599d21064e982ab9e31',
 								            'info_dict': {
 								                'id': 'CsmdDsKjzN8',
 								                'ext': 'mp4',
-												[youtube] Fix upload_date in test

											
										
										
											2015-07-20 12:48:50 -05:00
+								                'upload_date': '20150501',  # According to '<meta itemprop="datePublished"', but in other places it's 20150510
-												[youtube] Add a test for the DASH segment downloader

											
										
										
											2015-06-10 01:47:02 -05:00
+								                'description': 'Retransmisión en directo de la XVIII media maratón de Zaragoza.',
 								                'title': 'Retransmisión XVIII Media maratón Zaragoza 2015',
 								            },
 								            'params': {
 								                'youtube_include_dash_manifest': True,
 								                'format': '135',  # bestvideo
-												[youtube] Fix and skip some tests

											
										
										
											2016-06-24 10:47:19 -05:00
+								            },
 								            'skip': 'This live event has ended.',
-												Merge remote-tracking branch 'yan12125/download-dash-segments' (#5886)

											
										
										
											2015-07-20 12:34:24 -05:00
+								        },
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								        {
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								            # Multifeed videos (multiple cameras), URL can be of any Camera
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								            # TODO: fix multifeed titles
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								            'url': 'https://www.youtube.com/watch?v=zaPI8MvL8pg',
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								            'info_dict': {
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								                'id': 'zaPI8MvL8pg',
 								                'title': 'Terraria 1.2 Live Stream | Let\'s Play - Part 04',
 								                'description': 'md5:563ccbc698b39298481ca3c571169519',
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								            },
 								            'playlist': [{
 								                'info_dict': {
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								                    'id': 'j5yGuxZ8lLU',
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								                    'ext': 'mp4',
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								                    'title': 'Terraria 1.2 Live Stream | Let\'s Play - Part 04 (Chris)',
 								                    'description': 'md5:563ccbc698b39298481ca3c571169519',
 								                    'duration': 10120,
 								                    'channel_follower_count': int,
 								                    'channel_url': 'https://www.youtube.com/channel/UCN2XePorRokPB9TEgRZpddg',
 								                    'availability': 'public',
 								                    'playable_in_embed': True,
 								                    'upload_date': '20131105',
 								                    'categories': ['Gaming'],
 								                    'live_status': 'was_live',
 								                    'tags': 'count:24',
 								                    'release_timestamp': 1383701910,
 								                    'thumbnail': 'https://i.ytimg.com/vi/j5yGuxZ8lLU/maxresdefault.jpg',
 								                    'comment_count': int,
 								                    'age_limit': 0,
 								                    'like_count': int,
 								                    'channel_id': 'UCN2XePorRokPB9TEgRZpddg',
 								                    'channel': 'WiiLikeToPlay',
 								                    'view_count': int,
 								                    'release_date': '20131106',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                    'uploader': 'WiiLikeToPlay',
 								                    'uploader_id': '@WLTP',
 								                    'uploader_url': 'https://www.youtube.com/@WLTP',
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								                },
 								            }, {
 								                'info_dict': {
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								                    'id': 'zaPI8MvL8pg',
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								                    'ext': 'mp4',
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								                    'title': 'Terraria 1.2 Live Stream | Let\'s Play - Part 04 (Tyson)',
 								                    'availability': 'public',
 								                    'channel_url': 'https://www.youtube.com/channel/UCN2XePorRokPB9TEgRZpddg',
 								                    'channel': 'WiiLikeToPlay',
 								                    'channel_follower_count': int,
 								                    'description': 'md5:563ccbc698b39298481ca3c571169519',
 								                    'duration': 10108,
 								                    'age_limit': 0,
 								                    'like_count': int,
 								                    'tags': 'count:24',
 								                    'channel_id': 'UCN2XePorRokPB9TEgRZpddg',
 								                    'release_timestamp': 1383701915,
 								                    'comment_count': int,
 								                    'upload_date': '20131105',
 								                    'thumbnail': 'https://i.ytimg.com/vi/zaPI8MvL8pg/maxresdefault.jpg',
 								                    'release_date': '20131106',
 								                    'playable_in_embed': True,
 								                    'live_status': 'was_live',
 								                    'categories': ['Gaming'],
 								                    'view_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                    'uploader': 'WiiLikeToPlay',
 								                    'uploader_id': '@WLTP',
 								                    'uploader_url': 'https://www.youtube.com/@WLTP',
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								                },
 								            }, {
 								                'info_dict': {
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								                    'id': 'R7r3vfO7Hao',
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								                    'ext': 'mp4',
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								                    'title': 'Terraria 1.2 Live Stream | Let\'s Play - Part 04 (Spencer)',
 								                    'thumbnail': 'https://i.ytimg.com/vi/R7r3vfO7Hao/maxresdefault.jpg',
 								                    'channel_id': 'UCN2XePorRokPB9TEgRZpddg',
 								                    'like_count': int,
 								                    'availability': 'public',
 								                    'playable_in_embed': True,
 								                    'upload_date': '20131105',
 								                    'description': 'md5:563ccbc698b39298481ca3c571169519',
 								                    'channel_follower_count': int,
 								                    'tags': 'count:24',
 								                    'release_date': '20131106',
 								                    'comment_count': int,
 								                    'channel_url': 'https://www.youtube.com/channel/UCN2XePorRokPB9TEgRZpddg',
 								                    'channel': 'WiiLikeToPlay',
 								                    'categories': ['Gaming'],
 								                    'release_timestamp': 1383701914,
 								                    'live_status': 'was_live',
 								                    'age_limit': 0,
 								                    'duration': 10128,
 								                    'view_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                    'uploader': 'WiiLikeToPlay',
 								                    'uploader_id': '@WLTP',
 								                    'uploader_url': 'https://www.youtube.com/@WLTP',
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
+								                },
 								            }],
-												[cleanup] Misc

Closes #5541

											
										
										
											2022-11-15 18:57:43 -06:00
+								            'params': {'skip_download': True},
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								            'skip': 'Not multifeed anymore',
-												[youtube] Expand _VALID_URL to support vid.plus

											
										
										
											2015-08-16 15:04:13 -05:00
+								        },
-												[youtube] Add test for #8536

											
										
										
											2016-02-12 17:18:58 -06:00
+								        {
-												Start moving to ytdl-org

											
										
										
											2019-03-09 06:14:41 -06:00
+								            # Multifeed video with comma in title (see https://github.com/ytdl-org/youtube-dl/issues/8536)
-												[youtube] Add test for #8536

											
										
										
											2016-02-12 17:18:58 -06:00
+								            'url': 'https://www.youtube.com/watch?v=gVfLd0zydlo',
 								            'info_dict': {
 								                'id': 'gVfLd0zydlo',
 								                'title': 'DevConf.cz 2016 Day 2 Workshops 1 14:00 - 15:30',
 								            },
 								            'playlist_count': 2,
-												[youtube] Fix and skip some tests

											
										
										
											2016-06-24 10:47:19 -05:00
+								            'skip': 'Not multifeed anymore',
-												[youtube] Add test for #8536

											
										
										
											2016-02-12 17:18:58 -06:00
+								        },
-												[youtube] Expand _VALID_URL to support vid.plus

											
										
										
											2015-08-16 15:04:13 -05:00
+								        {
-												[youtube] Change test URLs from http to https

											
										
										
											2016-09-17 09:48:20 -05:00
+								            'url': 'https://vid.plus/FlRa-iH7PGw',
-												[youtube] Expand _VALID_URL to support vid.plus

											
										
										
											2015-08-16 15:04:13 -05:00
+								            'only_matching': True,
-												[youtube] Fall back to the original regex for ytplayer.config

											
										
										
											2015-11-22 06:49:33 -06:00
+								        },
-												[youtube] Add support for zwearz (Closes #9062)

											
										
										
											2016-04-03 15:26:20 -05:00
+								        {
-												[youtube] Change test URLs from http to https

											
										
										
											2016-09-17 09:48:20 -05:00
+								            'url': 'https://zwearz.com/watch/9lWxNJF-ufM/electra-woman-dyna-girl-official-trailer-grace-helbig.html',
-												[youtube] Add support for zwearz (Closes #9062)

											
										
										
											2016-04-03 15:26:20 -05:00
+								            'only_matching': True,
 								        },
-												[youtube] Fall back to the original regex for ytplayer.config

											
										
										
											2015-11-22 06:49:33 -06:00
+								        {
-												Start moving to ytdl-org

											
										
										
											2019-03-09 06:14:41 -06:00
+								            # Title with JS-like syntax "};" (see https://github.com/ytdl-org/youtube-dl/issues/7468)
-												[youtube] Clarify test_Youtube_18

											
										
										
											2016-01-18 11:19:38 -06:00
+								            # Also tests cut-off URL expansion in video description (see
-												Start moving to ytdl-org

											
										
										
											2019-03-09 06:14:41 -06:00
+								            # https://github.com/ytdl-org/youtube-dl/issues/1892,
 								            # https://github.com/ytdl-org/youtube-dl/issues/8164)
-												[youtube] Fall back to the original regex for ytplayer.config

											
										
										
											2015-11-22 06:49:33 -06:00
+								            'url': 'https://www.youtube.com/watch?v=lsguqyKfVQg',
 								            'info_dict': {
 								                'id': 'lsguqyKfVQg',
 								                'ext': 'mp4',
 								                'title': '{dark walk}; Loki/AC/Dishonored; collab w/Elflover21',
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								                'alt_title': 'Dark Walk',
-												[youtube] Fall back to the original regex for ytplayer.config

											
										
										
											2015-11-22 06:49:33 -06:00
+								                'description': 'md5:8085699c11dc3f597ce0410b0dcbb34a',
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 133,
-												[youtube] Fall back to the original regex for ytplayer.config

											
										
										
											2015-11-22 06:49:33 -06:00
+								                'upload_date': '20151119',
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								                'creator': 'Todd Haberman;\nDaniel Law Heath and Aaron Kaplan',
 								                'track': 'Dark Walk',
 								                'artist': 'Todd Haberman;\nDaniel Law Heath and Aaron Kaplan',
-												[youtube] extract album from Music in this video section(#20301)

											
										
										
											2019-04-28 11:37:46 -05:00
+								                'album': 'Position Music - Production Music Vol. 143 - Dark Walk',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'thumbnail': 'https://i.ytimg.com/vi_webp/lsguqyKfVQg/maxresdefault.webp',
 								                'categories': ['Film & Animation'],
 								                'view_count': int,
 								                'live_status': 'not_live',
 								                'channel_url': 'https://www.youtube.com/channel/UCTSRgz5jylBvFt_S7wnsqLQ',
 								                'channel_id': 'UCTSRgz5jylBvFt_S7wnsqLQ',
 								                'tags': 'count:13',
 								                'availability': 'public',
 								                'channel': 'IronSoulElf',
 								                'playable_in_embed': True,
 								                'like_count': int,
 								                'age_limit': 0,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                'channel_follower_count': int,
-												[youtube] Fall back to the original regex for ytplayer.config

											
										
										
											2015-11-22 06:49:33 -06:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[youtube] Add test with '};' in tags

											
										
										
											2015-11-23 09:02:37 -06:00
+								        {
-												Start moving to ytdl-org

											
										
										
											2019-03-09 06:14:41 -06:00
+								            # Tags with '};' (see https://github.com/ytdl-org/youtube-dl/issues/7468)
-												[youtube] Add test with '};' in tags

											
										
										
											2015-11-23 09:02:37 -06:00
+								            'url': 'https://www.youtube.com/watch?v=Ms7iBXnlUO8',
 								            'only_matching': True,
 								        },
-												[youtube] Ignore yt:stretch with zero width/height

											
										
										
											2015-11-27 18:07:07 -06:00
+								        {
 								            # Video with yt:stretch=17:0
 								            'url': 'https://www.youtube.com/watch?v=Q39EVAstoRM',
 								            'info_dict': {
 								                'id': 'Q39EVAstoRM',
 								                'ext': 'mp4',
 								                'title': 'Clash Of Clans#14 Dicas De Ataque Para CV 4',
 								                'description': 'md5:ee18a25c350637c8faff806845bddee9',
 								                'upload_date': '20151107',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[youtube] Fix and skip some tests

											
										
										
											2016-06-24 10:47:19 -05:00
+								            'skip': 'This video does not exist.',
-												[youtube] Ignore yt:stretch with zero width/height

											
										
										
											2015-11-27 18:07:07 -06:00
+								        },
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-16 22:02:33 -05:00
+								        {
 								            # Video with incomplete 'yt:stretch=16:'
 								            'url': 'https://www.youtube.com/watch?v=FRhJzUSJbGI',
 								            'only_matching': True,
 								        },
-												[youtube] Extract license (Closes #8725)

											
										
										
											2016-03-02 11:07:25 -06:00
+								        {
 								            # Video licensed under Creative Commons
 								            'url': 'https://www.youtube.com/watch?v=M4gD1WSo5mA',
 								            'info_dict': {
 								                'id': 'M4gD1WSo5mA',
 								                'ext': 'mp4',
 								                'title': 'md5:e41008789470fc2533a3252216f1c1d1',
 								                'description': 'md5:a677553cf0840649b731a3024aeff4cc',
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 721,
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								                'upload_date': '20150128',
-												[youtube] Extract license (Closes #8725)

											
										
										
											2016-03-02 11:07:25 -06:00
+								                'license': 'Creative Commons Attribution license (reuse allowed)',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'channel_id': 'UCuLGmD72gJDBwmLw06X58SA',
 								                'channel_url': 'https://www.youtube.com/channel/UCuLGmD72gJDBwmLw06X58SA',
 								                'like_count': int,
 								                'age_limit': 0,
 								                'tags': ['Copyright (Legal Subject)', 'Law (Industry)', 'William W. Fisher (Author)'],
 								                'channel': 'The Berkman Klein Center for Internet & Society',
 								                'availability': 'public',
 								                'view_count': int,
 								                'categories': ['Education'],
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/M4gD1WSo5mA/maxresdefault.webp',
 								                'live_status': 'not_live',
 								                'playable_in_embed': True,
-												[cleanup] Misc

Closes #5162

											
										
										
											2022-10-18 12:58:57 -05:00
+								                'channel_follower_count': int,
 								                'chapters': list,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader': 'The Berkman Klein Center for Internet & Society',
 								                'uploader_id': '@BKCHarvard',
 								                'uploader_url': 'https://www.youtube.com/@BKCHarvard',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1422422076,
-												[youtube] Extract license (Closes #8725)

											
										
										
											2016-03-02 11:07:25 -06:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[youtube] Extract uploader_url (Closes #8724)

											
										
										
											2016-03-02 11:49:10 -06:00
+								        {
 								            'url': 'https://www.youtube.com/watch?v=eQcmzGIKrzg',
 								            'info_dict': {
 								                'id': 'eQcmzGIKrzg',
 								                'ext': 'mp4',
 								                'title': 'Democratic Socialism and Foreign Policy | Bernie Sanders',
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                'description': 'md5:13a2503d7b5904ef4b223aa101628f39',
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 4060,
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								                'upload_date': '20151120',
-												[youtube] Extract uploader_url (Closes #8724)

											
										
										
											2016-03-02 11:49:10 -06:00
+								                'license': 'Creative Commons Attribution license (reuse allowed)',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'playable_in_embed': True,
 								                'tags': 'count:12',
 								                'like_count': int,
 								                'channel_id': 'UCH1dpzjCEiGAt8CXkryhkZg',
 								                'age_limit': 0,
 								                'availability': 'public',
 								                'categories': ['News & Politics'],
 								                'channel': 'Bernie Sanders',
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/eQcmzGIKrzg/maxresdefault.webp',
 								                'view_count': int,
 								                'live_status': 'not_live',
 								                'channel_url': 'https://www.youtube.com/channel/UCH1dpzjCEiGAt8CXkryhkZg',
-												[extractor/youtube, cleanup] Fix tests (#4293)

Authored by: sheerluck
											
										
										
											2022-07-07 16:20:02 -05:00
+								                'comment_count': int,
-												[cleanup] Misc

Closes #5162

											
										
										
											2022-10-18 12:58:57 -05:00
+								                'channel_follower_count': int,
 								                'chapters': list,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader': 'Bernie Sanders',
 								                'uploader_url': 'https://www.youtube.com/@BernieSanders',
 								                'uploader_id': '@BernieSanders',
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1447987198,
-												[youtube] Extract uploader_url (Closes #8724)

											
										
										
											2016-03-02 11:49:10 -06:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[youtube] Extend _VALID_URL (Closes #7694)

											
										
										
											2015-11-29 09:01:59 -06:00
+								        {
 								            'url': 'https://www.youtube.com/watch?feature=player_embedded&amp;amp;v=V36LpHqtcDY',
 								            'only_matching': True,
-												[youtube] Add YouTube Red paid video reference test (#10059)

											
										
										
											2016-07-11 14:10:35 -05:00
+								        },
 								        {
-												Start moving to ytdl-org

											
										
										
											2019-03-09 06:14:41 -06:00
+								            # YouTube Red paid video (https://github.com/ytdl-org/youtube-dl/issues/10059)
-												[youtube] Add YouTube Red paid video reference test (#10059)

											
										
										
											2016-07-11 14:10:35 -05:00
+								            'url': 'https://www.youtube.com/watch?v=i1Ko8UG-Tdo',
 								            'only_matching': True,
-												[youtube] Add support for rental videos' previews (Closes #10532)

											
										
										
											2016-09-02 13:17:15 -05:00
+								        },
 								        {
 								            # Rental video preview
 								            'url': 'https://www.youtube.com/watch?v=yYr8q0y5Jfg',
 								            'info_dict': {
 								                'id': 'uGpuVWrhIzE',
 								                'ext': 'mp4',
 								                'title': 'Piku - Trailer',
 								                'description': 'md5:c36bd60c3fd6f1954086c083c72092eb',
 								                'upload_date': '20150811',
 								                'license': 'Standard YouTube License',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[youtube] Update tests

											
										
										
											2018-06-02 14:23:45 -05:00
+								            'skip': 'This video is not available.',
-												[youtube] Add test for itag 212 (#11575)

											
										
										
											2017-01-09 09:30:46 -06:00
+								        },
-												[youtube] Extract episode metadata (closes #9695, closes #11774)

											
										
										
											2017-01-21 05:10:32 -06:00
+								        {
 								            # YouTube Red video with episode data
 								            'url': 'https://www.youtube.com/watch?v=iqKdEhx-dD4',
 								            'info_dict': {
 								                'id': 'iqKdEhx-dD4',
 								                'ext': 'mp4',
 								                'title': 'Isolation - Mind Field (Ep 1)',
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                'description': 'md5:f540112edec5d09fc8cc752d3d4ba3cd',
-												[youtube] Add fallback for duration extraction (closes #11841)

											
										
										
											2017-01-26 08:43:14 -06:00
+								                'duration': 2085,
-												[youtube] Extract episode metadata (closes #9695, closes #11774)

											
										
										
											2017-01-21 05:10:32 -06:00
+								                'upload_date': '20170118',
 								                'series': 'Mind Field',
 								                'season_number': 1,
 								                'episode_number': 1,
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'thumbnail': 'https://i.ytimg.com/vi_webp/iqKdEhx-dD4/maxresdefault.webp',
 								                'tags': 'count:12',
 								                'view_count': int,
 								                'availability': 'public',
 								                'age_limit': 0,
 								                'channel': 'Vsauce',
 								                'episode': 'Episode 1',
 								                'categories': ['Entertainment'],
 								                'season': 'Season 1',
 								                'channel_id': 'UC6nSFpj9HTCZ5t-N3Rm3-HA',
 								                'channel_url': 'https://www.youtube.com/channel/UC6nSFpj9HTCZ5t-N3Rm3-HA',
 								                'like_count': int,
 								                'playable_in_embed': True,
 								                'live_status': 'not_live',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Vsauce',
 								                'uploader_url': 'https://www.youtube.com/@Vsauce',
 								                'uploader_id': '@Vsauce',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1484761047,
-												[youtube] Extract episode metadata (closes #9695, closes #11774)

											
										
										
											2017-01-21 05:10:32 -06:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								            'expected_warnings': [
 								                'Skipping DASH manifest',
 								            ],
 								        },
-												[youtube] Fix controversy videos extraction (closes #14027, closes #14029)

											
										
										
											2017-08-26 03:38:38 -05:00
+								        {
 								            # The following content has been identified by the YouTube community
 								            # as inappropriate or offensive to some audiences.
 								            'url': 'https://www.youtube.com/watch?v=6SJNVb0GnPI',
 								            'info_dict': {
 								                'id': '6SJNVb0GnPI',
 								                'ext': 'mp4',
 								                'title': 'Race Differences in Intelligence',
 								                'description': 'md5:5d161533167390427a1f8ee89a1fc6f1',
 								                'duration': 965,
 								                'upload_date': '20140124',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            'skip': 'This video has been removed for violating YouTube\'s policy on hate speech.',
-												[youtube] Fix controversy videos extraction (closes #14027, closes #14029)

											
										
										
											2017-08-26 03:38:38 -05:00
+								        },
-												[youtube] Add test for itag 212 (#11575)

											
										
										
											2017-01-09 09:30:46 -06:00
+								        {
 								            # itag 212
 								            'url': '1t24XAntNCY',
 								            'only_matching': True,
-												[youtube] Raise GeoRestrictedError

											
										
										
											2017-02-26 03:51:21 -06:00
+								        },
 								        {
 								            # geo restricted to JP
 								            'url': 'sJL6WA-aGkQ',
 								            'only_matching': True,
 								        },
-												[youtube] Add support for invidio.us (closes #17613)

											
										
										
											2018-09-23 12:14:49 -05:00
+								        {
 								            'url': 'https://invidio.us/watch?v=BaW_jenozKc',
 								            'only_matching': True,
 								        },
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 14:44:36 -06:00
+								        {
 								            'url': 'https://redirect.invidious.io/watch?v=BaW_jenozKc',
 								            'only_matching': True,
 								        },
 								        {
 								            # from https://nitter.pussthecat.org/YouTube/status/1360363141947944964#m
 								            'url': 'https://redirect.invidious.io/Yh0AhrY9GjA',
 								            'only_matching': True,
 								        },
-												[youtube] Detect DRM protected videos (#1774)

											
										
										
											2018-12-26 02:30:48 -06:00
+								        {
 								            # DRM protected
 								            'url': 'https://www.youtube.com/watch?v=s7_qI6_mIXc',
 								            'only_matching': True,
-												[youtube] Update tests and add a tests for #18804

											
										
										
											2019-01-15 13:18:27 -06:00
+								        },
 								        {
 								            # Video with unsupported adaptive stream type formats
 								            'url': 'https://www.youtube.com/watch?v=Z4Vy8R84T1U',
 								            'info_dict': {
 								                'id': 'Z4Vy8R84T1U',
 								                'ext': 'mp4',
 								                'title': 'saman SMAN 53 Jakarta(Sancety) opening COFFEE4th at SMAN 53 Jakarta',
 								                'description': 'md5:d41d8cd98f00b204e9800998ecf8427e',
 								                'duration': 433,
 								                'upload_date': '20130923',
 								                'formats': 'maxcount:10',
 								            },
 								            'params': {
 								                'skip_download': True,
 								                'youtube_include_dash_manifest': False,
 								            },
-												[youtube] Fix tests

											
										
										
											2020-03-05 11:05:50 -06:00
+								            'skip': 'not actual anymore',
-												[youtube] Extract additional meta data from video description on youtube music videos

YouTube music videos often have auto-generated video descriptions that can be
utilized to extract additional information about the video. This is desirable
in order to provide the user with as much meta data as possible. This commit
adds extraction methods for the following fields for youtube music videos:
- artist (fallback extraction methods added)
- track (fallback extraction methods added)
- album (new in this commit)
- release_date (new in this commit)
- release_year (new in this commit)

4 tests have been added to test this new functionality:
- YoutubeIE tests 27, 28, 29, and 30

Resolves: #20599

											
										
										
											2019-04-21 23:26:48 -05:00
+								        },
 								        {
-												[youtube] Improve YouTube Music auto-generated description parsing (closes #20742)

											
										
										
											2019-04-27 03:16:17 -05:00
+								            # Youtube Music Auto-generated description
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								            # TODO: fix metadata extraction
-												[youtube] Extract additional meta data from video description on youtube music videos

YouTube music videos often have auto-generated video descriptions that can be
utilized to extract additional information about the video. This is desirable
in order to provide the user with as much meta data as possible. This commit
adds extraction methods for the following fields for youtube music videos:
- artist (fallback extraction methods added)
- track (fallback extraction methods added)
- album (new in this commit)
- release_date (new in this commit)
- release_year (new in this commit)

4 tests have been added to test this new functionality:
- YoutubeIE tests 27, 28, 29, and 30

Resolves: #20599

											
										
										
											2019-04-21 23:26:48 -05:00
+								            'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
 								            'info_dict': {
 								                'id': 'MgNrAu2pzNs',
 								                'ext': 'mp4',
 								                'title': 'Voyeur Girl',
 								                'description': 'md5:7ae382a65843d6df2685993e90a8628f',
 								                'upload_date': '20190312',
-												[ie] Migrate commonly plural fields to lists (#8917)

Authored by: llistochek, pukkandan
Related: #3944
											
										
										
											2024-02-20 01:19:24 -06:00
+								                'artists': ['Stephen'],
 								                'creators': ['Stephen'],
-												[youtube] Extract additional meta data from video description on youtube music videos

YouTube music videos often have auto-generated video descriptions that can be
utilized to extract additional information about the video. This is desirable
in order to provide the user with as much meta data as possible. This commit
adds extraction methods for the following fields for youtube music videos:
- artist (fallback extraction methods added)
- track (fallback extraction methods added)
- album (new in this commit)
- release_date (new in this commit)
- release_year (new in this commit)

4 tests have been added to test this new functionality:
- YoutubeIE tests 27, 28, 29, and 30

Resolves: #20599

											
										
										
											2019-04-21 23:26:48 -05:00
+								                'track': 'Voyeur Girl',
 								                'album': 'it\'s too much love to know my dear',
 								                'release_date': '20190313',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'alt_title': 'Voyeur Girl',
 								                'view_count': int,
 								                'playable_in_embed': True,
 								                'like_count': int,
 								                'categories': ['Music'],
 								                'channel_url': 'https://www.youtube.com/channel/UC-pWHpBjdGG69N9mM2auIAA',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel': 'Stephen',  # TODO: should be "Stephen - Topic"
 								                'uploader': 'Stephen',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'availability': 'public',
 								                'duration': 169,
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/MgNrAu2pzNs/maxresdefault.webp',
 								                'age_limit': 0,
 								                'channel_id': 'UC-pWHpBjdGG69N9mM2auIAA',
 								                'tags': 'count:11',
 								                'live_status': 'not_live',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                'channel_follower_count': int,
-												[youtube] Extract additional meta data from video description on youtube music videos

YouTube music videos often have auto-generated video descriptions that can be
utilized to extract additional information about the video. This is desirable
in order to provide the user with as much meta data as possible. This commit
adds extraction methods for the following fields for youtube music videos:
- artist (fallback extraction methods added)
- track (fallback extraction methods added)
- album (new in this commit)
- release_date (new in this commit)
- release_year (new in this commit)

4 tests have been added to test this new functionality:
- YoutubeIE tests 27, 28, 29, and 30

Resolves: #20599

											
										
										
											2019-04-21 23:26:48 -05:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												[youtube] Add support for youtubekids.com (closes #23272)

											
										
										
											2019-11-30 10:51:34 -06:00
+								        {
 								            'url': 'https://www.youtubekids.com/watch?v=3b8nCWDgZ6Q',
 								            'only_matching': True,
 								        },
-												[youtube] Use redirected video id if any (closes #25063)

											
										
										
											2020-04-30 12:40:38 -05:00
+								        {
 								            # invalid -> valid video id redirection
 								            'url': 'DJztXj2GPfl',
 								            'info_dict': {
 								                'id': 'DJztXj2GPfk',
 								                'ext': 'mp4',
 								                'title': 'Panjabi MC - Mundian To Bach Ke (The Dictator Soundtrack)',
 								                'description': 'md5:bf577a41da97918e94fa9798d9228825',
 								                'upload_date': '20090125',
 								                'artist': 'Panjabi MC',
 								                'track': 'Beware of the Boys (Mundian to Bach Ke) - Motivo Hi-Lectro Remix',
 								                'album': 'Beware of the Boys (Mundian To Bach Ke)',
 								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            'skip': 'Video unavailable',
-												[youtube] Fix empty description extraction (#26575) (closes #26006)


											
										
										
											2020-09-13 09:23:21 -05:00
+								        },
 								        {
 								            # empty description results in an empty string
 								            'url': 'https://www.youtube.com/watch?v=x41yOUIvK2k',
 								            'info_dict': {
 								                'id': 'x41yOUIvK2k',
 								                'ext': 'mp4',
 								                'title': 'IMG 3456',
 								                'description': '',
 								                'upload_date': '20170613',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'view_count': int,
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/x41yOUIvK2k/maxresdefault.webp',
 								                'like_count': int,
 								                'channel_id': 'UCo03ZQPBW5U4UC3regpt1nw',
 								                'tags': [],
 								                'channel_url': 'https://www.youtube.com/channel/UCo03ZQPBW5U4UC3regpt1nw',
 								                'availability': 'public',
 								                'age_limit': 0,
 								                'categories': ['Pets & Animals'],
 								                'duration': 7,
 								                'playable_in_embed': True,
 								                'live_status': 'not_live',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel': 'l\'Or Vert asbl',
 								                'channel_follower_count': int,
 								                'uploader': 'l\'Or Vert asbl',
 								                'uploader_url': 'https://www.youtube.com/@ElevageOrVert',
 								                'uploader_id': '@ElevageOrVert',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1497343210,
-												[youtube] Fix empty description extraction (#26575) (closes #26006)


											
										
										
											2020-09-13 09:23:21 -05:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												Updated to release 2020.11.21.1

											
										
										
											2020-11-21 08:50:42 -06:00
+								        {
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 06:26:37 -06:00
+								            # with '};' inside yt initial data (see [1])
 								            # see [2] for an example with '};' inside ytInitialPlayerResponse
 								            # 1. https://github.com/ytdl-org/youtube-dl/issues/27093
 								            # 2. https://github.com/ytdl-org/youtube-dl/issues/27216
-												Updated to release 2020.11.21.1

											
										
										
											2020-11-21 08:50:42 -06:00
+								            'url': 'https://www.youtube.com/watch?v=CHqg6qOn4no',
 								            'info_dict': {
 								                'id': 'CHqg6qOn4no',
 								                'ext': 'mp4',
 								                'title': 'Part 77   Sort a list of simple types in c#',
 								                'description': 'md5:b8746fa52e10cdbf47997903f13b20dc',
 								                'upload_date': '20130831',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'channel_id': 'UCCTVrRB5KpIiK6V2GGVsR1Q',
 								                'like_count': int,
 								                'channel_url': 'https://www.youtube.com/channel/UCCTVrRB5KpIiK6V2GGVsR1Q',
 								                'live_status': 'not_live',
 								                'categories': ['Education'],
 								                'availability': 'public',
 								                'thumbnail': 'https://i.ytimg.com/vi/CHqg6qOn4no/sddefault.jpg',
 								                'tags': 'count:12',
 								                'playable_in_embed': True,
 								                'age_limit': 0,
 								                'view_count': int,
 								                'duration': 522,
 								                'channel': 'kudvenkat',
-												[extractor/youtube, cleanup] Fix tests (#4293)

Authored by: sheerluck
											
										
										
											2022-07-07 16:20:02 -05:00
+								                'comment_count': int,
-												[cleanup] Misc

Closes #5162

											
										
										
											2022-10-18 12:58:57 -05:00
+								                'channel_follower_count': int,
 								                'chapters': list,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader': 'kudvenkat',
 								                'uploader_url': 'https://www.youtube.com/@Csharp-video-tutorialsBlogspot',
 								                'uploader_id': '@Csharp-video-tutorialsBlogspot',
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1377976349,
-												Updated to release 2020.11.21.1

											
										
										
											2020-11-21 08:50:42 -06:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
 								        },
-												Update to ytdl-2021.01.03

											
										
										
											2021-01-01 06:26:37 -06:00
+								        {
 								            # another example of '};' in ytInitialData
 								            'url': 'https://www.youtube.com/watch?v=gVfgbahppCY',
 								            'only_matching': True,
 								        },
 								        {
 								            'url': 'https://www.youtube.com/watch_popup?v=63RmMXCd_bQ',
 								            'only_matching': True,
 								        },
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        {
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								            # https://github.com/ytdl-org/youtube-dl/pull/28094
 								            'url': 'OtqTfy26tG0',
 								            'info_dict': {
 								                'id': 'OtqTfy26tG0',
 								                'ext': 'mp4',
 								                'title': 'Burn Out',
 								                'description': 'md5:8d07b84dcbcbfb34bc12a56d968b6131',
 								                'upload_date': '20141120',
 								                'artist': 'The Cinematic Orchestra',
 								                'track': 'Burn Out',
 								                'album': 'Every Day',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'like_count': int,
 								                'live_status': 'not_live',
 								                'alt_title': 'Burn Out',
 								                'duration': 614,
 								                'age_limit': 0,
 								                'view_count': int,
 								                'channel_url': 'https://www.youtube.com/channel/UCIzsJBIyo8hhpFm1NK0uLgw',
 								                'creator': 'The Cinematic Orchestra',
 								                'channel': 'The Cinematic Orchestra',
 								                'tags': ['The Cinematic Orchestra', 'Every Day', 'Burn Out'],
 								                'channel_id': 'UCIzsJBIyo8hhpFm1NK0uLgw',
 								                'availability': 'public',
 								                'thumbnail': 'https://i.ytimg.com/vi/OtqTfy26tG0/maxresdefault.jpg',
 								                'categories': ['Music'],
 								                'playable_in_embed': True,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'The Cinematic Orchestra',
 								                'comment_count': int,
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        },
-												Update to ytdl-commit-cf2dbec
https://github.com/ytdl-org/youtube-dl/commit/cf2dbec6301177a1fddf72862de05fa912d9869d

Except: [kakao] improve info extraction and detect geo restriction
https://github.com/ytdl-org/youtube-dl/commit/d8085580f63ad3b146a31712ff76cf41d5a4558a

											
										
										
											2021-02-19 14:44:36 -06:00
+								        {
 								            # controversial video, only works with bpctr when authenticated with cookies
 								            'url': 'https://www.youtube.com/watch?v=nGC3D_FkCmg',
 								            'only_matching': True,
 								        },
-												[youtube] Fix controversial videos when requested via API (#533)

Closes: https://github.com/yt-dlp/yt-dlp/issues/511#issuecomment-883024350
Authored by: colethedj
											
										
										
											2021-07-20 13:01:28 -05:00
+								        {
 								            # controversial video, requires bpctr/contentCheckOk
 								            'url': 'https://www.youtube.com/watch?v=SZJvDhaSDnc',
 								            'info_dict': {
 								                'id': 'SZJvDhaSDnc',
 								                'ext': 'mp4',
 								                'title': 'San Diego teen commits suicide after bullying over embarrassing video',
 								                'channel_id': 'UC-SJ6nODDmufqBzPBwCvYvQ',
 								                'upload_date': '20140716',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'description': 'md5:acde3a73d3f133fc97e837a9f76b53b7',
 								                'duration': 170,
 								                'categories': ['News & Politics'],
 								                'view_count': int,
 								                'channel': 'CBS Mornings',
 								                'tags': ['suicide', 'bullying', 'video', 'cbs', 'news'],
 								                'thumbnail': 'https://i.ytimg.com/vi/SZJvDhaSDnc/hqdefault.jpg',
 								                'age_limit': 18,
 								                'availability': 'needs_auth',
 								                'channel_url': 'https://www.youtube.com/channel/UC-SJ6nODDmufqBzPBwCvYvQ',
 								                'like_count': int,
 								                'live_status': 'not_live',
 								                'playable_in_embed': True,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'CBS Mornings',
 								                'uploader_url': 'https://www.youtube.com/@CBSMornings',
 								                'uploader_id': '@CBSMornings',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1405513526,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            },
-												[ie/youtube] Remove broken age-restriction workaround (#11297)

Closes #11296
Authored by: bashonly

											
										
										
											2024-10-20 17:25:29 -05:00
+								            'skip': 'Age-restricted; requires authentication',
-												[youtube] Fix controversial videos when requested via API (#533)

Closes: https://github.com/yt-dlp/yt-dlp/issues/511#issuecomment-883024350
Authored by: colethedj
											
										
										
											2021-07-20 13:01:28 -05:00
+								        },
-												Update to ytdl-commit-4fb25ff

[maoritv] Add new extractor
https://github.com/ytdl-org/youtube-dl/commit/4fb25ff5a3be5206bb72e5c4046715b1529fb2c7

Except:
[vimeo] improve extraction https://github.com/ytdl-org/youtube-dl/commit/3ae9c0f410b1d4f63e8bada67dd62a8d2852be32
[youtube:tab] Pass innertube context... https://github.com/ytdl-org/youtube-dl/commit/1b0a13f33cfb3644cc718d35951ea85bb1905459

											
										
										
											2021-04-10 11:47:11 -05:00
+								        {
 								            # restricted location, https://github.com/ytdl-org/youtube-dl/issues/28685
 								            'url': 'cBvYw8_A0vQ',
 								            'info_dict': {
 								                'id': 'cBvYw8_A0vQ',
 								                'ext': 'mp4',
 								                'title': '4K Ueno Okachimachi  Street  Scenes  上野御徒町歩き',
 								                'description': 'md5:ea770e474b7cd6722b4c95b833c03630',
 								                'upload_date': '20201120',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'duration': 1456,
 								                'categories': ['Travel & Events'],
 								                'channel_id': 'UC3o_t8PzBmXf5S9b7GLx1Mw',
 								                'view_count': int,
 								                'channel': 'Walk around Japan',
 								                'tags': ['Ueno Tokyo', 'Okachimachi Tokyo', 'Ameyoko Street', 'Tokyo attraction', 'Travel in Tokyo'],
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'thumbnail': 'https://i.ytimg.com/vi/cBvYw8_A0vQ/hqdefault.jpg',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'age_limit': 0,
 								                'availability': 'public',
 								                'channel_url': 'https://www.youtube.com/channel/UC3o_t8PzBmXf5S9b7GLx1Mw',
 								                'live_status': 'not_live',
 								                'playable_in_embed': True,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Walk around Japan',
 								                'uploader_url': 'https://www.youtube.com/@walkaroundjapan7124',
 								                'uploader_id': '@walkaroundjapan7124',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1605884416,
-												Update to ytdl-commit-4fb25ff

[maoritv] Add new extractor
https://github.com/ytdl-org/youtube-dl/commit/4fb25ff5a3be5206bb72e5c4046715b1529fb2c7

Except:
[vimeo] improve extraction https://github.com/ytdl-org/youtube-dl/commit/3ae9c0f410b1d4f63e8bada67dd62a8d2852be32
[youtube:tab] Pass innertube context... https://github.com/ytdl-org/youtube-dl/commit/1b0a13f33cfb3644cc718d35951ea85bb1905459

											
										
										
											2021-04-10 11:47:11 -05:00
+								            },
 								            'params': {
 								                'skip_download': True,
 								            },
-												[youtube] Extract audio language

											
										
										
											2021-05-14 02:01:53 -05:00
+								        }, {
 								            # Has multiple audio streams
 								            'url': 'WaOKSUlf4TM',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            'only_matching': True,
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-15 09:38:47 -05:00
+								        }, {
 								            # Requires Premium: has format 141 when requested using YTM url
 								            'url': 'https://music.youtube.com/watch?v=XclachpHxis',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            'only_matching': True,
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-15 09:38:47 -05:00
+								        }, {
-												[youtube] multiple subtitles in same language

Fixes: https://github.com/ytdl-org/youtube-dl/issues/21164
Related: #310, https://github.com/ytdl-org/youtube-dl/pull/26112

											
										
										
											2021-05-12 14:20:02 -05:00
+								            # multiple subtitles with same lang_code
 								            'url': 'https://www.youtube.com/watch?v=wsQiKKfKxug',
 								            'only_matching': True,
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								        }, {
 								            # Force use android client fallback
 								            'url': 'https://www.youtube.com/watch?v=YOelRv7fMxY',
 								            'info_dict': {
 								                'id': 'YOelRv7fMxY',
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								                'title': 'DIGGING A SECRET TUNNEL Part 1',
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								                'ext': '3gp',
 								                'upload_date': '20210624',
 								                'channel_id': 'UCp68_FLety0O-n9QU6phsgw',
 								                'channel_url': r're:https?://(?:www\.)?youtube\.com/channel/UCp68_FLety0O-n9QU6phsgw',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'description': 'md5:5d5991195d599b56cd0c4148907eec50',
 								                'duration': 596,
 								                'categories': ['Entertainment'],
 								                'view_count': int,
 								                'channel': 'colinfurze',
 								                'tags': ['Colin', 'furze', 'Terry', 'tunnel', 'underground', 'bunker'],
 								                'thumbnail': 'https://i.ytimg.com/vi/YOelRv7fMxY/maxresdefault.jpg',
 								                'age_limit': 0,
 								                'availability': 'public',
 								                'like_count': int,
 								                'live_status': 'not_live',
 								                'playable_in_embed': True,
-												[cleanup Misc

Closes #5162

											
										
										
											2022-10-18 12:58:57 -05:00
+								                'channel_follower_count': int,
 								                'chapters': list,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader': 'colinfurze',
 								                'uploader_url': 'https://www.youtube.com/@colinfurze',
 								                'uploader_id': '@colinfurze',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								            },
 								            'params': {
 								                'format': '17',  # 3gp format available on android
 								                'extractor_args': {'youtube': {'player_client': ['android']}},
 								            },
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-17 11:03:02 -05:00
+								            'skip': 'android client broken',
-												[youtube] multiple subtitles in same language

Fixes: https://github.com/ytdl-org/youtube-dl/issues/21164
Related: #310, https://github.com/ytdl-org/youtube-dl/pull/26112

											
										
										
											2021-05-12 14:20:02 -05:00
+								        },
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								        {
 								            # Skip download of additional client configs (remix client config in this case)
 								            'url': 'https://music.youtube.com/watch?v=MgNrAu2pzNs',
 								            'only_matching': True,
 								            'params': {
 								                'extractor_args': {'youtube': {'player_skip': ['configs']}},
 								            },
-												[youtube] Add `shorts` to `_VALID_URL`
Normally the generic extractor will redirect the URL,
but the cookies consent screen may sometimes appear instead

Closes #752

											
										
										
											2021-08-22 10:04:59 -05:00
+								        }, {
 								            # shorts
 								            'url': 'https://www.youtube.com/shorts/BGQWPY4IigY',
 								            'only_matching': True,
-												[cleanup] Minor cleanup

Closes #1696, Closes #1673

											
										
										
											2021-11-18 18:06:28 -06:00
+								        }, {
 								            'note': 'Storyboards',
 								            'url': 'https://www.youtube.com/watch?v=5KLPxDtMqe8',
 								            'info_dict': {
 								                'id': '5KLPxDtMqe8',
 								                'ext': 'mhtml',
 								                'format_id': 'sb0',
 								                'title': 'Your Brain is Plastic',
 								                'description': 'md5:89cd86034bdb5466cd87c6ba206cd2bc',
 								                'upload_date': '20140324',
-												[youtube] Update tests

											
										
										
											2022-01-07 05:54:57 -06:00
+								                'like_count': int,
 								                'channel_id': 'UCZYTClx2T1of7BRZ86-8fow',
 								                'channel_url': 'https://www.youtube.com/channel/UCZYTClx2T1of7BRZ86-8fow',
 								                'view_count': int,
 								                'thumbnail': 'https://i.ytimg.com/vi/5KLPxDtMqe8/maxresdefault.jpg',
 								                'playable_in_embed': True,
 								                'tags': 'count:12',
 								                'availability': 'public',
 								                'channel': 'SciShow',
 								                'live_status': 'not_live',
 								                'duration': 248,
 								                'categories': ['Education'],
 								                'age_limit': 0,
-												[cleanup Misc

Closes #5162

											
										
										
											2022-10-18 12:58:57 -05:00
+								                'channel_follower_count': int,
 								                'chapters': list,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader': 'SciShow',
 								                'uploader_url': 'https://www.youtube.com/@SciShow',
 								                'uploader_id': '@SciShow',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1395685455,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            }, 'params': {'format': 'mhtml', 'skip_download': True},
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								        }, {
 								            # Ensure video upload_date is in UTC timezone (video was uploaded 1641170939)
 								            'url': 'https://www.youtube.com/watch?v=2NUZ8W2llS4',
 								            'info_dict': {
 								                'id': '2NUZ8W2llS4',
 								                'ext': 'mp4',
 								                'title': 'The NP that test your phone performance 🙂',
 								                'description': 'md5:144494b24d4f9dfacb97c1bbef5de84d',
 								                'channel_id': 'UCRqNBSOHgilHfAczlUmlWHA',
 								                'channel_url': 'https://www.youtube.com/channel/UCRqNBSOHgilHfAczlUmlWHA',
 								                'duration': 21,
 								                'view_count': int,
 								                'age_limit': 0,
 								                'categories': ['Gaming'],
 								                'tags': 'count:23',
 								                'playable_in_embed': True,
 								                'live_status': 'not_live',
 								                'upload_date': '20220103',
 								                'like_count': int,
 								                'availability': 'public',
 								                'channel': 'Leon Nguyen',
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/2NUZ8W2llS4/maxresdefault.webp',
-												[extractor/youtube, cleanup] Fix tests (#4293)

Authored by: sheerluck
											
										
										
											2022-07-07 16:20:02 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Leon Nguyen',
 								                'uploader_url': 'https://www.youtube.com/@LeonNguyen',
 								                'uploader_id': '@LeonNguyen',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1641170939,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            },
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								        }, {
 								            # date text is premiered video, ensure upload date in UTC (published 1641172509)
 								            'url': 'https://www.youtube.com/watch?v=mzZzzBU6lrM',
 								            'info_dict': {
 								                'id': 'mzZzzBU6lrM',
 								                'ext': 'mp4',
 								                'title': 'I Met GeorgeNotFound In Real Life...',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'description': 'md5:978296ec9783a031738b684d4ebf302d',
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								                'channel_id': 'UC_8NknAFiyhOUaZqHR3lq3Q',
 								                'channel_url': 'https://www.youtube.com/channel/UC_8NknAFiyhOUaZqHR3lq3Q',
 								                'duration': 955,
 								                'view_count': int,
 								                'age_limit': 0,
 								                'categories': ['Entertainment'],
 								                'tags': 'count:26',
 								                'playable_in_embed': True,
 								                'live_status': 'not_live',
 								                'release_timestamp': 1641172509,
 								                'release_date': '20220103',
 								                'upload_date': '20220103',
 								                'like_count': int,
 								                'availability': 'public',
 								                'channel': 'Quackity',
 								                'thumbnail': 'https://i.ytimg.com/vi/mzZzzBU6lrM/maxresdefault.jpg',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel_follower_count': int,
 								                'uploader': 'Quackity',
 								                'uploader_id': '@Quackity',
 								                'uploader_url': 'https://www.youtube.com/@Quackity',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1641172509,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            },
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								        },
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								        {   # continuous livestream.
 								            # Upload date was 2022-07-12T05:12:29-07:00, while stream start is 2022-07-12T15:59:30+00:00
 								            'url': 'https://www.youtube.com/watch?v=jfKfPfyJRdk',
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								            'info_dict': {
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'id': 'jfKfPfyJRdk',
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								                'ext': 'mp4',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'channel_id': 'UCSJ4gkVC6NrvII8umztf0Ow',
 								                'like_count': int,
 								                'uploader': 'Lofi Girl',
 								                'categories': ['Music'],
 								                'concurrent_view_count': int,
 								                'playable_in_embed': True,
 								                'timestamp': 1657627949,
 								                'release_date': '20220712',
 								                'channel_url': 'https://www.youtube.com/channel/UCSJ4gkVC6NrvII8umztf0Ow',
-												[ie/youtube] Extract `media_type` for livestreams (#11605)

Closes #11563
Authored by: nosoop
											
										
										
											2025-01-25 21:27:12 -06:00
+								                'description': 'md5:452d5c82f72bb7e62a4e0297c3f01c23',
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								                'age_limit': 0,
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'thumbnail': 'https://i.ytimg.com/vi/jfKfPfyJRdk/maxresdefault.jpg',
 								                'release_timestamp': 1657641570,
 								                'uploader_url': 'https://www.youtube.com/@LofiGirl',
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								                'channel_follower_count': int,
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'channel_is_verified': True,
-												[ie/youtube] Extract `media_type` for livestreams (#11605)

Closes #11563
Authored by: nosoop
											
										
										
											2025-01-25 21:27:12 -06:00
+								                'title': r're:^lofi hip hop radio 📚 beats to relax/study to',
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								                'view_count': int,
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'live_status': 'is_live',
-												[ie/youtube] Extract `media_type` for livestreams (#11605)

Closes #11563
Authored by: nosoop
											
										
										
											2025-01-25 21:27:12 -06:00
+								                'media_type': 'livestream',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'tags': 'count:32',
 								                'channel': 'Lofi Girl',
 								                'availability': 'public',
 								                'upload_date': '20220712',
 								                'uploader_id': '@LofiGirl',
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								            },
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								            'params': {'skip_download': True},
-												[extractor/youtube] Fix initial player response extraction

Authored by: pukkandan, coletdjnz

											
										
										
											2022-05-29 02:54:22 -05:00
+								        }, {
 								            'url': 'https://www.youtube.com/watch?v=tjjjtzRLHvA',
 								            'info_dict': {
 								                'id': 'tjjjtzRLHvA',
 								                'ext': 'mp4',
 								                'title': 'ハッシュタグ無し };if window.ytcsi',
 								                'upload_date': '20220323',
 								                'like_count': int,
 								                'availability': 'unlisted',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'channel': 'Lesmiscore',
 								                'thumbnail': r're:^https?://.*\.jpg',
-												[extractor/youtube] Fix initial player response extraction

Authored by: pukkandan, coletdjnz

											
										
										
											2022-05-29 02:54:22 -05:00
+								                'age_limit': 0,
 								                'categories': ['Music'],
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 01:46:28 -05:00
+								                'view_count': int,
 								                'description': '',
-												[extractor/youtube] Fix initial player response extraction

Authored by: pukkandan, coletdjnz

											
										
										
											2022-05-29 02:54:22 -05:00
+								                'channel_url': 'https://www.youtube.com/channel/UCdqltm_7iv1Vs6kp6Syke5A',
 								                'channel_id': 'UCdqltm_7iv1Vs6kp6Syke5A',
 								                'live_status': 'not_live',
 								                'playable_in_embed': True,
 								                'channel_follower_count': int,
 								                'duration': 6,
 								                'tags': [],
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader_id': '@lesmiscore',
 								                'uploader': 'Lesmiscore',
 								                'uploader_url': 'https://www.youtube.com/@lesmiscore',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1648005313,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            },
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								        }, {
 								            # Prefer primary title+description language metadata by default
 								            # Do not prefer translated description if primary is empty
 								            'url': 'https://www.youtube.com/watch?v=el3E4MbxRqQ',
 								            'info_dict': {
 								                'id': 'el3E4MbxRqQ',
 								                'ext': 'mp4',
 								                'title': 'dlp test video 2 - primary sv no desc',
 								                'description': '',
 								                'channel': 'cole-dlp-test-acc',
 								                'tags': [],
 								                'view_count': int,
 								                'channel_url': 'https://www.youtube.com/channel/UCiu-3thuViMebBjw_5nWYrA',
 								                'like_count': int,
 								                'playable_in_embed': True,
 								                'availability': 'unlisted',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'thumbnail': r're:^https?://.*\.jpg',
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								                'age_limit': 0,
 								                'duration': 5,
 								                'live_status': 'not_live',
 								                'upload_date': '20220908',
 								                'categories': ['People & Blogs'],
 								                'channel_id': 'UCiu-3thuViMebBjw_5nWYrA',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader_url': 'https://www.youtube.com/@coletdjnz',
 								                'uploader_id': '@coletdjnz',
 								                'uploader': 'cole-dlp-test-acc',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1662677394,
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								            },
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            'params': {'skip_download': True},
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								        }, {
 								            # Extractor argument: prefer translated title+description
 								            'url': 'https://www.youtube.com/watch?v=gHKT4uU8Zng',
 								            'info_dict': {
 								                'id': 'gHKT4uU8Zng',
 								                'ext': 'mp4',
 								                'channel': 'cole-dlp-test-acc',
 								                'tags': [],
 								                'duration': 5,
 								                'live_status': 'not_live',
 								                'channel_id': 'UCiu-3thuViMebBjw_5nWYrA',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'upload_date': '20220729',
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								                'view_count': int,
 								                'categories': ['People & Blogs'],
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'thumbnail': r're:^https?://.*\.jpg',
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								                'title': 'dlp test video title translated (fr)',
 								                'availability': 'public',
 								                'age_limit': 0,
 								                'description': 'dlp test video description translated (fr)',
 								                'playable_in_embed': True,
 								                'channel_url': 'https://www.youtube.com/channel/UCiu-3thuViMebBjw_5nWYrA',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader_url': 'https://www.youtube.com/@coletdjnz',
 								                'uploader_id': '@coletdjnz',
 								                'uploader': 'cole-dlp-test-acc',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1659073275,
 								                'like_count': int,
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								            },
 								            'params': {'skip_download': True, 'extractor_args': {'youtube': {'lang': ['fr']}}},
 								            'expected_warnings': [r'Preferring "fr" translated fields'],
-												[extractor/youtube] Extract more format info

											
										
										
											2022-08-07 15:06:11 -05:00
+								        }, {
 								            'note': '6 channel audio',
 								            'url': 'https://www.youtube.com/watch?v=zgdo7-RRjgo',
 								            'only_matching': True,
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-14 17:53:32 -06:00
+								        }, {
 								            'note': 'Multiple HLS formats with same itag',
 								            'url': 'https://www.youtube.com/watch?v=kX3nB4PpJko',
 								            'info_dict': {
 								                'id': 'kX3nB4PpJko',
 								                'ext': 'mp4',
 								                'categories': ['Entertainment'],
 								                'description': 'md5:e8031ff6e426cdb6a77670c9b81f6fa6',
 								                'live_status': 'not_live',
 								                'duration': 937,
 								                'channel_follower_count': int,
 								                'thumbnail': 'https://i.ytimg.com/vi_webp/kX3nB4PpJko/maxresdefault.webp',
 								                'title': 'Last To Take Hand Off Jet, Keeps It!',
 								                'channel': 'MrBeast',
 								                'playable_in_embed': True,
 								                'view_count': int,
 								                'upload_date': '20221112',
 								                'channel_url': 'https://www.youtube.com/channel/UCX6OQ3DkcsbYNE6H8uQQuVA',
 								                'age_limit': 0,
 								                'availability': 'public',
 								                'channel_id': 'UCX6OQ3DkcsbYNE6H8uQQuVA',
 								                'like_count': int,
 								                'tags': [],
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader': 'MrBeast',
 								                'uploader_url': 'https://www.youtube.com/@MrBeast',
 								                'uploader_id': '@MrBeast',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-14 17:53:32 -06:00
+								            },
 								            'params': {'extractor_args': {'youtube': {'player_client': ['ios']}}, 'format': '233-1'},
-												[extractor/youtube] Extract DRC formats

											
										
										
											2022-12-30 04:02:33 -06:00
+								        }, {
 								            'note': 'Audio formats with Dynamic Range Compression',
 								            'url': 'https://www.youtube.com/watch?v=Tq92D6wQ1mg',
 								            'info_dict': {
 								                'id': 'Tq92D6wQ1mg',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'ext': 'webm',
-												[extractor/youtube] Extract DRC formats

											
										
										
											2022-12-30 04:02:33 -06:00
+								                'title': '[MMD] Adios - EVERGLOW [+Motion DL]',
 								                'channel_url': 'https://www.youtube.com/channel/UC1yoRdFoFJaCY-AGfD9W0wQ',
 								                'channel_id': 'UC1yoRdFoFJaCY-AGfD9W0wQ',
 								                'channel_follower_count': int,
 								                'description': 'md5:17eccca93a786d51bc67646756894066',
 								                'upload_date': '20191228',
 								                'tags': ['mmd', 'dance', 'mikumikudance', 'kpop', 'vtuber'],
 								                'playable_in_embed': True,
 								                'like_count': int,
 								                'categories': ['Entertainment'],
 								                'thumbnail': 'https://i.ytimg.com/vi/Tq92D6wQ1mg/sddefault.jpg',
 								                'age_limit': 18,
 								                'channel': 'Projekt Melody',
 								                'view_count': int,
 								                'availability': 'needs_auth',
 								                'comment_count': int,
 								                'live_status': 'not_live',
 								                'duration': 106,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader': 'Projekt Melody',
 								                'uploader_id': '@ProjektMelody',
 								                'uploader_url': 'https://www.youtube.com/@ProjektMelody',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1577508724,
-												[extractor/youtube] Extract DRC formats

											
										
										
											2022-12-30 04:02:33 -06:00
+								            },
 								            'params': {'extractor_args': {'youtube': {'player_client': ['tv_embedded']}}, 'format': '251-drc'},
-												[ie/youtube] Remove broken age-restriction workaround (#11297)

Closes #11296
Authored by: bashonly

											
										
										
											2024-10-20 17:25:29 -05:00
+								            'skip': 'Age-restricted; requires authentication',
-												[extractor/youtube] Support `/live/` URL

											
										
										
											2023-02-03 12:17:13 -06:00
+								        },
 								        {
-												[ie/youtube] Extract `media_type` for livestreams (#11605)

Closes #11563
Authored by: nosoop
											
										
										
											2025-01-25 21:27:12 -06:00
+								            'note': 'Support /live/ URL + media type for post-live content',
-												[extractor/youtube] Support `/live/` URL

											
										
										
											2023-02-03 12:17:13 -06:00
+								            'url': 'https://www.youtube.com/live/qVv6vCqciTM',
 								            'info_dict': {
 								                'id': 'qVv6vCqciTM',
 								                'ext': 'mp4',
 								                'age_limit': 0,
 								                'comment_count': int,
 								                'chapters': 'count:13',
 								                'upload_date': '20221223',
 								                'thumbnail': 'https://i.ytimg.com/vi/qVv6vCqciTM/maxresdefault.jpg',
 								                'channel_url': 'https://www.youtube.com/channel/UCIdEIHpS0TdkqRkHL5OkLtA',
 								                'like_count': int,
 								                'release_date': '20221223',
 								                'tags': ['Vtuber', '月ノ美兎', '名取さな', 'にじさんじ', 'クリスマス', '3D配信'],
 								                'title': '【 #インターネット女クリスマス 】3Dで歌ってはしゃぐインターネットの女たち【月ノ美兎/名取さな】',
 								                'view_count': int,
 								                'playable_in_embed': True,
 								                'duration': 4438,
 								                'availability': 'public',
 								                'channel_follower_count': int,
 								                'channel_id': 'UCIdEIHpS0TdkqRkHL5OkLtA',
 								                'categories': ['Entertainment'],
 								                'live_status': 'was_live',
-												[ie/youtube] Extract `media_type` for livestreams (#11605)

Closes #11563
Authored by: nosoop
											
										
										
											2025-01-25 21:27:12 -06:00
+								                'media_type': 'livestream',
-												[extractor/youtube] Support `/live/` URL

											
										
										
											2023-02-03 12:17:13 -06:00
+								                'release_timestamp': 1671793345,
 								                'channel': 'さなちゃんねる',
 								                'description': 'md5:6aebf95cc4a1d731aebc01ad6cc9806d',
 								                'uploader': 'さなちゃんねる',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader_url': 'https://www.youtube.com/@sana_natori',
 								                'uploader_id': '@sana_natori',
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1671798112,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								            },
 								        },
 								        {
 								            # Fallbacks when webpage and web client is unavailable
 								            'url': 'https://www.youtube.com/watch?v=wSSmNUl9Snw',
 								            'info_dict': {
 								                'id': 'wSSmNUl9Snw',
 								                'ext': 'mp4',
 								                # 'categories': ['Science & Technology'],
 								                'view_count': int,
 								                'chapters': 'count:2',
 								                'channel': 'Scott Manley',
 								                'like_count': int,
 								                'age_limit': 0,
 								                # 'availability': 'public',
 								                'channel_follower_count': int,
 								                'live_status': 'not_live',
 								                'upload_date': '20170831',
 								                'duration': 682,
 								                'tags': 'count:8',
 								                'uploader_url': 'https://www.youtube.com/@scottmanley',
 								                'description': 'md5:f4bed7b200404b72a394c2f97b782c02',
 								                'uploader': 'Scott Manley',
 								                'uploader_id': '@scottmanley',
 								                'title': 'The Computer Hack That Saved Apollo 14',
 								                'channel_id': 'UCxzC4EngIsMrPmbm6Nxvb-A',
 								                'thumbnail': r're:^https?://.*\.webp',
 								                'channel_url': 'https://www.youtube.com/channel/UCxzC4EngIsMrPmbm6Nxvb-A',
 								                'playable_in_embed': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'comment_count': int,
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								                'channel_is_verified': True,
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								            },
 								            'params': {
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-17 11:03:02 -05:00
+								                'extractor_args': {'youtube': {'player_client': ['ios'], 'player_skip': ['webpage']}},
-												[extractor/youtube] Support `/live/` URL

											
										
										
											2023-02-03 12:17:13 -06:00
+								            },
 								        },
-												[ie/youtube] Fix `uploader_id` extraction (#11818)

Closes #11816
Authored by: bashonly
											
										
										
											2024-12-15 14:07:18 -06:00
+								        {
 								            # uploader_id has non-ASCII characters that are percent-encoded in YT's JSON
 								            'url': 'https://www.youtube.com/shorts/18NGQq7p3LY',
 								            'info_dict': {
 								                'id': '18NGQq7p3LY',
 								                'ext': 'mp4',
 								                'title': '아이브 이서 장원영 리즈 삐끼삐끼 챌린지',
 								                'description': '',
 								                'uploader': 'ㅇㅇ',
 								                'uploader_id': '@으아-v1k',
 								                'uploader_url': 'https://www.youtube.com/@으아-v1k',
 								                'channel': 'ㅇㅇ',
 								                'channel_id': 'UCC25oTm2J7ZVoi5TngOHg9g',
 								                'channel_url': 'https://www.youtube.com/channel/UCC25oTm2J7ZVoi5TngOHg9g',
 								                'thumbnail': r're:https?://.+/.+\.jpg',
 								                'playable_in_embed': True,
 								                'age_limit': 0,
 								                'duration': 3,
 								                'timestamp': 1724306170,
 								                'upload_date': '20240822',
 								                'availability': 'public',
 								                'live_status': 'not_live',
 								                'view_count': int,
 								                'like_count': int,
 								                'channel_follower_count': int,
 								                'categories': ['People & Blogs'],
 								                'tags': [],
 								            },
 								        },
-												Allow _TESTS attribute for IEs with multiple tests

This also improves the numbering of duplicate tests

											
										
										
											2013-06-27 12:13:11 -05:00
+								    ]
-												[extractor, test] Basic framework for embed tests (#4307)

and split download tests so they can be more easily run in CI

Authored by: coletdjnz

											
										
										
											2022-07-08 06:23:05 -05:00
+								    _WEBPAGE_TESTS = [
 								        # YouTube <object> embed
 								        {
 								            'url': 'http://www.improbable.com/2017/04/03/untrained-modern-youths-and-ancient-masters-in-selfie-portraits/',
 								            'md5': '873c81d308b979f0e23ee7e620b312a3',
 								            'info_dict': {
 								                'id': 'msN87y-iEx0',
 								                'ext': 'mp4',
 								                'title': 'Feynman: Mirrors FUN TO IMAGINE 6',
 								                'upload_date': '20080526',
 								                'description': 'md5:873c81d308b979f0e23ee7e620b312a3',
 								                'age_limit': 0,
 								                'tags': ['feynman', 'mirror', 'science', 'physics', 'imagination', 'fun', 'cool', 'puzzle'],
 								                'channel_id': 'UCCeo--lls1vna5YJABWAcVA',
 								                'playable_in_embed': True,
 								                'thumbnail': 'https://i.ytimg.com/vi/msN87y-iEx0/hqdefault.jpg',
 								                'like_count': int,
 								                'comment_count': int,
 								                'channel': 'Christopher Sykes',
 								                'live_status': 'not_live',
 								                'channel_url': 'https://www.youtube.com/channel/UCCeo--lls1vna5YJABWAcVA',
 								                'availability': 'public',
 								                'duration': 195,
 								                'view_count': int,
 								                'categories': ['Science & Technology'],
 								                'channel_follower_count': int,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								                'uploader': 'Christopher Sykes',
 								                'uploader_url': 'https://www.youtube.com/@ChristopherSykesDocumentaries',
 								                'uploader_id': '@ChristopherSykesDocumentaries',
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								                'heatmap': 'count:100',
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								                'timestamp': 1211825920,
-												[extractor, test] Basic framework for embed tests (#4307)

and split download tests so they can be more easily run in CI

Authored by: coletdjnz

											
										
										
											2022-07-08 06:23:05 -05:00
+								            },
 								            'params': {
 								                'skip_download': True,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            },
-												[extractor, test] Basic framework for embed tests (#4307)

and split download tests so they can be more easily run in CI

Authored by: coletdjnz

											
										
										
											2022-07-08 06:23:05 -05:00
+								        },
 								    ]
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-16 22:02:33 -05:00
+								    @classmethod
 								    def suitable(cls, url):
-												[ie/youtube] Split into package (#12557)

Authored by: coletdjnz
											
										
										
											2025-03-12 23:37:33 -05:00
+								        from yt_dlp.utils import parse_qs
-												[utils] Add `parse_qs`

											
										
										
											2021-08-22 14:02:00 -05:00
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-16 22:02:33 -05:00
+								        qs = parse_qs(url)
 								        if qs.get('list', [None])[0]:
 								            return False
-												[cleanup] Upgrade syntax

Using https://github.com/asottile/pyupgrade

1. `__future__` imports and `coding: utf-8` were removed
2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format`
3. f-strings were cherry-picked from `pyupgrade --py36-plus`

Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts

											
										
										
											2022-04-11 10:10:28 -05:00
+								        return super().suitable(url)
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-16 22:02:33 -05:00
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 07:19:30 -05:00
+								    def __init__(self, *args, **kwargs):
-												[cleanup] Upgrade syntax

Using https://github.com/asottile/pyupgrade

1. `__future__` imports and `coding: utf-8` were removed
2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format`
3. f-strings were cherry-picked from `pyupgrade --py36-plus`

Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts

											
										
										
											2022-04-11 10:10:28 -05:00
+								        super().__init__(*args, **kwargs)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        self._code_cache = {}
-												Prepare signature function caching

											
										
										
											2013-09-21 08:19:48 -05:00
+								        self._player_cache = {}
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 07:19:30 -05:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								    def _prepare_live_from_start_formats(self, formats, video_id, live_start_time, url, webpage_url, smuggled_data, is_live):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from the start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								        lock = threading.Lock()
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 04:19:35 -06:00
+								        start_time = time.time()
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from the start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								        formats = [f for f in formats if f.get('is_from_start')]
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 04:19:35 -06:00
+								        def refetch_manifest(format_id, delay):
 								            nonlocal formats, start_time, is_live
 								            if time.time() <= start_time + delay:
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								                return
 								            _, _, prs, player_url = self._download_player_responses(url, smuggled_data, video_id, webpage_url)
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								            video_details = traverse_obj(prs, (..., 'videoDetails'), expected_type=dict)
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								            microformats = traverse_obj(
 								                prs, (..., 'microformat', 'playerMicroformatRenderer'),
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								                expected_type=dict)
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            _, live_status, _, formats, _ = self._list_formats(video_id, microformats, video_details, prs, player_url)
 								            is_live = live_status == 'is_live'
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 04:19:35 -06:00
+								            start_time = time.time()
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 04:19:35 -06:00
+								        def mpd_feed(format_id, delay):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								            """
 								            @returns (manifest_url, manifest_stream_number, is_live) or None
 								            """
-												[extractor/youtube] Retry manifest refresh for live-from-start (#5670)

Avoids ending download early when live stream is temporarily offline.
Best used with somewhat large `--retry-sleep extractor:` and `--extractor-retries`

Authored by: mzhou
											
										
										
											2023-01-06 13:30:42 -06:00
+								            for retry in self.RetryManager(fatal=False):
 								                with lock:
 								                    refetch_manifest(format_id, delay)
 								                f = next((f for f in formats if f['format_id'] == format_id), None)
 								                if not f:
 								                    if not is_live:
 								                        retry.error = f'{video_id}: Video is no longer live'
 								                    else:
 								                        retry.error = f'Cannot find refreshed manifest for format {format_id}{bug_reports_message()}'
 								                    continue
 								                return f['manifest_url'], f['manifest_stream_number'], is_live
 								            return None
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
 								        for f in formats:
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            f['is_live'] = is_live
 								            gen = functools.partial(self._live_dash_fragments, video_id, f['format_id'],
 								                                    live_start_time, mpd_feed, not is_live and f.copy())
 								            if is_live:
 								                f['fragments'] = gen
 								                f['protocol'] = 'http_dash_segments_generator'
 								            else:
 								                f['fragments'] = LazyList(gen({}))
 								                del f['is_from_start']
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								    def _live_dash_fragments(self, video_id, format_id, live_start_time, mpd_feed, manifestless_orig_fmt, ctx):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								        FETCH_SPAN, MAX_DURATION = 5, 432000
 								        mpd_url, stream_number, is_live = None, None, True
 								        begin_index = 0
 								        download_start_time = ctx.get('start') or time.time()
 								        lack_early_segments = download_start_time - (live_start_time or download_start_time) > MAX_DURATION
 								        if lack_early_segments:
 								            self.report_warning(bug_reports_message(
 								                'Starting download from the last 120 hours of the live stream since '
 								                'YouTube does not have data before that. If you think this is wrong,'), only_once=True)
 								            lack_early_segments = True
 								        known_idx, no_fragment_score, last_segment_url = begin_index, 0, None
 								        fragments, fragment_base_url = None, None
-												[downloader/fragment] Improve `--live-from-start` for YouTube livestreams (#2870)


											
										
										
											2022-02-24 11:00:46 -06:00
+								        def _extract_sequence_from_mpd(refresh_sequence, immediate):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								            nonlocal mpd_url, stream_number, is_live, no_fragment_score, fragments, fragment_base_url
 								            # Obtain from MPD's maximum seq value
 								            old_mpd_url = mpd_url
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 04:19:35 -06:00
+								            last_error = ctx.pop('last_error', None)
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 09:29:30 -06:00
+								            expire_fast = immediate or (last_error and isinstance(last_error, HTTPError) and last_error.status == 403)
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 04:19:35 -06:00
+								            mpd_url, stream_number, is_live = (mpd_feed(format_id, 5 if expire_fast else 18000)
 								                                               or (mpd_url, stream_number, False))
 								            if not refresh_sequence:
 								                if expire_fast and not is_live:
 								                    return False, last_seq
 								                elif old_mpd_url == mpd_url:
 								                    return True, last_seq
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            if manifestless_orig_fmt:
 								                fmt_info = manifestless_orig_fmt
 								            else:
 								                try:
 								                    fmts, _ = self._extract_mpd_formats_and_subtitles(
 								                        mpd_url, None, note=False, errnote=False, fatal=False)
 								                except ExtractorError:
 								                    fmts = None
 								                if not fmts:
 								                    no_fragment_score += 2
 								                    return False, last_seq
 								                fmt_info = next(x for x in fmts if x['manifest_stream_number'] == stream_number)
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								            fragments = fmt_info['fragments']
 								            fragment_base_url = fmt_info['fragment_base_url']
 								            assert fragment_base_url
 								            _last_seq = int(re.search(r'(?:/|^)sq/(\d+)', fragments[-1]['path']).group(1))
 								            return True, _last_seq
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								        self.write_debug(f'[{video_id}] Generating fragments for format {format_id}')
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								        while is_live:
 								            fetch_time = time.time()
 								            if no_fragment_score > 30:
 								                return
 								            if last_segment_url:
 								                # Obtain from "X-Head-Seqnum" header value from each segment
 								                try:
 								                    urlh = self._request_webpage(
 								                        last_segment_url, None, note=False, errnote=False, fatal=False)
 								                except ExtractorError:
 								                    urlh = None
 								                last_seq = try_get(urlh, lambda x: int_or_none(x.headers['X-Head-Seqnum']))
 								                if last_seq is None:
-												[downloader/fragment] Improve `--live-from-start` for YouTube livestreams (#2870)


											
										
										
											2022-02-24 11:00:46 -06:00
+								                    no_fragment_score += 2
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								                    last_segment_url = None
 								                    continue
 								            else:
-												[downloader/fragment] Improve `--live-from-start` for YouTube livestreams (#2870)


											
										
										
											2022-02-24 11:00:46 -06:00
+								                should_continue, last_seq = _extract_sequence_from_mpd(True, no_fragment_score > 15)
 								                no_fragment_score += 2
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 04:19:35 -06:00
+								                if not should_continue:
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								                    continue
 								            if known_idx > last_seq:
 								                last_segment_url = None
 								                continue
 								            last_seq += 1
 								            if begin_index < 0 and known_idx < 0:
 								                # skip from the start when it's negative value
 								                known_idx = last_seq + begin_index
 								            if lack_early_segments:
 								                known_idx = max(known_idx, last_seq - int(MAX_DURATION // fragments[-1]['duration']))
 								            try:
 								                for idx in range(known_idx, last_seq):
 								                    # do not update sequence here or you'll get skipped some part of it
-												[downloader/fragment] Improve `--live-from-start` for YouTube livestreams (#2870)


											
										
										
											2022-02-24 11:00:46 -06:00
+								                    should_continue, _ = _extract_sequence_from_mpd(False, False)
-												[youtube] End `live-from-start` properly when stream ends with 403

Closes #2089

											
										
										
											2021-12-26 04:19:35 -06:00
+								                    if not should_continue:
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								                        known_idx = idx - 1
 								                        raise ExtractorError('breaking out of outer loop')
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                    last_segment_url = urljoin(fragment_base_url, f'sq/{idx}')
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								                    yield {
 								                        'url': last_segment_url,
-												[dash] Show fragment count with `--live-from-start` (#3493)

Authored by: flashdagger
											
										
										
											2022-06-07 07:44:08 -05:00
+								                        'fragment_count': last_seq,
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								                    }
 								                if known_idx == last_seq:
 								                    no_fragment_score += 5
 								                else:
 								                    no_fragment_score = 0
 								                known_idx = last_seq
 								            except ExtractorError:
 								                continue
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            if manifestless_orig_fmt:
 								                # Stop at the first iteration if running for post-live manifestless;
 								                # fragment count no longer increase since it starts
 								                break
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								            time.sleep(max(0, FETCH_SPAN + fetch_time - time.time()))
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								    def _extract_player_url(self, *ytcfgs, webpage=None):
 								        player_url = traverse_obj(
 								            ytcfgs, (..., 'PLAYER_JS_URL'), (..., 'WEB_PLAYER_CONTEXT_CONFIGS', ..., 'jsUrl'),
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 05:54:43 -05:00
+								            get_all=False, expected_type=str)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        if not player_url:
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								            return
-												[youtube] Ensure subtitle urls are absolute (#2765)

Closes #2755

Authored by: coletdjnz
											
										
										
											2022-02-13 15:36:01 -06:00
+								        return urljoin('https://www.youtube.com', player_url)
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								    def _download_player_url(self, video_id, fatal=False):
-												[ie/youtube] Retry on more critical requests (#12339)

Authored by: coletdjnz
											
										
										
											2025-02-18 18:39:51 -06:00
+								        iframe_webpage = self._download_webpage_with_retries(
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								            'https://www.youtube.com/iframe_api',
-												[ie/youtube] Retry on more critical requests (#12339)

Authored by: coletdjnz
											
										
										
											2025-02-18 18:39:51 -06:00
+								            note='Downloading iframe API JS',
 								            video_id=video_id, retry_fatal=fatal)
 								        if iframe_webpage:
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								            player_version = self._search_regex(
-												[ie/youtube] Retry on more critical requests (#12339)

Authored by: coletdjnz
											
										
										
											2025-02-18 18:39:51 -06:00
+								                r'player\\?/([0-9a-fA-F]{8})\\?/', iframe_webpage, 'player version', fatal=fatal)
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								            if player_version:
 								                return f'https://www.youtube.com/s/player/{player_version}/player_ias.vflset/en_US/base.js'
-												[youtube] Make cache ID a tuple of lengths instead of just the whole length

											
										
										
											2014-08-02 05:21:53 -05:00
+								    def _signature_cache_id(self, example_sig):
 								        """ Return a string representation of a signature """
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 05:54:43 -05:00
+								        return '.'.join(str(len(part)) for part in example_sig.split('.'))
-												[youtube] Make cache ID a tuple of lengths instead of just the whole length

											
										
										
											2014-08-02 05:21:53 -05:00
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-01 19:18:08 -05:00
+								    @classmethod
 								    def _extract_player_info(cls, player_url):
 								        for player_re in cls._PLAYER_INFO_RE:
 								            id_m = re.search(player_re, player_url)
 								            if id_m:
 								                break
 								        else:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            raise ExtractorError(f'Cannot identify player {player_url!r}')
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        return id_m.group('id')
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-01 19:18:08 -05:00
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								    def _load_player(self, video_id, player_url, fatal=True):
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								        player_id = self._extract_player_info(player_url)
 								        if player_id not in self._code_cache:
-												[youtube] Fix non-fatal errors in fetching player

											
										
										
											2021-10-03 16:14:55 -05:00
+								            code = self._download_webpage(
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								                player_url, video_id, fatal=fatal,
 								                note='Downloading player ' + player_id,
-												[ie/youtube] Remove broken OAuth support (#11558)

Closes #11462
Authored by: bashonly
											
										
										
											2024-11-16 17:40:21 -06:00
+								                errnote=f'Download of {player_url} failed')
-												[youtube] Fix non-fatal errors in fetching player

											
										
										
											2021-10-03 16:14:55 -05:00
+								            if code:
 								                self._code_cache[player_id] = code
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								        return self._code_cache.get(player_id)
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
-												[youtube] Improve player id extraction and add tests

											
										
										
											2020-05-01 19:18:08 -05:00
+								    def _extract_signature_function(self, video_id, player_url, example_sig):
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        player_id = self._extract_player_info(player_url)
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 07:19:30 -05:00
-												[youtube] Add filesystem signature cache

											
										
										
											2013-09-21 17:35:03 -05:00
+								        # Read from filesystem cache
-												[cleanup] Upgrade syntax

Using https://github.com/asottile/pyupgrade

1. `__future__` imports and `coding: utf-8` were removed
2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format`
3. f-strings were cherry-picked from `pyupgrade --py36-plus`

Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts

											
										
										
											2022-04-11 10:10:28 -05:00
+								        func_id = f'js_{player_id}_{self._signature_cache_id(example_sig)}'
-												[youtube] Add filesystem signature cache

											
										
										
											2013-09-21 17:35:03 -05:00
+								        assert os.path.basename(func_id) == func_id
-												[youtube] Move cache into its own module

											
										
										
											2014-09-03 05:41:05 -05:00
-												[cleanup] Misc cleanup

											
										
										
											2022-06-28 00:10:54 -05:00
+								        self.write_debug(f'Extracting signature function {func_id}')
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								        cache_spec, code = self.cache.load('youtube-sigfuncs', func_id), None
-												Prepare signature function caching

											
										
										
											2013-09-21 08:19:48 -05:00
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								        if not cache_spec:
 								            code = self._load_player(video_id, player_url)
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								        if code:
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								            res = self._parse_sig_js(code)
-												[compat] Remove more functions

Removing any more will require changes to a large number of extractors

											
										
										
											2022-06-24 03:10:17 -05:00
+								            test_string = ''.join(map(chr, range(len(example_sig))))
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								            cache_spec = [ord(c) for c in res(test_string)]
-												[extractor, cleanup] Reduce direct use of `_downloader`

											
										
										
											2022-06-22 23:14:22 -05:00
+								            self.cache.store('youtube-sigfuncs', func_id, cache_spec)
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
 								        return lambda s: ''.join(s[i] for i in cache_spec)
-												Prepare signature function caching

											
										
										
											2013-09-21 08:19:48 -05:00
-												[youtube] Make cache ID a tuple of lengths instead of just the whole length

											
										
										
											2014-08-02 05:21:53 -05:00
+								    def _print_sig_code(self, func, example_sig):
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								        if not self.get_param('youtube_print_sig_code'):
 								            return
-												[youtube] Improve cache and add an option to print the extracted signatures

											
										
										
											2013-09-22 03:30:02 -05:00
+								        def gen_sig_code(idxs):
 								            def _genslice(start, end, step):
-												[youtube] Modernize

											
										
										
											2014-09-13 00:51:06 -05:00
+								                starts = '' if start == 0 else str(start)
-												PEP8: more applied

											
										
										
											2014-11-23 14:20:46 -06:00
+								                ends = (':%d' % (end + step)) if end + step >= 0 else ':'
-												[youtube] Remove superfluous unicode specifiers

											
										
										
											2014-09-24 02:51:45 -05:00
+								                steps = '' if step == 1 else (':%d' % step)
-												[cleanup] Upgrade syntax

Using https://github.com/asottile/pyupgrade

1. `__future__` imports and `coding: utf-8` were removed
2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format`
3. f-strings were cherry-picked from `pyupgrade --py36-plus`

Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts

											
										
										
											2022-04-11 10:10:28 -05:00
+								                return f's[{starts}{ends}{steps}]'
-												[youtube] Improve cache and add an option to print the extracted signatures

											
										
										
											2013-09-22 03:30:02 -05:00
 								            step = None
-												Improve code style

											
										
										
											2014-12-16 17:06:41 -06:00
+								            # Quelch pyflakes warnings - start will be set when step is set
 								            start = '(Never used)'
-												[youtube] Improve cache and add an option to print the extracted signatures

											
										
										
											2013-09-22 03:30:02 -05:00
+								            for i, prev in zip(idxs[1:], idxs[:-1]):
 								                if step is not None:
 								                    if i - prev == step:
 								                        continue
 								                    yield _genslice(start, prev, step)
 								                    step = None
 								                    continue
 								                if i - prev in [-1, 1]:
 								                    step = i - prev
 								                    start = prev
 								                    continue
 								                else:
-												[youtube] Modernize

											
										
										
											2014-09-13 00:51:06 -05:00
+								                    yield 's[%d]' % prev
-												[youtube] Improve cache and add an option to print the extracted signatures

											
										
										
											2013-09-22 03:30:02 -05:00
+								            if step is None:
-												[youtube] Modernize

											
										
										
											2014-09-13 00:51:06 -05:00
+								                yield 's[%d]' % i
-												[youtube] Improve cache and add an option to print the extracted signatures

											
										
										
											2013-09-22 03:30:02 -05:00
+								            else:
 								                yield _genslice(start, i, step)
-												[compat] Remove more functions

Removing any more will require changes to a large number of extractors

											
										
										
											2022-06-24 03:10:17 -05:00
+								        test_string = ''.join(map(chr, range(len(example_sig))))
-												Correct test strings

											
										
										
											2013-09-22 05:18:16 -05:00
+								        cache_res = func(test_string)
-												[youtube] Improve cache and add an option to print the extracted signatures

											
										
										
											2013-09-22 03:30:02 -05:00
+								        cache_spec = [ord(c) for c in cache_res]
-												[youtube] Modernize

											
										
										
											2014-09-13 00:51:06 -05:00
+								        expr_code = ' + '.join(gen_sig_code(cache_spec))
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								        signature_id_tuple = '({})'.format(', '.join(str(len(p)) for p in example_sig.split('.')))
 								        code = (f'if tuple(len(p) for p in s.split(\'.\')) == {signature_id_tuple}:\n'
 								                f'    return {expr_code}\n')
-												[youtube] Remove superfluous unicode specifiers

											
										
										
											2014-09-24 02:51:45 -05:00
+								        self.to_screen('Extracted signature function:\n' + code)
-												[youtube] Improve cache and add an option to print the extracted signatures

											
										
										
											2013-09-22 03:30:02 -05:00
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 07:19:30 -05:00
+								    def _parse_sig_js(self, jscode):
-												[ie/youtube] Fix signature function extraction (#11751)

Closes #11748
Authored by: bashonly
											
										
										
											2024-12-06 09:34:13 -06:00
+								        # Examples where `sig` is funcname:
 								        # sig=function(a){a=a.split(""); ... ;return a.join("")};
 								        # ;c&&(c=sig(decodeURIComponent(c)),a.set(b,encodeURIComponent(c)));return a};
 								        # {var l=f,m=h.sp,n=sig(decodeURIComponent(h.s));l.set(m,encodeURIComponent(n))}
 								        # sig=function(J){J=J.split(""); ... ;return J.join("")};
 								        # ;N&&(N=sig(decodeURIComponent(N)),J.set(R,encodeURIComponent(N)));return J};
 								        # {var H=u,k=f.sp,v=sig(decodeURIComponent(f.s));H.set(k,encodeURIComponent(v))}
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 07:19:30 -05:00
+								        funcname = self._search_regex(
-												[ie/youtube] Fix signature function extraction for `2f1832d2` (#11801)

Closes #11798
Authored by: bashonly
											
										
										
											2024-12-13 03:43:08 -06:00
+								            (r'\b(?P<var>[a-zA-Z0-9_$]+)&&\((?P=var)=(?P<sig>[a-zA-Z0-9_$]{2,})\(decodeURIComponent\((?P=var)\)\)',
 								             r'(?P<sig>[a-zA-Z0-9_$]+)\s*=\s*function\(\s*(?P<arg>[a-zA-Z0-9_$]+)\s*\)\s*{\s*(?P=arg)\s*=\s*(?P=arg)\.split\(\s*""\s*\)\s*;\s*[^}]+;\s*return\s+(?P=arg)\.join\(\s*""\s*\)',
 								             r'(?:\b|[^a-zA-Z0-9_$])(?P<sig>[a-zA-Z0-9_$]{2,})\s*=\s*function\(\s*a\s*\)\s*{\s*a\s*=\s*a\.split\(\s*""\s*\)(?:;[a-zA-Z0-9_$]{2}\.[a-zA-Z0-9_$]{2}\(a,\d+\))?',
-												[ie/youtube] Fix signature function extraction (#11751)

Closes #11748
Authored by: bashonly
											
										
										
											2024-12-06 09:34:13 -06:00
+								             # Old patterns
 								             r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
-												[youtube] Update signature function patterns (closes #21469, closes #21476)

											
										
										
											2019-06-21 10:58:42 -05:00
+								             r'\b[a-zA-Z0-9]+\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*encodeURIComponent\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\(',
-												[youtube] Improve signature function detection (#641)

Authored by: PSlava (Slava <slash@i-slash.com>)
											
										
										
											2021-08-07 22:54:37 -05:00
+								             r'\bm=(?P<sig>[a-zA-Z0-9$]{2,})\(decodeURIComponent\(h\.s\)\)',
-												[youtube] Update signature function patterns (closes #21469, closes #21476)

											
										
										
											2019-06-21 10:58:42 -05:00
+								             # Obsolete patterns
-												Update to ytdl-commit-d1c6c5

[YouTube] [core] Improve platform debug log, based on yt-dlp
https://github.com/ytdl-org/youtube-dl/commit/d1c6c5c4d618fa950813c0c71aede34a5ac851e9

Except:
    * 6ed34338285f722d0da312ce0af3a15a077a3e2a [jsinterp] Add short-cut evaluation for common expression
        * There was no performance improvement when tested with https://github.com/ytdl-org/youtube-dl/issues/30641
    * e8de54bce50f6f77a4d7e8e80675f7003d5bf630 [core] Handle `/../` sequences in HTTP URLs
        * We plan to implement this differently

											
										
										
											2023-05-24 13:00:43 -05:00
+								             r'("|\')signature\1\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
-												[youtube] Fix extraction (closes #17457, closes #17464)

											
										
										
											2018-09-07 15:36:10 -05:00
+								             r'\.sig\|\|(?P<sig>[a-zA-Z0-9$]+)\(',
-												[youtube] Update signature function patterns (closes #21469, closes #21476)

											
										
										
											2019-06-21 10:58:42 -05:00
+								             r'yt\.akamaized\.net/\)\s*\|\|\s*.*?\s*[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?:encodeURIComponent\s*\()?\s*(?P<sig>[a-zA-Z0-9$]+)\(',
 								             r'\b[cs]\s*&&\s*[adf]\.set\([^,]+\s*,\s*(?P<sig>[a-zA-Z0-9$]+)\(',
 								             r'\bc\s*&&\s*[a-zA-Z0-9]+\.set\([^,]+\s*,\s*\([^)]*\)\s*\(\s*(?P<sig>[a-zA-Z0-9$]+)\('),
-												[youtube] Fix extraction for domainless player URLs

Closes #11890
Closes #11891
Closes #11892
Closes #11894
Closes #11895
Closes #11897
Closes #11900
Closes #11903
Closes #11904
Closes #11906
Closes #11907
Closes #11909
Closes #11913
Closes #11914
Closes #11915
Closes #11916
Closes #11917
Closes #11918
Closes #11919

											
										
										
											2017-01-31 09:19:29 -06:00
+								            jscode, 'Initial JS player signature function name', group='sig')
-												[youtube] Move JavaScript interpreter into its own module

											
										
										
											2014-03-30 00:02:58 -05:00
 								        jsi = JSInterpreter(jscode)
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 15:58:10 -05:00
+								        global_var_map = {}
 								        _, varname, value = self._extract_player_js_global_var(jscode)
 								        if varname:
 								            global_var_map[varname] = jsi.interpret_expression(value, {}, allow_recursion=100)
 								        initial_function = jsi.extract_function(funcname, global_var_map)
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 07:19:30 -05:00
+								        return lambda s: initial_function([s])
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								    def _cached(self, func, *cache_id):
 								        def inner(*args, **kwargs):
 								            if cache_id not in self._player_cache:
 								                try:
 								                    self._player_cache[cache_id] = func(*args, **kwargs)
 								                except ExtractorError as e:
 								                    self._player_cache[cache_id] = e
 								                except Exception as e:
 								                    self._player_cache[cache_id] = ExtractorError(traceback.format_exc(), cause=e)
 								            ret = self._player_cache[cache_id]
 								            if isinstance(ret, Exception):
 								                raise ret
 								            return ret
 								        return inner
-												[ie/youtube] Only cache nsig code on successful decoding (#12750)

Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-25 18:47:45 -05:00
+								    def _load_nsig_code_from_cache(self, player_id):
 								        cache_id = ('nsig code', player_id)
 								        if func_code := self._player_cache.get(cache_id):
 								            return func_code
 								        func_code = self.cache.load('youtube-nsig', player_id, min_ver='2025.03.26')
 								        if func_code:
 								            self._player_cache[cache_id] = func_code
 								        return func_code
 								    def _store_nsig_code_to_cache(self, player_id, func_code):
 								        cache_id = ('nsig code', player_id)
 								        if cache_id not in self._player_cache:
 								            self.cache.store('youtube-nsig', player_id, func_code)
 								            self._player_cache[cache_id] = func_code
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								    def _decrypt_signature(self, s, video_id, player_url):
-												keep track of the dates and html5player versions of working YT signature algos

											
										
										
											2013-06-27 15:20:50 -05:00
+								        """Turn the encrypted s field into a working signature"""
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								        extract_sig = self._cached(
 								            self._extract_signature_function, 'sig', player_url, self._signature_cache_id(s))
 								        func = extract_sig(video_id, player_url, s)
 								        self._print_sig_code(func, s)
 								        return func(s)
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
 								    def _decrypt_nsig(self, s, video_id, player_url):
 								        """Turn the encrypted n field into a working signature"""
 								        if player_url is None:
 								            raise ExtractorError('Cannot decrypt nsig without player_url')
-												[youtube] Ensure subtitle urls are absolute (#2765)

Closes #2755

Authored by: coletdjnz
											
										
										
											2022-02-13 15:36:01 -06:00
+								        player_url = urljoin('https://www.youtube.com', player_url)
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
-												[extractor/youtube] Fallback regex for nsig code extraction

											
										
										
											2022-09-01 03:08:25 -05:00
+								        try:
 								            jsi, player_id, func_code = self._extract_n_function_code(video_id, player_url)
 								        except ExtractorError as e:
 								            raise ExtractorError('Unable to extract nsig function code', cause=e)
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								        if self.get_param('youtube_print_sig_code'):
 								            self.to_screen(f'Extracted nsig function from {player_id}:\n{func_code[1]}\n')
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
-												[extractor/youtube] Add fallback to phantomjs

Related #4635

											
										
										
											2022-08-18 11:05:18 -05:00
+								        try:
 								            extract_nsig = self._cached(self._extract_n_function_from_code, 'nsig func', player_url)
 								            ret = extract_nsig(jsi, func_code)(s)
 								        except JSInterpreter.Exception as e:
 								            try:
-												[jsinterp] Implement timeout

Workaround for #4716

											
										
										
											2022-08-21 19:49:06 -05:00
+								                jsi = PhantomJSwrapper(self, timeout=5000)
-												[extractor/youtube] Add fallback to phantomjs

Related #4635

											
										
										
											2022-08-18 11:05:18 -05:00
+								            except ExtractorError:
 								                raise e
 								            self.report_warning(
 								                f'Native nsig extraction failed: Trying with PhantomJS\n'
 								                f'         n = {s} ; player = {player_url}', video_id)
-												[jsinterp] Improve separating regex

Fixes https://github.com/yt-dlp/yt-dlp/issues/4635#issuecomment-1273974909

											
										
										
											2022-10-10 21:29:27 -05:00
+								            self.write_debug(e, only_once=True)
-												[extractor/youtube] Add fallback to phantomjs

Related #4635

											
										
										
											2022-08-18 11:05:18 -05:00
 								            args, func_body = func_code
 								            ret = jsi.execute(
 								                f'console.log(function({", ".join(args)}) {{ {func_body} }}({s!r}));',
 								                video_id=video_id, note='Executing signature code').strip()
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
 								        self.write_debug(f'Decrypted nsig {s} => {ret}')
-												[ie/youtube] Only cache nsig code on successful decoding (#12750)

Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-25 18:47:45 -05:00
+								        # Only cache nsig func JS code to disk if successful, and only once
 								        self._store_nsig_code_to_cache(player_id, func_code)
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								        return ret
-												[cleanup] Misc (#10623)

Authored by: bashonly
											
										
										
											2024-08-01 10:03:49 -05:00
+								    def _extract_n_function_name(self, jscode, player_url=None):
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								        # Examples (with placeholders nfunc, narray, idx):
 								        # *  .get("n"))&&(b=nfunc(b)
 								        # *  .get("n"))&&(b=narray[idx](b)
 								        # *  b=String.fromCharCode(110),c=a.get(b))&&c=narray[idx](c)
 								        # *  a.D&&(b="nn"[+a.D],c=a.get(b))&&(c=narray[idx](c),a.set(b,c),narray.length||nfunc("")
 								        # *  a.D&&(PL(a),b=a.j.n||null)&&(b=narray[0](b),a.set("n",b),narray.length||nfunc("")
-												[ie/youtube] Fix `n` function name extraction for player `b12cc44b` (#10668)

Authored by: seproDev
											
										
										
											2024-08-05 15:36:11 -05:00
+								        # *  a.D&&(b="nn"[+a.D],vL(a),c=a.j[b]||null)&&(c=narray[idx](c),a.set(b,c),narray.length||nfunc("")
-												[ie/youtube] Fix `n` sig extraction for player `3bb1f723` (#11750)

Closes #11744
Authored by: bashonly
											
										
										
											2024-12-06 09:35:18 -06:00
+								        # *  J.J="";J.url="";J.Z&&(R="nn"[+J.Z],mW(J),N=J.K[R]||null)&&(N=narray[idx](N),J.set(R,N))}};
-												[test] Fix test_youtube_signature

											
										
										
											2022-08-20 14:21:03 -05:00
+								        funcname, idx = self._search_regex(
-												[ie/youtube] Fix `n` function name extraction for player `3400486c` (#10542)

Authored by: bashonly
											
										
										
											2024-07-23 16:25:49 -05:00
+								            r'''(?x)
 								            (?:
 								                \.get\("n"\)\)&&\(b=|
 								                (?:
 								                    b=String\.fromCharCode\(110\)|
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								                    (?P<str_idx>[a-zA-Z0-9_$.]+)&&\(b="nn"\[\+(?P=str_idx)\]
-												[ie/youtube] Fix `n` function name extraction for player `b12cc44b` (#10668)

Authored by: seproDev
											
										
										
											2024-08-05 15:36:11 -05:00
+								                )
 								                (?:
 								                    ,[a-zA-Z0-9_$]+\(a\))?,c=a\.
 								                    (?:
 								                        get\(b\)|
 								                        [a-zA-Z0-9_$]+\[b\]\|\|null
 								                    )\)&&\(c=|
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								                \b(?P<var>[a-zA-Z0-9_$]+)=
 								            )(?P<nfunc>[a-zA-Z0-9_$]+)(?:\[(?P<idx>\d+)\])?\([a-zA-Z]\)
-												[ie/youtube] Fix `n` sig extraction for player `3bb1f723` (#11750)

Closes #11744
Authored by: bashonly
											
										
										
											2024-12-06 09:35:18 -06:00
+								            (?(var),[a-zA-Z0-9_$]+\.set\((?:"n+"|[a-zA-Z0-9_$]+)\,(?P=var)\))''',
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								            jscode, 'n function name', group=('nfunc', 'idx'), default=(None, None))
 								        if not funcname:
-												[cleanup] Misc (#10623)

Authored by: bashonly
											
										
										
											2024-08-01 10:03:49 -05:00
+								            self.report_warning(join_nonempty(
 								                'Falling back to generic n function search',
 								                player_url and f'         player = {player_url}', delim='\n'))
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								            return self._search_regex(
 								                r'''(?xs)
 								                ;\s*(?P<name>[a-zA-Z0-9_$]+)\s*=\s*function\([a-zA-Z0-9_$]+\)
-												[ie/youtube] Fix `n` sig extraction for player `3bb1f723` (#11750)

Closes #11744
Authored by: bashonly
											
										
										
											2024-12-06 09:35:18 -06:00
+								                \s*\{(?:(?!};).)+?return\s*(?P<q>["'])[\w-]+_w8_(?P=q)\s*\+\s*[a-zA-Z0-9_$]+''',
-												[ie/youtube] Fix `n` function name extraction for player `20dfca59` (#10611)

Closes #10608
Authored by: bashonly
											
										
										
											2024-07-31 16:19:30 -05:00
+								                jscode, 'Initial JS player n function name', group='name')
 								        elif not idx:
-												[test] Fix test_youtube_signature

											
										
										
											2022-08-20 14:21:03 -05:00
+								            return funcname
 								        return json.loads(js_to_json(self._search_regex(
-												[cleanup] Misc

											
										
										
											2023-07-06 09:39:42 -05:00
+								            rf'var {re.escape(funcname)}\s*=\s*(\[.+?\])\s*[,;]', jscode,
-												[test] Fix test_youtube_signature

											
										
										
											2022-08-20 14:21:03 -05:00
+								            f'Initial JS player n function list ({funcname}.{idx})')))[int(idx)]
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 15:58:10 -05:00
+								    def _extract_player_js_global_var(self, jscode):
 								        """Returns tuple of strings: variable assignment code, variable name, variable value code"""
 								        return self._search_regex(
 								            r'''(?x)
-												[ie/youtube] Fix signature and nsig extraction for player `363db69b` (#12725)

Closes #12724
Authored by: bashonly
											
										
										
											2025-03-24 16:18:51 -05:00
+								                (?P<q1>["\'])use\s+strict(?P=q1);\s*
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 15:58:10 -05:00
+								                (?P<code>
 								                    var\s+(?P<name>[a-zA-Z0-9_$]+)\s*=\s*
-												[ie/youtube] Fix signature and nsig extraction for player `363db69b` (#12725)

Closes #12724
Authored by: bashonly
											
										
										
											2025-03-24 16:18:51 -05:00
+								                    (?P<value>
 								                        (?P<q2>["\'])(?:(?!(?P=q2)).|\\.)+(?P=q2)
 								                        \.split\((?P<q3>["\'])(?:(?!(?P=q3)).)+(?P=q3)\)
-												[ie/youtube] Fix signature and nsig extraction for player `4fcd6e4a` (#12748)

Closes #12746
Authored by: seproDev
											
										
										
											2025-03-25 18:40:58 -05:00
+								                        |\[\s*(?:(?P<q4>["\'])(?:(?!(?P=q4)).|\\.)*(?P=q4)\s*,?\s*)+\]
-												[ie/youtube] Fix signature and nsig extraction for player `363db69b` (#12725)

Closes #12724
Authored by: bashonly
											
										
										
											2025-03-24 16:18:51 -05:00
+								                    )
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 15:58:10 -05:00
+								                )[;,]
 								            ''', jscode, 'global variable', group=('code', 'name', 'value'), default=(None, None, None))
 								    def _fixup_n_function_code(self, argnames, code, full_code):
 								        global_var, varname, _ = self._extract_player_js_global_var(full_code)
 								        if global_var:
 								            self.write_debug(f'Prepending n function code with global array variable "{varname}"')
-												[ie/youtube] Fix PhantomJS nsig fallback (#12728)

Also fixes the NSigDeno plugin

Closes #12724
Authored by: bashonly
											
										
										
											2025-03-24 16:22:25 -05:00
+								            code = global_var + '; ' + code
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 15:58:10 -05:00
+								        else:
 								            self.write_debug('No global array variable found in player JS')
-												[ie/youtube] Fix `n` sig extraction for player `3bb1f723` (#11750)

Closes #11744
Authored by: bashonly
											
										
										
											2024-12-06 09:35:18 -06:00
+								        return argnames, re.sub(
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 15:58:10 -05:00
+								            rf';\s*if\s*\(\s*typeof\s+[a-zA-Z0-9_$]+\s*===?\s*(?:(["\'])undefined\1|{varname}\[\d+\])\s*\)\s*return\s+{argnames[0]};',
-												[ie/youtube] Fix `n` sig extraction for player `3bb1f723` (#11750)

Closes #11744
Authored by: bashonly
											
										
										
											2024-12-06 09:35:18 -06:00
+								            ';', code)
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								    def _extract_n_function_code(self, video_id, player_url):
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								        player_id = self._extract_player_info(player_url)
-												[ie/youtube] Only cache nsig code on successful decoding (#12750)

Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-25 18:47:45 -05:00
+								        func_code = self._load_nsig_code_from_cache(player_id)
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								        jscode = func_code or self._load_player(video_id, player_url)
 								        jsi = JSInterpreter(jscode)
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
 								        if func_code:
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								            return jsi, player_id, func_code
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
-												[cleanup] Misc (#10623)

Authored by: bashonly
											
										
										
											2024-08-01 10:03:49 -05:00
+								        func_name = self._extract_n_function_name(jscode, player_url=player_url)
-												[extractor/youtube] Fallback regex for nsig code extraction

											
										
										
											2022-09-01 03:08:25 -05:00
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 15:58:10 -05:00
+								        # XXX: Workaround for the global array variable and lack of `typeof` implementation
 								        func_code = self._fixup_n_function_code(*jsi.extract_function_code(func_name), jscode)
-												[extractor/youtube] Fallback regex for nsig code extraction

											
										
										
											2022-09-01 03:08:25 -05:00
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								        return jsi, player_id, func_code
 								    def _extract_n_function_from_code(self, jsi, func_code):
-												[jsinterp] Handle new youtube signature functions

Closes #4635

											
										
										
											2022-08-13 18:21:54 -05:00
+								        func = jsi.extract_function_from_code(*func_code)
-												[jsinterp] Fix for youtube player 1f7d5369

Closes #4635 again

											
										
										
											2022-08-18 06:08:35 -05:00
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								        def extract_nsig(s):
-												[extractor/youtube] Add fallback to phantomjs

Related #4635

											
										
										
											2022-08-18 11:05:18 -05:00
+								            try:
 								                ret = func([s])
 								            except JSInterpreter.Exception:
 								                raise
 								            except Exception as e:
 								                raise JSInterpreter.Exception(traceback.format_exc(), cause=e)
-												[ie/youtube] Raise if `n` function returns input value (#11752)

Improve a95ee6d8803fca9157adecf63732ab58bf87fd88

Authored by: bashonly
											
										
										
											2024-12-06 09:58:44 -06:00
+								            if ret.startswith('enhanced_except_') or ret.endswith(s):
-												[extractor/youtube] Add fallback to phantomjs

Related #4635

											
										
										
											2022-08-18 11:05:18 -05:00
+								                raise JSInterpreter.Exception('Signature function returned an exception')
-												[jsinterp] Fix for youtube player 1f7d5369

Closes #4635 again

											
										
										
											2022-08-18 06:08:35 -05:00
+								            return ret
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
 								        return extract_nsig
-												Restore accidentally deleted commits

That's what happens if you let Windows machines write :(

											
										
										
											2013-09-21 07:19:30 -05:00
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								    def _extract_signature_timestamp(self, video_id, player_url, ytcfg=None, fatal=False):
 								        """
 								        Extract signatureTimestamp (sts)
 								        Required to tell API what sig/player version is in use.
 								        """
 								        sts = None
 								        if isinstance(ytcfg, dict):
 								            sts = int_or_none(ytcfg.get('STS'))
 								        if not sts:
 								            # Attempt to extract from player
 								            if player_url is None:
 								                error_msg = 'Cannot extract signature timestamp without player_url.'
 								                if fatal:
 								                    raise ExtractorError(error_msg)
 								                self.report_warning(error_msg)
 								                return
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								            code = self._load_player(video_id, player_url, fatal=fatal)
 								            if code:
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								                sts = int_or_none(self._search_regex(
 								                    r'(?:signatureTimestamp|sts)\s*:\s*(?P<sts>[0-9]{5})', code,
 								                    'JS player signature timestamp', group='sts', fatal=fatal))
 								        return sts
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								    def _mark_watched(self, video_id, player_responses):
-												[extractor/youtube] Mark videos as fully watched (#4146)

* Also fixes videos appearing as shorts in watch history

Closes #2555
Authored by: Brett824
											
										
										
											2022-06-23 18:30:17 -05:00
+								        for is_full, key in enumerate(('videostatsPlaybackUrl', 'videostatsWatchtimeUrl')):
 								            label = 'fully ' if is_full else ''
 								            url = get_first(player_responses, ('playbackTracking', key, 'baseUrl'),
 								                            expected_type=url_or_none)
 								            if not url:
 								                self.report_warning(f'Unable to mark {label}watched')
 								                return
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 05:54:43 -05:00
+								            parsed_url = urllib.parse.urlparse(url)
 								            qs = urllib.parse.parse_qs(parsed_url.query)
-												[extractor/youtube] Mark videos as fully watched (#4146)

* Also fixes videos appearing as shorts in watch history

Closes #2555
Authored by: Brett824
											
										
										
											2022-06-23 18:30:17 -05:00
 								            # cpn generation algorithm is reverse engineered from base.js.
 								            # In fact it works even with dummy cpn.
 								            CPN_ALPHABET = 'abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_'
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            cpn = ''.join(CPN_ALPHABET[random.randint(0, 256) & 63] for _ in range(16))
-												[extractor/youtube] Mark videos as fully watched (#4146)

* Also fixes videos appearing as shorts in watch history

Closes #2555
Authored by: Brett824
											
										
										
											2022-06-23 18:30:17 -05:00
 								            # # more consistent results setting it to right before the end
 								            video_length = [str(float((qs.get('len') or ['1.5'])[0]) - 1)]
 								            qs.update({
 								                'ver': ['2'],
 								                'cpn': [cpn],
 								                'cmt': video_length,
 								                'el': 'detailpage',  # otherwise defaults to "shorts"
 								            })
 								            if is_full:
 								                # these seem to mark watchtime "history" in the real world
 								                # they're required, so send in a single value
 								                qs.update({
-												[extractor/youtube] Mark videos as fully watched

Closes #2555
Authored by: bsun0000

											
										
										
											2022-10-18 13:35:54 -05:00
+								                    'st': 0,
-												[extractor/youtube] Mark videos as fully watched (#4146)

* Also fixes videos appearing as shorts in watch history

Closes #2555
Authored by: Brett824
											
										
										
											2022-06-23 18:30:17 -05:00
+								                    'et': video_length,
 								                })
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 05:54:43 -05:00
+								            url = urllib.parse.urlunparse(
 								                parsed_url._replace(query=urllib.parse.urlencode(qs, True)))
-												[extractor/youtube] Mark videos as fully watched (#4146)

* Also fixes videos appearing as shorts in watch history

Closes #2555
Authored by: Brett824
											
										
										
											2022-06-23 18:30:17 -05:00
 								            self._download_webpage(
 								                url, video_id, f'Marking {label}watched',
-												[ie/youtube] Remove broken OAuth support (#11558)

Closes #11462
Authored by: bashonly
											
										
										
											2024-11-16 17:40:21 -06:00
+								                'Unable to mark watched', fatal=False)
-												Add --mark-watched feature (Closes #5054)

											
										
										
											2016-02-29 13:01:33 -06:00
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-07-31 20:23:25 -05:00
+								    @classmethod
 								    def _extract_from_webpage(cls, url, webpage):
 								        # Invidious Instances
 								        # https://github.com/yt-dlp/yt-dlp/issues/195
 								        # https://github.com/iv-org/invidious/pull/1730
 								        mobj = re.search(
 								            r'<link rel="alternate" href="(?P<url>https://www\.youtube\.com/watch\?v=[0-9A-Za-z_-]{11})"',
 								            webpage)
 								        if mobj:
 								            yield cls.url_result(mobj.group('url'), cls)
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            raise cls.StopExtraction
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-07-31 20:23:25 -05:00
 								        yield from super()._extract_from_webpage(url, webpage)
-												[youtube] Separate methods for embeds extraction

											
										
										
											2017-09-05 12:48:37 -05:00
 								        # lazyYT YouTube embed
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-07-31 20:23:25 -05:00
+								        for id_ in re.findall(r'class="lazyYT" data-youtube-id="([^"]+)"', webpage):
 								            yield cls.url_result(unescapeHTML(id_), cls, id_)
-												[youtube] Separate methods for embeds extraction

											
										
										
											2017-09-05 12:48:37 -05:00
 								        # Wordpress "YouTube Video Importer" plugin
-												[extractors] Use new framework for existing embeds (#4307)

`Brightcove` is difficult to migrate because it's subclasses may depend
on the signature of the current functions. So it is left as-is for now

Note: Tests have not been migrated

											
										
										
											2022-07-31 20:23:25 -05:00
+								        for m in re.findall(r'''(?x)<div[^>]+
 								                class=(?P<q1>[\'"])[^\'"]*\byvii_single_video_player\b[^\'"]*(?P=q1)[^>]+
 								                data-video_id=(?P<q2>[\'"])([^\'"]+)(?P=q2)''', webpage):
 								            yield cls.url_result(m[-1], cls, m[-1])
-												[youtube] Separate methods for embeds extraction

											
										
										
											2017-09-05 12:48:37 -05:00
-												[jadorecettepub] Add extractor (Fixes #2148)

											
										
										
											2014-02-08 12:20:11 -06:00
+								    @classmethod
 								    def extract_id(cls, url):
-												[cleanup] Misc cleanup

											
										
										
											2022-06-28 00:10:54 -05:00
+								        video_id = cls.get_temp_id(url)
 								        if not video_id:
 								            raise ExtractorError(f'Invalid URL: {url}')
 								        return video_id
-												Move youtube extractors to youtube_dl.extractor.youtube

											
										
										
											2013-06-23 12:58:33 -05:00
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								    def _extract_chapters_from_json(self, data, duration):
 								        chapter_list = traverse_obj(
 								            data, (
 								                'playerOverlays', 'playerOverlayRenderer', 'decoratedPlayerBarRenderer',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                'decoratedPlayerBarRenderer', 'playerBar', 'chapteredPlayerBarRenderer', 'chapters',
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								            ), expected_type=list)
-												[extractor/rutube] Extract chapters from description (#6345)

Authored by: mushbite
											
										
										
											2023-03-04 07:33:17 -06:00
+								        return self._extract_chapters_helper(
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								            chapter_list,
-												[extractor/rutube] Extract chapters from description (#6345)

Authored by: mushbite
											
										
										
											2023-03-04 07:33:17 -06:00
+								            start_function=lambda chapter: float_or_none(
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								                traverse_obj(chapter, ('chapterRenderer', 'timeRangeStartMillis')), scale=1000),
-												[extractor/rutube] Extract chapters from description (#6345)

Authored by: mushbite
											
										
										
											2023-03-04 07:33:17 -06:00
+								            title_function=lambda chapter: traverse_obj(
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								                chapter, ('chapterRenderer', 'title', 'simpleText'), expected_type=str),
 								            duration=duration)
 								    def _extract_chapters_from_engagement_panel(self, data, duration):
 								        content_list = traverse_obj(
-												Merge 'ytdl-org/youtube-dl/master' release 2020.11.19

Old Extractors left behind:
	VLivePlaylistIE
	YoutubeSearchURLIE
	YoutubeShowIE
	YoutubeFavouritesIE

If removing old extractors, make corresponding changes in
	docs/supportedsites.md
	youtube_dlc/extractor/extractors.py

Not merged:
	.github/ISSUE_TEMPLATE/1_broken_site.md
	.github/ISSUE_TEMPLATE/2_site_support_request.md
	.github/ISSUE_TEMPLATE/3_site_feature_request.md
	.github/ISSUE_TEMPLATE/4_bug_report.md
	.github/ISSUE_TEMPLATE/5_feature_request.md
	test/test_all_urls.py
	youtube_dlc/version.py
	Changelog

											
										
										
											2020-11-19 13:22:59 -06:00
+								            data,
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								            ('engagementPanels', ..., 'engagementPanelSectionListRenderer', 'content', 'macroMarkersListRenderer', 'contents'),
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								            expected_type=list)
-												[youtube] Simplify `_get_text` early

											
										
										
											2021-07-23 19:46:46 -05:00
+								        chapter_time = lambda chapter: parse_duration(self._get_text(chapter, 'timeDescription'))
 								        chapter_title = lambda chapter: self._get_text(chapter, 'title')
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 10:59:03 -05:00
+								        return next(filter(None, (
-												[extractor/rutube] Extract chapters from description (#6345)

Authored by: mushbite
											
										
										
											2023-03-04 07:33:17 -06:00
+								            self._extract_chapters_helper(traverse_obj(contents, (..., 'macroMarkersListItemRenderer')),
 								                                          chapter_time, chapter_title, duration)
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 10:59:03 -05:00
+								            for contents in content_list)), [])
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
-												[ie/youtube] Fix `heatmap` extraction (#8299)

Closes #8189
Authored by: bashonly
											
										
										
											2023-10-06 20:00:15 -05:00
+								    def _extract_heatmap(self, data):
 								        return traverse_obj(data, (
 								            'frameworkUpdates', 'entityBatchUpdate', 'mutations',
 								            lambda _, v: v['payload']['macroMarkersListEntity']['markersList']['markerType'] == 'MARKER_TYPE_HEATMAP',
 								            'payload', 'macroMarkersListEntity', 'markersList', 'markers', ..., {
-												[cleanup] Misc (#11347)

Closes #11361
Authored by: avagordon01, bashonly, grqz, Grub4K, seproDev

Co-authored-by: Ava Gordon <avagordon01@gmail.com>
Co-authored-by: bashonly <bashonly@protonmail.com>
Co-authored-by: N/Ame <173015200+grqz@users.noreply.github.com>
Co-authored-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-11-03 18:33:21 -06:00
+								                'start_time': ('startMillis', {float_or_none(scale=1000)}),
-												[ie/youtube] Fix `heatmap` extraction (#8299)

Closes #8189
Authored by: bashonly
											
										
										
											2023-10-06 20:00:15 -05:00
+								                'end_time': {lambda x: (int(x['startMillis']) + int(x['durationMillis'])) / 1000},
 								                'value': ('intensityScoreNormalized', {float_or_none}),
 								            })) or None
-												[extractor/youtube] Extract `heatmap` data (#7100)

Closes #3888
Authored by: tntmod54321
											
										
										
											2023-05-26 07:24:39 -05:00
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 09:37:30 -05:00
+								    def _extract_comment(self, entities, parent=None):
 								        comment_entity_payload = get_first(entities, ('payload', 'commentEntityPayload', {dict}))
 								        if not (comment_id := traverse_obj(comment_entity_payload, ('properties', 'commentId', {str}))):
 								            return
 								        toolbar_entity_payload = get_first(entities, ('payload', 'engagementToolbarStateEntityPayload', {dict}))
 								        time_text = traverse_obj(comment_entity_payload, ('properties', 'publishedTime', {str})) or ''
 								        return {
 								            'id': comment_id,
 								            'parent': parent or 'root',
 								            **traverse_obj(comment_entity_payload, {
 								                'text': ('properties', 'content', 'content', {str}),
 								                'like_count': ('toolbar', 'likeCountA11y', {parse_count}),
 								                'author_id': ('author', 'channelId', {self.ucid_or_none}),
 								                'author': ('author', 'displayName', {str}),
 								                'author_thumbnail': ('author', 'avatarThumbnailUrl', {url_or_none}),
 								                'author_is_uploader': ('author', 'isCreator', {bool}),
 								                'author_is_verified': ('author', 'isVerified', {bool}),
 								                'author_url': ('author', 'channelCommand', 'innertubeCommand', (
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                    ('browseEndpoint', 'canonicalBaseUrl'), ('commandMetadata', 'webCommandMetadata', 'url'),
-												[cleanup] Misc (#11347)

Closes #11361
Authored by: avagordon01, bashonly, grqz, Grub4K, seproDev

Co-authored-by: Ava Gordon <avagordon01@gmail.com>
Co-authored-by: bashonly <bashonly@protonmail.com>
Co-authored-by: N/Ame <173015200+grqz@users.noreply.github.com>
Co-authored-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-11-03 18:33:21 -06:00
+								                ), {urljoin('https://www.youtube.com')}),
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 09:37:30 -05:00
+								            }, get_all=False),
 								            'is_favorited': (None if toolbar_entity_payload is None else
 								                             toolbar_entity_payload.get('heartState') == 'TOOLBAR_HEART_STATE_HEARTED'),
 								            '_time_text': time_text,  # FIXME: non-standard, but we need a way of showing that it is an estimate.
 								            'timestamp': self._parse_time_text(time_text),
 								        }
 								    def _extract_comment_old(self, comment_renderer, parent=None):
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								        comment_id = comment_renderer.get('commentId')
 								        if not comment_id:
 								            return
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-18 23:55:07 -05:00
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 03:43:32 -05:00
+								        info = {
 								            'id': comment_id,
 								            'text': self._get_text(comment_renderer, 'contentText'),
 								            'like_count': self._get_count(comment_renderer, 'voteCount'),
 								            'author_id': traverse_obj(comment_renderer, ('authorEndpoint', 'browseEndpoint', 'browseId', {self.ucid_or_none})),
 								            'author': self._get_text(comment_renderer, 'authorText'),
 								            'author_thumbnail': traverse_obj(comment_renderer, ('authorThumbnail', 'thumbnails', -1, 'url', {url_or_none})),
 								            'parent': parent or 'root',
 								        }
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-18 23:55:07 -05:00
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								        # Timestamp is an estimate calculated from the current time and time_text
 								        time_text = self._get_text(comment_renderer, 'publishedTimeText') or ''
 								        timestamp = self._parse_time_text(time_text)
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 03:43:32 -05:00
+								        info.update({
 								            # FIXME: non-standard, but we need a way of showing that it is an estimate.
 								            '_time_text': time_text,
 								            'timestamp': timestamp,
 								        })
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-18 23:55:07 -05:00
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 03:43:32 -05:00
+								        info['author_url'] = urljoin(
 								            'https://www.youtube.com', traverse_obj(comment_renderer, ('authorEndpoint', (
 								                ('browseEndpoint', 'canonicalBaseUrl'), ('commandMetadata', 'webCommandMetadata', 'url'))),
 								                expected_type=str, get_all=False))
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 03:43:32 -05:00
+								        author_is_uploader = traverse_obj(comment_renderer, 'authorIsChannelOwner')
 								        if author_is_uploader is not None:
 								            info['author_is_uploader'] = author_is_uploader
 								        comment_abr = traverse_obj(
-												[extractor/youtube] Fix comments' `is_favorited` (#7390)

Authored by: bbilly1
Closes #7389
											
										
										
											2023-06-22 13:08:42 -05:00
+								            comment_renderer, ('actionButtons', 'commentActionButtonsRenderer'), expected_type=dict)
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 03:43:32 -05:00
+								        if comment_abr is not None:
 								            info['is_favorited'] = 'creatorHeart' in comment_abr
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								        badges = self._extract_badges([traverse_obj(comment_renderer, 'authorCommentBadge')])
 								        if self._has_badge(badges, BadgeType.VERIFIED):
 								            info['author_is_verified'] = True
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 03:43:32 -05:00
 								        is_pinned = traverse_obj(comment_renderer, 'pinnedCommentBadge')
 								        if is_pinned:
 								            info['is_pinned'] = True
 								        return info
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								    def _comment_entries(self, root_continuation_data, ytcfg, video_id, parent=None, tracker=None):
 								        get_single_config_arg = lambda c: self._configuration_arg(c, [''])[0]
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
 								        def extract_header(contents):
 								            _continuation = None
 								            for content in contents:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                comments_header_renderer = traverse_obj(content, 'commentsHeaderRenderer')
-												[youtube:tab] Extract more playlist metadata (#2069)

* Add fields modified_date, modified_timestamp
* Add field playlist_count
* [youtube:tab] Extract view_count, playlist_count, modified_date

Authored by: coletdjnz, pukkandan
											
										
										
											2022-01-07 05:03:02 -06:00
+								                expected_comment_count = self._get_count(
 								                    comments_header_renderer, 'countText', 'commentsCount')
-												[youtube] misc cleanup and bug fixes (#505)

* Update some `_extract_response` calls to keep them consistent
* Cleanup continuation extraction related code using new API format
* Improve `_extract_account_syncid` to support multiple parameters
* Generalize `get_text` and related functions into one
* Update `INNERTUBE_CONTEXT_CLIENT_NAME` with integer values

Authored by: colethedj
											
										
										
											2021-07-18 23:55:07 -05:00
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 02:08:28 -05:00
+								                if expected_comment_count is not None:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                    tracker['est_total'] = expected_comment_count
 								                    self.to_screen(f'Downloading ~{expected_comment_count} comments')
 								                comment_sort_index = int(get_single_config_arg('comment_sort') != 'top')  # 1 = new, 0 = top
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
 								                sort_menu_item = try_get(
 								                    comments_header_renderer,
 								                    lambda x: x['sortMenu']['sortFilterSubMenuRenderer']['subMenuItems'][comment_sort_index], dict) or {}
 								                sort_continuation_ep = sort_menu_item.get('serviceEndpoint') or {}
 								                _continuation = self._extract_continuation_ep_data(sort_continuation_ep) or self._extract_continuation(sort_menu_item)
 								                if not _continuation:
 								                    continue
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                sort_text = str_or_none(sort_menu_item.get('title'))
 								                if not sort_text:
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								                    sort_text = 'top comments' if comment_sort_index == 0 else 'newest first'
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                self.to_screen(f'Sorting comments by {sort_text.lower()}')
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								                break
-												[extractor] Generalize `getcomments` implementation

											
										
										
											2021-10-12 04:50:50 -05:00
+								            return _continuation
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 09:37:30 -05:00
+								        def extract_thread(contents, entity_payloads):
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								            if not parent:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                tracker['current_page_thread'] = 0
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								            for content in contents:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                if not parent and tracker['total_parent_comments'] >= max_parents:
 								                    yield
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								                comment_thread_renderer = try_get(content, lambda x: x['commentThreadRenderer'])
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 09:37:30 -05:00
+								                # old comment format
 								                if not entity_payloads:
 								                    comment_renderer = get_first(
 								                        (comment_thread_renderer, content), [['commentRenderer', ('comment', 'commentRenderer')]],
 								                        expected_type=dict, default={})
 								                    comment = self._extract_comment_old(comment_renderer, parent)
 								                # new comment format
 								                else:
 								                    view_model = (
 								                        traverse_obj(comment_thread_renderer, ('commentViewModel', 'commentViewModel', {dict}))
 								                        or traverse_obj(content, ('commentViewModel', {dict})))
 								                    comment_keys = traverse_obj(view_model, (('commentKey', 'toolbarStateKey'), {str}))
 								                    if not comment_keys:
 								                        continue
 								                    entities = traverse_obj(entity_payloads, lambda _, v: v['entityKey'] in comment_keys)
 								                    comment = self._extract_comment(entities, parent)
 								                    if comment:
 								                        comment['is_pinned'] = traverse_obj(view_model, ('pinnedText', {str})) is not None
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								                if not comment:
 								                    continue
-												[extractor/youtube] Fix comment loop detection for pinned comments (#6714)

Pinned comments may repeat a second time - this is expected.

Fixes https://github.com/yt-dlp/yt-dlp/issues/6712

Authored by: coletdjnz
											
										
										
											2023-04-06 02:44:22 -05:00
+								                comment_id = comment['id']
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 09:37:30 -05:00
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 03:43:32 -05:00
+								                if comment.get('is_pinned'):
-												[extractor/youtube] Fix comment loop detection for pinned comments (#6714)

Pinned comments may repeat a second time - this is expected.

Fixes https://github.com/yt-dlp/yt-dlp/issues/6712

Authored by: coletdjnz
											
										
										
											2023-04-06 02:44:22 -05:00
+								                    tracker['pinned_comment_ids'].add(comment_id)
-												[extractor/youtube] Detect and break on looping comments (#6301)

Fixes https://github.com/yt-dlp/yt-dlp/issues/6290

Authored by: coletdjnz
											
										
										
											2023-03-01 01:56:53 -06:00
+								                # Sometimes YouTube may break and give us infinite looping comments.
 								                # See: https://github.com/yt-dlp/yt-dlp/issues/6290
-												[extractor/youtube] Fix comment loop detection for pinned comments (#6714)

Pinned comments may repeat a second time - this is expected.

Fixes https://github.com/yt-dlp/yt-dlp/issues/6712

Authored by: coletdjnz
											
										
										
											2023-04-06 02:44:22 -05:00
+								                if comment_id in tracker['seen_comment_ids']:
-												[extractor/youtube] Extract more metadata for comments (#7179)

Adds new comment fields:
* `author_url` - The url to the comment author's page
* `author_is_verified` - Whether the author is verified on the platform
* `is_pinned` - Whether the comment is pinned to the top of the comments

Closes https://github.com/yt-dlp/yt-dlp/issues/5411

Authored by: coletdjnz
											
										
										
											2023-06-01 03:43:32 -05:00
+								                    if comment_id in tracker['pinned_comment_ids'] and not comment.get('is_pinned'):
-												[extractor/youtube] Fix comment loop detection for pinned comments (#6714)

Pinned comments may repeat a second time - this is expected.

Fixes https://github.com/yt-dlp/yt-dlp/issues/6712

Authored by: coletdjnz
											
										
										
											2023-04-06 02:44:22 -05:00
+								                        # Pinned comments may appear a second time in newest first sort
 								                        # See: https://github.com/yt-dlp/yt-dlp/issues/6712
 								                        continue
-												[extractor/youtube] Ignore incomplete data for comment threads by default (#7475)

For both `--ignore-errors` and `--ignore-errors only_download`. Pass `--no-ignore-errors` to not ignore.

Closes https://github.com/yt-dlp/yt-dlp/issues/7474

Authored by: coletdjnz
											
										
										
											2023-07-03 05:47:10 -05:00
+								                    self.report_warning(
 								                        'Detected YouTube comments looping. Stopping comment extraction '
 								                        f'{"for this thread" if parent else ""} as we probably cannot get any more.')
-												[extractor/youtube] Detect and break on looping comments (#6301)

Fixes https://github.com/yt-dlp/yt-dlp/issues/6290

Authored by: coletdjnz
											
										
										
											2023-03-01 01:56:53 -06:00
+								                    yield
 								                else:
 								                    tracker['seen_comment_ids'].add(comment['id'])
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
 								                tracker['running_total'] += 1
 								                tracker['total_reply_comments' if parent else 'total_parent_comments'] += 1
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								                yield comment
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								                # Attempt to get the replies
 								                comment_replies_renderer = try_get(
 								                    comment_thread_renderer, lambda x: x['replies']['commentRepliesRenderer'], dict)
 								                if comment_replies_renderer:
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                    tracker['current_page_thread'] += 1
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								                    comment_entries_iter = self._comment_entries(
-												[youtube] Cleanup authentication code (#786)

Authored by: coletdjnz
											
										
										
											2021-09-23 19:52:17 -05:00
+								                        comment_replies_renderer, ytcfg, video_id,
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                        parent=comment.get('id'), tracker=tracker)
-												[cleanup] Upgrade syntax

Using https://github.com/asottile/pyupgrade

1. `__future__` imports and `coding: utf-8` were removed
2. Files were rewritten with `pyupgrade --py36-plus --keep-percent-format`
3. f-strings were cherry-picked from `pyupgrade --py36-plus`

Extractors are left untouched (except removing header) to avoid unnecessary merge conflicts

											
										
										
											2022-04-11 10:10:28 -05:00
+								                    yield from itertools.islice(comment_entries_iter, min(
 								                        max_replies_per_thread, max(0, max_replies - tracker['total_reply_comments'])))
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								        # Keeps track of counts across recursive calls
 								        if not tracker:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            tracker = {
 								                'running_total': 0,
 								                'est_total': None,
 								                'current_page_thread': 0,
 								                'total_parent_comments': 0,
 								                'total_reply_comments': 0,
 								                'seen_comment_ids': set(),
 								                'pinned_comment_ids': set(),
 								            }
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
 								        # TODO: Deprecated
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								        # YouTube comments have a max depth of 2
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								        max_depth = int_or_none(get_single_config_arg('max_comment_depth'))
 								        if max_depth:
-												[utils] Add `deprecation_warning`

See https://github.com/yt-dlp/yt-dlp/pull/2173#issuecomment-1097021515

											
										
										
											2022-08-30 10:28:28 -05:00
+								            self._downloader.deprecated_feature('[youtube] max_comment_depth extractor argument is deprecated. '
 								                                                'Set max replies in the max-comments extractor argument instead')
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								        if max_depth == 1 and parent:
 								            return
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								        max_comments, max_parents, max_replies, max_replies_per_thread, *_ = (
 								            int_or_none(p, default=sys.maxsize) for p in self._configuration_arg('max_comments') + [''] * 4)
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								        continuation = self._extract_continuation(root_continuation_data)
-												[youtube:comments] Fix comment section not being extracted in new layouts (#1324)

Co-authored-by: coletdjnz, pukkandan
											
										
										
											2021-10-17 21:58:42 -05:00
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								        response = None
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 01:46:28 -05:00
+								        is_forced_continuation = False
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								        is_first_continuation = parent is None
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 01:46:28 -05:00
+								        if is_first_continuation and not continuation:
 								            # Sometimes you can get comments by generating the continuation yourself,
 								            # even if YouTube initially reports them being disabled - e.g. stories comments.
 								            # Note: if the comment section is actually disabled, YouTube may return a response with
 								            # required check_get_keys missing. So we will disable that check initially in this case.
 								            continuation = self._build_api_continuation_query(self._generate_comment_continuation(video_id))
 								            is_forced_continuation = True
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 02:08:28 -05:00
+								        continuation_items_path = (
 								            'onResponseReceivedEndpoints', ..., ('reloadContinuationItemsCommand', 'appendContinuationItemsAction'), 'continuationItems')
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								        for page_num in itertools.count(0):
 								            if not continuation:
 								                break
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								            headers = self.generate_api_headers(ytcfg=ytcfg, visitor_data=self._extract_visitor_data(response))
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 02:08:28 -05:00
+								            comment_prog_str = f"({tracker['running_total']}/~{tracker['est_total']})"
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								            if page_num == 0:
 								                if is_first_continuation:
 								                    note_prefix = 'Downloading comment section API JSON'
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								                else:
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								                    note_prefix = '    Downloading comment API JSON reply thread %d %s' % (
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                        tracker['current_page_thread'], comment_prog_str)
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								            else:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                note_prefix = '{}Downloading comment{} API JSON page {} {}'.format(
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								                    '       ' if parent else '', ' replies' if parent else '',
 								                    page_num, comment_prog_str)
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 02:08:28 -05:00
 								            # Do a deep check for incomplete data as sometimes YouTube may return no comments for a continuation
 								            # Ignore check if YouTube says the comment count is 0.
 								            check_get_keys = None
 								            if not is_forced_continuation and not (tracker['est_total'] == 0 and tracker['running_total'] == 0):
 								                check_get_keys = [[*continuation_items_path, ..., (
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 09:37:30 -05:00
+								                    'commentsHeaderRenderer' if is_first_continuation else ('commentThreadRenderer', 'commentViewModel', 'commentRenderer'))]]
-												[extractor/youtube] Ignore incomplete data error for comment replies (#5490)

When --ignore-errors is used.
Closes https://github.com/yt-dlp/yt-dlp/issues/4669
Authored by: coletdjnz
											
										
										
											2022-11-10 00:35:22 -06:00
+								            try:
 								                response = self._extract_response(
 								                    item_id=None, query=continuation,
 								                    ep='next', ytcfg=ytcfg, headers=headers, note=note_prefix,
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 02:08:28 -05:00
+								                    check_get_keys=check_get_keys)
-												[extractor/youtube] Ignore incomplete data error for comment replies (#5490)

When --ignore-errors is used.
Closes https://github.com/yt-dlp/yt-dlp/issues/4669
Authored by: coletdjnz
											
										
										
											2022-11-10 00:35:22 -06:00
+								            except ExtractorError as e:
 								                # Ignore incomplete data error for replies if retries didn't work.
 								                # This is to allow any other parent comments and comment threads to be downloaded.
 								                # See: https://github.com/yt-dlp/yt-dlp/issues/4669
-												[extractor/youtube] Ignore incomplete data for comment threads by default (#7475)

For both `--ignore-errors` and `--ignore-errors only_download`. Pass `--no-ignore-errors` to not ignore.

Closes https://github.com/yt-dlp/yt-dlp/issues/7474

Authored by: coletdjnz
											
										
										
											2023-07-03 05:47:10 -05:00
+								                if 'incomplete data' in str(e).lower() and parent:
 								                    if self.get_param('ignoreerrors') in (True, 'only_download'):
 								                        self.report_warning(
 								                            'Received incomplete data for a comment reply thread and retrying did not help. '
 								                            'Ignoring to let other comments be downloaded. Pass --no-ignore-errors to not ignore.')
 								                        return
 								                    else:
 								                        raise ExtractorError(
 								                            'Incomplete data received for comment reply thread. '
 								                            'Pass --ignore-errors to ignore and allow rest of comments to download.',
 								                            expected=True)
 								                raise
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 01:46:28 -05:00
+								            is_forced_continuation = False
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								            continuation = None
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 09:37:30 -05:00
+								            mutations = traverse_obj(response, ('frameworkUpdates', 'entityBatchUpdate', 'mutations', ..., {dict}))
-												[extractor/youtube] Fix continuation loop with no comments (#7148)

Deep check the response for incomplete data.

Authored by: coletdjnz

											
										
										
											2023-05-31 02:08:28 -05:00
+								            for continuation_items in traverse_obj(response, continuation_items_path, expected_type=list, default=[]):
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                if is_first_continuation:
 								                    continuation = extract_header(continuation_items)
 								                    is_first_continuation = False
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								                    if continuation:
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								                        break
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                    continue
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
-												[ie/youtube] Fix comments extraction (#9775)

Closes #9358
Authored by: jakeogh, minamotorin, shoxie007, bbilly1

Co-authored-by: minamotorin <76122224+minamotorin@users.noreply.github.com>
Co-authored-by: shoxie007 <74592022+shoxie007@users.noreply.github.com>
Co-authored-by: Simon <35427372+bbilly1@users.noreply.github.com>
											
										
										
											2024-05-17 09:37:30 -05:00
+								                for entry in extract_thread(continuation_items, mutations):
-												[youtube:comments] Add more options for limiting number of comments extracted (#1626)

Extends `max_comments` extractor arg to support `max-parents,max-replies,max-replies-per-thread`.
Authored-by: coletdjnz
											
										
										
											2021-12-14 22:29:48 -06:00
+								                    if not entry:
 								                        return
 								                    yield entry
 								                continuation = self._extract_continuation({'contents': continuation_items})
 								                if continuation:
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								                    break
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 01:46:28 -05:00
+								        message = self._get_text(root_continuation_data, ('contents', ..., 'messageRenderer', 'text'), max_runs=1)
 								        if message and not parent and tracker['running_total'] == 0:
 								            self.report_warning(f'Youtube said: {message}', video_id=video_id, only_once=True)
-												[extractor/youtube] Differentiate between no and disabled comments (#5491)

`comments` and `comment_count` will be set to None, as opposed to 
an empty list and 0, respectively.

Fixes https://github.com/yt-dlp/yt-dlp/issues/5068

Authored by: coletdjnz, pukkandan
											
										
										
											2022-11-09 21:33:03 -06:00
+								            raise self.CommentsDisabled
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 01:46:28 -05:00
 								    @staticmethod
 								    def _generate_comment_continuation(video_id):
 								        """
 								        Generates initial comment section continuation token from given video id
 								        """
 								        token = f'\x12\r\x12\x0b{video_id}\x18\x062\'"\x11"\x0b{video_id}0\x00x\x020\x00B\x10comments-section'
 								        return base64.b64encode(token.encode()).decode()
-												[extractor] Generalize `getcomments` implementation

											
										
										
											2021-10-12 04:50:50 -05:00
+								    def _get_comments(self, ytcfg, video_id, contents, webpage):
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
+								        """Entry for comment extraction"""
-												[youtube:comments] Move comment extraction to new API (#466)

Closes #438, #481, #485 

Authored by: colethedj
											
										
										
											2021-07-11 18:18:40 -05:00
+								        def _real_comment_extract(contents):
-												[youtube:comments] Fix comment section not being extracted in new layouts (#1324)

Co-authored-by: coletdjnz, pukkandan
											
										
										
											2021-10-17 21:58:42 -05:00
+								            renderer = next((
 								                item for item in traverse_obj(contents, (..., 'itemSectionRenderer'), default={})
 								                if item.get('sectionIdentifier') == 'comment-item-section'), None)
 								            yield from self._comment_entries(renderer, ytcfg, video_id)
-												[youtube] Cleanup authentication code (#786)

Authored by: coletdjnz
											
										
										
											2021-09-23 19:52:17 -05:00
-												[extractor] Generalize `getcomments` implementation

											
										
										
											2021-10-12 04:50:50 -05:00
+								        max_comments = int_or_none(self._configuration_arg('max_comments', [''])[0])
 								        return itertools.islice(_real_comment_extract(contents), 0, max_comments)
-												[Youtube] Rewrite comment extraction (#167)

Closes #121

TODO:
* Add an option for the user to specify newest/popular and max number of comments
* Refactor the download code and generalize with TabIE
* Parse time_text to timestamp

											
										
										
											2021-03-14 17:41:11 -05:00
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								    @staticmethod
-												[youtube] Cleanup authentication code (#786)

Authored by: coletdjnz
											
										
										
											2021-09-23 19:52:17 -05:00
+								    def _get_checkok_params():
 								        return {'contentCheckOk': True, 'racyCheckOk': True}
 								    @classmethod
 								    def _generate_player_context(cls, sts=None):
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								        context = {
 								            'html5Preference': 'HTML5_PREF_WANTS',
 								        }
 								        if sts is not None:
 								            context['signatureTimestamp'] = sts
 								        return {
 								            'playbackContext': {
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                'contentPlaybackContext': context,
-												[youtube] Fix controversial videos when requested via API (#533)

Closes: https://github.com/yt-dlp/yt-dlp/issues/511#issuecomment-883024350
Authored by: colethedj
											
										
										
											2021-07-20 13:01:28 -05:00
+								            },
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            **cls._get_checkok_params(),
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								        }
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								    def _get_config_po_token(self, client: str, context: _PoTokenContext):
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								        po_token_strs = self._configuration_arg('po_token', [], ie_key=YoutubeIE, casesense=True)
 								        for token_str in po_token_strs:
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            po_token_meta, sep, po_token = token_str.partition('+')
 								            if not sep:
 								                self.report_warning(
 								                    f'Invalid po_token configuration format. '
 								                    f'Expected "CLIENT.CONTEXT+PO_TOKEN", got "{token_str}"', only_once=True)
 								                continue
 								            po_token_client, sep, po_token_context = po_token_meta.partition('.')
 								            if po_token_client.lower() != client:
 								                continue
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            if not sep:
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								                # TODO(future): deprecate the old format?
 								                self.write_debug(
 								                    f'po_token configuration for {client} client is missing a context; assuming GVS. '
 								                    'You can provide a context with the format "CLIENT.CONTEXT+PO_TOKEN"',
 								                    only_once=True)
 								                po_token_context = _PoTokenContext.GVS.value
 								            if po_token_context.lower() != context.value:
 								                continue
 								            # Clean and validate the PO Token. This will strip invalid characters off
 								            # (e.g. additional url params the user may accidentally include)
 								            try:
 								                return base64.urlsafe_b64encode(base64.urlsafe_b64decode(urllib.parse.unquote(po_token))).decode()
 								            except (binascii.Error, ValueError):
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                self.report_warning(
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								                    f'Invalid po_token configuration for {client} client: '
 								                    f'{po_token_context} PO Token should be a base64url-encoded string.',
 								                    only_once=True)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                continue
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								    def fetch_po_token(self, client='web', context=_PoTokenContext.GVS, ytcfg=None, visitor_data=None,
 								                       data_sync_id=None, session_index=None, player_url=None, video_id=None, **kwargs):
 								        """
 								        Fetch a PO Token for a given client and context. This function will validate required parameters for a given context and client.
 								        EXPERIMENTAL: This method is unstable and may change or be removed without notice.
 								        @param client: The client to fetch the PO Token for.
 								        @param context: The context in which the PO Token is used.
 								        @param ytcfg: The ytcfg for the client.
 								        @param visitor_data: visitor data.
 								        @param data_sync_id: data sync ID.
 								        @param session_index: session index.
 								        @param player_url: player URL.
 								        @param video_id: video ID.
 								        @param kwargs: Additional arguments to pass down. May be more added in the future.
 								        @return: The fetched PO Token. None if it could not be fetched.
 								        """
 								        # GVS WebPO Token is bound to visitor_data / Visitor ID when logged out.
 								        # Must have visitor_data for it to function.
 								        if player_url and context == _PoTokenContext.GVS and not visitor_data and not self.is_authenticated:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            self.report_warning(
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								                f'Unable to fetch GVS PO Token for {client} client: Missing required Visitor Data. '
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                f'You may need to pass Visitor Data with --extractor-args "youtube:visitor_data=XXX"')
 								            return
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								        if context == _PoTokenContext.PLAYER and not video_id:
 								            self.report_warning(
 								                f'Unable to fetch Player PO Token for {client} client: Missing required Video ID')
 								            return
 								        config_po_token = self._get_config_po_token(client, context)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								        if config_po_token:
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            # GVS WebPO token is bound to data_sync_id / account Session ID when logged in.
 								            if player_url and context == _PoTokenContext.GVS and not data_sync_id and self.is_authenticated:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                self.report_warning(
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								                    f'Got a GVS PO Token for {client} client, but missing Data Sync ID for account. Formats may not work.'
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                    f'You may need to pass a Data Sync ID with --extractor-args "youtube:data_sync_id=XXX"')
 								            return config_po_token
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								        # Require GVS WebPO Token if logged in for external fetching
 								        if player_url and context == _PoTokenContext.GVS and not data_sync_id and self.is_authenticated:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            self.report_warning(
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								                f'Unable to fetch GVS PO Token for {client} client: Missing required Data Sync ID for account. '
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                f'You may need to pass a Data Sync ID with --extractor-args "youtube:data_sync_id=XXX"')
 								            return
 								        return self._fetch_po_token(
 								            client=client,
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            context=context.value,
 								            ytcfg=ytcfg,
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            visitor_data=visitor_data,
 								            data_sync_id=data_sync_id,
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            session_index=session_index,
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            player_url=player_url,
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            video_id=video_id,
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            **kwargs,
 								        )
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								    def _fetch_po_token(self, client, **kwargs):
 								        """(Unstable) External PO Token fetch stub"""
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 16:13:46 -05:00
+								    @staticmethod
 								    def _is_agegated(player_response):
 								        if traverse_obj(player_response, ('playabilityStatus', 'desktopLegacyAgeGateReason')):
-												[youtube] Improve age-gate detection (#577)

Authored by: colethedj

											
										
										
											2021-07-29 00:23:56 -05:00
+								            return True
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 16:13:46 -05:00
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								        reasons = traverse_obj(player_response, ('playabilityStatus', ('status', 'reason')))
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 16:13:46 -05:00
+								        AGE_GATE_REASONS = (
 								            'confirm your age', 'age-restricted', 'inappropriate',  # reason
 								            'age_verification_required', 'age_check_required',  # status
 								        )
 								        return any(expected in reason for expected in AGE_GATE_REASONS for reason in reasons)
 								    @staticmethod
 								    def _is_unplayable(player_response):
 								        return traverse_obj(player_response, ('playabilityStatus', 'status')) == 'UNPLAYABLE'
-												[youtube] Improve age-gate detection (#577)

Authored by: colethedj

											
										
										
											2021-07-29 00:23:56 -05:00
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								    def _extract_player_response(self, client, video_id, master_ytcfg, player_ytcfg, player_url, initial_pr, visitor_data, data_sync_id, po_token):
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        headers = self.generate_api_headers(
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            ytcfg=player_ytcfg,
 								            default_client=client,
 								            visitor_data=visitor_data,
 								            session_index=self._extract_session_index(master_ytcfg, player_ytcfg),
-												[ie/youtube] Refactor cookie auth (#11989)

Authored by: coletdjnz
											
										
										
											2025-01-11 20:02:57 -06:00
+								            delegated_session_id=(
 								                self._parse_data_sync_id(data_sync_id)[0]
 								                or self._extract_delegated_session_id(master_ytcfg, initial_pr, player_ytcfg)
 								            ),
 								            user_session_id=(
 								                self._parse_data_sync_id(data_sync_id)[1]
 								                or self._extract_user_session_id(master_ytcfg, initial_pr, player_ytcfg)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            ),
 								        )
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-15 09:38:47 -05:00
-												[youtube] Add YoutubeStoriesIE (#3362)

Get channel stories with `ytstories:<channel UCID>`

Authored-by: coletdjnz
											
										
										
											2022-05-01 01:46:28 -05:00
+								        yt_query = {
 								            'videoId': video_id,
 								        }
-												[ie/youtube] Add `player_params` extractor arg (#7719)

Authored by: coletdjnz
											
										
										
											2023-07-29 01:20:42 -05:00
-												[ie/youtube] Player client maintenance (#10573)

- Add clients: android_producer, android_testsuite, android_vr, tv, web_safari
- Remove obsolete clients: android_embedded, ios_embedded, *_embedscreen

Authored by: bashonly
											
										
										
											2024-07-30 16:27:06 -05:00
+								        default_pp = traverse_obj(
 								            INNERTUBE_CLIENTS, (_split_innertube_client(client)[0], 'PLAYER_PARAMS', {str}))
 								        if player_params := self._configuration_arg('player_params', [default_pp], casesense=True)[0]:
 								            yt_query['params'] = player_params
-												[extractor/youtube] Use device-specific user agent (#4770)

Thwart latest fingerprinting attempt (see https://github.com/iv-org/invidious/issues/3230#issuecomment-1226887639)

Authored by: coletdjnz
											
										
										
											2022-08-28 17:59:54 -05:00
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								        if po_token:
 								            yt_query['serviceIntegrityDimensions'] = {'poToken': po_token}
 								        sts = self._extract_signature_timestamp(video_id, player_url, master_ytcfg, fatal=False) if player_url else None
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        yt_query.update(self._generate_player_context(sts))
 								        return self._extract_response(
 								            item_id=video_id, ep='player', query=yt_query,
-												[youtube] Raise appropriate error when API pages can't be downloaded

											
										
										
											2021-08-07 01:45:58 -05:00
+								            ytcfg=player_ytcfg, headers=headers, fatal=True,
-												[youtube] simplify and de-duplicate client definitions (#577)

											
										
										
											2021-07-30 14:45:04 -05:00
+								            default_client=client,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            note='Downloading {} player API JSON'.format(client.replace('_', ' ').strip()),
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        ) or None
 								    def _get_requested_clients(self, url, smuggled_data):
-												[youtube] Add `player_client=all`

											
										
										
											2021-07-25 16:55:53 -05:00
+								        requested_clients = []
-												[ie/youtube] Support excluding `player_client`s in extractor-arg (#10710)

Closes #10699
Authored by: bashonly
											
										
										
											2024-08-12 04:12:46 -05:00
+								        excluded_clients = []
-												[ie/youtube] Adjust player clients for site changes (#11663)

Closes #11640
Authored by: bashonly
											
										
										
											2024-12-01 09:25:09 -06:00
+								        default_clients = self._DEFAULT_AUTHED_CLIENTS if self.is_authenticated else self._DEFAULT_CLIENTS
-												[youtube] simplify and de-duplicate client definitions (#577)

											
										
										
											2021-07-30 14:45:04 -05:00
+								        allowed_clients = sorted(
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            (client for client in INNERTUBE_CLIENTS if client[:1] != '_'),
-												[youtube] simplify and de-duplicate client definitions (#577)

											
										
										
											2021-07-30 14:45:04 -05:00
+								            key=lambda client: INNERTUBE_CLIENTS[client]['priority'], reverse=True)
-												[youtube] Add `player_client=all`

											
										
										
											2021-07-25 16:55:53 -05:00
+								        for client in self._configuration_arg('player_client'):
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-17 11:03:02 -05:00
+								            if client == 'default':
-												[ie/youtube] Adjust player clients for site changes (#11663)

Closes #11640
Authored by: bashonly
											
										
										
											2024-12-01 09:25:09 -06:00
+								                requested_clients.extend(default_clients)
-												[youtube] Add `player_client=all`

											
										
										
											2021-07-25 16:55:53 -05:00
+								            elif client == 'all':
 								                requested_clients.extend(allowed_clients)
-												[ie/youtube] Support excluding `player_client`s in extractor-arg (#10710)

Closes #10699
Authored by: bashonly
											
										
										
											2024-08-12 04:12:46 -05:00
+								            elif client.startswith('-'):
 								                excluded_clients.append(client[1:])
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-17 11:03:02 -05:00
+								            elif client not in allowed_clients:
-												[ie/youtube] Support excluding `player_client`s in extractor-arg (#10710)

Closes #10699
Authored by: bashonly
											
										
										
											2024-08-12 04:12:46 -05:00
+								                self.report_warning(f'Skipping unsupported client "{client}"')
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-17 11:03:02 -05:00
+								            else:
 								                requested_clients.append(client)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        if not requested_clients:
-												[ie/youtube] Adjust player clients for site changes (#11663)

Closes #11640
Authored by: bashonly
											
										
										
											2024-12-01 09:25:09 -06:00
+								            requested_clients.extend(default_clients)
-												[ie/youtube] Support excluding `player_client`s in extractor-arg (#10710)

Closes #10699
Authored by: bashonly
											
										
										
											2024-08-12 04:12:46 -05:00
+								        for excluded_client in excluded_clients:
 								            if excluded_client in requested_clients:
 								                requested_clients.remove(excluded_client)
 								        if not requested_clients:
 								            raise ExtractorError('No player clients have been requested', expected=True)
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
-												[ie/youtube] Adjust player clients for site changes (#11663)

Closes #11640
Authored by: bashonly
											
										
										
											2024-12-01 09:25:09 -06:00
+								        if self.is_authenticated:
-												[ie/youtube] Restore convenience workarounds (#12181)

Authored by: bashonly
											
										
										
											2025-01-25 10:18:15 -06:00
+								            if (smuggled_data.get('is_music_url') or self.is_music_url(url)) and 'web_music' not in requested_clients:
 								                requested_clients.append('web_music')
-												[ie/youtube] Adjust player clients for site changes (#11663)

Closes #11640
Authored by: bashonly
											
										
										
											2024-12-01 09:25:09 -06:00
+								            unsupported_clients = [
 								                client for client in requested_clients if not INNERTUBE_CLIENTS[client]['SUPPORTS_COOKIES']
 								            ]
 								            for client in unsupported_clients:
 								                self.report_warning(f'Skipping client "{client}" since it does not support cookies', only_once=True)
 								                requested_clients.remove(client)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        return orderedSet(requested_clients)
-												[youtube] Add support for multifeed videos

											
										
										
											2015-07-25 10:30:34 -05:00
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-24 17:20:22 -06:00
+								    def _invalid_player_response(self, pr, video_id):
 								        # YouTube may return a different video player response than expected.
 								        # See: https://github.com/TeamNewPipe/NewPipe/issues/8713
 								        if (pr_id := traverse_obj(pr, ('videoDetails', 'videoId'))) != video_id:
 								            return pr_id
-												[extractor/youtube] Use device-specific user agent (#4770)

Thwart latest fingerprinting attempt (see https://github.com/iv-org/invidious/issues/3230#issuecomment-1226887639)

Authored by: coletdjnz
											
										
										
											2022-08-28 17:59:54 -05:00
+								    def _extract_player_responses(self, clients, video_id, webpage, master_ytcfg, smuggled_data):
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								        initial_pr = None
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        if webpage:
-												[ie/youtube] Fix initial player response usage (Bugfix for 8b8b442cb005a8d85315f301615f83fb736b967a) (#10464)

Authored by: seproDev
											
										
										
											2024-07-14 13:42:11 -05:00
+								            initial_pr = self._search_json(
 								                self._YT_INITIAL_PLAYER_RESPONSE_RE, webpage, 'initial player response', video_id, fatal=False)
-												[youtube] Skip broken multifeed videos (closes #24711)

											
										
										
											2020-04-09 10:42:43 -05:00
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-24 17:20:22 -06:00
+								        prs = []
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								        deprioritized_prs = []
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-24 17:20:22 -06:00
+								        if initial_pr and not self._invalid_player_response(initial_pr, video_id):
 								            # Android player_response does not have microFormats which are needed for
 								            # extraction of some data. So we return the initial_pr with formats
 								            # stripped out even if not requested by the user
 								            # See: https://github.com/yt-dlp/yt-dlp/issues/501
 								            prs.append({**initial_pr, 'streamingData': None})
-												[youtube] Try embedded client variants before agegate

agegate variants appears to be broken, but don't remove them for the time-being

											
										
										
											2022-03-24 18:30:41 -05:00
+								        all_clients = set(clients)
-												[YouTube] Age-gate bypass implementation (#575)

* Calling the API with `clientScreen=EMBED` allows access to most age-gated videos - discovered by @ccdffddfddfdsfedeee (https://github.com/yt-dlp/yt-dlp/issues/574#issuecomment-887171136)
* Adds clients: (web/android/ios)_(embedded/agegate), mweb_embedded
* Renamed mobile_web to mweb

Closes #574

Authored by pukkandan, MinePlayersPE
											
										
										
											2021-07-27 04:40:44 -05:00
+								        clients = clients[::-1]
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 16:13:46 -05:00
-												[youtube] Try embedded client variants before agegate

agegate variants appears to be broken, but don't remove them for the time-being

											
										
										
											2022-03-24 18:30:41 -05:00
+								        def append_client(*client_names):
-												[YouTube] Add new age-gate bypass (#3233)

Closes #3182
Authored by: zerodytrash, pukkandan
											
										
										
											2022-03-29 05:05:31 -05:00
+								            """ Append the first client name that exists but not already used """
-												[youtube] Try embedded client variants before agegate

agegate variants appears to be broken, but don't remove them for the time-being

											
										
										
											2022-03-24 18:30:41 -05:00
+								            for client_name in client_names:
-												[YouTube] Add new age-gate bypass (#3233)

Closes #3182
Authored by: zerodytrash, pukkandan
											
										
										
											2022-03-29 05:05:31 -05:00
+								                actual_client = _split_innertube_client(client_name)[0]
 								                if actual_client in INNERTUBE_CLIENTS:
 								                    if actual_client not in all_clients:
-												[youtube] Try embedded client variants before agegate

agegate variants appears to be broken, but don't remove them for the time-being

											
										
										
											2022-03-24 18:30:41 -05:00
+								                        clients.append(client_name)
-												[YouTube] Add new age-gate bypass (#3233)

Closes #3182
Authored by: zerodytrash, pukkandan
											
										
										
											2022-03-29 05:05:31 -05:00
+								                        all_clients.add(actual_client)
 								                        return
-												[youtube] Add age-gate bypass for unverified accounts (#600)

Adds `_creator` variants for each client

Authored by: zerodytrash, colethedj, pukkandan
											
										
										
											2021-08-01 16:13:46 -05:00
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								        tried_iframe_fallback = False
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								        player_url = visitor_data = data_sync_id = None
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-24 17:20:22 -06:00
+								        skipped_clients = {}
-												[YouTube] Age-gate bypass implementation (#575)

* Calling the API with `clientScreen=EMBED` allows access to most age-gated videos - discovered by @ccdffddfddfdsfedeee (https://github.com/yt-dlp/yt-dlp/issues/574#issuecomment-887171136)
* Adds clients: (web/android/ios)_(embedded/agegate), mweb_embedded
* Renamed mobile_web to mweb

Closes #574

Authored by pukkandan, MinePlayersPE
											
										
										
											2021-07-27 04:40:44 -05:00
+								        while clients:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            deprioritize_pr = False
-												[YouTube] Add new age-gate bypass (#3233)

Closes #3182
Authored by: zerodytrash, pukkandan
											
										
										
											2022-03-29 05:05:31 -05:00
+								            client, base_client, variant = _split_innertube_client(clients.pop())
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            player_ytcfg = master_ytcfg if client == 'web' else {}
 								            if 'configs' not in self._configuration_arg('player_skip') and client != 'web':
-												[youtube, cleanup] Minor refactoring

Authored by: coletdjnz, pukkandan

											
										
										
											2022-04-09 14:30:21 -05:00
+								                player_ytcfg = self._download_ytcfg(client, video_id) or player_ytcfg
-												[YouTube] Age-gate bypass implementation (#575)

* Calling the API with `clientScreen=EMBED` allows access to most age-gated videos - discovered by @ccdffddfddfdsfedeee (https://github.com/yt-dlp/yt-dlp/issues/574#issuecomment-887171136)
* Adds clients: (web/android/ios)_(embedded/agegate), mweb_embedded
* Renamed mobile_web to mweb

Closes #574

Authored by pukkandan, MinePlayersPE
											
										
										
											2021-07-27 04:40:44 -05:00
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								            player_url = player_url or self._extract_player_url(master_ytcfg, player_ytcfg, webpage=webpage)
 								            require_js_player = self._get_default_ytcfg(client).get('REQUIRE_JS_PLAYER')
 								            if 'js' in self._configuration_arg('player_skip'):
 								                require_js_player = False
 								                player_url = None
 								            if not player_url and not tried_iframe_fallback and require_js_player:
 								                player_url = self._download_player_url(video_id)
 								                tried_iframe_fallback = True
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            visitor_data = visitor_data or self._extract_visitor_data(master_ytcfg, initial_pr, player_ytcfg)
 								            data_sync_id = data_sync_id or self._extract_data_sync_id(master_ytcfg, initial_pr, player_ytcfg)
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            fetch_po_token_args = {
 								                'client': client,
 								                'visitor_data': visitor_data,
 								                'video_id': video_id,
 								                'data_sync_id': data_sync_id if self.is_authenticated else None,
 								                'player_url': player_url if require_js_player else None,
 								                'session_index': self._extract_session_index(master_ytcfg, player_ytcfg),
 								                'ytcfg': player_ytcfg,
 								            }
 								            player_po_token = self.fetch_po_token(
 								                context=_PoTokenContext.PLAYER, **fetch_po_token_args)
 								            gvs_po_token = self.fetch_po_token(
 								                context=_PoTokenContext.GVS, **fetch_po_token_args)
 								            required_pot_contexts = self._get_default_ytcfg(client)['PO_TOKEN_REQUIRED_CONTEXTS']
 								            if (
 								                not player_po_token
 								                and _PoTokenContext.PLAYER in required_pot_contexts
 								            ):
 								                # TODO: may need to skip player response request. Unsure yet..
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                self.report_warning(
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								                    f'No Player PO Token provided for {client} client, '
 								                    f'which may be required for working {client} formats. This client will be deprioritized'
 								                    f'You can manually pass a Player PO Token for this client with --extractor-args "youtube:po_token={client}.player+XXX". '
 								                    f'For more information, refer to {PO_TOKEN_GUIDE_URL} .', only_once=True)
 								                deprioritize_pr = True
 								            if (
 								                not gvs_po_token
 								                and _PoTokenContext.GVS in required_pot_contexts
 								                and 'missing_pot' in self._configuration_arg('formats')
 								            ):
 								                # note: warning with help message is provided later during format processing
 								                self.report_warning(
 								                    f'No GVS PO Token provided for {client} client, '
 								                    f'which may be required for working {client} formats. This client will be deprioritized',
 								                    only_once=True)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                deprioritize_pr = True
 								            pr = initial_pr if client == 'web' else None
 								            try:
 								                pr = pr or self._extract_player_response(
 								                    client, video_id,
 								                    master_ytcfg=player_ytcfg or master_ytcfg,
 								                    player_ytcfg=player_ytcfg,
 								                    player_url=player_url,
 								                    initial_pr=initial_pr,
 								                    visitor_data=visitor_data,
 								                    data_sync_id=data_sync_id,
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								                    po_token=player_po_token)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            except ExtractorError as e:
 								                self.report_warning(e)
-												[youtube] Raise appropriate error when API pages can't be downloaded

											
										
										
											2021-08-07 01:45:58 -05:00
+								                continue
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-24 17:20:22 -06:00
+								            if pr_id := self._invalid_player_response(pr, video_id):
 								                skipped_clients[client] = pr_id
 								            elif pr:
 								                # Save client name for introspection later
 								                sd = traverse_obj(pr, ('streamingData', {dict})) or {}
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                sd[STREAMING_DATA_CLIENT_NAME] = client
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								                sd[STREAMING_DATA_INITIAL_PO_TOKEN] = gvs_po_token
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-24 17:20:22 -06:00
+								                for f in traverse_obj(sd, (('formats', 'adaptiveFormats'), ..., {dict})):
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                    f[STREAMING_DATA_CLIENT_NAME] = client
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								                    f[STREAMING_DATA_INITIAL_PO_TOKEN] = gvs_po_token
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                if deprioritize_pr:
 								                    deprioritized_prs.append(pr)
 								                else:
 								                    prs.append(pr)
-												[YouTube] Age-gate bypass implementation (#575)

* Calling the API with `clientScreen=EMBED` allows access to most age-gated videos - discovered by @ccdffddfddfdsfedeee (https://github.com/yt-dlp/yt-dlp/issues/574#issuecomment-887171136)
* Adds clients: (web/android/ios)_(embedded/agegate), mweb_embedded
* Renamed mobile_web to mweb

Closes #574

Authored by pukkandan, MinePlayersPE
											
										
										
											2021-07-27 04:40:44 -05:00
-												[ie/youtube] Restore convenience workarounds (#12181)

Authored by: bashonly
											
										
										
											2025-01-25 10:18:15 -06:00
+								            # EU countries require age-verification for accounts to access age-restricted videos
 								            # If account is not age-verified, _is_agegated() will be truthy for non-embedded clients
 								            if self.is_authenticated and self._is_agegated(pr):
 								                self.to_screen(
 								                    f'{video_id}: This video is age-restricted and YouTube is requiring '
 								                    'account age-verification; some formats may be missing', only_once=True)
 								                # tv_embedded can work around the age-verification requirement for embeddable videos
 								                # web_creator may work around age-verification for all videos but requires PO token
 								                append_client('tv_embedded', 'web_creator')
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								        prs.extend(deprioritized_prs)
-												[ie/youtube] Better error when all player responses are skipped (#9083)

Authored by: Grub4K, pukkandan

Co-authored-by: pukkandan <pukkandan.ytdlp@gmail.com>
											
										
										
											2024-02-24 17:20:22 -06:00
+								        if skipped_clients:
 								            self.report_warning(
 								                f'Skipping player responses from {"/".join(skipped_clients)} clients '
 								                f'(got player responses for video "{"/".join(set(skipped_clients.values()))}" instead of "{video_id}")')
 								            if not prs:
 								                raise ExtractorError(
 								                    'All player responses are invalid. Your IP is likely being blocked by Youtube', expected=True)
 								        elif not prs:
 								            raise ExtractorError('Failed to extract any player response')
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								        return prs, player_url
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								    def _needs_live_processing(self, live_status, duration):
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 09:29:30 -06:00
+								        if ((live_status == 'is_live' and self.get_param('live_from_start'))
 								                or (live_status == 'post_live' and (duration or 0) > 2 * 3600)):
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            return live_status
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-23 17:03:28 -06:00
def _report_pot_format_skipped(self, video_id, client_name, proto):
    """Notify that `proto` formats of `client_name` lack a GVS PO Token.

    The same message is always built; only the channel differs:
    clients listed in `_DEFAULT_CLIENTS` or `_DEFAULT_AUTHED_CLIENTS` get a
    debug message, every other client gets a warning. Either way the
    message is emitted with `only_once=True`.
    """
    notice = ''.join((
        f'{video_id}: {client_name} client {proto} formats require a GVS PO Token which was not provided. ',
        'They will be skipped as they may yield HTTP Error 403. ',
        f'You can manually pass a GVS PO Token for this client with --extractor-args "youtube:po_token={client_name}.gvs+XXX". ',
        f'For more information, refer to  {PO_TOKEN_GUIDE_URL} . ',
        'To enable these broken formats anyway, pass --extractor-args "youtube:formats=missing_pot"',
    ))
    # Only raise a warning for non-default clients, to not confuse users.
    # iOS HLS formats still work without PO Token, so we don't need to warn about them.
    default_clients = (*self._DEFAULT_CLIENTS, *self._DEFAULT_AUTHED_CLIENTS)
    emit = self.write_debug if client_name in default_clients else self.report_warning
    emit(notice, only_once=True)
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								    def _extract_formats_and_subtitles(self, streaming_data, video_id, player_url, live_status, duration):
-												Fix 2a23d92d9ec44a0168079e38bcf3d383e5c4c7bb

Closes #6517

											
										
										
											2023-03-12 04:16:09 -05:00
+								        CHUNK_SIZE = 10 << 20
-												[ie/youtube] Extract all formats from multi-language m3u8s (#9875)

Authored by: clienthax, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-06-20 16:54:53 -05:00
+								        PREFERRED_LANG_VALUE = 10
 								        original_language = None
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-14 17:53:32 -06:00
+								        itags, stream_ids = collections.defaultdict(set), []
-												[extractor/youtube] Fix bug in format sorting

											
										
										
											2022-08-20 14:26:27 -05:00
+								        itag_qualities, res_qualities = {}, {0: None}
-												[youtube] Sort audio-only formats correctly
Closes #317

											
										
										
											2021-05-17 14:41:57 -05:00
+								        q = qualities([
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-25 17:03:42 -05:00
+								            # Normally tiny is the smallest video-only formats. But
 								            # audio-only formats with unknown quality may get tagged as tiny
 								            'tiny',
 								            'audio_quality_ultralow', 'audio_quality_low', 'audio_quality_medium', 'audio_quality_high',  # Audio only formats
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            'small', 'medium', 'large', 'hd720', 'hd1080', 'hd1440', 'hd2160', 'hd2880', 'highres',
-												[youtube] Sort audio-only formats correctly
Closes #317

											
										
										
											2021-05-17 14:41:57 -05:00
+								        ])
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								        streaming_formats = traverse_obj(streaming_data, (..., ('formats', 'adaptiveFormats'), ...))
-												[extractor/youtube] Add extractor-arg `formats`

Closes #7417

											
										
										
											2023-06-25 09:40:00 -05:00
+								        format_types = self._configuration_arg('formats')
 								        all_formats = 'duplicate' in format_types
 								        if self._configuration_arg('include_duplicate_formats'):
 								            all_formats = True
 								            self._downloader.deprecated_feature('[youtube] include_duplicate_formats extractor argument is deprecated. '
 								                                                'Use formats=duplicate extractor argument instead')
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-15 09:38:47 -05:00
-												Fix 2a23d92d9ec44a0168079e38bcf3d383e5c4c7bb

Closes #6517

											
										
										
											2023-03-12 04:16:09 -05:00
+								        def build_fragments(f):
 								            return LazyList({
 								                'url': update_url_query(f['url'], {
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                    'range': f'{range_start}-{min(range_start + CHUNK_SIZE - 1, f["filesize"])}',
 								                }),
-												Fix 2a23d92d9ec44a0168079e38bcf3d383e5c4c7bb

Closes #6517

											
										
										
											2023-03-12 04:16:09 -05:00
+								            } for range_start in range(0, f['filesize'], CHUNK_SIZE))
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        for fmt in streaming_formats:
-												[ie/youtube] Warn on missing formats due to SSAP (#12483)

See https://github.com/yt-dlp/yt-dlp/issues/12482

Authored by: coletdjnz
											
										
										
											2025-02-28 00:33:31 -06:00
+								            client_name = fmt[STREAMING_DATA_CLIENT_NAME]
-												[youtube] Detect DRM better

Authored by: shirt-dev

											
										
										
											2022-03-27 00:28:26 -05:00
+								            if fmt.get('targetDurationSec'):
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                continue
-												check live chat replay existence

											
										
										
											2020-08-04 19:30:10 -05:00
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								            itag = str_or_none(fmt.get('itag'))
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-15 09:38:47 -05:00
+								            audio_track = fmt.get('audioTrack') or {}
-												[extractor/youtube] Extract DRC formats

											
										
										
											2022-12-30 04:02:33 -06:00
+								            stream_id = (itag, audio_track.get('id'), fmt.get('isDrc'))
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 11:43:02 -06:00
+								            if not all_formats:
 								                if stream_id in stream_ids:
 								                    continue
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-15 09:38:47 -05:00
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								            quality = fmt.get('quality')
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-25 17:03:42 -05:00
+								            height = int_or_none(fmt.get('height'))
-												[youtube] Sort audio-only formats correctly
Closes #317

											
										
										
											2021-05-17 14:41:57 -05:00
+								            if quality == 'tiny' or not quality:
 								                quality = fmt.get('audioQuality', '').lower() or quality
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-25 17:03:42 -05:00
+								            # The 3gp format (17) in android client has a quality of "small",
 								            # but is actually worse than other formats
 								            if itag == '17':
 								                quality = 'tiny'
 								            if quality:
 								                if itag:
 								                    itag_qualities[itag] = quality
 								                if height:
 								                    res_qualities[height] = quality
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
-												[ie/youtube] Prioritize original language over auto-dubbed audio (#11803)

Closes #11753
Authored by: bashonly
											
										
										
											2024-12-13 04:21:48 -06:00
+								            display_name = audio_track.get('displayName') or ''
 								            is_original = 'original' in display_name.lower()
 								            is_descriptive = 'descriptive' in display_name.lower()
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								            is_default = audio_track.get('audioIsDefault')
 								            language_code = audio_track.get('id', '').split('.')[0]
-												[ie/youtube] Prioritize original language over auto-dubbed audio (#11803)

Closes #11753
Authored by: bashonly
											
										
										
											2024-12-13 04:21:48 -06:00
+								            if language_code and (is_original or (is_default and not original_language)):
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								                original_language = language_code
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-15 16:28:16 -05:00
+								            has_drm = bool(fmt.get('drmFamilies'))
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								            # FORMAT_STREAM_TYPE_OTF(otf=1) requires downloading the init fragment
 								            # (adding `&sq=0` to the URL) and parsing emsg box to determine the
 								            # number of fragments that would subsequently be requested with (`&sq=N`)
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-15 16:28:16 -05:00
+								            if fmt.get('type') == 'FORMAT_STREAM_TYPE_OTF' and not has_drm:
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								                continue
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-15 16:28:16 -05:00
+								            if has_drm:
 								                msg = f'Some {client_name} client https formats have been skipped as they are DRM protected. '
 								                if client_name == 'tv':
 								                    msg += (
 								                        f'{"Your account" if self.is_authenticated else "The current session"} may have '
 								                        f'an experiment that applies DRM to all videos on the tv client. '
 								                        f'See  https://github.com/yt-dlp/yt-dlp/issues/12563  for more details.'
 								                    )
 								                self.report_warning(msg, video_id, only_once=True)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            fmt_url = fmt.get('url')
 								            if not fmt_url:
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 05:54:43 -05:00
+								                sc = urllib.parse.parse_qs(fmt.get('signatureCipher'))
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                fmt_url = url_or_none(try_get(sc, lambda x: x['url'][0]))
 								                encrypted_sig = try_get(sc, lambda x: x['s'][0])
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 13:14:36 -05:00
+								                if not all((sc, fmt_url, player_url, encrypted_sig)):
-												[ie/youtube] Warn on missing formats due to SSAP (#12483)

See https://github.com/yt-dlp/yt-dlp/issues/12482

Authored by: coletdjnz
											
										
										
											2025-02-28 00:33:31 -06:00
+								                    self.report_warning(
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-15 16:28:16 -05:00
+								                        f'Some {client_name} client https formats have been skipped as they are missing a url. '
-												[ie/youtube] Warn on missing formats due to SSAP (#12483)

See https://github.com/yt-dlp/yt-dlp/issues/12482

Authored by: coletdjnz
											
										
										
											2025-02-28 00:33:31 -06:00
+								                        f'{"Your account" if self.is_authenticated else "The current session"} may have '
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-15 16:28:16 -05:00
+								                        f'the SSAP (server-side ads) experiment which interferes with yt-dlp. '
-												[ie/youtube] Warn on missing formats due to SSAP (#12483)

See https://github.com/yt-dlp/yt-dlp/issues/12482

Authored by: coletdjnz
											
										
										
											2025-02-28 00:33:31 -06:00
+								                        f'Please see  https://github.com/yt-dlp/yt-dlp/issues/12482  for more details.',
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-15 16:28:16 -05:00
+								                        video_id, only_once=True)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                    continue
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 13:14:36 -05:00
+								                try:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                    fmt_url += '&{}={}'.format(
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 13:14:36 -05:00
+								                        traverse_obj(sc, ('sp', -1)) or 'signature',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                        self._decrypt_signature(encrypted_sig, video_id, player_url),
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 13:14:36 -05:00
+								                    )
 								                except ExtractorError as e:
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								                    self.report_warning('Signature extraction failed: Some formats may be missing',
 								                                        video_id=video_id, only_once=True)
-												[extractor/youtube] Make signature extraction non-fatal

and reduce verbosity of its warning

Closes #3882

											
										
										
											2022-05-28 13:14:36 -05:00
+								                    self.write_debug(e, only_once=True)
-												[youtube] Show format ID in signature deobfuscation -v output

											
										
										
											2014-08-01 23:35:18 -05:00
+								                    continue
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								            query = parse_qs(fmt_url)
-												[youtube] Decrypt n-sig for URLs with `ratebypass`
Closes #1796

											
										
										
											2021-11-28 06:31:46 -06:00
+								            if query.get('n'):
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								                try:
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								                    decrypt_nsig = self._cached(self._decrypt_nsig, 'nsig', query['n'][0])
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								                    fmt_url = update_url_query(fmt_url, {
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                        'n': decrypt_nsig(query['n'][0], video_id, player_url),
-												[youtube] Improve signature caching

and refactor related functions

											
										
										
											2022-08-18 10:57:41 -05:00
+								                    })
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
+								                except ExtractorError as e:
-												[docs] Improvements

* Move detailed installation instructions to https://github.com/yt-dlp/yt-dlp/wiki/Installation
* Link to wiki where applicable
* Fix some mistakes. Closes #4853, Closes #4855, Closes #4852
* Improve some error messages

											
										
										
											2022-09-07 07:05:45 -05:00
+								                    if player_url:
 								                        self.report_warning(
-												[ie/youtube] Fix nsig and signature extraction for player `643afba4` (#12684)

Closes #12677, Closes #12682
Authored by: seproDev, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2025-03-21 15:58:10 -05:00
+								                            f'nsig extraction failed: Some formats may be missing\n'
 								                            f'         n = {query["n"][0]} ; player = {player_url}',
 								                            video_id=video_id, only_once=True)
-												[docs] Improvements

* Move detailed installation instructions to https://github.com/yt-dlp/yt-dlp/wiki/Installation
* Link to wiki where applicable
* Fix some mistakes. Closes #4853, Closes #4855, Closes #4852
* Improve some error messages

											
										
										
											2022-09-07 07:05:45 -05:00
+								                        self.write_debug(e, only_once=True)
 								                    else:
 								                        self.report_warning(
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								                            'Cannot decrypt nsig without player_url: Some formats may be missing',
-												[docs] Improvements

* Move detailed installation instructions to https://github.com/yt-dlp/yt-dlp/wiki/Installation
* Link to wiki where applicable
* Fix some mistakes. Closes #4853, Closes #4855, Closes #4852
* Improve some error messages

											
										
										
											2022-09-07 07:05:45 -05:00
+								                            video_id=video_id, only_once=True)
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								                    continue
-												[youtube] Fix throttling by decrypting n-sig (#1437)


											
										
										
											2021-10-30 23:23:58 -05:00
-												[core] Fix `filesize_approx` calculation (#9560)

Reverts 22e4dfacb61f62dfbb3eb41b31c7b69ba1059b80

Despite being documented as `Kbit/s`, the extractors/manifests were returning bitrates in SI units of kilobits/sec.

Authored by: seproDev, pukkandan
											
										
										
											2024-03-31 18:17:24 -05:00
+								            tbr = float_or_none(fmt.get('averageBitrate') or fmt.get('bitrate'), 1000)
-												[cleanup] Misc (#11347)

Closes #11361
Authored by: avagordon01, bashonly, grqz, Grub4K, seproDev

Co-authored-by: Ava Gordon <avagordon01@gmail.com>
Co-authored-by: bashonly <bashonly@protonmail.com>
Co-authored-by: N/Ame <173015200+grqz@users.noreply.github.com>
Co-authored-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-11-03 18:33:21 -06:00
+								            format_duration = traverse_obj(fmt, ('approxDurationMs', {float_or_none(scale=1000)}))
-												[youtube] De-prioritize potentially damaged formats

Closes #2823

											
										
										
											2022-02-18 08:11:37 -06:00
+								            # Some formats may have much smaller duration than others (possibly damaged during encoding)
-												[docs] Consistent use of `e.g.` (#4643)

Authored by: Lesmiscore
											
										
										
											2022-08-14 07:04:13 -05:00
+								            # E.g. 2-nOtRESiUc Ref: https://github.com/yt-dlp/yt-dlp/issues/2823
-												[youtube] Avoid false positives when detecting damaged formats

Closes #3083

											
										
										
											2022-03-16 09:16:19 -05:00
+								            # Make sure to avoid false positives with small duration differences.
-												[docs] Consistent use of `e.g.` (#4643)

Authored by: Lesmiscore
											
										
										
											2022-08-14 07:04:13 -05:00
+								            # E.g. __2ABJjxzNo, ySuUZEjARPY
-												[ie/youtube] Calculate more accurate `filesize`

YouTube provides slightly different duration for each format.
Calculating file-size based on this duration instead of the
video duration gives more accurate results.

Ref: https://github.com/yt-dlp/yt-dlp/issues/1400#issuecomment-2007441207

											
										
										
											2024-03-31 15:50:03 -05:00
+								            is_damaged = try_call(lambda: format_duration < duration // 2)
-												[cleanup, docs] Misc cleanup

Closes #2828, closes #2734, closes #2802, closes #2937

											
										
										
											2022-03-04 08:08:55 -06:00
+								            if is_damaged:
-												[cleanup] Minor fixes (See desc)

* [youtube] Fix `--youtube-skip-dash-manifest`
* [build] Use `$()` in `Makefile`. Closes #3684
* Fix bug in 385ffb467b2285e85a2a5495b90314ba1f8e0700
* Fix bug in 43d7f5a5d0c77556156a3f8caa6976d3908a1e38
* [cleanup] Remove unnecessary `utf-8` from `str.encode`/`bytes.decode`
* [utils] LazyList: Expose unnecessarily "protected" attributes
and other minor cleanup

											
										
										
											2022-05-09 06:54:28 -05:00
+								                self.report_warning(
 								                    f'{video_id}: Some formats are possibly damaged. They will be deprioritized', only_once=True)
-												[extractor/youtube] Add client name to `format_note` when `-v` (#6254)

Authored by: Lesmiscore, pukkandan
											
										
										
											2023-03-11 11:03:23 -06:00
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            po_token = fmt.get(STREAMING_DATA_INITIAL_PO_TOKEN)
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
 								            if po_token:
 								                fmt_url = update_url_query(fmt_url, {'pot': po_token})
 								            # Clients that require PO Token return videoplayback URLs that may return 403
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            require_po_token = (
 								                not po_token
 								                and _PoTokenContext.GVS in self._get_default_ytcfg(client_name)['PO_TOKEN_REQUIRED_CONTEXTS']
 								                and itag not in ['18'])  # these formats do not require PO Token
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-23 17:03:28 -06:00
+								            if require_po_token and 'missing_pot' not in self._configuration_arg('formats'):
 								                self._report_pot_format_skipped(video_id, client_name, 'https')
 								                continue
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-17 11:03:02 -05:00
-												[extractor/youtube] Prioritize premium formats

Closes #7283

											
										
										
											2023-06-19 03:39:26 -05:00
+								            name = fmt.get('qualityLabel') or quality.replace('audio_quality_', '') or ''
-												[extractor/youtube] Ignore wrong fps of some formats

											
										
										
											2023-06-20 18:41:14 -05:00
+								            fps = int_or_none(fmt.get('fps')) or 0
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            dct = {
 								                'asr': int_or_none(fmt.get('audioSampleRate')),
 								                'filesize': int_or_none(fmt.get('contentLength')),
-												[extractor/youtube] Extract DRC formats

											
										
										
											2022-12-30 04:02:33 -06:00
+								                'format_id': f'{itag}{"-drc" if fmt.get("isDrc") else ""}',
-												[utils] Add `join_nonempty`

											
										
										
											2021-11-05 20:05:24 -05:00
+								                'format_note': join_nonempty(
-												[ie/youtube] Prioritize original language over auto-dubbed audio (#11803)

Closes #11753
Authored by: bashonly
											
										
										
											2024-12-13 04:21:48 -06:00
+								                    join_nonempty(display_name, is_default and ' (default)', delim=''),
-												[extractor/youtube] Prioritize premium formats

Closes #7283

											
										
										
											2023-06-19 03:39:26 -05:00
+								                    name, fmt.get('isDrc') and 'DRC',
-												[extractor/youtube] Extract more format info

											
										
										
											2022-08-07 15:06:11 -05:00
+								                    try_get(fmt, lambda x: x['projectionType'].replace('RECTANGULAR', '').lower()),
 								                    try_get(fmt, lambda x: x['spatialAudioType'].replace('SPATIAL_AUDIO_TYPE_', '').lower()),
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-23 17:03:28 -06:00
+								                    is_damaged and 'DAMAGED', require_po_token and 'MISSING POT',
-												[ie/youtube] Fix `format_note` (Bugfix for 3a3bd00037e9908e87da4fa9f2ad772aa34dc60e) (#11028)

Authored by: bashonly
											
										
										
											2024-09-24 17:12:02 -05:00
+								                    (self.get_param('verbose') or all_formats) and short_client_name(client_name),
-												[extractor/youtube] Add client name to `format_note` when `-v` (#6254)

Authored by: Lesmiscore, pukkandan
											
										
										
											2023-03-11 11:03:23 -06:00
+								                    delim=', '),
-												[youtube] Deprioritize format 22

Reduces chance of encountering #3372

											
										
										
											2022-05-06 21:33:41 -05:00
+								                # Format 22 is likely to be damaged. See https://github.com/yt-dlp/yt-dlp/issues/3372
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								                'source_preference': (-5 if itag == '22' else -1) + (100 if 'Premium' in name else 0),
-												[extractor/youtube] Ignore wrong fps of some formats

											
										
										
											2023-06-20 18:41:14 -05:00
+								                'fps': fps if fps > 1 else None,  # For some formats, fps is wrongly returned as 1
-												[extractor/youtube] Extract more format info

											
										
										
											2022-08-07 15:06:11 -05:00
+								                'audio_channels': fmt.get('audioChannels'),
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-25 17:03:42 -05:00
+								                'height': height,
-												[extractor/youtube] Extract DRC formats

											
										
										
											2022-12-30 04:02:33 -06:00
+								                'quality': q(quality) - bool(fmt.get('isDrc')) / 2,
-												[ie/youtube] Warn on DRM formats (#12593)

Authored by: coletdjnz
											
										
										
											2025-03-15 16:28:16 -05:00
+								                'has_drm': has_drm,
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								                'tbr': tbr,
-												[ie/youtube] Calculate more accurate `filesize`

YouTube provides slightly different duration for each format.
Calculating file-size based on this duration instead of the
video duration gives more accurate results.

Ref: https://github.com/yt-dlp/yt-dlp/issues/1400#issuecomment-2007441207

											
										
										
											2024-03-31 15:50:03 -05:00
+								                'filesize_approx': filesize_from_tbr(tbr, format_duration),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                'url': fmt_url,
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-25 17:03:42 -05:00
+								                'width': int_or_none(fmt.get('width')),
-												[ie/youtube] Extract all formats from multi-language m3u8s (#9875)

Authored by: clienthax, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-06-20 16:54:53 -05:00
+								                'language': join_nonempty(language_code, 'desc' if is_descriptive else '') or None,
-												[ie/youtube] Prioritize original language over auto-dubbed audio (#11803)

Closes #11753
Authored by: bashonly
											
										
										
											2024-12-13 04:21:48 -06:00
+								                'language_preference': PREFERRED_LANG_VALUE if is_original else 5 if is_default else -10 if is_descriptive else -1,
-												[ie/youtube] Remove `android` from default clients (#9553)

Closes #9554
Authored by: coletdjnz, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-05-17 11:03:02 -05:00
+								                # Strictly de-prioritize broken, damaged and 3gp formats
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-23 17:03:28 -06:00
+								                'preference': -20 if require_po_token else -10 if is_damaged else -2 if itag == '17' else None,
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            }
-												[youtube] Fix sorting of 3gp format

											
										
										
											2021-07-08 11:11:08 -05:00
+								            mime_mobj = re.match(
 								                r'((?:[^/]+)/(?:[^;]+))(?:;\s*codecs="([^"]+)")?', fmt.get('mimeType') or '')
 								            if mime_mobj:
 								                dct['ext'] = mimetype2ext(mime_mobj.group(1))
 								                dct.update(parse_codecs(mime_mobj.group(2)))
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 11:43:02 -06:00
+								            if itag:
 								                itags[itag].add(('https', dct.get('language')))
 								                stream_ids.append(stream_id)
-												[extractor/youtube] Bypass throttling for `-f17`

and related cleanup

Thanks @AudricV for the finding

											
										
										
											2023-03-09 10:39:23 -06:00
+								            single_stream = 'none' in (dct.get('acodec'), dct.get('vcodec'))
 								            if single_stream and dct.get('ext'):
 								                dct['container'] = dct['ext'] + '_dash'
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 11:43:02 -06:00
-												[extractor/youtube] Add extractor-arg `formats`

Closes #7417

											
										
										
											2023-06-25 09:40:00 -05:00
+								            if (all_formats or 'dashy' in format_types) and dct['filesize']:
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 11:43:02 -06:00
+								                yield {
 								                    **dct,
 								                    'format_id': f'{dct["format_id"]}-dashy' if all_formats else dct['format_id'],
-												[extractor/youtube] Construct dash formats with `range` query

Closes #6369

											
										
										
											2023-02-28 11:33:44 -06:00
+								                    'protocol': 'http_dash_segments',
-												Fix 2a23d92d9ec44a0168079e38bcf3d383e5c4c7bb

Closes #6517

											
										
										
											2023-03-12 04:16:09 -05:00
+								                    'fragments': build_fragments(dct),
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 11:43:02 -06:00
+								                }
-												[extractor/youtube] Add extractor-arg `formats`

Closes #7417

											
										
										
											2023-06-25 09:40:00 -05:00
+								            if all_formats or 'dashy' not in format_types:
 								                dct['downloader_options'] = {'http_chunk_size': CHUNK_SIZE}
 								                yield dct
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								        needs_live_processing = self._needs_live_processing(live_status, duration)
-												[extractor/youtube] Add extractor-arg `formats`

Closes #7417

											
										
										
											2023-06-25 09:40:00 -05:00
+								        skip_bad_formats = 'incomplete' not in format_types
 								        if self._configuration_arg('include_incomplete_formats'):
 								            skip_bad_formats = False
 								            self._downloader.deprecated_feature('[youtube] include_incomplete_formats extractor argument is deprecated. '
 								                                                'Use formats=incomplete extractor argument instead')
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
 								        skip_manifests = set(self._configuration_arg('skip'))
 								        if (not self.get_param('youtube_include_hls_manifest', True)
 								                or needs_live_processing == 'is_live'  # These will be filtered out by YoutubeDL anyway
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 09:29:30 -06:00
+								                or (needs_live_processing and skip_bad_formats)):
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            skip_manifests.add('hls')
-												[cleanup] Minor fixes (See desc)

* [youtube] Fix `--youtube-skip-dash-manifest`
* [build] Use `$()` in `Makefile`. Closes #3684
* Fix bug in 385ffb467b2285e85a2a5495b90314ba1f8e0700
* Fix bug in 43d7f5a5d0c77556156a3f8caa6976d3908a1e38
* [cleanup] Remove unnecessary `utf-8` from `str.encode`/`bytes.decode`
* [utils] LazyList: Expose unnecessarily "protected" attributes
and other minor cleanup

											
										
										
											2022-05-09 06:54:28 -05:00
+								        if not self.get_param('youtube_include_dash_manifest', True):
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            skip_manifests.add('dash')
 								        if self._configuration_arg('include_live_dash'):
 								            self._downloader.deprecated_feature('[youtube] include_live_dash extractor argument is deprecated. '
-												[extractor/youtube] Add extractor-arg `formats`

Closes #7417

											
										
										
											2023-06-25 09:40:00 -05:00
+								                                                'Use formats=incomplete extractor argument instead')
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								        elif skip_bad_formats and live_status == 'is_live' and needs_live_processing != 'is_live':
 								            skip_manifests.add('dash')
-												Add `--extractor-args` to pass extractor-specific arguments

											
										
										
											2021-06-25 09:05:41 -05:00
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								        def process_manifest_format(f, proto, client_name, itag, po_token):
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-14 17:53:32 -06:00
+								            key = (proto, f.get('language'))
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 11:43:02 -06:00
+								            if not all_formats and key in itags[itag]:
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-14 17:53:32 -06:00
+								                return False
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								            if f.get('source_preference') is None:
 								                f['source_preference'] = -1
 								            # Clients that require PO Token return videoplayback URLs that may return 403
 								            # hls does not currently require PO Token
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            if (
 								                not po_token
 								                and _PoTokenContext.GVS in self._get_default_ytcfg(client_name)['PO_TOKEN_REQUIRED_CONTEXTS']
 								                and proto != 'hls'
 								            ):
-												[ie/youtube] Skip iOS formats that require PO Token (#11890)

Partial fix for https://github.com/yt-dlp/yt-dlp/issues/11868

Authored by: coletdjnz
											
										
										
											2024-12-23 17:03:28 -06:00
+								                if 'missing_pot' not in self._configuration_arg('formats'):
 								                    self._report_pot_format_skipped(video_id, client_name, proto)
 								                    return False
 								                f['format_note'] = join_nonempty(f.get('format_note'), 'MISSING POT', delim=' ')
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                f['source_preference'] -= 20
-												[ie/youtube] Fix DASH formats incorrectly skipped in some situations (#11910)

Closes https://github.com/yt-dlp/yt-dlp/issues/11907
Authored by: coletdjnz
											
										
										
											2024-12-25 19:19:17 -06:00
+								            itags[itag].add(key)
-												[extractor/youtube] Add extractor-arg `include_duplicate_formats`

											
										
										
											2023-03-09 11:43:02 -06:00
+								            if itag and all_formats:
 								                f['format_id'] = f'{itag}-{proto}'
 								            elif any(p != proto for p, _ in itags[itag]):
-												[extractor/youtube] Consider language in format de-duplication

											
										
										
											2022-11-14 17:53:32 -06:00
+								                f['format_id'] = f'{itag}-{proto}'
 								            elif itag:
-												[youtube] refactor itag processing

											
										
										
											2021-10-31 02:56:44 -05:00
+								                f['format_id'] = itag
-												[ie/youtube] Extract all formats from multi-language m3u8s (#9875)

Authored by: clienthax, bashonly

Co-authored-by: bashonly <88596187+bashonly@users.noreply.github.com>
											
										
										
											2024-06-20 16:54:53 -05:00
+								            if original_language and f.get('language') == original_language:
 								                f['format_note'] = join_nonempty(f.get('format_note'), '(default)', delim=' ')
 								                f['language_preference'] = PREFERRED_LANG_VALUE
-												[extractor/youtube] Add `ios` to default clients used

* IOS is affected neither by 403 or by nsig so helps mitigate them preemptively
* IOS also has higher bit-rate "premium" formats though they are not labeled as such

											
										
										
											2023-06-21 13:50:04 -05:00
+								            if itag in ('616', '235'):
 								                f['format_note'] = join_nonempty(f.get('format_note'), 'Premium', delim=' ')
-												[ie/youtube] Avoid false DRM detection (#7396)

Some master manifests contain a mix of DRM and non-DRM formats

											
										
										
											2023-06-23 07:46:07 -05:00
+								                f['source_preference'] += 100
-												[extractor/youtube] Add `ios` to default clients used

* IOS is affected neither by 403 or by nsig so helps mitigate them preemptively
* IOS also has higher bit-rate "premium" formats though they are not labeled as such

											
										
										
											2023-06-21 13:50:04 -05:00
-												[extractor/youtube] Fix bug in format sorting

											
										
										
											2022-08-20 14:26:27 -05:00
+								            f['quality'] = q(itag_qualities.get(try_get(f, lambda f: f['format_id'].split('-')[0]), -1))
-												[youtube] Improve format sorting for IOS formats

When no itag/resolution is available for reference, use the closest resolution

											
										
										
											2022-08-15 03:28:39 -05:00
+								            if f['quality'] == -1 and f.get('height'):
 								                f['quality'] = q(res_qualities[min(res_qualities, key=lambda x: abs(x - f['height']))])
-												[cleanup] Misc

Closes #6288, Closes #7197, Closes #7265, Closes #7353, Closes #5773
Authored by: mikf, freezboltz, pukkandan

											
										
										
											2023-06-20 22:51:20 -05:00
+								            if self.get_param('verbose') or all_formats:
-												[ie/youtube] Fix `format_note` (Bugfix for 3a3bd00037e9908e87da4fa9f2ad772aa34dc60e) (#11028)

Authored by: bashonly
											
										
										
											2024-09-24 17:12:02 -05:00
+								                f['format_note'] = join_nonempty(
 								                    f.get('format_note'), short_client_name(client_name), delim=', ')
-												[extractor/youtube] Ignore wrong fps of some formats

											
										
										
											2023-06-20 18:41:14 -05:00
+								            if f.get('fps') and f['fps'] <= 1:
 								                del f['fps']
-												[ie/youtube] Avoid false DRM detection (#7396)

Some master manifests contain a mix of DRM and non-DRM formats

											
										
										
											2023-06-23 07:46:07 -05:00
 								            if proto == 'hls' and f.get('has_drm'):
 								                f['has_drm'] = 'maybe'
 								                f['source_preference'] -= 5
-												[youtube] refactor itag processing

											
										
										
											2021-10-31 02:56:44 -05:00
+								            return True
-												[youtube] Fix format sorting when using alternate clients

											
										
										
											2021-07-25 17:03:42 -05:00
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-21 17:16:54 -05:00
+								        subtitles = {}
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        for sd in streaming_data:
-												[ie/youtube] Fix `format_note` (Bugfix for 3a3bd00037e9908e87da4fa9f2ad772aa34dc60e) (#11028)

Authored by: bashonly
											
										
										
											2024-09-24 17:12:02 -05:00
+								            client_name = sd[STREAMING_DATA_CLIENT_NAME]
-												[ie/youtube] Use different PO token for GVS and Player (#12090)

Authored by: coletdjnz
											
										
										
											2025-01-24 18:17:37 -06:00
+								            po_token = sd.get(STREAMING_DATA_INITIAL_PO_TOKEN)
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            hls_manifest_url = 'hls' not in skip_manifests and sd.get('hlsManifestUrl')
-												[Youtube] Extract more formats for `music.youtube` URLs (#311)

Based on: https://github.com/ytdl-org/youtube-dl/pull/28778, https://github.com/ytdl-org/youtube-dl/pull/26160

Co-authored-by: craftingmod, colethedj, pukkandan
											
										
										
											2021-05-15 09:38:47 -05:00
+								            if hls_manifest_url:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                if po_token:
 								                    hls_manifest_url = hls_manifest_url.rstrip('/') + f'/pot/{po_token}'
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								                fmts, subs = self._extract_m3u8_formats_and_subtitles(
 								                    hls_manifest_url, video_id, 'mp4', fatal=False, live=live_status == 'is_live')
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-21 17:16:54 -05:00
+								                subtitles = self._merge_subtitles(subs, subtitles)
 								                for f in fmts:
-												[extractor/youtube] Add client name to `format_note` when `-v` (#6254)

Authored by: Lesmiscore, pukkandan
											
										
										
											2023-03-11 11:03:23 -06:00
+								                    if process_manifest_format(f, 'hls', client_name, self._search_regex(
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                            r'/itag/(\d+)', f['url'], 'itag', default=None), po_token):
-												[youtube] refactor itag processing

											
										
										
											2021-10-31 02:56:44 -05:00
+								                        yield f
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            dash_manifest_url = 'dash' not in skip_manifests and sd.get('dashManifestUrl')
-												Add `--extractor-args` to pass extractor-specific arguments

											
										
										
											2021-06-25 09:05:41 -05:00
+								            if dash_manifest_url:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                if po_token:
 								                    dash_manifest_url = dash_manifest_url.rstrip('/') + f'/pot/{po_token}'
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-21 17:16:54 -05:00
+								                formats, subs = self._extract_mpd_formats_and_subtitles(dash_manifest_url, video_id, fatal=False)
 								                subtitles = self._merge_subtitles(subs, subtitles)  # Prioritize HLS subs over DASH
 								                for f in formats:
-												[ie/youtube] Add `po_token`, `visitor_data`, `data_sync_id` extractor args (#10648)

Authored by:  seproDev, coletdjnz, bashonly
											
										
										
											2024-09-13 05:51:58 -05:00
+								                    if process_manifest_format(f, 'dash', client_name, f['format_id'], po_token):
-												[youtube] refactor itag processing

											
										
										
											2021-10-31 02:56:44 -05:00
+								                        f['filesize'] = int_or_none(self._search_regex(
 								                            r'/clen/(\d+)', f.get('fragment_base_url') or f['url'], 'file size', default=None))
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								                        if needs_live_processing:
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								                            f['is_from_start'] = True
-												[youtube] refactor itag processing

											
										
										
											2021-10-31 02:56:44 -05:00
+								                        yield f
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-21 17:16:54 -05:00
+								        yield subtitles
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-16 13:56:23 -06:00
+								    def _extract_storyboard(self, player_responses, duration):
 								        spec = get_first(
 								            player_responses, ('storyboards', 'playerStoryboardSpecRenderer', 'spec'), default='').split('|')[::-1]
-												[youtube] Make invalid storyboard URL non-fatal

Closes #2382

											
										
										
											2022-01-19 06:39:52 -06:00
+								        base_url = url_or_none(urljoin('https://i.ytimg.com/', spec.pop() or None))
 								        if not base_url:
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-16 13:56:23 -06:00
+								            return
 								        L = len(spec) - 1
 								        for i, args in enumerate(spec):
 								            args = args.split('#')
 								            counts = list(map(int_or_none, args[:5]))
 								            if len(args) != 8 or not all(counts):
 								                self.report_warning(f'Malformed storyboard {i}: {"#".join(args)}{bug_reports_message()}')
 								                continue
 								            width, height, frame_count, cols, rows = counts
 								            N, sigh = args[6:]
 								            url = base_url.replace('$L', str(L - i)).replace('$N', N) + f'&sigh={sigh}'
 								            fragment_count = frame_count / (cols * rows)
 								            fragment_duration = duration / fragment_count
 								            yield {
 								                'format_id': f'sb{i}',
 								                'format_note': 'storyboard',
 								                'ext': 'mhtml',
 								                'protocol': 'mhtml',
 								                'acodec': 'none',
 								                'vcodec': 'none',
 								                'url': url,
 								                'width': width,
 								                'height': height,
-												[extractor/youtube] More metadata for storyboards (#4334)

Authored by: ftk
											
										
										
											2022-07-12 10:16:45 -05:00
+								                'fps': frame_count / duration,
 								                'rows': rows,
 								                'columns': cols,
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-16 13:56:23 -06:00
+								                'fragments': [{
-												[downloader/mhtml] Fix fragments with absolute urls (#3044)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:03:40 -05:00
+								                    'url': url.replace('$M', str(j)),
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-16 13:56:23 -06:00
+								                    'duration': min(fragment_duration, duration - (j * fragment_duration)),
 								                } for j in range(math.ceil(fragment_count))],
 								            }
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								    def _download_player_responses(self, url, smuggled_data, video_id, webpage_url):
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								        webpage = None
 								        if 'webpage' not in self._configuration_arg('player_skip'):
-												[extractor/youtube] Use device-specific user agent (#4770)

Thwart latest fingerprinting attempt (see https://github.com/iv-org/invidious/issues/3230#issuecomment-1226887639)

Authored by: coletdjnz
											
										
										
											2022-08-28 17:59:54 -05:00
+								            query = {'bpctr': '9999999999', 'has_verified': '1'}
-												[ie/youtube] Fix `player_params` arg being converted to lowercase

Fix bug in ba06d77a316650ff057347d224b5afa8b203ad65

Authored by: coletdjnz

											
										
										
											2023-07-29 17:50:25 -05:00
+								            pp = self._configuration_arg('player_params', [None], casesense=True)[0]
-												[ie/youtube] Add `player_params` extractor arg (#7719)

Authored by: coletdjnz
											
										
										
											2023-07-29 01:20:42 -05:00
+								            if pp:
 								                query['pp'] = pp
-												[ie/youtube] Retry on more critical requests (#12339)

Authored by: coletdjnz
											
										
										
											2025-02-18 18:39:51 -06:00
+								            webpage = self._download_webpage_with_retries(webpage_url, video_id, query=query)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
 								        master_ytcfg = self.extract_ytcfg(video_id, webpage) or self._get_default_ytcfg()
-												[youtube] Improvements to JS player extraction (See desc) (#860)

* fallback player url extraction when it fails to be extracted from the webpage
* don't download js player unnecessarily for clients that don't require it
* try to extract js player url from any additional client configs
* ability to skip the js player usage/download using `player_skip=js`
* ability to skip the initial webpage download using `player_skip=webpage`

known issue:
* authentication for multi-channel accounts and multi-account cookies may not work correctly if the webpage or client configs are skipped
*  formats from the web client requiring signature decryption will be skipped if player js extraction is skipped

Authored by: coletdjnz
											
										
										
											2021-09-06 02:26:41 -05:00
+								        player_responses, player_url = self._extract_player_responses(
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								            self._get_requested_clients(url, smuggled_data),
-												[extractor/youtube] Use device-specific user agent (#4770)

Thwart latest fingerprinting attempt (see https://github.com/iv-org/invidious/issues/3230#issuecomment-1226887639)

Authored by: coletdjnz
											
										
										
											2022-08-28 17:59:54 -05:00
+								            video_id, webpage, master_ytcfg, smuggled_data)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								        return webpage, master_ytcfg, player_responses, player_url
-												[youtube] Avoid false positives when detecting damaged formats

Closes #3083

											
										
										
											2022-03-16 09:16:19 -05:00
+								    def _list_formats(self, video_id, microformats, video_details, player_responses, player_url, duration=None):
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								        live_broadcast_details = traverse_obj(microformats, (..., 'liveBroadcastDetails'))
 								        is_live = get_first(video_details, 'isLive')
 								        if is_live is None:
 								            is_live = get_first(live_broadcast_details, 'isLiveNow')
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								        live_content = get_first(video_details, 'isLiveContent')
 								        is_upcoming = get_first(video_details, 'isUpcoming')
 								        post_live = get_first(video_details, 'isPostLiveDvr')
 								        live_status = ('post_live' if post_live
 								                       else 'is_live' if is_live
 								                       else 'is_upcoming' if is_upcoming
-												[extractor/youtube] Fix live_status

Bug in 4d37720a0c5f1c9c4768ea20b0f943277f55bc12

											
										
										
											2022-10-13 21:11:53 -05:00
+								                       else 'was_live' if live_content
 								                       else 'not_live' if False in (is_live, live_content)
 								                       else None)
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								        streaming_data = traverse_obj(player_responses, (..., 'streamingData'))
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								        *formats, subtitles = self._extract_formats_and_subtitles(streaming_data, video_id, player_url, live_status, duration)
-												[ie/youtube] Avoid false DRM detection (#7396)

Some master manifests contain a mix of DRM and non-DRM formats

											
										
										
											2023-06-23 07:46:07 -05:00
+								        if all(f.get('has_drm') for f in formats):
 								            # If there are no formats that definitely don't have DRM, all have DRM
 								            for f in formats:
 								                f['has_drm'] = True
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								        return live_broadcast_details, live_status, streaming_data, formats, subtitles
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that downloads from start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
 								    def _real_extract(self, url):
 								        url, smuggled_data = unsmuggle_url(url, {})
 								        video_id = self._match_id(url)
 								        base_url = self.http_scheme() + '//www.youtube.com/'
 								        webpage_url = base_url + 'watch?v=' + video_id
 								        webpage, master_ytcfg, player_responses, player_url = self._download_player_responses(url, smuggled_data, video_id, webpage_url)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        playability_statuses = traverse_obj(
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								            player_responses, (..., 'playabilityStatus'), expected_type=dict)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
 								        trailer_video_id = get_first(
 								            playability_statuses,
 								            ('errorScreen', 'playerLegacyDesktopYpcTrailerRenderer', 'trailerVideoId'),
 								            expected_type=str)
 								        if trailer_video_id:
 								            return self.url_result(
 								                trailer_video_id, self.ie_key(), trailer_video_id)
 								        search_meta = ((lambda x: self._html_search_meta(x, webpage, default=None))
 								                       if webpage else (lambda x: None))
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								        video_details = traverse_obj(player_responses, (..., 'videoDetails'), expected_type=dict)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        microformats = traverse_obj(
 								            player_responses, (..., 'microformat', 'playerMicroformatRenderer'),
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								            expected_type=dict)
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
 								        translated_title = self._get_text(microformats, (..., 'title'))
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 09:29:30 -06:00
+								        video_title = ((self._preferred_lang and translated_title)
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								                       or get_first(video_details, 'title')  # primary
 								                       or translated_title
 								                       or search_meta(['og:title', 'twitter:title', 'title']))
 								        translated_description = self._get_text(microformats, (..., 'description'))
 								        original_description = get_first(video_details, 'shortDescription')
 								        video_description = (
-												[cleanup] Bump ruff to 0.8.x (#11608)

Authored by: seproDev
											
										
										
											2024-12-02 09:29:30 -06:00
+								            (self._preferred_lang and translated_description)
-												[extractor/youtube] Support changing extraction language (#4470)

Adds `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) of that language, if available, for all YouTube extractors. See README or error message for list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								            # If original description is blank, it will be an empty string.
 								            # Do not prefer translated description in this case.
 								            or original_description if original_description is not None else translated_description)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 05:57:34 -05:00
+								        multifeed_metadata_list = get_first(
 								            player_responses,
 								            ('multicamera', 'playerLegacyMulticameraRenderer', 'metadataList'),
 								            expected_type=str)
 								        if multifeed_metadata_list and not smuggled_data.get('force_singlefeed'):
 								            if self.get_param('noplaylist'):
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                self.to_screen(f'Downloading just video {video_id} because of --no-playlist')
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 05:57:34 -05:00
+								            else:
 								                entries = []
 								                feed_ids = []
 								                for feed in multifeed_metadata_list.split(','):
 								                    # Unquote should take place before split on comma (,) since textual
 								                    # fields may contain comma as well (see
 								                    # https://github.com/ytdl-org/youtube-dl/issues/8536)
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 05:54:43 -05:00
+								                    feed_data = urllib.parse.parse_qs(
-												[compat] Remove more functions

Removing any more will require changes to a large number of extractors

											
										
										
											2022-06-24 03:10:17 -05:00
+								                        urllib.parse.unquote_plus(feed))
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 05:57:34 -05:00
 								                    def feed_entry(name):
 								                        return try_get(
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 05:54:43 -05:00
+								                            feed_data, lambda x: x[name][0], str)
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 05:57:34 -05:00
 								                    feed_id = feed_entry('id')
 								                    if not feed_id:
 								                        continue
 								                    feed_title = feed_entry('title')
 								                    title = video_title
 								                    if feed_title:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                        title += f' ({feed_title})'
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 05:57:34 -05:00
+								                    entries.append({
 								                        '_type': 'url_transparent',
 								                        'ie_key': 'Youtube',
 								                        'url': smuggle_url(
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                            '{}watch?v={}'.format(base_url, feed_data['id'][0]),
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 05:57:34 -05:00
+								                            {'force_singlefeed': True}),
 								                        'title': title,
 								                    })
 								                    feed_ids.append(feed_id)
 								                self.to_screen(
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                    'Downloading multifeed video ({}) - add --no-playlist to just download video {}'.format(
 								                        ', '.join(feed_ids), video_id))
-												[youtube] Remove unnecessary no-playlist warning

											
										
										
											2021-11-03 05:57:34 -05:00
+								                return self.playlist_result(
 								                    entries, video_id, video_title, video_description)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
-												[extractor/youtube] Fix `duration` for premieres (#5382)

Closes #5378
Authored by: nosoop
											
										
										
											2022-10-28 13:30:33 -05:00
+								        duration = (int_or_none(get_first(video_details, 'lengthSeconds'))
 								                    or int_or_none(get_first(microformats, 'lengthSeconds'))
 								                    or parse_duration(search_meta('duration')) or None)
-												[youtube] Avoid false positives when detecting damaged formats

Closes #3083

											
										
										
											2022-03-16 09:16:19 -05:00
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								        live_broadcast_details, live_status, streaming_data, formats, automatic_captions = \
 								            self._list_formats(video_id, microformats, video_details, player_responses, player_url, duration)
 								        if live_status == 'post_live':
 								            self.write_debug(f'{video_id}: Video is in Post-Live Manifestless mode')
-												[youtube] Quick extraction tempfix (closes #22367, closes #22163)

											
										
										
											2019-09-11 10:44:47 -05:00
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        if not formats:
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								            if not self.get_param('allow_unplayable_formats') and traverse_obj(streaming_data, (..., 'licenseInfos')):
-												[extractor] Better error message for DRM (#729)

Closes #636
											
										
										
											2021-08-22 15:08:38 -05:00
+								                self.report_drm(video_id)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								            pemr = get_first(
 								                playability_statuses,
 								                ('errorScreen', 'playerErrorMessageRenderer'), expected_type=dict) or {}
 								            reason = self._get_text(pemr, 'reason') or get_first(playability_statuses, 'reason')
 								            subreason = clean_html(self._get_text(pemr, 'subreason') or '')
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            if subreason:
 								                if subreason == 'The uploader has not made this video available in your country.':
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								                    countries = get_first(microformats, 'availableCountries')
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                    if not countries:
 								                        regions_allowed = search_meta('regionsAllowed')
 								                        countries = regions_allowed.split(',') if regions_allowed else None
-												Add option `--ignore-no-formats-error`
* Ignores the "no video format" and similar errors
* Experimental - Some extractors may still throw these errors

											
										
										
											2021-04-16 19:09:58 -05:00
+								                    self.raise_geo_restricted(subreason, countries, metadata_available=True)
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								                reason += f'. {subreason}'
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            if reason:
-												[ie/youtube] Remove broken OAuth support (#11558)

Closes #11462
Authored by: bashonly
											
										
										
											2024-11-16 17:40:21 -06:00
+								                if 'sign in' in reason.lower():
 								                    reason = remove_end(reason, 'This helps protect our community. Learn more')
 								                    reason = f'{remove_end(reason.strip(), ".")}. {self._youtube_login_hint}'
-												Add option `--ignore-no-formats-error`
* Ignores the "no video format" and similar errors
* Experimental - Some extractors may still throw these errors

											
										
										
											2021-04-16 19:09:58 -05:00
+								                self.raise_no_formats(reason, expected=True)
-												[youtube] Quick extraction tempfix (closes #22367, closes #22163)

											
										
										
											2019-09-11 10:44:47 -05:00
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        keywords = get_first(video_details, 'keywords', expected_type=list) or []
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        if not keywords and webpage:
 								            keywords = [
 								                unescapeHTML(m.group('content'))
 								                for m in re.finditer(self._meta_regex('og:video:tag'), webpage)]
 								        for keyword in keywords:
 								            if keyword.startswith('yt:stretch='):
-												Update to ytdl-commit-9f6c03

[cbsnews] Fix extraction for python <3.6
https://github.com/ytdl-org/youtube-dl/commit/9f6c03a00602eb1119e43a522cf50682f6d6a6dd

											
										
										
											2021-04-16 22:02:33 -05:00
+								                mobj = re.search(r'(\d+)\s*:\s*(\d+)', keyword)
 								                if mobj:
 								                    # NB: float is intentional for forcing float division
 								                    w, h = (float(v) for v in mobj.groups())
 								                    if w > 0 and h > 0:
 								                        ratio = w / h
 								                        for f in formats:
 								                            if f.get('vcodec') != 'none':
 								                                f['stretched_ratio'] = ratio
 								                        break
-												[youtube:tab] Extract video thumbnails from playlist (#2096)

closes #1184
Co-Authored-by: coletdjnz, pukkandan
											
										
										
											2021-12-23 21:42:02 -06:00
+								        thumbnails = self._extract_thumbnails((video_details, microformats), (..., ..., 'thumbnail'))
-												[youtube] Always extract `maxresdefault` thumbnail
Fixes: https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-05-18 08:45:11 -05:00
+								        thumbnail_url = search_meta(['og:image', 'twitter:image'])
 								        if thumbnail_url:
 								            thumbnails.append({
 								                'url': thumbnail_url,
 								            })
-												[youtube] Populate `thumbnail` with the best "known" thumbnail
Closes #402, Related: https://github.com/yt-dlp/yt-dlp/issues/340#issuecomment-950290624

											
										
										
											2021-10-24 04:25:28 -05:00
+								        original_thumbnails = thumbnails.copy()
-												[youtube] Extract more thumbnails

* The thumbnail URLs are hard-coded and their actual existence is tested lazily
* Added option `--no-check-formats` to not test them

Closes #340, Related: #402, #337, https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-07-15 12:19:59 -05:00
+								        # The best-resolution thumbnails sometimes do not appear in the webpage
-												[youtube] De-prioritize auto-generated thumbnails

Closes #3112

											
										
										
											2022-04-28 14:01:34 -05:00
+								        # See: https://github.com/yt-dlp/yt-dlp/issues/340
-												[youtube] Extract even more thumbnails and reduce testing

* Also fix bug where `_test_url` was being ignored

Ref: https://stackoverflow.com/a/20542029
Related: #340

											
										
										
											2021-07-19 17:10:35 -05:00
+								        # List of possible thumbnails - Ref: <https://stackoverflow.com/a/20542029>
-												Do not verify thumbnail URLs by default

Partially reverts cca80fe6110653582e8c8a8d06490b4028ffd755 and 0ba692acc8feffd46b6e1085fb4a2849b685945c

Unless `--check-formats` is specified, this causes yt-dlp to return incorrect thumbnail urls.
See https://github.com/yt-dlp/yt-dlp/issues/340#issuecomment-877909966, #402

But the overhead in general use is not worth it

Closes #694, #725

											
										
										
											2021-10-18 04:53:42 -05:00
+								        thumbnail_names = [
-												[cleanup] Fix some typos (#4194)

Authored by: crazymoose77756
											
										
										
											2022-06-26 19:50:06 -05:00
+								            # While the *1,*2,*3 thumbnails are just below their corresponding "*default" variants
-												[youtube] De-prioritize auto-generated thumbnails

Closes #3112

											
										
										
											2022-04-28 14:01:34 -05:00
+								            # in resolution, these are not the custom thumbnail. So de-prioritize them
 								            'maxresdefault', 'hq720', 'sddefault', 'hqdefault', '0', 'mqdefault', 'default',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            'sd1', 'sd2', 'sd3', 'hq1', 'hq2', 'hq3', 'mq1', 'mq2', 'mq3', '1', '2', '3',
-												[youtube] Extract even more thumbnails and reduce testing

* Also fix bug where `_test_url` was being ignored

Ref: https://stackoverflow.com/a/20542029
Related: #340

											
										
										
											2021-07-19 17:10:35 -05:00
+								        ]
 								        n_thumbnail_names = len(thumbnail_names)
-												[youtube] Extract more thumbnails

* The thumbnail URLs are hard-coded and their actual existence is tested lazily
* Added option `--no-check-formats` to not test them

Closes #340, Related: #402, #337, https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-07-15 12:19:59 -05:00
+								        thumbnails.extend({
 								            'url': 'https://i.ytimg.com/vi{webp}/{video_id}/{name}{live}.{ext}'.format(
 								                video_id=video_id, name=name, ext=ext,
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								                webp='_webp' if ext == 'webp' else '', live='_live' if live_status == 'is_live' else ''),
-												[youtube] Extract even more thumbnails and reduce testing

* Also fix bug where `_test_url` was being ignored

Ref: https://stackoverflow.com/a/20542029
Related: #340

											
										
										
											2021-07-19 17:10:35 -05:00
+								        } for name in thumbnail_names for ext in ('webp', 'jpg'))
-												[youtube] Extract more thumbnails

* The thumbnail URLs are hard-coded and their actual existence is tested lazily
* Added option `--no-check-formats` to not test them

Closes #340, Related: #402, #337, https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-07-15 12:19:59 -05:00
+								        for thumb in thumbnails:
-												[youtube] Extract even more thumbnails and reduce testing

* Also fix bug where `_test_url` was being ignored

Ref: https://stackoverflow.com/a/20542029
Related: #340

											
										
										
											2021-07-19 17:10:35 -05:00
+								            i = next((i for i, t in enumerate(thumbnail_names) if f'/{video_id}/{t}' in thumb['url']), n_thumbnail_names)
-												[youtube] Extract more thumbnails

* The thumbnail URLs are hard-coded and their actual existence is tested lazily
* Added option `--no-check-formats` to not test them

Closes #340, Related: #402, #337, https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-07-15 12:19:59 -05:00
+								            thumb['preference'] = (0 if '.webp' in thumb['url'] else -1) - (2 * i)
-												[youtube] Always extract `maxresdefault` thumbnail
Fixes: https://github.com/ytdl-org/youtube-dl/issues/29049

											
										
										
											2021-05-18 08:45:11 -05:00
+								        self._remove_duplicate_formats(thumbnails)
-												[youtube] Populate `thumbnail` with the best "known" thumbnail
Closes #402, Related: https://github.com/yt-dlp/yt-dlp/issues/340#issuecomment-950290624

											
										
										
											2021-10-24 04:25:28 -05:00
+								        self._downloader._sort_thumbnails(original_thumbnails)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 10:15:45 -05:00
+								        category = get_first(microformats, 'category') or search_meta('genre')
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								        channel_id = self.ucid_or_none(str_or_none(
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 10:15:45 -05:00
+								            get_first(video_details, 'channelId')
 								            or get_first(microformats, 'externalChannelId')
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								            or search_meta('channelId')))
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 10:15:45 -05:00
+								        owner_profile_url = get_first(microformats, 'ownerProfileUrl')
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from the start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								        live_start_time = parse_iso8601(get_first(live_broadcast_details, 'startTimestamp'))
 								        live_end_time = parse_iso8601(get_first(live_broadcast_details, 'endTimestamp'))
 								        if not duration and live_end_time and live_start_time:
 								            duration = live_end_time - live_start_time
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								        needs_live_processing = self._needs_live_processing(live_status, duration)
 								        def is_bad_format(fmt):
 								            """Tell whether the format dict `fmt` should be flagged as a bad format.

 								            Returns True when live processing is needed but `fmt` is not marked
 								            `is_from_start`, or when the video is currently live, the
 								            live-processing mode is not 'is_live', and `fmt` uses the
 								            `http_dash_segments` protocol. Returns None otherwise.
 								            """
 								            not_from_start = needs_live_processing and not fmt.get('is_from_start')
 								            if not_from_start:
 								                return True
 								            live_without_live_mode = live_status == 'is_live' and needs_live_processing != 'is_live'
 								            if live_without_live_mode and fmt.get('protocol') == 'http_dash_segments':
 								                return True
 								            return None
 								        for fmt in filter(is_bad_format, formats):
 								            fmt['preference'] = (fmt.get('preference') or -1) - 10
-												[extractor/youtube] Process `post_live` over 2 hours

											
										
										
											2023-06-25 20:55:47 -05:00
+								            fmt['format_note'] = join_nonempty(fmt.get('format_note'), '(Last 2 hours)', delim=' ')
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
 								        if needs_live_processing:
 								            self._prepare_live_from_start_formats(
 								                formats, video_id, live_start_time, url, webpage_url, smuggled_data, live_status == 'is_live')
-												[youtube] Improve extraction of livestream metadata
Modified from and closes #441
Authored by: pukkandan, krichbanana

											
										
										
											2021-07-21 10:15:45 -05:00
-												[youtube] Add storyboard formats
Closes: #1553, https://github.com/ytdl-org/youtube-dl/issues/9868
Related: https://github.com/ytdl-org/youtube-dl/pull/14951

											
										
										
											2021-11-16 13:56:23 -06:00
+								        formats.extend(self._extract_storyboard(player_responses, duration))
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								        channel_handle = self.handle_from_url(owner_profile_url)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        info = {
 								            'id': video_id,
-												[extractor] Standardize `_live_title`

											
										
										
											2021-12-15 10:00:46 -06:00
+								            'title': video_title,
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            'formats': formats,
 								            'thumbnails': thumbnails,
-												[youtube] Populate `thumbnail` with the best "known" thumbnail
Closes #402, Related: https://github.com/yt-dlp/yt-dlp/issues/340#issuecomment-950290624

											
										
										
											2021-10-24 04:25:28 -05:00
+								            # The best thumbnail that we are sure exists. Prevents unnecessary
 								            # URL checking if the user doesn't care about getting the best possible thumbnail
 								            'thumbnail': traverse_obj(original_thumbnails, (-1, 'url')),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            'description': video_description,
 								            'channel_id': channel_id,
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								            'channel_url': format_field(channel_id, None, 'https://www.youtube.com/channel/%s', default=None),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            'duration': duration,
 								            'view_count': int_or_none(
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								                get_first((video_details, microformats), (..., 'viewCount'))
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                or search_meta('interactionCount')),
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								            'average_rating': float_or_none(get_first(video_details, 'averageRating')),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            'age_limit': 18 if (
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								                get_first(microformats, 'isFamilySafe') is False
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                or search_meta('isFamilyFriendly') == 'false'
 								                or search_meta('og:restrictions:age') == '18+') else 0,
 								            'webpage_url': webpage_url,
 								            'categories': [category] if category else None,
 								            'tags': keywords,
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								            'playable_in_embed': get_first(playability_statuses, 'playableInEmbed'),
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								            'live_status': live_status,
-												[ie/youtube] Extract `media_type` for livestreams (#11605)

Closes #11563
Authored by: nosoop
											
										
										
											2025-01-25 21:27:12 -06:00
+								            'media_type': 'livestream' if get_first(video_details, 'isLiveContent') else None,
-												[dash,youtube] Download live from start to end (#888)

* Add option `--live-from-start` to enable downloading live videos from start
* Add key `is_from_start` in formats to identify formats (of live videos) that download from the start
* [dash] Create protocol `http_dash_segments_generator` that allows a function to be passed instead of fragments
* [fragment] Allow multiple live dash formats to download simultaneously
* [youtube] Implement fragment re-fetching for the live dash formats
* [youtube] Re-extract dash manifest every 5 hours (manifest expires in 6hrs)
* [postprocessor/ffmpeg] Add `FFmpegFixupDuplicateMoovPP` to fixup duplicated moov atoms

Known issue: Ctrl+C doesn't work on Windows when downloading multiple formats

Closes #1521
Authored by: nao20010128nao, pukkandan

											
										
										
											2021-12-20 00:06:46 -06:00
+								            'release_timestamp': live_start_time,
-												[ie/youtube] Skip formats if nsig decoding fails (#10223)

Ref: https://github.com/ytdl-org/youtube-dl/issues/32815

Authored by: bashonly
											
										
										
											2024-06-21 18:19:59 -05:00
+								            '_format_sort_fields': (  # source_preference is lower for potentially damaged formats
-												[core] Prioritize AV1 (#11153)

Authored by: seproDev
											
										
										
											2024-11-03 13:39:10 -06:00
+								                'quality', 'res', 'fps', 'hdr:12', 'source', 'vcodec', 'channels', 'acodec', 'lang', 'proto'),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        }
-												[youtube] Fix thumbnails extraction and remove uploader id extraction warning (closes #25676)

											
										
										
											2020-06-15 14:29:04 -05:00
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-21 17:16:54 -05:00
+								        subtitles = {}
-												[youtube] Fix subtitles only being extracted from the first client
Closes #547

											
										
										
											2021-07-22 23:07:15 -05:00
+								        pctr = traverse_obj(player_responses, (..., 'captions', 'playerCaptionsTracklistRenderer'), expected_type=dict)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        if pctr:
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 01:33:56 -05:00
+								            def get_lang_code(track):
 								                return (remove_start(track.get('vssId') or '', '.').replace('.', '-')
 								                        or track.get('languageCode'))
 								            # Converted into dicts to remove duplicates
 								            captions = {
 								                get_lang_code(sub): sub
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								                for sub in traverse_obj(pctr, (..., 'captionTracks', ...))}
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 01:33:56 -05:00
+								            translation_languages = {
 								                lang.get('languageCode'): self._get_text(lang.get('languageName'), max_runs=1)
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								                for lang in traverse_obj(pctr, (..., 'translationLanguages', ...))}
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 01:33:56 -05:00
-												[youtube] Add language names

Co-authored by: nixxo, tpikonen
Based on: https://github.com/ytdl-org/youtube-dl/pull/26112
Closes: #310

											
										
										
											2021-05-13 06:19:40 -05:00
+								            def process_language(container, base_url, lang_code, sub_name, query):
-												[youtube] multiple subtitles in same language

Fixes: https://github.com/ytdl-org/youtube-dl/issues/21164
Related: #310, https://github.com/ytdl-org/youtube-dl/pull/26112

											
										
										
											2021-05-12 14:20:02 -05:00
+								                lang_subs = container.setdefault(lang_code, [])
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                for fmt in self._SUBTITLE_FORMATS:
 								                    query.update({
 								                        'fmt': fmt,
 								                    })
 								                    lang_subs.append({
 								                        'ext': fmt,
-												[youtube] Ensure subtitle urls are absolute (#2765)

Closes #2755

Authored by: coletdjnz
											
										
										
											2022-02-13 15:36:01 -06:00
+								                        'url': urljoin('https://www.youtube.com', update_url_query(base_url, query)),
-												[youtube] Add language names

Co-authored by: nixxo, tpikonen
Based on: https://github.com/ytdl-org/youtube-dl/pull/26112
Closes: #310

											
										
										
											2021-05-13 06:19:40 -05:00
+								                        'name': sub_name,
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                    })
-												[youtube] Move metadata extraction after video availability check

											
										
										
											2018-06-02 14:08:38 -05:00
-												[extractor/youtube] Parse translated subtitles only when requested

Closes #4274

											
										
										
											2022-07-17 17:49:43 -05:00
+								            # NB: Constructing the full subtitle dictionary is slow
 								            get_translated_subs = 'translated_subs' not in self._configuration_arg('skip') and (
 								                self.get_param('writeautomaticsub', False) or self.get_param('listsubtitles'))
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 01:33:56 -05:00
+								            for lang_code, caption_track in captions.items():
 								                base_url = caption_track.get('baseUrl')
-												[youtube] Fix auto-translated automatic captions

d49669acad71f640ffd8b78f0ea7911ae1f67720 only covered ASR

Closes #2956

											
										
										
											2022-03-27 03:36:26 -05:00
+								                orig_lang = parse_qs(base_url).get('lang', [None])[-1]
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                if not base_url:
 								                    continue
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 01:33:56 -05:00
+								                lang_name = self._get_text(caption_track, 'name', max_runs=1)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                if caption_track.get('kind') != 'asr':
 								                    if not lang_code:
 								                        continue
 								                    process_language(
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 01:33:56 -05:00
+								                        subtitles, base_url, lang_code, lang_name, {})
 								                    if not caption_track.get('isTranslatable'):
 								                        continue
-												[youtube] Fix subtitles only being extracted from the first client
Closes #547

											
										
										
											2021-07-22 23:07:15 -05:00
+								                for trans_code, trans_name in translation_languages.items():
 								                    if not trans_code:
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                        continue
-												[youtube] Fix auto-translated automatic captions

d49669acad71f640ffd8b78f0ea7911ae1f67720 only covered ASR

Closes #2956

											
										
										
											2022-03-27 03:36:26 -05:00
+								                    orig_trans_code = trans_code
-												[extractor/youtube] Subtitles cannot be translated to `und`


Closes #5674

											
										
										
											2022-11-29 17:47:45 -06:00
+								                    if caption_track.get('kind') != 'asr' and trans_code != 'und':
-												[extractor/youtube] Parse translated subtitles only when requested

Closes #4274

											
										
										
											2022-07-17 17:49:43 -05:00
+								                        if not get_translated_subs:
-												[youtube] Add extractor-arg to skip auto-translated subs

											
										
										
											2022-03-27 03:34:20 -05:00
+								                            continue
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 01:33:56 -05:00
+								                        trans_code += f'-{lang_code}'
-												[cleanup, utils] Don't use kwargs for `format_field`

											
										
										
											2022-06-17 21:00:12 -05:00
+								                        trans_name += format_field(lang_name, None, ' from %s')
-												[youtube] Fix auto-translated automatic captions

d49669acad71f640ffd8b78f0ea7911ae1f67720 only covered ASR

Closes #2956

											
										
										
											2022-03-27 03:36:26 -05:00
+								                    if lang_code == f'a-{orig_trans_code}':
-												[extractor/youtube] Determine audio language using automatic captions

											
										
										
											2023-06-14 08:38:46 -05:00
+								                        # Set audio language based on original subtitles
 								                        for f in formats:
 								                            if f.get('acodec') != 'none' and not f.get('language'):
 								                                f['language'] = orig_trans_code
 								                        # Add an "-orig" label to the original language so that it can be distinguished.
 								                        # The subs are returned without "-orig" as well for compatibility
-												[youtube] Label original auto-subs

Closes #2655

											
										
										
											2022-02-11 14:20:25 -06:00
+								                        process_language(
-												[youtube] Fix automatic captions

Closes #2956

											
										
										
											2022-03-04 22:08:03 -06:00
+								                            automatic_captions, base_url, f'{trans_code}-orig', f'{trans_name} (Original)', {})
 								                    # Setting tlang=lang returns damaged subtitles.
 								                    process_language(automatic_captions, base_url, trans_code, trans_name,
-												[youtube] Fix auto-translated automatic captions

d49669acad71f640ffd8b78f0ea7911ae1f67720 only covered ASR

Closes #2956

											
										
										
											2022-03-27 03:36:26 -05:00
+								                                     {} if orig_lang == orig_trans_code else {'tlang': trans_code})
-												[webvtt, extractor/youtube] Extract auto-subs from livestream VODs

Closes #4130

Authored by: pukkandan, fstirlitz

											
										
										
											2022-06-21 17:16:54 -05:00
 								        info['automatic_captions'] = automatic_captions
 								        info['subtitles'] = subtitles
-												[youtube] Move metadata extraction after video availability check

											
										
										
											2018-06-02 14:08:38 -05:00
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 05:54:43 -05:00
+								        parsed_url = urllib.parse.urlparse(url)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        for component in [parsed_url.fragment, parsed_url.query]:
-												[compat] Remove deprecated functions from core code

											
										
										
											2022-06-24 05:54:43 -05:00
+								            query = urllib.parse.parse_qs(component)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            for k, v in query.items():
 								                for d_k, s_ks in [('start', ('start', 't')), ('end', ('end',))]:
 								                    d_k += '_time'
 								                    if d_k not in info and k in s_ks:
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								                        info[d_k] = parse_duration(v[0])
-												[youtube] improve Youtube Music Auto-generated description parsing (closes #20742)

											
										
										
											2019-04-27 03:16:17 -05:00
 								        # Youtube Music Auto-generated description
-												[extractor/youtube] Improve description parsing performance (#7315)

* The parsing is skipped when not needed
* The regex is improved by simulating atomic groups with lookaheads

Authored by: pukkandan, berkanteber
											
										
										
											2023-06-22 02:27:54 -05:00
+								        if (video_description or '').strip().endswith('\nAuto-generated by YouTube.'):
 								            # XXX: Causes catastrophic backtracking if description has "·"
 								            # E.g. https://www.youtube.com/watch?v=DoPaAxMQoiI
 								            # Simulating atomic groups:  (?P<a>[^xy]+)x  =>  (?=(?P<a>[^xy]+))(?P=a)x
 								            # reduces it, but does not fully fix it. https://regex101.com/r/8Ssf2h/2
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 10:59:03 -05:00
+								            mobj = re.search(
 								                r'''(?xs)
-												[extractor/youtube] Improve description parsing performance (#7315)

* The parsing is skipped when not needed
* The regex is improved by simulating atomic groups with lookaheads

Authored by: pukkandan, berkanteber
											
										
										
											2023-06-22 02:27:54 -05:00
+								                    (?=(?P<track>[^\n·]+))(?P=track)·
 								                    (?=(?P<artist>[^\n]+))(?P=artist)\n+
 								                    (?=(?P<album>[^\n]+))(?P=album)\n
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 10:59:03 -05:00
+								                    (?:.+?℗\s*(?P<release_year>\d{4})(?!\d))?
-												[ie/youtube] Fix `release_date` extraction (#11759)

Authored by: MutantPiggieGolem1
											
										
										
											2024-12-12 07:46:52 -06:00
+								                    (?:.+?Released\ on\s*:\s*(?P<release_date>\d{4}-\d{2}-\d{2}))?
-												[extractor/youtube] Improve description parsing performance (#7315)

* The parsing is skipped when not needed
* The regex is improved by simulating atomic groups with lookaheads

Authored by: pukkandan, berkanteber
											
										
										
											2023-06-22 02:27:54 -05:00
+								                    (.+?\nArtist\s*:\s*
 								                        (?=(?P<clean_artist>[^\n]+))(?P=clean_artist)\n
 								                    )?.+\nAuto-generated\ by\ YouTube\.\s*$
-												[cleanup] Misc fixes

Cherry-picks from: #3498, #3947
Related: #3949, https://github.com/yt-dlp/yt-dlp/issues/1839#issuecomment-1140313836
Authored by: pukkandan, flashdagger, gamer191

											
										
										
											2022-06-03 10:59:03 -05:00
+								                ''', video_description)
-												[youtube] improve Youtube Music Auto-generated description parsing (closes #20742)

											
										
										
											2019-04-27 03:16:17 -05:00
+								            if mobj:
 								                release_year = mobj.group('release_year')
 								                release_date = mobj.group('release_date')
 								                if release_date:
 								                    release_date = release_date.replace('-', '')
 								                    if not release_year:
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                        release_year = release_date[:4]
 								                info.update({
 								                    'album': mobj.group('album'.strip()),
-												[ie] Migrate commonly plural fields to lists (#8917)

Authored by: llistochek, pukkandan
Related: #3944
											
										
										
											2024-02-20 01:19:24 -06:00
+								                    'artists': ([a] if (a := mobj.group('clean_artist'))
 								                                else [a.strip() for a in mobj.group('artist').split('·')]),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                    'track': mobj.group('track').strip(),
 								                    'release_date': release_date,
-												Update to ytdl-2021.02.10

Except: [archiveorg] Fix and improve extraction (5fc53690cbe6abb11941a3f4846b566a7472753e)

											
										
										
											2021-02-10 15:22:55 -06:00
+								                    'release_year': int_or_none(release_year),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                })
-												[youtube] Move metadata extraction after video availability check

											
										
										
											2018-06-02 14:08:38 -05:00
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        initial_data = None
 								        if webpage:
-												[cleanup] Misc fixes

Closes #4027

											
										
										
											2022-06-10 14:03:54 -05:00
+								            initial_data = self.extract_yt_initial_data(video_id, webpage, fatal=False)
-												[extractor/youtube] Handle incomplete initial data from watch page (#6510)

Authored by: coletdjnz
											
										
										
											2023-03-12 20:43:37 -05:00
+								            if not traverse_obj(initial_data, 'contents'):
 								                self.report_warning('Incomplete data received in embedded initial data; re-fetching using API.')
 								                initial_data = None
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        if not initial_data:
-												[youtube] Cleanup authentication code (#786)

Authored by: coletdjnz
											
										
										
											2021-09-23 19:52:17 -05:00
+								            query = {'videoId': video_id}
 								            query.update(self._get_checkok_params())
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								            initial_data = self._extract_response(
 								                item_id=video_id, ep='next', fatal=False,
-												[extractor/youtube] Handle incomplete initial data from watch page (#6510)

Authored by: coletdjnz
											
										
										
											2023-03-12 20:43:37 -05:00
+								                ytcfg=master_ytcfg, query=query, check_get_keys='contents',
-												[youtube] Cleanup authentication code (#786)

Authored by: coletdjnz
											
										
										
											2021-09-23 19:52:17 -05:00
+								                headers=self.generate_api_headers(ytcfg=master_ytcfg),
-												[youtube] Use new API for additional video extraction requests (#328)

Co-authored-by: colethedj, pukkandan
Closes https://github.com/yt-dlp/yt-dlp/issues/427
Workarounds for https://github.com/ytdl-org/youtube-dl/issues/29326, https://github.com/yt-dlp/yt-dlp/issues/319, https://github.com/ytdl-org/youtube-dl/issues/29086
											
										
										
											2021-06-29 17:07:49 -05:00
+								                note='Downloading initial data API JSON')
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
-												[ie/youtube] Fix `comment_count` extraction (#11274)

Authored by: bashonly
											
										
										
											2024-10-19 16:40:20 -05:00
+								        COMMENTS_SECTION_IDS = ('comment-item-section', 'engagement-panel-comments-section')
-												[youtube] Extract `comment_count` from webpage

Closes #4091

											
										
										
											2022-06-17 01:30:55 -05:00
+								        info['comment_count'] = traverse_obj(initial_data, (
 								            'contents', 'twoColumnWatchNextResults', 'results', 'results', 'contents', ..., 'itemSectionRenderer',
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            'contents', ..., 'commentsEntryPointHeaderRenderer', 'commentCount',
-												[youtube] Extract `comment_count` from webpage

Closes #4091

											
										
										
											2022-06-17 01:30:55 -05:00
+								        ), (
-												[ie/youtube] Fix `comment_count` extraction (#11274)

Authored by: bashonly
											
										
										
											2024-10-19 16:40:20 -05:00
+								            'engagementPanels', lambda _, v: v['engagementPanelSectionListRenderer']['panelIdentifier'] in COMMENTS_SECTION_IDS,
-												[cleanup] Add more ruff rules (#10149)

Authored by: seproDev

Reviewed-by: bashonly <88596187+bashonly@users.noreply.github.com>
Reviewed-by: Simon Sawicki <contact@grub4k.xyz>
											
										
										
											2024-06-11 18:09:58 -05:00
+								            'engagementPanelSectionListRenderer', 'header', 'engagementPanelTitleHeaderRenderer', 'contextualInfo',
-												[extractor/youtube] Fix parsing `comment_count` (#6523)

Closes #5849
Authored by: nick-cd
											
										
										
											2023-03-14 18:21:14 -05:00
+								        ), expected_type=self._get_count, get_all=False)
-												[youtube] Extract `comment_count` from webpage

Closes #4091

											
										
										
											2022-06-17 01:30:55 -05:00
-												[cleanup] Misc cleanup and refactor (#2173)

											
										
										
											2022-04-17 15:58:28 -05:00
+								        try:  # This will error if there is no livechat
-												[youtube_live_chat] Support ongoing live chat (#422)

Authored by: siikamiika
											
										
										
											2021-06-22 19:12:39 -05:00
+								            initial_data['contents']['twoColumnWatchNextResults']['conversationBar']['liveChatRenderer']['continuations'][0]['reloadContinuationData']['continuation']
-												[cleanup] Misc cleanup and refactor (#2173)

											
										
										
											2022-04-17 15:58:28 -05:00
+								        except (KeyError, IndexError, TypeError):
 								            pass
 								        else:
-												[YouTube] Add auto-translated subtitles
Closes #1245

											
										
										
											2021-10-12 01:33:56 -05:00
+								            info.setdefault('subtitles', {})['live_chat'] = [{
-												[extractor/youtube] Fix live chat for videos with content warning

Fixes #4051
Authored by: coletdjnz

											
										
										
											2022-06-12 00:56:50 -05:00
+								                # url is needed to set cookies
 								                'url': f'https://www.youtube.com/watch?v={video_id}&bpctr=9999999999&has_verified=1',
-												[youtube_live_chat] Support ongoing live chat (#422)

Authored by: siikamiika
											
										
										
											2021-06-22 19:12:39 -05:00
+								                'video_id': video_id,
 								                'ext': 'json',
-												[extractor/youtube] Download `post_live` videos from start (#5091)

* The fragments are generated as a `LazyList`. So only the required formats are expanded during download, but all fragment lists are printed/written in infojson.
* The m3u8 formats which cannot be downloaded from start are not extracted by default, but can be enabled with an extractor-arg. The extractor-arg `include_live_dash` is renamed to `include_incomplete_formats` to account for this new use-case.

Closes #1564
Authored by: Lesmiscore, pukkandan
											
										
										
											2022-10-03 21:48:31 -05:00
+								                'protocol': ('youtube_live_chat' if live_status in ('is_live', 'is_upcoming')
 								                             else 'youtube_live_chat_replay'),
-												[youtube_live_chat] Support ongoing live chat (#422)

Authored by: siikamiika
											
										
										
											2021-06-22 19:12:39 -05:00
+								            }]
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
 								        if initial_data:
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								            info['chapters'] = (
 								                self._extract_chapters_from_json(initial_data, duration)
 								                or self._extract_chapters_from_engagement_panel(initial_data, duration)
-												[extractor/youtube] Bring back `_extract_chapters_from_description`

Closes #3886

											
										
										
											2022-05-28 14:30:41 -05:00
+								                or self._extract_chapters_from_description(video_description, duration)
-												[youtube] Sanity check `chapters` (and refactor related code)
Closes #520

											
										
										
											2021-07-19 19:02:41 -05:00
+								                or None)
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
-												[ie/youtube] Fix `heatmap` extraction (#8299)

Closes #8189
Authored by: bashonly
											
										
										
											2023-10-06 20:00:15 -05:00
+								            info['heatmap'] = self._extract_heatmap(initial_data)
-												[extractor/youtube] Extract `heatmap` data (#7100)

Closes #3888
Authored by: tntmod54321
											
										
										
											2023-05-26 07:24:39 -05:00
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								        contents = traverse_obj(
 								            initial_data, ('contents', 'twoColumnWatchNextResults', 'results', 'results', 'contents'),
 								            expected_type=list, default=[])
 								        vpir = get_first(contents, 'videoPrimaryInfoRenderer')
 								        if vpir:
 								            stl = vpir.get('superTitleLink')
 								            if stl:
 								                stl = self._get_text(stl)
 								                if try_get(
 								                        vpir,
 								                        lambda x: x['superTitleIcon']['iconType']) == 'LOCATION_PIN':
 								                    info['location'] = stl
 								                else:
-												[youtube] Fix episode metadata extraction

											
										
										
											2022-04-14 23:22:03 -05:00
+								                    mobj = re.search(r'(.+?)\s*S(\d+)\s*•?\s*E(\d+)', stl)
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								                    if mobj:
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                        info.update({
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								                            'series': mobj.group(1),
 								                            'season_number': int(mobj.group(2)),
 								                            'episode_number': int(mobj.group(3)),
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								                        })
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								            for tlb in (try_get(
 								                    vpir,
 								                    lambda x: x['videoActions']['menuRenderer']['topLevelButtons'],
 								                    list) or []):
-												[extractor/youtube] Fix video like count extraction

Support new combined button layout
Authored by: coletdjnz

											
										
										
											2022-09-08 19:34:39 -05:00
+								                tbrs = variadic(
 								                    traverse_obj(
-												[utils] `traverse_obj`: Fix more bugs

and cleanup uses of `default=[]`

Continued from b1bde57bef878478e3503ab07190fd207914ade9

											
										
										
											2023-02-09 16:26:26 -06:00
+								                        tlb, ('toggleButtonRenderer', ...),
 								                        ('segmentedLikeDislikeButtonRenderer', ..., 'toggleButtonRenderer')))
-												[extractor/youtube] Fix video like count extraction

Support new combined button layout
Authored by: coletdjnz

											
										
										
											2022-09-08 19:34:39 -05:00
+								                for tbr in tbrs:
 								                    for getter, regex in [(
 								                            lambda x: x['defaultText']['accessibility']['accessibilityData'],
 								                            r'(?P<count>[\d,]+)\s*(?P<type>(?:dis)?like)'), ([
 								                                lambda x: x['accessibility'],
 								                                lambda x: x['accessibilityData']['accessibilityData'],
 								                            ], r'(?P<type>(?:dis)?like) this video along with (?P<count>[\d,]+) other people')]:
 								                        label = (try_get(tbr, getter, dict) or {}).get('label')
 								                        if label:
 								                            mobj = re.match(regex, label)
 								                            if mobj:
 								                                info[mobj.group('type') + '_count'] = str_to_int(mobj.group('count'))
 								                                break
-												[ie/youtube] Fix `like_count` extraction (#8763)

Closes #8759
Authored by: Ganesh910
											
										
										
											2023-12-13 01:04:12 -06:00
 								            info['like_count'] = traverse_obj(vpir, (
 								                'videoActions', 'menuRenderer', 'topLevelButtons', ...,
 								                'segmentedLikeDislikeButtonViewModel', 'likeButtonViewModel', 'likeButtonViewModel',
 								                'toggleButtonViewModel', 'toggleButtonViewModel', 'defaultButtonViewModel',
 								                'buttonViewModel', 'accessibilityText', {parse_count}), get_all=False)
-												[extractor/youtube] Extract concurrent view count for livestreams (#5152)

Adds new field `concurrent_view_count`
Closes https://github.com/yt-dlp/yt-dlp/issues/4843

Authored by: coletdjnz
											
										
										
											2022-10-07 02:00:40 -05:00
+								            vcr = traverse_obj(vpir, ('viewCount', 'videoViewCountRenderer'))
 								            if vcr:
 								                vc = self._get_count(vcr, 'viewCount')
 								                # Upcoming premieres with waiting count are treated as live here
 								                if vcr.get('isLive'):
 								                    info['concurrent_view_count'] = vc
 								                elif info.get('view_count') is None:
 								                    info['view_count'] = vc
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								        vsir = get_first(contents, 'videoSecondaryInfoRenderer')
 								        if vsir:
 								            vor = traverse_obj(vsir, ('owner', 'videoOwnerRenderer'))
 								            info.update({
 								                'channel': self._get_text(vor, 'title'),
 								                'channel_follower_count': self._get_count(vor, 'subscriberCountText')})
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								            if not channel_handle:
 								                channel_handle = self.handle_from_url(
 								                    traverse_obj(vor, (
 								                        ('navigationEndpoint', ('title', 'runs', ..., 'navigationEndpoint')),
 								                        (('commandMetadata', 'webCommandMetadata', 'url'), ('browseEndpoint', 'canonicalBaseUrl')),
 								                        {str}), get_all=False))
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								            rows = try_get(
 								                vsir,
 								                lambda x: x['metadataRowContainer']['metadataRowContainerRenderer']['rows'],
 								                list) or []
 								            multiple_songs = False
 								            for row in rows:
 								                if try_get(row, lambda x: x['metadataRowRenderer']['hasDividerLine']) is True:
 								                    multiple_songs = True
 								                    break
 								            for row in rows:
 								                mrr = row.get('metadataRowRenderer') or {}
 								                mrr_title = mrr.get('title')
 								                if not mrr_title:
 								                    continue
 								                mrr_title = self._get_text(mrr, 'title')
 								                mrr_contents_text = self._get_text(mrr, ('contents', 0))
 								                if mrr_title == 'License':
 								                    info['license'] = mrr_contents_text
 								                elif not multiple_songs:
 								                    if mrr_title == 'Album':
 								                        info['album'] = mrr_contents_text
 								                    elif mrr_title == 'Artist':
-												[ie] Migrate commonly plural fields to lists (#8917)

Authored by: llistochek, pukkandan
Related: #3944
											
										
										
											2024-02-20 01:19:24 -06:00
+								                        info['artists'] = [mrr_contents_text] if mrr_contents_text else None
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								                    elif mrr_title == 'Song':
 								                        info['track'] = mrr_contents_text
-												[extractor/youtube] Extract `channel_is_verified` (#7213)

Authored by: coletdjnz

											
										
										
											2023-06-08 02:50:05 -05:00
+								            owner_badges = self._extract_badges(traverse_obj(vsir, ('owner', 'videoOwnerRenderer', 'badges')))
 								            if self._has_badge(owner_badges, BadgeType.VERIFIED):
 								                info['channel_is_verified'] = True
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
-												[extractor/youtube] Define strict uploader metadata mapping (#6384)

New mapping:
```
channel -> channel name
channel_id -> UCID
channel_url -> UCID channel url

uploader -> channel name (same as channel field)
uploader_id -> @handle
uploader_url -> @handle channel url 
```

Authored by: coletdjnz
											
										
										
											2023-04-14 02:58:36 -05:00
+								        info.update({
 								            'uploader': info.get('channel'),
 								            'uploader_id': channel_handle,
 								            'uploader_url': format_field(channel_handle, None, 'https://www.youtube.com/%s', default=None),
 								        })
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
 								        # We only want timestamp IF it has time precision AND a timezone
 								        # Currently the uploadDate in microformats appears to be in US/Pacific timezone.
 								        timestamp = (
 								            parse_iso8601(get_first(microformats, 'uploadDate'), timezone=NO_DEFAULT)
 								            or parse_iso8601(search_meta('uploadDate'), timezone=NO_DEFAULT)
 								        )
 								        upload_date = (
 								            dt.datetime.fromtimestamp(timestamp, dt.timezone.utc).strftime('%Y%m%d') if timestamp else
 								            (
 								                unified_strdate(get_first(microformats, 'uploadDate'))
 								                or unified_strdate(search_meta('uploadDate'))
 								            ))
 								        # In the case we cannot get the timestamp:
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								        # The upload date for scheduled, live and past live streams / premieres in microformats
 								        # may be different from the stream date. Although not in UTC, we will prefer it in this case.
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
+								        # See: https://github.com/yt-dlp/yt-dlp/pull/2223#issuecomment-1008485139
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								        if not upload_date or (not timestamp and live_status in ('not_live', None)):
 								            # this should be in UTC, as configured in the cookie/client context
-												[extractor/youtube] Support changing extraction language (#4470)

Adds the `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) in that language, if available, for all YouTube extractors. See the README or the error message for the list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
+								            upload_date = strftime_or_none(
-												[cleanup] Misc

Closes #6288, Closes #7197, Closes #7265, Closes #7353, Closes #5773
Authored by: mikf, freezboltz, pukkandan

											
										
										
											2023-06-20 22:51:20 -05:00
+								                self._parse_time_text(self._get_text(vpir, 'dateText'))) or upload_date
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
-												[youtube] Improve video upload date handling (#3029)

* Don't prefer UTC upload date for past live streams/premieres
* Improve regex (fixes a regression)

Authored-by: coletdjnz
											
										
										
											2022-03-13 17:02:44 -05:00
+								        info['upload_date'] = upload_date
-												[ie/youtube] Extract upload timestamp if available (#9856)

Closes #4962, Closes #9829
Authored by: coletdjnz
											
										
										
											2024-05-26 16:13:12 -05:00
+								        info['timestamp'] = timestamp
-												[youtube] Prefer UTC upload date for videos (#2223)

Except for live/scheduled streams/premieres. 
Closes #1881
Related: #2402 
Authored-by: coletdjnz
											
										
										
											2022-03-08 01:28:00 -06:00
-												[ie/youtube] Check newly uploaded iOS HLS formats (#8336)

Closes #7747
Authored by: bashonly
											
										
										
											2023-10-28 03:02:13 -05:00
+								        if upload_date and live_status not in ('is_live', 'post_live', 'is_upcoming'):
 								            # Newly uploaded videos' HLS formats are potentially problematic and need to be checked
-												[cleanup] Standardize `import datetime as dt` (#8978)

											
										
										
											2024-02-24 18:16:34 -06:00
+								            upload_datetime = datetime_from_str(upload_date).replace(tzinfo=dt.timezone.utc)
-												[ie/youtube] Improve detection of faulty HLS formats (#8646)

Closes #7747
Authored by: bashonly
											
										
										
											2023-11-25 20:21:29 -06:00
+								            if upload_datetime >= datetime_from_str('today-2days'):
-												[ie/youtube] Check newly uploaded iOS HLS formats (#8336)

Closes #7747
Authored by: bashonly
											
										
										
											2023-10-28 03:02:13 -05:00
+								                for fmt in info['formats']:
 								                    if fmt.get('protocol') == 'm3u8_native':
 								                        fmt['__needs_testing'] = True
-												[ie] Migrate commonly plural fields to lists (#8917)

Authored by: llistochek, pukkandan
Related: #3944
											
										
										
											2024-02-20 01:19:24 -06:00
+								        for s_k, d_k in [('artists', 'creators'), ('track', 'alt_title')]:
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								            v = info.get(s_k)
 								            if v:
 								                info[d_k] = v
-												[youtube] Added 'subscriber_count' to extraction

											
										
										
											2020-09-15 10:16:58 -05:00
-												[extractor/youtube] Misc cleanup

Authored by: coletdjnz

											
										
										
											2023-06-08 08:28:49 -05:00
+								        badges = self._extract_badges(traverse_obj(vpir, 'badges'))
-												[extractor/youtube] Support changing extraction language (#4470)

Adds the `--extractor-args youtube:lang=<supported lang code>` extractor arg to prefer translated fields (e.g. title and description) in that language, if available, for all YouTube extractors. See the README or the error message for the list of supported language codes.

Closes https://github.com/yt-dlp/yt-dlp/issues/387

Authored by: coletdjnz
											
										
										
											2022-09-09 00:16:46 -05:00
 								        is_private = (self._has_badge(badges, BadgeType.AVAILABILITY_PRIVATE)
 								                      or get_first(video_details, 'isPrivate', expected_type=bool))
 								        info['availability'] = (
 								            'public' if self._has_badge(badges, BadgeType.AVAILABILITY_PUBLIC)
 								            else self._availability(
 								                is_private=is_private,
 								                needs_premium=(
 								                    self._has_badge(badges, BadgeType.AVAILABILITY_PREMIUM)
 								                    or False if initial_data and is_private is not None else None),
 								                needs_subscription=(
 								                    self._has_badge(badges, BadgeType.AVAILABILITY_SUBSCRIPTION)
 								                    or False if initial_data and is_private is not None else None),
 								                needs_auth=info['age_limit'] >= 18,
 								                is_unlisted=None if is_private is None else (
 								                    self._has_badge(badges, BadgeType.AVAILABILITY_UNLISTED)
 								                    or get_first(microformats, 'isUnlisted', expected_type=bool))))
-												[youtube] Show if video is `private`, `unlisted` etc in new field `availability` (#188)
Closes: #185, https://github.com/ytdl-org/youtube-dl/issues/25631

Authored by: colethedj, pukkandan

											
										
										
											2021-03-21 16:23:34 -05:00
-												[extractor] Generalize `getcomments` implementation

											
										
										
											2021-10-12 04:50:50 -05:00
+								        info['__post_extractor'] = self.extract_comments(master_ytcfg, video_id, contents, webpage)
-												[YoutubeIE] Externalize format selection

											
										
										
											2013-12-17 20:30:55 -06:00
-												[youtube] Extract data from multiple clients (#536)

* `player_client` accepts multiple clients
* default `player_client` = `android,web`
* music clients can be specifically requested
* Add IOS `player_client`
* Hide live dash since they can't be downloaded

Closes #501

Authored-by: pukkandan, colethedj
											
										
										
											2021-07-20 22:52:34 -05:00
+								        self.mark_watched(video_id, player_responses)
-												Add --mark-watched feature (Closes #5054)

											
										
										
											2016-02-29 13:01:33 -06:00
-												[youtube] Update to ytdl-2021.02.04.1

											
										
										
											2021-02-04 08:37:17 -06:00
+								        return info