2024-11-15 13:43:04 +00:00
11 changed files with 49 additions and 74 deletions
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@ -43,7 +43,7 @@ jobs:
      run: git push origin ${{ github.event.ref }}
    - name: Get Changelog
      run: |
-        changelog=$(grep -oPz '(?s)(?<=### ${{ steps.bump_version.outputs.ytdlp_version }}\n{2}).+?(?=\n{2,3}###)' Changelog.md) || true
+        changelog=$(cat Changelog.md | grep -oPz '(?s)(?<=### ${{ steps.bump_version.outputs.ytdlp_version }}\n{2}).+?(?=\n{2,3}###)') || true
        echo "changelog<<EOF" >> $GITHUB_ENV
        echo "$changelog" >> $GITHUB_ENV
        echo "EOF" >> $GITHUB_ENV
--- a/2
+++ b/2
@ -43,7 +43,7 @@ PYTHON ?= /usr/bin/env python3
 SYSCONFDIR = $(shell if [ $(PREFIX) = /usr -o $(PREFIX) = /usr/local ]; then echo /etc; else echo $(PREFIX)/etc; fi)

 # set markdown input format to "markdown-smart" for pandoc version 2 and to "markdown" for pandoc prior to version 2
-MARKDOWN = $(shell if [ `pandoc -v | head -n1 | cut -d" " -f2 | head -c1` = "2" ]; then echo markdown-smart; else echo markdown; fi)
+MARKDOWN = $(shell if [ "$(pandoc -v | head -n1 | cut -d" " -f2 | head -c1)" = "2" ]; then echo markdown-smart; else echo markdown; fi)

 install: lazy-extractors yt-dlp yt-dlp.1 completions
 	mkdir -p $(DESTDIR)$(BINDIR)
--- a/README.md
+++ b/README.md
@ -337,7 +337,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi
    --list-extractors               List all supported extractors and exit
    --extractor-descriptions        Output descriptions of all supported
                                    extractors and exit
-    --force-generic-extractor       Force extraction to use the generic extractor
+    --force-generic-extractor       Force extraction to use the generic
+                                    extractor
    --default-search PREFIX         Use this prefix for unqualified URLs. Eg:
                                    "gvsearch2:python" downloads two videos from
                                    google videos for the search term "python".
@ -396,7 +397,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi
                                    aliases; so be carefull to avoid defining
                                    recursive options. As a safety measure, each
                                    alias may be triggered a maximum of 100
-                                    times. This option can be used multiple times
+                                    times. This option can be used multiple
+                                    times

 ## Network Options:
    --proxy URL                     Use the specified HTTP/HTTPS/SOCKS proxy. To
@ -423,7 +425,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi
                                    explicitly provided two-letter ISO 3166-2
                                    country code
    --geo-bypass-ip-block IP_BLOCK  Force bypass geographic restriction with
-                                    explicitly provided IP block in CIDR notation
+                                    explicitly provided IP block in CIDR
+                                    notation

 ## Video Selection:
    --playlist-start NUMBER         Playlist video to start at (default is 1)
@ -633,7 +636,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi
                                    modification time (default)
    --no-mtime                      Do not use the Last-modified header to set
                                    the file modification time
-    --write-description             Write video description to a .description file
+    --write-description             Write video description to a .description
+                                    file
    --no-write-description          Do not write video description (default)
    --write-info-json               Write video metadata to a .info.json file
                                    (this may contain personal information)
@ -655,7 +659,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi
                                    extraction is known to be quick (Alias:
                                    --no-get-comments)
    --load-info-json FILE           JSON file containing the video information
-                                    (created with the "--write-info-json" option)
+                                    (created with the "--write-info-json"
+                                    option)
    --cookies FILE                  Netscape formatted file to read cookies from
                                    and dump cookie jar in
    --no-cookies                    Do not read/dump cookies from/to file
@ -671,7 +676,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi
                                    for decrypting Chromium cookies on Linux can
                                    be (optionally) specified after the browser
                                    name separated by a "+". Currently supported
-                                    keyrings are: basictext, gnomekeyring, kwallet
+                                    keyrings are: basictext, gnomekeyring,
+                                    kwallet
    --no-cookies-from-browser       Do not load cookies from browser (default)
    --cache-dir DIR                 Location in the filesystem where youtube-dl
                                    can store some downloaded information (such
@ -683,7 +689,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi

 ## Thumbnail Options:
    --write-thumbnail               Write thumbnail image to disk
-    --no-write-thumbnail            Do not write thumbnail image to disk (default)
+    --no-write-thumbnail            Do not write thumbnail image to disk
+                                    (default)
    --write-all-thumbnails          Write all thumbnail image formats to disk
    --list-thumbnails               List available thumbnails of each video.
                                    Simulate unless --no-simulate is used
@ -969,7 +976,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi
                                    otherwise), force (try fixing even if file
                                    already exists)
    --ffmpeg-location PATH          Location of the ffmpeg binary; either the
-                                    path to the binary or its containing directory
+                                    path to the binary or its containing
+                                    directory
    --exec [WHEN:]CMD               Execute a command, optionally prefixed with
                                    when to execute it (after_move if
                                    unspecified), separated by a ":". Supported
@ -996,7 +1004,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi
                                    be used with "--paths" and "--output" to set
                                    the output filename for the split files. See
                                    "OUTPUT TEMPLATE" for details
-    --no-split-chapters             Do not split video based on chapters (default)
+    --no-split-chapters             Do not split video based on chapters
+                                    (default)
    --remove-chapters REGEX         Remove chapters whose title matches the
                                    given regular expression. The syntax is the
                                    same as --download-sections. This option can
@ -1027,7 +1036,8 @@ You can also fork the project on github and run your fork's [build workflow](.gi
                                    (after downloading and processing all
                                    formats of a video), or "playlist" (at end
                                    of playlist). This option can be used
-                                    multiple times to add different postprocessors
+                                    multiple times to add different
+                                    postprocessors

 ## SponsorBlock Options:
 Make chapter entries for, or remove various segments (sponsor,
--- a/devscripts/make_readme.py
+++ b/devscripts/make_readme.py
@ -11,7 +11,6 @@ README_FILE = 'README.md'
 OPTIONS_START = 'General Options:'
 OPTIONS_END = 'CONFIGURATION'
 EPILOG_START = 'See full documentation'
-ALLOWED_OVERSHOOT = 2

 DISABLE_PATCH = object()

@ -29,7 +28,6 @@ def apply_patch(text, patch):

 options = take_section(sys.stdin.read(), f'\n  {OPTIONS_START}', f'\n{EPILOG_START}', shift=1)

-max_width = max(map(len, options.split('\n')))
 switch_col_width = len(re.search(r'(?m)^\s{5,}', options).group())
 delim = f'\n{" " * switch_col_width}'

@ -46,12 +44,6 @@ PATCHES = (
        rf'(?m)({delim}\S+)+$',
        lambda mobj: ''.join((delim, mobj.group(0).replace(delim, '')))
    ),
-    (  # Allow overshooting last line
-        rf'(?m)^(?P<prev>.+)${delim}(?P<current>.+)$(?!{delim})',
-        lambda mobj: (mobj.group().replace(delim, ' ')
-                      if len(mobj.group()) - len(delim) + 1 <= max_width + ALLOWED_OVERSHOOT
-                      else mobj.group())
-    ),
    (  # Avoid newline when a space is available b/w switch and description
        DISABLE_PATCH,  # This creates issues with prepare_manpage
        r'(?m)^(\s{4}-.{%d})(%s)' % (switch_col_width - 6, delim),
--- a/yt_dlp/YoutubeDL.py
+++ b/yt_dlp/YoutubeDL.py
@ -576,7 +576,7 @@ class YoutubeDL:
        )
        self._allow_colors = Namespace(**{
            type_: not self.params.get('no_color') and supports_terminal_sequences(stream)
-            for type_, stream in self._out_files.items_ if type_ != 'console'
+            for type_, stream in self._out_files if type_ != 'console'
        })

        if sys.version_info < (3, 6):
@ -3671,7 +3671,7 @@ class YoutubeDL:
            sys.getfilesystemencoding(),
            self.get_encoding(),
            ', '.join(
-                f'{key} {get_encoding(stream)}' for key, stream in self._out_files.items_
+                f'{key} {get_encoding(stream)}' for key, stream in self._out_files
                if stream is not None and key != 'console')
        )

--- a/yt_dlp/downloader/common.py
+++ b/yt_dlp/downloader/common.py
@ -302,7 +302,7 @@ class FileDownloader:
    )

    def _report_progress_status(self, s, default_template):
-        for name, style in self.ProgressStyles.items_:
+        for name, style in self.ProgressStyles:
            name = f'_{name}_str'
            if name not in s:
                continue
--- a/yt_dlp/extractor/generic.py
+++ b/yt_dlp/extractor/generic.py
@ -2542,27 +2542,7 @@ class GenericIE(InfoExtractor):
                'timestamp': 1652833414,
                'age_limit': 0,
            }
-        }, {
-            'url': 'https://www.skimag.com/video/ski-people-1980/',
-            'info_dict': {
-                'id': 'ski-people-1980',
-                'title': 'Ski People (1980)',
-            },
-            'playlist_count': 1,
-            'playlist': [{
-                'md5': '022a7e31c70620ebec18deeab376ee03',
-                'info_dict': {
-                    'id': 'YTmgRiNU',
-                    'ext': 'mp4',
-                    'title': '1980 Ski People',
-                    'timestamp': 1610407738,
-                    'description': 'md5:cf9c3d101452c91e141f292b19fe4843',
-                    'thumbnail': 'https://cdn.jwplayer.com/v2/media/YTmgRiNU/poster.jpg?width=720',
-                    'duration': 5688.0,
-                    'upload_date': '20210111',
-                }
-            }]
-        },
+        }
    ]

    def report_following_redirect(self, new_url):
--- a/yt_dlp/extractor/jwplatform.py
+++ b/yt_dlp/extractor/jwplatform.py
@ -37,9 +37,6 @@ class JWPlatformIE(InfoExtractor):
                webpage)
            if ret:
                return ret
-        mobj = re.search(r'<div\b[^>]* data-video-jw-id="([a-zA-Z0-9]{8})"', webpage)
-        if mobj:
-            return [f'jwplatform:{mobj.group(1)}']

    def _real_extract(self, url):
        url, smuggled_data = unsmuggle_url(url, {})
--- a/yt_dlp/extractor/rumble.py
+++ b/yt_dlp/extractor/rumble.py
@ -24,11 +24,6 @@ class RumbleEmbedIE(InfoExtractor):
            'title': 'WMAR 2 News Latest Headlines | October 20, 6pm',
            'timestamp': 1571611968,
            'upload_date': '20191020',
-            'channel_url': 'https://rumble.com/c/WMAR',
-            'channel': 'WMAR',
-            'thumbnail': 'https://sp.rmbl.ws/s8/1/5/M/z/1/5Mz1a.OvCc-small-WMAR-2-News-Latest-Headline.jpg',
-            'duration': 234,
-            'uploader': 'WMAR',
        }
    }, {
        'url': 'https://rumble.com/embed/vslb7v',
@ -43,7 +38,6 @@ class RumbleEmbedIE(InfoExtractor):
            'channel': 'CTNews',
            'thumbnail': 'https://sp.rmbl.ws/s8/6/7/i/9/h/7i9hd.OvCc.jpg',
            'duration': 901,
-            'uploader': 'CTNews',
        }
    }, {
        'url': 'https://rumble.com/embed/ufe9n.v5pv5f',
@ -102,7 +96,6 @@ class RumbleEmbedIE(InfoExtractor):
            'channel': author.get('name'),
            'channel_url': author.get('url'),
            'duration': int_or_none(video.get('duration')),
-            'uploader': author.get('name'),
        }


--- a/yt_dlp/jsinterp.py
+++ b/yt_dlp/jsinterp.py
@ -24,7 +24,6 @@ _ASSIGN_OPERATORS.append(('=', (lambda cur, right: right)))
 _NAME_RE = r'[a-zA-Z_$][a-zA-Z_$0-9]*'

 _MATCHING_PARENS = dict(zip('({[', ')}]'))
-_QUOTES = '\'"'


 class JS_Break(ExtractorError):
@ -70,17 +69,12 @@ class JSInterpreter:
            return
        counters = {k: 0 for k in _MATCHING_PARENS.values()}
        start, splits, pos, delim_len = 0, 0, 0, len(delim) - 1
-        in_quote, escaping = None, False
        for idx, char in enumerate(expr):
            if char in _MATCHING_PARENS:
                counters[_MATCHING_PARENS[char]] += 1
            elif char in counters:
                counters[char] -= 1
-            elif not escaping and char in _QUOTES and in_quote in (char, None):
-                in_quote = None if in_quote else char
-            escaping = not escaping and in_quote and char == '\\'
-
-            if char != delim[pos] or any(counters.values()) or in_quote:
+            if char != delim[pos] or any(counters.values()):
                pos = 0
                continue
            elif pos != delim_len:
--- a/yt_dlp/utils.py
+++ b/yt_dlp/utils.py
@ -34,7 +34,6 @@ import sys
 import tempfile
 import time
 import traceback
-import types
 import urllib.parse
 import xml.etree.ElementTree
 import zlib
@ -398,14 +397,14 @@ def get_element_html_by_attribute(attribute, value, html, **kargs):
 def get_elements_by_class(class_name, html, **kargs):
    """Return the content of all tags with the specified class in the passed HTML document as a list"""
    return get_elements_by_attribute(
-        'class', r'[^\'"]*(?<=[\'"\s])%s(?=[\'"\s])[^\'"]*' % re.escape(class_name),
+        'class', r'[^\'"]*\b%s\b[^\'"]*' % re.escape(class_name),
        html, escape_value=False)


 def get_elements_html_by_class(class_name, html):
    """Return the html of all tags with the specified class in the passed HTML document as a list"""
    return get_elements_html_by_attribute(
-        'class', r'[^\'"]*(?<=[\'"\s])%s(?=[\'"\s])[^\'"]*' % re.escape(class_name),
+        'class', r'[^\'"]*\b%s\b[^\'"]*' % re.escape(class_name),
        html, escape_value=False)


@ -3405,15 +3404,16 @@ def _match_one(filter_part, dct, incomplete):
    else:
        is_incomplete = lambda k: k in incomplete

-    operator_rex = re.compile(r'''(?x)
+    operator_rex = re.compile(r'''(?x)\s*
        (?P<key>[a-z_]+)
        \s*(?P<negation>!\s*)?(?P<op>%s)(?P<none_inclusive>\s*\?)?\s*
        (?:
            (?P<quote>["\'])(?P<quotedstrval>.+?)(?P=quote)|
            (?P<strval>.+?)
        )
+        \s*$
        ''' % '|'.join(map(re.escape, COMPARISON_OPERATORS.keys())))
-    m = operator_rex.fullmatch(filter_part.strip())
+    m = operator_rex.search(filter_part)
    if m:
        m = m.groupdict()
        unnegated_op = COMPARISON_OPERATORS[m['op']]
@ -3449,10 +3449,11 @@ def _match_one(filter_part, dct, incomplete):
        '': lambda v: (v is True) if isinstance(v, bool) else (v is not None),
        '!': lambda v: (v is False) if isinstance(v, bool) else (v is None),
    }
-    operator_rex = re.compile(r'''(?x)
+    operator_rex = re.compile(r'''(?x)\s*
        (?P<op>%s)\s*(?P<key>[a-z_]+)
+        \s*$
        ''' % '|'.join(map(re.escape, UNARY_OPERATORS.keys())))
-    m = operator_rex.fullmatch(filter_part.strip())
+    m = operator_rex.search(filter_part)
    if m:
        op = UNARY_OPERATORS[m.group('op')]
        actual_value = dct.get(m.group('key'))
@ -5394,15 +5395,23 @@ class classproperty:
        return self.func(cls)


-class Namespace(types.SimpleNamespace):
+class Namespace:
    """Immutable namespace"""

-    def __iter__(self):
-        return iter(self.__dict__.values())
+    def __init__(self, **kwargs):
+        self._dict = kwargs

-    @property
-    def items_(self):
-        return self.__dict__.items()
+    def __getattr__(self, attr):
+        return self._dict[attr]
+
+    def __contains__(self, item):
+        return item in self._dict.values()
+
+    def __iter__(self):
+        return iter(self._dict.items())
+
+    def __repr__(self):
+        return f'{type(self).__name__}({", ".join(f"{k}={v}" for k, v in self)})'


 # Deprecated