[rh/urllib] Simplify gzip decoding (#7611)

Authored by: Grub4K
2024-12-22 18:17:17 -05:00 · 2023-08-27 00:13:30 +02:00 · 2023-08-27 00:13:30 +02:00 · 59e92b1f18
commit 59e92b1f18
parent 1be0a96a4d
1 changed files with 3 additions and 15 deletions
--- a/yt_dlp/networking/_urllib.py
+++ b/yt_dlp/networking/_urllib.py
@@ -1,7 +1,6 @@
 from __future__ import annotations
 import functools
-import gzip
 import http.client
 import io
 import socket
@@ -155,20 +154,9 @@ class HTTPHandler(urllib.request.AbstractHTTPHandler):
     @staticmethod
     def gz(data):
-        gz = gzip.GzipFile(fileobj=io.BytesIO(data), mode='rb')
-        try:
-            return gz.read()
-        except OSError as original_oserror:
-            # There may be junk add the end of the file
-            # See http://stackoverflow.com/q/4928560/35070 for details
-            for i in range(1, 1024):
-                try:
-                    gz = gzip.GzipFile(fileobj=io.BytesIO(data[:-i]), mode='rb')
-                    return gz.read()
-                except OSError:
-                    continue
-            else:
-                raise original_oserror
+        # There may be junk added the end of the file
+        # We ignore it by only ever decoding a single gzip payload
+        return zlib.decompress(data, wbits=zlib.MAX_WBITS | 16)
     def http_request(self, req):
         # According to RFC 3986, URLs can not contain non-ASCII characters, however this is not