40 changes: 40 additions & 0 deletions REVIEW.md
@@ -0,0 +1,40 @@
# Review of PR #495

**Verdict: LGTM**

## Summary
The PR adds a `max_length` parameter to the `decompress` methods of the `_GzipDecoder` and `_BrotliDecoder` wrappers, enabling streaming decompression. This aligns with the `urllib3` interface and is implemented correctly, with backward compatibility for older dependency versions.
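
The streaming flow this enables can be sketched with the stdlib `zlib` decoder (illustrative only, not part of the PR; note that `zlib` uses `max_length=0` for "no limit", whereas `urllib3` uses `-1`):

```python
import zlib

def stream_decompress(compressed, chunk_size=4):
    """Decode a zlib stream in bounded chunks, re-feeding unconsumed input.

    Mirrors the streaming pattern the PR enables; the names here are
    illustrative, not part of the PR.
    """
    decoder = zlib.decompressobj()
    out = []
    data = compressed
    while True:
        # Limit each call's output; leftover input lands in unconsumed_tail.
        chunk = decoder.decompress(data, chunk_size)
        if chunk:
            out.append(chunk)
        data = decoder.unconsumed_tail
        if not data and not chunk:
            break
    out.append(decoder.flush())
    return b"".join(out)
```

The caller bounds memory per call with `max_length` and loops on the unconsumed tail until both input and output are exhausted.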

## Detailed Findings

1. **Conflict & Relevance Check**:
- The PR applies cleanly and does not conflict with the `main` branch.
- The changes are logically relevant to enabling streaming decompression support, consistent across synchronous and asynchronous modules.

2. **Functional Correctness**:
- The implementation correctly adds the `max_length` parameter to the `decompress` method in `_GzipDecoder` and `_BrotliDecoder` wrappers.
- The implementation robustly handles older `urllib3` versions (or custom environments) via a `try-except TypeError` fallback mechanism. This ensures backward compatibility.
- The default value `max_length=-1` aligns with `urllib3`'s convention for "unlimited" (verified against `urllib3==2.6.3`).
   - The `_BrotliDecoder` wrapper correctly exposes a `has_unconsumed_tail` property, delegating to the underlying decoder and handling `AttributeError` gracefully.
- The `_GzipDecoder` correctly inherits `has_unconsumed_tail` from `urllib3.response.GzipDecoder` (if available).

3. **Google Python Standards**:
- **Type Hinting (PEP 484)**: The new code relies on docstrings for type information (`Args: ... max_length (int): ...`). This is consistent with the existing codebase style in `download.py`, though modern Google style encourages inline type hints. I consider this acceptable given the file's current state.
- **Docstring Quality**: The docstrings follow the Google Python Style Guide, clearly documenting the new parameter and its behavior.
- **Logging vs Print**: No new logging or print statements were introduced.
- **Formatting**: The code appears to be formatted correctly (likely `black` compliant).

4. **Technical Merit & Architecture**:
- The solution is idiomatic for a wrapper library. It extends functionality while delegating the heavy lifting to `urllib3`.
- The use of inheritance for `_GzipDecoder` and composition for `_BrotliDecoder` mirrors the existing architecture and is appropriate.
- The fallback mechanism is a pragmatic way to support diverse dependency versions without complex version checking logic.
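
As a point of comparison, instead of version parsing, a capability check could also inspect the callable's signature (illustrative sketch, not in the PR; names are hypothetical):

```python
import inspect

def accepts_max_length(func):
    """Alternative capability check: inspect the signature up front
    rather than catching TypeError at call time."""
    try:
        return "max_length" in inspect.signature(func).parameters
    except (TypeError, ValueError):
        # Some C-implemented callables have no introspectable signature.
        return False

def new_style(data, max_length=-1):
    return data

def old_style(data):
    return data
```

The `try`/`except TypeError` approach in the PR is simpler and also works for C-implemented callables whose signatures `inspect` cannot introspect.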

5. **Testing**:
- The PR includes unit tests in `tests/unit/requests/test_download.py` and `tests_async/unit/requests/test_download.py`.
- The tests cover both the success path (passing `max_length`) and the fallback path (simulating `TypeError`).
   - I ran the relevant tests locally; all 119 passed.
- The tests verify that arguments are forwarded correctly.

6. **Critical Issues**: None found.

7. **Suggested Refactors**: None required. The implementation is clean and minimal.
11 changes: 9 additions & 2 deletions google/_async_resumable_media/requests/download.py
@@ -452,14 +452,21 @@ def __init__(self, checksum):
super(_GzipDecoder, self).__init__()
self._checksum = checksum

def decompress(self, data):
def decompress(self, data, max_length=-1):
"""Decompress the bytes.

Args:
data (bytes): The compressed bytes to be decompressed.
max_length (int): Maximum number of bytes to return. -1 for no
limit. Forwarded to the underlying decoder when supported.

Returns:
bytes: The decompressed bytes from ``data``.
"""
self._checksum.update(data)
return super(_GzipDecoder, self).decompress(data)
try:
return super(_GzipDecoder, self).decompress(
data, max_length=max_length
)
except TypeError:
return super(_GzipDecoder, self).decompress(data)
25 changes: 21 additions & 4 deletions google/resumable_media/requests/download.py
@@ -667,17 +667,22 @@ def __init__(self, checksum):
super().__init__()
self._checksum = checksum

def decompress(self, data):
def decompress(self, data, max_length=-1):
"""Decompress the bytes.

Args:
data (bytes): The compressed bytes to be decompressed.
max_length (int): Maximum number of bytes to return. -1 for no
limit. Forwarded to the underlying decoder when supported.

Returns:
bytes: The decompressed bytes from ``data``.
"""
self._checksum.update(data)
return super().decompress(data)
try:
return super().decompress(data, max_length=max_length)
except TypeError:
return super().decompress(data)


# urllib3.response.BrotliDecoder might not exist depending on whether brotli is
@@ -703,17 +708,29 @@ def __init__(self, checksum):
self._decoder = urllib3.response.BrotliDecoder()
self._checksum = checksum

def decompress(self, data):
def decompress(self, data, max_length=-1):
"""Decompress the bytes.

Args:
data (bytes): The compressed bytes to be decompressed.
max_length (int): Maximum number of bytes to return. -1 for no
limit. Forwarded to the underlying decoder when supported.

Returns:
bytes: The decompressed bytes from ``data``.
"""
self._checksum.update(data)
return self._decoder.decompress(data)
try:
return self._decoder.decompress(data, max_length=max_length)
except TypeError:
return self._decoder.decompress(data)

@property
def has_unconsumed_tail(self):
"""Whether the underlying decoder still holds undecoded input."""
try:
return self._decoder.has_unconsumed_tail
except AttributeError:
return False

def flush(self):
return self._decoder.flush()
73 changes: 73 additions & 0 deletions tests/unit/requests/test_download.py
@@ -1274,6 +1274,39 @@ def test_decompress(self):
assert result == b""
md5_hash.update.assert_called_once_with(data)

def test_decompress_with_max_length(self):
md5_hash = mock.Mock(spec=["update"])
decoder = download_mod._GzipDecoder(md5_hash)

with mock.patch.object(
type(decoder).__bases__[0], "decompress"
) as mock_super_decompress:
mock_super_decompress.return_value = b"decompressed"
data = b"\x1f\x8b\x08\x08"
result = decoder.decompress(data, max_length=10)

assert result == b"decompressed"
md5_hash.update.assert_called_once_with(data)
mock_super_decompress.assert_called_once_with(
data, max_length=10
)

def test_decompress_with_max_length_fallback(self):
md5_hash = mock.Mock(spec=["update"])
decoder = download_mod._GzipDecoder(md5_hash)

with mock.patch.object(
type(decoder).__bases__[0],
"decompress",
side_effect=[TypeError, b"decompressed"],
) as mock_super_decompress:
data = b"\x1f\x8b\x08\x08"
result = decoder.decompress(data, max_length=10)

assert result == b"decompressed"
md5_hash.update.assert_called_once_with(data)
assert mock_super_decompress.call_count == 2


class Test_BrotliDecoder(object):
def test_constructor(self):
@@ -1290,6 +1323,46 @@ def test_decompress(self):
assert result == b""
md5_hash.update.assert_called_once_with(data)

def test_decompress_with_max_length(self):
md5_hash = mock.Mock(spec=["update"])
decoder = download_mod._BrotliDecoder(md5_hash)

decoder._decoder = mock.Mock(spec=["decompress"])
decoder._decoder.decompress.return_value = b"decompressed"

data = b"compressed"
result = decoder.decompress(data, max_length=10)

assert result == b"decompressed"
md5_hash.update.assert_called_once_with(data)
decoder._decoder.decompress.assert_called_once_with(
data, max_length=10
)

def test_decompress_with_max_length_fallback(self):
md5_hash = mock.Mock(spec=["update"])
decoder = download_mod._BrotliDecoder(md5_hash)

decoder._decoder = mock.Mock(spec=["decompress"])
decoder._decoder.decompress.side_effect = [TypeError, b"decompressed"]

data = b"compressed"
result = decoder.decompress(data, max_length=10)

assert result == b"decompressed"
md5_hash.update.assert_called_once_with(data)
assert decoder._decoder.decompress.call_count == 2

def test_has_unconsumed_tail(self):
decoder = download_mod._BrotliDecoder(mock.sentinel.md5_hash)
decoder._decoder = mock.Mock(spec=["has_unconsumed_tail"])
decoder._decoder.has_unconsumed_tail = True
assert decoder.has_unconsumed_tail is True

def test_has_unconsumed_tail_fallback(self):
decoder = download_mod._BrotliDecoder(mock.sentinel.md5_hash)
decoder._decoder = mock.Mock(spec=[])
assert decoder.has_unconsumed_tail is False

def _mock_response(status_code=http.client.OK, chunks=(), headers=None):
if headers is None:
17 changes: 17 additions & 0 deletions tests_async/unit/requests/test_download.py
@@ -761,6 +761,23 @@ def test_decompress(self):
assert result == b""
md5_hash.update.assert_called_once_with(data)

def test_decompress_with_max_length(self):
md5_hash = mock.Mock(spec=["update"])
decoder = download_mod._GzipDecoder(md5_hash)

with mock.patch.object(
type(decoder).__bases__[0], "decompress"
) as mock_super_decompress:
mock_super_decompress.return_value = b"decompressed"
data = b"\x1f\x8b\x08\x08"
result = decoder.decompress(data, max_length=10)

assert result == b"decompressed"
md5_hash.update.assert_called_once_with(data)
mock_super_decompress.assert_called_once_with(
data, max_length=10
)


class AsyncIter:
def __init__(self, items):