https://github.com/python/cpython/commit/68a01f901f446f71aac88431e01bb18b9fa35bd0
commit: 68a01f901f446f71aac88431e01bb18b9fa35bd0
branch: main
author: Savannah Ostrowski <[email protected]>
committer: savannahostrowski <[email protected]>
date: 2026-01-09T00:32:05Z
summary:

GH-43374: Fix urlretrieve reporthook to report actual bytes read (#142653)

files:
A Misc/NEWS.d/next/Library/2025-12-12-23-17-10.gh-issue-43374.M6jGC5.rst
M Lib/test/test_urllib.py
M Lib/test/test_urllibnet.py
M Lib/urllib/request.py

diff --git a/Lib/test/test_urllib.py b/Lib/test/test_urllib.py
index ae524c5ffba6b1..a468b115752819 100644
--- a/Lib/test/test_urllib.py
+++ b/Lib/test/test_urllib.py
@@ -727,7 +727,7 @@ def hooktester(block_count, block_read_size, file_size, _report=report):
         self.assertEqual(report[0][2], 8193)
         self.assertEqual(report[0][1], 8192)
         self.assertEqual(report[1][1], 8192)
-        self.assertEqual(report[2][1], 8192)
+        self.assertEqual(report[2][1], 1)  # last block only reads 1 byte
 
 
 class urlretrieve_HttpTests(unittest.TestCase, FakeHTTPMixin):
diff --git a/Lib/test/test_urllibnet.py b/Lib/test/test_urllibnet.py
index 1a42c35dc49b9e..da094752b84c62 100644
--- a/Lib/test/test_urllibnet.py
+++ b/Lib/test/test_urllibnet.py
@@ -219,12 +219,14 @@ def recording_reporthook(blocks, block_size, total_size):
         self.assertEqual(records[0][2], expected_size)
         self.assertEqual(records[-1][2], expected_size)
 
-        block_sizes = {block_size for _, block_size, _ in records}
-        self.assertEqual({records[0][1]}, block_sizes,
-                         msg="block sizes in %s must be equal" % records_repr)
-        self.assertGreaterEqual(records[-1][0]*records[0][1], expected_size,
-                                msg="number of blocks * block size must be"
-                                " >= total size in %s" % records_repr)
+        self.assertEqual(records[0][1], 8192,
+                         msg="first block size should be 8192 in %s" % records_repr)
+        for block_num, block_size, total_size in records:
+            self.assertLessEqual(block_size, 8192,
+                                 msg="block size should be <= 8192 in %s" % records_repr)
+        total_read = sum(block_size for _, block_size, _ in records[1:])
+        self.assertEqual(total_read, expected_size,
+                         msg="sum of bytes read must equal total size in %s" % records_repr)
 
 
 if __name__ == "__main__":
diff --git a/Lib/urllib/request.py b/Lib/urllib/request.py
index f32de189b1353a..60607c48145cda 100644
--- a/Lib/urllib/request.py
+++ b/Lib/urllib/request.py
@@ -242,7 +242,7 @@ def urlretrieve(url, filename=None, reporthook=None, data=None):
                 tfp.write(block)
                 blocknum += 1
                 if reporthook:
-                    reporthook(blocknum, bs, size)
+                    reporthook(blocknum, len(block), size)
 
     if size >= 0 and read < size:
         raise ContentTooShortError(
diff --git a/Misc/NEWS.d/next/Library/2025-12-12-23-17-10.gh-issue-43374.M6jGC5.rst b/Misc/NEWS.d/next/Library/2025-12-12-23-17-10.gh-issue-43374.M6jGC5.rst
new file mode 100644
index 00000000000000..0fe3c35ab3fc1d
--- /dev/null
+++ b/Misc/NEWS.d/next/Library/2025-12-12-23-17-10.gh-issue-43374.M6jGC5.rst
@@ -0,0 +1 @@
+Fix :func:`urllib.request.urlretrieve` to pass the actual number of bytes read to the *reporthook* callback, instead of always passing the block size.

_______________________________________________
Python-checkins mailing list -- [email protected]
To unsubscribe send an email to [email protected]
https://mail.python.org/mailman3//lists/python-checkins.python.org
Member address: [email protected]

Reply via email to