From: Savannah Ostrowski Date: Fri, 9 Jan 2026 00:32:05 +0000 (-0800) Subject: GH-43374: Fix urlretrieve reporthook to report actual bytes read (#142653) X-Git-Url: http://git.ipfire.org/cgi-bin/gitweb.cgi?a=commitdiff_plain;h=68a01f901f446f71aac88431e01bb18b9fa35bd0;p=thirdparty%2FPython%2Fcpython.git GH-43374: Fix urlretrieve reporthook to report actual bytes read (#142653) --- diff --git a/Lib/test/test_urllib.py b/Lib/test/test_urllib.py index ae524c5ffba6..a468b1157528 100644 --- a/Lib/test/test_urllib.py +++ b/Lib/test/test_urllib.py @@ -727,7 +727,7 @@ class urlretrieve_FileTests(unittest.TestCase): self.assertEqual(report[0][2], 8193) self.assertEqual(report[0][1], 8192) self.assertEqual(report[1][1], 8192) - self.assertEqual(report[2][1], 8192) + self.assertEqual(report[2][1], 1) # last block only reads 1 byte class urlretrieve_HttpTests(unittest.TestCase, FakeHTTPMixin): diff --git a/Lib/test/test_urllibnet.py b/Lib/test/test_urllibnet.py index 1a42c35dc49b..da094752b84c 100644 --- a/Lib/test/test_urllibnet.py +++ b/Lib/test/test_urllibnet.py @@ -219,12 +219,14 @@ class urlretrieveNetworkTests(unittest.TestCase): self.assertEqual(records[0][2], expected_size) self.assertEqual(records[-1][2], expected_size) - block_sizes = {block_size for _, block_size, _ in records} - self.assertEqual({records[0][1]}, block_sizes, - msg="block sizes in %s must be equal" % records_repr) - self.assertGreaterEqual(records[-1][0]*records[0][1], expected_size, - msg="number of blocks * block size must be" - " >= total size in %s" % records_repr) + self.assertEqual(records[0][1], 8192, + msg="first block size should be 8192 in %s" % records_repr) + for block_num, block_size, total_size in records: + self.assertLessEqual(block_size, 8192, + msg="block size should be <= 8192 in %s" % records_repr) + total_read = sum(block_size for _, block_size, _ in records[1:]) + self.assertEqual(total_read, expected_size, + msg="sum of bytes read must equal total size in %s" % records_repr) if __name__ == "__main__": diff --git a/Lib/urllib/request.py b/Lib/urllib/request.py index f32de189b135..60607c48145c 100644 --- a/Lib/urllib/request.py +++ b/Lib/urllib/request.py @@ -242,7 +242,7 @@ def urlretrieve(url, filename=None, reporthook=None, data=None): tfp.write(block) blocknum += 1 if reporthook: - reporthook(blocknum, bs, size) + reporthook(blocknum, len(block), size) if size >= 0 and read < size: raise ContentTooShortError( diff --git a/Misc/NEWS.d/next/Library/2025-12-12-23-17-10.gh-issue-43374.M6jGC5.rst b/Misc/NEWS.d/next/Library/2025-12-12-23-17-10.gh-issue-43374.M6jGC5.rst new file mode 100644 index 000000000000..0fe3c35ab3fc --- /dev/null +++ b/Misc/NEWS.d/next/Library/2025-12-12-23-17-10.gh-issue-43374.M6jGC5.rst @@ -0,0 +1 @@ +Fix :func:`urllib.request.urlretrieve` to pass the actual number of bytes read to the *reporthook* callback, instead of always passing the block size.