[Python-checkins] bpo-42065: Fix incorrectly formatted _codecs.charmap_decode error message (GH-19940)

Max Bernstein webhook-mailer at python.org
Sat Oct 17 16:38:30 EDT 2020


https://github.com/python/cpython/commit/3635388f52b42e5280229104747962117104c453
commit: 3635388f52b42e5280229104747962117104c453
branch: master
author: Max Bernstein <tekknolagi at users.noreply.github.com>
committer: GitHub <noreply at github.com>
date: 2020-10-17T23:38:21+03:00
summary:

bpo-42065: Fix incorrectly formatted _codecs.charmap_decode error message (GH-19940)

files:
A Misc/NEWS.d/next/Library/2020-10-17-23-17-18.bpo-42065.85BsRA.rst
M Lib/test/test_codecs.py
M Objects/unicodeobject.c

diff --git a/Lib/test/test_codecs.py b/Lib/test/test_codecs.py
index 9be8281ce5af5..328a47b2e3766 100644
--- a/Lib/test/test_codecs.py
+++ b/Lib/test/test_codecs.py
@@ -2197,6 +2197,18 @@ def test_decode_with_int2str_map(self):
             ("", len(allbytes))
         )
 
+        self.assertRaisesRegex(TypeError,
+            "character mapping must be in range\\(0x110000\\)",
+            codecs.charmap_decode,
+            b"\x00\x01\x02", "strict", {0: "A", 1: 'Bb', 2: -2}
+        )
+
+        self.assertRaisesRegex(TypeError,
+            "character mapping must be in range\\(0x110000\\)",
+            codecs.charmap_decode,
+            b"\x00\x01\x02", "strict", {0: "A", 1: 'Bb', 2: 999999999}
+        )
+
     def test_decode_with_int2int_map(self):
         a = ord('a')
         b = ord('b')
diff --git a/Misc/NEWS.d/next/Library/2020-10-17-23-17-18.bpo-42065.85BsRA.rst b/Misc/NEWS.d/next/Library/2020-10-17-23-17-18.bpo-42065.85BsRA.rst
new file mode 100644
index 0000000000000..83c86c0799ebf
--- /dev/null
+++ b/Misc/NEWS.d/next/Library/2020-10-17-23-17-18.bpo-42065.85BsRA.rst
@@ -0,0 +1,3 @@
+Fix an incorrectly formatted error from :meth:`_codecs.charmap_decode` when
+called with a mapped value outside the range of valid Unicode code points.
+PR by Max Bernstein.
diff --git a/Objects/unicodeobject.c b/Objects/unicodeobject.c
index 01e5c728b383f..c4e73ebd45d20 100644
--- a/Objects/unicodeobject.c
+++ b/Objects/unicodeobject.c
@@ -8304,7 +8304,7 @@ charmap_decode_mapping(const char *s,
                 goto Undefined;
             if (value < 0 || value > MAX_UNICODE) {
                 PyErr_Format(PyExc_TypeError,
-                             "character mapping must be in range(0x%lx)",
+                             "character mapping must be in range(0x%x)",
                              (unsigned long)MAX_UNICODE + 1);
                 goto onError;
             }



More information about the Python-checkins mailing list