bpo-39337: encodings.normalize_encoding() now ignores non-ASCII characters (GH-22219)

author: Hai Shi <shihai1992@gmail.com> 2020-10-14 23:43:31 +0800
committer: GitHub <noreply@github.com> 2020-10-14 17:43:31 +0200
commit: c5b049b91ca50c615f9a5425055c2b79a82ac547 (patch)
tree: 7fac1361bbd7bb7ca533f034d800e593b32266b4 /Lib/test/test_codecs.py
parent: b4d895336a4692c95b4533adcc5c63a489e5e4e4 (diff)
download: cpython-c5b049b91ca50c615f9a5425055c2b79a82ac547.tar.gz cpython-c5b049b91ca50c615f9a5425055c2b79a82ac547.zip
1 files changed, 13 insertions, 1 deletions
diff --git a/Lib/test/test_codecs.py b/Lib/test/test_codecs.py
index ddf4e08af62..09ceef76eb0 100644
--- a/Lib/test/test_codecs.py
+++ b/Lib/test/test_codecs.py
@@ -3417,7 +3417,7 @@ class Rot13UtilTest(unittest.TestCase):
 
 class CodecNameNormalizationTest(unittest.TestCase):
     """Test codec name normalization"""
-    def test_normalized_encoding(self):
+    def test_codecs_lookup(self):
         FOUND = (1, 2, 3, 4)
         NOT_FOUND = (None, None, None, None)
         def search_function(encoding):
@@ -3439,6 +3439,18 @@ class CodecNameNormalizationTest(unittest.TestCase):
         self.assertEqual(NOT_FOUND, codecs.lookup('BBB.8'))
         self.assertEqual(NOT_FOUND, codecs.lookup('a\xe9\u20ac-8'))
 
+    def test_encodings_normalize_encoding(self):
+        # encodings.normalize_encoding() ignores non-ASCII characters.
+        normalize = encodings.normalize_encoding
+        self.assertEqual(normalize('utf_8'), 'utf_8')
+        self.assertEqual(normalize('utf\xE9\u20AC\U0010ffff-8'), 'utf_8')
+        self.assertEqual(normalize('utf   8'), 'utf_8')
+        # encodings.normalize_encoding() doesn't convert
+        # characters to lower case.
+        self.assertEqual(normalize('UTF 8'), 'UTF_8')
+        self.assertEqual(normalize('utf.8'), 'utf.8')
+        self.assertEqual(normalize('utf...8'), 'utf...8')
+
 
 if __name__ == "__main__":
     unittest.main()
author	Hai Shi <shihai1992@gmail.com>	2020-10-14 23:43:31 +0800
committer	GitHub <noreply@github.com>	2020-10-14 17:43:31 +0200
commit	c5b049b91ca50c615f9a5425055c2b79a82ac547 (patch)
tree	7fac1361bbd7bb7ca533f034d800e593b32266b4 /Lib/test/test_codecs.py
parent	b4d895336a4692c95b4533adcc5c63a489e5e4e4 (diff)
download	cpython-c5b049b91ca50c615f9a5425055c2b79a82ac547.tar.gz cpython-c5b049b91ca50c615f9a5425055c2b79a82ac547.zip