Issue #25709: Fixed problem with in-place string concatenation and utf-8 cache.

author: Serhiy Storchaka <storchaka@gmail.com> 2015-12-03 01:02:03 +0200
committer: Serhiy Storchaka <storchaka@gmail.com> 2015-12-03 01:02:03 +0200
commit: e800941d66c432d29926f142085e29eca4abf6f3 (patch)
tree: 0cdc7dd7facab556fd87105897fb90792f9e17f9 /Lib/test/test_unicode.py
parent: a8f4405044f2ef834a389f50557e81221c42786c (diff)
download: cpython-git-e800941d66c432d29926f142085e29eca4abf6f3.tar.gz
1 file changed, 17 insertions, 0 deletions
diff --git a/Lib/test/test_unicode.py b/Lib/test/test_unicode.py
index 56a60df007..d7f37c5955 100644
--- a/Lib/test/test_unicode.py
+++ b/Lib/test/test_unicode.py
@@ -2699,6 +2699,23 @@ class UnicodeTest(string_tests.CommonTest,
         self.assertTrue(astral >= bmp2)
         self.assertFalse(astral >= astral2)
 
+    @support.cpython_only
+    def test_pep393_utf8_caching_bug(self):
+        # Issue #25709: Problem with string concatenation and utf-8 cache
+        from _testcapi import getargs_s_hash
+        for k in 0x24, 0xa4, 0x20ac, 0x1f40d:
+            s = ''
+            for i in range(5):
+                # Due to a CPython-specific optimization, the 's' string
+                # can be resized in-place.
+                s += chr(k)
+                # Parsing with the "s#" format code indirectly calls
+                # PyUnicode_AsUTF8AndSize(), which creates the UTF-8
+                # encoded string cached in the Unicode object.
+                self.assertEqual(getargs_s_hash(s), chr(k).encode() * (i + 1))
+                # Check that the second call returns the same result
+                self.assertEqual(getargs_s_hash(s), chr(k).encode() * (i + 1))
+
 
 class StringModuleTest(unittest.TestCase):
     def test_formatter_parser(self):
author	Serhiy Storchaka <storchaka@gmail.com>	2015-12-03 01:02:03 +0200
committer	Serhiy Storchaka <storchaka@gmail.com>	2015-12-03 01:02:03 +0200
commit	e800941d66c432d29926f142085e29eca4abf6f3 (patch)
tree	0cdc7dd7facab556fd87105897fb90792f9e17f9 /Lib/test/test_unicode.py
parent	a8f4405044f2ef834a389f50557e81221c42786c (diff)
download	cpython-git-e800941d66c432d29926f142085e29eca4abf6f3.tar.gz