git.ipfire.org Git - thirdparty/Python/cpython.git/commitdiff
GH-131798: Narrow the result type of _BINARY_OP_SUBSCR_STR_INT to str in the JIT...
author: Tomas R. <tomas.roun8@gmail.com>
Tue, 8 Apr 2025 15:22:54 +0000 (17:22 +0200)
committer: GitHub <noreply@github.com>
Tue, 8 Apr 2025 15:22:54 +0000 (08:22 -0700)
Lib/test/test_capi/test_opt.py
Misc/NEWS.d/next/Core_and_Builtins/2025-04-06-13-17-10.gh-issue-131798.uMrfha.rst [new file with mode: 0644]
Python/optimizer_bytecodes.c
Python/optimizer_cases.c.h

index 0e13799ad473813dc657e574fc0823617dc8afe8..3ade7cb7a2b6af244be3a4becd612610a8f868a5 100644 (file)
@@ -1646,6 +1646,26 @@ class TestUopsOptimization(unittest.TestCase):
         self.assertIn("_TO_BOOL_STR", uops)
         self.assertNotIn("_GUARD_TOS_UNICODE", uops)
 
+    def test_binary_subcsr_str_int_narrows_to_str(self):
+        def testfunc(n):
+            x = []
+            s = "foo"
+            for _ in range(n):
+                y = s[0]       # str[int]: expected uop is _BINARY_OP_SUBSCR_STR_INT
+                z = "bar" + y  # _BINARY_OP_ADD_UNICODE; its _GUARD_TOS_UNICODE on y should be dropped
+                x.append(z)
+            return x
+
+        res, ex = self._run_with_optimizer(testfunc, TIER2_THRESHOLD)
+        self.assertEqual(res, ["barf"] * TIER2_THRESHOLD)
+        self.assertIsNotNone(ex)
+        uops = get_opnames(ex)
+        self.assertIn("_BINARY_OP_SUBSCR_STR_INT", uops)
+        # _BINARY_OP_SUBSCR_STR_INT narrows the result to 'str' so
+        # the unicode guard before _BINARY_OP_ADD_UNICODE is removed.
+        self.assertNotIn("_GUARD_TOS_UNICODE", uops)
+        self.assertIn("_BINARY_OP_ADD_UNICODE", uops)
+
 
 def global_identity(x):
     return x
diff --git a/Misc/NEWS.d/next/Core_and_Builtins/2025-04-06-13-17-10.gh-issue-131798.uMrfha.rst b/Misc/NEWS.d/next/Core_and_Builtins/2025-04-06-13-17-10.gh-issue-131798.uMrfha.rst
new file mode 100644 (file)
index 0000000..5ea5fce
--- /dev/null
@@ -0,0 +1,2 @@
+Allow the JIT to remove unicode guards after ``_BINARY_OP_SUBSCR_STR_INT``
+by narrowing its result type to ``str``.
index d7b3564db1b90a30498e1025591e83fc51a0b11e..72dc2bbd44e71c085264a57e3073586b85c53e85 100644 (file)
@@ -366,6 +366,10 @@ dummy_func(void) {
         ctx->done = true;
     }
 
+    op(_BINARY_OP_SUBSCR_STR_INT, (left, right -- res)) {
+        res = sym_new_type(ctx, &PyUnicode_Type);  // type the result as str so later unicode guards can be removed
+    }
+
     op(_TO_BOOL, (value -- res)) {
         int already_bool = optimize_to_bool(this_instr, ctx, value, &res);
         if (!already_bool) {
index 870c32d74ac91316cc46d651a701226de2d6af77..160d09ca7c558076249b46086221fdd645d27158 100644 (file)
 
         case _BINARY_OP_SUBSCR_STR_INT: {
             JitOptSymbol *res;
-            res = sym_new_not_null(ctx);
+            res = sym_new_type(ctx, &PyUnicode_Type);
             stack_pointer[-2] = res;
             stack_pointer += -1;
             assert(WITHIN_STACK_BOUNDS());