GH-112354: _GUARD_IS_TRUE_POP side-exits to target the next instruction, not themselves. (GH-114078)

This commit is contained in:
Mark Shannon 2024-01-15 11:41:06 +00:00 committed by GitHub
parent 2010d45327
commit ac10947ba7
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
8 changed files with 40 additions and 26 deletions

View file

@ -169,7 +169,7 @@ const uint16_t _PyUop_Flags[MAX_UOP_ID+1] = {
[_CHECK_FUNCTION_EXACT_ARGS] = HAS_ARG_FLAG | HAS_DEOPT_FLAG | HAS_PASSTHROUGH_FLAG, [_CHECK_FUNCTION_EXACT_ARGS] = HAS_ARG_FLAG | HAS_DEOPT_FLAG | HAS_PASSTHROUGH_FLAG,
[_CHECK_STACK_SPACE] = HAS_ARG_FLAG | HAS_DEOPT_FLAG | HAS_PASSTHROUGH_FLAG, [_CHECK_STACK_SPACE] = HAS_ARG_FLAG | HAS_DEOPT_FLAG | HAS_PASSTHROUGH_FLAG,
[_INIT_CALL_PY_EXACT_ARGS] = HAS_ARG_FLAG | HAS_ESCAPES_FLAG | HAS_PURE_FLAG, [_INIT_CALL_PY_EXACT_ARGS] = HAS_ARG_FLAG | HAS_ESCAPES_FLAG | HAS_PURE_FLAG,
[_PUSH_FRAME] = 0, [_PUSH_FRAME] = HAS_ESCAPES_FLAG,
[_CALL_TYPE_1] = HAS_ARG_FLAG | HAS_DEOPT_FLAG, [_CALL_TYPE_1] = HAS_ARG_FLAG | HAS_DEOPT_FLAG,
[_CALL_STR_1] = HAS_ARG_FLAG | HAS_EVAL_BREAK_FLAG | HAS_DEOPT_FLAG | HAS_ERROR_FLAG | HAS_ESCAPES_FLAG, [_CALL_STR_1] = HAS_ARG_FLAG | HAS_EVAL_BREAK_FLAG | HAS_DEOPT_FLAG | HAS_ERROR_FLAG | HAS_ESCAPES_FLAG,
[_CALL_TUPLE_1] = HAS_ARG_FLAG | HAS_EVAL_BREAK_FLAG | HAS_DEOPT_FLAG | HAS_ERROR_FLAG | HAS_ESCAPES_FLAG, [_CALL_TUPLE_1] = HAS_ARG_FLAG | HAS_EVAL_BREAK_FLAG | HAS_DEOPT_FLAG | HAS_ERROR_FLAG | HAS_ESCAPES_FLAG,

View file

@ -805,7 +805,8 @@ dummy_func(
#if TIER_ONE #if TIER_ONE
assert(frame != &entry_frame); assert(frame != &entry_frame);
#endif #endif
STORE_SP(); SYNC_SP();
_PyFrame_SetStackPointer(frame, stack_pointer);
assert(EMPTY()); assert(EMPTY());
_Py_LeaveRecursiveCallPy(tstate); _Py_LeaveRecursiveCallPy(tstate);
// GH-99729: We need to unlink the frame *before* clearing it: // GH-99729: We need to unlink the frame *before* clearing it:
@ -3154,7 +3155,8 @@ dummy_func(
// Write it out explicitly because it's subtly different. // Write it out explicitly because it's subtly different.
// Eventually this should be the only occurrence of this code. // Eventually this should be the only occurrence of this code.
assert(tstate->interp->eval_frame == NULL); assert(tstate->interp->eval_frame == NULL);
STORE_SP(); SYNC_SP();
_PyFrame_SetStackPointer(frame, stack_pointer);
new_frame->previous = frame; new_frame->previous = frame;
CALL_STAT_INC(inlined_py_calls); CALL_STAT_INC(inlined_py_calls);
frame = tstate->current_frame = new_frame; frame = tstate->current_frame = new_frame;
@ -4013,20 +4015,27 @@ dummy_func(
///////// Tier-2 only opcodes ///////// ///////// Tier-2 only opcodes /////////
op (_GUARD_IS_TRUE_POP, (flag -- )) { op (_GUARD_IS_TRUE_POP, (flag -- )) {
DEOPT_IF(Py_IsFalse(flag)); SYNC_SP();
DEOPT_IF(!Py_IsTrue(flag));
assert(Py_IsTrue(flag)); assert(Py_IsTrue(flag));
} }
op (_GUARD_IS_FALSE_POP, (flag -- )) { op (_GUARD_IS_FALSE_POP, (flag -- )) {
DEOPT_IF(Py_IsTrue(flag)); SYNC_SP();
DEOPT_IF(!Py_IsFalse(flag));
assert(Py_IsFalse(flag)); assert(Py_IsFalse(flag));
} }
op (_GUARD_IS_NONE_POP, (val -- )) { op (_GUARD_IS_NONE_POP, (val -- )) {
DEOPT_IF(!Py_IsNone(val)); SYNC_SP();
if (!Py_IsNone(val)) {
Py_DECREF(val);
DEOPT_IF(1);
}
} }
op (_GUARD_IS_NOT_NONE_POP, (val -- )) { op (_GUARD_IS_NOT_NONE_POP, (val -- )) {
SYNC_SP();
DEOPT_IF(Py_IsNone(val)); DEOPT_IF(Py_IsNone(val));
Py_DECREF(val); Py_DECREF(val);
} }

View file

@ -3318,35 +3318,38 @@
case _GUARD_IS_TRUE_POP: { case _GUARD_IS_TRUE_POP: {
PyObject *flag; PyObject *flag;
flag = stack_pointer[-1]; flag = stack_pointer[-1];
if (Py_IsFalse(flag)) goto deoptimize;
assert(Py_IsTrue(flag));
stack_pointer += -1; stack_pointer += -1;
if (!Py_IsTrue(flag)) goto deoptimize;
assert(Py_IsTrue(flag));
break; break;
} }
case _GUARD_IS_FALSE_POP: { case _GUARD_IS_FALSE_POP: {
PyObject *flag; PyObject *flag;
flag = stack_pointer[-1]; flag = stack_pointer[-1];
if (Py_IsTrue(flag)) goto deoptimize;
assert(Py_IsFalse(flag));
stack_pointer += -1; stack_pointer += -1;
if (!Py_IsFalse(flag)) goto deoptimize;
assert(Py_IsFalse(flag));
break; break;
} }
case _GUARD_IS_NONE_POP: { case _GUARD_IS_NONE_POP: {
PyObject *val; PyObject *val;
val = stack_pointer[-1]; val = stack_pointer[-1];
if (!Py_IsNone(val)) goto deoptimize;
stack_pointer += -1; stack_pointer += -1;
if (!Py_IsNone(val)) {
Py_DECREF(val);
if (1) goto deoptimize;
}
break; break;
} }
case _GUARD_IS_NOT_NONE_POP: { case _GUARD_IS_NOT_NONE_POP: {
PyObject *val; PyObject *val;
val = stack_pointer[-1]; val = stack_pointer[-1];
stack_pointer += -1;
if (Py_IsNone(val)) goto deoptimize; if (Py_IsNone(val)) goto deoptimize;
Py_DECREF(val); Py_DECREF(val);
stack_pointer += -1;
break; break;
} }

View file

@ -481,18 +481,19 @@ top: // Jump here after _PUSH_FRAME or likely branches
goto done; goto done;
} }
uint32_t uopcode = BRANCH_TO_GUARD[opcode - POP_JUMP_IF_FALSE][jump_likely]; uint32_t uopcode = BRANCH_TO_GUARD[opcode - POP_JUMP_IF_FALSE][jump_likely];
_Py_CODEUNIT *next_instr = instr + 1 + _PyOpcode_Caches[_PyOpcode_Deopt[opcode]];
DPRINTF(2, "%s(%d): counter=%x, bitcount=%d, likely=%d, confidence=%d, uopcode=%s\n", DPRINTF(2, "%s(%d): counter=%x, bitcount=%d, likely=%d, confidence=%d, uopcode=%s\n",
_PyOpcode_OpName[opcode], oparg, _PyOpcode_OpName[opcode], oparg,
counter, bitcount, jump_likely, confidence, _PyUOpName(uopcode)); counter, bitcount, jump_likely, confidence, _PyUOpName(uopcode));
ADD_TO_TRACE(uopcode, max_length, 0, target); _Py_CODEUNIT *next_instr = instr + 1 + _PyOpcode_Caches[_PyOpcode_Deopt[opcode]];
if (jump_likely) {
_Py_CODEUNIT *target_instr = next_instr + oparg; _Py_CODEUNIT *target_instr = next_instr + oparg;
if (jump_likely) {
DPRINTF(2, "Jump likely (%x = %d bits), continue at byte offset %d\n", DPRINTF(2, "Jump likely (%x = %d bits), continue at byte offset %d\n",
instr[1].cache, bitcount, 2 * INSTR_IP(target_instr, code)); instr[1].cache, bitcount, 2 * INSTR_IP(target_instr, code));
instr = target_instr; instr = target_instr;
ADD_TO_TRACE(uopcode, max_length, 0, INSTR_IP(next_instr, code));
goto top; goto top;
} }
ADD_TO_TRACE(uopcode, max_length, 0, INSTR_IP(target_instr, code));
break; break;
} }

View file

@ -464,7 +464,7 @@ def compute_properties(op: parser.InstDef) -> Properties:
ends_with_eval_breaker=eval_breaker_at_end(op), ends_with_eval_breaker=eval_breaker_at_end(op),
needs_this=variable_used(op, "this_instr"), needs_this=variable_used(op, "this_instr"),
always_exits=always_exits(op), always_exits=always_exits(op),
stores_sp=variable_used(op, "STORE_SP"), stores_sp=variable_used(op, "SYNC_SP"),
tier_one_only=variable_used(op, "TIER_ONE_ONLY"), tier_one_only=variable_used(op, "TIER_ONE_ONLY"),
uses_co_consts=variable_used(op, "FRAME_CO_CONSTS"), uses_co_consts=variable_used(op, "FRAME_CO_CONSTS"),
uses_co_names=variable_used(op, "FRAME_CO_NAMES"), uses_co_names=variable_used(op, "FRAME_CO_NAMES"),

View file

@ -124,7 +124,7 @@ def replace_decrefs(
out.emit(f"Py_DECREF({var.name});\n") out.emit(f"Py_DECREF({var.name});\n")
def replace_store_sp( def replace_sync_sp(
out: CWriter, out: CWriter,
tkn: Token, tkn: Token,
tkn_iter: Iterator[Token], tkn_iter: Iterator[Token],
@ -135,9 +135,7 @@ def replace_store_sp(
next(tkn_iter) next(tkn_iter)
next(tkn_iter) next(tkn_iter)
next(tkn_iter) next(tkn_iter)
out.emit_at("", tkn)
stack.flush(out) stack.flush(out)
out.emit("_PyFrame_SetStackPointer(frame, stack_pointer);\n")
def replace_check_eval_breaker( def replace_check_eval_breaker(
@ -160,7 +158,7 @@ REPLACEMENT_FUNCTIONS = {
"ERROR_IF": replace_error, "ERROR_IF": replace_error,
"DECREF_INPUTS": replace_decrefs, "DECREF_INPUTS": replace_decrefs,
"CHECK_EVAL_BREAKER": replace_check_eval_breaker, "CHECK_EVAL_BREAKER": replace_check_eval_breaker,
"STORE_SP": replace_store_sp, "SYNC_SP": replace_sync_sp,
} }
ReplacementFunctionType = Callable[ ReplacementFunctionType = Callable[

View file

@ -201,6 +201,7 @@ Those functions include:
* `DEOPT_IF(cond, instruction)`. Deoptimize if `cond` is met. * `DEOPT_IF(cond, instruction)`. Deoptimize if `cond` is met.
* `ERROR_IF(cond, label)`. Jump to error handler at `label` if `cond` is true. * `ERROR_IF(cond, label)`. Jump to error handler at `label` if `cond` is true.
* `DECREF_INPUTS()`. Generate `Py_DECREF()` calls for the input stack effects. * `DECREF_INPUTS()`. Generate `Py_DECREF()` calls for the input stack effects.
* `SYNC_SP()`. Synchronizes the physical stack pointer with the stack effects.
Note that the use of `DECREF_INPUTS()` is optional -- manual calls Note that the use of `DECREF_INPUTS()` is optional -- manual calls
to `Py_DECREF()` or other approaches are also acceptable to `Py_DECREF()` or other approaches are also acceptable

View file

@ -169,6 +169,7 @@ class Stack:
return "" return ""
def flush(self, out: CWriter) -> None: def flush(self, out: CWriter) -> None:
out.start_line()
for var in self.variables: for var in self.variables:
if not var.peek: if not var.peek:
cast = "(PyObject *)" if var.type else "" cast = "(PyObject *)" if var.type else ""
@ -189,6 +190,7 @@ class Stack:
self.base_offset.clear() self.base_offset.clear()
self.top_offset.clear() self.top_offset.clear()
self.peek_offset.clear() self.peek_offset.clear()
out.start_line()
def as_comment(self) -> str: def as_comment(self) -> str:
return f"/* Variables: {[v.name for v in self.variables]}. Base offset: {self.base_offset.to_c()}. Top offset: {self.top_offset.to_c()} */" return f"/* Variables: {[v.name for v in self.variables]}. Base offset: {self.base_offset.to_c()}. Top offset: {self.top_offset.to_c()} */"