-
-
Notifications
You must be signed in to change notification settings - Fork 33.2k
gh-127022: Simplify PyStackRef_FromPyObjectSteal
#127024
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 4 commits
5583ac0
16f7e7b
3631451
06ab2ec
a9e4872
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change | ||||||||||||||||||
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
|
@@ -376,7 +376,7 @@ dummy_func( | |||||||||||||||||||
|
||||||||||||||||||||
pure inst(UNARY_NOT, (value -- res)) { | ||||||||||||||||||||
assert(PyStackRef_BoolCheck(value)); | ||||||||||||||||||||
res = PyStackRef_Is(value, PyStackRef_False) | ||||||||||||||||||||
res = PyStackRef_IsExactly(value, PyStackRef_False) | ||||||||||||||||||||
? PyStackRef_True : PyStackRef_False; | ||||||||||||||||||||
DEAD(value); | ||||||||||||||||||||
} | ||||||||||||||||||||
|
@@ -441,7 +441,7 @@ dummy_func( | |||||||||||||||||||
|
||||||||||||||||||||
inst(TO_BOOL_NONE, (unused/1, unused/2, value -- res)) { | ||||||||||||||||||||
// This one is a bit weird, because we expect *some* failures: | ||||||||||||||||||||
EXIT_IF(!PyStackRef_Is(value, PyStackRef_None)); | ||||||||||||||||||||
EXIT_IF(!PyStackRef_IsNone(value)); | ||||||||||||||||||||
DEAD(value); | ||||||||||||||||||||
STAT_INC(TO_BOOL, hit); | ||||||||||||||||||||
res = PyStackRef_False; | ||||||||||||||||||||
|
@@ -651,9 +651,7 @@ dummy_func( | |||||||||||||||||||
// specializations, but there is no output. | ||||||||||||||||||||
// At the end we just skip over the STORE_FAST. | ||||||||||||||||||||
op(_BINARY_OP_INPLACE_ADD_UNICODE, (left, right --)) { | ||||||||||||||||||||
#ifndef NDEBUG | ||||||||||||||||||||
PyObject *left_o = PyStackRef_AsPyObjectBorrow(left); | ||||||||||||||||||||
#endif | ||||||||||||||||||||
PyObject *right_o = PyStackRef_AsPyObjectBorrow(right); | ||||||||||||||||||||
|
||||||||||||||||||||
int next_oparg; | ||||||||||||||||||||
|
@@ -664,7 +662,7 @@ dummy_func( | |||||||||||||||||||
next_oparg = CURRENT_OPERAND0(); | ||||||||||||||||||||
#endif | ||||||||||||||||||||
_PyStackRef *target_local = &GETLOCAL(next_oparg); | ||||||||||||||||||||
DEOPT_IF(!PyStackRef_Is(*target_local, left)); | ||||||||||||||||||||
DEOPT_IF(PyStackRef_AsPyObjectBorrow(*target_local) != left_o); | ||||||||||||||||||||
STAT_INC(BINARY_OP, hit); | ||||||||||||||||||||
/* Handle `left = left + right` or `left += right` for str. | ||||||||||||||||||||
* | ||||||||||||||||||||
|
@@ -1141,7 +1139,7 @@ dummy_func( | |||||||||||||||||||
gen_frame->previous = frame; | ||||||||||||||||||||
DISPATCH_INLINED(gen_frame); | ||||||||||||||||||||
} | ||||||||||||||||||||
if (PyStackRef_Is(v, PyStackRef_None) && PyIter_Check(receiver_o)) { | ||||||||||||||||||||
if (PyStackRef_IsNone(v) && PyIter_Check(receiver_o)) { | ||||||||||||||||||||
retval_o = Py_TYPE(receiver_o)->tp_iternext(receiver_o); | ||||||||||||||||||||
} | ||||||||||||||||||||
else { | ||||||||||||||||||||
|
@@ -1249,7 +1247,7 @@ dummy_func( | |||||||||||||||||||
inst(POP_EXCEPT, (exc_value -- )) { | ||||||||||||||||||||
_PyErr_StackItem *exc_info = tstate->exc_info; | ||||||||||||||||||||
Py_XSETREF(exc_info->exc_value, | ||||||||||||||||||||
PyStackRef_Is(exc_value, PyStackRef_None) | ||||||||||||||||||||
PyStackRef_IsNone(exc_value) | ||||||||||||||||||||
? NULL : PyStackRef_AsPyObjectSteal(exc_value)); | ||||||||||||||||||||
} | ||||||||||||||||||||
|
||||||||||||||||||||
|
@@ -2481,13 +2479,7 @@ dummy_func( | |||||||||||||||||||
} | ||||||||||||||||||||
|
||||||||||||||||||||
inst(IS_OP, (left, right -- b)) { | ||||||||||||||||||||
#ifdef Py_GIL_DISABLED | ||||||||||||||||||||
// On free-threaded builds, objects are conditionally immortalized. | ||||||||||||||||||||
// So their bits don't always compare equally. | ||||||||||||||||||||
int res = Py_Is(PyStackRef_AsPyObjectBorrow(left), PyStackRef_AsPyObjectBorrow(right)) ^ oparg; | ||||||||||||||||||||
#else | ||||||||||||||||||||
int res = PyStackRef_Is(left, right) ^ oparg; | ||||||||||||||||||||
#endif | ||||||||||||||||||||
DECREF_INPUTS(); | ||||||||||||||||||||
b = res ? PyStackRef_True : PyStackRef_False; | ||||||||||||||||||||
} | ||||||||||||||||||||
|
@@ -2693,22 +2685,22 @@ dummy_func( | |||||||||||||||||||
|
||||||||||||||||||||
replaced op(_POP_JUMP_IF_FALSE, (cond -- )) { | ||||||||||||||||||||
assert(PyStackRef_BoolCheck(cond)); | ||||||||||||||||||||
int flag = PyStackRef_Is(cond, PyStackRef_False); | ||||||||||||||||||||
int flag = PyStackRef_IsFalse(cond); | ||||||||||||||||||||
DEAD(cond); | ||||||||||||||||||||
RECORD_BRANCH_TAKEN(this_instr[1].cache, flag); | ||||||||||||||||||||
JUMPBY(oparg * flag); | ||||||||||||||||||||
} | ||||||||||||||||||||
|
||||||||||||||||||||
replaced op(_POP_JUMP_IF_TRUE, (cond -- )) { | ||||||||||||||||||||
assert(PyStackRef_BoolCheck(cond)); | ||||||||||||||||||||
int flag = PyStackRef_Is(cond, PyStackRef_True); | ||||||||||||||||||||
int flag = PyStackRef_IsExactly(cond, PyStackRef_True); | ||||||||||||||||||||
|
ADDOP_I(c, loc, LOAD_FAST, 0); | |
ADDOP_LOAD_CONST(c, loc, _PyLong_GetOne()); | |
ADDOP_I(c, loc, COMPARE_OP, (Py_NE << 5) | compare_masks[Py_NE]); | |
NEW_JUMP_TARGET_LABEL(c, body); | |
ADDOP_JUMP(c, loc, POP_JUMP_IF_FALSE, body); |
Lines 5746 to 5749 in 09c240f
ADDOP(c, LOC(p), GET_LEN); | |
ADDOP_LOAD_CONST_NEW(c, LOC(p), PyLong_FromSsize_t(size)); | |
ADDOP_COMPARE(c, LOC(p), GtE); | |
RETURN_IF_ERROR(jump_to_fail_pop(c, LOC(p), pc, POP_JUMP_IF_FALSE)); |
The `COMPARE_OP`s here still generate bools, but not always in the canonical representation. So we can either:
- Modify `COMPARE_OP` to ensure the canonical representation, like https://github.com/colesbury/cpython/blob/5583ac0c311132e36ef458842e087945898ffdec/Python/bytecodes.c#L2409-L2416
- Use `PyStackRef_IsFalse` (instead of `PyStackRef_IsExactly`) in the `JUMP_IF_FALSE`
- Modify the codegen by inserting `TO_BOOL` in those two spots.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
That makes sense, thanks for the explanation. Since using `PyStackRef_IsExactly` safely is sensitive to code generation changes, I might suggest using it only when we're sure it actually matters for performance, and defaulting everywhere else to the variants that mask out the deferred bits, since those are always safe. I'd guess that this wouldn't affect the performance improvement of this change much, since it should come from avoiding the tagging in `_PyStackRef_FromPyObjectSteal`. I don't feel super strongly though.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
I'll switch to using `PyStackRef_IsFalse` and `PyStackRef_IsTrue`.
I'm no longer convinced that `PyStackRef_IsExactly` is actually a performance win (and I didn't see it in measurements). I think we have issues with code generation quality that we'll need to address later. Things like `POP_JUMP_IF_NONE` are composed of `_IS_NONE` and `_POP_JUMP_IF_TRUE`, and we pack the intermediate result in a tagged `_PyStackRef`. Clang does a pretty good job of optimizing through it. GCC less so: https://gcc.godbolt.org/z/Ejs8c78qd.
Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.
Uh oh!
There was an error while loading. Please reload this page.