Skip to content
Merged
Changes from 8 commits
Commits
Show all changes
37 commits
Select commit Hold shift + click to select a range
69ba0e9
initial implementation
dg-pb Sep 26, 2024
9a21b55
V2
dg-pb Sep 26, 2024
f23021c
small fixes
dg-pb Sep 26, 2024
d840ad7
V3
dg-pb Sep 26, 2024
2dd7568
V4
dg-pb Sep 27, 2024
862097f
fix compiler warnings
dg-pb Sep 27, 2024
64c889b
V5 stable
dg-pb Sep 29, 2024
a7142d5
add commented fix if merging after gh-124652
dg-pb Sep 30, 2024
ba36d01
error check
dg-pb Oct 4, 2024
acba269
fix error check
dg-pb Oct 4, 2024
898a104
minor macro edit
dg-pb Oct 5, 2024
10b9f3b
merge to main
dg-pb Oct 17, 2024
3647c25
📜🤖 Added by blurb_it.
blurb-it[bot] Oct 17, 2024
f9e3fd4
small edits
dg-pb Dec 18, 2024
42f3dc7
idiomatic C
dg-pb Jan 5, 2025
4f23211
Merge remote-tracking branch 'upstream/main' into gh-119109-partial_v…
dg-pb Jan 5, 2025
acd9c56
small edits and fixes
dg-pb Jan 5, 2025
cc557e9
macros removed, post-resizing instead
dg-pb Jan 5, 2025
e8fbaf8
regain previous performance
dg-pb Jan 6, 2025
1a8a56c
small edit
dg-pb Jan 6, 2025
b3ff73d
labels removed
dg-pb Jan 6, 2025
00ebb4b
comment edits
dg-pb Jan 6, 2025
4575b6c
minor fixes and improvements
dg-pb Jan 6, 2025
25a91aa
small stack size doubled + small edits
dg-pb Jan 8, 2025
e326fcf
removed commented fix when trailing placeholders allowed
dg-pb Jan 9, 2025
85d658f
moved declarations to more sensible place
dg-pb Jan 10, 2025
cefa7d8
reorder declarations
dg-pb Jan 10, 2025
aa3a11f
Merge remote-tracking branch 'upstream/main' into gh-119109-partial_v…
dg-pb May 8, 2025
8730ded
Merge branch 'main' into gh-119109-partial_vectorcall_kw
kumaraditya303 May 17, 2025
adacecf
null fix
dg-pb Jun 10, 2025
a09ce19
Merge branch 'main' into gh-119109-partial_vectorcall_kw
serhiy-storchaka Jul 7, 2025
192d261
few more brushes based on ss review
dg-pb Jul 7, 2025
1f21e74
comment
dg-pb Jul 7, 2025
3070c67
assertion fixes
dg-pb Jul 7, 2025
2a56327
stack resize rule
dg-pb Jul 7, 2025
e83099b
comment edit
dg-pb Jul 7, 2025
482336d
potential overflow fix
dg-pb Jul 8, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
196 changes: 137 additions & 59 deletions Modules/_functoolsmodule.c
Original file line number Diff line number Diff line change
Expand Up @@ -334,31 +334,40 @@ partial_descr_get(PyObject *self, PyObject *obj, PyObject *type)
return PyMethod_New(self, obj);
}

/* Merging keyword arguments using the vectorcall convention is messy, so
* if we would need to do that, we stop using vectorcall and fall back
* to using partial_call() instead. */
Py_NO_INLINE static PyObject *
partial_vectorcall_fallback(PyThreadState *tstate, partialobject *pto,
PyObject *const *args, size_t nargsf,
PyObject *kwnames)
{
pto->vectorcall = NULL;
Py_ssize_t nargs = PyVectorcall_NARGS(nargsf);
return _PyObject_MakeTpCall(tstate, (PyObject *)pto,
args, nargs, kwnames);
}
#define ALLOCATE_STACK(type, size, small_stack, stack) \
do { \
if (size <= (Py_ssize_t)Py_ARRAY_LENGTH(small_stack)) { \
stack = small_stack; \
} \
else { \
stack = PyMem_Malloc(size * sizeof(type *)); \
if (stack == NULL) { \
PyErr_NoMemory(); \
return NULL; \
} \
} \
} while (0)

#define DEALLOCATE_STACK(small_stack, stack) \
do { \
if (stack != small_stack) { \
PyMem_Free(stack); \
} \
} while (0)

static PyObject *
partial_vectorcall(partialobject *pto, PyObject *const *args,
size_t nargsf, PyObject *kwnames)
{
PyThreadState *tstate = _PyThreadState_GET();
/* Sizes */
Py_ssize_t pto_nargs = PyTuple_GET_SIZE(pto->args);
Py_ssize_t pto_nkwds = PyDict_GET_SIZE(pto->kw);
Py_ssize_t nargs = PyVectorcall_NARGS(nargsf);
Py_ssize_t nkwds = kwnames == NULL ? 0 : PyTuple_GET_SIZE(kwnames);
Py_ssize_t nargskw = nargs + nkwds;

/* pto->kw is mutable, so need to check every time */
if (PyDict_GET_SIZE(pto->kw)) {
return partial_vectorcall_fallback(tstate, pto, args, nargsf, kwnames);
}
/* Placeholder check */
Py_ssize_t pto_phcount = pto->phcount;
if (nargs < pto_phcount) {
PyErr_Format(PyExc_TypeError,
Expand All @@ -367,53 +376,121 @@ partial_vectorcall(partialobject *pto, PyObject *const *args,
return NULL;
}

Py_ssize_t nargskw = nargs;
if (kwnames != NULL) {
nargskw += PyTuple_GET_SIZE(kwnames);
}
/* Total sizes */
Py_ssize_t tot_nargs = pto_nargs + nargs - pto_phcount;
Py_ssize_t tot_nkwds;
Py_ssize_t tot_nargskw;

PyObject **pto_args = _PyTuple_ITEMS(pto->args);
Py_ssize_t pto_nargs = PyTuple_GET_SIZE(pto->args);

/* Fast path if we're called without arguments */
if (nargskw == 0) {
return _PyObject_VectorcallTstate(tstate, pto->fn,
pto_args, pto_nargs, NULL);
}
/* Special cases */
if (!pto_nkwds) {
/* Fast path if we're called without arguments */
if (nargskw == 0) {
return _PyObject_VectorcallTstate(tstate, pto->fn, pto_args,
pto_nargs, NULL);
}

/* Fast path using PY_VECTORCALL_ARGUMENTS_OFFSET to prepend a single
* positional argument */
if (pto_nargs == 1 && (nargsf & PY_VECTORCALL_ARGUMENTS_OFFSET)) {
PyObject **newargs = (PyObject **)args - 1;
PyObject *tmp = newargs[0];
newargs[0] = pto_args[0];
PyObject *ret = _PyObject_VectorcallTstate(tstate, pto->fn,
newargs, nargs + 1, kwnames);
newargs[0] = tmp;
return ret;
// TO BE ADDED ON MERGE TO MAIN
// IF https://github.com/python/cpython/pull/124788
// IS MERGED BEFORE THIS
// /* Fast path if all Placeholders */
// if (pto_nargs == pto_phcount) {
// /* NOTE: Without this, following single argument Fast Path
// * is incorrect */
// return _PyObject_VectorcallTstate(tstate, pto->fn,
// args, nargs, kwnames);
// }

/* Use PY_VECTORCALL_ARGUMENTS_OFFSET to prepend a single
* positional argument. */
if (pto_nargs == 1 && (nargsf & PY_VECTORCALL_ARGUMENTS_OFFSET)) {
PyObject **newargs = (PyObject **)args - 1;
PyObject *tmp = newargs[0];
newargs[0] = pto_args[0];
PyObject *ret = _PyObject_VectorcallTstate(tstate, pto->fn, newargs,
nargs + 1, kwnames);
newargs[0] = tmp;
return ret;
}
}

PyObject *small_stack[_PY_FASTCALL_SMALL_STACK];
PyObject **stack;
tot_nkwds = pto_nkwds + nkwds;
tot_nargskw = tot_nargs + tot_nkwds;
PyObject **stack, *small_stack[_PY_FASTCALL_SMALL_STACK];
PyObject *tot_kwnames = kwnames;

/* Initialize stack & copy keywords to stack */
if (!pto_nkwds) {
/* Allocate Stack */
tot_nkwds = pto_nkwds + nkwds;
tot_nargskw = tot_nargs + tot_nkwds;
ALLOCATE_STACK(PyObject, tot_nargskw, small_stack, stack);

Py_ssize_t tot_nargskw = pto_nargs + nargskw - pto_phcount;
if (tot_nargskw <= (Py_ssize_t)Py_ARRAY_LENGTH(small_stack)) {
stack = small_stack;
if (nkwds) {
/* if !pto_nkwds & nkwds, then simply append kw */
memcpy(stack + tot_nargs, args + nargs, nkwds * sizeof(PyObject*));
}
}
else {
stack = PyMem_Malloc(tot_nargskw * sizeof(PyObject *));
if (stack == NULL) {
PyErr_NoMemory();
return NULL;
PyObject *key, *val;
PyObject *pto_kw = NULL; // pto_kw with duplicates merged (if any)

/* Temporary stack for keywords that are not in pto->kw */
PyObject **kwtail, *small_kwtail[_PY_FASTCALL_SMALL_STACK * 2];
ALLOCATE_STACK(PyObject, nkwds * 2, small_kwtail, kwtail);

/* Merge kw to pto_kw or add to tail (if not duplicate) */
Py_ssize_t n_tail = 0;
for (Py_ssize_t i = 0; i < nkwds; ++i) {
key = PyTuple_GET_ITEM(kwnames, i);
val = args[nargs + i];
if (PyDict_Contains(pto->kw, key)) {
if (pto_kw == NULL) {
pto_kw = PyDict_Copy(pto->kw);
}
PyDict_SetItem(pto_kw, key, val);
}
else {
kwtail[n_tail] = key;
kwtail[n_tail + nkwds] = val;
n_tail++;
}
}

/* Allocate Stack */
Py_ssize_t n_merges = nkwds - n_tail;
tot_nkwds = pto_nkwds + nkwds - n_merges;
tot_nargskw = tot_nargs + tot_nkwds;
ALLOCATE_STACK(PyObject, tot_nargskw, small_stack, stack);
tot_kwnames = PyTuple_New(tot_nkwds);

/* Copy pto_kw to stack */
Py_ssize_t pos = 0, i = 0;
while (PyDict_Next(n_merges ? pto_kw : pto->kw, &pos, &key, &val)) {
PyTuple_SET_ITEM(tot_kwnames, i, key);
Py_INCREF(key);
stack[tot_nargs + i] = val;
i++;
}
Py_XDECREF(pto_kw);

/* Copy kw tail to stack */
for (Py_ssize_t i = 0; i < n_tail; ++i) {
key = kwtail[i];
val = kwtail[i + nkwds];
PyTuple_SET_ITEM(tot_kwnames, pto_nkwds + i, key);
Py_INCREF(key);
stack[tot_nargs + pto_nkwds + i] = val;
}
DEALLOCATE_STACK(small_kwtail, kwtail);
}

Py_ssize_t tot_nargs;
/* Copy Positionals to stack */
if (pto_phcount) {
tot_nargs = pto_nargs + nargs - pto_phcount;
Py_ssize_t j = 0; // New args index
for (Py_ssize_t i = 0; i < pto_nargs; i++) {
if (pto_args[i] == pto->placeholder) {
if (pto_args[i] == pto->placeholder){
stack[i] = args[j];
j += 1;
}
Expand All @@ -422,20 +499,22 @@ partial_vectorcall(partialobject *pto, PyObject *const *args,
}
}
assert(j == pto_phcount);
if (nargskw > pto_phcount) {
memcpy(stack + pto_nargs, args + j, (nargskw - j) * sizeof(PyObject*));
/* Add remaining args from new_args */
if (nargs > pto_phcount) {
memcpy(stack + pto_nargs, args + j, (nargs - j) * sizeof(PyObject*));
}
}
else {
tot_nargs = pto_nargs + nargs;
/* Copy to new stack, using borrowed references */
memcpy(stack, pto_args, pto_nargs * sizeof(PyObject*));
memcpy(stack + pto_nargs, args, nargskw * sizeof(PyObject*));
memcpy(stack + pto_nargs, args, nargs * sizeof(PyObject*));
}
PyObject *ret = _PyObject_VectorcallTstate(tstate, pto->fn,
stack, tot_nargs, kwnames);
if (stack != small_stack) {
PyMem_Free(stack);

/* Call / Maintenance / Return */
PyObject *ret = _PyObject_VectorcallTstate(tstate, pto->fn, stack,
tot_nargs, tot_kwnames);
DEALLOCATE_STACK(small_stack, stack);
if (pto_nkwds) {
Py_DECREF(tot_kwnames);
}
return ret;
}
Expand All @@ -456,7 +535,6 @@ partial_setvectorcall(partialobject *pto)
}
}


// Not converted to argument clinic, because of `*args, **kwargs` arguments.
static PyObject *
partial_call(partialobject *pto, PyObject *args, PyObject *kwargs)
Expand Down
Loading