gh-112087: Make list_{concat, repeat, inplace_repeat, ass_item) to be thread-safe (gh-115605)

This commit is contained in:
Donghee Na 2024-02-21 10:38:09 +09:00 committed by GitHub
parent 54071460d7
commit 259730bbb5
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 89 additions and 41 deletions

View File

@ -23,11 +23,17 @@ extern "C" {
#define FT_ATOMIC_LOAD_SSIZE(value) _Py_atomic_load_ssize(&value) #define FT_ATOMIC_LOAD_SSIZE(value) _Py_atomic_load_ssize(&value)
#define FT_ATOMIC_LOAD_SSIZE_RELAXED(value) \ #define FT_ATOMIC_LOAD_SSIZE_RELAXED(value) \
_Py_atomic_load_ssize_relaxed(&value) _Py_atomic_load_ssize_relaxed(&value)
#define FT_ATOMIC_STORE_PTR_RELAXED(value, new_value) \
_Py_atomic_store_ptr_relaxed(&value, new_value)
#define FT_ATOMIC_STORE_PTR_RELEASE(value, new_value) \
_Py_atomic_store_ptr_release(&value, new_value)
#define FT_ATOMIC_STORE_SSIZE_RELAXED(value, new_value) \ #define FT_ATOMIC_STORE_SSIZE_RELAXED(value, new_value) \
_Py_atomic_store_ssize_relaxed(&value, new_value) _Py_atomic_store_ssize_relaxed(&value, new_value)
#else #else
#define FT_ATOMIC_LOAD_SSIZE(value) value #define FT_ATOMIC_LOAD_SSIZE(value) value
#define FT_ATOMIC_LOAD_SSIZE_RELAXED(value) value #define FT_ATOMIC_LOAD_SSIZE_RELAXED(value) value
#define FT_ATOMIC_STORE_PTR_RELAXED(value, new_value) value = new_value
#define FT_ATOMIC_STORE_PTR_RELEASE(value, new_value) value = new_value
#define FT_ATOMIC_STORE_SSIZE_RELAXED(value, new_value) value = new_value #define FT_ATOMIC_STORE_SSIZE_RELAXED(value, new_value) value = new_value
#endif #endif

View File

@ -3,6 +3,7 @@
#include "Python.h" #include "Python.h"
#include "pycore_abstract.h" // _PyIndex_Check() #include "pycore_abstract.h" // _PyIndex_Check()
#include "pycore_ceval.h" // _PyEval_GetBuiltin() #include "pycore_ceval.h" // _PyEval_GetBuiltin()
#include "pycore_pyatomic_ft_wrappers.h"
#include "pycore_interp.h" // PyInterpreterState.list #include "pycore_interp.h" // PyInterpreterState.list
#include "pycore_list.h" // struct _Py_list_freelist, _PyListIterObject #include "pycore_list.h" // struct _Py_list_freelist, _PyListIterObject
#include "pycore_long.h" // _PyLong_DigitCount #include "pycore_long.h" // _PyLong_DigitCount
@ -20,14 +21,6 @@ class list "PyListObject *" "&PyList_Type"
_Py_DECLARE_STR(list_err, "list index out of range"); _Py_DECLARE_STR(list_err, "list index out of range");
#ifdef Py_GIL_DISABLED
# define LOAD_SSIZE(value) _Py_atomic_load_ssize_relaxed(&value)
# define STORE_SSIZE(value, new_value) _Py_atomic_store_ssize_relaxed(&value, new_value)
#else
# define LOAD_SSIZE(value) value
# define STORE_SSIZE(value, new_value) value = new_value
#endif
#ifdef WITH_FREELISTS #ifdef WITH_FREELISTS
static struct _Py_list_freelist * static struct _Py_list_freelist *
get_list_freelist(void) get_list_freelist(void)
@ -563,20 +556,12 @@ PyList_GetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh)
} }
static PyObject * static PyObject *
list_concat(PyObject *aa, PyObject *bb) list_concat_lock_held(PyListObject *a, PyListObject *b)
{ {
PyListObject *a = (PyListObject *)aa;
Py_ssize_t size; Py_ssize_t size;
Py_ssize_t i; Py_ssize_t i;
PyObject **src, **dest; PyObject **src, **dest;
PyListObject *np; PyListObject *np;
if (!PyList_Check(bb)) {
PyErr_Format(PyExc_TypeError,
"can only concatenate list (not \"%.200s\") to list",
Py_TYPE(bb)->tp_name);
return NULL;
}
#define b ((PyListObject *)bb)
assert((size_t)Py_SIZE(a) + (size_t)Py_SIZE(b) < PY_SSIZE_T_MAX); assert((size_t)Py_SIZE(a) + (size_t)Py_SIZE(b) < PY_SSIZE_T_MAX);
size = Py_SIZE(a) + Py_SIZE(b); size = Py_SIZE(a) + Py_SIZE(b);
if (size == 0) { if (size == 0) {
@ -590,23 +575,39 @@ list_concat(PyObject *aa, PyObject *bb)
dest = np->ob_item; dest = np->ob_item;
for (i = 0; i < Py_SIZE(a); i++) { for (i = 0; i < Py_SIZE(a); i++) {
PyObject *v = src[i]; PyObject *v = src[i];
dest[i] = Py_NewRef(v); FT_ATOMIC_STORE_PTR_RELAXED(dest[i], Py_NewRef(v));
} }
src = b->ob_item; src = b->ob_item;
dest = np->ob_item + Py_SIZE(a); dest = np->ob_item + Py_SIZE(a);
for (i = 0; i < Py_SIZE(b); i++) { for (i = 0; i < Py_SIZE(b); i++) {
PyObject *v = src[i]; PyObject *v = src[i];
dest[i] = Py_NewRef(v); FT_ATOMIC_STORE_PTR_RELAXED(dest[i], Py_NewRef(v));
} }
Py_SET_SIZE(np, size); Py_SET_SIZE(np, size);
return (PyObject *)np; return (PyObject *)np;
#undef b
} }
static PyObject * static PyObject *
list_repeat(PyObject *aa, Py_ssize_t n) list_concat(PyObject *aa, PyObject *bb)
{ {
if (!PyList_Check(bb)) {
PyErr_Format(PyExc_TypeError,
"can only concatenate list (not \"%.200s\") to list",
Py_TYPE(bb)->tp_name);
return NULL;
}
PyListObject *a = (PyListObject *)aa; PyListObject *a = (PyListObject *)aa;
PyListObject *b = (PyListObject *)bb;
PyObject *ret;
Py_BEGIN_CRITICAL_SECTION2(a, b);
ret = list_concat_lock_held(a, b);
Py_END_CRITICAL_SECTION2();
return ret;
}
static PyObject *
list_repeat_lock_held(PyListObject *a, Py_ssize_t n)
{
const Py_ssize_t input_size = Py_SIZE(a); const Py_ssize_t input_size = Py_SIZE(a);
if (input_size == 0 || n <= 0) if (input_size == 0 || n <= 0)
return PyList_New(0); return PyList_New(0);
@ -626,7 +627,7 @@ list_repeat(PyObject *aa, Py_ssize_t n)
_Py_RefcntAdd(elem, n); _Py_RefcntAdd(elem, n);
PyObject **dest_end = dest + output_size; PyObject **dest_end = dest + output_size;
while (dest < dest_end) { while (dest < dest_end) {
*dest++ = elem; FT_ATOMIC_STORE_PTR_RELAXED(*dest++, elem);
} }
} }
else { else {
@ -634,7 +635,7 @@ list_repeat(PyObject *aa, Py_ssize_t n)
PyObject **src_end = src + input_size; PyObject **src_end = src + input_size;
while (src < src_end) { while (src < src_end) {
_Py_RefcntAdd(*src, n); _Py_RefcntAdd(*src, n);
*dest++ = *src++; FT_ATOMIC_STORE_PTR_RELAXED(*dest++, *src++);
} }
_Py_memory_repeat((char *)np->ob_item, sizeof(PyObject *)*output_size, _Py_memory_repeat((char *)np->ob_item, sizeof(PyObject *)*output_size,
@ -645,6 +646,17 @@ list_repeat(PyObject *aa, Py_ssize_t n)
return (PyObject *) np; return (PyObject *) np;
} }
static PyObject *
list_repeat(PyObject *aa, Py_ssize_t n)
{
PyObject *ret;
PyListObject *a = (PyListObject *)aa;
Py_BEGIN_CRITICAL_SECTION(a);
ret = list_repeat_lock_held(a, n);
Py_END_CRITICAL_SECTION();
return ret;
}
static void static void
list_clear(PyListObject *a) list_clear(PyListObject *a)
{ {
@ -657,11 +669,12 @@ list_clear(PyListObject *a)
this list, we make it empty first. */ this list, we make it empty first. */
Py_ssize_t i = Py_SIZE(a); Py_ssize_t i = Py_SIZE(a);
Py_SET_SIZE(a, 0); Py_SET_SIZE(a, 0);
a->ob_item = NULL; FT_ATOMIC_STORE_PTR_RELEASE(a->ob_item, NULL);
a->allocated = 0; a->allocated = 0;
while (--i >= 0) { while (--i >= 0) {
Py_XDECREF(items[i]); Py_XDECREF(items[i]);
} }
// TODO: Use QSBR technique, if the list is shared between threads,
PyMem_Free(items); PyMem_Free(items);
// Note that there is no guarantee that the list is actually empty // Note that there is no guarantee that the list is actually empty
@ -798,9 +811,8 @@ PyList_SetSlice(PyObject *a, Py_ssize_t ilow, Py_ssize_t ihigh, PyObject *v)
} }
static PyObject * static PyObject *
list_inplace_repeat(PyObject *_self, Py_ssize_t n) list_inplace_repeat_lock_held(PyListObject *self, Py_ssize_t n)
{ {
PyListObject *self = (PyListObject *)_self;
Py_ssize_t input_size = PyList_GET_SIZE(self); Py_ssize_t input_size = PyList_GET_SIZE(self);
if (input_size == 0 || n == 1) { if (input_size == 0 || n == 1) {
return Py_NewRef(self); return Py_NewRef(self);
@ -829,21 +841,51 @@ list_inplace_repeat(PyObject *_self, Py_ssize_t n)
return Py_NewRef(self); return Py_NewRef(self);
} }
static int static PyObject *
list_ass_item(PyObject *aa, Py_ssize_t i, PyObject *v) list_inplace_repeat(PyObject *_self, Py_ssize_t n)
{
PyObject *ret;
PyListObject *self = (PyListObject *) _self;
Py_BEGIN_CRITICAL_SECTION(self);
ret = list_inplace_repeat_lock_held(self, n);
Py_END_CRITICAL_SECTION();
return ret;
}
static int
list_ass_item_lock_held(PyListObject *a, Py_ssize_t i, PyObject *v)
{ {
PyListObject *a = (PyListObject *)aa;
if (!valid_index(i, Py_SIZE(a))) { if (!valid_index(i, Py_SIZE(a))) {
PyErr_SetString(PyExc_IndexError, PyErr_SetString(PyExc_IndexError,
"list assignment index out of range"); "list assignment index out of range");
return -1; return -1;
} }
if (v == NULL) PyObject *tmp = a->ob_item[i];
return list_ass_slice(a, i, i+1, v); if (v == NULL) {
Py_SETREF(a->ob_item[i], Py_NewRef(v)); Py_ssize_t size = Py_SIZE(a);
for (Py_ssize_t idx = i; idx < size - 1; idx++) {
FT_ATOMIC_STORE_PTR_RELAXED(a->ob_item[idx], a->ob_item[idx + 1]);
}
Py_SET_SIZE(a, size - 1);
}
else {
FT_ATOMIC_STORE_PTR_RELEASE(a->ob_item[i], Py_NewRef(v));
}
Py_DECREF(tmp);
return 0; return 0;
} }
static int
list_ass_item(PyObject *aa, Py_ssize_t i, PyObject *v)
{
int ret;
PyListObject *a = (PyListObject *)aa;
Py_BEGIN_CRITICAL_SECTION(a);
ret = list_ass_item_lock_held(a, i, v);
Py_END_CRITICAL_SECTION();
return ret;
}
/*[clinic input] /*[clinic input]
@critical_section @critical_section
list.insert list.insert
@ -2979,7 +3021,7 @@ list___sizeof___impl(PyListObject *self)
/*[clinic end generated code: output=3417541f95f9a53e input=b8030a5d5ce8a187]*/ /*[clinic end generated code: output=3417541f95f9a53e input=b8030a5d5ce8a187]*/
{ {
size_t res = _PyObject_SIZE(Py_TYPE(self)); size_t res = _PyObject_SIZE(Py_TYPE(self));
Py_ssize_t allocated = LOAD_SSIZE(self->allocated); Py_ssize_t allocated = FT_ATOMIC_LOAD_SSIZE_RELAXED(self->allocated);
res += (size_t)allocated * sizeof(void*); res += (size_t)allocated * sizeof(void*);
return PyLong_FromSize_t(res); return PyLong_FromSize_t(res);
} }
@ -3382,7 +3424,7 @@ static PyObject *
listiter_next(PyObject *self) listiter_next(PyObject *self)
{ {
_PyListIterObject *it = (_PyListIterObject *)self; _PyListIterObject *it = (_PyListIterObject *)self;
Py_ssize_t index = LOAD_SSIZE(it->it_index); Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
if (index < 0) { if (index < 0) {
return NULL; return NULL;
} }
@ -3390,7 +3432,7 @@ listiter_next(PyObject *self)
PyObject *item = list_get_item_ref(it->it_seq, index); PyObject *item = list_get_item_ref(it->it_seq, index);
if (item == NULL) { if (item == NULL) {
// out-of-bounds // out-of-bounds
STORE_SSIZE(it->it_index, -1); FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, -1);
#ifndef Py_GIL_DISABLED #ifndef Py_GIL_DISABLED
PyListObject *seq = it->it_seq; PyListObject *seq = it->it_seq;
it->it_seq = NULL; it->it_seq = NULL;
@ -3398,7 +3440,7 @@ listiter_next(PyObject *self)
#endif #endif
return NULL; return NULL;
} }
STORE_SSIZE(it->it_index, index + 1); FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index + 1);
return item; return item;
} }
@ -3407,7 +3449,7 @@ listiter_len(PyObject *self, PyObject *Py_UNUSED(ignored))
{ {
assert(self != NULL); assert(self != NULL);
_PyListIterObject *it = (_PyListIterObject *)self; _PyListIterObject *it = (_PyListIterObject *)self;
Py_ssize_t index = LOAD_SSIZE(it->it_index); Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
if (index >= 0) { if (index >= 0) {
Py_ssize_t len = PyList_GET_SIZE(it->it_seq) - index; Py_ssize_t len = PyList_GET_SIZE(it->it_seq) - index;
if (len >= 0) if (len >= 0)
@ -3537,7 +3579,7 @@ listreviter_next(PyObject *self)
{ {
listreviterobject *it = (listreviterobject *)self; listreviterobject *it = (listreviterobject *)self;
assert(it != NULL); assert(it != NULL);
Py_ssize_t index = LOAD_SSIZE(it->it_index); Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
if (index < 0) { if (index < 0) {
return NULL; return NULL;
} }
@ -3546,10 +3588,10 @@ listreviter_next(PyObject *self)
assert(PyList_Check(seq)); assert(PyList_Check(seq));
PyObject *item = list_get_item_ref(seq, index); PyObject *item = list_get_item_ref(seq, index);
if (item != NULL) { if (item != NULL) {
STORE_SSIZE(it->it_index, index - 1); FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, index - 1);
return item; return item;
} }
STORE_SSIZE(it->it_index, -1); FT_ATOMIC_STORE_SSIZE_RELAXED(it->it_index, -1);
#ifndef Py_GIL_DISABLED #ifndef Py_GIL_DISABLED
it->it_seq = NULL; it->it_seq = NULL;
Py_DECREF(seq); Py_DECREF(seq);
@ -3561,7 +3603,7 @@ static PyObject *
listreviter_len(PyObject *self, PyObject *Py_UNUSED(ignored)) listreviter_len(PyObject *self, PyObject *Py_UNUSED(ignored))
{ {
listreviterobject *it = (listreviterobject *)self; listreviterobject *it = (listreviterobject *)self;
Py_ssize_t index = LOAD_SSIZE(it->it_index); Py_ssize_t index = FT_ATOMIC_LOAD_SSIZE_RELAXED(it->it_index);
Py_ssize_t len = index + 1; Py_ssize_t len = index + 1;
if (it->it_seq == NULL || PyList_GET_SIZE(it->it_seq) < len) if (it->it_seq == NULL || PyList_GET_SIZE(it->it_seq) < len)
len = 0; len = 0;