Skip to content

Commit b11a384

Browse files
authored
gh-98724: Fix Py_CLEAR() macro side effects (#99100) (#100070)
The Py_CLEAR(), Py_SETREF() and Py_XSETREF() macros now only evaluate their arguments once. If an argument has side effects, these side effects are no longer duplicated. Use temporary variables to avoid duplicating side effects of macro arguments. If available, use _Py_TYPEOF() to avoid type punning. Otherwise, use memcpy() for the assignment to prevent a miscompilation with strict aliasing caused by type punning. Add _Py_TYPEOF() macro: __typeof__() on GCC and clang. Add test_py_clear() and test_py_setref() unit tests to _testcapi.
1 parent 7031275 commit b11a384

File tree

7 files changed

+235
-29
lines changed

7 files changed

+235
-29
lines changed

Doc/c-api/refcounting.rst

+44-2
Original file line numberDiff line numberDiff line change
@@ -7,8 +7,8 @@
77
Reference Counting
88
******************
99

10-
The macros in this section are used for managing reference counts of Python
11-
objects.
10+
The functions and macros in this section are used for managing reference counts
11+
of Python objects.
1212

1313

1414
.. c:function:: Py_ssize_t Py_REFCNT(PyObject *o)
@@ -129,6 +129,11 @@ objects.
129129
It is a good idea to use this macro whenever decrementing the reference
130130
count of an object that might be traversed during garbage collection.
131131
132+
.. versionchanged:: 3.12
133+
The macro argument is now only evaluated once. If the argument has side
134+
effects, these are no longer duplicated.
135+
136+
132137
.. c:function:: void Py_IncRef(PyObject *o)
133138
134139
Increment the reference count for object *o*. A function version of :c:func:`Py_XINCREF`.
@@ -139,3 +144,40 @@ objects.
139144
140145
Decrement the reference count for object *o*. A function version of :c:func:`Py_XDECREF`.
141146
It can be used for runtime dynamic embedding of Python.
147+
148+
149+
.. c:macro:: Py_SETREF(dst, src)
150+
151+
Macro safely decrementing the `dst` reference count and setting `dst` to
152+
`src`.
153+
154+
As in case of :c:func:`Py_CLEAR`, "the obvious" code can be deadly::
155+
156+
Py_DECREF(dst);
157+
dst = src;
158+
159+
The safe way is::
160+
161+
Py_SETREF(dst, src);
162+
163+
That arranges to set `dst` to `src` _before_ decrementing reference count of
164+
*dst* old value, so that any code triggered as a side-effect of `dst`
165+
getting torn down no longer believes `dst` points to a valid object.
166+
167+
.. versionadded:: 3.6
168+
169+
.. versionchanged:: 3.12
170+
The macro arguments are now only evaluated once. If an argument has side
171+
effects, these are no longer duplicated.
172+
173+
174+
.. c:macro:: Py_XSETREF(dst, src)
175+
176+
Variant of :c:macro:`Py_SETREF` macro that uses :c:func:`Py_XDECREF` instead
177+
of :c:func:`Py_DECREF`.
178+
179+
.. versionadded:: 3.6
180+
181+
.. versionchanged:: 3.12
182+
The macro arguments are now only evaluated once. If an argument has side
183+
effects, these are no longer duplicated.

Doc/whatsnew/3.12.rst

+5
Original file line numberDiff line numberDiff line change
@@ -851,6 +851,11 @@ Porting to Python 3.12
851851
:class:`bytes` type is accepted for bytes strings.
852852
(Contributed by Victor Stinner in :gh:`98393`.)
853853

854+
* The :c:macro:`Py_CLEAR`, :c:macro:`Py_SETREF` and :c:macro:`Py_XSETREF`
855+
macros now only evaluate their arguments once. If an argument has side
856+
effects, these side effects are no longer duplicated.
857+
(Contributed by Victor Stinner in :gh:`98724`.)
858+
854859
Deprecated
855860
----------
856861

Include/cpython/object.h

+51-20
Original file line numberDiff line numberDiff line change
@@ -305,38 +305,69 @@ _PyObject_GenericSetAttrWithDict(PyObject *, PyObject *,
305305

306306
PyAPI_FUNC(PyObject *) _PyObject_FunctionStr(PyObject *);
307307

308-
/* Safely decref `op` and set `op` to `op2`.
308+
/* Safely decref `dst` and set `dst` to `src`.
309309
*
310310
* As in case of Py_CLEAR "the obvious" code can be deadly:
311311
*
312-
* Py_DECREF(op);
313-
* op = op2;
312+
* Py_DECREF(dst);
313+
* dst = src;
314314
*
315315
* The safe way is:
316316
*
317-
* Py_SETREF(op, op2);
317+
* Py_SETREF(dst, src);
318318
*
319-
* That arranges to set `op` to `op2` _before_ decref'ing, so that any code
320-
* triggered as a side-effect of `op` getting torn down no longer believes
321-
* `op` points to a valid object.
319+
* That arranges to set `dst` to `src` _before_ decref'ing, so that any code
320+
* triggered as a side-effect of `dst` getting torn down no longer believes
321+
* `dst` points to a valid object.
322322
*
323-
* Py_XSETREF is a variant of Py_SETREF that uses Py_XDECREF instead of
324-
* Py_DECREF.
323+
* Temporary variables are used to only evalutate macro arguments once and so
324+
* avoid the duplication of side effects. _Py_TYPEOF() or memcpy() is used to
325+
* avoid a miscompilation caused by type punning. See Py_CLEAR() comment for
326+
* implementation details about type punning.
327+
*
328+
* The memcpy() implementation does not emit a compiler warning if 'src' has
329+
* not the same type than 'src': any pointer type is accepted for 'src'.
325330
*/
326-
327-
#define Py_SETREF(op, op2) \
328-
do { \
329-
PyObject *_py_tmp = _PyObject_CAST(op); \
330-
(op) = (op2); \
331-
Py_DECREF(_py_tmp); \
331+
#ifdef _Py_TYPEOF
332+
#define Py_SETREF(dst, src) \
333+
do { \
334+
_Py_TYPEOF(dst)* _tmp_dst_ptr = &(dst); \
335+
_Py_TYPEOF(dst) _tmp_old_dst = (*_tmp_dst_ptr); \
336+
*_tmp_dst_ptr = (src); \
337+
Py_DECREF(_tmp_old_dst); \
332338
} while (0)
339+
#else
340+
#define Py_SETREF(dst, src) \
341+
do { \
342+
PyObject **_tmp_dst_ptr = _Py_CAST(PyObject**, &(dst)); \
343+
PyObject *_tmp_old_dst = (*_tmp_dst_ptr); \
344+
PyObject *_tmp_src = _PyObject_CAST(src); \
345+
memcpy(_tmp_dst_ptr, &_tmp_src, sizeof(PyObject*)); \
346+
Py_DECREF(_tmp_old_dst); \
347+
} while (0)
348+
#endif
333349

334-
#define Py_XSETREF(op, op2) \
335-
do { \
336-
PyObject *_py_tmp = _PyObject_CAST(op); \
337-
(op) = (op2); \
338-
Py_XDECREF(_py_tmp); \
350+
/* Py_XSETREF() is a variant of Py_SETREF() that uses Py_XDECREF() instead of
351+
* Py_DECREF().
352+
*/
353+
#ifdef _Py_TYPEOF
354+
#define Py_XSETREF(dst, src) \
355+
do { \
356+
_Py_TYPEOF(dst)* _tmp_dst_ptr = &(dst); \
357+
_Py_TYPEOF(dst) _tmp_old_dst = (*_tmp_dst_ptr); \
358+
*_tmp_dst_ptr = (src); \
359+
Py_XDECREF(_tmp_old_dst); \
360+
} while (0)
361+
#else
362+
#define Py_XSETREF(dst, src) \
363+
do { \
364+
PyObject **_tmp_dst_ptr = _Py_CAST(PyObject**, &(dst)); \
365+
PyObject *_tmp_old_dst = (*_tmp_dst_ptr); \
366+
PyObject *_tmp_src = _PyObject_CAST(src); \
367+
memcpy(_tmp_dst_ptr, &_tmp_src, sizeof(PyObject*)); \
368+
Py_XDECREF(_tmp_old_dst); \
339369
} while (0)
370+
#endif
340371

341372

342373
PyAPI_DATA(PyTypeObject) _PyNone_Type;

Include/object.h

+36-7
Original file line numberDiff line numberDiff line change
@@ -598,15 +598,44 @@ static inline void Py_DECREF(PyObject *op)
598598
* one of those can't cause problems -- but in part that relies on that
599599
* Python integers aren't currently weakly referencable. Best practice is
600600
* to use Py_CLEAR() even if you can't think of a reason for why you need to.
601+
*
602+
* gh-98724: Use a temporary variable to only evaluate the macro argument once,
603+
* to avoid the duplication of side effects if the argument has side effects.
604+
*
605+
* gh-99701: If the PyObject* type is used with casting arguments to PyObject*,
606+
* the code can be miscompiled with strict aliasing because of type punning.
607+
* With strict aliasing, a compiler considers that two pointers of different
608+
* types cannot read or write the same memory which enables optimization
609+
* opportunities.
610+
*
611+
* If available, use _Py_TYPEOF() to use the 'op' type for temporary variables,
612+
* and so avoid type punning. Otherwise, use memcpy() which causes type erasure
613+
* and so prevents the compiler to reuse an old cached 'op' value after
614+
* Py_CLEAR().
601615
*/
602-
#define Py_CLEAR(op) \
603-
do { \
604-
PyObject *_py_tmp = _PyObject_CAST(op); \
605-
if (_py_tmp != NULL) { \
606-
(op) = NULL; \
607-
Py_DECREF(_py_tmp); \
608-
} \
616+
#ifdef _Py_TYPEOF
617+
#define Py_CLEAR(op) \
618+
do { \
619+
_Py_TYPEOF(op)* _tmp_op_ptr = &(op); \
620+
_Py_TYPEOF(op) _tmp_old_op = (*_tmp_op_ptr); \
621+
if (_tmp_old_op != NULL) { \
622+
*_tmp_op_ptr = _Py_NULL; \
623+
Py_DECREF(_tmp_old_op); \
624+
} \
609625
} while (0)
626+
#else
627+
#define Py_CLEAR(op) \
628+
do { \
629+
PyObject **_tmp_op_ptr = _Py_CAST(PyObject**, &(op)); \
630+
PyObject *_tmp_old_op = (*_tmp_op_ptr); \
631+
if (_tmp_old_op != NULL) { \
632+
PyObject *_null_ptr = _Py_NULL; \
633+
memcpy(_tmp_op_ptr, &_null_ptr, sizeof(PyObject*)); \
634+
Py_DECREF(_tmp_old_op); \
635+
} \
636+
} while (0)
637+
#endif
638+
610639

611640
/* Function to use in case the object pointer can be NULL: */
612641
static inline void Py_XINCREF(PyObject *op)

Include/pyport.h

+9
Original file line numberDiff line numberDiff line change
@@ -698,6 +698,15 @@ extern char * _getpty(int *, int, mode_t, int);
698698
# define _Py__has_builtin(x) 0
699699
#endif
700700

701+
// _Py_TYPEOF(expr) gets the type of an expression.
702+
//
703+
// Example: _Py_TYPEOF(x) x_copy = (x);
704+
//
705+
// The macro is only defined if GCC or clang compiler is used.
706+
#if defined(__GNUC__) || defined(__clang__)
707+
# define _Py_TYPEOF(expr) __typeof__(expr)
708+
#endif
709+
701710

702711
/* A convenient way for code to know if sanitizers are enabled. */
703712
#if defined(__has_feature)
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,3 @@
1+
The :c:macro:`Py_CLEAR`, :c:macro:`Py_SETREF` and :c:macro:`Py_XSETREF` macros
2+
now only evaluate their arguments once. If an argument has side effects, these
3+
side effects are no longer duplicated. Patch by Victor Stinner.

Modules/_testcapimodule.c

+87
Original file line numberDiff line numberDiff line change
@@ -2589,6 +2589,91 @@ test_set_type_size(PyObject *self, PyObject *Py_UNUSED(ignored))
25892589
}
25902590

25912591

2592+
// Test Py_CLEAR() macro
2593+
static PyObject*
2594+
test_py_clear(PyObject *self, PyObject *Py_UNUSED(ignored))
2595+
{
2596+
// simple case with a variable
2597+
PyObject *obj = PyList_New(0);
2598+
if (obj == NULL) {
2599+
return NULL;
2600+
}
2601+
Py_CLEAR(obj);
2602+
assert(obj == NULL);
2603+
2604+
// gh-98724: complex case, Py_CLEAR() argument has a side effect
2605+
PyObject* array[1];
2606+
array[0] = PyList_New(0);
2607+
if (array[0] == NULL) {
2608+
return NULL;
2609+
}
2610+
2611+
PyObject **p = array;
2612+
Py_CLEAR(*p++);
2613+
assert(array[0] == NULL);
2614+
assert(p == array + 1);
2615+
2616+
Py_RETURN_NONE;
2617+
}
2618+
2619+
2620+
// Test Py_SETREF() and Py_XSETREF() macros, similar to test_py_clear()
2621+
static PyObject*
2622+
test_py_setref(PyObject *self, PyObject *Py_UNUSED(ignored))
2623+
{
2624+
// Py_SETREF() simple case with a variable
2625+
PyObject *obj = PyList_New(0);
2626+
if (obj == NULL) {
2627+
return NULL;
2628+
}
2629+
Py_SETREF(obj, NULL);
2630+
assert(obj == NULL);
2631+
2632+
// Py_XSETREF() simple case with a variable
2633+
PyObject *obj2 = PyList_New(0);
2634+
if (obj2 == NULL) {
2635+
return NULL;
2636+
}
2637+
Py_XSETREF(obj2, NULL);
2638+
assert(obj2 == NULL);
2639+
// test Py_XSETREF() when the argument is NULL
2640+
Py_XSETREF(obj2, NULL);
2641+
assert(obj2 == NULL);
2642+
2643+
// gh-98724: complex case, Py_SETREF() argument has a side effect
2644+
PyObject* array[1];
2645+
array[0] = PyList_New(0);
2646+
if (array[0] == NULL) {
2647+
return NULL;
2648+
}
2649+
2650+
PyObject **p = array;
2651+
Py_SETREF(*p++, NULL);
2652+
assert(array[0] == NULL);
2653+
assert(p == array + 1);
2654+
2655+
// gh-98724: complex case, Py_XSETREF() argument has a side effect
2656+
PyObject* array2[1];
2657+
array2[0] = PyList_New(0);
2658+
if (array2[0] == NULL) {
2659+
return NULL;
2660+
}
2661+
2662+
PyObject **p2 = array2;
2663+
Py_XSETREF(*p2++, NULL);
2664+
assert(array2[0] == NULL);
2665+
assert(p2 == array2 + 1);
2666+
2667+
// test Py_XSETREF() when the argument is NULL
2668+
p2 = array2;
2669+
Py_XSETREF(*p2++, NULL);
2670+
assert(array2[0] == NULL);
2671+
assert(p2 == array2 + 1);
2672+
2673+
Py_RETURN_NONE;
2674+
}
2675+
2676+
25922677
#define TEST_REFCOUNT() \
25932678
do { \
25942679
PyObject *obj = PyList_New(0); \
@@ -3252,6 +3337,8 @@ static PyMethodDef TestMethods[] = {
32523337
{"pynumber_tobase", pynumber_tobase, METH_VARARGS},
32533338
{"without_gc", without_gc, METH_O},
32543339
{"test_set_type_size", test_set_type_size, METH_NOARGS},
3340+
{"test_py_clear", test_py_clear, METH_NOARGS},
3341+
{"test_py_setref", test_py_setref, METH_NOARGS},
32553342
{"test_refcount_macros", test_refcount_macros, METH_NOARGS},
32563343
{"test_refcount_funcs", test_refcount_funcs, METH_NOARGS},
32573344
{"test_py_is_macros", test_py_is_macros, METH_NOARGS},

0 commit comments

Comments
 (0)