#ifndef Py_INTERNAL_GC_H
#define Py_INTERNAL_GC_H
#ifdef __cplusplus
extern "C" {
#endif

#ifndef Py_BUILD_CORE
# error "this header requires Py_BUILD_CORE define"
#endif

#include "pycore_freelist.h"   // _PyFreeListState

/* GC information is stored BEFORE the object structure. */
typedef struct {
    // Pointer to next object in the list.
    // 0 means the object is not tracked
    uintptr_t _gc_next;

    // Pointer to previous object in the list.
    // Lowest two bits are used for flags documented later.
    uintptr_t _gc_prev;
} PyGC_Head;

#define _PyGC_Head_UNUSED PyGC_Head

/* Get an object's GC head */
static inline PyGC_Head* _Py_AS_GC(PyObject *op) {
    char *gc = ((char*)op) - sizeof(PyGC_Head);
    return (PyGC_Head*)gc;
}

/* Get the object given the GC head */
static inline PyObject* _Py_FROM_GC(PyGC_Head *gc) {
    char *op = ((char *)gc) + sizeof(PyGC_Head);
    return (PyObject *)op;
}
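/* Illustrative sketch (not part of CPython): because the PyGC_Head is
   allocated immediately before the object, _Py_AS_GC and _Py_FROM_GC are
   exact inverses of each other. */
static inline int _Py_ExampleGCHeadRoundTrip(PyObject *op) {
    PyGC_Head *gc = _Py_AS_GC(op);
    // Holds for any object whose type has Py_TPFLAGS_HAVE_GC set.
    return _Py_FROM_GC(gc) == op;
}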
/* Bit flags for ob_gc_bits (in Py_GIL_DISABLED builds) */
#ifdef Py_GIL_DISABLED
# define _PyGC_BITS_TRACKED        (1)  // Tracked by the GC
# define _PyGC_BITS_FINALIZED      (2)  // tp_finalize was called
# define _PyGC_BITS_UNREACHABLE    (4)
# define _PyGC_BITS_FROZEN         (8)
# define _PyGC_BITS_SHARED         (16)
# define _PyGC_BITS_SHARED_INLINE  (32)
# define _PyGC_BITS_DEFERRED       (64) // Use deferred reference counting
#endif

/* True if the object is currently tracked by the GC. */
static inline int _PyObject_GC_IS_TRACKED(PyObject *op) {
#ifdef Py_GIL_DISABLED
    return (op->ob_gc_bits & _PyGC_BITS_TRACKED) != 0;
#else
    PyGC_Head *gc = _Py_AS_GC(op);
    return (gc->_gc_next != 0);
#endif
}
#define _PyObject_GC_IS_TRACKED(op) _PyObject_GC_IS_TRACKED(_Py_CAST(PyObject*, op))

/* True if the object may be tracked by the GC in the future, or already is.
   This can be useful to implement some optimizations. */
static inline int _PyObject_GC_MAY_BE_TRACKED(PyObject *obj) {
    if (!PyObject_IS_GC(obj)) {
        return 0;
    }
    if (PyTuple_CheckExact(obj)) {
        return _PyObject_GC_IS_TRACKED(obj);
    }
    return 1;
}
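/* Illustrative sketch (hypothetical helper, not CPython's actual code):
   a tuple is eligible for untracking once none of its items may ever be
   tracked, per the NOTE on untracking further below. */
static inline int _PyGC_ExampleTupleCanBeUntracked(PyObject *tuple) {
    assert(PyTuple_CheckExact(tuple));
    for (Py_ssize_t i = 0; i < PyTuple_GET_SIZE(tuple); i++) {
        if (_PyObject_GC_MAY_BE_TRACKED(PyTuple_GET_ITEM(tuple, i))) {
            return 0;   // this item could still join a reference cycle
        }
    }
    return 1;
}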
#ifdef Py_GIL_DISABLED

/* True if memory the object references is shared between
 * multiple threads and needs special handling when freeing
 * those references due to the possibility of in-flight
 * lock-free reads occurring.  The object is responsible
 * for calling _PyMem_FreeDelayed on the referenced
 * memory. */
static inline int _PyObject_GC_IS_SHARED(PyObject *op) {
    return (op->ob_gc_bits & _PyGC_BITS_SHARED) != 0;
}
#define _PyObject_GC_IS_SHARED(op) _PyObject_GC_IS_SHARED(_Py_CAST(PyObject*, op))

static inline void _PyObject_GC_SET_SHARED(PyObject *op) {
    op->ob_gc_bits |= _PyGC_BITS_SHARED;
}
#define _PyObject_GC_SET_SHARED(op) _PyObject_GC_SET_SHARED(_Py_CAST(PyObject*, op))
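/* Illustrative sketch (hypothetical; assumes _PyMem_FreeDelayed, which the
   comment above names, is in scope): swapping out a buffer that lock-free
   readers in other threads may still be traversing. */
static inline void _PyGC_ExampleReplaceSharedBuffer(PyObject *op, void **slot, void *new_buf) {
    void *old_buf = *slot;
    *slot = new_buf;
    if (_PyObject_GC_IS_SHARED(op)) {
        _PyMem_FreeDelayed(old_buf);   // readers may still hold old_buf
    }
    else {
        PyMem_Free(old_buf);           // no concurrent readers possible
    }
}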
/* True if the memory of the object is shared between multiple
 * threads and needs special handling when freeing due to
 * the possibility of in-flight lock-free reads occurring.
 * Objects with this bit that are GC objects will automatically
 * be delay-freed by PyObject_GC_Del. */
static inline int _PyObject_GC_IS_SHARED_INLINE(PyObject *op) {
    return (op->ob_gc_bits & _PyGC_BITS_SHARED_INLINE) != 0;
}
#define _PyObject_GC_IS_SHARED_INLINE(op) \
    _PyObject_GC_IS_SHARED_INLINE(_Py_CAST(PyObject*, op))

static inline void _PyObject_GC_SET_SHARED_INLINE(PyObject *op) {
    op->ob_gc_bits |= _PyGC_BITS_SHARED_INLINE;
}
#define _PyObject_GC_SET_SHARED_INLINE(op) \
    _PyObject_GC_SET_SHARED_INLINE(_Py_CAST(PyObject*, op))

#endif

/* Bit flags for _gc_prev */
/* Bit 0 is set when tp_finalize is called */
#define _PyGC_PREV_MASK_FINALIZED  1
/* Bit 1 is set when the object is in the generation currently being GCed. */
#define _PyGC_PREV_MASK_COLLECTING 2

/* Bit 0 in _gc_next is the old space bit.
 * It is set as follows:
 * Young: gcstate->visited_space
 * old[0]: 0
 * old[1]: 1
 * permanent: 0
 *
 * During a collection all objects handled should have the bit set to
 * gcstate->visited_space, as objects are moved from the young gen
 * and the increment into old[gcstate->visited_space].
 * When objects are moved from the pending space, old[gcstate->visited_space^1],
 * into the increment, the old space bit is flipped.
 */
#define _PyGC_NEXT_MASK_OLD_SPACE_1    1

#define _PyGC_PREV_SHIFT           2
#define _PyGC_PREV_MASK            (((uintptr_t) -1) << _PyGC_PREV_SHIFT)
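/* Illustrative sketch (not part of CPython): PyGC_Head is pointer-aligned,
   so the low _PyGC_PREV_SHIFT bits of a head pointer are always zero and
   the flag bits above can ride along inside _gc_prev. */
static inline uintptr_t _PyGC_ExamplePackPrev(PyGC_Head *prev, int finalized) {
    uintptr_t bits = (uintptr_t)prev;
    assert((bits & ~_PyGC_PREV_MASK) == 0);   // alignment keeps low bits free
    if (finalized) {
        bits |= _PyGC_PREV_MASK_FINALIZED;
    }
    return bits;
}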
/* set for debugging information */
#define _PyGC_DEBUG_STATS             (1<<0) /* print collection statistics */
#define _PyGC_DEBUG_COLLECTABLE       (1<<1) /* print collectable objects */
#define _PyGC_DEBUG_UNCOLLECTABLE     (1<<2) /* print uncollectable objects */
#define _PyGC_DEBUG_SAVEALL           (1<<5) /* save all garbage in gc.garbage */
#define _PyGC_DEBUG_LEAK              (_PyGC_DEBUG_COLLECTABLE | \
                                       _PyGC_DEBUG_UNCOLLECTABLE | \
                                       _PyGC_DEBUG_SAVEALL)
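/* Illustrative sketch (hypothetical helper): the debug flags combine
   bitwise, and the parenthesized _PyGC_DEBUG_LEAK composite now tests
   safely inside a larger expression. */
static inline int _PyGC_ExampleLeakDebugging(int debug) {
    return (debug & _PyGC_DEBUG_LEAK) != 0;
}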
typedef enum {
    // GC was triggered by heap allocation
    _Py_GC_REASON_HEAP,

    // GC was called during shutdown
    _Py_GC_REASON_SHUTDOWN,

    // GC was called by gc.collect() or PyGC_Collect()
    _Py_GC_REASON_MANUAL
} _PyGC_Reason;

// The lowest bit of _gc_next is used for flags only inside the GC;
// it is always 0 for normal code.
static inline PyGC_Head* _PyGCHead_NEXT(PyGC_Head *gc) {
    uintptr_t next = gc->_gc_next & _PyGC_PREV_MASK;
    return (PyGC_Head*)next;
}
static inline void _PyGCHead_SET_NEXT(PyGC_Head *gc, PyGC_Head *next) {
    uintptr_t unext = (uintptr_t)next;
    assert((unext & ~_PyGC_PREV_MASK) == 0);
    gc->_gc_next = (gc->_gc_next & ~_PyGC_PREV_MASK) | unext;
}

// The lowest two bits of _gc_prev are used for the _PyGC_PREV_MASK_* flags.
static inline PyGC_Head* _PyGCHead_PREV(PyGC_Head *gc) {
    uintptr_t prev = (gc->_gc_prev & _PyGC_PREV_MASK);
    return (PyGC_Head*)prev;
}

static inline void _PyGCHead_SET_PREV(PyGC_Head *gc, PyGC_Head *prev) {
    uintptr_t uprev = (uintptr_t)prev;
    assert((uprev & ~_PyGC_PREV_MASK) == 0);
    gc->_gc_prev = ((gc->_gc_prev & ~_PyGC_PREV_MASK) | uprev);
}
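/* Illustrative sketch (hypothetical helper; the real list primitives are
   the static gc_list_* functions in CPython's GC implementation): splice
   `node` in front of `succ` using the accessors above, which preserve the
   flag bits stored in the low bits of both words. */
static inline void _PyGC_ExampleLinkBefore(PyGC_Head *node, PyGC_Head *succ) {
    PyGC_Head *pred = _PyGCHead_PREV(succ);
    _PyGCHead_SET_NEXT(pred, node);
    _PyGCHead_SET_PREV(node, pred);
    _PyGCHead_SET_NEXT(node, succ);
    _PyGCHead_SET_PREV(succ, node);
}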
static inline int _PyGC_FINALIZED(PyObject *op) {
#ifdef Py_GIL_DISABLED
    return (op->ob_gc_bits & _PyGC_BITS_FINALIZED) != 0;
#else
    PyGC_Head *gc = _Py_AS_GC(op);
    return ((gc->_gc_prev & _PyGC_PREV_MASK_FINALIZED) != 0);
#endif
}
static inline void _PyGC_SET_FINALIZED(PyObject *op) {
#ifdef Py_GIL_DISABLED
    op->ob_gc_bits |= _PyGC_BITS_FINALIZED;
#else
    PyGC_Head *gc = _Py_AS_GC(op);
    gc->_gc_prev |= _PyGC_PREV_MASK_FINALIZED;
#endif
}
static inline void _PyGC_CLEAR_FINALIZED(PyObject *op) {
#ifdef Py_GIL_DISABLED
    op->ob_gc_bits &= ~_PyGC_BITS_FINALIZED;
#else
    PyGC_Head *gc = _Py_AS_GC(op);
    gc->_gc_prev &= ~_PyGC_PREV_MASK_FINALIZED;
#endif
}
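/* Illustrative sketch (simplified from PyObject_CallFinalizer's use of
   these helpers): the FINALIZED bit is what guarantees tp_finalize runs at
   most once per object, even if a finalizer resurrects it. */
static inline void _PyGC_ExampleFinalizeOnce(PyObject *op) {
    if (Py_TYPE(op)->tp_finalize != NULL && !_PyGC_FINALIZED(op)) {
        Py_TYPE(op)->tp_finalize(op);
        _PyGC_SET_FINALIZED(op);
    }
}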
/* GC runtime state */

/* If we change this, we need to change the default value in the
   signature of gc.collect. */
#define NUM_GENERATIONS 3
/*
   NOTE: about untracking of mutable objects.

   Certain types of container cannot participate in a reference cycle, and
   so do not need to be tracked by the garbage collector. Untracking these
   objects reduces the cost of garbage collections. However, determining
   which objects may be untracked is not free, and the costs must be
   weighed against the benefits for garbage collection.

   There are two possible strategies for when to untrack a container:

   i) When the container is created.
   ii) When the container is examined by the garbage collector.

   Tuples containing only immutable objects (integers, strings etc., and
   recursively, tuples of immutable objects) do not need to be tracked.
   The interpreter creates a large number of tuples, many of which will
   not survive until garbage collection. It is therefore not worthwhile
   to untrack eligible tuples at creation time.

   Instead, all tuples except the empty tuple are tracked when created.
   During garbage collection it is determined whether any surviving tuples
   can be untracked. A tuple can be untracked if all of its contents are
   already not tracked. Tuples are examined for untracking in all garbage
   collection cycles. It may take more than one cycle to untrack a tuple.

   Dictionaries containing only immutable objects also do not need to be
   tracked. Dictionaries are untracked when created. If a tracked item is
   inserted into a dictionary (either as a key or value), the dictionary
   becomes tracked. During a full garbage collection (all generations),
   the collector will untrack any dictionaries whose contents are not
   tracked.

   The gc module provides the Python function is_tracked(obj), which returns
   the current tracking status of the object. Subsequent garbage
   collections may change the tracking status of the object.

   Untracking of certain containers was introduced in issue #4688, and
   the algorithm was refined in response to issue #14775.
*/
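/* Illustrative sketch (hypothetical; the real logic lives in
   Objects/dictobject.c): per the NOTE above, a dict starts untracked and
   must become tracked as soon as it stores an item that may itself be
   tracked. */
static inline void _PyGC_ExampleTrackDictOnStore(PyObject *dict, PyObject *value) {
    if (!_PyObject_GC_IS_TRACKED(dict) && _PyObject_GC_MAY_BE_TRACKED(value)) {
        PyObject_GC_Track(dict);   // dict now participates in cycle detection
    }
    /* ... actual insertion of the item elided ... */
}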
struct gc_generation {
    PyGC_Head head;
    int threshold;   /* collection threshold */
    int count;       /* count of allocations or collections of younger
                        generations */
};
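/* Illustrative sketch (hypothetical; mirrors the allocation-count trigger
   in CPython's GC implementation): a generation becomes due for collection
   once its count exceeds its threshold; a threshold of 0 disables it. */
static inline int _PyGC_ExampleGenerationDue(const struct gc_generation *gen) {
    return gen->threshold != 0 && gen->count > gen->threshold;
}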
struct gc_collection_stats {
    /* number of collected objects */
    Py_ssize_t collected;
    /* total number of uncollectable objects (put into gc.garbage) */
    Py_ssize_t uncollectable;
};

/* Running stats per generation */
struct gc_generation_stats {
    /* total number of collections */
    Py_ssize_t collections;
    /* total number of collected objects */
    Py_ssize_t collected;
    /* total number of uncollectable objects (put into gc.garbage) */
    Py_ssize_t uncollectable;
};

struct _gc_runtime_state {
    /* List of objects that still need to be cleaned up, singly linked
     * via their gc headers' gc_prev pointers. */
    PyObject *trash_delete_later;
    /* Current call-stack depth of tp_dealloc calls. */
    int trash_delete_nesting;

    /* Is automatic collection enabled? */
    int enabled;
    int debug;
    /* linked lists of container objects */
    struct gc_generation young;
    struct gc_generation old[2];
    /* a permanent generation which won't be collected */
    struct gc_generation permanent_generation;
    struct gc_generation_stats generation_stats[NUM_GENERATIONS];
    /* true if we are currently running the collector */
    int collecting;
    /* list of uncollectable objects */
    PyObject *garbage;
    /* a list of callbacks to be invoked when collection is performed */
    PyObject *callbacks;

    Py_ssize_t heap_size;
    Py_ssize_t work_to_do;
    /* Which of the old spaces is the visited space */
    int visited_space;

#ifdef Py_GIL_DISABLED
    /* This is the number of objects that survived the last full
       collection. It approximates the number of long-lived objects
       tracked by the GC.

       (By "full collection", we mean a collection of the oldest
       generation.) */
    Py_ssize_t long_lived_total;
    /* This is the number of objects that survived all "non-full"
       collections, and are waiting to undergo a full collection for
       the first time. */
    Py_ssize_t long_lived_pending;
#endif
};
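/* Illustrative sketch (hypothetical helper): per the old-space-bit comment
   near _PyGC_NEXT_MASK_OLD_SPACE_1, finishing a full scavenge swaps the
   roles of the two old spaces by flipping visited_space. */
static inline void _PyGC_ExampleFlipVisitedSpace(struct _gc_runtime_state *gcstate) {
    gcstate->visited_space ^= 1;   // old[visited] and old[pending] trade places
}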
#ifdef Py_GIL_DISABLED
struct _gc_thread_state {
    /* Thread-local allocation count. */
    Py_ssize_t alloc_count;
};
#endif

extern void _PyGC_InitState(struct _gc_runtime_state *);

extern Py_ssize_t _PyGC_Collect(PyThreadState *tstate, int generation, _PyGC_Reason reason);
extern void _PyGC_CollectNoFail(PyThreadState *tstate);
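/* Illustrative sketch (an assumption about usage, not a declared API):
   a manual full collection, analogous to gc.collect(), selects the oldest
   generation. */
static inline Py_ssize_t _PyGC_ExampleCollectAll(PyThreadState *tstate) {
    return _PyGC_Collect(tstate, NUM_GENERATIONS - 1, _Py_GC_REASON_MANUAL);
}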
/* Freeze objects tracked by the GC and ignore them in future collections. */
extern void _PyGC_Freeze(PyInterpreterState *interp);
/* Unfreeze objects, placing them in the oldest generation. */
extern void _PyGC_Unfreeze(PyInterpreterState *interp);
/* Number of frozen objects */
extern Py_ssize_t _PyGC_GetFreezeCount(PyInterpreterState *interp);

extern PyObject *_PyGC_GetObjects(PyInterpreterState *interp, int generation);
extern PyObject *_PyGC_GetReferrers(PyInterpreterState *interp, PyObject *objs);

// Functions to clear types' free lists
extern void _PyGC_ClearAllFreeLists(PyInterpreterState *interp);
extern void _Py_ScheduleGC(PyThreadState *tstate);
extern void _Py_RunGC(PyThreadState *tstate);

#ifdef __cplusplus
}
#endif
#endif /* !Py_INTERNAL_GC_H */