blob: 56dcb101e0005e55b0f1ca132b218d1c9f8c2cc8 [file] [log] [blame]
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001/*
Tim Peters88396172002-06-30 17:56:40 +00002
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00003 Reference Cycle Garbage Collection
4 ==================================
5
Neil Schemenauerb2c2c9e2000-10-04 16:34:09 +00006 Neil Schemenauer <nas@arctrix.com>
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00007
8 Based on a post on the python-dev list. Ideas from Guido van Rossum,
9 Eric Tiedemann, and various others.
10
Neil Schemenauer43411b52001-08-30 00:05:51 +000011 http://www.arctrix.com/nas/python/gc/
Neil Schemenauera7024e92008-07-15 19:24:01 +000012
13 The following mailing list threads provide a historical perspective on
14 the design of this module. Note that a fair amount of refinement has
15 occurred since those discussions.
16
17 http://mail.python.org/pipermail/python-dev/2000-March/002385.html
18 http://mail.python.org/pipermail/python-dev/2000-March/002434.html
19 http://mail.python.org/pipermail/python-dev/2000-March/002497.html
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000020
21 For a highlevel view of the collection process, read the collect
22 function.
23
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000024*/
25
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000026#include "Python.h"
Victor Stinner27e2d1f2018-11-01 00:52:28 +010027#include "pycore_context.h"
Victor Stinner444b39b2019-11-20 01:18:11 +010028#include "pycore_initconfig.h"
Victor Stinnere5014be2020-04-14 17:52:15 +020029#include "pycore_interp.h" // PyInterpreterState.gc
Victor Stinnerbcda8f12018-11-21 22:27:47 +010030#include "pycore_object.h"
Victor Stinner2e969062019-11-20 01:49:32 +010031#include "pycore_pyerrors.h"
Victor Stinnere5014be2020-04-14 17:52:15 +020032#include "pycore_pystate.h" // _PyThreadState_GET()
Łukasz Langaa785c872016-09-09 17:37:37 -070033#include "pydtrace.h"
Victor Stinnere5014be2020-04-14 17:52:15 +020034#include "pytime.h" // _PyTime_GetMonotonicClock()
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000035
Victor Stinner67e0de62019-11-20 11:48:18 +010036typedef struct _gc_runtime_state GCState;
37
Serhiy Storchaka93260282017-02-04 11:19:59 +020038/*[clinic input]
39module gc
40[clinic start generated code]*/
41/*[clinic end generated code: output=da39a3ee5e6b4b0d input=b5c9690ecc842d79]*/
42
Pablo Galindo320dd502019-10-10 22:45:17 +010043
44#ifdef Py_DEBUG
45# define GC_DEBUG
46#endif
INADA Naoki5ac9e6e2018-07-10 17:19:53 +090047
48#define GC_NEXT _PyGCHead_NEXT
49#define GC_PREV _PyGCHead_PREV
50
// update_refs() sets this bit for all objects in the current generation.
// subtract_refs() and move_unreachable() use it to tell whether a visited
// object is part of the collection in progress.
54//
55// move_unreachable() removes this flag from reachable objects.
56// Only unreachable objects have this flag.
57//
58// No objects in interpreter have this flag after GC ends.
59#define PREV_MASK_COLLECTING _PyGC_PREV_MASK_COLLECTING
60
61// Lowest bit of _gc_next is used for UNREACHABLE flag.
62//
63// This flag represents the object is in unreachable list in move_unreachable()
64//
65// Although this flag is used only in move_unreachable(), move_unreachable()
66// doesn't clear this flag to skip unnecessary iteration.
67// move_legacy_finalizers() removes this flag instead.
68// Between them, unreachable list is not normal list and we can not use
69// most gc_list_* functions for it.
70#define NEXT_MASK_UNREACHABLE (1)
71
/* Get an object's GC head: step back one PyGC_Head from the object pointer. */
#define AS_GC(o) (((PyGC_Head *)(o)) - 1)

/* Get the object given the GC head: step forward one PyGC_Head.
 * The argument is parenthesized so that an expression argument is cast as a
 * whole rather than having the cast bind to its first operand only. */
#define FROM_GC(g) ((PyObject *)(((PyGC_Head *)(g)) + 1))
77
INADA Naoki5ac9e6e2018-07-10 17:19:53 +090078static inline int
79gc_is_collecting(PyGC_Head *g)
80{
81 return (g->_gc_prev & PREV_MASK_COLLECTING) != 0;
82}
83
84static inline void
85gc_clear_collecting(PyGC_Head *g)
86{
87 g->_gc_prev &= ~PREV_MASK_COLLECTING;
88}
89
90static inline Py_ssize_t
91gc_get_refs(PyGC_Head *g)
92{
93 return (Py_ssize_t)(g->_gc_prev >> _PyGC_PREV_SHIFT);
94}
95
96static inline void
97gc_set_refs(PyGC_Head *g, Py_ssize_t refs)
98{
99 g->_gc_prev = (g->_gc_prev & ~_PyGC_PREV_MASK)
100 | ((uintptr_t)(refs) << _PyGC_PREV_SHIFT);
101}
102
103static inline void
104gc_reset_refs(PyGC_Head *g, Py_ssize_t refs)
105{
106 g->_gc_prev = (g->_gc_prev & _PyGC_PREV_MASK_FINALIZED)
107 | PREV_MASK_COLLECTING
108 | ((uintptr_t)(refs) << _PyGC_PREV_SHIFT);
109}
110
111static inline void
112gc_decref(PyGC_Head *g)
113{
Victor Stinner626bff82018-10-25 17:31:10 +0200114 _PyObject_ASSERT_WITH_MSG(FROM_GC(g),
115 gc_get_refs(g) > 0,
116 "refcount is too small");
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900117 g->_gc_prev -= 1 << _PyGC_PREV_SHIFT;
118}
119
/* Debugging flags: a bit mask selecting what information gc reports. */
#define DEBUG_STATS         (1<<0) /* print collection statistics */
#define DEBUG_COLLECTABLE   (1<<1) /* print collectable objects */
#define DEBUG_UNCOLLECTABLE (1<<2) /* print uncollectable objects */
#define DEBUG_SAVEALL       (1<<5) /* save all garbage in gc.garbage */
/* Parenthesized so the combined mask behaves as a single operand when it is
 * used next to tighter-binding operators such as `&`, `~` or `==`. */
#define DEBUG_LEAK          (DEBUG_COLLECTABLE | \
                             DEBUG_UNCOLLECTABLE | \
                             DEBUG_SAVEALL)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000128
Victor Stinner67e0de62019-11-20 11:48:18 +0100129#define GEN_HEAD(gcstate, n) (&(gcstate)->generations[n].head)
Antoine Pitroud4156c12012-10-30 22:43:19 +0100130
Eric Snow2ebc5ce2017-09-07 23:51:28 -0600131void
Victor Stinner72474072019-11-20 12:25:50 +0100132_PyGC_InitState(GCState *gcstate)
Eric Snow2ebc5ce2017-09-07 23:51:28 -0600133{
Victor Stinner67e0de62019-11-20 11:48:18 +0100134 gcstate->enabled = 1; /* automatic collection enabled? */
Eric Snow2ebc5ce2017-09-07 23:51:28 -0600135
Victor Stinner67e0de62019-11-20 11:48:18 +0100136#define _GEN_HEAD(n) GEN_HEAD(gcstate, n)
Eric Snow2ebc5ce2017-09-07 23:51:28 -0600137 struct gc_generation generations[NUM_GENERATIONS] = {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900138 /* PyGC_Head, threshold, count */
139 {{(uintptr_t)_GEN_HEAD(0), (uintptr_t)_GEN_HEAD(0)}, 700, 0},
140 {{(uintptr_t)_GEN_HEAD(1), (uintptr_t)_GEN_HEAD(1)}, 10, 0},
141 {{(uintptr_t)_GEN_HEAD(2), (uintptr_t)_GEN_HEAD(2)}, 10, 0},
Eric Snow2ebc5ce2017-09-07 23:51:28 -0600142 };
143 for (int i = 0; i < NUM_GENERATIONS; i++) {
Victor Stinner67e0de62019-11-20 11:48:18 +0100144 gcstate->generations[i] = generations[i];
Eric Snow2ebc5ce2017-09-07 23:51:28 -0600145 };
Victor Stinner67e0de62019-11-20 11:48:18 +0100146 gcstate->generation0 = GEN_HEAD(gcstate, 0);
brainfvckc75edab2017-10-16 12:49:41 -0700147 struct gc_generation permanent_generation = {
Victor Stinner67e0de62019-11-20 11:48:18 +0100148 {(uintptr_t)&gcstate->permanent_generation.head,
149 (uintptr_t)&gcstate->permanent_generation.head}, 0, 0
brainfvckc75edab2017-10-16 12:49:41 -0700150 };
Victor Stinner67e0de62019-11-20 11:48:18 +0100151 gcstate->permanent_generation = permanent_generation;
Eric Snow2ebc5ce2017-09-07 23:51:28 -0600152}
Antoine Pitroud4156c12012-10-30 22:43:19 +0100153
Victor Stinner444b39b2019-11-20 01:18:11 +0100154
155PyStatus
Victor Stinner01b1cc12019-11-20 02:27:56 +0100156_PyGC_Init(PyThreadState *tstate)
Victor Stinner444b39b2019-11-20 01:18:11 +0100157{
Victor Stinner72474072019-11-20 12:25:50 +0100158 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +0100159 if (gcstate->garbage == NULL) {
160 gcstate->garbage = PyList_New(0);
161 if (gcstate->garbage == NULL) {
Victor Stinner444b39b2019-11-20 01:18:11 +0100162 return _PyStatus_NO_MEMORY();
163 }
164 }
165 return _PyStatus_OK();
166}
167
168
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900169/*
170_gc_prev values
171---------------
Neil Schemenauer43411b52001-08-30 00:05:51 +0000172
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900173Between collections, _gc_prev is used for doubly linked list.
Tim Peters6fc13d92002-07-02 18:12:35 +0000174
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900175Lowest two bits of _gc_prev are used for flags.
176PREV_MASK_COLLECTING is used only while collecting and cleared before GC ends
177or _PyObject_GC_UNTRACK() is called.
Tim Peters6fc13d92002-07-02 18:12:35 +0000178
During a collection, _gc_prev is temporarily used for gc_refs, and the gc list
is singly linked until _gc_prev is restored.
Tim Peters6fc13d92002-07-02 18:12:35 +0000181
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900182gc_refs
Tim Peters6fc13d92002-07-02 18:12:35 +0000183 At the start of a collection, update_refs() copies the true refcount
184 to gc_refs, for each object in the generation being collected.
185 subtract_refs() then adjusts gc_refs so that it equals the number of
186 times an object is referenced directly from outside the generation
187 being collected.
Tim Peters6fc13d92002-07-02 18:12:35 +0000188
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900189PREV_MASK_COLLECTING
190 Objects in generation being collected are marked PREV_MASK_COLLECTING in
191 update_refs().
192
193
194_gc_next values
195---------------
196
197_gc_next takes these values:
198
1990
200 The object is not tracked
201
202!= 0
203 Pointer to the next object in the GC list.
    Additionally, the lowest bit is temporarily used for the
    NEXT_MASK_UNREACHABLE flag described below.
206
207NEXT_MASK_UNREACHABLE
Tim Peters6fc13d92002-07-02 18:12:35 +0000208 move_unreachable() then moves objects not reachable (whether directly or
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900209 indirectly) from outside the generation into an "unreachable" set and
210 set this flag.
Tim Peters6fc13d92002-07-02 18:12:35 +0000211
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900212 Objects that are found to be reachable have gc_refs set to 1.
213 When this flag is set for the reachable object, the object must be in
214 "unreachable" set.
215 The flag is unset and the object is moved back to "reachable" set.
216
217 move_legacy_finalizers() will remove this flag from "unreachable" set.
Tim Peters6fc13d92002-07-02 18:12:35 +0000218*/
Neil Schemenauera2b11ec2002-05-21 15:53:24 +0000219
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000220/*** list functions ***/
221
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900222static inline void
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000223gc_list_init(PyGC_Head *list)
224{
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900225 // List header must not have flags.
226 // We can assign pointer by simple cast.
227 list->_gc_prev = (uintptr_t)list;
228 list->_gc_next = (uintptr_t)list;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000229}
230
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900231static inline int
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000232gc_list_is_empty(PyGC_Head *list)
233{
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900234 return (list->_gc_next == (uintptr_t)list);
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000235}
236
Tim Peterse2d59182004-11-01 01:39:08 +0000237/* Append `node` to `list`. */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900238static inline void
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000239gc_list_append(PyGC_Head *node, PyGC_Head *list)
240{
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900241 PyGC_Head *last = (PyGC_Head *)list->_gc_prev;
242
243 // last <-> node
244 _PyGCHead_SET_PREV(node, last);
245 _PyGCHead_SET_NEXT(last, node);
246
247 // node <-> list
248 _PyGCHead_SET_NEXT(node, list);
249 list->_gc_prev = (uintptr_t)node;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000250}
251
Tim Peterse2d59182004-11-01 01:39:08 +0000252/* Remove `node` from the gc list it's currently in. */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900253static inline void
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000254gc_list_remove(PyGC_Head *node)
255{
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900256 PyGC_Head *prev = GC_PREV(node);
257 PyGC_Head *next = GC_NEXT(node);
258
259 _PyGCHead_SET_NEXT(prev, next);
260 _PyGCHead_SET_PREV(next, prev);
261
262 node->_gc_next = 0; /* object is not currently tracked */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000263}
264
Tim Peterse2d59182004-11-01 01:39:08 +0000265/* Move `node` from the gc list it's currently in (which is not explicitly
266 * named here) to the end of `list`. This is semantically the same as
267 * gc_list_remove(node) followed by gc_list_append(node, list).
268 */
269static void
270gc_list_move(PyGC_Head *node, PyGC_Head *list)
271{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000272 /* Unlink from current list. */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900273 PyGC_Head *from_prev = GC_PREV(node);
274 PyGC_Head *from_next = GC_NEXT(node);
275 _PyGCHead_SET_NEXT(from_prev, from_next);
276 _PyGCHead_SET_PREV(from_next, from_prev);
277
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000278 /* Relink at end of new list. */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900279 // list must not have flags. So we can skip macros.
280 PyGC_Head *to_prev = (PyGC_Head*)list->_gc_prev;
281 _PyGCHead_SET_PREV(node, to_prev);
282 _PyGCHead_SET_NEXT(to_prev, node);
283 list->_gc_prev = (uintptr_t)node;
284 _PyGCHead_SET_NEXT(node, list);
Tim Peterse2d59182004-11-01 01:39:08 +0000285}
286
287/* append list `from` onto list `to`; `from` becomes an empty list */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000288static void
289gc_list_merge(PyGC_Head *from, PyGC_Head *to)
290{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000291 assert(from != to);
292 if (!gc_list_is_empty(from)) {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900293 PyGC_Head *to_tail = GC_PREV(to);
294 PyGC_Head *from_head = GC_NEXT(from);
295 PyGC_Head *from_tail = GC_PREV(from);
296 assert(from_head != from);
297 assert(from_tail != from);
298
299 _PyGCHead_SET_NEXT(to_tail, from_head);
300 _PyGCHead_SET_PREV(from_head, to_tail);
301
302 _PyGCHead_SET_NEXT(from_tail, to);
303 _PyGCHead_SET_PREV(to, from_tail);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000304 }
305 gc_list_init(from);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000306}
307
Neal Norwitz7b216c52006-03-04 20:01:53 +0000308static Py_ssize_t
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000309gc_list_size(PyGC_Head *list)
310{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000311 PyGC_Head *gc;
312 Py_ssize_t n = 0;
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900313 for (gc = GC_NEXT(list); gc != list; gc = GC_NEXT(gc)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000314 n++;
315 }
316 return n;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000317}
318
Pablo Galindo466326d2019-10-13 16:48:59 +0100319/* Walk the list and mark all objects as non-collecting */
320static inline void
321gc_list_clear_collecting(PyGC_Head *collectable)
322{
323 PyGC_Head *gc;
324 for (gc = GC_NEXT(collectable); gc != collectable; gc = GC_NEXT(gc)) {
325 gc_clear_collecting(gc);
326 }
327}
328
Tim Peters259272b2003-04-06 19:41:39 +0000329/* Append objects in a GC list to a Python list.
Pablo Galindo466326d2019-10-13 16:48:59 +0100330 * Return 0 if all OK, < 0 if error (out of memory for list)
Tim Peters259272b2003-04-06 19:41:39 +0000331 */
332static int
333append_objects(PyObject *py_list, PyGC_Head *gc_list)
334{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000335 PyGC_Head *gc;
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900336 for (gc = GC_NEXT(gc_list); gc != gc_list; gc = GC_NEXT(gc)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000337 PyObject *op = FROM_GC(gc);
338 if (op != py_list) {
339 if (PyList_Append(py_list, op)) {
340 return -1; /* exception */
341 }
342 }
343 }
344 return 0;
Tim Peters259272b2003-04-06 19:41:39 +0000345}
346
// Values accepted by validate_list's `flags` argument.  Each name states the
// expected state of the PREV_MASK_COLLECTING flag followed by the expected
// state of the NEXT_MASK_UNREACHABLE flag.
enum flagstates {
    collecting_clear_unreachable_clear = 0,
    collecting_clear_unreachable_set = 1,
    collecting_set_unreachable_clear = 2,
    collecting_set_unreachable_set = 3
};
352
#ifdef GC_DEBUG
// validate_list checks the consistency of a gc list, and doubles as
// documentation of when each flag is expected to be set or clear.
// `head` must be a doubly-linked gc list; the elements' prev and next fields
// may carry flag bits.
// Checks performed:
// - The header's own link fields carry no flag bits.
// - Every element's PREV_MASK_COLLECTING and NEXT_MASK_UNREACHABLE flags
//   match the state requested through `flags`.
// - Every element's prev link agrees with the order found by following next
//   links, including the header's prev link at the end.
static void
validate_list(PyGC_Head *head, enum flagstates flags)
{
    assert((head->_gc_prev & PREV_MASK_COLLECTING) == 0);
    assert((head->_gc_next & NEXT_MASK_UNREACHABLE) == 0);

    // Flag values every element is expected to show.
    uintptr_t want_prev_flag = 0;
    uintptr_t want_next_flag = 0;
    switch (flags) {
        case collecting_clear_unreachable_clear:
            break;
        case collecting_set_unreachable_clear:
            want_prev_flag = PREV_MASK_COLLECTING;
            break;
        case collecting_clear_unreachable_set:
            want_next_flag = NEXT_MASK_UNREACHABLE;
            break;
        case collecting_set_unreachable_set:
            want_prev_flag = PREV_MASK_COLLECTING;
            want_next_flag = NEXT_MASK_UNREACHABLE;
            break;
        default:
            assert(! "bad internal flags argument");
    }

    PyGC_Head *expected_prev = head;
    for (PyGC_Head *node = GC_NEXT(head); node != head; ) {
        PyGC_Head *linked_prev = GC_PREV(node);
        // Strip the unreachable bit by hand to recover the real next pointer.
        PyGC_Head *linked_next =
            (PyGC_Head *)(node->_gc_next & ~NEXT_MASK_UNREACHABLE);
        assert(linked_next != NULL);
        assert(linked_prev == expected_prev);
        assert((node->_gc_prev & PREV_MASK_COLLECTING) == want_prev_flag);
        assert((node->_gc_next & NEXT_MASK_UNREACHABLE) == want_next_flag);
        expected_prev = node;
        node = linked_next;
    }
    assert(expected_prev == GC_PREV(head));
}
#else
#define validate_list(x, y) do{}while(0)
#endif
402
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000403/*** end of list stuff ***/
404
405
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900406/* Set all gc_refs = ob_refcnt. After this, gc_refs is > 0 and
407 * PREV_MASK_COLLECTING bit is set for all objects in containers.
Tim Peters88396172002-06-30 17:56:40 +0000408 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000409static void
410update_refs(PyGC_Head *containers)
411{
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900412 PyGC_Head *gc = GC_NEXT(containers);
413 for (; gc != containers; gc = GC_NEXT(gc)) {
414 gc_reset_refs(gc, Py_REFCNT(FROM_GC(gc)));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000415 /* Python's cyclic gc should never see an incoming refcount
416 * of 0: if something decref'ed to 0, it should have been
417 * deallocated immediately at that time.
418 * Possible cause (if the assert triggers): a tp_dealloc
419 * routine left a gc-aware object tracked during its teardown
420 * phase, and did something-- or allowed something to happen --
421 * that called back into Python. gc can trigger then, and may
422 * see the still-tracked dying object. Before this assert
423 * was added, such mistakes went on to allow gc to try to
424 * delete the object again. In a debug build, that caused
425 * a mysterious segfault, when _Py_ForgetReference tried
426 * to remove the object from the doubly-linked list of all
427 * objects a second time. In a release build, an actual
428 * double deallocation occurred, which leads to corruption
429 * of the allocator's internal bookkeeping pointers. That's
430 * so serious that maybe this should be a release-build
431 * check instead of an assert?
432 */
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200433 _PyObject_ASSERT(FROM_GC(gc), gc_get_refs(gc) != 0);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000434 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000435}
436
Tim Peters19b74c72002-07-01 03:52:19 +0000437/* A traversal callback for subtract_refs. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000438static int
Victor Stinner4d5f94b2019-10-08 02:37:38 +0200439visit_decref(PyObject *op, void *parent)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000440{
Victor Stinner4d5f94b2019-10-08 02:37:38 +0200441 _PyObject_ASSERT(_PyObject_CAST(parent), !_PyObject_IsFreed(op));
Victor Stinnerd91d4de2019-09-09 17:44:59 +0200442
Hai Shi675d9a32020-04-15 02:11:20 +0800443 if (_PyObject_IS_GC(op)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000444 PyGC_Head *gc = AS_GC(op);
445 /* We're only interested in gc_refs for objects in the
446 * generation being collected, which can be recognized
447 * because only they have positive gc_refs.
448 */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900449 if (gc_is_collecting(gc)) {
450 gc_decref(gc);
451 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000452 }
453 return 0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000454}
455
Tim Peters19b74c72002-07-01 03:52:19 +0000456/* Subtract internal references from gc_refs. After this, gc_refs is >= 0
457 * for all objects in containers, and is GC_REACHABLE for all tracked gc
458 * objects not in containers. The ones with gc_refs > 0 are directly
459 * reachable from outside containers, and so can't be collected.
460 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000461static void
462subtract_refs(PyGC_Head *containers)
463{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000464 traverseproc traverse;
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900465 PyGC_Head *gc = GC_NEXT(containers);
466 for (; gc != containers; gc = GC_NEXT(gc)) {
Victor Stinner4d5f94b2019-10-08 02:37:38 +0200467 PyObject *op = FROM_GC(gc);
468 traverse = Py_TYPE(op)->tp_traverse;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000469 (void) traverse(FROM_GC(gc),
470 (visitproc)visit_decref,
Victor Stinner4d5f94b2019-10-08 02:37:38 +0200471 op);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000472 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000473}
474
Tim Peters19b74c72002-07-01 03:52:19 +0000475/* A traversal callback for move_unreachable. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000476static int
Tim Peters19b74c72002-07-01 03:52:19 +0000477visit_reachable(PyObject *op, PyGC_Head *reachable)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000478{
Hai Shi675d9a32020-04-15 02:11:20 +0800479 if (!_PyObject_IS_GC(op)) {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900480 return 0;
481 }
Tim Peters19b74c72002-07-01 03:52:19 +0000482
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900483 PyGC_Head *gc = AS_GC(op);
484 const Py_ssize_t gc_refs = gc_get_refs(gc);
485
Tim Peters1e739452019-10-21 11:21:35 -0500486 // Ignore objects in other generation.
Tim Peters95bfc8a2019-10-13 16:47:04 -0500487 // This also skips objects "to the left" of the current position in
488 // move_unreachable's scan of the 'young' list - they've already been
489 // traversed, and no longer have the PREV_MASK_COLLECTING flag.
Tim Peters1e739452019-10-21 11:21:35 -0500490 if (! gc_is_collecting(gc)) {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900491 return 0;
492 }
Tim Peters1e739452019-10-21 11:21:35 -0500493 // It would be a logic error elsewhere if the collecting flag were set on
494 // an untracked object.
495 assert(gc->_gc_next != 0);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900496
497 if (gc->_gc_next & NEXT_MASK_UNREACHABLE) {
498 /* This had gc_refs = 0 when move_unreachable got
499 * to it, but turns out it's reachable after all.
500 * Move it back to move_unreachable's 'young' list,
501 * and move_unreachable will eventually get to it
502 * again.
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000503 */
Tim Peters95bfc8a2019-10-13 16:47:04 -0500504 // Manually unlink gc from unreachable list because the list functions
505 // don't work right in the presence of NEXT_MASK_UNREACHABLE flags.
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900506 PyGC_Head *prev = GC_PREV(gc);
507 PyGC_Head *next = (PyGC_Head*)(gc->_gc_next & ~NEXT_MASK_UNREACHABLE);
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200508 _PyObject_ASSERT(FROM_GC(prev),
509 prev->_gc_next & NEXT_MASK_UNREACHABLE);
510 _PyObject_ASSERT(FROM_GC(next),
511 next->_gc_next & NEXT_MASK_UNREACHABLE);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900512 prev->_gc_next = gc->_gc_next; // copy NEXT_MASK_UNREACHABLE
513 _PyGCHead_SET_PREV(next, prev);
514
515 gc_list_append(gc, reachable);
516 gc_set_refs(gc, 1);
517 }
518 else if (gc_refs == 0) {
519 /* This is in move_unreachable's 'young' list, but
520 * the traversal hasn't yet gotten to it. All
521 * we need to do is tell move_unreachable that it's
522 * reachable.
523 */
524 gc_set_refs(gc, 1);
525 }
526 /* Else there's nothing to do.
527 * If gc_refs > 0, it must be in move_unreachable's 'young'
528 * list, and move_unreachable will eventually get to it.
529 */
530 else {
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200531 _PyObject_ASSERT_WITH_MSG(op, gc_refs > 0, "refcount is too small");
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000532 }
533 return 0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000534}
535
Tim Peters19b74c72002-07-01 03:52:19 +0000536/* Move the unreachable objects from young to unreachable. After this,
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900537 * all objects in young don't have PREV_MASK_COLLECTING flag and
538 * unreachable have the flag.
Tim Peters19b74c72002-07-01 03:52:19 +0000539 * All objects in young after this are directly or indirectly reachable
540 * from outside the original young; and all objects in unreachable are
541 * not.
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900542 *
543 * This function restores _gc_prev pointer. young and unreachable are
544 * doubly linked list after this function.
545 * But _gc_next in unreachable list has NEXT_MASK_UNREACHABLE flag.
546 * So we can not gc_list_* functions for unreachable until we remove the flag.
Tim Peters88396172002-06-30 17:56:40 +0000547 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000548static void
Tim Peters19b74c72002-07-01 03:52:19 +0000549move_unreachable(PyGC_Head *young, PyGC_Head *unreachable)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000550{
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900551 // previous elem in the young list, used for restore gc_prev.
552 PyGC_Head *prev = young;
553 PyGC_Head *gc = GC_NEXT(young);
Tim Peters19b74c72002-07-01 03:52:19 +0000554
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900555 /* Invariants: all objects "to the left" of us in young are reachable
556 * (directly or indirectly) from outside the young list as it was at entry.
557 *
558 * All other objects from the original young "to the left" of us are in
559 * unreachable now, and have NEXT_MASK_UNREACHABLE. All objects to the
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000560 * left of us in 'young' now have been scanned, and no objects here
561 * or to the right have been scanned yet.
562 */
Tim Peters19b74c72002-07-01 03:52:19 +0000563
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000564 while (gc != young) {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900565 if (gc_get_refs(gc)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000566 /* gc is definitely reachable from outside the
567 * original 'young'. Mark it as such, and traverse
568 * its pointers to find any other objects that may
569 * be directly reachable from it. Note that the
570 * call to tp_traverse may append objects to young,
571 * so we have to wait until it returns to determine
572 * the next object to visit.
573 */
574 PyObject *op = FROM_GC(gc);
575 traverseproc traverse = Py_TYPE(op)->tp_traverse;
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200576 _PyObject_ASSERT_WITH_MSG(op, gc_get_refs(gc) > 0,
577 "refcount is too small");
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900578 // NOTE: visit_reachable may change gc->_gc_next when
579 // young->_gc_prev == gc. Don't do gc = GC_NEXT(gc) before!
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000580 (void) traverse(op,
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900581 (visitproc)visit_reachable,
582 (void *)young);
583 // relink gc_prev to prev element.
584 _PyGCHead_SET_PREV(gc, prev);
Quan Tian3bd0d622018-10-20 05:30:03 +0800585 // gc is not COLLECTING state after here.
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900586 gc_clear_collecting(gc);
587 prev = gc;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000588 }
589 else {
590 /* This *may* be unreachable. To make progress,
591 * assume it is. gc isn't directly reachable from
592 * any object we've already traversed, but may be
593 * reachable from an object we haven't gotten to yet.
594 * visit_reachable will eventually move gc back into
595 * young if that's so, and we'll see it again.
596 */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900597 // Move gc to unreachable.
598 // No need to gc->next->prev = prev because it is single linked.
599 prev->_gc_next = gc->_gc_next;
600
601 // We can't use gc_list_append() here because we use
602 // NEXT_MASK_UNREACHABLE here.
603 PyGC_Head *last = GC_PREV(unreachable);
604 // NOTE: Since all objects in unreachable set has
605 // NEXT_MASK_UNREACHABLE flag, we set it unconditionally.
Tim Peters95bfc8a2019-10-13 16:47:04 -0500606 // But this may pollute the unreachable list head's 'next' pointer
607 // too. That's semantically senseless but expedient here - the
Pablo Galindo97f12672020-01-13 12:25:05 +0000608 // damage is repaired when this function ends.
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900609 last->_gc_next = (NEXT_MASK_UNREACHABLE | (uintptr_t)gc);
610 _PyGCHead_SET_PREV(gc, last);
611 gc->_gc_next = (NEXT_MASK_UNREACHABLE | (uintptr_t)unreachable);
612 unreachable->_gc_prev = (uintptr_t)gc;
613 }
614 gc = (PyGC_Head*)prev->_gc_next;
615 }
616 // young->_gc_prev must be last element remained in the list.
617 young->_gc_prev = (uintptr_t)prev;
Tim Peters95bfc8a2019-10-13 16:47:04 -0500618 // don't let the pollution of the list head's next pointer leak
619 unreachable->_gc_next &= ~NEXT_MASK_UNREACHABLE;
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900620}
621
622static void
623untrack_tuples(PyGC_Head *head)
624{
625 PyGC_Head *next, *gc = GC_NEXT(head);
626 while (gc != head) {
627 PyObject *op = FROM_GC(gc);
628 next = GC_NEXT(gc);
629 if (PyTuple_CheckExact(op)) {
630 _PyTuple_MaybeUntrack(op);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000631 }
632 gc = next;
633 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000634}
635
Antoine Pitroue1ad3da2012-05-28 22:22:34 +0200636/* Try to untrack all currently tracked dictionaries */
637static void
638untrack_dicts(PyGC_Head *head)
639{
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900640 PyGC_Head *next, *gc = GC_NEXT(head);
Antoine Pitroue1ad3da2012-05-28 22:22:34 +0200641 while (gc != head) {
642 PyObject *op = FROM_GC(gc);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900643 next = GC_NEXT(gc);
644 if (PyDict_CheckExact(op)) {
Antoine Pitroue1ad3da2012-05-28 22:22:34 +0200645 _PyDict_MaybeUntrack(op);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900646 }
Antoine Pitroue1ad3da2012-05-28 22:22:34 +0200647 gc = next;
648 }
649}
650
Antoine Pitrou796564c2013-07-30 19:59:21 +0200651/* Return true if object has a pre-PEP 442 finalization method. */
Neil Schemenauera765c122001-11-01 17:35:23 +0000652static int
Antoine Pitrou796564c2013-07-30 19:59:21 +0200653has_legacy_finalizer(PyObject *op)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000654{
Victor Stinnerdaa97562020-02-07 03:37:06 +0100655 return Py_TYPE(op)->tp_del != NULL;
Neil Schemenauera765c122001-11-01 17:35:23 +0000656}
657
Antoine Pitrou796564c2013-07-30 19:59:21 +0200658/* Move the objects in unreachable with tp_del slots into `finalizers`.
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900659 *
660 * This function also removes NEXT_MASK_UNREACHABLE flag
661 * from _gc_next in unreachable.
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000662 */
Neil Schemenauera765c122001-11-01 17:35:23 +0000663static void
Antoine Pitrou796564c2013-07-30 19:59:21 +0200664move_legacy_finalizers(PyGC_Head *unreachable, PyGC_Head *finalizers)
Neil Schemenauera765c122001-11-01 17:35:23 +0000665{
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900666 PyGC_Head *gc, *next;
Tim Peters95bfc8a2019-10-13 16:47:04 -0500667 assert((unreachable->_gc_next & NEXT_MASK_UNREACHABLE) == 0);
Tim Petersf6b80452003-04-07 19:21:15 +0000668
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000669 /* March over unreachable. Move objects with finalizers into
670 * `finalizers`.
671 */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900672 for (gc = GC_NEXT(unreachable); gc != unreachable; gc = next) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000673 PyObject *op = FROM_GC(gc);
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000674
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200675 _PyObject_ASSERT(op, gc->_gc_next & NEXT_MASK_UNREACHABLE);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900676 gc->_gc_next &= ~NEXT_MASK_UNREACHABLE;
677 next = (PyGC_Head*)gc->_gc_next;
Tim Petersf6ae7a42003-04-05 18:40:50 +0000678
Antoine Pitrou796564c2013-07-30 19:59:21 +0200679 if (has_legacy_finalizer(op)) {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900680 gc_clear_collecting(gc);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000681 gc_list_move(gc, finalizers);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000682 }
683 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000684}
685
Pablo Galindo466326d2019-10-13 16:48:59 +0100686static inline void
687clear_unreachable_mask(PyGC_Head *unreachable)
688{
689 /* Check that the list head does not have the unreachable bit set */
690 assert(((uintptr_t)unreachable & NEXT_MASK_UNREACHABLE) == 0);
691
692 PyGC_Head *gc, *next;
Tim Peters95bfc8a2019-10-13 16:47:04 -0500693 assert((unreachable->_gc_next & NEXT_MASK_UNREACHABLE) == 0);
Pablo Galindo466326d2019-10-13 16:48:59 +0100694 for (gc = GC_NEXT(unreachable); gc != unreachable; gc = next) {
695 _PyObject_ASSERT((PyObject*)FROM_GC(gc), gc->_gc_next & NEXT_MASK_UNREACHABLE);
696 gc->_gc_next &= ~NEXT_MASK_UNREACHABLE;
697 next = (PyGC_Head*)gc->_gc_next;
698 }
Tim Petersea55c512019-10-18 20:59:14 -0500699 validate_list(unreachable, collecting_set_unreachable_clear);
Pablo Galindo466326d2019-10-13 16:48:59 +0100700}
701
Antoine Pitrou796564c2013-07-30 19:59:21 +0200702/* A traversal callback for move_legacy_finalizer_reachable. */
Tim Peters19b74c72002-07-01 03:52:19 +0000703static int
704visit_move(PyObject *op, PyGC_Head *tolist)
705{
Hai Shi675d9a32020-04-15 02:11:20 +0800706 if (_PyObject_IS_GC(op)) {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900707 PyGC_Head *gc = AS_GC(op);
708 if (gc_is_collecting(gc)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000709 gc_list_move(gc, tolist);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900710 gc_clear_collecting(gc);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000711 }
712 }
713 return 0;
Tim Peters19b74c72002-07-01 03:52:19 +0000714}
715
716/* Move objects that are reachable from finalizers, from the unreachable set
Tim Petersf6b80452003-04-07 19:21:15 +0000717 * into finalizers set.
Tim Peters19b74c72002-07-01 03:52:19 +0000718 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000719static void
Antoine Pitrou796564c2013-07-30 19:59:21 +0200720move_legacy_finalizer_reachable(PyGC_Head *finalizers)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000721{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000722 traverseproc traverse;
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900723 PyGC_Head *gc = GC_NEXT(finalizers);
724 for (; gc != finalizers; gc = GC_NEXT(gc)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000725 /* Note that the finalizers list may grow during this. */
726 traverse = Py_TYPE(FROM_GC(gc))->tp_traverse;
727 (void) traverse(FROM_GC(gc),
728 (visitproc)visit_move,
729 (void *)finalizers);
730 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000731}
732
Tim Petersead8b7a2004-10-30 23:09:22 +0000733/* Clear all weakrefs to unreachable objects, and if such a weakref has a
734 * callback, invoke it if necessary. Note that it's possible for such
735 * weakrefs to be outside the unreachable set -- indeed, those are precisely
736 * the weakrefs whose callbacks must be invoked. See gc_weakref.txt for
737 * overview & some details. Some weakrefs with callbacks may be reclaimed
738 * directly by this routine; the number reclaimed is the return value. Other
739 * weakrefs with callbacks may be moved into the `old` generation. Objects
740 * moved into `old` have gc_refs set to GC_REACHABLE; the objects remaining in
741 * unreachable are left at GC_TENTATIVELY_UNREACHABLE. When this returns,
742 * no object in `unreachable` is weakly referenced anymore.
Tim Peters403a2032003-11-20 21:21:46 +0000743 */
744static int
Tim Petersead8b7a2004-10-30 23:09:22 +0000745handle_weakrefs(PyGC_Head *unreachable, PyGC_Head *old)
Tim Peters403a2032003-11-20 21:21:46 +0000746{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000747 PyGC_Head *gc;
748 PyObject *op; /* generally FROM_GC(gc) */
749 PyWeakReference *wr; /* generally a cast of op */
750 PyGC_Head wrcb_to_call; /* weakrefs with callbacks to call */
751 PyGC_Head *next;
752 int num_freed = 0;
Tim Peters403a2032003-11-20 21:21:46 +0000753
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000754 gc_list_init(&wrcb_to_call);
Tim Peters403a2032003-11-20 21:21:46 +0000755
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000756 /* Clear all weakrefs to the objects in unreachable. If such a weakref
757 * also has a callback, move it into `wrcb_to_call` if the callback
758 * needs to be invoked. Note that we cannot invoke any callbacks until
759 * all weakrefs to unreachable objects are cleared, lest the callback
760 * resurrect an unreachable object via a still-active weakref. We
761 * make another pass over wrcb_to_call, invoking callbacks, after this
762 * pass completes.
763 */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900764 for (gc = GC_NEXT(unreachable); gc != unreachable; gc = next) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000765 PyWeakReference **wrlist;
Tim Petersead8b7a2004-10-30 23:09:22 +0000766
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000767 op = FROM_GC(gc);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900768 next = GC_NEXT(gc);
Tim Petersead8b7a2004-10-30 23:09:22 +0000769
Neil Schemenauerbcda4602019-09-30 10:06:45 -0700770 if (PyWeakref_Check(op)) {
771 /* A weakref inside the unreachable set must be cleared. If we
772 * allow its callback to execute inside delete_garbage(), it
773 * could expose objects that have tp_clear already called on
774 * them. Or, it could resurrect unreachable objects. One way
775 * this can happen is if some container objects do not implement
776 * tp_traverse. Then, wr_object can be outside the unreachable
777 * set but can be deallocated as a result of breaking the
778 * reference cycle. If we don't clear the weakref, the callback
779 * will run and potentially cause a crash. See bpo-38006 for
780 * one example.
781 */
782 _PyWeakref_ClearRef((PyWeakReference *)op);
783 }
784
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000785 if (! PyType_SUPPORTS_WEAKREFS(Py_TYPE(op)))
786 continue;
Tim Petersead8b7a2004-10-30 23:09:22 +0000787
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000788 /* It supports weakrefs. Does it have any? */
789 wrlist = (PyWeakReference **)
Victor Stinner38aefc52020-04-06 14:07:02 +0200790 _PyObject_GET_WEAKREFS_LISTPTR(op);
Tim Petersead8b7a2004-10-30 23:09:22 +0000791
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000792 /* `op` may have some weakrefs. March over the list, clear
793 * all the weakrefs, and move the weakrefs with callbacks
794 * that must be called into wrcb_to_call.
795 */
796 for (wr = *wrlist; wr != NULL; wr = *wrlist) {
797 PyGC_Head *wrasgc; /* AS_GC(wr) */
Tim Petersead8b7a2004-10-30 23:09:22 +0000798
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000799 /* _PyWeakref_ClearRef clears the weakref but leaves
800 * the callback pointer intact. Obscure: it also
801 * changes *wrlist.
802 */
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200803 _PyObject_ASSERT((PyObject *)wr, wr->wr_object == op);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000804 _PyWeakref_ClearRef(wr);
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200805 _PyObject_ASSERT((PyObject *)wr, wr->wr_object == Py_None);
806 if (wr->wr_callback == NULL) {
807 /* no callback */
808 continue;
809 }
Tim Petersead8b7a2004-10-30 23:09:22 +0000810
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200811 /* Headache time. `op` is going away, and is weakly referenced by
812 * `wr`, which has a callback. Should the callback be invoked? If wr
813 * is also trash, no:
814 *
815 * 1. There's no need to call it. The object and the weakref are
816 * both going away, so it's legitimate to pretend the weakref is
817 * going away first. The user has to ensure a weakref outlives its
818 * referent if they want a guarantee that the wr callback will get
819 * invoked.
820 *
821 * 2. It may be catastrophic to call it. If the callback is also in
822 * cyclic trash (CT), then although the CT is unreachable from
823 * outside the current generation, CT may be reachable from the
824 * callback. Then the callback could resurrect insane objects.
825 *
826 * Since the callback is never needed and may be unsafe in this case,
827 * wr is simply left in the unreachable set. Note that because we
828 * already called _PyWeakref_ClearRef(wr), its callback will never
829 * trigger.
830 *
831 * OTOH, if wr isn't part of CT, we should invoke the callback: the
832 * weakref outlived the trash. Note that since wr isn't CT in this
833 * case, its callback can't be CT either -- wr acted as an external
834 * root to this generation, and therefore its callback did too. So
835 * nothing in CT is reachable from the callback either, so it's hard
836 * to imagine how calling it later could create a problem for us. wr
837 * is moved to wrcb_to_call in this case.
838 */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900839 if (gc_is_collecting(AS_GC(wr))) {
Neil Schemenauerbcda4602019-09-30 10:06:45 -0700840 /* it should already have been cleared above */
841 assert(wr->wr_object == Py_None);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000842 continue;
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900843 }
Tim Peterscc2a8662004-10-31 22:12:43 +0000844
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000845 /* Create a new reference so that wr can't go away
846 * before we can process it again.
847 */
848 Py_INCREF(wr);
Tim Petersead8b7a2004-10-30 23:09:22 +0000849
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000850 /* Move wr to wrcb_to_call, for the next pass. */
851 wrasgc = AS_GC(wr);
852 assert(wrasgc != next); /* wrasgc is reachable, but
853 next isn't, so they can't
854 be the same */
855 gc_list_move(wrasgc, &wrcb_to_call);
856 }
857 }
Tim Petersead8b7a2004-10-30 23:09:22 +0000858
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000859 /* Invoke the callbacks we decided to honor. It's safe to invoke them
860 * because they can't reference unreachable objects.
861 */
862 while (! gc_list_is_empty(&wrcb_to_call)) {
863 PyObject *temp;
864 PyObject *callback;
Tim Petersead8b7a2004-10-30 23:09:22 +0000865
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900866 gc = (PyGC_Head*)wrcb_to_call._gc_next;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000867 op = FROM_GC(gc);
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200868 _PyObject_ASSERT(op, PyWeakref_Check(op));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000869 wr = (PyWeakReference *)op;
870 callback = wr->wr_callback;
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200871 _PyObject_ASSERT(op, callback != NULL);
Tim Petersead8b7a2004-10-30 23:09:22 +0000872
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000873 /* copy-paste of weakrefobject.c's handle_callback() */
Petr Viktorinffd97532020-02-11 17:46:57 +0100874 temp = PyObject_CallOneArg(callback, (PyObject *)wr);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000875 if (temp == NULL)
876 PyErr_WriteUnraisable(callback);
877 else
878 Py_DECREF(temp);
Tim Petersead8b7a2004-10-30 23:09:22 +0000879
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000880 /* Give up the reference we created in the first pass. When
881 * op's refcount hits 0 (which it may or may not do right now),
882 * op's tp_dealloc will decref op->wr_callback too. Note
883 * that the refcount probably will hit 0 now, and because this
884 * weakref was reachable to begin with, gc didn't already
885 * add it to its count of freed objects. Example: a reachable
886 * weak value dict maps some key to this reachable weakref.
887 * The callback removes this key->weakref mapping from the
888 * dict, leaving no other references to the weakref (excepting
889 * ours).
890 */
891 Py_DECREF(op);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900892 if (wrcb_to_call._gc_next == (uintptr_t)gc) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000893 /* object is still alive -- move it */
894 gc_list_move(gc, old);
895 }
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900896 else {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000897 ++num_freed;
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900898 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000899 }
Tim Petersead8b7a2004-10-30 23:09:22 +0000900
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000901 return num_freed;
Tim Peters403a2032003-11-20 21:21:46 +0000902}
903
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000904static void
Serhiy Storchakaef1585e2015-12-25 20:01:53 +0200905debug_cycle(const char *msg, PyObject *op)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000906{
Victor Stinner499dfcf2011-03-21 13:26:24 +0100907 PySys_FormatStderr("gc: %s <%s %p>\n",
908 msg, Py_TYPE(op)->tp_name, op);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000909}
910
Antoine Pitrou796564c2013-07-30 19:59:21 +0200911/* Handle uncollectable garbage (cycles with tp_del slots, and stuff reachable
Tim Petersbf384c22003-04-06 00:11:39 +0000912 * only from such cycles).
Tim Petersf6b80452003-04-07 19:21:15 +0000913 * If DEBUG_SAVEALL, all objects in finalizers are appended to the module
914 * garbage list (a Python list), else only the objects in finalizers with
915 * __del__ methods are appended to garbage. All objects in finalizers are
916 * merged into the old list regardless.
Tim Petersbf384c22003-04-06 00:11:39 +0000917 */
Serhiy Storchaka301e3cc2018-05-24 15:19:29 +0300918static void
Victor Stinner2e969062019-11-20 01:49:32 +0100919handle_legacy_finalizers(PyThreadState *tstate,
Victor Stinner67e0de62019-11-20 11:48:18 +0100920 GCState *gcstate,
Victor Stinner9db03242019-04-26 02:32:01 +0200921 PyGC_Head *finalizers, PyGC_Head *old)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000922{
Victor Stinner2e969062019-11-20 01:49:32 +0100923 assert(!_PyErr_Occurred(tstate));
Victor Stinner67e0de62019-11-20 11:48:18 +0100924 assert(gcstate->garbage != NULL);
Victor Stinner9db03242019-04-26 02:32:01 +0200925
926 PyGC_Head *gc = GC_NEXT(finalizers);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900927 for (; gc != finalizers; gc = GC_NEXT(gc)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000928 PyObject *op = FROM_GC(gc);
Tim Petersf6b80452003-04-07 19:21:15 +0000929
Victor Stinner67e0de62019-11-20 11:48:18 +0100930 if ((gcstate->debug & DEBUG_SAVEALL) || has_legacy_finalizer(op)) {
931 if (PyList_Append(gcstate->garbage, op) < 0) {
Victor Stinner2e969062019-11-20 01:49:32 +0100932 _PyErr_Clear(tstate);
Serhiy Storchaka301e3cc2018-05-24 15:19:29 +0300933 break;
Serhiy Storchakac4653c92018-05-29 18:50:10 +0300934 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000935 }
936 }
Tim Petersf6b80452003-04-07 19:21:15 +0000937
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000938 gc_list_merge(finalizers, old);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000939}
940
Tim Peters5fbc7b12014-05-08 17:42:19 -0500941/* Run first-time finalizers (if any) on all the objects in collectable.
942 * Note that this may remove some (or even all) of the objects from the
943 * list, due to refcounts falling to 0.
944 */
Antoine Pitrou796564c2013-07-30 19:59:21 +0200945static void
Victor Stinner67e0de62019-11-20 11:48:18 +0100946finalize_garbage(PyThreadState *tstate, PyGC_Head *collectable)
Antoine Pitrou796564c2013-07-30 19:59:21 +0200947{
948 destructor finalize;
Tim Peters5fbc7b12014-05-08 17:42:19 -0500949 PyGC_Head seen;
Antoine Pitrou796564c2013-07-30 19:59:21 +0200950
Tim Peters5fbc7b12014-05-08 17:42:19 -0500951 /* While we're going through the loop, `finalize(op)` may cause op, or
952 * other objects, to be reclaimed via refcounts falling to zero. So
953 * there's little we can rely on about the structure of the input
954 * `collectable` list across iterations. For safety, we always take the
955 * first object in that list and move it to a temporary `seen` list.
956 * If objects vanish from the `collectable` and `seen` lists we don't
957 * care.
958 */
959 gc_list_init(&seen);
960
961 while (!gc_list_is_empty(collectable)) {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900962 PyGC_Head *gc = GC_NEXT(collectable);
Antoine Pitrou796564c2013-07-30 19:59:21 +0200963 PyObject *op = FROM_GC(gc);
Tim Peters5fbc7b12014-05-08 17:42:19 -0500964 gc_list_move(gc, &seen);
Antoine Pitrou796564c2013-07-30 19:59:21 +0200965 if (!_PyGCHead_FINALIZED(gc) &&
Tim Peters5fbc7b12014-05-08 17:42:19 -0500966 (finalize = Py_TYPE(op)->tp_finalize) != NULL) {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900967 _PyGCHead_SET_FINALIZED(gc);
Antoine Pitrou796564c2013-07-30 19:59:21 +0200968 Py_INCREF(op);
969 finalize(op);
Victor Stinner67e0de62019-11-20 11:48:18 +0100970 assert(!_PyErr_Occurred(tstate));
Antoine Pitrou796564c2013-07-30 19:59:21 +0200971 Py_DECREF(op);
972 }
973 }
Tim Peters5fbc7b12014-05-08 17:42:19 -0500974 gc_list_merge(&seen, collectable);
Antoine Pitrou796564c2013-07-30 19:59:21 +0200975}
976
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000977/* Break reference cycles by clearing the containers involved. This is
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000978 * tricky business as the lists can be changing and we don't know which
Tim Peters19b74c72002-07-01 03:52:19 +0000979 * objects may be freed. It is possible I screwed something up here.
980 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000981static void
Victor Stinner67e0de62019-11-20 11:48:18 +0100982delete_garbage(PyThreadState *tstate, GCState *gcstate,
Victor Stinner9db03242019-04-26 02:32:01 +0200983 PyGC_Head *collectable, PyGC_Head *old)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000984{
Victor Stinner2e969062019-11-20 01:49:32 +0100985 assert(!_PyErr_Occurred(tstate));
Victor Stinner9db03242019-04-26 02:32:01 +0200986
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000987 while (!gc_list_is_empty(collectable)) {
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900988 PyGC_Head *gc = GC_NEXT(collectable);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000989 PyObject *op = FROM_GC(gc);
Tim Peters88396172002-06-30 17:56:40 +0000990
Victor Stinnera4b2bc72018-10-26 18:00:13 +0200991 _PyObject_ASSERT_WITH_MSG(op, Py_REFCNT(op) > 0,
992 "refcount is too small");
INADA Naoki5ac9e6e2018-07-10 17:19:53 +0900993
Victor Stinner67e0de62019-11-20 11:48:18 +0100994 if (gcstate->debug & DEBUG_SAVEALL) {
995 assert(gcstate->garbage != NULL);
996 if (PyList_Append(gcstate->garbage, op) < 0) {
Victor Stinner2e969062019-11-20 01:49:32 +0100997 _PyErr_Clear(tstate);
Serhiy Storchakac4653c92018-05-29 18:50:10 +0300998 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000999 }
1000 else {
Victor Stinner9db03242019-04-26 02:32:01 +02001001 inquiry clear;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001002 if ((clear = Py_TYPE(op)->tp_clear) != NULL) {
1003 Py_INCREF(op);
Serhiy Storchakac4653c92018-05-29 18:50:10 +03001004 (void) clear(op);
Victor Stinner2e969062019-11-20 01:49:32 +01001005 if (_PyErr_Occurred(tstate)) {
Victor Stinner71c52e32019-05-27 08:57:14 +02001006 _PyErr_WriteUnraisableMsg("in tp_clear of",
1007 (PyObject*)Py_TYPE(op));
Serhiy Storchakac4653c92018-05-29 18:50:10 +03001008 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001009 Py_DECREF(op);
1010 }
1011 }
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09001012 if (GC_NEXT(collectable) == gc) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001013 /* object is still alive, move it, it may die later */
Pablo Galindo466326d2019-10-13 16:48:59 +01001014 gc_clear_collecting(gc);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001015 gc_list_move(gc, old);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001016 }
1017 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001018}
1019
/* Clear all free lists.
 *
 * All free lists are cleared during the collection of the highest
 * generation.  Allocated items in a free list may keep a pymalloc arena
 * occupied, so clearing the free lists may give memory back to the OS
 * earlier.
 */
static void
clear_freelists(void)
{
    /* One call per object kind that maintains a free list. */
    _PyFrame_ClearFreeList();
    _PyTuple_ClearFreeList();
    _PyFloat_ClearFreeList();
    _PyList_ClearFreeList();
    _PyDict_ClearFreeList();
    _PyAsyncGen_ClearFreeLists();
    _PyContext_ClearFreeList();
}
1036
Pablo Galindo97f12672020-01-13 12:25:05 +00001037// Show stats for objects in each generations
Inada Naokibf8162c2019-08-02 16:25:29 +09001038static void
Victor Stinner67e0de62019-11-20 11:48:18 +01001039show_stats_each_generations(GCState *gcstate)
Inada Naokibf8162c2019-08-02 16:25:29 +09001040{
1041 char buf[100];
1042 size_t pos = 0;
1043
1044 for (int i = 0; i < NUM_GENERATIONS && pos < sizeof(buf); i++) {
1045 pos += PyOS_snprintf(buf+pos, sizeof(buf)-pos,
1046 " %"PY_FORMAT_SIZE_T"d",
Victor Stinner67e0de62019-11-20 11:48:18 +01001047 gc_list_size(GEN_HEAD(gcstate, i)));
Inada Naokibf8162c2019-08-02 16:25:29 +09001048 }
1049
1050 PySys_FormatStderr(
1051 "gc: objects in each generation:%s\n"
1052 "gc: objects in permanent generation: %zd\n",
Victor Stinner67e0de62019-11-20 11:48:18 +01001053 buf, gc_list_size(&gcstate->permanent_generation.head));
Inada Naokibf8162c2019-08-02 16:25:29 +09001054}
1055
Pablo Galindo97f12672020-01-13 12:25:05 +00001056/* Deduce which objects among "base" are unreachable from outside the list
Pablo Galindo466326d2019-10-13 16:48:59 +01001057 and move them to 'unreachable'. The process consist in the following steps:
1058
10591. Copy all reference counts to a different field (gc_prev is used to hold
1060 this copy to save memory).
10612. Traverse all objects in "base" and visit all referred objects using
Pablo Galindo97f12672020-01-13 12:25:05 +00001062 "tp_traverse" and for every visited object, subtract 1 to the reference
Pablo Galindo466326d2019-10-13 16:48:59 +01001063 count (the one that we copied in the previous step). After this step, all
1064 objects that can be reached directly from outside must have strictly positive
1065 reference count, while all unreachable objects must have a count of exactly 0.
Pablo Galindo97f12672020-01-13 12:25:05 +000010663. Identify all unreachable objects (the ones with 0 reference count) and move
Pablo Galindo466326d2019-10-13 16:48:59 +01001067 them to the "unreachable" list. This step also needs to move back to "base" all
1068 objects that were initially marked as unreachable but are referred transitively
1069 by the reachable objects (the ones with strictly positive reference count).
1070
1071Contracts:
1072
1073 * The "base" has to be a valid list with no mask set.
1074
1075 * The "unreachable" list must be uninitialized (this function calls
1076 gc_list_init over 'unreachable').
Tim Peters95bfc8a2019-10-13 16:47:04 -05001077
Pablo Galindo466326d2019-10-13 16:48:59 +01001078IMPORTANT: This function leaves 'unreachable' with the NEXT_MASK_UNREACHABLE
1079flag set but it does not clear it to skip unnecessary iteration. Before the
1080flag is cleared (for example, by using 'clear_unreachable_mask' function or
1081by a call to 'move_legacy_finalizers'), the 'unreachable' list is not a normal
1082list and we can not use most gc_list_* functions for it. */
1083static inline void
1084deduce_unreachable(PyGC_Head *base, PyGC_Head *unreachable) {
Tim Petersea55c512019-10-18 20:59:14 -05001085 validate_list(base, collecting_clear_unreachable_clear);
Pablo Galindo466326d2019-10-13 16:48:59 +01001086 /* Using ob_refcnt and gc_refs, calculate which objects in the
1087 * container set are reachable from outside the set (i.e., have a
1088 * refcount greater than 0 when all the references within the
1089 * set are taken into account).
1090 */
1091 update_refs(base); // gc_prev is used for gc_refs
1092 subtract_refs(base);
1093
1094 /* Leave everything reachable from outside base in base, and move
1095 * everything else (in base) to unreachable.
Pablo Galindo97f12672020-01-13 12:25:05 +00001096 *
Pablo Galindo466326d2019-10-13 16:48:59 +01001097 * NOTE: This used to move the reachable objects into a reachable
1098 * set instead. But most things usually turn out to be reachable,
Pablo Galindo97f12672020-01-13 12:25:05 +00001099 * so it's more efficient to move the unreachable things. It "sounds slick"
1100 * to move the unreachable objects, until you think about it - the reason it
1101 * pays isn't actually obvious.
1102 *
1103 * Suppose we create objects A, B, C in that order. They appear in the young
1104 * generation in the same order. If B points to A, and C to B, and C is
1105 * reachable from outside, then the adjusted refcounts will be 0, 0, and 1
1106 * respectively.
1107 *
1108 * When move_unreachable finds A, A is moved to the unreachable list. The
1109 * same for B when it's first encountered. Then C is traversed, B is moved
1110 * _back_ to the reachable list. B is eventually traversed, and then A is
1111 * moved back to the reachable list.
1112 *
1113 * So instead of not moving at all, the reachable objects B and A are moved
1114 * twice each. Why is this a win? A straightforward algorithm to move the
1115 * reachable objects instead would move A, B, and C once each.
1116 *
1117 * The key is that this dance leaves the objects in order C, B, A - it's
1118 * reversed from the original order. On all _subsequent_ scans, none of
1119 * them will move. Since most objects aren't in cycles, this can save an
1120 * unbounded number of moves across an unbounded number of later collections.
1121 * It can cost more only the first time the chain is scanned.
1122 *
1123 * Drawback: move_unreachable is also used to find out what's still trash
1124 * after finalizers may resurrect objects. In _that_ case most unreachable
1125 * objects will remain unreachable, so it would be more efficient to move
1126 * the reachable objects instead. But this is a one-time cost, probably not
1127 * worth complicating the code to speed just a little.
Pablo Galindo466326d2019-10-13 16:48:59 +01001128 */
1129 gc_list_init(unreachable);
1130 move_unreachable(base, unreachable); // gc_prev is pointer again
Tim Petersea55c512019-10-18 20:59:14 -05001131 validate_list(base, collecting_clear_unreachable_clear);
1132 validate_list(unreachable, collecting_set_unreachable_set);
Pablo Galindo466326d2019-10-13 16:48:59 +01001133}
1134
1135/* Handle objects that may have resurrected after a call to 'finalize_garbage', moving
1136 them to 'old_generation' and placing the rest on 'still_unreachable'.
1137
1138 Contracts:
1139 * After this function 'unreachable' must not be used anymore and 'still_unreachable'
1140 will contain the objects that did not resurrect.
1141
1142 * The "still_unreachable" list must be uninitialized (this function calls
1143 gc_list_init over 'still_unreachable').
1144
1145IMPORTANT: After a call to this function, the 'still_unreachable' set will have the
1146PREV_MARK_COLLECTING set, but the objects in this set are going to be removed so
1147we can skip the expense of clearing the flag to avoid extra iteration. */
1148static inline void
1149handle_resurrected_objects(PyGC_Head *unreachable, PyGC_Head* still_unreachable,
1150 PyGC_Head *old_generation)
1151{
1152 // Remove the PREV_MASK_COLLECTING from unreachable
1153 // to prepare it for a new call to 'deduce_unreachable'
1154 gc_list_clear_collecting(unreachable);
1155
1156 // After the call to deduce_unreachable, the 'still_unreachable' set will
1157 // have the PREV_MARK_COLLECTING set, but the objects are going to be
1158 // removed so we can skip the expense of clearing the flag.
1159 PyGC_Head* resurrected = unreachable;
1160 deduce_unreachable(resurrected, still_unreachable);
1161 clear_unreachable_mask(still_unreachable);
1162
1163 // Move the resurrected objects to the old generation for future collection.
1164 gc_list_merge(resurrected, old_generation);
1165}
1166
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001167/* This is the main function. Read this to understand how the
1168 * collection process works. */
Neal Norwitz7b216c52006-03-04 20:01:53 +00001169static Py_ssize_t
Victor Stinner67e0de62019-11-20 11:48:18 +01001170collect(PyThreadState *tstate, int generation,
Victor Stinner9db03242019-04-26 02:32:01 +02001171 Py_ssize_t *n_collected, Py_ssize_t *n_uncollectable, int nofail)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001172{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001173 int i;
1174 Py_ssize_t m = 0; /* # objects collected */
1175 Py_ssize_t n = 0; /* # unreachable objects that couldn't be collected */
1176 PyGC_Head *young; /* the generation we are examining */
1177 PyGC_Head *old; /* next older generation */
1178 PyGC_Head unreachable; /* non-problematic unreachable trash */
1179 PyGC_Head finalizers; /* objects with, & reachable from, __del__ */
1180 PyGC_Head *gc;
Victor Stinner7181dec2015-03-27 17:47:53 +01001181 _PyTime_t t1 = 0; /* initialize to prevent a compiler warning */
Victor Stinner72474072019-11-20 12:25:50 +01001182 GCState *gcstate = &tstate->interp->gc;
Antoine Pitrou40f6b122014-05-24 19:21:53 +02001183
Victor Stinner67e0de62019-11-20 11:48:18 +01001184 if (gcstate->debug & DEBUG_STATS) {
Inada Naokibf8162c2019-08-02 16:25:29 +09001185 PySys_WriteStderr("gc: collecting generation %d...\n", generation);
Victor Stinner67e0de62019-11-20 11:48:18 +01001186 show_stats_each_generations(gcstate);
Victor Stinner7181dec2015-03-27 17:47:53 +01001187 t1 = _PyTime_GetMonotonicClock();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001188 }
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001189
Łukasz Langaa785c872016-09-09 17:37:37 -07001190 if (PyDTrace_GC_START_ENABLED())
1191 PyDTrace_GC_START(generation);
1192
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001193 /* update collection and allocation counters */
1194 if (generation+1 < NUM_GENERATIONS)
Victor Stinner67e0de62019-11-20 11:48:18 +01001195 gcstate->generations[generation+1].count += 1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001196 for (i = 0; i <= generation; i++)
Victor Stinner67e0de62019-11-20 11:48:18 +01001197 gcstate->generations[i].count = 0;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001198
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001199 /* merge younger generations with one we are currently collecting */
1200 for (i = 0; i < generation; i++) {
Victor Stinner67e0de62019-11-20 11:48:18 +01001201 gc_list_merge(GEN_HEAD(gcstate, i), GEN_HEAD(gcstate, generation));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001202 }
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001203
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001204 /* handy references */
Victor Stinner67e0de62019-11-20 11:48:18 +01001205 young = GEN_HEAD(gcstate, generation);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001206 if (generation < NUM_GENERATIONS-1)
Victor Stinner67e0de62019-11-20 11:48:18 +01001207 old = GEN_HEAD(gcstate, generation+1);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001208 else
1209 old = young;
Tim Petersea55c512019-10-18 20:59:14 -05001210 validate_list(old, collecting_clear_unreachable_clear);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001211
Pablo Galindo466326d2019-10-13 16:48:59 +01001212 deduce_unreachable(young, &unreachable);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001213
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09001214 untrack_tuples(young);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001215 /* Move reachable objects to next generation. */
1216 if (young != old) {
1217 if (generation == NUM_GENERATIONS - 2) {
Victor Stinner67e0de62019-11-20 11:48:18 +01001218 gcstate->long_lived_pending += gc_list_size(young);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001219 }
1220 gc_list_merge(young, old);
1221 }
1222 else {
Pablo Galindo97f12672020-01-13 12:25:05 +00001223 /* We only un-track dicts in full collections, to avoid quadratic
Antoine Pitroue1ad3da2012-05-28 22:22:34 +02001224 dict build-up. See issue #14775. */
1225 untrack_dicts(young);
Victor Stinner67e0de62019-11-20 11:48:18 +01001226 gcstate->long_lived_pending = 0;
1227 gcstate->long_lived_total = gc_list_size(young);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001228 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001229
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001230 /* All objects in unreachable are trash, but objects reachable from
Antoine Pitrou796564c2013-07-30 19:59:21 +02001231 * legacy finalizers (e.g. tp_del) can't safely be deleted.
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001232 */
1233 gc_list_init(&finalizers);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09001234 // NEXT_MASK_UNREACHABLE is cleared here.
1235 // After move_legacy_finalizers(), unreachable is normal list.
Antoine Pitrou796564c2013-07-30 19:59:21 +02001236 move_legacy_finalizers(&unreachable, &finalizers);
1237 /* finalizers contains the unreachable objects with a legacy finalizer;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001238 * unreachable objects reachable *from* those are also uncollectable,
1239 * and we move those into the finalizers list too.
1240 */
Antoine Pitrou796564c2013-07-30 19:59:21 +02001241 move_legacy_finalizer_reachable(&finalizers);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001242
Tim Petersea55c512019-10-18 20:59:14 -05001243 validate_list(&finalizers, collecting_clear_unreachable_clear);
1244 validate_list(&unreachable, collecting_set_unreachable_clear);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09001245
Tim Petersecbf35f2019-10-09 12:37:30 -05001246 /* Print debugging information. */
Victor Stinner67e0de62019-11-20 11:48:18 +01001247 if (gcstate->debug & DEBUG_COLLECTABLE) {
Tim Petersecbf35f2019-10-09 12:37:30 -05001248 for (gc = GC_NEXT(&unreachable); gc != &unreachable; gc = GC_NEXT(gc)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001249 debug_cycle("collectable", FROM_GC(gc));
1250 }
1251 }
Tim Petersead8b7a2004-10-30 23:09:22 +00001252
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001253 /* Clear weakrefs and invoke callbacks as necessary. */
1254 m += handle_weakrefs(&unreachable, old);
Tim Petersead8b7a2004-10-30 23:09:22 +00001255
Tim Petersea55c512019-10-18 20:59:14 -05001256 validate_list(old, collecting_clear_unreachable_clear);
1257 validate_list(&unreachable, collecting_set_unreachable_clear);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09001258
Antoine Pitrou796564c2013-07-30 19:59:21 +02001259 /* Call tp_finalize on objects which have one. */
Victor Stinner67e0de62019-11-20 11:48:18 +01001260 finalize_garbage(tstate, &unreachable);
Antoine Pitrou796564c2013-07-30 19:59:21 +02001261
Pablo Galindo466326d2019-10-13 16:48:59 +01001262 /* Handle any objects that may have resurrected after the call
1263 * to 'finalize_garbage' and continue the collection with the
1264 * objects that are still unreachable */
1265 PyGC_Head final_unreachable;
1266 handle_resurrected_objects(&unreachable, &final_unreachable, old);
1267
1268 /* Call tp_clear on objects in the final_unreachable set. This will cause
1269 * the reference cycles to be broken. It may also cause some objects
1270 * in finalizers to be freed.
1271 */
1272 m += gc_list_size(&final_unreachable);
Victor Stinner67e0de62019-11-20 11:48:18 +01001273 delete_garbage(tstate, gcstate, &final_unreachable, old);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001274
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001275 /* Collect statistics on uncollectable objects found and print
1276 * debugging information. */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09001277 for (gc = GC_NEXT(&finalizers); gc != &finalizers; gc = GC_NEXT(gc)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001278 n++;
Victor Stinner67e0de62019-11-20 11:48:18 +01001279 if (gcstate->debug & DEBUG_UNCOLLECTABLE)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001280 debug_cycle("uncollectable", FROM_GC(gc));
1281 }
Victor Stinner67e0de62019-11-20 11:48:18 +01001282 if (gcstate->debug & DEBUG_STATS) {
Inada Naokibf8162c2019-08-02 16:25:29 +09001283 double d = _PyTime_AsSecondsDouble(_PyTime_GetMonotonicClock() - t1);
Inada Naoki013e52f2019-08-31 09:13:42 +09001284 PySys_WriteStderr(
1285 "gc: done, %" PY_FORMAT_SIZE_T "d unreachable, "
1286 "%" PY_FORMAT_SIZE_T "d uncollectable, %.4fs elapsed\n",
Inada Naokibf8162c2019-08-02 16:25:29 +09001287 n+m, n, d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001288 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001289
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001290 /* Append instances in the uncollectable set to a Python
1291 * reachable list of garbage. The programmer has to deal with
1292 * this if they insist on creating this type of structure.
1293 */
Victor Stinner67e0de62019-11-20 11:48:18 +01001294 handle_legacy_finalizers(tstate, gcstate, &finalizers, old);
Tim Petersea55c512019-10-18 20:59:14 -05001295 validate_list(old, collecting_clear_unreachable_clear);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001296
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001297 /* Clear free list only during the collection of the highest
1298 * generation */
1299 if (generation == NUM_GENERATIONS-1) {
1300 clear_freelists();
1301 }
Christian Heimesa156e092008-02-16 07:38:31 +00001302
Victor Stinner2e969062019-11-20 01:49:32 +01001303 if (_PyErr_Occurred(tstate)) {
Antoine Pitroufef34e32013-05-19 01:11:58 +02001304 if (nofail) {
Victor Stinner2e969062019-11-20 01:49:32 +01001305 _PyErr_Clear(tstate);
Antoine Pitroufef34e32013-05-19 01:11:58 +02001306 }
1307 else {
Victor Stinner656c45e2020-01-24 18:05:24 +01001308 _PyErr_WriteUnraisableMsg("in garbage collection", NULL);
Antoine Pitroufef34e32013-05-19 01:11:58 +02001309 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001310 }
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001311
Antoine Pitroud4156c12012-10-30 22:43:19 +01001312 /* Update stats */
Victor Stinner9db03242019-04-26 02:32:01 +02001313 if (n_collected) {
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001314 *n_collected = m;
Victor Stinner9db03242019-04-26 02:32:01 +02001315 }
1316 if (n_uncollectable) {
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001317 *n_uncollectable = n;
Victor Stinner9db03242019-04-26 02:32:01 +02001318 }
1319
Victor Stinner67e0de62019-11-20 11:48:18 +01001320 struct gc_generation_stats *stats = &gcstate->generation_stats[generation];
Antoine Pitroud4156c12012-10-30 22:43:19 +01001321 stats->collections++;
1322 stats->collected += m;
1323 stats->uncollectable += n;
Łukasz Langaa785c872016-09-09 17:37:37 -07001324
Victor Stinner9db03242019-04-26 02:32:01 +02001325 if (PyDTrace_GC_DONE_ENABLED()) {
Victor Stinner2e969062019-11-20 01:49:32 +01001326 PyDTrace_GC_DONE(n + m);
Victor Stinner9db03242019-04-26 02:32:01 +02001327 }
Łukasz Langaa785c872016-09-09 17:37:37 -07001328
Victor Stinner2e969062019-11-20 01:49:32 +01001329 assert(!_PyErr_Occurred(tstate));
1330 return n + m;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001331}
1332
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001333/* Invoke progress callbacks to notify clients that garbage collection
1334 * is starting or stopping
1335 */
1336static void
Victor Stinner67e0de62019-11-20 11:48:18 +01001337invoke_gc_callback(PyThreadState *tstate, const char *phase,
Victor Stinner9db03242019-04-26 02:32:01 +02001338 int generation, Py_ssize_t collected,
1339 Py_ssize_t uncollectable)
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001340{
Victor Stinner67e0de62019-11-20 11:48:18 +01001341 assert(!_PyErr_Occurred(tstate));
Victor Stinner9db03242019-04-26 02:32:01 +02001342
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001343 /* we may get called very early */
Victor Stinner72474072019-11-20 12:25:50 +01001344 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01001345 if (gcstate->callbacks == NULL) {
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001346 return;
Victor Stinner9db03242019-04-26 02:32:01 +02001347 }
1348
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001349 /* The local variable cannot be rebound, check it for sanity */
Victor Stinner67e0de62019-11-20 11:48:18 +01001350 assert(PyList_CheckExact(gcstate->callbacks));
Victor Stinner9db03242019-04-26 02:32:01 +02001351 PyObject *info = NULL;
Victor Stinner67e0de62019-11-20 11:48:18 +01001352 if (PyList_GET_SIZE(gcstate->callbacks) != 0) {
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001353 info = Py_BuildValue("{sisnsn}",
1354 "generation", generation,
1355 "collected", collected,
1356 "uncollectable", uncollectable);
1357 if (info == NULL) {
1358 PyErr_WriteUnraisable(NULL);
1359 return;
1360 }
1361 }
Victor Stinner67e0de62019-11-20 11:48:18 +01001362 for (Py_ssize_t i=0; i<PyList_GET_SIZE(gcstate->callbacks); i++) {
1363 PyObject *r, *cb = PyList_GET_ITEM(gcstate->callbacks, i);
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001364 Py_INCREF(cb); /* make sure cb doesn't go away */
1365 r = PyObject_CallFunction(cb, "sO", phase, info);
Serhiy Storchaka301e3cc2018-05-24 15:19:29 +03001366 if (r == NULL) {
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001367 PyErr_WriteUnraisable(cb);
Serhiy Storchaka301e3cc2018-05-24 15:19:29 +03001368 }
1369 else {
1370 Py_DECREF(r);
1371 }
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001372 Py_DECREF(cb);
1373 }
1374 Py_XDECREF(info);
Victor Stinner67e0de62019-11-20 11:48:18 +01001375 assert(!_PyErr_Occurred(tstate));
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001376}
1377
1378/* Perform garbage collection of a generation and invoke
1379 * progress callbacks.
1380 */
1381static Py_ssize_t
Victor Stinner67e0de62019-11-20 11:48:18 +01001382collect_with_callback(PyThreadState *tstate, int generation)
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001383{
Victor Stinner67e0de62019-11-20 11:48:18 +01001384 assert(!_PyErr_Occurred(tstate));
Victor Stinner9db03242019-04-26 02:32:01 +02001385 Py_ssize_t result, collected, uncollectable;
Victor Stinner67e0de62019-11-20 11:48:18 +01001386 invoke_gc_callback(tstate, "start", generation, 0, 0);
1387 result = collect(tstate, generation, &collected, &uncollectable, 0);
1388 invoke_gc_callback(tstate, "stop", generation, collected, uncollectable);
1389 assert(!_PyErr_Occurred(tstate));
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00001390 return result;
1391}
1392
Neal Norwitz7b216c52006-03-04 20:01:53 +00001393static Py_ssize_t
Victor Stinner67e0de62019-11-20 11:48:18 +01001394collect_generations(PyThreadState *tstate)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001395{
Victor Stinner72474072019-11-20 12:25:50 +01001396 GCState *gcstate = &tstate->interp->gc;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001397 /* Find the oldest generation (highest numbered) where the count
1398 * exceeds the threshold. Objects in the that generation and
1399 * generations younger than it will be collected. */
Victor Stinner9db03242019-04-26 02:32:01 +02001400 Py_ssize_t n = 0;
1401 for (int i = NUM_GENERATIONS-1; i >= 0; i--) {
Victor Stinner67e0de62019-11-20 11:48:18 +01001402 if (gcstate->generations[i].count > gcstate->generations[i].threshold) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001403 /* Avoid quadratic performance degradation in number
Pablo Galindo90913982019-12-27 21:55:56 +00001404 of tracked objects (see also issue #4074):
1405
1406 To limit the cost of garbage collection, there are two strategies;
1407 - make each collection faster, e.g. by scanning fewer objects
1408 - do less collections
1409 This heuristic is about the latter strategy.
1410
1411 In addition to the various configurable thresholds, we only trigger a
1412 full collection if the ratio
1413
1414 long_lived_pending / long_lived_total
1415
1416 is above a given value (hardwired to 25%).
1417
1418 The reason is that, while "non-full" collections (i.e., collections of
1419 the young and middle generations) will always examine roughly the same
1420 number of objects -- determined by the aforementioned thresholds --,
1421 the cost of a full collection is proportional to the total number of
1422 long-lived objects, which is virtually unbounded.
1423
1424 Indeed, it has been remarked that doing a full collection every
1425 <constant number> of object creations entails a dramatic performance
1426 degradation in workloads which consist in creating and storing lots of
1427 long-lived objects (e.g. building a large list of GC-tracked objects would
1428 show quadratic performance, instead of linear as expected: see issue #4074).
1429
1430 Using the above ratio, instead, yields amortized linear performance in
1431 the total number of objects (the effect of which can be summarized
1432 thusly: "each full garbage collection is more and more costly as the
1433 number of objects grows, but we do fewer and fewer of them").
1434
1435 This heuristic was suggested by Martin von Löwis on python-dev in
1436 June 2008. His original analysis and proposal can be found at:
1437 http://mail.python.org/pipermail/python-dev/2008-June/080579.html
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001438 */
1439 if (i == NUM_GENERATIONS - 1
Victor Stinner67e0de62019-11-20 11:48:18 +01001440 && gcstate->long_lived_pending < gcstate->long_lived_total / 4)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001441 continue;
Victor Stinner67e0de62019-11-20 11:48:18 +01001442 n = collect_with_callback(tstate, i);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001443 break;
1444 }
1445 }
1446 return n;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001447}
1448
Serhiy Storchaka93260282017-02-04 11:19:59 +02001449#include "clinic/gcmodule.c.h"
1450
1451/*[clinic input]
1452gc.enable
1453
1454Enable automatic garbage collection.
1455[clinic start generated code]*/
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001456
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001457static PyObject *
Serhiy Storchaka93260282017-02-04 11:19:59 +02001458gc_enable_impl(PyObject *module)
1459/*[clinic end generated code: output=45a427e9dce9155c input=81ac4940ca579707]*/
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001460{
Victor Stinner67e0de62019-11-20 11:48:18 +01001461 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001462 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01001463 gcstate->enabled = 1;
Serhiy Storchaka228b12e2017-01-23 09:47:21 +02001464 Py_RETURN_NONE;
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001465}
1466
Serhiy Storchaka93260282017-02-04 11:19:59 +02001467/*[clinic input]
1468gc.disable
1469
1470Disable automatic garbage collection.
1471[clinic start generated code]*/
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001472
1473static PyObject *
Serhiy Storchaka93260282017-02-04 11:19:59 +02001474gc_disable_impl(PyObject *module)
1475/*[clinic end generated code: output=97d1030f7aa9d279 input=8c2e5a14e800d83b]*/
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001476{
Victor Stinner67e0de62019-11-20 11:48:18 +01001477 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001478 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01001479 gcstate->enabled = 0;
Serhiy Storchaka228b12e2017-01-23 09:47:21 +02001480 Py_RETURN_NONE;
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001481}
1482
Serhiy Storchaka93260282017-02-04 11:19:59 +02001483/*[clinic input]
1484gc.isenabled -> bool
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001485
Serhiy Storchaka93260282017-02-04 11:19:59 +02001486Returns true if automatic garbage collection is enabled.
1487[clinic start generated code]*/
1488
1489static int
1490gc_isenabled_impl(PyObject *module)
1491/*[clinic end generated code: output=1874298331c49130 input=30005e0422373b31]*/
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001492{
Victor Stinner67e0de62019-11-20 11:48:18 +01001493 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001494 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01001495 return gcstate->enabled;
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001496}
1497
Serhiy Storchaka93260282017-02-04 11:19:59 +02001498/*[clinic input]
1499gc.collect -> Py_ssize_t
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001500
Serhiy Storchaka93260282017-02-04 11:19:59 +02001501 generation: int(c_default="NUM_GENERATIONS - 1") = 2
1502
1503Run the garbage collector.
1504
1505With no arguments, run a full collection. The optional argument
1506may be an integer specifying which generation to collect. A ValueError
1507is raised if the generation number is invalid.
1508
1509The number of unreachable objects is returned.
1510[clinic start generated code]*/
1511
1512static Py_ssize_t
1513gc_collect_impl(PyObject *module, int generation)
1514/*[clinic end generated code: output=b697e633043233c7 input=40720128b682d879]*/
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001515{
Victor Stinner2e969062019-11-20 01:49:32 +01001516 PyThreadState *tstate = _PyThreadState_GET();
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001517
Serhiy Storchaka93260282017-02-04 11:19:59 +02001518 if (generation < 0 || generation >= NUM_GENERATIONS) {
Victor Stinner2e969062019-11-20 01:49:32 +01001519 _PyErr_SetString(tstate, PyExc_ValueError, "invalid generation");
Serhiy Storchaka93260282017-02-04 11:19:59 +02001520 return -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001521 }
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001522
Victor Stinner72474072019-11-20 12:25:50 +01001523 GCState *gcstate = &tstate->interp->gc;
Victor Stinner9db03242019-04-26 02:32:01 +02001524 Py_ssize_t n;
Victor Stinner67e0de62019-11-20 11:48:18 +01001525 if (gcstate->collecting) {
Victor Stinner9db03242019-04-26 02:32:01 +02001526 /* already collecting, don't do anything */
1527 n = 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001528 }
Victor Stinner9db03242019-04-26 02:32:01 +02001529 else {
Victor Stinner67e0de62019-11-20 11:48:18 +01001530 gcstate->collecting = 1;
1531 n = collect_with_callback(tstate, generation);
1532 gcstate->collecting = 0;
Victor Stinner9db03242019-04-26 02:32:01 +02001533 }
Serhiy Storchaka93260282017-02-04 11:19:59 +02001534 return n;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001535}
1536
Serhiy Storchaka93260282017-02-04 11:19:59 +02001537/*[clinic input]
1538gc.set_debug
1539
1540 flags: int
1541 An integer that can have the following bits turned on:
1542 DEBUG_STATS - Print statistics during collection.
1543 DEBUG_COLLECTABLE - Print collectable objects found.
1544 DEBUG_UNCOLLECTABLE - Print unreachable but uncollectable objects
1545 found.
1546 DEBUG_SAVEALL - Save objects to gc.garbage rather than freeing them.
1547 DEBUG_LEAK - Debug leaking programs (everything but STATS).
1548 /
1549
1550Set the garbage collection debugging flags.
1551
1552Debugging information is written to sys.stderr.
1553[clinic start generated code]*/
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001554
1555static PyObject *
Serhiy Storchaka93260282017-02-04 11:19:59 +02001556gc_set_debug_impl(PyObject *module, int flags)
1557/*[clinic end generated code: output=7c8366575486b228 input=5e5ce15e84fbed15]*/
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001558{
Victor Stinner67e0de62019-11-20 11:48:18 +01001559 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001560 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01001561 gcstate->debug = flags;
Serhiy Storchaka228b12e2017-01-23 09:47:21 +02001562 Py_RETURN_NONE;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001563}
1564
Serhiy Storchaka93260282017-02-04 11:19:59 +02001565/*[clinic input]
1566gc.get_debug -> int
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001567
Serhiy Storchaka93260282017-02-04 11:19:59 +02001568Get the garbage collection debugging flags.
1569[clinic start generated code]*/
1570
1571static int
1572gc_get_debug_impl(PyObject *module)
1573/*[clinic end generated code: output=91242f3506cd1e50 input=91a101e1c3b98366]*/
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001574{
Victor Stinner67e0de62019-11-20 11:48:18 +01001575 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001576 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01001577 return gcstate->debug;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001578}
1579
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001580PyDoc_STRVAR(gc_set_thresh__doc__,
Neal Norwitz2a47c0f2002-01-29 00:53:41 +00001581"set_threshold(threshold0, [threshold1, threshold2]) -> None\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001582"\n"
1583"Sets the collection thresholds. Setting threshold0 to zero disables\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001584"collection.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001585
1586static PyObject *
Victor Stinner9db03242019-04-26 02:32:01 +02001587gc_set_threshold(PyObject *self, PyObject *args)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001588{
Victor Stinner67e0de62019-11-20 11:48:18 +01001589 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001590 GCState *gcstate = &tstate->interp->gc;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001591 if (!PyArg_ParseTuple(args, "i|ii:set_threshold",
Victor Stinner67e0de62019-11-20 11:48:18 +01001592 &gcstate->generations[0].threshold,
1593 &gcstate->generations[1].threshold,
1594 &gcstate->generations[2].threshold))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001595 return NULL;
Victor Stinner9db03242019-04-26 02:32:01 +02001596 for (int i = 3; i < NUM_GENERATIONS; i++) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001597 /* generations higher than 2 get the same threshold */
Victor Stinner67e0de62019-11-20 11:48:18 +01001598 gcstate->generations[i].threshold = gcstate->generations[2].threshold;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001599 }
Serhiy Storchaka228b12e2017-01-23 09:47:21 +02001600 Py_RETURN_NONE;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001601}
1602
Serhiy Storchaka93260282017-02-04 11:19:59 +02001603/*[clinic input]
1604gc.get_threshold
1605
1606Return the current collection thresholds.
1607[clinic start generated code]*/
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001608
1609static PyObject *
Serhiy Storchaka93260282017-02-04 11:19:59 +02001610gc_get_threshold_impl(PyObject *module)
1611/*[clinic end generated code: output=7902bc9f41ecbbd8 input=286d79918034d6e6]*/
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001612{
Victor Stinner67e0de62019-11-20 11:48:18 +01001613 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001614 GCState *gcstate = &tstate->interp->gc;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001615 return Py_BuildValue("(iii)",
Victor Stinner67e0de62019-11-20 11:48:18 +01001616 gcstate->generations[0].threshold,
1617 gcstate->generations[1].threshold,
1618 gcstate->generations[2].threshold);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001619}
1620
Serhiy Storchaka93260282017-02-04 11:19:59 +02001621/*[clinic input]
1622gc.get_count
1623
1624Return a three-tuple of the current collection counts.
1625[clinic start generated code]*/
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001626
1627static PyObject *
Serhiy Storchaka93260282017-02-04 11:19:59 +02001628gc_get_count_impl(PyObject *module)
1629/*[clinic end generated code: output=354012e67b16398f input=a392794a08251751]*/
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001630{
Victor Stinner67e0de62019-11-20 11:48:18 +01001631 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001632 GCState *gcstate = &tstate->interp->gc;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001633 return Py_BuildValue("(iii)",
Victor Stinner67e0de62019-11-20 11:48:18 +01001634 gcstate->generations[0].count,
1635 gcstate->generations[1].count,
1636 gcstate->generations[2].count);
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001637}
1638
Neil Schemenauer48c70342001-08-09 15:38:31 +00001639static int
Martin v. Löwis560da622001-11-24 09:24:51 +00001640referrersvisit(PyObject* obj, PyObject *objs)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001641{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001642 Py_ssize_t i;
1643 for (i = 0; i < PyTuple_GET_SIZE(objs); i++)
1644 if (PyTuple_GET_ITEM(objs, i) == obj)
1645 return 1;
1646 return 0;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001647}
1648
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001649static int
Martin v. Löwis560da622001-11-24 09:24:51 +00001650gc_referrers_for(PyObject *objs, PyGC_Head *list, PyObject *resultlist)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001651{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001652 PyGC_Head *gc;
1653 PyObject *obj;
1654 traverseproc traverse;
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09001655 for (gc = GC_NEXT(list); gc != list; gc = GC_NEXT(gc)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001656 obj = FROM_GC(gc);
1657 traverse = Py_TYPE(obj)->tp_traverse;
1658 if (obj == objs || obj == resultlist)
1659 continue;
1660 if (traverse(obj, (visitproc)referrersvisit, objs)) {
1661 if (PyList_Append(resultlist, obj) < 0)
1662 return 0; /* error */
1663 }
1664 }
1665 return 1; /* no error */
Neil Schemenauer48c70342001-08-09 15:38:31 +00001666}
1667
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001668PyDoc_STRVAR(gc_get_referrers__doc__,
Martin v. Löwis560da622001-11-24 09:24:51 +00001669"get_referrers(*objs) -> list\n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001670Return the list of objects that directly refer to any of objs.");
Neil Schemenauer48c70342001-08-09 15:38:31 +00001671
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001672static PyObject *
Martin v. Löwis560da622001-11-24 09:24:51 +00001673gc_get_referrers(PyObject *self, PyObject *args)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001674{
Victor Stinner67e0de62019-11-20 11:48:18 +01001675 PyThreadState *tstate = _PyThreadState_GET();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001676 int i;
1677 PyObject *result = PyList_New(0);
Victor Stinner67e0de62019-11-20 11:48:18 +01001678 if (!result) {
1679 return NULL;
1680 }
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001681
Victor Stinner72474072019-11-20 12:25:50 +01001682 GCState *gcstate = &tstate->interp->gc;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001683 for (i = 0; i < NUM_GENERATIONS; i++) {
Victor Stinner67e0de62019-11-20 11:48:18 +01001684 if (!(gc_referrers_for(args, GEN_HEAD(gcstate, i), result))) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001685 Py_DECREF(result);
1686 return NULL;
1687 }
1688 }
1689 return result;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001690}
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001691
Tim Peters0f81ab62003-04-08 16:39:48 +00001692/* Append obj to list; return true if error (out of memory), false if OK. */
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001693static int
Tim Peters730f5532003-04-08 17:17:17 +00001694referentsvisit(PyObject *obj, PyObject *list)
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001695{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001696 return PyList_Append(list, obj) < 0;
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001697}
1698
Tim Peters730f5532003-04-08 17:17:17 +00001699PyDoc_STRVAR(gc_get_referents__doc__,
1700"get_referents(*objs) -> list\n\
Jeremy Hylton059b0942003-04-03 16:29:13 +00001701Return the list of objects that are directly referred to by objs.");
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001702
1703static PyObject *
Tim Peters730f5532003-04-08 17:17:17 +00001704gc_get_referents(PyObject *self, PyObject *args)
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001705{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001706 Py_ssize_t i;
1707 PyObject *result = PyList_New(0);
Tim Peters0f81ab62003-04-08 16:39:48 +00001708
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001709 if (result == NULL)
1710 return NULL;
Tim Peters0f81ab62003-04-08 16:39:48 +00001711
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001712 for (i = 0; i < PyTuple_GET_SIZE(args); i++) {
1713 traverseproc traverse;
1714 PyObject *obj = PyTuple_GET_ITEM(args, i);
Tim Peters0f81ab62003-04-08 16:39:48 +00001715
Hai Shi675d9a32020-04-15 02:11:20 +08001716 if (!_PyObject_IS_GC(obj))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001717 continue;
1718 traverse = Py_TYPE(obj)->tp_traverse;
1719 if (! traverse)
1720 continue;
1721 if (traverse(obj, (visitproc)referentsvisit, result)) {
1722 Py_DECREF(result);
1723 return NULL;
1724 }
1725 }
1726 return result;
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001727}
1728
Serhiy Storchaka93260282017-02-04 11:19:59 +02001729/*[clinic input]
1730gc.get_objects
Pablo Galindo175421b2019-02-23 03:02:06 +00001731 generation: Py_ssize_t(accept={int, NoneType}, c_default="-1") = None
1732 Generation to extract the objects from.
Serhiy Storchaka93260282017-02-04 11:19:59 +02001733
1734Return a list of objects tracked by the collector (excluding the list returned).
Pablo Galindo175421b2019-02-23 03:02:06 +00001735
1736If generation is not None, return only the objects tracked by the collector
1737that are in that generation.
Serhiy Storchaka93260282017-02-04 11:19:59 +02001738[clinic start generated code]*/
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001739
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001740static PyObject *
Pablo Galindo175421b2019-02-23 03:02:06 +00001741gc_get_objects_impl(PyObject *module, Py_ssize_t generation)
1742/*[clinic end generated code: output=48b35fea4ba6cb0e input=ef7da9df9806754c]*/
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001743{
Victor Stinner67e0de62019-11-20 11:48:18 +01001744 PyThreadState *tstate = _PyThreadState_GET();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001745 int i;
1746 PyObject* result;
Victor Stinner72474072019-11-20 12:25:50 +01001747 GCState *gcstate = &tstate->interp->gc;
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001748
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001749 result = PyList_New(0);
Pablo Galindo175421b2019-02-23 03:02:06 +00001750 if (result == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001751 return NULL;
Pablo Galindo175421b2019-02-23 03:02:06 +00001752 }
1753
1754 /* If generation is passed, we extract only that generation */
Victor Stinner0810fa72019-04-15 17:54:09 +02001755 if (generation != -1) {
Pablo Galindo175421b2019-02-23 03:02:06 +00001756 if (generation >= NUM_GENERATIONS) {
Victor Stinner67e0de62019-11-20 11:48:18 +01001757 _PyErr_Format(tstate, PyExc_ValueError,
1758 "generation parameter must be less than the number of "
1759 "available generations (%i)",
1760 NUM_GENERATIONS);
Pablo Galindo175421b2019-02-23 03:02:06 +00001761 goto error;
1762 }
1763
1764 if (generation < 0) {
Victor Stinner67e0de62019-11-20 11:48:18 +01001765 _PyErr_SetString(tstate, PyExc_ValueError,
1766 "generation parameter cannot be negative");
Pablo Galindo175421b2019-02-23 03:02:06 +00001767 goto error;
1768 }
1769
Victor Stinner67e0de62019-11-20 11:48:18 +01001770 if (append_objects(result, GEN_HEAD(gcstate, generation))) {
Pablo Galindo175421b2019-02-23 03:02:06 +00001771 goto error;
1772 }
1773
1774 return result;
1775 }
1776
1777 /* If generation is not passed or None, get all objects from all generations */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001778 for (i = 0; i < NUM_GENERATIONS; i++) {
Victor Stinner67e0de62019-11-20 11:48:18 +01001779 if (append_objects(result, GEN_HEAD(gcstate, i))) {
Pablo Galindo175421b2019-02-23 03:02:06 +00001780 goto error;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001781 }
1782 }
1783 return result;
Pablo Galindo175421b2019-02-23 03:02:06 +00001784
1785error:
1786 Py_DECREF(result);
1787 return NULL;
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001788}
1789
Serhiy Storchaka93260282017-02-04 11:19:59 +02001790/*[clinic input]
1791gc.get_stats
1792
1793Return a list of dictionaries containing per-generation statistics.
1794[clinic start generated code]*/
Antoine Pitroud4156c12012-10-30 22:43:19 +01001795
1796static PyObject *
Serhiy Storchaka93260282017-02-04 11:19:59 +02001797gc_get_stats_impl(PyObject *module)
1798/*[clinic end generated code: output=a8ab1d8a5d26f3ab input=1ef4ed9d17b1a470]*/
Antoine Pitroud4156c12012-10-30 22:43:19 +01001799{
1800 int i;
Antoine Pitroud4156c12012-10-30 22:43:19 +01001801 struct gc_generation_stats stats[NUM_GENERATIONS], *st;
Victor Stinner67e0de62019-11-20 11:48:18 +01001802 PyThreadState *tstate = _PyThreadState_GET();
Antoine Pitroud4156c12012-10-30 22:43:19 +01001803
1804 /* To get consistent values despite allocations while constructing
1805 the result list, we use a snapshot of the running stats. */
Victor Stinner72474072019-11-20 12:25:50 +01001806 GCState *gcstate = &tstate->interp->gc;
Antoine Pitroud4156c12012-10-30 22:43:19 +01001807 for (i = 0; i < NUM_GENERATIONS; i++) {
Victor Stinner67e0de62019-11-20 11:48:18 +01001808 stats[i] = gcstate->generation_stats[i];
Antoine Pitroud4156c12012-10-30 22:43:19 +01001809 }
1810
Victor Stinner9db03242019-04-26 02:32:01 +02001811 PyObject *result = PyList_New(0);
Antoine Pitroud4156c12012-10-30 22:43:19 +01001812 if (result == NULL)
1813 return NULL;
1814
1815 for (i = 0; i < NUM_GENERATIONS; i++) {
1816 PyObject *dict;
1817 st = &stats[i];
1818 dict = Py_BuildValue("{snsnsn}",
1819 "collections", st->collections,
1820 "collected", st->collected,
1821 "uncollectable", st->uncollectable
1822 );
1823 if (dict == NULL)
1824 goto error;
1825 if (PyList_Append(result, dict)) {
1826 Py_DECREF(dict);
1827 goto error;
1828 }
1829 Py_DECREF(dict);
1830 }
1831 return result;
1832
1833error:
1834 Py_XDECREF(result);
1835 return NULL;
1836}
1837
1838
Serhiy Storchaka93260282017-02-04 11:19:59 +02001839/*[clinic input]
1840gc.is_tracked
1841
1842 obj: object
1843 /
1844
1845Returns true if the object is tracked by the garbage collector.
1846
1847Simple atomic objects will return false.
1848[clinic start generated code]*/
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001849
1850static PyObject *
Serhiy Storchaka93260282017-02-04 11:19:59 +02001851gc_is_tracked(PyObject *module, PyObject *obj)
1852/*[clinic end generated code: output=14f0103423b28e31 input=d83057f170ea2723]*/
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001853{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001854 PyObject *result;
1855
Hai Shi675d9a32020-04-15 02:11:20 +08001856 if (_PyObject_IS_GC(obj) && _PyObject_GC_IS_TRACKED(obj))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001857 result = Py_True;
1858 else
1859 result = Py_False;
1860 Py_INCREF(result);
1861 return result;
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001862}
1863
brainfvckc75edab2017-10-16 12:49:41 -07001864/*[clinic input]
Pablo Galindoa2ec3f02020-01-14 12:06:45 +00001865gc.is_finalized
1866
1867 obj: object
1868 /
1869
1870Returns true if the object has been already finalized by the GC.
1871[clinic start generated code]*/
1872
1873static PyObject *
1874gc_is_finalized(PyObject *module, PyObject *obj)
1875/*[clinic end generated code: output=e1516ac119a918ed input=201d0c58f69ae390]*/
1876{
Hai Shi675d9a32020-04-15 02:11:20 +08001877 if (_PyObject_IS_GC(obj) && _PyGCHead_FINALIZED(AS_GC(obj))) {
Pablo Galindoa2ec3f02020-01-14 12:06:45 +00001878 Py_RETURN_TRUE;
1879 }
1880 Py_RETURN_FALSE;
1881}
1882
1883/*[clinic input]
brainfvckc75edab2017-10-16 12:49:41 -07001884gc.freeze
1885
1886Freeze all current tracked objects and ignore them for future collections.
1887
1888This can be used before a POSIX fork() call to make the gc copy-on-write friendly.
1889Note: collection before a POSIX fork() call may free pages for future allocation
1890which can cause copy-on-write.
1891[clinic start generated code]*/
1892
1893static PyObject *
1894gc_freeze_impl(PyObject *module)
1895/*[clinic end generated code: output=502159d9cdc4c139 input=b602b16ac5febbe5]*/
1896{
Victor Stinner67e0de62019-11-20 11:48:18 +01001897 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001898 GCState *gcstate = &tstate->interp->gc;
brainfvckc75edab2017-10-16 12:49:41 -07001899 for (int i = 0; i < NUM_GENERATIONS; ++i) {
Victor Stinner67e0de62019-11-20 11:48:18 +01001900 gc_list_merge(GEN_HEAD(gcstate, i), &gcstate->permanent_generation.head);
1901 gcstate->generations[i].count = 0;
brainfvckc75edab2017-10-16 12:49:41 -07001902 }
1903 Py_RETURN_NONE;
1904}
1905
1906/*[clinic input]
1907gc.unfreeze
1908
1909Unfreeze all objects in the permanent generation.
1910
1911Put all objects in the permanent generation back into oldest generation.
1912[clinic start generated code]*/
1913
1914static PyObject *
1915gc_unfreeze_impl(PyObject *module)
1916/*[clinic end generated code: output=1c15f2043b25e169 input=2dd52b170f4cef6c]*/
1917{
Victor Stinner67e0de62019-11-20 11:48:18 +01001918 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001919 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01001920 gc_list_merge(&gcstate->permanent_generation.head,
1921 GEN_HEAD(gcstate, NUM_GENERATIONS-1));
brainfvckc75edab2017-10-16 12:49:41 -07001922 Py_RETURN_NONE;
1923}
1924
1925/*[clinic input]
Victor Stinner05d68a82018-01-18 11:15:25 +01001926gc.get_freeze_count -> Py_ssize_t
brainfvckc75edab2017-10-16 12:49:41 -07001927
1928Return the number of objects in the permanent generation.
1929[clinic start generated code]*/
1930
Victor Stinner05d68a82018-01-18 11:15:25 +01001931static Py_ssize_t
brainfvckc75edab2017-10-16 12:49:41 -07001932gc_get_freeze_count_impl(PyObject *module)
Victor Stinner05d68a82018-01-18 11:15:25 +01001933/*[clinic end generated code: output=61cbd9f43aa032e1 input=45ffbc65cfe2a6ed]*/
brainfvckc75edab2017-10-16 12:49:41 -07001934{
Victor Stinner67e0de62019-11-20 11:48:18 +01001935 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01001936 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01001937 return gc_list_size(&gcstate->permanent_generation.head);
brainfvckc75edab2017-10-16 12:49:41 -07001938}
1939
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001940
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001941PyDoc_STRVAR(gc__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001942"This module provides access to the garbage collector for reference cycles.\n"
1943"\n"
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001944"enable() -- Enable automatic garbage collection.\n"
1945"disable() -- Disable automatic garbage collection.\n"
1946"isenabled() -- Returns true if automatic collection is enabled.\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001947"collect() -- Do a full collection right now.\n"
Thomas Wouters89f507f2006-12-13 04:49:30 +00001948"get_count() -- Return the current collection counts.\n"
R David Murray0e814632013-12-26 15:11:28 -05001949"get_stats() -- Return list of dictionaries containing per-generation stats.\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001950"set_debug() -- Set debugging flags.\n"
1951"get_debug() -- Get debugging flags.\n"
1952"set_threshold() -- Set the collection thresholds.\n"
1953"get_threshold() -- Return the current the collection thresholds.\n"
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001954"get_objects() -- Return a list of all objects tracked by the collector.\n"
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001955"is_tracked() -- Returns true if a given object is tracked.\n"
Pablo Galindob6791372020-01-14 17:38:15 +00001956"is_finalized() -- Returns true if a given object has been already finalized.\n"
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001957"get_referrers() -- Return the list of objects that refer to an object.\n"
brainfvckc75edab2017-10-16 12:49:41 -07001958"get_referents() -- Return the list of objects that an object refers to.\n"
1959"freeze() -- Freeze all tracked objects and ignore them for future collections.\n"
1960"unfreeze() -- Unfreeze all objects in the permanent generation.\n"
1961"get_freeze_count() -- Return the number of objects in the permanent generation.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001962
1963static PyMethodDef GcMethods[] = {
Serhiy Storchaka93260282017-02-04 11:19:59 +02001964 GC_ENABLE_METHODDEF
1965 GC_DISABLE_METHODDEF
1966 GC_ISENABLED_METHODDEF
1967 GC_SET_DEBUG_METHODDEF
1968 GC_GET_DEBUG_METHODDEF
1969 GC_GET_COUNT_METHODDEF
Victor Stinner9db03242019-04-26 02:32:01 +02001970 {"set_threshold", gc_set_threshold, METH_VARARGS, gc_set_thresh__doc__},
Serhiy Storchaka93260282017-02-04 11:19:59 +02001971 GC_GET_THRESHOLD_METHODDEF
1972 GC_COLLECT_METHODDEF
1973 GC_GET_OBJECTS_METHODDEF
1974 GC_GET_STATS_METHODDEF
1975 GC_IS_TRACKED_METHODDEF
Pablo Galindoa2ec3f02020-01-14 12:06:45 +00001976 GC_IS_FINALIZED_METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001977 {"get_referrers", gc_get_referrers, METH_VARARGS,
1978 gc_get_referrers__doc__},
1979 {"get_referents", gc_get_referents, METH_VARARGS,
1980 gc_get_referents__doc__},
brainfvckc75edab2017-10-16 12:49:41 -07001981 GC_FREEZE_METHODDEF
1982 GC_UNFREEZE_METHODDEF
1983 GC_GET_FREEZE_COUNT_METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001984 {NULL, NULL} /* Sentinel */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001985};
1986
Martin v. Löwis1a214512008-06-11 05:26:20 +00001987static struct PyModuleDef gcmodule = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001988 PyModuleDef_HEAD_INIT,
Antoine Pitrou696e0352010-08-08 22:18:46 +00001989 "gc", /* m_name */
1990 gc__doc__, /* m_doc */
1991 -1, /* m_size */
1992 GcMethods, /* m_methods */
1993 NULL, /* m_reload */
1994 NULL, /* m_traverse */
1995 NULL, /* m_clear */
1996 NULL /* m_free */
Martin v. Löwis1a214512008-06-11 05:26:20 +00001997};
1998
Jason Tishler6bc06ec2003-09-04 11:59:50 +00001999PyMODINIT_FUNC
Martin v. Löwis1a214512008-06-11 05:26:20 +00002000PyInit_gc(void)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00002001{
Victor Stinner72474072019-11-20 12:25:50 +01002002 PyThreadState *tstate = _PyThreadState_GET();
2003 GCState *gcstate = &tstate->interp->gc;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00002004
Victor Stinner72474072019-11-20 12:25:50 +01002005 PyObject *m = PyModule_Create(&gcmodule);
Martin v. Löwis1a214512008-06-11 05:26:20 +00002006
Victor Stinner9db03242019-04-26 02:32:01 +02002007 if (m == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002008 return NULL;
Victor Stinner9db03242019-04-26 02:32:01 +02002009 }
Tim Peters11558872003-04-06 23:30:52 +00002010
Victor Stinner67e0de62019-11-20 11:48:18 +01002011 if (gcstate->garbage == NULL) {
2012 gcstate->garbage = PyList_New(0);
Victor Stinner72474072019-11-20 12:25:50 +01002013 if (gcstate->garbage == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002014 return NULL;
Victor Stinner72474072019-11-20 12:25:50 +01002015 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002016 }
Victor Stinner67e0de62019-11-20 11:48:18 +01002017 Py_INCREF(gcstate->garbage);
Victor Stinner72474072019-11-20 12:25:50 +01002018 if (PyModule_AddObject(m, "garbage", gcstate->garbage) < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002019 return NULL;
Victor Stinner72474072019-11-20 12:25:50 +01002020 }
Thomas Wouters477c8d52006-05-27 19:21:47 +00002021
Victor Stinner67e0de62019-11-20 11:48:18 +01002022 if (gcstate->callbacks == NULL) {
2023 gcstate->callbacks = PyList_New(0);
Victor Stinner72474072019-11-20 12:25:50 +01002024 if (gcstate->callbacks == NULL) {
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00002025 return NULL;
Victor Stinner72474072019-11-20 12:25:50 +01002026 }
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00002027 }
Victor Stinner67e0de62019-11-20 11:48:18 +01002028 Py_INCREF(gcstate->callbacks);
Victor Stinner72474072019-11-20 12:25:50 +01002029 if (PyModule_AddObject(m, "callbacks", gcstate->callbacks) < 0) {
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00002030 return NULL;
Victor Stinner72474072019-11-20 12:25:50 +01002031 }
Kristján Valur Jónsson69c63522012-04-15 11:41:32 +00002032
Victor Stinner72474072019-11-20 12:25:50 +01002033#define ADD_INT(NAME) if (PyModule_AddIntConstant(m, #NAME, NAME) < 0) { return NULL; }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002034 ADD_INT(DEBUG_STATS);
2035 ADD_INT(DEBUG_COLLECTABLE);
2036 ADD_INT(DEBUG_UNCOLLECTABLE);
2037 ADD_INT(DEBUG_SAVEALL);
2038 ADD_INT(DEBUG_LEAK);
Tim Peters11558872003-04-06 23:30:52 +00002039#undef ADD_INT
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002040 return m;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00002041}
2042
Guido van Rossume13ddc92003-04-17 17:29:22 +00002043/* API to invoke gc.collect() from C */
Neal Norwitz7b216c52006-03-04 20:01:53 +00002044Py_ssize_t
Guido van Rossume13ddc92003-04-17 17:29:22 +00002045PyGC_Collect(void)
2046{
Victor Stinner2e969062019-11-20 01:49:32 +01002047 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01002048 GCState *gcstate = &tstate->interp->gc;
Victor Stinner2e969062019-11-20 01:49:32 +01002049
Victor Stinner67e0de62019-11-20 11:48:18 +01002050 if (!gcstate->enabled) {
Victor Stinner9db03242019-04-26 02:32:01 +02002051 return 0;
2052 }
Guido van Rossume13ddc92003-04-17 17:29:22 +00002053
Victor Stinner9db03242019-04-26 02:32:01 +02002054 Py_ssize_t n;
Victor Stinner67e0de62019-11-20 11:48:18 +01002055 if (gcstate->collecting) {
Victor Stinner9db03242019-04-26 02:32:01 +02002056 /* already collecting, don't do anything */
2057 n = 0;
2058 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002059 else {
Serhiy Storchaka301e3cc2018-05-24 15:19:29 +03002060 PyObject *exc, *value, *tb;
Victor Stinner67e0de62019-11-20 11:48:18 +01002061 gcstate->collecting = 1;
Victor Stinner2e969062019-11-20 01:49:32 +01002062 _PyErr_Fetch(tstate, &exc, &value, &tb);
Victor Stinner67e0de62019-11-20 11:48:18 +01002063 n = collect_with_callback(tstate, NUM_GENERATIONS - 1);
Victor Stinner2e969062019-11-20 01:49:32 +01002064 _PyErr_Restore(tstate, exc, value, tb);
Victor Stinner67e0de62019-11-20 11:48:18 +01002065 gcstate->collecting = 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002066 }
Guido van Rossume13ddc92003-04-17 17:29:22 +00002067
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002068 return n;
Guido van Rossume13ddc92003-04-17 17:29:22 +00002069}
2070
Antoine Pitroufef34e32013-05-19 01:11:58 +02002071Py_ssize_t
Łukasz Langafef7e942016-09-09 21:47:46 -07002072_PyGC_CollectIfEnabled(void)
2073{
Łukasz Langafef7e942016-09-09 21:47:46 -07002074 return PyGC_Collect();
2075}
2076
2077Py_ssize_t
Antoine Pitroufef34e32013-05-19 01:11:58 +02002078_PyGC_CollectNoFail(void)
2079{
Victor Stinner2e969062019-11-20 01:49:32 +01002080 PyThreadState *tstate = _PyThreadState_GET();
2081 assert(!_PyErr_Occurred(tstate));
Victor Stinner9db03242019-04-26 02:32:01 +02002082
Victor Stinner72474072019-11-20 12:25:50 +01002083 GCState *gcstate = &tstate->interp->gc;
Antoine Pitroufef34e32013-05-19 01:11:58 +02002084 Py_ssize_t n;
2085
Antoine Pitrouc69c9bc2013-08-15 20:15:15 +02002086 /* Ideally, this function is only called on interpreter shutdown,
2087 and therefore not recursively. Unfortunately, when there are daemon
2088 threads, a daemon thread can start a cyclic garbage collection
2089 during interpreter shutdown (and then never finish it).
2090 See http://bugs.python.org/issue8713#msg195178 for an example.
2091 */
Victor Stinner67e0de62019-11-20 11:48:18 +01002092 if (gcstate->collecting) {
Antoine Pitrouc69c9bc2013-08-15 20:15:15 +02002093 n = 0;
Victor Stinner9db03242019-04-26 02:32:01 +02002094 }
Antoine Pitrouc69c9bc2013-08-15 20:15:15 +02002095 else {
Victor Stinner67e0de62019-11-20 11:48:18 +01002096 gcstate->collecting = 1;
2097 n = collect(tstate, NUM_GENERATIONS - 1, NULL, NULL, 1);
2098 gcstate->collecting = 0;
Antoine Pitrouc69c9bc2013-08-15 20:15:15 +02002099 }
Antoine Pitroufef34e32013-05-19 01:11:58 +02002100 return n;
2101}
Antoine Pitrou5f454a02013-05-06 21:15:57 +02002102
Antoine Pitrou696e0352010-08-08 22:18:46 +00002103void
Victor Stinner67e0de62019-11-20 11:48:18 +01002104_PyGC_DumpShutdownStats(PyThreadState *tstate)
Antoine Pitrou696e0352010-08-08 22:18:46 +00002105{
Victor Stinner72474072019-11-20 12:25:50 +01002106 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01002107 if (!(gcstate->debug & DEBUG_SAVEALL)
2108 && gcstate->garbage != NULL && PyList_GET_SIZE(gcstate->garbage) > 0) {
Serhiy Storchakae2f92de2017-11-11 13:06:26 +02002109 const char *message;
Victor Stinner67e0de62019-11-20 11:48:18 +01002110 if (gcstate->debug & DEBUG_UNCOLLECTABLE)
Antoine Pitroub5d82042010-11-05 00:05:25 +00002111 message = "gc: %zd uncollectable objects at " \
Georg Brandl08be72d2010-10-24 15:11:22 +00002112 "shutdown";
2113 else
Antoine Pitroub5d82042010-11-05 00:05:25 +00002114 message = "gc: %zd uncollectable objects at " \
Georg Brandl08be72d2010-10-24 15:11:22 +00002115 "shutdown; use gc.set_debug(gc.DEBUG_UNCOLLECTABLE) to list them";
Antoine Pitrou070cb3c2013-05-08 13:23:25 +02002116 /* PyErr_WarnFormat does too many things and we are at shutdown,
2117 the warnings module's dependencies (e.g. linecache) may be gone
2118 already. */
2119 if (PyErr_WarnExplicitFormat(PyExc_ResourceWarning, "gc", 0,
2120 "gc", NULL, message,
Victor Stinner67e0de62019-11-20 11:48:18 +01002121 PyList_GET_SIZE(gcstate->garbage)))
Georg Brandl08be72d2010-10-24 15:11:22 +00002122 PyErr_WriteUnraisable(NULL);
Victor Stinner67e0de62019-11-20 11:48:18 +01002123 if (gcstate->debug & DEBUG_UNCOLLECTABLE) {
Antoine Pitrou696e0352010-08-08 22:18:46 +00002124 PyObject *repr = NULL, *bytes = NULL;
Victor Stinner67e0de62019-11-20 11:48:18 +01002125 repr = PyObject_Repr(gcstate->garbage);
Antoine Pitrou696e0352010-08-08 22:18:46 +00002126 if (!repr || !(bytes = PyUnicode_EncodeFSDefault(repr)))
Victor Stinner67e0de62019-11-20 11:48:18 +01002127 PyErr_WriteUnraisable(gcstate->garbage);
Antoine Pitrou696e0352010-08-08 22:18:46 +00002128 else {
2129 PySys_WriteStderr(
Antoine Pitrou070cb3c2013-05-08 13:23:25 +02002130 " %s\n",
Antoine Pitrou696e0352010-08-08 22:18:46 +00002131 PyBytes_AS_STRING(bytes)
2132 );
2133 }
2134 Py_XDECREF(repr);
2135 Py_XDECREF(bytes);
2136 }
Antoine Pitrou696e0352010-08-08 22:18:46 +00002137 }
Antoine Pitrou5f454a02013-05-06 21:15:57 +02002138}
2139
2140void
Victor Stinner7eee5be2019-11-20 10:38:34 +01002141_PyGC_Fini(PyThreadState *tstate)
Antoine Pitrou5f454a02013-05-06 21:15:57 +02002142{
Victor Stinner72474072019-11-20 12:25:50 +01002143 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01002144 Py_CLEAR(gcstate->garbage);
2145 Py_CLEAR(gcstate->callbacks);
Antoine Pitrou696e0352010-08-08 22:18:46 +00002146}
2147
Neil Schemenauer43411b52001-08-30 00:05:51 +00002148/* for debugging */
Guido van Rossume13ddc92003-04-17 17:29:22 +00002149void
2150_PyGC_Dump(PyGC_Head *g)
Neil Schemenauer43411b52001-08-30 00:05:51 +00002151{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002152 _PyObject_Dump(FROM_GC(g));
Neil Schemenauer43411b52001-08-30 00:05:51 +00002153}
2154
Victor Stinnera5447732019-10-10 09:32:13 +02002155
#ifdef Py_DEBUG
/* visitproc used by PyObject_GC_Track() in debug builds: reports an
   assertion failure against the parent object when a visited object
   looks freed.  Always returns 0. */
static int
visit_validate(PyObject *op, void *parent_raw)
{
    if (!_PyObject_IsFreed(op)) {
        return 0;
    }

    PyObject *owner = _PyObject_CAST(parent_raw);
    _PyObject_ASSERT_FAILED_MSG(owner,
                                "PyObject_GC_Track() object is not valid");
    return 0;
}
#endif
Victor Stinner1b184552019-10-08 00:09:31 +02002168
2169
Neil Schemenauer43411b52001-08-30 00:05:51 +00002170/* extension modules might be compiled with GC support so these
2171 functions must always be available */
2172
2173void
Victor Stinnera42de742018-11-22 10:25:22 +01002174PyObject_GC_Track(void *op_raw)
Neil Schemenauer43411b52001-08-30 00:05:51 +00002175{
Victor Stinnera42de742018-11-22 10:25:22 +01002176 PyObject *op = _PyObject_CAST(op_raw);
Victor Stinner271753a2018-11-22 01:02:54 +01002177 if (_PyObject_GC_IS_TRACKED(op)) {
2178 _PyObject_ASSERT_FAILED_MSG(op,
2179 "object already tracked "
2180 "by the garbage collector");
2181 }
Victor Stinnera42de742018-11-22 10:25:22 +01002182 _PyObject_GC_TRACK(op);
Victor Stinner1b184552019-10-08 00:09:31 +02002183
2184#ifdef Py_DEBUG
2185 /* Check that the object is valid: validate objects traversed
2186 by tp_traverse() */
2187 traverseproc traverse = Py_TYPE(op)->tp_traverse;
2188 (void)traverse(op, visit_validate, op);
2189#endif
Neil Schemenauer43411b52001-08-30 00:05:51 +00002190}
2191
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00002192void
Victor Stinnera42de742018-11-22 10:25:22 +01002193PyObject_GC_UnTrack(void *op_raw)
Neil Schemenauer43411b52001-08-30 00:05:51 +00002194{
Victor Stinnera42de742018-11-22 10:25:22 +01002195 PyObject *op = _PyObject_CAST(op_raw);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002196 /* Obscure: the Py_TRASHCAN mechanism requires that we be able to
2197 * call PyObject_GC_UnTrack twice on an object.
2198 */
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09002199 if (_PyObject_GC_IS_TRACKED(op)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002200 _PyObject_GC_UNTRACK(op);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09002201 }
Neil Schemenauer43411b52001-08-30 00:05:51 +00002202}
2203
Hai Shi675d9a32020-04-15 02:11:20 +08002204int
2205PyObject_IS_GC(PyObject *obj)
2206{
2207 return _PyObject_IS_GC(obj);
2208}
2209
Victor Stinnerdb067af2014-05-02 22:31:14 +02002210static PyObject *
2211_PyObject_GC_Alloc(int use_calloc, size_t basicsize)
Neil Schemenauer43411b52001-08-30 00:05:51 +00002212{
Victor Stinner67e0de62019-11-20 11:48:18 +01002213 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01002214 GCState *gcstate = &tstate->interp->gc;
Victor Stinner2e969062019-11-20 01:49:32 +01002215 if (basicsize > PY_SSIZE_T_MAX - sizeof(PyGC_Head)) {
Victor Stinner67e0de62019-11-20 11:48:18 +01002216 return _PyErr_NoMemory(tstate);
Victor Stinner2e969062019-11-20 01:49:32 +01002217 }
2218 size_t size = sizeof(PyGC_Head) + basicsize;
2219
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002220 PyGC_Head *g;
Victor Stinner2e969062019-11-20 01:49:32 +01002221 if (use_calloc) {
Victor Stinnerdb067af2014-05-02 22:31:14 +02002222 g = (PyGC_Head *)PyObject_Calloc(1, size);
Victor Stinner2e969062019-11-20 01:49:32 +01002223 }
2224 else {
Victor Stinnerdb067af2014-05-02 22:31:14 +02002225 g = (PyGC_Head *)PyObject_Malloc(size);
Victor Stinner2e969062019-11-20 01:49:32 +01002226 }
2227 if (g == NULL) {
Victor Stinner67e0de62019-11-20 11:48:18 +01002228 return _PyErr_NoMemory(tstate);
Victor Stinner2e969062019-11-20 01:49:32 +01002229 }
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09002230 assert(((uintptr_t)g & 3) == 0); // g must be aligned 4bytes boundary
Victor Stinner2e969062019-11-20 01:49:32 +01002231
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09002232 g->_gc_next = 0;
2233 g->_gc_prev = 0;
Victor Stinner67e0de62019-11-20 11:48:18 +01002234 gcstate->generations[0].count++; /* number of allocated GC objects */
2235 if (gcstate->generations[0].count > gcstate->generations[0].threshold &&
2236 gcstate->enabled &&
2237 gcstate->generations[0].threshold &&
2238 !gcstate->collecting &&
2239 !_PyErr_Occurred(tstate))
Victor Stinner2e969062019-11-20 01:49:32 +01002240 {
Victor Stinner67e0de62019-11-20 11:48:18 +01002241 gcstate->collecting = 1;
2242 collect_generations(tstate);
2243 gcstate->collecting = 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002244 }
Victor Stinner2e969062019-11-20 01:49:32 +01002245 PyObject *op = FROM_GC(g);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002246 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00002247}
2248
2249PyObject *
Victor Stinnerdb067af2014-05-02 22:31:14 +02002250_PyObject_GC_Malloc(size_t basicsize)
2251{
2252 return _PyObject_GC_Alloc(0, basicsize);
2253}
2254
2255PyObject *
2256_PyObject_GC_Calloc(size_t basicsize)
2257{
2258 return _PyObject_GC_Alloc(1, basicsize);
2259}
2260
2261PyObject *
Neil Schemenauer43411b52001-08-30 00:05:51 +00002262_PyObject_GC_New(PyTypeObject *tp)
2263{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002264 PyObject *op = _PyObject_GC_Malloc(_PyObject_SIZE(tp));
2265 if (op != NULL)
2266 op = PyObject_INIT(op, tp);
2267 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00002268}
2269
2270PyVarObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +00002271_PyObject_GC_NewVar(PyTypeObject *tp, Py_ssize_t nitems)
Neil Schemenauer43411b52001-08-30 00:05:51 +00002272{
Victor Stinner5d1866c2013-07-08 22:17:52 +02002273 size_t size;
2274 PyVarObject *op;
2275
2276 if (nitems < 0) {
2277 PyErr_BadInternalCall();
2278 return NULL;
2279 }
2280 size = _PyObject_VAR_SIZE(tp, nitems);
2281 op = (PyVarObject *) _PyObject_GC_Malloc(size);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002282 if (op != NULL)
2283 op = PyObject_INIT_VAR(op, tp, nitems);
2284 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00002285}
2286
2287PyVarObject *
Martin v. Löwis41290682006-02-16 14:56:14 +00002288_PyObject_GC_Resize(PyVarObject *op, Py_ssize_t nitems)
Neil Schemenauer43411b52001-08-30 00:05:51 +00002289{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002290 const size_t basicsize = _PyObject_VAR_SIZE(Py_TYPE(op), nitems);
Victor Stinnera4b2bc72018-10-26 18:00:13 +02002291 _PyObject_ASSERT((PyObject *)op, !_PyObject_GC_IS_TRACKED(op));
2292 if (basicsize > PY_SSIZE_T_MAX - sizeof(PyGC_Head)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002293 return (PyVarObject *)PyErr_NoMemory();
Victor Stinnera4b2bc72018-10-26 18:00:13 +02002294 }
2295
2296 PyGC_Head *g = AS_GC(op);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002297 g = (PyGC_Head *)PyObject_REALLOC(g, sizeof(PyGC_Head) + basicsize);
2298 if (g == NULL)
2299 return (PyVarObject *)PyErr_NoMemory();
2300 op = (PyVarObject *) FROM_GC(g);
Victor Stinner60ac6ed2020-02-07 23:18:08 +01002301 Py_SET_SIZE(op, nitems);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002302 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00002303}
2304
2305void
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00002306PyObject_GC_Del(void *op)
Neil Schemenauer43411b52001-08-30 00:05:51 +00002307{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002308 PyGC_Head *g = AS_GC(op);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09002309 if (_PyObject_GC_IS_TRACKED(op)) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002310 gc_list_remove(g);
INADA Naoki5ac9e6e2018-07-10 17:19:53 +09002311 }
Victor Stinner67e0de62019-11-20 11:48:18 +01002312 PyThreadState *tstate = _PyThreadState_GET();
Victor Stinner72474072019-11-20 12:25:50 +01002313 GCState *gcstate = &tstate->interp->gc;
Victor Stinner67e0de62019-11-20 11:48:18 +01002314 if (gcstate->generations[0].count > 0) {
2315 gcstate->generations[0].count--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002316 }
2317 PyObject_FREE(g);
Neil Schemenauer43411b52001-08-30 00:05:51 +00002318}
Pablo Galindof13072b2020-04-11 01:21:54 +01002319
2320int
2321PyObject_GC_IsTracked(PyObject* obj)
2322{
Hai Shi675d9a32020-04-15 02:11:20 +08002323 if (_PyObject_IS_GC(obj) && _PyObject_GC_IS_TRACKED(obj)) {
Pablo Galindof13072b2020-04-11 01:21:54 +01002324 return 1;
2325 }
2326 return 0;
2327}
2328
2329int
2330PyObject_GC_IsFinalized(PyObject *obj)
2331{
Hai Shi675d9a32020-04-15 02:11:20 +08002332 if (_PyObject_IS_GC(obj) && _PyGCHead_FINALIZED(AS_GC(obj))) {
Pablo Galindof13072b2020-04-11 01:21:54 +01002333 return 1;
2334 }
2335 return 0;
2336}