blob: 9b478199711e1a697fc53eec057584eb0e6a1586 [file] [log] [blame]
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001/*
Tim Peters88396172002-06-30 17:56:40 +00002
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00003 Reference Cycle Garbage Collection
4 ==================================
5
Neil Schemenauerb2c2c9e2000-10-04 16:34:09 +00006 Neil Schemenauer <nas@arctrix.com>
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00007
8 Based on a post on the python-dev list. Ideas from Guido van Rossum,
9 Eric Tiedemann, and various others.
10
Neil Schemenauer43411b52001-08-30 00:05:51 +000011 http://www.arctrix.com/nas/python/gc/
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000012 http://www.python.org/pipermail/python-dev/2000-March/003869.html
13 http://www.python.org/pipermail/python-dev/2000-March/004010.html
14 http://www.python.org/pipermail/python-dev/2000-March/004022.html
15
  For a high-level view of the collection process, read the collect
  function.
18
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000019*/
20
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000021#include "Python.h"
Christian Heimes3b718a72008-02-14 12:47:33 +000022#include "frameobject.h" /* for PyFrame_ClearFreeList */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000023
/* Get an object's GC head: step back one PyGC_Head from the object pointer. */
#define AS_GC(o) ((PyGC_Head *)(o)-1)

/* Get the object given the GC head: step forward one PyGC_Head.
 * The argument is parenthesized before the cast so that an expression
 * argument (e.g. `p + off`) is converted as a whole rather than having the
 * cast bind to its first operand only.
 */
#define FROM_GC(g) ((PyObject *)(((PyGC_Head *)(g))+1))
29
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000030/*** Global GC state ***/
31
Neil Schemenauer2880ae52002-05-04 05:35:20 +000032struct gc_generation {
33 PyGC_Head head;
34 int threshold; /* collection threshold */
35 int count; /* count of allocations or collections of younger
36 generations */
37};
38
39#define NUM_GENERATIONS 3
40#define GEN_HEAD(n) (&generations[n].head)
41
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000042/* linked lists of container objects */
Neil Schemenauer2880ae52002-05-04 05:35:20 +000043static struct gc_generation generations[NUM_GENERATIONS] = {
44 /* PyGC_Head, threshold, count */
45 {{{GEN_HEAD(0), GEN_HEAD(0), 0}}, 700, 0},
46 {{{GEN_HEAD(1), GEN_HEAD(1), 0}}, 10, 0},
47 {{{GEN_HEAD(2), GEN_HEAD(2), 0}}, 10, 0},
48};
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000049
Neil Schemenauer2880ae52002-05-04 05:35:20 +000050PyGC_Head *_PyGC_generation0 = GEN_HEAD(0);
51
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +000052static int enabled = 1; /* automatic collection enabled? */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000053
Neil Schemenauer43411b52001-08-30 00:05:51 +000054/* true if we are currently running the collector */
Tim Petersbf384c22003-04-06 00:11:39 +000055static int collecting = 0;
Neil Schemenauer43411b52001-08-30 00:05:51 +000056
Tim Peters6fc13d92002-07-02 18:12:35 +000057/* list of uncollectable objects */
Tim Petersbf384c22003-04-06 00:11:39 +000058static PyObject *garbage = NULL;
Tim Peters6fc13d92002-07-02 18:12:35 +000059
60/* Python string to use if unhandled exception occurs */
Tim Petersbf384c22003-04-06 00:11:39 +000061static PyObject *gc_str = NULL;
Tim Peters6fc13d92002-07-02 18:12:35 +000062
Tim Peters93ad66d2003-04-05 17:15:44 +000063/* Python string used to look for __del__ attribute. */
64static PyObject *delstr = NULL;
Jeremy Hyltonce136e92003-04-04 19:59:06 +000065
Antoine Pitrou4c5ecb72009-01-09 21:40:55 +000066/* This is the number of objects who survived the last full collection. It
67 approximates the number of long lived objects tracked by the GC.
68
69 (by "full collection", we mean a collection of the oldest generation).
70*/
71static Py_ssize_t long_lived_total = 0;
72
73/* This is the number of objects who survived all "non-full" collections,
74 and are awaiting to undergo a full collection for the first time.
75
76*/
77static Py_ssize_t long_lived_pending = 0;
78
79/*
80 NOTE: about the counting of long-lived objects.
81
    To limit the cost of garbage collection, there are two strategies:
    - make each collection faster, e.g. by scanning fewer objects
    - do fewer collections
85 This heuristic is about the latter strategy.
86
87 In addition to the various configurable thresholds, we only trigger a
88 full collection if the ratio
89 long_lived_pending / long_lived_total
90 is above a given value (hardwired to 25%).
91
92 The reason is that, while "non-full" collections (i.e., collections of
93 the young and middle generations) will always examine roughly the same
94 number of objects -- determined by the aforementioned thresholds --,
95 the cost of a full collection is proportional to the total number of
96 long-lived objects, which is virtually unbounded.
97
    Indeed, it has been remarked that doing a full collection every
    <constant number> of object creations entails a dramatic performance
    degradation in workloads that consist of creating and storing lots of
    long-lived objects (e.g. building a large list of GC-tracked objects would
    show quadratic performance, instead of linear as expected: see issue #4074).
103
104 Using the above ratio, instead, yields amortized linear performance in
105 the total number of objects (the effect of which can be summarized
106 thusly: "each full garbage collection is more and more costly as the
107 number of objects grows, but we do fewer and fewer of them").
108
109 This heuristic was suggested by Martin von Löwis on python-dev in
110 June 2008. His original analysis and proposal can be found at:
111 http://mail.python.org/pipermail/python-dev/2008-June/080579.html
112*/
113
114
/* Debugging flags: independent bits that may be or'ed together. */
#define DEBUG_STATS         (1<<0) /* print collection statistics */
#define DEBUG_COLLECTABLE   (1<<1) /* print collectable objects */
#define DEBUG_UNCOLLECTABLE (1<<2) /* print uncollectable objects */
#define DEBUG_INSTANCES     (1<<3) /* print instances */
#define DEBUG_OBJECTS       (1<<4) /* print other objects */
#define DEBUG_SAVEALL       (1<<5) /* save all garbage in gc.garbage */

/* Every flag except DEBUG_STATS.  The expansion is parenthesized so the
 * macro behaves as a single operand; without the parentheses an expression
 * such as `flags & DEBUG_LEAK` would parse as
 * `(flags & DEBUG_COLLECTABLE) | DEBUG_UNCOLLECTABLE | ...`.
 */
#define DEBUG_LEAK          (DEBUG_COLLECTABLE | \
                             DEBUG_UNCOLLECTABLE | \
                             DEBUG_INSTANCES | \
                             DEBUG_OBJECTS | \
                             DEBUG_SAVEALL)
Jeremy Hyltonb709df32000-09-01 02:47:25 +0000127static int debug;
Neal Norwitz57a03612006-04-26 05:34:03 +0000128static PyObject *tmod = NULL;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000129
Tim Peters6fc13d92002-07-02 18:12:35 +0000130/*--------------------------------------------------------------------------
131gc_refs values.
Neil Schemenauer43411b52001-08-30 00:05:51 +0000132
Tim Peters6fc13d92002-07-02 18:12:35 +0000133Between collections, every gc'ed object has one of two gc_refs values:
134
135GC_UNTRACKED
136 The initial state; objects returned by PyObject_GC_Malloc are in this
137 state. The object doesn't live in any generation list, and its
138 tp_traverse slot must not be called.
139
140GC_REACHABLE
141 The object lives in some generation list, and its tp_traverse is safe to
142 call. An object transitions to GC_REACHABLE when PyObject_GC_Track
143 is called.
144
145During a collection, gc_refs can temporarily take on other states:
146
147>= 0
148 At the start of a collection, update_refs() copies the true refcount
149 to gc_refs, for each object in the generation being collected.
150 subtract_refs() then adjusts gc_refs so that it equals the number of
151 times an object is referenced directly from outside the generation
152 being collected.
Martin v. Löwis774348c2002-11-09 19:54:06 +0000153 gc_refs remains >= 0 throughout these steps.
Tim Peters6fc13d92002-07-02 18:12:35 +0000154
155GC_TENTATIVELY_UNREACHABLE
156 move_unreachable() then moves objects not reachable (whether directly or
157 indirectly) from outside the generation into an "unreachable" set.
158 Objects that are found to be reachable have gc_refs set to GC_REACHABLE
159 again. Objects that are found to be unreachable have gc_refs set to
160 GC_TENTATIVELY_UNREACHABLE. It's "tentatively" because the pass doing
161 this can't be sure until it ends, and GC_TENTATIVELY_UNREACHABLE may
162 transition back to GC_REACHABLE.
163
164 Only objects with GC_TENTATIVELY_UNREACHABLE still set are candidates
165 for collection. If it's decided not to collect such an object (e.g.,
166 it has a __del__ method), its gc_refs is restored to GC_REACHABLE again.
167----------------------------------------------------------------------------
168*/
/* Short local names for the _PyGC_REFS_* sentinel values. */
#define GC_UNTRACKED                    _PyGC_REFS_UNTRACKED
#define GC_REACHABLE                    _PyGC_REFS_REACHABLE
#define GC_TENTATIVELY_UNREACHABLE      _PyGC_REFS_TENTATIVELY_UNREACHABLE

/* The gc_refs field stored in the GC head of object `o`. */
#define GC_REFS_OF(o) ((AS_GC(o))->gc.gc_refs)

/* Predicates on the gc_refs state of object `o`. */
#define IS_TRACKED(o)                   (GC_REFS_OF(o) != GC_UNTRACKED)
#define IS_REACHABLE(o)                 (GC_REFS_OF(o) == GC_REACHABLE)
#define IS_TENTATIVELY_UNREACHABLE(o)   \
    (GC_REFS_OF(o) == GC_TENTATIVELY_UNREACHABLE)
Neil Schemenauera2b11ec2002-05-21 15:53:24 +0000177
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000178/*** list functions ***/
179
180static void
181gc_list_init(PyGC_Head *list)
182{
Tim Peters9e4ca102001-10-11 18:31:31 +0000183 list->gc.gc_prev = list;
184 list->gc.gc_next = list;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000185}
186
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000187static int
188gc_list_is_empty(PyGC_Head *list)
189{
190 return (list->gc.gc_next == list);
191}
192
#if 0
/* Compiled out: this became unused after gc_list_move() was introduced. */
/* Link `node` in as the last element of `list`. */
static void
gc_list_append(PyGC_Head *node, PyGC_Head *list)
{
    PyGC_Head *tail = list->gc.gc_prev;

    node->gc.gc_next = list;
    node->gc.gc_prev = tail;
    tail->gc.gc_next = node;
    list->gc.gc_prev = node;
}
#endif
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000205
Tim Peterse2d59182004-11-01 01:39:08 +0000206/* Remove `node` from the gc list it's currently in. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000207static void
208gc_list_remove(PyGC_Head *node)
209{
Tim Peters9e4ca102001-10-11 18:31:31 +0000210 node->gc.gc_prev->gc.gc_next = node->gc.gc_next;
211 node->gc.gc_next->gc.gc_prev = node->gc.gc_prev;
212 node->gc.gc_next = NULL; /* object is not currently tracked */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000213}
214
Tim Peterse2d59182004-11-01 01:39:08 +0000215/* Move `node` from the gc list it's currently in (which is not explicitly
216 * named here) to the end of `list`. This is semantically the same as
217 * gc_list_remove(node) followed by gc_list_append(node, list).
218 */
219static void
220gc_list_move(PyGC_Head *node, PyGC_Head *list)
221{
Tim Petersbc1d1b82004-11-01 16:39:57 +0000222 PyGC_Head *new_prev;
Tim Peterse2d59182004-11-01 01:39:08 +0000223 PyGC_Head *current_prev = node->gc.gc_prev;
224 PyGC_Head *current_next = node->gc.gc_next;
Tim Petersbc1d1b82004-11-01 16:39:57 +0000225 /* Unlink from current list. */
Tim Peterse2d59182004-11-01 01:39:08 +0000226 current_prev->gc.gc_next = current_next;
227 current_next->gc.gc_prev = current_prev;
Tim Petersbc1d1b82004-11-01 16:39:57 +0000228 /* Relink at end of new list. */
229 new_prev = node->gc.gc_prev = list->gc.gc_prev;
Tim Peterse2d59182004-11-01 01:39:08 +0000230 new_prev->gc.gc_next = list->gc.gc_prev = node;
Tim Petersbc1d1b82004-11-01 16:39:57 +0000231 node->gc.gc_next = list;
Tim Peterse2d59182004-11-01 01:39:08 +0000232}
233
234/* append list `from` onto list `to`; `from` becomes an empty list */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000235static void
236gc_list_merge(PyGC_Head *from, PyGC_Head *to)
237{
238 PyGC_Head *tail;
Tim Peterse2d59182004-11-01 01:39:08 +0000239 assert(from != to);
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000240 if (!gc_list_is_empty(from)) {
Tim Peters9e4ca102001-10-11 18:31:31 +0000241 tail = to->gc.gc_prev;
242 tail->gc.gc_next = from->gc.gc_next;
243 tail->gc.gc_next->gc.gc_prev = tail;
244 to->gc.gc_prev = from->gc.gc_prev;
245 to->gc.gc_prev->gc.gc_next = to;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000246 }
247 gc_list_init(from);
248}
249
Neal Norwitz7b216c52006-03-04 20:01:53 +0000250static Py_ssize_t
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000251gc_list_size(PyGC_Head *list)
252{
253 PyGC_Head *gc;
Neal Norwitz7b216c52006-03-04 20:01:53 +0000254 Py_ssize_t n = 0;
Tim Peters9e4ca102001-10-11 18:31:31 +0000255 for (gc = list->gc.gc_next; gc != list; gc = gc->gc.gc_next) {
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000256 n++;
257 }
258 return n;
259}
260
Tim Peters259272b2003-04-06 19:41:39 +0000261/* Append objects in a GC list to a Python list.
262 * Return 0 if all OK, < 0 if error (out of memory for list).
263 */
264static int
265append_objects(PyObject *py_list, PyGC_Head *gc_list)
266{
267 PyGC_Head *gc;
268 for (gc = gc_list->gc.gc_next; gc != gc_list; gc = gc->gc.gc_next) {
269 PyObject *op = FROM_GC(gc);
270 if (op != py_list) {
271 if (PyList_Append(py_list, op)) {
272 return -1; /* exception */
273 }
274 }
275 }
276 return 0;
277}
278
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000279/*** end of list stuff ***/
280
281
Tim Peters19b74c72002-07-01 03:52:19 +0000282/* Set all gc_refs = ob_refcnt. After this, gc_refs is > 0 for all objects
283 * in containers, and is GC_REACHABLE for all tracked gc objects not in
284 * containers.
Tim Peters88396172002-06-30 17:56:40 +0000285 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000286static void
287update_refs(PyGC_Head *containers)
288{
Tim Peters9e4ca102001-10-11 18:31:31 +0000289 PyGC_Head *gc = containers->gc.gc_next;
Tim Petersea405632002-07-02 00:52:30 +0000290 for (; gc != containers; gc = gc->gc.gc_next) {
291 assert(gc->gc.gc_refs == GC_REACHABLE);
Christian Heimese93237d2007-12-19 02:37:44 +0000292 gc->gc.gc_refs = Py_REFCNT(FROM_GC(gc));
Tim Peters780c4972003-11-14 00:01:17 +0000293 /* Python's cyclic gc should never see an incoming refcount
294 * of 0: if something decref'ed to 0, it should have been
295 * deallocated immediately at that time.
296 * Possible cause (if the assert triggers): a tp_dealloc
297 * routine left a gc-aware object tracked during its teardown
298 * phase, and did something-- or allowed something to happen --
299 * that called back into Python. gc can trigger then, and may
300 * see the still-tracked dying object. Before this assert
301 * was added, such mistakes went on to allow gc to try to
302 * delete the object again. In a debug build, that caused
303 * a mysterious segfault, when _Py_ForgetReference tried
304 * to remove the object from the doubly-linked list of all
305 * objects a second time. In a release build, an actual
306 * double deallocation occurred, which leads to corruption
307 * of the allocator's internal bookkeeping pointers. That's
308 * so serious that maybe this should be a release-build
309 * check instead of an assert?
310 */
311 assert(gc->gc.gc_refs != 0);
Tim Petersea405632002-07-02 00:52:30 +0000312 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000313}
314
Tim Peters19b74c72002-07-01 03:52:19 +0000315/* A traversal callback for subtract_refs. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000316static int
317visit_decref(PyObject *op, void *data)
318{
Tim Peters93cd83e2002-06-30 21:31:03 +0000319 assert(op != NULL);
Tim Peters19b74c72002-07-01 03:52:19 +0000320 if (PyObject_IS_GC(op)) {
321 PyGC_Head *gc = AS_GC(op);
322 /* We're only interested in gc_refs for objects in the
323 * generation being collected, which can be recognized
324 * because only they have positive gc_refs.
325 */
Tim Petersaab713b2002-07-02 22:15:28 +0000326 assert(gc->gc.gc_refs != 0); /* else refcount was too small */
Tim Peters19b74c72002-07-01 03:52:19 +0000327 if (gc->gc.gc_refs > 0)
328 gc->gc.gc_refs--;
329 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000330 return 0;
331}
332
Tim Peters19b74c72002-07-01 03:52:19 +0000333/* Subtract internal references from gc_refs. After this, gc_refs is >= 0
334 * for all objects in containers, and is GC_REACHABLE for all tracked gc
335 * objects not in containers. The ones with gc_refs > 0 are directly
336 * reachable from outside containers, and so can't be collected.
337 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000338static void
339subtract_refs(PyGC_Head *containers)
340{
341 traverseproc traverse;
Tim Peters9e4ca102001-10-11 18:31:31 +0000342 PyGC_Head *gc = containers->gc.gc_next;
343 for (; gc != containers; gc=gc->gc.gc_next) {
Christian Heimese93237d2007-12-19 02:37:44 +0000344 traverse = Py_TYPE(FROM_GC(gc))->tp_traverse;
Neil Schemenauer43411b52001-08-30 00:05:51 +0000345 (void) traverse(FROM_GC(gc),
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000346 (visitproc)visit_decref,
347 NULL);
348 }
349}
350
Tim Peters19b74c72002-07-01 03:52:19 +0000351/* A traversal callback for move_unreachable. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000352static int
Tim Peters19b74c72002-07-01 03:52:19 +0000353visit_reachable(PyObject *op, PyGC_Head *reachable)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000354{
Tim Petersea405632002-07-02 00:52:30 +0000355 if (PyObject_IS_GC(op)) {
Tim Peters19b74c72002-07-01 03:52:19 +0000356 PyGC_Head *gc = AS_GC(op);
Martin v. Löwis6db0e002006-03-01 16:56:25 +0000357 const Py_ssize_t gc_refs = gc->gc.gc_refs;
Tim Peters19b74c72002-07-01 03:52:19 +0000358
359 if (gc_refs == 0) {
360 /* This is in move_unreachable's 'young' list, but
361 * the traversal hasn't yet gotten to it. All
362 * we need to do is tell move_unreachable that it's
363 * reachable.
364 */
365 gc->gc.gc_refs = 1;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000366 }
Tim Peters19b74c72002-07-01 03:52:19 +0000367 else if (gc_refs == GC_TENTATIVELY_UNREACHABLE) {
368 /* This had gc_refs = 0 when move_unreachable got
369 * to it, but turns out it's reachable after all.
370 * Move it back to move_unreachable's 'young' list,
371 * and move_unreachable will eventually get to it
372 * again.
373 */
Tim Peterse2d59182004-11-01 01:39:08 +0000374 gc_list_move(gc, reachable);
Tim Peters19b74c72002-07-01 03:52:19 +0000375 gc->gc.gc_refs = 1;
376 }
377 /* Else there's nothing to do.
378 * If gc_refs > 0, it must be in move_unreachable's 'young'
379 * list, and move_unreachable will eventually get to it.
380 * If gc_refs == GC_REACHABLE, it's either in some other
381 * generation so we don't care about it, or move_unreachable
Tim Peters6fc13d92002-07-02 18:12:35 +0000382 * already dealt with it.
Tim Petersea405632002-07-02 00:52:30 +0000383 * If gc_refs == GC_UNTRACKED, it must be ignored.
Tim Peters19b74c72002-07-01 03:52:19 +0000384 */
Tim Petersea405632002-07-02 00:52:30 +0000385 else {
386 assert(gc_refs > 0
387 || gc_refs == GC_REACHABLE
388 || gc_refs == GC_UNTRACKED);
389 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000390 }
391 return 0;
392}
393
Tim Peters19b74c72002-07-01 03:52:19 +0000394/* Move the unreachable objects from young to unreachable. After this,
395 * all objects in young have gc_refs = GC_REACHABLE, and all objects in
396 * unreachable have gc_refs = GC_TENTATIVELY_UNREACHABLE. All tracked
397 * gc objects not in young or unreachable still have gc_refs = GC_REACHABLE.
398 * All objects in young after this are directly or indirectly reachable
399 * from outside the original young; and all objects in unreachable are
400 * not.
Tim Peters88396172002-06-30 17:56:40 +0000401 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000402static void
Tim Peters19b74c72002-07-01 03:52:19 +0000403move_unreachable(PyGC_Head *young, PyGC_Head *unreachable)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000404{
Tim Peters19b74c72002-07-01 03:52:19 +0000405 PyGC_Head *gc = young->gc.gc_next;
406
407 /* Invariants: all objects "to the left" of us in young have gc_refs
408 * = GC_REACHABLE, and are indeed reachable (directly or indirectly)
409 * from outside the young list as it was at entry. All other objects
410 * from the original young "to the left" of us are in unreachable now,
411 * and have gc_refs = GC_TENTATIVELY_UNREACHABLE. All objects to the
412 * left of us in 'young' now have been scanned, and no objects here
413 * or to the right have been scanned yet.
414 */
415
416 while (gc != young) {
417 PyGC_Head *next;
418
Tim Peters6fc13d92002-07-02 18:12:35 +0000419 if (gc->gc.gc_refs) {
420 /* gc is definitely reachable from outside the
421 * original 'young'. Mark it as such, and traverse
422 * its pointers to find any other objects that may
423 * be directly reachable from it. Note that the
424 * call to tp_traverse may append objects to young,
425 * so we have to wait until it returns to determine
426 * the next object to visit.
427 */
428 PyObject *op = FROM_GC(gc);
Christian Heimese93237d2007-12-19 02:37:44 +0000429 traverseproc traverse = Py_TYPE(op)->tp_traverse;
Tim Peters6fc13d92002-07-02 18:12:35 +0000430 assert(gc->gc.gc_refs > 0);
431 gc->gc.gc_refs = GC_REACHABLE;
432 (void) traverse(op,
433 (visitproc)visit_reachable,
434 (void *)young);
435 next = gc->gc.gc_next;
436 }
437 else {
Tim Peters19b74c72002-07-01 03:52:19 +0000438 /* This *may* be unreachable. To make progress,
439 * assume it is. gc isn't directly reachable from
440 * any object we've already traversed, but may be
441 * reachable from an object we haven't gotten to yet.
442 * visit_reachable will eventually move gc back into
443 * young if that's so, and we'll see it again.
444 */
445 next = gc->gc.gc_next;
Tim Peterse2d59182004-11-01 01:39:08 +0000446 gc_list_move(gc, unreachable);
Tim Peters19b74c72002-07-01 03:52:19 +0000447 gc->gc.gc_refs = GC_TENTATIVELY_UNREACHABLE;
448 }
Tim Peters19b74c72002-07-01 03:52:19 +0000449 gc = next;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000450 }
451}
452
Tim Peters86b993b2003-04-05 17:35:54 +0000453/* Return true if object has a finalization method.
454 * CAUTION: An instance of an old-style class has to be checked for a
Tim Petersf6b80452003-04-07 19:21:15 +0000455 *__del__ method, and earlier versions of this used to call PyObject_HasAttr,
456 * which in turn could call the class's __getattr__ hook (if any). That
457 * could invoke arbitrary Python code, mutating the object graph in arbitrary
458 * ways, and that was the source of some excruciatingly subtle bugs.
Tim Peters86b993b2003-04-05 17:35:54 +0000459 */
Neil Schemenauera765c122001-11-01 17:35:23 +0000460static int
461has_finalizer(PyObject *op)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000462{
Tim Peters86b993b2003-04-05 17:35:54 +0000463 if (PyInstance_Check(op)) {
Tim Peters86b993b2003-04-05 17:35:54 +0000464 assert(delstr != NULL);
Tim Petersf6b80452003-04-07 19:21:15 +0000465 return _PyInstance_Lookup(op, delstr) != NULL;
Tim Peters86b993b2003-04-05 17:35:54 +0000466 }
Phillip J. Eby2ba96612006-04-10 17:51:05 +0000467 else if (PyType_HasFeature(op->ob_type, Py_TPFLAGS_HEAPTYPE))
Tim Peters86b993b2003-04-05 17:35:54 +0000468 return op->ob_type->tp_del != NULL;
Phillip J. Eby2ba96612006-04-10 17:51:05 +0000469 else if (PyGen_CheckExact(op))
470 return PyGen_NeedsFinalizing((PyGenObject *)op);
471 else
472 return 0;
Neil Schemenauera765c122001-11-01 17:35:23 +0000473}
474
Tim Petersead8b7a2004-10-30 23:09:22 +0000475/* Move the objects in unreachable with __del__ methods into `finalizers`.
476 * Objects moved into `finalizers` have gc_refs set to GC_REACHABLE; the
477 * objects remaining in unreachable are left at GC_TENTATIVELY_UNREACHABLE.
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000478 */
Neil Schemenauera765c122001-11-01 17:35:23 +0000479static void
Tim Petersead8b7a2004-10-30 23:09:22 +0000480move_finalizers(PyGC_Head *unreachable, PyGC_Head *finalizers)
Neil Schemenauera765c122001-11-01 17:35:23 +0000481{
Tim Petersead8b7a2004-10-30 23:09:22 +0000482 PyGC_Head *gc;
483 PyGC_Head *next;
Tim Petersf6b80452003-04-07 19:21:15 +0000484
Tim Petersead8b7a2004-10-30 23:09:22 +0000485 /* March over unreachable. Move objects with finalizers into
486 * `finalizers`.
487 */
488 for (gc = unreachable->gc.gc_next; gc != unreachable; gc = next) {
Neil Schemenauer43411b52001-08-30 00:05:51 +0000489 PyObject *op = FROM_GC(gc);
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000490
Tim Petersf6ae7a42003-04-05 18:40:50 +0000491 assert(IS_TENTATIVELY_UNREACHABLE(op));
Tim Petersead8b7a2004-10-30 23:09:22 +0000492 next = gc->gc.gc_next;
Tim Petersf6ae7a42003-04-05 18:40:50 +0000493
Tim Petersf6b80452003-04-07 19:21:15 +0000494 if (has_finalizer(op)) {
Tim Peterse2d59182004-11-01 01:39:08 +0000495 gc_list_move(gc, finalizers);
Tim Petersf6b80452003-04-07 19:21:15 +0000496 gc->gc.gc_refs = GC_REACHABLE;
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000497 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000498 }
499}
500
Tim Peters19b74c72002-07-01 03:52:19 +0000501/* A traversal callback for move_finalizer_reachable. */
502static int
503visit_move(PyObject *op, PyGC_Head *tolist)
504{
505 if (PyObject_IS_GC(op)) {
Tim Petersea405632002-07-02 00:52:30 +0000506 if (IS_TENTATIVELY_UNREACHABLE(op)) {
Tim Peters19b74c72002-07-01 03:52:19 +0000507 PyGC_Head *gc = AS_GC(op);
Tim Peterse2d59182004-11-01 01:39:08 +0000508 gc_list_move(gc, tolist);
Tim Peters19b74c72002-07-01 03:52:19 +0000509 gc->gc.gc_refs = GC_REACHABLE;
510 }
511 }
512 return 0;
513}
514
515/* Move objects that are reachable from finalizers, from the unreachable set
Tim Petersf6b80452003-04-07 19:21:15 +0000516 * into finalizers set.
Tim Peters19b74c72002-07-01 03:52:19 +0000517 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000518static void
Tim Petersf6b80452003-04-07 19:21:15 +0000519move_finalizer_reachable(PyGC_Head *finalizers)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000520{
521 traverseproc traverse;
Tim Peters9e4ca102001-10-11 18:31:31 +0000522 PyGC_Head *gc = finalizers->gc.gc_next;
Tim Petersbf384c22003-04-06 00:11:39 +0000523 for (; gc != finalizers; gc = gc->gc.gc_next) {
524 /* Note that the finalizers list may grow during this. */
Christian Heimese93237d2007-12-19 02:37:44 +0000525 traverse = Py_TYPE(FROM_GC(gc))->tp_traverse;
Tim Peters88396172002-06-30 17:56:40 +0000526 (void) traverse(FROM_GC(gc),
Tim Petersbf384c22003-04-06 00:11:39 +0000527 (visitproc)visit_move,
Tim Petersf6b80452003-04-07 19:21:15 +0000528 (void *)finalizers);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000529 }
530}
531
Tim Petersead8b7a2004-10-30 23:09:22 +0000532/* Clear all weakrefs to unreachable objects, and if such a weakref has a
533 * callback, invoke it if necessary. Note that it's possible for such
534 * weakrefs to be outside the unreachable set -- indeed, those are precisely
535 * the weakrefs whose callbacks must be invoked. See gc_weakref.txt for
536 * overview & some details. Some weakrefs with callbacks may be reclaimed
537 * directly by this routine; the number reclaimed is the return value. Other
538 * weakrefs with callbacks may be moved into the `old` generation. Objects
539 * moved into `old` have gc_refs set to GC_REACHABLE; the objects remaining in
540 * unreachable are left at GC_TENTATIVELY_UNREACHABLE. When this returns,
541 * no object in `unreachable` is weakly referenced anymore.
Tim Peters403a2032003-11-20 21:21:46 +0000542 */
543static int
Tim Petersead8b7a2004-10-30 23:09:22 +0000544handle_weakrefs(PyGC_Head *unreachable, PyGC_Head *old)
Tim Peters403a2032003-11-20 21:21:46 +0000545{
Tim Petersead8b7a2004-10-30 23:09:22 +0000546 PyGC_Head *gc;
547 PyObject *op; /* generally FROM_GC(gc) */
548 PyWeakReference *wr; /* generally a cast of op */
Tim Petersead8b7a2004-10-30 23:09:22 +0000549 PyGC_Head wrcb_to_call; /* weakrefs with callbacks to call */
Tim Petersead8b7a2004-10-30 23:09:22 +0000550 PyGC_Head *next;
Tim Peters403a2032003-11-20 21:21:46 +0000551 int num_freed = 0;
552
Tim Petersead8b7a2004-10-30 23:09:22 +0000553 gc_list_init(&wrcb_to_call);
Tim Peters403a2032003-11-20 21:21:46 +0000554
Tim Petersead8b7a2004-10-30 23:09:22 +0000555 /* Clear all weakrefs to the objects in unreachable. If such a weakref
556 * also has a callback, move it into `wrcb_to_call` if the callback
Tim Peterscc2a8662004-10-31 22:12:43 +0000557 * needs to be invoked. Note that we cannot invoke any callbacks until
558 * all weakrefs to unreachable objects are cleared, lest the callback
559 * resurrect an unreachable object via a still-active weakref. We
560 * make another pass over wrcb_to_call, invoking callbacks, after this
561 * pass completes.
Tim Petersead8b7a2004-10-30 23:09:22 +0000562 */
563 for (gc = unreachable->gc.gc_next; gc != unreachable; gc = next) {
564 PyWeakReference **wrlist;
565
566 op = FROM_GC(gc);
567 assert(IS_TENTATIVELY_UNREACHABLE(op));
568 next = gc->gc.gc_next;
569
Christian Heimese93237d2007-12-19 02:37:44 +0000570 if (! PyType_SUPPORTS_WEAKREFS(Py_TYPE(op)))
Tim Petersead8b7a2004-10-30 23:09:22 +0000571 continue;
572
573 /* It supports weakrefs. Does it have any? */
574 wrlist = (PyWeakReference **)
575 PyObject_GET_WEAKREFS_LISTPTR(op);
576
577 /* `op` may have some weakrefs. March over the list, clear
578 * all the weakrefs, and move the weakrefs with callbacks
Tim Peterscc2a8662004-10-31 22:12:43 +0000579 * that must be called into wrcb_to_call.
Tim Petersead8b7a2004-10-30 23:09:22 +0000580 */
581 for (wr = *wrlist; wr != NULL; wr = *wrlist) {
582 PyGC_Head *wrasgc; /* AS_GC(wr) */
583
584 /* _PyWeakref_ClearRef clears the weakref but leaves
585 * the callback pointer intact. Obscure: it also
586 * changes *wrlist.
587 */
588 assert(wr->wr_object == op);
589 _PyWeakref_ClearRef(wr);
590 assert(wr->wr_object == Py_None);
591 if (wr->wr_callback == NULL)
592 continue; /* no callback */
593
594 /* Headache time. `op` is going away, and is weakly referenced by
595 * `wr`, which has a callback. Should the callback be invoked? If wr
596 * is also trash, no:
597 *
598 * 1. There's no need to call it. The object and the weakref are
599 * both going away, so it's legitimate to pretend the weakref is
600 * going away first. The user has to ensure a weakref outlives its
601 * referent if they want a guarantee that the wr callback will get
602 * invoked.
603 *
604 * 2. It may be catastrophic to call it. If the callback is also in
605 * cyclic trash (CT), then although the CT is unreachable from
606 * outside the current generation, CT may be reachable from the
607 * callback. Then the callback could resurrect insane objects.
608 *
609 * Since the callback is never needed and may be unsafe in this case,
Tim Peterscc2a8662004-10-31 22:12:43 +0000610 * wr is simply left in the unreachable set. Note that because we
611 * already called _PyWeakref_ClearRef(wr), its callback will never
612 * trigger.
Tim Petersead8b7a2004-10-30 23:09:22 +0000613 *
614 * OTOH, if wr isn't part of CT, we should invoke the callback: the
615 * weakref outlived the trash. Note that since wr isn't CT in this
616 * case, its callback can't be CT either -- wr acted as an external
617 * root to this generation, and therefore its callback did too. So
618 * nothing in CT is reachable from the callback either, so it's hard
619 * to imagine how calling it later could create a problem for us. wr
620 * is moved to wrcb_to_call in this case.
Tim Petersead8b7a2004-10-30 23:09:22 +0000621 */
Tim Peterscc2a8662004-10-31 22:12:43 +0000622 if (IS_TENTATIVELY_UNREACHABLE(wr))
623 continue;
624 assert(IS_REACHABLE(wr));
625
Tim Petersead8b7a2004-10-30 23:09:22 +0000626 /* Create a new reference so that wr can't go away
627 * before we can process it again.
628 */
629 Py_INCREF(wr);
630
Tim Peterscc2a8662004-10-31 22:12:43 +0000631 /* Move wr to wrcb_to_call, for the next pass. */
Tim Petersead8b7a2004-10-30 23:09:22 +0000632 wrasgc = AS_GC(wr);
Tim Peterscc2a8662004-10-31 22:12:43 +0000633 assert(wrasgc != next); /* wrasgc is reachable, but
634 next isn't, so they can't
635 be the same */
Tim Peterse2d59182004-11-01 01:39:08 +0000636 gc_list_move(wrasgc, &wrcb_to_call);
Tim Petersead8b7a2004-10-30 23:09:22 +0000637 }
638 }
639
Tim Peterscc2a8662004-10-31 22:12:43 +0000640 /* Invoke the callbacks we decided to honor. It's safe to invoke them
641 * because they can't reference unreachable objects.
Tim Petersead8b7a2004-10-30 23:09:22 +0000642 */
643 while (! gc_list_is_empty(&wrcb_to_call)) {
644 PyObject *temp;
645 PyObject *callback;
646
647 gc = wrcb_to_call.gc.gc_next;
648 op = FROM_GC(gc);
649 assert(IS_REACHABLE(op));
650 assert(PyWeakref_Check(op));
651 wr = (PyWeakReference *)op;
652 callback = wr->wr_callback;
653 assert(callback != NULL);
654
655 /* copy-paste of weakrefobject.c's handle_callback() */
Georg Brandl684fd0c2006-05-25 19:15:31 +0000656 temp = PyObject_CallFunctionObjArgs(callback, wr, NULL);
Tim Petersead8b7a2004-10-30 23:09:22 +0000657 if (temp == NULL)
658 PyErr_WriteUnraisable(callback);
659 else
660 Py_DECREF(temp);
661
662 /* Give up the reference we created in the first pass. When
663 * op's refcount hits 0 (which it may or may not do right now),
Tim Peterscc2a8662004-10-31 22:12:43 +0000664 * op's tp_dealloc will decref op->wr_callback too. Note
665 * that the refcount probably will hit 0 now, and because this
666 * weakref was reachable to begin with, gc didn't already
667 * add it to its count of freed objects. Example: a reachable
668 * weak value dict maps some key to this reachable weakref.
669 * The callback removes this key->weakref mapping from the
670 * dict, leaving no other references to the weakref (excepting
671 * ours).
Tim Petersead8b7a2004-10-30 23:09:22 +0000672 */
673 Py_DECREF(op);
674 if (wrcb_to_call.gc.gc_next == gc) {
675 /* object is still alive -- move it */
Tim Peterse2d59182004-11-01 01:39:08 +0000676 gc_list_move(gc, old);
Tim Petersead8b7a2004-10-30 23:09:22 +0000677 }
678 else
679 ++num_freed;
680 }
681
Tim Peters403a2032003-11-20 21:21:46 +0000682 return num_freed;
683}
684
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000685static void
Jeremy Hylton06257772000-08-31 15:10:24 +0000686debug_instance(char *msg, PyInstanceObject *inst)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000687{
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000688 char *cname;
Neil Schemenauera765c122001-11-01 17:35:23 +0000689 /* simple version of instance_repr */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000690 PyObject *classname = inst->in_class->cl_name;
Gregory P. Smithdd96db62008-06-09 04:58:54 +0000691 if (classname != NULL && PyString_Check(classname))
692 cname = PyString_AsString(classname);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000693 else
694 cname = "?";
Jeremy Hylton06257772000-08-31 15:10:24 +0000695 PySys_WriteStderr("gc: %.100s <%.100s instance at %p>\n",
696 msg, cname, inst);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000697}
698
699static void
Jeremy Hylton06257772000-08-31 15:10:24 +0000700debug_cycle(char *msg, PyObject *op)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000701{
702 if ((debug & DEBUG_INSTANCES) && PyInstance_Check(op)) {
Jeremy Hylton06257772000-08-31 15:10:24 +0000703 debug_instance(msg, (PyInstanceObject *)op);
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000704 }
705 else if (debug & DEBUG_OBJECTS) {
Jeremy Hylton06257772000-08-31 15:10:24 +0000706 PySys_WriteStderr("gc: %.100s <%.100s %p>\n",
Christian Heimese93237d2007-12-19 02:37:44 +0000707 msg, Py_TYPE(op)->tp_name, op);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000708 }
709}
710
Tim Petersbf384c22003-04-06 00:11:39 +0000711/* Handle uncollectable garbage (cycles with finalizers, and stuff reachable
712 * only from such cycles).
Tim Petersf6b80452003-04-07 19:21:15 +0000713 * If DEBUG_SAVEALL, all objects in finalizers are appended to the module
714 * garbage list (a Python list), else only the objects in finalizers with
715 * __del__ methods are appended to garbage. All objects in finalizers are
716 * merged into the old list regardless.
Tim Peters259272b2003-04-06 19:41:39 +0000717 * Returns 0 if all OK, <0 on error (out of memory to grow the garbage list).
718 * The finalizers list is made empty on a successful return.
Tim Petersbf384c22003-04-06 00:11:39 +0000719 */
Tim Peters259272b2003-04-06 19:41:39 +0000720static int
Tim Petersf6b80452003-04-07 19:21:15 +0000721handle_finalizers(PyGC_Head *finalizers, PyGC_Head *old)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000722{
Tim Petersf6b80452003-04-07 19:21:15 +0000723 PyGC_Head *gc = finalizers->gc.gc_next;
724
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000725 if (garbage == NULL) {
726 garbage = PyList_New(0);
Tim Petersbf384c22003-04-06 00:11:39 +0000727 if (garbage == NULL)
728 Py_FatalError("gc couldn't create gc.garbage list");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000729 }
Tim Petersf6b80452003-04-07 19:21:15 +0000730 for (; gc != finalizers; gc = gc->gc.gc_next) {
731 PyObject *op = FROM_GC(gc);
732
733 if ((debug & DEBUG_SAVEALL) || has_finalizer(op)) {
734 if (PyList_Append(garbage, op) < 0)
735 return -1;
736 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000737 }
Tim Petersf6b80452003-04-07 19:21:15 +0000738
Tim Peters259272b2003-04-06 19:41:39 +0000739 gc_list_merge(finalizers, old);
740 return 0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000741}
742
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000743/* Break reference cycles by clearing the containers involved. This is
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000744 * tricky business as the lists can be changing and we don't know which
Tim Peters19b74c72002-07-01 03:52:19 +0000745 * objects may be freed. It is possible I screwed something up here.
746 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000747static void
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000748delete_garbage(PyGC_Head *collectable, PyGC_Head *old)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000749{
750 inquiry clear;
751
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000752 while (!gc_list_is_empty(collectable)) {
753 PyGC_Head *gc = collectable->gc.gc_next;
Neil Schemenauer43411b52001-08-30 00:05:51 +0000754 PyObject *op = FROM_GC(gc);
Tim Peters88396172002-06-30 17:56:40 +0000755
Tim Peters19b74c72002-07-01 03:52:19 +0000756 assert(IS_TENTATIVELY_UNREACHABLE(op));
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000757 if (debug & DEBUG_SAVEALL) {
758 PyList_Append(garbage, op);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000759 }
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000760 else {
Christian Heimese93237d2007-12-19 02:37:44 +0000761 if ((clear = Py_TYPE(op)->tp_clear) != NULL) {
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000762 Py_INCREF(op);
Jeremy Hylton8a135182002-06-06 23:23:55 +0000763 clear(op);
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000764 Py_DECREF(op);
765 }
766 }
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000767 if (collectable->gc.gc_next == gc) {
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000768 /* object is still alive, move it, it may die later */
Tim Peterse2d59182004-11-01 01:39:08 +0000769 gc_list_move(gc, old);
Tim Peters19b74c72002-07-01 03:52:19 +0000770 gc->gc.gc_refs = GC_REACHABLE;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000771 }
772 }
773}
774
/* Empty every per-type free list.
 * Called while collecting the highest generation.  Items parked on a free
 * list may keep a pymalloc arena occupied, so dropping them may let memory
 * be handed back to the OS earlier.  The return value of each clearing
 * function is deliberately ignored.
 */
static void
clear_freelists(void)
{
    (void)PyMethod_ClearFreeList();
    (void)PyFrame_ClearFreeList();
    (void)PyCFunction_ClearFreeList();
    (void)PyTuple_ClearFreeList();
    (void)PyUnicode_ClearFreeList();
    (void)PyInt_ClearFreeList();
    (void)PyFloat_ClearFreeList();
}
791
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000792static double
793get_time(void)
794{
795 double result = 0;
796 if (tmod != NULL) {
797 PyObject *f = PyObject_CallMethod(tmod, "time", NULL);
798 if (f == NULL) {
799 PyErr_Clear();
800 }
801 else {
802 if (PyFloat_Check(f))
803 result = PyFloat_AsDouble(f);
804 Py_DECREF(f);
805 }
806 }
807 return result;
808}
809
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000810/* This is the main function. Read this to understand how the
811 * collection process works. */
Neal Norwitz7b216c52006-03-04 20:01:53 +0000812static Py_ssize_t
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000813collect(int generation)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000814{
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000815 int i;
Neal Norwitz7b216c52006-03-04 20:01:53 +0000816 Py_ssize_t m = 0; /* # objects collected */
817 Py_ssize_t n = 0; /* # unreachable objects that couldn't be collected */
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000818 PyGC_Head *young; /* the generation we are examining */
819 PyGC_Head *old; /* next older generation */
Tim Peters403a2032003-11-20 21:21:46 +0000820 PyGC_Head unreachable; /* non-problematic unreachable trash */
821 PyGC_Head finalizers; /* objects with, & reachable from, __del__ */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000822 PyGC_Head *gc;
Skip Montanaroc34b9312006-04-21 01:33:40 +0000823 double t1 = 0.0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000824
Tim Peters93ad66d2003-04-05 17:15:44 +0000825 if (delstr == NULL) {
Gregory P. Smithdd96db62008-06-09 04:58:54 +0000826 delstr = PyString_InternFromString("__del__");
Tim Peters93ad66d2003-04-05 17:15:44 +0000827 if (delstr == NULL)
828 Py_FatalError("gc couldn't allocate \"__del__\"");
829 }
830
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000831 if (debug & DEBUG_STATS) {
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000832 t1 = get_time();
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000833 PySys_WriteStderr("gc: collecting generation %d...\n",
834 generation);
835 PySys_WriteStderr("gc: objects in each generation:");
Tim Peters62e97f02006-03-28 21:44:32 +0000836 for (i = 0; i < NUM_GENERATIONS; i++)
837 PySys_WriteStderr(" %" PY_FORMAT_SIZE_T "d",
838 gc_list_size(GEN_HEAD(i)));
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000839 PySys_WriteStderr("\n");
840 }
841
842 /* update collection and allocation counters */
843 if (generation+1 < NUM_GENERATIONS)
844 generations[generation+1].count += 1;
845 for (i = 0; i <= generation; i++)
Neil Schemenauerc9051642002-06-28 19:16:04 +0000846 generations[i].count = 0;
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000847
848 /* merge younger generations with one we are currently collecting */
849 for (i = 0; i < generation; i++) {
850 gc_list_merge(GEN_HEAD(i), GEN_HEAD(generation));
851 }
852
853 /* handy references */
854 young = GEN_HEAD(generation);
Tim Peters19b74c72002-07-01 03:52:19 +0000855 if (generation < NUM_GENERATIONS-1)
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000856 old = GEN_HEAD(generation+1);
Tim Peters19b74c72002-07-01 03:52:19 +0000857 else
858 old = young;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000859
860 /* Using ob_refcnt and gc_refs, calculate which objects in the
Tim Petersead8b7a2004-10-30 23:09:22 +0000861 * container set are reachable from outside the set (i.e., have a
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000862 * refcount greater than 0 when all the references within the
Tim Petersead8b7a2004-10-30 23:09:22 +0000863 * set are taken into account).
Tim Peters19b74c72002-07-01 03:52:19 +0000864 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000865 update_refs(young);
866 subtract_refs(young);
867
Tim Peters19b74c72002-07-01 03:52:19 +0000868 /* Leave everything reachable from outside young in young, and move
869 * everything else (in young) to unreachable.
870 * NOTE: This used to move the reachable objects into a reachable
871 * set instead. But most things usually turn out to be reachable,
872 * so it's more efficient to move the unreachable things.
873 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000874 gc_list_init(&unreachable);
Tim Peters19b74c72002-07-01 03:52:19 +0000875 move_unreachable(young, &unreachable);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000876
Tim Peters19b74c72002-07-01 03:52:19 +0000877 /* Move reachable objects to next generation. */
Antoine Pitrou4c5ecb72009-01-09 21:40:55 +0000878 if (young != old) {
879 if (generation == NUM_GENERATIONS - 2) {
880 long_lived_pending += gc_list_size(young);
881 }
Tim Peters19b74c72002-07-01 03:52:19 +0000882 gc_list_merge(young, old);
Antoine Pitrou4c5ecb72009-01-09 21:40:55 +0000883 }
884 else {
885 long_lived_pending = 0;
886 long_lived_total = gc_list_size(young);
887 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000888
Tim Peters19b74c72002-07-01 03:52:19 +0000889 /* All objects in unreachable are trash, but objects reachable from
890 * finalizers can't safely be deleted. Python programmers should take
891 * care not to create such things. For Python, finalizers means
Tim Peters403a2032003-11-20 21:21:46 +0000892 * instance objects with __del__ methods. Weakrefs with callbacks
Tim Petersead8b7a2004-10-30 23:09:22 +0000893 * can also call arbitrary Python code but they will be dealt with by
894 * handle_weakrefs().
Tim Petersf6b80452003-04-07 19:21:15 +0000895 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000896 gc_list_init(&finalizers);
Tim Petersead8b7a2004-10-30 23:09:22 +0000897 move_finalizers(&unreachable, &finalizers);
Tim Petersbf384c22003-04-06 00:11:39 +0000898 /* finalizers contains the unreachable objects with a finalizer;
Tim Peters403a2032003-11-20 21:21:46 +0000899 * unreachable objects reachable *from* those are also uncollectable,
900 * and we move those into the finalizers list too.
Tim Petersbf384c22003-04-06 00:11:39 +0000901 */
Tim Petersf6b80452003-04-07 19:21:15 +0000902 move_finalizer_reachable(&finalizers);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000903
904 /* Collect statistics on collectable objects found and print
Tim Peters403a2032003-11-20 21:21:46 +0000905 * debugging information.
906 */
Tim Petersf6b80452003-04-07 19:21:15 +0000907 for (gc = unreachable.gc.gc_next; gc != &unreachable;
Tim Peters9e4ca102001-10-11 18:31:31 +0000908 gc = gc->gc.gc_next) {
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000909 m++;
Jeremy Hylton06257772000-08-31 15:10:24 +0000910 if (debug & DEBUG_COLLECTABLE) {
Neil Schemenauer43411b52001-08-30 00:05:51 +0000911 debug_cycle("collectable", FROM_GC(gc));
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000912 }
913 }
Tim Petersead8b7a2004-10-30 23:09:22 +0000914
915 /* Clear weakrefs and invoke callbacks as necessary. */
916 m += handle_weakrefs(&unreachable, old);
917
Tim Petersfb2ab4d2003-04-07 22:41:24 +0000918 /* Call tp_clear on objects in the unreachable set. This will cause
919 * the reference cycles to be broken. It may also cause some objects
920 * in finalizers to be freed.
921 */
Tim Petersf6b80452003-04-07 19:21:15 +0000922 delete_garbage(&unreachable, old);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000923
924 /* Collect statistics on uncollectable objects found and print
925 * debugging information. */
Tim Peters50c61d52003-04-06 01:50:50 +0000926 for (gc = finalizers.gc.gc_next;
Tim Petersbf384c22003-04-06 00:11:39 +0000927 gc != &finalizers;
928 gc = gc->gc.gc_next) {
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000929 n++;
Tim Petersbf384c22003-04-06 00:11:39 +0000930 if (debug & DEBUG_UNCOLLECTABLE)
Neil Schemenauer43411b52001-08-30 00:05:51 +0000931 debug_cycle("uncollectable", FROM_GC(gc));
Tim Petersbf384c22003-04-06 00:11:39 +0000932 }
Jeremy Hylton06257772000-08-31 15:10:24 +0000933 if (debug & DEBUG_STATS) {
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000934 double t2 = get_time();
Tim Peters62e97f02006-03-28 21:44:32 +0000935 if (m == 0 && n == 0)
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000936 PySys_WriteStderr("gc: done");
Tim Peters62e97f02006-03-28 21:44:32 +0000937 else
Neal Norwitze22373d2006-03-06 23:31:56 +0000938 PySys_WriteStderr(
Tim Peters62e97f02006-03-28 21:44:32 +0000939 "gc: done, "
940 "%" PY_FORMAT_SIZE_T "d unreachable, "
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000941 "%" PY_FORMAT_SIZE_T "d uncollectable",
Neal Norwitze22373d2006-03-06 23:31:56 +0000942 n+m, n);
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000943 if (t1 && t2) {
944 PySys_WriteStderr(", %.4fs elapsed", t2-t1);
945 }
946 PySys_WriteStderr(".\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000947 }
948
949 /* Append instances in the uncollectable set to a Python
950 * reachable list of garbage. The programmer has to deal with
Tim Petersbf384c22003-04-06 00:11:39 +0000951 * this if they insist on creating this type of structure.
952 */
Tim Petersf6b80452003-04-07 19:21:15 +0000953 (void)handle_finalizers(&finalizers, old);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000954
Christian Heimes3b718a72008-02-14 12:47:33 +0000955 /* Clear free list only during the collection of the higest
956 * generation */
957 if (generation == NUM_GENERATIONS-1) {
958 clear_freelists();
959 }
960
Jeremy Hyltonb709df32000-09-01 02:47:25 +0000961 if (PyErr_Occurred()) {
Tim Petersf6b80452003-04-07 19:21:15 +0000962 if (gc_str == NULL)
Gregory P. Smithdd96db62008-06-09 04:58:54 +0000963 gc_str = PyString_FromString("garbage collection");
Jeremy Hyltonb709df32000-09-01 02:47:25 +0000964 PyErr_WriteUnraisable(gc_str);
965 Py_FatalError("unexpected exception during garbage collection");
966 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000967 return n+m;
968}
969
Neal Norwitz7b216c52006-03-04 20:01:53 +0000970static Py_ssize_t
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000971collect_generations(void)
972{
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000973 int i;
Neal Norwitz7b216c52006-03-04 20:01:53 +0000974 Py_ssize_t n = 0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000975
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000976 /* Find the oldest generation (higest numbered) where the count
977 * exceeds the threshold. Objects in the that generation and
978 * generations younger than it will be collected. */
979 for (i = NUM_GENERATIONS-1; i >= 0; i--) {
980 if (generations[i].count > generations[i].threshold) {
Antoine Pitrou4c5ecb72009-01-09 21:40:55 +0000981 /* Avoid quadratic performance degradation in number
982 of tracked objects. See comments at the beginning
983 of this file, and issue #4074.
984 */
985 if (i == NUM_GENERATIONS - 1
986 && long_lived_pending < long_lived_total / 4)
987 continue;
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000988 n = collect(i);
989 break;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000990 }
991 }
992 return n;
993}
994
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000995PyDoc_STRVAR(gc_enable__doc__,
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000996"enable() -> None\n"
997"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000998"Enable automatic garbage collection.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000999
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001000static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001001gc_enable(PyObject *self, PyObject *noargs)
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001002{
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001003 enabled = 1;
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001004 Py_INCREF(Py_None);
1005 return Py_None;
1006}
1007
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001008PyDoc_STRVAR(gc_disable__doc__,
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001009"disable() -> None\n"
1010"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001011"Disable automatic garbage collection.\n");
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001012
1013static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001014gc_disable(PyObject *self, PyObject *noargs)
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001015{
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001016 enabled = 0;
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001017 Py_INCREF(Py_None);
1018 return Py_None;
1019}
1020
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001021PyDoc_STRVAR(gc_isenabled__doc__,
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001022"isenabled() -> status\n"
1023"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001024"Returns true if automatic garbage collection is enabled.\n");
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001025
1026static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001027gc_isenabled(PyObject *self, PyObject *noargs)
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001028{
Raymond Hettinger674d56b2004-01-04 04:00:13 +00001029 return PyBool_FromLong((long)enabled);
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001030}
1031
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001032PyDoc_STRVAR(gc_collect__doc__,
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001033"collect([generation]) -> n\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001034"\n"
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001035"With no arguments, run a full collection. The optional argument\n"
1036"may be an integer specifying which generation to collect. A ValueError\n"
1037"is raised if the generation number is invalid.\n\n"
1038"The number of unreachable objects is returned.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001039
1040static PyObject *
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001041gc_collect(PyObject *self, PyObject *args, PyObject *kws)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001042{
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001043 static char *keywords[] = {"generation", NULL};
1044 int genarg = NUM_GENERATIONS - 1;
Neal Norwitz7b216c52006-03-04 20:01:53 +00001045 Py_ssize_t n;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001046
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001047 if (!PyArg_ParseTupleAndKeywords(args, kws, "|i", keywords, &genarg))
1048 return NULL;
1049
1050 else if (genarg < 0 || genarg >= NUM_GENERATIONS) {
1051 PyErr_SetString(PyExc_ValueError, "invalid generation");
1052 return NULL;
1053 }
1054
Tim Peters50c61d52003-04-06 01:50:50 +00001055 if (collecting)
Neil Schemenauere8c40cb2001-10-31 23:09:35 +00001056 n = 0; /* already collecting, don't do anything */
Neil Schemenauere8c40cb2001-10-31 23:09:35 +00001057 else {
1058 collecting = 1;
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001059 n = collect(genarg);
Neil Schemenauere8c40cb2001-10-31 23:09:35 +00001060 collecting = 0;
1061 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001062
Neal Norwitz7b216c52006-03-04 20:01:53 +00001063 return PyInt_FromSsize_t(n);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001064}
1065
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001066PyDoc_STRVAR(gc_set_debug__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001067"set_debug(flags) -> None\n"
1068"\n"
1069"Set the garbage collection debugging flags. Debugging information is\n"
1070"written to sys.stderr.\n"
1071"\n"
1072"flags is an integer and can have the following bits turned on:\n"
1073"\n"
1074" DEBUG_STATS - Print statistics during collection.\n"
1075" DEBUG_COLLECTABLE - Print collectable objects found.\n"
1076" DEBUG_UNCOLLECTABLE - Print unreachable but uncollectable objects found.\n"
1077" DEBUG_INSTANCES - Print instance objects.\n"
1078" DEBUG_OBJECTS - Print objects other than instances.\n"
Neil Schemenauer544de1e2000-09-22 15:22:38 +00001079" DEBUG_SAVEALL - Save objects to gc.garbage rather than freeing them.\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001080" DEBUG_LEAK - Debug leaking programs (everything but STATS).\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001081
1082static PyObject *
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001083gc_set_debug(PyObject *self, PyObject *args)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001084{
Neil Schemenauer7760cff2000-09-22 22:35:36 +00001085 if (!PyArg_ParseTuple(args, "i:set_debug", &debug))
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001086 return NULL;
1087
1088 Py_INCREF(Py_None);
1089 return Py_None;
1090}
1091
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001092PyDoc_STRVAR(gc_get_debug__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001093"get_debug() -> flags\n"
1094"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001095"Get the garbage collection debugging flags.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001096
1097static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001098gc_get_debug(PyObject *self, PyObject *noargs)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001099{
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001100 return Py_BuildValue("i", debug);
1101}
1102
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001103PyDoc_STRVAR(gc_set_thresh__doc__,
Neal Norwitz2a47c0f2002-01-29 00:53:41 +00001104"set_threshold(threshold0, [threshold1, threshold2]) -> None\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001105"\n"
1106"Sets the collection thresholds. Setting threshold0 to zero disables\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001107"collection.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001108
1109static PyObject *
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001110gc_set_thresh(PyObject *self, PyObject *args)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001111{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001112 int i;
1113 if (!PyArg_ParseTuple(args, "i|ii:set_threshold",
1114 &generations[0].threshold,
1115 &generations[1].threshold,
1116 &generations[2].threshold))
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001117 return NULL;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001118 for (i = 2; i < NUM_GENERATIONS; i++) {
1119 /* generations higher than 2 get the same threshold */
1120 generations[i].threshold = generations[2].threshold;
1121 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001122
1123 Py_INCREF(Py_None);
1124 return Py_None;
1125}
1126
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001127PyDoc_STRVAR(gc_get_thresh__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001128"get_threshold() -> (threshold0, threshold1, threshold2)\n"
1129"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001130"Return the current collection thresholds\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001131
1132static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001133gc_get_thresh(PyObject *self, PyObject *noargs)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001134{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001135 return Py_BuildValue("(iii)",
1136 generations[0].threshold,
1137 generations[1].threshold,
1138 generations[2].threshold);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001139}
1140
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001141PyDoc_STRVAR(gc_get_count__doc__,
1142"get_count() -> (count0, count1, count2)\n"
1143"\n"
1144"Return the current collection counts\n");
1145
1146static PyObject *
1147gc_get_count(PyObject *self, PyObject *noargs)
1148{
1149 return Py_BuildValue("(iii)",
1150 generations[0].count,
1151 generations[1].count,
1152 generations[2].count);
1153}
1154
Neil Schemenauer48c70342001-08-09 15:38:31 +00001155static int
Martin v. Löwis560da622001-11-24 09:24:51 +00001156referrersvisit(PyObject* obj, PyObject *objs)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001157{
Neal Norwitzffb0d902006-04-06 08:07:25 +00001158 Py_ssize_t i;
Martin v. Löwisc8fe77b2001-11-29 18:08:31 +00001159 for (i = 0; i < PyTuple_GET_SIZE(objs); i++)
1160 if (PyTuple_GET_ITEM(objs, i) == obj)
1161 return 1;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001162 return 0;
1163}
1164
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001165static int
Martin v. Löwis560da622001-11-24 09:24:51 +00001166gc_referrers_for(PyObject *objs, PyGC_Head *list, PyObject *resultlist)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001167{
1168 PyGC_Head *gc;
1169 PyObject *obj;
1170 traverseproc traverse;
Tim Peters9e4ca102001-10-11 18:31:31 +00001171 for (gc = list->gc.gc_next; gc != list; gc = gc->gc.gc_next) {
Neil Schemenauer43411b52001-08-30 00:05:51 +00001172 obj = FROM_GC(gc);
Christian Heimese93237d2007-12-19 02:37:44 +00001173 traverse = Py_TYPE(obj)->tp_traverse;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001174 if (obj == objs || obj == resultlist)
1175 continue;
Martin v. Löwis560da622001-11-24 09:24:51 +00001176 if (traverse(obj, (visitproc)referrersvisit, objs)) {
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001177 if (PyList_Append(resultlist, obj) < 0)
1178 return 0; /* error */
Neil Schemenauer48c70342001-08-09 15:38:31 +00001179 }
1180 }
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001181 return 1; /* no error */
Neil Schemenauer48c70342001-08-09 15:38:31 +00001182}
1183
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001184PyDoc_STRVAR(gc_get_referrers__doc__,
Martin v. Löwis560da622001-11-24 09:24:51 +00001185"get_referrers(*objs) -> list\n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001186Return the list of objects that directly refer to any of objs.");
Neil Schemenauer48c70342001-08-09 15:38:31 +00001187
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001188static PyObject *
Martin v. Löwis560da622001-11-24 09:24:51 +00001189gc_get_referrers(PyObject *self, PyObject *args)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001190{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001191 int i;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001192 PyObject *result = PyList_New(0);
Georg Brandl5c170fd2006-03-17 19:03:25 +00001193 if (!result) return NULL;
1194
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001195 for (i = 0; i < NUM_GENERATIONS; i++) {
1196 if (!(gc_referrers_for(args, GEN_HEAD(i), result))) {
1197 Py_DECREF(result);
1198 return NULL;
1199 }
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001200 }
Neil Schemenauer48c70342001-08-09 15:38:31 +00001201 return result;
1202}
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001203
Tim Peters0f81ab62003-04-08 16:39:48 +00001204/* Append obj to list; return true if error (out of memory), false if OK. */
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001205static int
Tim Peters730f5532003-04-08 17:17:17 +00001206referentsvisit(PyObject *obj, PyObject *list)
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001207{
Tim Peters0f81ab62003-04-08 16:39:48 +00001208 return PyList_Append(list, obj) < 0;
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001209}
1210
Tim Peters730f5532003-04-08 17:17:17 +00001211PyDoc_STRVAR(gc_get_referents__doc__,
1212"get_referents(*objs) -> list\n\
Jeremy Hylton059b0942003-04-03 16:29:13 +00001213Return the list of objects that are directly referred to by objs.");
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001214
1215static PyObject *
Tim Peters730f5532003-04-08 17:17:17 +00001216gc_get_referents(PyObject *self, PyObject *args)
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001217{
Neal Norwitzffb0d902006-04-06 08:07:25 +00001218 Py_ssize_t i;
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001219 PyObject *result = PyList_New(0);
Tim Peters0f81ab62003-04-08 16:39:48 +00001220
1221 if (result == NULL)
1222 return NULL;
1223
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001224 for (i = 0; i < PyTuple_GET_SIZE(args); i++) {
Tim Peters0f81ab62003-04-08 16:39:48 +00001225 traverseproc traverse;
Tim Peters93ad66d2003-04-05 17:15:44 +00001226 PyObject *obj = PyTuple_GET_ITEM(args, i);
Tim Peters0f81ab62003-04-08 16:39:48 +00001227
1228 if (! PyObject_IS_GC(obj))
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001229 continue;
Christian Heimese93237d2007-12-19 02:37:44 +00001230 traverse = Py_TYPE(obj)->tp_traverse;
Tim Peters0f81ab62003-04-08 16:39:48 +00001231 if (! traverse)
1232 continue;
Tim Peters730f5532003-04-08 17:17:17 +00001233 if (traverse(obj, (visitproc)referentsvisit, result)) {
Tim Peters0f81ab62003-04-08 16:39:48 +00001234 Py_DECREF(result);
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001235 return NULL;
Tim Peters0f81ab62003-04-08 16:39:48 +00001236 }
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001237 }
1238 return result;
1239}
1240
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001241PyDoc_STRVAR(gc_get_objects__doc__,
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001242"get_objects() -> [...]\n"
1243"\n"
1244"Return a list of objects tracked by the collector (excluding the list\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001245"returned).\n");
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001246
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001247static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001248gc_get_objects(PyObject *self, PyObject *noargs)
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001249{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001250 int i;
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001251 PyObject* result;
1252
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001253 result = PyList_New(0);
Tim Peters50c61d52003-04-06 01:50:50 +00001254 if (result == NULL)
Martin v. Löwisf8a6f242001-12-02 18:31:02 +00001255 return NULL;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001256 for (i = 0; i < NUM_GENERATIONS; i++) {
1257 if (append_objects(result, GEN_HEAD(i))) {
1258 Py_DECREF(result);
1259 return NULL;
1260 }
Martin v. Löwis155aad12001-12-02 12:21:34 +00001261 }
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001262 return result;
1263}
1264
1265
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001266PyDoc_STRVAR(gc__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001267"This module provides access to the garbage collector for reference cycles.\n"
1268"\n"
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001269"enable() -- Enable automatic garbage collection.\n"
1270"disable() -- Disable automatic garbage collection.\n"
1271"isenabled() -- Returns true if automatic collection is enabled.\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001272"collect() -- Do a full collection right now.\n"
Barry Warsawe5ec6132006-10-09 19:43:24 +00001273"get_count() -- Return the current collection counts.\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001274"set_debug() -- Set debugging flags.\n"
1275"get_debug() -- Get debugging flags.\n"
1276"set_threshold() -- Set the collection thresholds.\n"
1277"get_threshold() -- Return the current the collection thresholds.\n"
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001278"get_objects() -- Return a list of all objects tracked by the collector.\n"
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001279"get_referrers() -- Return the list of objects that refer to an object.\n"
Tim Peters730f5532003-04-08 17:17:17 +00001280"get_referents() -- Return the list of objects that an object refers to.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001281
1282static PyMethodDef GcMethods[] = {
Tim Peters50c61d52003-04-06 01:50:50 +00001283 {"enable", gc_enable, METH_NOARGS, gc_enable__doc__},
1284 {"disable", gc_disable, METH_NOARGS, gc_disable__doc__},
1285 {"isenabled", gc_isenabled, METH_NOARGS, gc_isenabled__doc__},
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001286 {"set_debug", gc_set_debug, METH_VARARGS, gc_set_debug__doc__},
Tim Peters50c61d52003-04-06 01:50:50 +00001287 {"get_debug", gc_get_debug, METH_NOARGS, gc_get_debug__doc__},
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001288 {"get_count", gc_get_count, METH_NOARGS, gc_get_count__doc__},
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001289 {"set_threshold", gc_set_thresh, METH_VARARGS, gc_set_thresh__doc__},
Tim Peters50c61d52003-04-06 01:50:50 +00001290 {"get_threshold", gc_get_thresh, METH_NOARGS, gc_get_thresh__doc__},
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001291 {"collect", (PyCFunction)gc_collect,
1292 METH_VARARGS | METH_KEYWORDS, gc_collect__doc__},
Tim Peters50c61d52003-04-06 01:50:50 +00001293 {"get_objects", gc_get_objects,METH_NOARGS, gc_get_objects__doc__},
Martin v. Löwis560da622001-11-24 09:24:51 +00001294 {"get_referrers", gc_get_referrers, METH_VARARGS,
1295 gc_get_referrers__doc__},
Tim Peters730f5532003-04-08 17:17:17 +00001296 {"get_referents", gc_get_referents, METH_VARARGS,
1297 gc_get_referents__doc__},
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001298 {NULL, NULL} /* Sentinel */
1299};
1300
Jason Tishler6bc06ec2003-09-04 11:59:50 +00001301PyMODINIT_FUNC
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001302initgc(void)
1303{
1304 PyObject *m;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001305
1306 m = Py_InitModule4("gc",
1307 GcMethods,
1308 gc__doc__,
1309 NULL,
1310 PYTHON_API_VERSION);
Neal Norwitz1ac754f2006-01-19 06:09:39 +00001311 if (m == NULL)
1312 return;
Tim Peters11558872003-04-06 23:30:52 +00001313
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001314 if (garbage == NULL) {
1315 garbage = PyList_New(0);
Tim Peters11558872003-04-06 23:30:52 +00001316 if (garbage == NULL)
1317 return;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001318 }
Neil Schemenauer3b1cbf92005-06-18 17:37:06 +00001319 Py_INCREF(garbage);
Tim Peters11558872003-04-06 23:30:52 +00001320 if (PyModule_AddObject(m, "garbage", garbage) < 0)
1321 return;
Neal Norwitz57a03612006-04-26 05:34:03 +00001322
1323 /* Importing can't be done in collect() because collect()
1324 * can be called via PyGC_Collect() in Py_Finalize().
1325 * This wouldn't be a problem, except that <initialized> is
1326 * reset to 0 before calling collect which trips up
1327 * the import and triggers an assertion.
1328 */
1329 if (tmod == NULL) {
Christian Heimes000a0742008-01-03 22:16:32 +00001330 tmod = PyImport_ImportModuleNoBlock("time");
Neal Norwitz57a03612006-04-26 05:34:03 +00001331 if (tmod == NULL)
1332 PyErr_Clear();
1333 }
1334
Tim Peters11558872003-04-06 23:30:52 +00001335#define ADD_INT(NAME) if (PyModule_AddIntConstant(m, #NAME, NAME) < 0) return
1336 ADD_INT(DEBUG_STATS);
1337 ADD_INT(DEBUG_COLLECTABLE);
1338 ADD_INT(DEBUG_UNCOLLECTABLE);
1339 ADD_INT(DEBUG_INSTANCES);
1340 ADD_INT(DEBUG_OBJECTS);
1341 ADD_INT(DEBUG_SAVEALL);
1342 ADD_INT(DEBUG_LEAK);
1343#undef ADD_INT
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001344}
1345
Guido van Rossume13ddc92003-04-17 17:29:22 +00001346/* API to invoke gc.collect() from C */
Neal Norwitz7b216c52006-03-04 20:01:53 +00001347Py_ssize_t
Guido van Rossume13ddc92003-04-17 17:29:22 +00001348PyGC_Collect(void)
1349{
Neal Norwitz7b216c52006-03-04 20:01:53 +00001350 Py_ssize_t n;
Guido van Rossume13ddc92003-04-17 17:29:22 +00001351
1352 if (collecting)
1353 n = 0; /* already collecting, don't do anything */
1354 else {
1355 collecting = 1;
1356 n = collect(NUM_GENERATIONS - 1);
1357 collecting = 0;
1358 }
1359
1360 return n;
1361}
1362
Neil Schemenauer43411b52001-08-30 00:05:51 +00001363/* for debugging */
Guido van Rossume13ddc92003-04-17 17:29:22 +00001364void
1365_PyGC_Dump(PyGC_Head *g)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001366{
1367 _PyObject_Dump(FROM_GC(g));
1368}
1369
/* extension modules might be compiled with GC support so these
   functions must always be available */

/* Remove any macro definitions of these names so that the functions
   defined below are not rewritten by the preprocessor. */
#undef PyObject_GC_Track
#undef PyObject_GC_UnTrack
#undef PyObject_GC_Del
#undef _PyObject_GC_Malloc
1377
Neil Schemenauer43411b52001-08-30 00:05:51 +00001378void
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001379PyObject_GC_Track(void *op)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001380{
1381 _PyObject_GC_TRACK(op);
1382}
1383
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001384/* for binary compatibility with 2.2 */
Neil Schemenauer43411b52001-08-30 00:05:51 +00001385void
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001386_PyObject_GC_Track(PyObject *op)
1387{
1388 PyObject_GC_Track(op);
1389}
1390
/* Apply _PyObject_GC_UNTRACK() to `op`, but only if IS_TRACKED(op) holds. */
void
PyObject_GC_UnTrack(void *op)
{
    /* Obscure: the Py_TRASHCAN mechanism requires that we be able to
     * call PyObject_GC_UnTrack twice on an object, so a second call on
     * an already-untracked object must be a no-op.
     */
    if (!IS_TRACKED(op))
        return;
    _PyObject_GC_UNTRACK(op);
}
1400
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001401/* for binary compatibility with 2.2 */
1402void
1403_PyObject_GC_UnTrack(PyObject *op)
1404{
1405 PyObject_GC_UnTrack(op);
1406}
1407
Neil Schemenauer43411b52001-08-30 00:05:51 +00001408PyObject *
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001409_PyObject_GC_Malloc(size_t basicsize)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001410{
1411 PyObject *op;
Neal Norwitze7d8be82008-07-31 17:17:14 +00001412 PyGC_Head *g;
1413 if (basicsize > PY_SSIZE_T_MAX - sizeof(PyGC_Head))
1414 return PyErr_NoMemory();
1415 g = (PyGC_Head *)PyObject_MALLOC(
Anthony Baxter64182fe2006-04-11 12:14:09 +00001416 sizeof(PyGC_Head) + basicsize);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001417 if (g == NULL)
Jeremy Hylton8a135182002-06-06 23:23:55 +00001418 return PyErr_NoMemory();
Tim Petersea405632002-07-02 00:52:30 +00001419 g->gc.gc_refs = GC_UNTRACKED;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001420 generations[0].count++; /* number of allocated GC objects */
1421 if (generations[0].count > generations[0].threshold &&
Neil Schemenauer43411b52001-08-30 00:05:51 +00001422 enabled &&
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001423 generations[0].threshold &&
Neil Schemenauer43411b52001-08-30 00:05:51 +00001424 !collecting &&
1425 !PyErr_Occurred()) {
1426 collecting = 1;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001427 collect_generations();
Neil Schemenauer43411b52001-08-30 00:05:51 +00001428 collecting = 0;
1429 }
1430 op = FROM_GC(g);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001431 return op;
1432}
1433
1434PyObject *
1435_PyObject_GC_New(PyTypeObject *tp)
1436{
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001437 PyObject *op = _PyObject_GC_Malloc(_PyObject_SIZE(tp));
Tim Petersfa8efab2002-04-28 01:57:25 +00001438 if (op != NULL)
1439 op = PyObject_INIT(op, tp);
1440 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001441}
1442
1443PyVarObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +00001444_PyObject_GC_NewVar(PyTypeObject *tp, Py_ssize_t nitems)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001445{
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001446 const size_t size = _PyObject_VAR_SIZE(tp, nitems);
1447 PyVarObject *op = (PyVarObject *) _PyObject_GC_Malloc(size);
Tim Petersfa8efab2002-04-28 01:57:25 +00001448 if (op != NULL)
1449 op = PyObject_INIT_VAR(op, tp, nitems);
1450 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001451}
1452
1453PyVarObject *
Martin v. Löwis41290682006-02-16 14:56:14 +00001454_PyObject_GC_Resize(PyVarObject *op, Py_ssize_t nitems)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001455{
Christian Heimese93237d2007-12-19 02:37:44 +00001456 const size_t basicsize = _PyObject_VAR_SIZE(Py_TYPE(op), nitems);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001457 PyGC_Head *g = AS_GC(op);
Neal Norwitze7d8be82008-07-31 17:17:14 +00001458 if (basicsize > PY_SSIZE_T_MAX - sizeof(PyGC_Head))
1459 return (PyVarObject *)PyErr_NoMemory();
Anthony Baxter64182fe2006-04-11 12:14:09 +00001460 g = (PyGC_Head *)PyObject_REALLOC(g, sizeof(PyGC_Head) + basicsize);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001461 if (g == NULL)
1462 return (PyVarObject *)PyErr_NoMemory();
1463 op = (PyVarObject *) FROM_GC(g);
Christian Heimese93237d2007-12-19 02:37:44 +00001464 Py_SIZE(op) = nitems;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001465 return op;
1466}
1467
1468void
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001469PyObject_GC_Del(void *op)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001470{
Neil Schemenauer43411b52001-08-30 00:05:51 +00001471 PyGC_Head *g = AS_GC(op);
Neil Schemenauera2b11ec2002-05-21 15:53:24 +00001472 if (IS_TRACKED(op))
Neil Schemenauer43411b52001-08-30 00:05:51 +00001473 gc_list_remove(g);
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001474 if (generations[0].count > 0) {
1475 generations[0].count--;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001476 }
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001477 PyObject_FREE(g);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001478}
1479
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001480/* for binary compatibility with 2.2 */
1481#undef _PyObject_GC_Del
1482void
1483_PyObject_GC_Del(PyObject *op)
1484{
1485 PyObject_GC_Del(op);
1486}