blob: 4d71591466bb8aaf49589028268c9a4a68106022 [file] [log] [blame]
/*

  Reference Cycle Garbage Collection
  ==================================

  Neil Schemenauer <nas@arctrix.com>

  Based on a post on the python-dev list.  Ideas from Guido van Rossum,
  Eric Tiedemann, and various others.

  http://www.arctrix.com/nas/python/gc/
  http://www.python.org/pipermail/python-dev/2000-March/003869.html
  http://www.python.org/pipermail/python-dev/2000-March/004010.html
  http://www.python.org/pipermail/python-dev/2000-March/004022.html

  For a high-level view of the collection process, read the collect
  function.

*/
20
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000021#include "Python.h"
Christian Heimes3b718a72008-02-14 12:47:33 +000022#include "frameobject.h" /* for PyFrame_ClearFreeList */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000023
/* Get an object's GC head: step back one PyGC_Head from the object. */
#define AS_GC(o) ((PyGC_Head *)(o)-1)

/* Get the object given the GC head: step forward one PyGC_Head.
 * The argument is parenthesized so that an expression argument (for
 * example `base + offset`) is cast as a whole, not just its first operand.
 */
#define FROM_GC(g) ((PyObject *)(((PyGC_Head *)(g))+1))
29
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000030/*** Global GC state ***/
31
Neil Schemenauer2880ae52002-05-04 05:35:20 +000032struct gc_generation {
33 PyGC_Head head;
34 int threshold; /* collection threshold */
35 int count; /* count of allocations or collections of younger
36 generations */
37};
38
39#define NUM_GENERATIONS 3
40#define GEN_HEAD(n) (&generations[n].head)
41
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000042/* linked lists of container objects */
Neil Schemenauer2880ae52002-05-04 05:35:20 +000043static struct gc_generation generations[NUM_GENERATIONS] = {
44 /* PyGC_Head, threshold, count */
45 {{{GEN_HEAD(0), GEN_HEAD(0), 0}}, 700, 0},
46 {{{GEN_HEAD(1), GEN_HEAD(1), 0}}, 10, 0},
47 {{{GEN_HEAD(2), GEN_HEAD(2), 0}}, 10, 0},
48};
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000049
Neil Schemenauer2880ae52002-05-04 05:35:20 +000050PyGC_Head *_PyGC_generation0 = GEN_HEAD(0);
51
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +000052static int enabled = 1; /* automatic collection enabled? */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000053
Neil Schemenauer43411b52001-08-30 00:05:51 +000054/* true if we are currently running the collector */
Tim Petersbf384c22003-04-06 00:11:39 +000055static int collecting = 0;
Neil Schemenauer43411b52001-08-30 00:05:51 +000056
Tim Peters6fc13d92002-07-02 18:12:35 +000057/* list of uncollectable objects */
Tim Petersbf384c22003-04-06 00:11:39 +000058static PyObject *garbage = NULL;
Tim Peters6fc13d92002-07-02 18:12:35 +000059
60/* Python string to use if unhandled exception occurs */
Tim Petersbf384c22003-04-06 00:11:39 +000061static PyObject *gc_str = NULL;
Tim Peters6fc13d92002-07-02 18:12:35 +000062
Tim Peters93ad66d2003-04-05 17:15:44 +000063/* Python string used to look for __del__ attribute. */
64static PyObject *delstr = NULL;
Jeremy Hyltonce136e92003-04-04 19:59:06 +000065
Antoine Pitrou4c5ecb72009-01-09 21:40:55 +000066/* This is the number of objects who survived the last full collection. It
67 approximates the number of long lived objects tracked by the GC.
68
69 (by "full collection", we mean a collection of the oldest generation).
70*/
71static Py_ssize_t long_lived_total = 0;
72
73/* This is the number of objects who survived all "non-full" collections,
74 and are awaiting to undergo a full collection for the first time.
75
76*/
77static Py_ssize_t long_lived_pending = 0;
78
/*
   NOTE: about the counting of long-lived objects.

   To limit the cost of garbage collection, there are two strategies:
     - make each collection faster, e.g. by scanning fewer objects
     - do fewer collections
   This heuristic is about the latter strategy.

   In addition to the various configurable thresholds, we only trigger a
   full collection if the ratio
    long_lived_pending / long_lived_total
   is above a given value (hardwired to 25%).

   The reason is that, while "non-full" collections (i.e., collections of
   the young and middle generations) will always examine roughly the same
   number of objects -- determined by the aforementioned thresholds --,
   the cost of a full collection is proportional to the total number of
   long-lived objects, which is virtually unbounded.

   Indeed, it has been remarked that doing a full collection every
   <constant number> of object creations entails a dramatic performance
   degradation in workloads which consist of creating and storing lots of
   long-lived objects (e.g. building a large list of GC-tracked objects would
   show quadratic performance, instead of linear as expected: see issue #4074).

   Using the above ratio, instead, yields amortized linear performance in
   the total number of objects (the effect of which can be summarized
   thusly: "each full garbage collection is more and more costly as the
   number of objects grows, but we do fewer and fewer of them").

   This heuristic was suggested by Martin von Löwis on python-dev in
   June 2008. His original analysis and proposal can be found at:
    http://mail.python.org/pipermail/python-dev/2008-June/080579.html
*/
113
114
/* Bit flags selecting which debugging information is produced. */
#define DEBUG_STATS             (1<<0) /* print collection statistics */
#define DEBUG_COLLECTABLE       (1<<1) /* print collectable objects */
#define DEBUG_UNCOLLECTABLE     (1<<2) /* print uncollectable objects */
#define DEBUG_INSTANCES         (1<<3) /* print instances */
#define DEBUG_OBJECTS           (1<<4) /* print other objects */
#define DEBUG_SAVEALL           (1<<5) /* save all garbage in gc.garbage */
/* Union of the flags above except DEBUG_STATS.  The replacement list is
 * parenthesized so the macro behaves as a single operand: without the
 * parentheses, `flags & DEBUG_LEAK` would bind `&` to DEBUG_COLLECTABLE
 * only, because `&` has higher precedence than `|`.
 */
#define DEBUG_LEAK              (DEBUG_COLLECTABLE | \
                                 DEBUG_UNCOLLECTABLE | \
                                 DEBUG_INSTANCES | \
                                 DEBUG_OBJECTS | \
                                 DEBUG_SAVEALL)
Jeremy Hyltonb709df32000-09-01 02:47:25 +0000127static int debug;
Neal Norwitz57a03612006-04-26 05:34:03 +0000128static PyObject *tmod = NULL;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000129
/*--------------------------------------------------------------------------
gc_refs values.

Between collections, every gc'ed object has one of two gc_refs values:

GC_UNTRACKED
    The initial state; objects returned by PyObject_GC_Malloc are in this
    state.  The object doesn't live in any generation list, and its
    tp_traverse slot must not be called.

GC_REACHABLE
    The object lives in some generation list, and its tp_traverse is safe to
    call.  An object transitions to GC_REACHABLE when PyObject_GC_Track
    is called.

During a collection, gc_refs can temporarily take on other states:

>= 0
    At the start of a collection, update_refs() copies the true refcount
    to gc_refs, for each object in the generation being collected.
    subtract_refs() then adjusts gc_refs so that it equals the number of
    times an object is referenced directly from outside the generation
    being collected.
    gc_refs remains >= 0 throughout these steps.

GC_TENTATIVELY_UNREACHABLE
    move_unreachable() then moves objects not reachable (whether directly or
    indirectly) from outside the generation into an "unreachable" set.
    Objects that are found to be reachable have gc_refs set to GC_REACHABLE
    again.  Objects that are found to be unreachable have gc_refs set to
    GC_TENTATIVELY_UNREACHABLE.  It's "tentatively" because the pass doing
    this can't be sure until it ends, and GC_TENTATIVELY_UNREACHABLE may
    transition back to GC_REACHABLE.

    Only objects with GC_TENTATIVELY_UNREACHABLE still set are candidates
    for collection.  If it's decided not to collect such an object (e.g.,
    it has a __del__ method), its gc_refs is restored to GC_REACHABLE again.
----------------------------------------------------------------------------
*/
/* Short local spellings of the gc_refs state constants. */
#define GC_UNTRACKED                    _PyGC_REFS_UNTRACKED
#define GC_REACHABLE                    _PyGC_REFS_REACHABLE
#define GC_TENTATIVELY_UNREACHABLE      _PyGC_REFS_TENTATIVELY_UNREACHABLE

/* Predicates on the gc_refs value stored in the GC head of object `o`. */
#define IS_TRACKED(o) ((AS_GC(o))->gc.gc_refs != GC_UNTRACKED)
#define IS_REACHABLE(o) ((AS_GC(o))->gc.gc_refs == GC_REACHABLE)
#define IS_TENTATIVELY_UNREACHABLE(o) \
    ((AS_GC(o))->gc.gc_refs == GC_TENTATIVELY_UNREACHABLE)
Neil Schemenauera2b11ec2002-05-21 15:53:24 +0000177
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000178/*** list functions ***/
179
180static void
181gc_list_init(PyGC_Head *list)
182{
Tim Peters9e4ca102001-10-11 18:31:31 +0000183 list->gc.gc_prev = list;
184 list->gc.gc_next = list;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000185}
186
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000187static int
188gc_list_is_empty(PyGC_Head *list)
189{
190 return (list->gc.gc_next == list);
191}
192
#if 0
/* This became unused after gc_list_move() was introduced. */
/* Link `node` in as the last element of `list`. */
static void
gc_list_append(PyGC_Head *node, PyGC_Head *list)
{
    PyGC_Head *last = list->gc.gc_prev;

    node->gc.gc_next = list;
    node->gc.gc_prev = last;
    last->gc.gc_next = node;
    list->gc.gc_prev = node;
}
#endif
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000205
Tim Peterse2d59182004-11-01 01:39:08 +0000206/* Remove `node` from the gc list it's currently in. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000207static void
208gc_list_remove(PyGC_Head *node)
209{
Tim Peters9e4ca102001-10-11 18:31:31 +0000210 node->gc.gc_prev->gc.gc_next = node->gc.gc_next;
211 node->gc.gc_next->gc.gc_prev = node->gc.gc_prev;
212 node->gc.gc_next = NULL; /* object is not currently tracked */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000213}
214
Tim Peterse2d59182004-11-01 01:39:08 +0000215/* Move `node` from the gc list it's currently in (which is not explicitly
216 * named here) to the end of `list`. This is semantically the same as
217 * gc_list_remove(node) followed by gc_list_append(node, list).
218 */
219static void
220gc_list_move(PyGC_Head *node, PyGC_Head *list)
221{
Tim Petersbc1d1b82004-11-01 16:39:57 +0000222 PyGC_Head *new_prev;
Tim Peterse2d59182004-11-01 01:39:08 +0000223 PyGC_Head *current_prev = node->gc.gc_prev;
224 PyGC_Head *current_next = node->gc.gc_next;
Tim Petersbc1d1b82004-11-01 16:39:57 +0000225 /* Unlink from current list. */
Tim Peterse2d59182004-11-01 01:39:08 +0000226 current_prev->gc.gc_next = current_next;
227 current_next->gc.gc_prev = current_prev;
Tim Petersbc1d1b82004-11-01 16:39:57 +0000228 /* Relink at end of new list. */
229 new_prev = node->gc.gc_prev = list->gc.gc_prev;
Tim Peterse2d59182004-11-01 01:39:08 +0000230 new_prev->gc.gc_next = list->gc.gc_prev = node;
Tim Petersbc1d1b82004-11-01 16:39:57 +0000231 node->gc.gc_next = list;
Tim Peterse2d59182004-11-01 01:39:08 +0000232}
233
234/* append list `from` onto list `to`; `from` becomes an empty list */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000235static void
236gc_list_merge(PyGC_Head *from, PyGC_Head *to)
237{
238 PyGC_Head *tail;
Tim Peterse2d59182004-11-01 01:39:08 +0000239 assert(from != to);
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000240 if (!gc_list_is_empty(from)) {
Tim Peters9e4ca102001-10-11 18:31:31 +0000241 tail = to->gc.gc_prev;
242 tail->gc.gc_next = from->gc.gc_next;
243 tail->gc.gc_next->gc.gc_prev = tail;
244 to->gc.gc_prev = from->gc.gc_prev;
245 to->gc.gc_prev->gc.gc_next = to;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000246 }
247 gc_list_init(from);
248}
249
Neal Norwitz7b216c52006-03-04 20:01:53 +0000250static Py_ssize_t
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000251gc_list_size(PyGC_Head *list)
252{
253 PyGC_Head *gc;
Neal Norwitz7b216c52006-03-04 20:01:53 +0000254 Py_ssize_t n = 0;
Tim Peters9e4ca102001-10-11 18:31:31 +0000255 for (gc = list->gc.gc_next; gc != list; gc = gc->gc.gc_next) {
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000256 n++;
257 }
258 return n;
259}
260
Tim Peters259272b2003-04-06 19:41:39 +0000261/* Append objects in a GC list to a Python list.
262 * Return 0 if all OK, < 0 if error (out of memory for list).
263 */
264static int
265append_objects(PyObject *py_list, PyGC_Head *gc_list)
266{
267 PyGC_Head *gc;
268 for (gc = gc_list->gc.gc_next; gc != gc_list; gc = gc->gc.gc_next) {
269 PyObject *op = FROM_GC(gc);
270 if (op != py_list) {
271 if (PyList_Append(py_list, op)) {
272 return -1; /* exception */
273 }
274 }
275 }
276 return 0;
277}
278
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000279/*** end of list stuff ***/
280
281
Tim Peters19b74c72002-07-01 03:52:19 +0000282/* Set all gc_refs = ob_refcnt. After this, gc_refs is > 0 for all objects
283 * in containers, and is GC_REACHABLE for all tracked gc objects not in
284 * containers.
Tim Peters88396172002-06-30 17:56:40 +0000285 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000286static void
287update_refs(PyGC_Head *containers)
288{
Tim Peters9e4ca102001-10-11 18:31:31 +0000289 PyGC_Head *gc = containers->gc.gc_next;
Tim Petersea405632002-07-02 00:52:30 +0000290 for (; gc != containers; gc = gc->gc.gc_next) {
291 assert(gc->gc.gc_refs == GC_REACHABLE);
Christian Heimese93237d2007-12-19 02:37:44 +0000292 gc->gc.gc_refs = Py_REFCNT(FROM_GC(gc));
Tim Peters780c4972003-11-14 00:01:17 +0000293 /* Python's cyclic gc should never see an incoming refcount
294 * of 0: if something decref'ed to 0, it should have been
295 * deallocated immediately at that time.
296 * Possible cause (if the assert triggers): a tp_dealloc
297 * routine left a gc-aware object tracked during its teardown
298 * phase, and did something-- or allowed something to happen --
299 * that called back into Python. gc can trigger then, and may
300 * see the still-tracked dying object. Before this assert
301 * was added, such mistakes went on to allow gc to try to
302 * delete the object again. In a debug build, that caused
303 * a mysterious segfault, when _Py_ForgetReference tried
304 * to remove the object from the doubly-linked list of all
305 * objects a second time. In a release build, an actual
306 * double deallocation occurred, which leads to corruption
307 * of the allocator's internal bookkeeping pointers. That's
308 * so serious that maybe this should be a release-build
309 * check instead of an assert?
310 */
311 assert(gc->gc.gc_refs != 0);
Tim Petersea405632002-07-02 00:52:30 +0000312 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000313}
314
Tim Peters19b74c72002-07-01 03:52:19 +0000315/* A traversal callback for subtract_refs. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000316static int
317visit_decref(PyObject *op, void *data)
318{
Tim Peters93cd83e2002-06-30 21:31:03 +0000319 assert(op != NULL);
Tim Peters19b74c72002-07-01 03:52:19 +0000320 if (PyObject_IS_GC(op)) {
321 PyGC_Head *gc = AS_GC(op);
322 /* We're only interested in gc_refs for objects in the
323 * generation being collected, which can be recognized
324 * because only they have positive gc_refs.
325 */
Tim Petersaab713b2002-07-02 22:15:28 +0000326 assert(gc->gc.gc_refs != 0); /* else refcount was too small */
Tim Peters19b74c72002-07-01 03:52:19 +0000327 if (gc->gc.gc_refs > 0)
328 gc->gc.gc_refs--;
329 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000330 return 0;
331}
332
Tim Peters19b74c72002-07-01 03:52:19 +0000333/* Subtract internal references from gc_refs. After this, gc_refs is >= 0
334 * for all objects in containers, and is GC_REACHABLE for all tracked gc
335 * objects not in containers. The ones with gc_refs > 0 are directly
336 * reachable from outside containers, and so can't be collected.
337 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000338static void
339subtract_refs(PyGC_Head *containers)
340{
341 traverseproc traverse;
Tim Peters9e4ca102001-10-11 18:31:31 +0000342 PyGC_Head *gc = containers->gc.gc_next;
343 for (; gc != containers; gc=gc->gc.gc_next) {
Christian Heimese93237d2007-12-19 02:37:44 +0000344 traverse = Py_TYPE(FROM_GC(gc))->tp_traverse;
Neil Schemenauer43411b52001-08-30 00:05:51 +0000345 (void) traverse(FROM_GC(gc),
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000346 (visitproc)visit_decref,
347 NULL);
348 }
349}
350
Tim Peters19b74c72002-07-01 03:52:19 +0000351/* A traversal callback for move_unreachable. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000352static int
Tim Peters19b74c72002-07-01 03:52:19 +0000353visit_reachable(PyObject *op, PyGC_Head *reachable)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000354{
Tim Petersea405632002-07-02 00:52:30 +0000355 if (PyObject_IS_GC(op)) {
Tim Peters19b74c72002-07-01 03:52:19 +0000356 PyGC_Head *gc = AS_GC(op);
Martin v. Löwis6db0e002006-03-01 16:56:25 +0000357 const Py_ssize_t gc_refs = gc->gc.gc_refs;
Tim Peters19b74c72002-07-01 03:52:19 +0000358
359 if (gc_refs == 0) {
360 /* This is in move_unreachable's 'young' list, but
361 * the traversal hasn't yet gotten to it. All
362 * we need to do is tell move_unreachable that it's
363 * reachable.
364 */
365 gc->gc.gc_refs = 1;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000366 }
Tim Peters19b74c72002-07-01 03:52:19 +0000367 else if (gc_refs == GC_TENTATIVELY_UNREACHABLE) {
368 /* This had gc_refs = 0 when move_unreachable got
369 * to it, but turns out it's reachable after all.
370 * Move it back to move_unreachable's 'young' list,
371 * and move_unreachable will eventually get to it
372 * again.
373 */
Tim Peterse2d59182004-11-01 01:39:08 +0000374 gc_list_move(gc, reachable);
Tim Peters19b74c72002-07-01 03:52:19 +0000375 gc->gc.gc_refs = 1;
376 }
377 /* Else there's nothing to do.
378 * If gc_refs > 0, it must be in move_unreachable's 'young'
379 * list, and move_unreachable will eventually get to it.
380 * If gc_refs == GC_REACHABLE, it's either in some other
381 * generation so we don't care about it, or move_unreachable
Tim Peters6fc13d92002-07-02 18:12:35 +0000382 * already dealt with it.
Tim Petersea405632002-07-02 00:52:30 +0000383 * If gc_refs == GC_UNTRACKED, it must be ignored.
Tim Peters19b74c72002-07-01 03:52:19 +0000384 */
Tim Petersea405632002-07-02 00:52:30 +0000385 else {
386 assert(gc_refs > 0
387 || gc_refs == GC_REACHABLE
388 || gc_refs == GC_UNTRACKED);
389 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000390 }
391 return 0;
392}
393
Tim Peters19b74c72002-07-01 03:52:19 +0000394/* Move the unreachable objects from young to unreachable. After this,
395 * all objects in young have gc_refs = GC_REACHABLE, and all objects in
396 * unreachable have gc_refs = GC_TENTATIVELY_UNREACHABLE. All tracked
397 * gc objects not in young or unreachable still have gc_refs = GC_REACHABLE.
398 * All objects in young after this are directly or indirectly reachable
399 * from outside the original young; and all objects in unreachable are
400 * not.
Tim Peters88396172002-06-30 17:56:40 +0000401 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000402static void
Tim Peters19b74c72002-07-01 03:52:19 +0000403move_unreachable(PyGC_Head *young, PyGC_Head *unreachable)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000404{
Tim Peters19b74c72002-07-01 03:52:19 +0000405 PyGC_Head *gc = young->gc.gc_next;
406
407 /* Invariants: all objects "to the left" of us in young have gc_refs
408 * = GC_REACHABLE, and are indeed reachable (directly or indirectly)
409 * from outside the young list as it was at entry. All other objects
410 * from the original young "to the left" of us are in unreachable now,
411 * and have gc_refs = GC_TENTATIVELY_UNREACHABLE. All objects to the
412 * left of us in 'young' now have been scanned, and no objects here
413 * or to the right have been scanned yet.
414 */
415
416 while (gc != young) {
417 PyGC_Head *next;
418
Tim Peters6fc13d92002-07-02 18:12:35 +0000419 if (gc->gc.gc_refs) {
420 /* gc is definitely reachable from outside the
421 * original 'young'. Mark it as such, and traverse
422 * its pointers to find any other objects that may
423 * be directly reachable from it. Note that the
424 * call to tp_traverse may append objects to young,
425 * so we have to wait until it returns to determine
426 * the next object to visit.
427 */
428 PyObject *op = FROM_GC(gc);
Christian Heimese93237d2007-12-19 02:37:44 +0000429 traverseproc traverse = Py_TYPE(op)->tp_traverse;
Tim Peters6fc13d92002-07-02 18:12:35 +0000430 assert(gc->gc.gc_refs > 0);
431 gc->gc.gc_refs = GC_REACHABLE;
432 (void) traverse(op,
433 (visitproc)visit_reachable,
434 (void *)young);
435 next = gc->gc.gc_next;
436 }
437 else {
Tim Peters19b74c72002-07-01 03:52:19 +0000438 /* This *may* be unreachable. To make progress,
439 * assume it is. gc isn't directly reachable from
440 * any object we've already traversed, but may be
441 * reachable from an object we haven't gotten to yet.
442 * visit_reachable will eventually move gc back into
443 * young if that's so, and we'll see it again.
444 */
445 next = gc->gc.gc_next;
Tim Peterse2d59182004-11-01 01:39:08 +0000446 gc_list_move(gc, unreachable);
Tim Peters19b74c72002-07-01 03:52:19 +0000447 gc->gc.gc_refs = GC_TENTATIVELY_UNREACHABLE;
448 }
Tim Peters19b74c72002-07-01 03:52:19 +0000449 gc = next;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000450 }
451}
452
Tim Peters86b993b2003-04-05 17:35:54 +0000453/* Return true if object has a finalization method.
454 * CAUTION: An instance of an old-style class has to be checked for a
Tim Petersf6b80452003-04-07 19:21:15 +0000455 *__del__ method, and earlier versions of this used to call PyObject_HasAttr,
456 * which in turn could call the class's __getattr__ hook (if any). That
457 * could invoke arbitrary Python code, mutating the object graph in arbitrary
458 * ways, and that was the source of some excruciatingly subtle bugs.
Tim Peters86b993b2003-04-05 17:35:54 +0000459 */
Neil Schemenauera765c122001-11-01 17:35:23 +0000460static int
461has_finalizer(PyObject *op)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000462{
Tim Peters86b993b2003-04-05 17:35:54 +0000463 if (PyInstance_Check(op)) {
Tim Peters86b993b2003-04-05 17:35:54 +0000464 assert(delstr != NULL);
Tim Petersf6b80452003-04-07 19:21:15 +0000465 return _PyInstance_Lookup(op, delstr) != NULL;
Tim Peters86b993b2003-04-05 17:35:54 +0000466 }
Phillip J. Eby2ba96612006-04-10 17:51:05 +0000467 else if (PyType_HasFeature(op->ob_type, Py_TPFLAGS_HEAPTYPE))
Tim Peters86b993b2003-04-05 17:35:54 +0000468 return op->ob_type->tp_del != NULL;
Phillip J. Eby2ba96612006-04-10 17:51:05 +0000469 else if (PyGen_CheckExact(op))
470 return PyGen_NeedsFinalizing((PyGenObject *)op);
471 else
472 return 0;
Neil Schemenauera765c122001-11-01 17:35:23 +0000473}
474
Tim Petersead8b7a2004-10-30 23:09:22 +0000475/* Move the objects in unreachable with __del__ methods into `finalizers`.
476 * Objects moved into `finalizers` have gc_refs set to GC_REACHABLE; the
477 * objects remaining in unreachable are left at GC_TENTATIVELY_UNREACHABLE.
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000478 */
Neil Schemenauera765c122001-11-01 17:35:23 +0000479static void
Tim Petersead8b7a2004-10-30 23:09:22 +0000480move_finalizers(PyGC_Head *unreachable, PyGC_Head *finalizers)
Neil Schemenauera765c122001-11-01 17:35:23 +0000481{
Tim Petersead8b7a2004-10-30 23:09:22 +0000482 PyGC_Head *gc;
483 PyGC_Head *next;
Tim Petersf6b80452003-04-07 19:21:15 +0000484
Tim Petersead8b7a2004-10-30 23:09:22 +0000485 /* March over unreachable. Move objects with finalizers into
486 * `finalizers`.
487 */
488 for (gc = unreachable->gc.gc_next; gc != unreachable; gc = next) {
Neil Schemenauer43411b52001-08-30 00:05:51 +0000489 PyObject *op = FROM_GC(gc);
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000490
Tim Petersf6ae7a42003-04-05 18:40:50 +0000491 assert(IS_TENTATIVELY_UNREACHABLE(op));
Tim Petersead8b7a2004-10-30 23:09:22 +0000492 next = gc->gc.gc_next;
Tim Petersf6ae7a42003-04-05 18:40:50 +0000493
Tim Petersf6b80452003-04-07 19:21:15 +0000494 if (has_finalizer(op)) {
Tim Peterse2d59182004-11-01 01:39:08 +0000495 gc_list_move(gc, finalizers);
Tim Petersf6b80452003-04-07 19:21:15 +0000496 gc->gc.gc_refs = GC_REACHABLE;
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000497 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000498 }
499}
500
Tim Peters19b74c72002-07-01 03:52:19 +0000501/* A traversal callback for move_finalizer_reachable. */
502static int
503visit_move(PyObject *op, PyGC_Head *tolist)
504{
505 if (PyObject_IS_GC(op)) {
Tim Petersea405632002-07-02 00:52:30 +0000506 if (IS_TENTATIVELY_UNREACHABLE(op)) {
Tim Peters19b74c72002-07-01 03:52:19 +0000507 PyGC_Head *gc = AS_GC(op);
Tim Peterse2d59182004-11-01 01:39:08 +0000508 gc_list_move(gc, tolist);
Tim Peters19b74c72002-07-01 03:52:19 +0000509 gc->gc.gc_refs = GC_REACHABLE;
510 }
511 }
512 return 0;
513}
514
515/* Move objects that are reachable from finalizers, from the unreachable set
Tim Petersf6b80452003-04-07 19:21:15 +0000516 * into finalizers set.
Tim Peters19b74c72002-07-01 03:52:19 +0000517 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000518static void
Tim Petersf6b80452003-04-07 19:21:15 +0000519move_finalizer_reachable(PyGC_Head *finalizers)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000520{
521 traverseproc traverse;
Tim Peters9e4ca102001-10-11 18:31:31 +0000522 PyGC_Head *gc = finalizers->gc.gc_next;
Tim Petersbf384c22003-04-06 00:11:39 +0000523 for (; gc != finalizers; gc = gc->gc.gc_next) {
524 /* Note that the finalizers list may grow during this. */
Christian Heimese93237d2007-12-19 02:37:44 +0000525 traverse = Py_TYPE(FROM_GC(gc))->tp_traverse;
Tim Peters88396172002-06-30 17:56:40 +0000526 (void) traverse(FROM_GC(gc),
Tim Petersbf384c22003-04-06 00:11:39 +0000527 (visitproc)visit_move,
Tim Petersf6b80452003-04-07 19:21:15 +0000528 (void *)finalizers);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000529 }
530}
531
Tim Petersead8b7a2004-10-30 23:09:22 +0000532/* Clear all weakrefs to unreachable objects, and if such a weakref has a
533 * callback, invoke it if necessary. Note that it's possible for such
534 * weakrefs to be outside the unreachable set -- indeed, those are precisely
535 * the weakrefs whose callbacks must be invoked. See gc_weakref.txt for
536 * overview & some details. Some weakrefs with callbacks may be reclaimed
537 * directly by this routine; the number reclaimed is the return value. Other
538 * weakrefs with callbacks may be moved into the `old` generation. Objects
539 * moved into `old` have gc_refs set to GC_REACHABLE; the objects remaining in
540 * unreachable are left at GC_TENTATIVELY_UNREACHABLE. When this returns,
541 * no object in `unreachable` is weakly referenced anymore.
Tim Peters403a2032003-11-20 21:21:46 +0000542 */
543static int
Tim Petersead8b7a2004-10-30 23:09:22 +0000544handle_weakrefs(PyGC_Head *unreachable, PyGC_Head *old)
Tim Peters403a2032003-11-20 21:21:46 +0000545{
Tim Petersead8b7a2004-10-30 23:09:22 +0000546 PyGC_Head *gc;
547 PyObject *op; /* generally FROM_GC(gc) */
548 PyWeakReference *wr; /* generally a cast of op */
Tim Petersead8b7a2004-10-30 23:09:22 +0000549 PyGC_Head wrcb_to_call; /* weakrefs with callbacks to call */
Tim Petersead8b7a2004-10-30 23:09:22 +0000550 PyGC_Head *next;
Tim Peters403a2032003-11-20 21:21:46 +0000551 int num_freed = 0;
552
Tim Petersead8b7a2004-10-30 23:09:22 +0000553 gc_list_init(&wrcb_to_call);
Tim Peters403a2032003-11-20 21:21:46 +0000554
Tim Petersead8b7a2004-10-30 23:09:22 +0000555 /* Clear all weakrefs to the objects in unreachable. If such a weakref
556 * also has a callback, move it into `wrcb_to_call` if the callback
Tim Peterscc2a8662004-10-31 22:12:43 +0000557 * needs to be invoked. Note that we cannot invoke any callbacks until
558 * all weakrefs to unreachable objects are cleared, lest the callback
559 * resurrect an unreachable object via a still-active weakref. We
560 * make another pass over wrcb_to_call, invoking callbacks, after this
561 * pass completes.
Tim Petersead8b7a2004-10-30 23:09:22 +0000562 */
563 for (gc = unreachable->gc.gc_next; gc != unreachable; gc = next) {
564 PyWeakReference **wrlist;
565
566 op = FROM_GC(gc);
567 assert(IS_TENTATIVELY_UNREACHABLE(op));
568 next = gc->gc.gc_next;
569
Christian Heimese93237d2007-12-19 02:37:44 +0000570 if (! PyType_SUPPORTS_WEAKREFS(Py_TYPE(op)))
Tim Petersead8b7a2004-10-30 23:09:22 +0000571 continue;
572
573 /* It supports weakrefs. Does it have any? */
574 wrlist = (PyWeakReference **)
575 PyObject_GET_WEAKREFS_LISTPTR(op);
576
577 /* `op` may have some weakrefs. March over the list, clear
578 * all the weakrefs, and move the weakrefs with callbacks
Tim Peterscc2a8662004-10-31 22:12:43 +0000579 * that must be called into wrcb_to_call.
Tim Petersead8b7a2004-10-30 23:09:22 +0000580 */
581 for (wr = *wrlist; wr != NULL; wr = *wrlist) {
582 PyGC_Head *wrasgc; /* AS_GC(wr) */
583
584 /* _PyWeakref_ClearRef clears the weakref but leaves
585 * the callback pointer intact. Obscure: it also
586 * changes *wrlist.
587 */
588 assert(wr->wr_object == op);
589 _PyWeakref_ClearRef(wr);
590 assert(wr->wr_object == Py_None);
591 if (wr->wr_callback == NULL)
592 continue; /* no callback */
593
594 /* Headache time. `op` is going away, and is weakly referenced by
595 * `wr`, which has a callback. Should the callback be invoked? If wr
596 * is also trash, no:
597 *
598 * 1. There's no need to call it. The object and the weakref are
599 * both going away, so it's legitimate to pretend the weakref is
600 * going away first. The user has to ensure a weakref outlives its
601 * referent if they want a guarantee that the wr callback will get
602 * invoked.
603 *
604 * 2. It may be catastrophic to call it. If the callback is also in
605 * cyclic trash (CT), then although the CT is unreachable from
606 * outside the current generation, CT may be reachable from the
607 * callback. Then the callback could resurrect insane objects.
608 *
609 * Since the callback is never needed and may be unsafe in this case,
Tim Peterscc2a8662004-10-31 22:12:43 +0000610 * wr is simply left in the unreachable set. Note that because we
611 * already called _PyWeakref_ClearRef(wr), its callback will never
612 * trigger.
Tim Petersead8b7a2004-10-30 23:09:22 +0000613 *
614 * OTOH, if wr isn't part of CT, we should invoke the callback: the
615 * weakref outlived the trash. Note that since wr isn't CT in this
616 * case, its callback can't be CT either -- wr acted as an external
617 * root to this generation, and therefore its callback did too. So
618 * nothing in CT is reachable from the callback either, so it's hard
619 * to imagine how calling it later could create a problem for us. wr
620 * is moved to wrcb_to_call in this case.
Tim Petersead8b7a2004-10-30 23:09:22 +0000621 */
Tim Peterscc2a8662004-10-31 22:12:43 +0000622 if (IS_TENTATIVELY_UNREACHABLE(wr))
623 continue;
624 assert(IS_REACHABLE(wr));
625
Tim Petersead8b7a2004-10-30 23:09:22 +0000626 /* Create a new reference so that wr can't go away
627 * before we can process it again.
628 */
629 Py_INCREF(wr);
630
Tim Peterscc2a8662004-10-31 22:12:43 +0000631 /* Move wr to wrcb_to_call, for the next pass. */
Tim Petersead8b7a2004-10-30 23:09:22 +0000632 wrasgc = AS_GC(wr);
Tim Peterscc2a8662004-10-31 22:12:43 +0000633 assert(wrasgc != next); /* wrasgc is reachable, but
634 next isn't, so they can't
635 be the same */
Tim Peterse2d59182004-11-01 01:39:08 +0000636 gc_list_move(wrasgc, &wrcb_to_call);
Tim Petersead8b7a2004-10-30 23:09:22 +0000637 }
638 }
639
Tim Peterscc2a8662004-10-31 22:12:43 +0000640 /* Invoke the callbacks we decided to honor. It's safe to invoke them
641 * because they can't reference unreachable objects.
Tim Petersead8b7a2004-10-30 23:09:22 +0000642 */
643 while (! gc_list_is_empty(&wrcb_to_call)) {
644 PyObject *temp;
645 PyObject *callback;
646
647 gc = wrcb_to_call.gc.gc_next;
648 op = FROM_GC(gc);
649 assert(IS_REACHABLE(op));
650 assert(PyWeakref_Check(op));
651 wr = (PyWeakReference *)op;
652 callback = wr->wr_callback;
653 assert(callback != NULL);
654
655 /* copy-paste of weakrefobject.c's handle_callback() */
Georg Brandl684fd0c2006-05-25 19:15:31 +0000656 temp = PyObject_CallFunctionObjArgs(callback, wr, NULL);
Tim Petersead8b7a2004-10-30 23:09:22 +0000657 if (temp == NULL)
658 PyErr_WriteUnraisable(callback);
659 else
660 Py_DECREF(temp);
661
662 /* Give up the reference we created in the first pass. When
663 * op's refcount hits 0 (which it may or may not do right now),
Tim Peterscc2a8662004-10-31 22:12:43 +0000664 * op's tp_dealloc will decref op->wr_callback too. Note
665 * that the refcount probably will hit 0 now, and because this
666 * weakref was reachable to begin with, gc didn't already
667 * add it to its count of freed objects. Example: a reachable
668 * weak value dict maps some key to this reachable weakref.
669 * The callback removes this key->weakref mapping from the
670 * dict, leaving no other references to the weakref (excepting
671 * ours).
Tim Petersead8b7a2004-10-30 23:09:22 +0000672 */
673 Py_DECREF(op);
674 if (wrcb_to_call.gc.gc_next == gc) {
675 /* object is still alive -- move it */
Tim Peterse2d59182004-11-01 01:39:08 +0000676 gc_list_move(gc, old);
Tim Petersead8b7a2004-10-30 23:09:22 +0000677 }
678 else
679 ++num_freed;
680 }
681
Tim Peters403a2032003-11-20 21:21:46 +0000682 return num_freed;
683}
684
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000685static void
Jeremy Hylton06257772000-08-31 15:10:24 +0000686debug_instance(char *msg, PyInstanceObject *inst)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000687{
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000688 char *cname;
Neil Schemenauera765c122001-11-01 17:35:23 +0000689 /* simple version of instance_repr */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000690 PyObject *classname = inst->in_class->cl_name;
Gregory P. Smithdd96db62008-06-09 04:58:54 +0000691 if (classname != NULL && PyString_Check(classname))
692 cname = PyString_AsString(classname);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000693 else
694 cname = "?";
Jeremy Hylton06257772000-08-31 15:10:24 +0000695 PySys_WriteStderr("gc: %.100s <%.100s instance at %p>\n",
696 msg, cname, inst);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000697}
698
699static void
Jeremy Hylton06257772000-08-31 15:10:24 +0000700debug_cycle(char *msg, PyObject *op)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000701{
702 if ((debug & DEBUG_INSTANCES) && PyInstance_Check(op)) {
Jeremy Hylton06257772000-08-31 15:10:24 +0000703 debug_instance(msg, (PyInstanceObject *)op);
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000704 }
705 else if (debug & DEBUG_OBJECTS) {
Jeremy Hylton06257772000-08-31 15:10:24 +0000706 PySys_WriteStderr("gc: %.100s <%.100s %p>\n",
Christian Heimese93237d2007-12-19 02:37:44 +0000707 msg, Py_TYPE(op)->tp_name, op);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000708 }
709}
710
Tim Petersbf384c22003-04-06 00:11:39 +0000711/* Handle uncollectable garbage (cycles with finalizers, and stuff reachable
712 * only from such cycles).
Tim Petersf6b80452003-04-07 19:21:15 +0000713 * If DEBUG_SAVEALL, all objects in finalizers are appended to the module
714 * garbage list (a Python list), else only the objects in finalizers with
715 * __del__ methods are appended to garbage. All objects in finalizers are
716 * merged into the old list regardless.
Tim Peters259272b2003-04-06 19:41:39 +0000717 * Returns 0 if all OK, <0 on error (out of memory to grow the garbage list).
718 * The finalizers list is made empty on a successful return.
Tim Petersbf384c22003-04-06 00:11:39 +0000719 */
Tim Peters259272b2003-04-06 19:41:39 +0000720static int
Tim Petersf6b80452003-04-07 19:21:15 +0000721handle_finalizers(PyGC_Head *finalizers, PyGC_Head *old)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000722{
Tim Petersf6b80452003-04-07 19:21:15 +0000723 PyGC_Head *gc = finalizers->gc.gc_next;
724
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000725 if (garbage == NULL) {
726 garbage = PyList_New(0);
Tim Petersbf384c22003-04-06 00:11:39 +0000727 if (garbage == NULL)
728 Py_FatalError("gc couldn't create gc.garbage list");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000729 }
Tim Petersf6b80452003-04-07 19:21:15 +0000730 for (; gc != finalizers; gc = gc->gc.gc_next) {
731 PyObject *op = FROM_GC(gc);
732
733 if ((debug & DEBUG_SAVEALL) || has_finalizer(op)) {
734 if (PyList_Append(garbage, op) < 0)
735 return -1;
736 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000737 }
Tim Petersf6b80452003-04-07 19:21:15 +0000738
Tim Peters259272b2003-04-06 19:41:39 +0000739 gc_list_merge(finalizers, old);
740 return 0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000741}
742
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000743/* Break reference cycles by clearing the containers involved. This is
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000744 * tricky business as the lists can be changing and we don't know which
Tim Peters19b74c72002-07-01 03:52:19 +0000745 * objects may be freed. It is possible I screwed something up here.
746 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000747static void
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000748delete_garbage(PyGC_Head *collectable, PyGC_Head *old)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000749{
750 inquiry clear;
751
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000752 while (!gc_list_is_empty(collectable)) {
753 PyGC_Head *gc = collectable->gc.gc_next;
Neil Schemenauer43411b52001-08-30 00:05:51 +0000754 PyObject *op = FROM_GC(gc);
Tim Peters88396172002-06-30 17:56:40 +0000755
Tim Peters19b74c72002-07-01 03:52:19 +0000756 assert(IS_TENTATIVELY_UNREACHABLE(op));
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000757 if (debug & DEBUG_SAVEALL) {
758 PyList_Append(garbage, op);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000759 }
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000760 else {
Christian Heimese93237d2007-12-19 02:37:44 +0000761 if ((clear = Py_TYPE(op)->tp_clear) != NULL) {
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000762 Py_INCREF(op);
Jeremy Hylton8a135182002-06-06 23:23:55 +0000763 clear(op);
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000764 Py_DECREF(op);
765 }
766 }
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000767 if (collectable->gc.gc_next == gc) {
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000768 /* object is still alive, move it, it may die later */
Tim Peterse2d59182004-11-01 01:39:08 +0000769 gc_list_move(gc, old);
Tim Peters19b74c72002-07-01 03:52:19 +0000770 gc->gc.gc_refs = GC_REACHABLE;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000771 }
772 }
773}
774
/* Clear all free lists.
 *
 * All free lists are cleared during the collection of the highest
 * generation.  Allocated items in the free list may keep a pymalloc arena
 * occupied, so clearing the free lists may give back memory to the OS
 * earlier.  The return value of each per-type function is deliberately
 * discarded.
 */
static void
clear_freelists(void)
{
    /* callable-related free lists */
    (void)PyMethod_ClearFreeList();
    (void)PyFrame_ClearFreeList();
    (void)PyCFunction_ClearFreeList();

    /* container and string free lists */
    (void)PyTuple_ClearFreeList();
#ifdef Py_USING_UNICODE
    (void)PyUnicode_ClearFreeList();
#endif

    /* numeric free lists */
    (void)PyInt_ClearFreeList();
    (void)PyFloat_ClearFreeList();
}
793
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000794static double
795get_time(void)
796{
797 double result = 0;
798 if (tmod != NULL) {
799 PyObject *f = PyObject_CallMethod(tmod, "time", NULL);
800 if (f == NULL) {
801 PyErr_Clear();
802 }
803 else {
804 if (PyFloat_Check(f))
805 result = PyFloat_AsDouble(f);
806 Py_DECREF(f);
807 }
808 }
809 return result;
810}
811
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000812/* This is the main function. Read this to understand how the
813 * collection process works. */
Neal Norwitz7b216c52006-03-04 20:01:53 +0000814static Py_ssize_t
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000815collect(int generation)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000816{
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000817 int i;
Neal Norwitz7b216c52006-03-04 20:01:53 +0000818 Py_ssize_t m = 0; /* # objects collected */
819 Py_ssize_t n = 0; /* # unreachable objects that couldn't be collected */
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000820 PyGC_Head *young; /* the generation we are examining */
821 PyGC_Head *old; /* next older generation */
Tim Peters403a2032003-11-20 21:21:46 +0000822 PyGC_Head unreachable; /* non-problematic unreachable trash */
823 PyGC_Head finalizers; /* objects with, & reachable from, __del__ */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000824 PyGC_Head *gc;
Skip Montanaroc34b9312006-04-21 01:33:40 +0000825 double t1 = 0.0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000826
Tim Peters93ad66d2003-04-05 17:15:44 +0000827 if (delstr == NULL) {
Gregory P. Smithdd96db62008-06-09 04:58:54 +0000828 delstr = PyString_InternFromString("__del__");
Tim Peters93ad66d2003-04-05 17:15:44 +0000829 if (delstr == NULL)
830 Py_FatalError("gc couldn't allocate \"__del__\"");
831 }
832
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000833 if (debug & DEBUG_STATS) {
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000834 t1 = get_time();
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000835 PySys_WriteStderr("gc: collecting generation %d...\n",
836 generation);
837 PySys_WriteStderr("gc: objects in each generation:");
Tim Peters62e97f02006-03-28 21:44:32 +0000838 for (i = 0; i < NUM_GENERATIONS; i++)
839 PySys_WriteStderr(" %" PY_FORMAT_SIZE_T "d",
840 gc_list_size(GEN_HEAD(i)));
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000841 PySys_WriteStderr("\n");
842 }
843
844 /* update collection and allocation counters */
845 if (generation+1 < NUM_GENERATIONS)
846 generations[generation+1].count += 1;
847 for (i = 0; i <= generation; i++)
Neil Schemenauerc9051642002-06-28 19:16:04 +0000848 generations[i].count = 0;
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000849
850 /* merge younger generations with one we are currently collecting */
851 for (i = 0; i < generation; i++) {
852 gc_list_merge(GEN_HEAD(i), GEN_HEAD(generation));
853 }
854
855 /* handy references */
856 young = GEN_HEAD(generation);
Tim Peters19b74c72002-07-01 03:52:19 +0000857 if (generation < NUM_GENERATIONS-1)
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000858 old = GEN_HEAD(generation+1);
Tim Peters19b74c72002-07-01 03:52:19 +0000859 else
860 old = young;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000861
862 /* Using ob_refcnt and gc_refs, calculate which objects in the
Tim Petersead8b7a2004-10-30 23:09:22 +0000863 * container set are reachable from outside the set (i.e., have a
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000864 * refcount greater than 0 when all the references within the
Tim Petersead8b7a2004-10-30 23:09:22 +0000865 * set are taken into account).
Tim Peters19b74c72002-07-01 03:52:19 +0000866 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000867 update_refs(young);
868 subtract_refs(young);
869
Tim Peters19b74c72002-07-01 03:52:19 +0000870 /* Leave everything reachable from outside young in young, and move
871 * everything else (in young) to unreachable.
872 * NOTE: This used to move the reachable objects into a reachable
873 * set instead. But most things usually turn out to be reachable,
874 * so it's more efficient to move the unreachable things.
875 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000876 gc_list_init(&unreachable);
Tim Peters19b74c72002-07-01 03:52:19 +0000877 move_unreachable(young, &unreachable);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000878
Tim Peters19b74c72002-07-01 03:52:19 +0000879 /* Move reachable objects to next generation. */
Antoine Pitrou4c5ecb72009-01-09 21:40:55 +0000880 if (young != old) {
881 if (generation == NUM_GENERATIONS - 2) {
882 long_lived_pending += gc_list_size(young);
883 }
Tim Peters19b74c72002-07-01 03:52:19 +0000884 gc_list_merge(young, old);
Antoine Pitrou4c5ecb72009-01-09 21:40:55 +0000885 }
886 else {
887 long_lived_pending = 0;
888 long_lived_total = gc_list_size(young);
889 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000890
Tim Peters19b74c72002-07-01 03:52:19 +0000891 /* All objects in unreachable are trash, but objects reachable from
892 * finalizers can't safely be deleted. Python programmers should take
893 * care not to create such things. For Python, finalizers means
Tim Peters403a2032003-11-20 21:21:46 +0000894 * instance objects with __del__ methods. Weakrefs with callbacks
Tim Petersead8b7a2004-10-30 23:09:22 +0000895 * can also call arbitrary Python code but they will be dealt with by
896 * handle_weakrefs().
Tim Petersf6b80452003-04-07 19:21:15 +0000897 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000898 gc_list_init(&finalizers);
Tim Petersead8b7a2004-10-30 23:09:22 +0000899 move_finalizers(&unreachable, &finalizers);
Tim Petersbf384c22003-04-06 00:11:39 +0000900 /* finalizers contains the unreachable objects with a finalizer;
Tim Peters403a2032003-11-20 21:21:46 +0000901 * unreachable objects reachable *from* those are also uncollectable,
902 * and we move those into the finalizers list too.
Tim Petersbf384c22003-04-06 00:11:39 +0000903 */
Tim Petersf6b80452003-04-07 19:21:15 +0000904 move_finalizer_reachable(&finalizers);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000905
906 /* Collect statistics on collectable objects found and print
Tim Peters403a2032003-11-20 21:21:46 +0000907 * debugging information.
908 */
Tim Petersf6b80452003-04-07 19:21:15 +0000909 for (gc = unreachable.gc.gc_next; gc != &unreachable;
Tim Peters9e4ca102001-10-11 18:31:31 +0000910 gc = gc->gc.gc_next) {
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000911 m++;
Jeremy Hylton06257772000-08-31 15:10:24 +0000912 if (debug & DEBUG_COLLECTABLE) {
Neil Schemenauer43411b52001-08-30 00:05:51 +0000913 debug_cycle("collectable", FROM_GC(gc));
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000914 }
915 }
Tim Petersead8b7a2004-10-30 23:09:22 +0000916
917 /* Clear weakrefs and invoke callbacks as necessary. */
918 m += handle_weakrefs(&unreachable, old);
919
Tim Petersfb2ab4d2003-04-07 22:41:24 +0000920 /* Call tp_clear on objects in the unreachable set. This will cause
921 * the reference cycles to be broken. It may also cause some objects
922 * in finalizers to be freed.
923 */
Tim Petersf6b80452003-04-07 19:21:15 +0000924 delete_garbage(&unreachable, old);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000925
926 /* Collect statistics on uncollectable objects found and print
927 * debugging information. */
Tim Peters50c61d52003-04-06 01:50:50 +0000928 for (gc = finalizers.gc.gc_next;
Tim Petersbf384c22003-04-06 00:11:39 +0000929 gc != &finalizers;
930 gc = gc->gc.gc_next) {
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000931 n++;
Tim Petersbf384c22003-04-06 00:11:39 +0000932 if (debug & DEBUG_UNCOLLECTABLE)
Neil Schemenauer43411b52001-08-30 00:05:51 +0000933 debug_cycle("uncollectable", FROM_GC(gc));
Tim Petersbf384c22003-04-06 00:11:39 +0000934 }
Jeremy Hylton06257772000-08-31 15:10:24 +0000935 if (debug & DEBUG_STATS) {
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000936 double t2 = get_time();
Tim Peters62e97f02006-03-28 21:44:32 +0000937 if (m == 0 && n == 0)
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000938 PySys_WriteStderr("gc: done");
Tim Peters62e97f02006-03-28 21:44:32 +0000939 else
Neal Norwitze22373d2006-03-06 23:31:56 +0000940 PySys_WriteStderr(
Tim Peters62e97f02006-03-28 21:44:32 +0000941 "gc: done, "
942 "%" PY_FORMAT_SIZE_T "d unreachable, "
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000943 "%" PY_FORMAT_SIZE_T "d uncollectable",
Neal Norwitze22373d2006-03-06 23:31:56 +0000944 n+m, n);
Antoine Pitrou73c0e652008-12-17 22:46:54 +0000945 if (t1 && t2) {
946 PySys_WriteStderr(", %.4fs elapsed", t2-t1);
947 }
948 PySys_WriteStderr(".\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000949 }
950
951 /* Append instances in the uncollectable set to a Python
952 * reachable list of garbage. The programmer has to deal with
Tim Petersbf384c22003-04-06 00:11:39 +0000953 * this if they insist on creating this type of structure.
954 */
Tim Petersf6b80452003-04-07 19:21:15 +0000955 (void)handle_finalizers(&finalizers, old);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000956
Christian Heimes3b718a72008-02-14 12:47:33 +0000957 /* Clear free list only during the collection of the higest
958 * generation */
959 if (generation == NUM_GENERATIONS-1) {
960 clear_freelists();
961 }
962
Jeremy Hyltonb709df32000-09-01 02:47:25 +0000963 if (PyErr_Occurred()) {
Tim Petersf6b80452003-04-07 19:21:15 +0000964 if (gc_str == NULL)
Gregory P. Smithdd96db62008-06-09 04:58:54 +0000965 gc_str = PyString_FromString("garbage collection");
Jeremy Hyltonb709df32000-09-01 02:47:25 +0000966 PyErr_WriteUnraisable(gc_str);
967 Py_FatalError("unexpected exception during garbage collection");
968 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000969 return n+m;
970}
971
Neal Norwitz7b216c52006-03-04 20:01:53 +0000972static Py_ssize_t
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000973collect_generations(void)
974{
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000975 int i;
Neal Norwitz7b216c52006-03-04 20:01:53 +0000976 Py_ssize_t n = 0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000977
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000978 /* Find the oldest generation (higest numbered) where the count
979 * exceeds the threshold. Objects in the that generation and
980 * generations younger than it will be collected. */
981 for (i = NUM_GENERATIONS-1; i >= 0; i--) {
982 if (generations[i].count > generations[i].threshold) {
Antoine Pitrou4c5ecb72009-01-09 21:40:55 +0000983 /* Avoid quadratic performance degradation in number
984 of tracked objects. See comments at the beginning
985 of this file, and issue #4074.
986 */
987 if (i == NUM_GENERATIONS - 1
988 && long_lived_pending < long_lived_total / 4)
989 continue;
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000990 n = collect(i);
991 break;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000992 }
993 }
994 return n;
995}
996
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000997PyDoc_STRVAR(gc_enable__doc__,
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000998"enable() -> None\n"
999"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001000"Enable automatic garbage collection.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001001
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001002static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001003gc_enable(PyObject *self, PyObject *noargs)
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001004{
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001005 enabled = 1;
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001006 Py_INCREF(Py_None);
1007 return Py_None;
1008}
1009
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001010PyDoc_STRVAR(gc_disable__doc__,
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001011"disable() -> None\n"
1012"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001013"Disable automatic garbage collection.\n");
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001014
1015static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001016gc_disable(PyObject *self, PyObject *noargs)
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001017{
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001018 enabled = 0;
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001019 Py_INCREF(Py_None);
1020 return Py_None;
1021}
1022
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001023PyDoc_STRVAR(gc_isenabled__doc__,
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001024"isenabled() -> status\n"
1025"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001026"Returns true if automatic garbage collection is enabled.\n");
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001027
1028static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001029gc_isenabled(PyObject *self, PyObject *noargs)
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001030{
Raymond Hettinger674d56b2004-01-04 04:00:13 +00001031 return PyBool_FromLong((long)enabled);
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001032}
1033
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001034PyDoc_STRVAR(gc_collect__doc__,
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001035"collect([generation]) -> n\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001036"\n"
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001037"With no arguments, run a full collection. The optional argument\n"
1038"may be an integer specifying which generation to collect. A ValueError\n"
1039"is raised if the generation number is invalid.\n\n"
1040"The number of unreachable objects is returned.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001041
1042static PyObject *
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001043gc_collect(PyObject *self, PyObject *args, PyObject *kws)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001044{
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001045 static char *keywords[] = {"generation", NULL};
1046 int genarg = NUM_GENERATIONS - 1;
Neal Norwitz7b216c52006-03-04 20:01:53 +00001047 Py_ssize_t n;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001048
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001049 if (!PyArg_ParseTupleAndKeywords(args, kws, "|i", keywords, &genarg))
1050 return NULL;
1051
1052 else if (genarg < 0 || genarg >= NUM_GENERATIONS) {
1053 PyErr_SetString(PyExc_ValueError, "invalid generation");
1054 return NULL;
1055 }
1056
Tim Peters50c61d52003-04-06 01:50:50 +00001057 if (collecting)
Neil Schemenauere8c40cb2001-10-31 23:09:35 +00001058 n = 0; /* already collecting, don't do anything */
Neil Schemenauere8c40cb2001-10-31 23:09:35 +00001059 else {
1060 collecting = 1;
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001061 n = collect(genarg);
Neil Schemenauere8c40cb2001-10-31 23:09:35 +00001062 collecting = 0;
1063 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001064
Neal Norwitz7b216c52006-03-04 20:01:53 +00001065 return PyInt_FromSsize_t(n);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001066}
1067
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001068PyDoc_STRVAR(gc_set_debug__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001069"set_debug(flags) -> None\n"
1070"\n"
1071"Set the garbage collection debugging flags. Debugging information is\n"
1072"written to sys.stderr.\n"
1073"\n"
1074"flags is an integer and can have the following bits turned on:\n"
1075"\n"
1076" DEBUG_STATS - Print statistics during collection.\n"
1077" DEBUG_COLLECTABLE - Print collectable objects found.\n"
1078" DEBUG_UNCOLLECTABLE - Print unreachable but uncollectable objects found.\n"
1079" DEBUG_INSTANCES - Print instance objects.\n"
1080" DEBUG_OBJECTS - Print objects other than instances.\n"
Neil Schemenauer544de1e2000-09-22 15:22:38 +00001081" DEBUG_SAVEALL - Save objects to gc.garbage rather than freeing them.\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001082" DEBUG_LEAK - Debug leaking programs (everything but STATS).\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001083
1084static PyObject *
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001085gc_set_debug(PyObject *self, PyObject *args)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001086{
Neil Schemenauer7760cff2000-09-22 22:35:36 +00001087 if (!PyArg_ParseTuple(args, "i:set_debug", &debug))
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001088 return NULL;
1089
1090 Py_INCREF(Py_None);
1091 return Py_None;
1092}
1093
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001094PyDoc_STRVAR(gc_get_debug__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001095"get_debug() -> flags\n"
1096"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001097"Get the garbage collection debugging flags.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001098
1099static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001100gc_get_debug(PyObject *self, PyObject *noargs)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001101{
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001102 return Py_BuildValue("i", debug);
1103}
1104
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001105PyDoc_STRVAR(gc_set_thresh__doc__,
Neal Norwitz2a47c0f2002-01-29 00:53:41 +00001106"set_threshold(threshold0, [threshold1, threshold2]) -> None\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001107"\n"
1108"Sets the collection thresholds. Setting threshold0 to zero disables\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001109"collection.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001110
1111static PyObject *
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001112gc_set_thresh(PyObject *self, PyObject *args)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001113{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001114 int i;
1115 if (!PyArg_ParseTuple(args, "i|ii:set_threshold",
1116 &generations[0].threshold,
1117 &generations[1].threshold,
1118 &generations[2].threshold))
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001119 return NULL;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001120 for (i = 2; i < NUM_GENERATIONS; i++) {
1121 /* generations higher than 2 get the same threshold */
1122 generations[i].threshold = generations[2].threshold;
1123 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001124
1125 Py_INCREF(Py_None);
1126 return Py_None;
1127}
1128
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001129PyDoc_STRVAR(gc_get_thresh__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001130"get_threshold() -> (threshold0, threshold1, threshold2)\n"
1131"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001132"Return the current collection thresholds\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001133
1134static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001135gc_get_thresh(PyObject *self, PyObject *noargs)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001136{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001137 return Py_BuildValue("(iii)",
1138 generations[0].threshold,
1139 generations[1].threshold,
1140 generations[2].threshold);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001141}
1142
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001143PyDoc_STRVAR(gc_get_count__doc__,
1144"get_count() -> (count0, count1, count2)\n"
1145"\n"
1146"Return the current collection counts\n");
1147
1148static PyObject *
1149gc_get_count(PyObject *self, PyObject *noargs)
1150{
1151 return Py_BuildValue("(iii)",
1152 generations[0].count,
1153 generations[1].count,
1154 generations[2].count);
1155}
1156
Neil Schemenauer48c70342001-08-09 15:38:31 +00001157static int
Martin v. Löwis560da622001-11-24 09:24:51 +00001158referrersvisit(PyObject* obj, PyObject *objs)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001159{
Neal Norwitzffb0d902006-04-06 08:07:25 +00001160 Py_ssize_t i;
Martin v. Löwisc8fe77b2001-11-29 18:08:31 +00001161 for (i = 0; i < PyTuple_GET_SIZE(objs); i++)
1162 if (PyTuple_GET_ITEM(objs, i) == obj)
1163 return 1;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001164 return 0;
1165}
1166
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001167static int
Martin v. Löwis560da622001-11-24 09:24:51 +00001168gc_referrers_for(PyObject *objs, PyGC_Head *list, PyObject *resultlist)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001169{
1170 PyGC_Head *gc;
1171 PyObject *obj;
1172 traverseproc traverse;
Tim Peters9e4ca102001-10-11 18:31:31 +00001173 for (gc = list->gc.gc_next; gc != list; gc = gc->gc.gc_next) {
Neil Schemenauer43411b52001-08-30 00:05:51 +00001174 obj = FROM_GC(gc);
Christian Heimese93237d2007-12-19 02:37:44 +00001175 traverse = Py_TYPE(obj)->tp_traverse;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001176 if (obj == objs || obj == resultlist)
1177 continue;
Martin v. Löwis560da622001-11-24 09:24:51 +00001178 if (traverse(obj, (visitproc)referrersvisit, objs)) {
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001179 if (PyList_Append(resultlist, obj) < 0)
1180 return 0; /* error */
Neil Schemenauer48c70342001-08-09 15:38:31 +00001181 }
1182 }
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001183 return 1; /* no error */
Neil Schemenauer48c70342001-08-09 15:38:31 +00001184}
1185
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001186PyDoc_STRVAR(gc_get_referrers__doc__,
Martin v. Löwis560da622001-11-24 09:24:51 +00001187"get_referrers(*objs) -> list\n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001188Return the list of objects that directly refer to any of objs.");
Neil Schemenauer48c70342001-08-09 15:38:31 +00001189
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001190static PyObject *
Martin v. Löwis560da622001-11-24 09:24:51 +00001191gc_get_referrers(PyObject *self, PyObject *args)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001192{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001193 int i;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001194 PyObject *result = PyList_New(0);
Georg Brandl5c170fd2006-03-17 19:03:25 +00001195 if (!result) return NULL;
1196
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001197 for (i = 0; i < NUM_GENERATIONS; i++) {
1198 if (!(gc_referrers_for(args, GEN_HEAD(i), result))) {
1199 Py_DECREF(result);
1200 return NULL;
1201 }
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001202 }
Neil Schemenauer48c70342001-08-09 15:38:31 +00001203 return result;
1204}
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001205
Tim Peters0f81ab62003-04-08 16:39:48 +00001206/* Append obj to list; return true if error (out of memory), false if OK. */
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001207static int
Tim Peters730f5532003-04-08 17:17:17 +00001208referentsvisit(PyObject *obj, PyObject *list)
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001209{
Tim Peters0f81ab62003-04-08 16:39:48 +00001210 return PyList_Append(list, obj) < 0;
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001211}
1212
Tim Peters730f5532003-04-08 17:17:17 +00001213PyDoc_STRVAR(gc_get_referents__doc__,
1214"get_referents(*objs) -> list\n\
Jeremy Hylton059b0942003-04-03 16:29:13 +00001215Return the list of objects that are directly referred to by objs.");
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001216
1217static PyObject *
Tim Peters730f5532003-04-08 17:17:17 +00001218gc_get_referents(PyObject *self, PyObject *args)
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001219{
Neal Norwitzffb0d902006-04-06 08:07:25 +00001220 Py_ssize_t i;
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001221 PyObject *result = PyList_New(0);
Tim Peters0f81ab62003-04-08 16:39:48 +00001222
1223 if (result == NULL)
1224 return NULL;
1225
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001226 for (i = 0; i < PyTuple_GET_SIZE(args); i++) {
Tim Peters0f81ab62003-04-08 16:39:48 +00001227 traverseproc traverse;
Tim Peters93ad66d2003-04-05 17:15:44 +00001228 PyObject *obj = PyTuple_GET_ITEM(args, i);
Tim Peters0f81ab62003-04-08 16:39:48 +00001229
1230 if (! PyObject_IS_GC(obj))
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001231 continue;
Christian Heimese93237d2007-12-19 02:37:44 +00001232 traverse = Py_TYPE(obj)->tp_traverse;
Tim Peters0f81ab62003-04-08 16:39:48 +00001233 if (! traverse)
1234 continue;
Tim Peters730f5532003-04-08 17:17:17 +00001235 if (traverse(obj, (visitproc)referentsvisit, result)) {
Tim Peters0f81ab62003-04-08 16:39:48 +00001236 Py_DECREF(result);
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001237 return NULL;
Tim Peters0f81ab62003-04-08 16:39:48 +00001238 }
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001239 }
1240 return result;
1241}
1242
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001243PyDoc_STRVAR(gc_get_objects__doc__,
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001244"get_objects() -> [...]\n"
1245"\n"
1246"Return a list of objects tracked by the collector (excluding the list\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001247"returned).\n");
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001248
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001249static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001250gc_get_objects(PyObject *self, PyObject *noargs)
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001251{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001252 int i;
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001253 PyObject* result;
1254
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001255 result = PyList_New(0);
Tim Peters50c61d52003-04-06 01:50:50 +00001256 if (result == NULL)
Martin v. Löwisf8a6f242001-12-02 18:31:02 +00001257 return NULL;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001258 for (i = 0; i < NUM_GENERATIONS; i++) {
1259 if (append_objects(result, GEN_HEAD(i))) {
1260 Py_DECREF(result);
1261 return NULL;
1262 }
Martin v. Löwis155aad12001-12-02 12:21:34 +00001263 }
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001264 return result;
1265}
1266
1267
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001268PyDoc_STRVAR(gc__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001269"This module provides access to the garbage collector for reference cycles.\n"
1270"\n"
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001271"enable() -- Enable automatic garbage collection.\n"
1272"disable() -- Disable automatic garbage collection.\n"
1273"isenabled() -- Returns true if automatic collection is enabled.\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001274"collect() -- Do a full collection right now.\n"
Barry Warsawe5ec6132006-10-09 19:43:24 +00001275"get_count() -- Return the current collection counts.\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001276"set_debug() -- Set debugging flags.\n"
1277"get_debug() -- Get debugging flags.\n"
1278"set_threshold() -- Set the collection thresholds.\n"
1279"get_threshold() -- Return the current the collection thresholds.\n"
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001280"get_objects() -- Return a list of all objects tracked by the collector.\n"
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001281"get_referrers() -- Return the list of objects that refer to an object.\n"
Tim Peters730f5532003-04-08 17:17:17 +00001282"get_referents() -- Return the list of objects that an object refers to.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001283
1284static PyMethodDef GcMethods[] = {
Tim Peters50c61d52003-04-06 01:50:50 +00001285 {"enable", gc_enable, METH_NOARGS, gc_enable__doc__},
1286 {"disable", gc_disable, METH_NOARGS, gc_disable__doc__},
1287 {"isenabled", gc_isenabled, METH_NOARGS, gc_isenabled__doc__},
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001288 {"set_debug", gc_set_debug, METH_VARARGS, gc_set_debug__doc__},
Tim Peters50c61d52003-04-06 01:50:50 +00001289 {"get_debug", gc_get_debug, METH_NOARGS, gc_get_debug__doc__},
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001290 {"get_count", gc_get_count, METH_NOARGS, gc_get_count__doc__},
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001291 {"set_threshold", gc_set_thresh, METH_VARARGS, gc_set_thresh__doc__},
Tim Peters50c61d52003-04-06 01:50:50 +00001292 {"get_threshold", gc_get_thresh, METH_NOARGS, gc_get_thresh__doc__},
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001293 {"collect", (PyCFunction)gc_collect,
1294 METH_VARARGS | METH_KEYWORDS, gc_collect__doc__},
Tim Peters50c61d52003-04-06 01:50:50 +00001295 {"get_objects", gc_get_objects,METH_NOARGS, gc_get_objects__doc__},
Martin v. Löwis560da622001-11-24 09:24:51 +00001296 {"get_referrers", gc_get_referrers, METH_VARARGS,
1297 gc_get_referrers__doc__},
Tim Peters730f5532003-04-08 17:17:17 +00001298 {"get_referents", gc_get_referents, METH_VARARGS,
1299 gc_get_referents__doc__},
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001300 {NULL, NULL} /* Sentinel */
1301};
1302
Jason Tishler6bc06ec2003-09-04 11:59:50 +00001303PyMODINIT_FUNC
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001304initgc(void)
1305{
1306 PyObject *m;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001307
1308 m = Py_InitModule4("gc",
1309 GcMethods,
1310 gc__doc__,
1311 NULL,
1312 PYTHON_API_VERSION);
Neal Norwitz1ac754f2006-01-19 06:09:39 +00001313 if (m == NULL)
1314 return;
Tim Peters11558872003-04-06 23:30:52 +00001315
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001316 if (garbage == NULL) {
1317 garbage = PyList_New(0);
Tim Peters11558872003-04-06 23:30:52 +00001318 if (garbage == NULL)
1319 return;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001320 }
Neil Schemenauer3b1cbf92005-06-18 17:37:06 +00001321 Py_INCREF(garbage);
Tim Peters11558872003-04-06 23:30:52 +00001322 if (PyModule_AddObject(m, "garbage", garbage) < 0)
1323 return;
Neal Norwitz57a03612006-04-26 05:34:03 +00001324
1325 /* Importing can't be done in collect() because collect()
1326 * can be called via PyGC_Collect() in Py_Finalize().
1327 * This wouldn't be a problem, except that <initialized> is
1328 * reset to 0 before calling collect which trips up
1329 * the import and triggers an assertion.
1330 */
1331 if (tmod == NULL) {
Christian Heimes000a0742008-01-03 22:16:32 +00001332 tmod = PyImport_ImportModuleNoBlock("time");
Neal Norwitz57a03612006-04-26 05:34:03 +00001333 if (tmod == NULL)
1334 PyErr_Clear();
1335 }
1336
Tim Peters11558872003-04-06 23:30:52 +00001337#define ADD_INT(NAME) if (PyModule_AddIntConstant(m, #NAME, NAME) < 0) return
1338 ADD_INT(DEBUG_STATS);
1339 ADD_INT(DEBUG_COLLECTABLE);
1340 ADD_INT(DEBUG_UNCOLLECTABLE);
1341 ADD_INT(DEBUG_INSTANCES);
1342 ADD_INT(DEBUG_OBJECTS);
1343 ADD_INT(DEBUG_SAVEALL);
1344 ADD_INT(DEBUG_LEAK);
1345#undef ADD_INT
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001346}
1347
Guido van Rossume13ddc92003-04-17 17:29:22 +00001348/* API to invoke gc.collect() from C */
Neal Norwitz7b216c52006-03-04 20:01:53 +00001349Py_ssize_t
Guido van Rossume13ddc92003-04-17 17:29:22 +00001350PyGC_Collect(void)
1351{
Neal Norwitz7b216c52006-03-04 20:01:53 +00001352 Py_ssize_t n;
Guido van Rossume13ddc92003-04-17 17:29:22 +00001353
1354 if (collecting)
1355 n = 0; /* already collecting, don't do anything */
1356 else {
1357 collecting = 1;
1358 n = collect(NUM_GENERATIONS - 1);
1359 collecting = 0;
1360 }
1361
1362 return n;
1363}
1364
Neil Schemenauer43411b52001-08-30 00:05:51 +00001365/* for debugging */
Guido van Rossume13ddc92003-04-17 17:29:22 +00001366void
1367_PyGC_Dump(PyGC_Head *g)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001368{
1369 _PyObject_Dump(FROM_GC(g));
1370}
1371
Neil Schemenauer43411b52001-08-30 00:05:51 +00001372/* extension modules might be compiled with GC support so these
1373 functions must always be available */
1374
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001375#undef PyObject_GC_Track
1376#undef PyObject_GC_UnTrack
1377#undef PyObject_GC_Del
1378#undef _PyObject_GC_Malloc
1379
/* Function form of the _PyObject_GC_TRACK macro. */
void
PyObject_GC_Track(void *op)
{
    _PyObject_GC_TRACK(op);
}
1385
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001386/* for binary compatibility with 2.2 */
Neil Schemenauer43411b52001-08-30 00:05:51 +00001387void
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001388_PyObject_GC_Track(PyObject *op)
1389{
1390 PyObject_GC_Track(op);
1391}
1392
/* Stop tracking op if it is currently tracked; otherwise do nothing. */
void
PyObject_GC_UnTrack(void *op)
{
    /* Obscure: the Py_TRASHCAN mechanism requires that this function can
     * be called twice on the same object, hence the tracked check.
     */
    if (!IS_TRACKED(op))
        return;
    _PyObject_GC_UNTRACK(op);
}
1402
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001403/* for binary compatibility with 2.2 */
1404void
1405_PyObject_GC_UnTrack(PyObject *op)
1406{
1407 PyObject_GC_UnTrack(op);
1408}
1409
Neil Schemenauer43411b52001-08-30 00:05:51 +00001410PyObject *
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001411_PyObject_GC_Malloc(size_t basicsize)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001412{
1413 PyObject *op;
Neal Norwitze7d8be82008-07-31 17:17:14 +00001414 PyGC_Head *g;
1415 if (basicsize > PY_SSIZE_T_MAX - sizeof(PyGC_Head))
1416 return PyErr_NoMemory();
1417 g = (PyGC_Head *)PyObject_MALLOC(
Anthony Baxter64182fe2006-04-11 12:14:09 +00001418 sizeof(PyGC_Head) + basicsize);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001419 if (g == NULL)
Jeremy Hylton8a135182002-06-06 23:23:55 +00001420 return PyErr_NoMemory();
Tim Petersea405632002-07-02 00:52:30 +00001421 g->gc.gc_refs = GC_UNTRACKED;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001422 generations[0].count++; /* number of allocated GC objects */
1423 if (generations[0].count > generations[0].threshold &&
Neil Schemenauer43411b52001-08-30 00:05:51 +00001424 enabled &&
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001425 generations[0].threshold &&
Neil Schemenauer43411b52001-08-30 00:05:51 +00001426 !collecting &&
1427 !PyErr_Occurred()) {
1428 collecting = 1;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001429 collect_generations();
Neil Schemenauer43411b52001-08-30 00:05:51 +00001430 collecting = 0;
1431 }
1432 op = FROM_GC(g);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001433 return op;
1434}
1435
1436PyObject *
1437_PyObject_GC_New(PyTypeObject *tp)
1438{
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001439 PyObject *op = _PyObject_GC_Malloc(_PyObject_SIZE(tp));
Tim Petersfa8efab2002-04-28 01:57:25 +00001440 if (op != NULL)
1441 op = PyObject_INIT(op, tp);
1442 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001443}
1444
1445PyVarObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +00001446_PyObject_GC_NewVar(PyTypeObject *tp, Py_ssize_t nitems)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001447{
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001448 const size_t size = _PyObject_VAR_SIZE(tp, nitems);
1449 PyVarObject *op = (PyVarObject *) _PyObject_GC_Malloc(size);
Tim Petersfa8efab2002-04-28 01:57:25 +00001450 if (op != NULL)
1451 op = PyObject_INIT_VAR(op, tp, nitems);
1452 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001453}
1454
1455PyVarObject *
Martin v. Löwis41290682006-02-16 14:56:14 +00001456_PyObject_GC_Resize(PyVarObject *op, Py_ssize_t nitems)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001457{
Christian Heimese93237d2007-12-19 02:37:44 +00001458 const size_t basicsize = _PyObject_VAR_SIZE(Py_TYPE(op), nitems);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001459 PyGC_Head *g = AS_GC(op);
Neal Norwitze7d8be82008-07-31 17:17:14 +00001460 if (basicsize > PY_SSIZE_T_MAX - sizeof(PyGC_Head))
1461 return (PyVarObject *)PyErr_NoMemory();
Anthony Baxter64182fe2006-04-11 12:14:09 +00001462 g = (PyGC_Head *)PyObject_REALLOC(g, sizeof(PyGC_Head) + basicsize);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001463 if (g == NULL)
1464 return (PyVarObject *)PyErr_NoMemory();
1465 op = (PyVarObject *) FROM_GC(g);
Christian Heimese93237d2007-12-19 02:37:44 +00001466 Py_SIZE(op) = nitems;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001467 return op;
1468}
1469
1470void
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001471PyObject_GC_Del(void *op)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001472{
Neil Schemenauer43411b52001-08-30 00:05:51 +00001473 PyGC_Head *g = AS_GC(op);
Neil Schemenauera2b11ec2002-05-21 15:53:24 +00001474 if (IS_TRACKED(op))
Neil Schemenauer43411b52001-08-30 00:05:51 +00001475 gc_list_remove(g);
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001476 if (generations[0].count > 0) {
1477 generations[0].count--;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001478 }
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001479 PyObject_FREE(g);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001480}
1481
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001482/* for binary compatibility with 2.2 */
1483#undef _PyObject_GC_Del
1484void
1485_PyObject_GC_Del(PyObject *op)
1486{
1487 PyObject_GC_Del(op);
1488}