blob: 2474721eeb6379285ac25555a88b5198ccb6db1c [file] [log] [blame]
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001/*
Tim Peters88396172002-06-30 17:56:40 +00002
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00003 Reference Cycle Garbage Collection
4 ==================================
5
Neil Schemenauerb2c2c9e2000-10-04 16:34:09 +00006 Neil Schemenauer <nas@arctrix.com>
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00007
8 Based on a post on the python-dev list. Ideas from Guido van Rossum,
9 Eric Tiedemann, and various others.
10
Neil Schemenauer43411b52001-08-30 00:05:51 +000011 http://www.arctrix.com/nas/python/gc/
Neil Schemenauera7024e92008-07-15 19:24:01 +000012
13 The following mailing list threads provide a historical perspective on
14 the design of this module. Note that a fair amount of refinement has
15 occurred since those discussions.
16
17 http://mail.python.org/pipermail/python-dev/2000-March/002385.html
18 http://mail.python.org/pipermail/python-dev/2000-March/002434.html
19 http://mail.python.org/pipermail/python-dev/2000-March/002497.html
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000020
  For a high-level view of the collection process, read the collect
  function.
23
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000024*/
25
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000026#include "Python.h"
Christian Heimesa156e092008-02-16 07:38:31 +000027#include "frameobject.h" /* for PyFrame_ClearFreeList */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000028
/* Get an object's GC head: step back one PyGC_Head from the object pointer. */
#define AS_GC(o) ((PyGC_Head *)(o)-1)

/* Get the object given the GC head: step forward one PyGC_Head from `g`.
 * `g` is parenthesized so that an expression argument (for example
 * `base + offset`) is cast as a whole, instead of having only its first
 * operand cast to PyGC_Head *.
 */
#define FROM_GC(g) ((PyObject *)(((PyGC_Head *)(g))+1))
34
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000035/*** Global GC state ***/
36
Neil Schemenauer2880ae52002-05-04 05:35:20 +000037struct gc_generation {
38 PyGC_Head head;
39 int threshold; /* collection threshold */
40 int count; /* count of allocations or collections of younger
41 generations */
42};
43
44#define NUM_GENERATIONS 3
45#define GEN_HEAD(n) (&generations[n].head)
46
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000047/* linked lists of container objects */
Neil Schemenauer2880ae52002-05-04 05:35:20 +000048static struct gc_generation generations[NUM_GENERATIONS] = {
49 /* PyGC_Head, threshold, count */
50 {{{GEN_HEAD(0), GEN_HEAD(0), 0}}, 700, 0},
51 {{{GEN_HEAD(1), GEN_HEAD(1), 0}}, 10, 0},
52 {{{GEN_HEAD(2), GEN_HEAD(2), 0}}, 10, 0},
53};
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000054
Neil Schemenauer2880ae52002-05-04 05:35:20 +000055PyGC_Head *_PyGC_generation0 = GEN_HEAD(0);
56
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +000057static int enabled = 1; /* automatic collection enabled? */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +000058
Neil Schemenauer43411b52001-08-30 00:05:51 +000059/* true if we are currently running the collector */
Tim Petersbf384c22003-04-06 00:11:39 +000060static int collecting = 0;
Neil Schemenauer43411b52001-08-30 00:05:51 +000061
Tim Peters6fc13d92002-07-02 18:12:35 +000062/* list of uncollectable objects */
Tim Petersbf384c22003-04-06 00:11:39 +000063static PyObject *garbage = NULL;
Tim Peters6fc13d92002-07-02 18:12:35 +000064
65/* Python string to use if unhandled exception occurs */
Tim Petersbf384c22003-04-06 00:11:39 +000066static PyObject *gc_str = NULL;
Tim Peters6fc13d92002-07-02 18:12:35 +000067
Tim Peters93ad66d2003-04-05 17:15:44 +000068/* Python string used to look for __del__ attribute. */
69static PyObject *delstr = NULL;
Jeremy Hyltonce136e92003-04-04 19:59:06 +000070
Antoine Pitrou14b78f52009-01-09 22:27:08 +000071/* This is the number of objects who survived the last full collection. It
72 approximates the number of long lived objects tracked by the GC.
73
74 (by "full collection", we mean a collection of the oldest generation).
75*/
76static Py_ssize_t long_lived_total = 0;
77
78/* This is the number of objects who survived all "non-full" collections,
79 and are awaiting to undergo a full collection for the first time.
80
81*/
82static Py_ssize_t long_lived_pending = 0;
83
84/*
85 NOTE: about the counting of long-lived objects.
86
   To limit the cost of garbage collection, there are two strategies:
        - make each collection faster, e.g. by scanning fewer objects
        - do fewer collections
   This heuristic is about the latter strategy.
91
92 In addition to the various configurable thresholds, we only trigger a
93 full collection if the ratio
94 long_lived_pending / long_lived_total
95 is above a given value (hardwired to 25%).
96
97 The reason is that, while "non-full" collections (i.e., collections of
98 the young and middle generations) will always examine roughly the same
99 number of objects -- determined by the aforementioned thresholds --,
100 the cost of a full collection is proportional to the total number of
101 long-lived objects, which is virtually unbounded.
102
   Indeed, it has been remarked that doing a full collection every
   <constant number> of object creations entails a dramatic performance
   degradation in workloads which consist of creating and storing lots of
   long-lived objects (e.g. building a large list of GC-tracked objects would
   show quadratic performance, instead of linear as expected: see issue #4074).
108
109 Using the above ratio, instead, yields amortized linear performance in
110 the total number of objects (the effect of which can be summarized
111 thusly: "each full garbage collection is more and more costly as the
112 number of objects grows, but we do fewer and fewer of them").
113
114 This heuristic was suggested by Martin von Löwis on python-dev in
115 June 2008. His original analysis and proposal can be found at:
116 http://mail.python.org/pipermail/python-dev/2008-June/080579.html
117*/
118
119
/* set for debugging information */
#define DEBUG_STATS             (1<<0) /* print collection statistics */
#define DEBUG_COLLECTABLE       (1<<1) /* print collectable objects */
#define DEBUG_UNCOLLECTABLE     (1<<2) /* print uncollectable objects */
#define DEBUG_SAVEALL           (1<<5) /* save all garbage in gc.garbage */
/* The replacement list is parenthesized so that DEBUG_LEAK behaves as a
 * single value inside larger expressions such as `flags & DEBUG_LEAK`.
 */
#define DEBUG_LEAK              (DEBUG_COLLECTABLE | \
                                 DEBUG_UNCOLLECTABLE | \
                                 DEBUG_SAVEALL)
Jeremy Hyltonb709df32000-09-01 02:47:25 +0000128static int debug;
Thomas Wouters477c8d52006-05-27 19:21:47 +0000129static PyObject *tmod = NULL;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000130
Tim Peters6fc13d92002-07-02 18:12:35 +0000131/*--------------------------------------------------------------------------
132gc_refs values.
Neil Schemenauer43411b52001-08-30 00:05:51 +0000133
Tim Peters6fc13d92002-07-02 18:12:35 +0000134Between collections, every gc'ed object has one of two gc_refs values:
135
136GC_UNTRACKED
137 The initial state; objects returned by PyObject_GC_Malloc are in this
138 state. The object doesn't live in any generation list, and its
139 tp_traverse slot must not be called.
140
141GC_REACHABLE
142 The object lives in some generation list, and its tp_traverse is safe to
143 call. An object transitions to GC_REACHABLE when PyObject_GC_Track
144 is called.
145
146During a collection, gc_refs can temporarily take on other states:
147
148>= 0
149 At the start of a collection, update_refs() copies the true refcount
150 to gc_refs, for each object in the generation being collected.
151 subtract_refs() then adjusts gc_refs so that it equals the number of
152 times an object is referenced directly from outside the generation
153 being collected.
Martin v. Löwis774348c2002-11-09 19:54:06 +0000154 gc_refs remains >= 0 throughout these steps.
Tim Peters6fc13d92002-07-02 18:12:35 +0000155
156GC_TENTATIVELY_UNREACHABLE
157 move_unreachable() then moves objects not reachable (whether directly or
158 indirectly) from outside the generation into an "unreachable" set.
159 Objects that are found to be reachable have gc_refs set to GC_REACHABLE
160 again. Objects that are found to be unreachable have gc_refs set to
161 GC_TENTATIVELY_UNREACHABLE. It's "tentatively" because the pass doing
162 this can't be sure until it ends, and GC_TENTATIVELY_UNREACHABLE may
163 transition back to GC_REACHABLE.
164
165 Only objects with GC_TENTATIVELY_UNREACHABLE still set are candidates
166 for collection. If it's decided not to collect such an object (e.g.,
167 it has a __del__ method), its gc_refs is restored to GC_REACHABLE again.
168----------------------------------------------------------------------------
169*/
/* Short local names for the special gc_refs states. */
#define GC_UNTRACKED                    _PyGC_REFS_UNTRACKED
#define GC_REACHABLE                    _PyGC_REFS_REACHABLE
#define GC_TENTATIVELY_UNREACHABLE      _PyGC_REFS_TENTATIVELY_UNREACHABLE

/* Predicates on the gc_refs state of object `o` (an object pointer, not a
 * PyGC_Head pointer).
 */
#define IS_TRACKED(o) (AS_GC(o)->gc.gc_refs != GC_UNTRACKED)
#define IS_REACHABLE(o) (AS_GC(o)->gc.gc_refs == GC_REACHABLE)
#define IS_TENTATIVELY_UNREACHABLE(o) \
    (AS_GC(o)->gc.gc_refs == GC_TENTATIVELY_UNREACHABLE)
Neil Schemenauera2b11ec2002-05-21 15:53:24 +0000178
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000179/*** list functions ***/
180
181static void
182gc_list_init(PyGC_Head *list)
183{
Tim Peters9e4ca102001-10-11 18:31:31 +0000184 list->gc.gc_prev = list;
185 list->gc.gc_next = list;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000186}
187
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000188static int
189gc_list_is_empty(PyGC_Head *list)
190{
191 return (list->gc.gc_next == list);
192}
193
#if 0
/* This became unused after gc_list_move() was introduced. */
/* Append `node` to `list`: link it in just before the header. */
static void
gc_list_append(PyGC_Head *node, PyGC_Head *list)
{
    PyGC_Head *tail = list->gc.gc_prev;

    node->gc.gc_next = list;
    node->gc.gc_prev = tail;
    tail->gc.gc_next = node;
    list->gc.gc_prev = node;
}
#endif
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000206
Tim Peterse2d59182004-11-01 01:39:08 +0000207/* Remove `node` from the gc list it's currently in. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000208static void
209gc_list_remove(PyGC_Head *node)
210{
Tim Peters9e4ca102001-10-11 18:31:31 +0000211 node->gc.gc_prev->gc.gc_next = node->gc.gc_next;
212 node->gc.gc_next->gc.gc_prev = node->gc.gc_prev;
213 node->gc.gc_next = NULL; /* object is not currently tracked */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000214}
215
Tim Peterse2d59182004-11-01 01:39:08 +0000216/* Move `node` from the gc list it's currently in (which is not explicitly
217 * named here) to the end of `list`. This is semantically the same as
218 * gc_list_remove(node) followed by gc_list_append(node, list).
219 */
220static void
221gc_list_move(PyGC_Head *node, PyGC_Head *list)
222{
Tim Petersbc1d1b82004-11-01 16:39:57 +0000223 PyGC_Head *new_prev;
Tim Peterse2d59182004-11-01 01:39:08 +0000224 PyGC_Head *current_prev = node->gc.gc_prev;
225 PyGC_Head *current_next = node->gc.gc_next;
Tim Petersbc1d1b82004-11-01 16:39:57 +0000226 /* Unlink from current list. */
Tim Peterse2d59182004-11-01 01:39:08 +0000227 current_prev->gc.gc_next = current_next;
228 current_next->gc.gc_prev = current_prev;
Tim Petersbc1d1b82004-11-01 16:39:57 +0000229 /* Relink at end of new list. */
230 new_prev = node->gc.gc_prev = list->gc.gc_prev;
Tim Peterse2d59182004-11-01 01:39:08 +0000231 new_prev->gc.gc_next = list->gc.gc_prev = node;
Tim Petersbc1d1b82004-11-01 16:39:57 +0000232 node->gc.gc_next = list;
Tim Peterse2d59182004-11-01 01:39:08 +0000233}
234
235/* append list `from` onto list `to`; `from` becomes an empty list */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000236static void
237gc_list_merge(PyGC_Head *from, PyGC_Head *to)
238{
239 PyGC_Head *tail;
Tim Peterse2d59182004-11-01 01:39:08 +0000240 assert(from != to);
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000241 if (!gc_list_is_empty(from)) {
Tim Peters9e4ca102001-10-11 18:31:31 +0000242 tail = to->gc.gc_prev;
243 tail->gc.gc_next = from->gc.gc_next;
244 tail->gc.gc_next->gc.gc_prev = tail;
245 to->gc.gc_prev = from->gc.gc_prev;
246 to->gc.gc_prev->gc.gc_next = to;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000247 }
248 gc_list_init(from);
249}
250
Neal Norwitz7b216c52006-03-04 20:01:53 +0000251static Py_ssize_t
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000252gc_list_size(PyGC_Head *list)
253{
254 PyGC_Head *gc;
Neal Norwitz7b216c52006-03-04 20:01:53 +0000255 Py_ssize_t n = 0;
Tim Peters9e4ca102001-10-11 18:31:31 +0000256 for (gc = list->gc.gc_next; gc != list; gc = gc->gc.gc_next) {
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000257 n++;
258 }
259 return n;
260}
261
Tim Peters259272b2003-04-06 19:41:39 +0000262/* Append objects in a GC list to a Python list.
263 * Return 0 if all OK, < 0 if error (out of memory for list).
264 */
265static int
266append_objects(PyObject *py_list, PyGC_Head *gc_list)
267{
268 PyGC_Head *gc;
269 for (gc = gc_list->gc.gc_next; gc != gc_list; gc = gc->gc.gc_next) {
270 PyObject *op = FROM_GC(gc);
271 if (op != py_list) {
272 if (PyList_Append(py_list, op)) {
273 return -1; /* exception */
274 }
275 }
276 }
277 return 0;
278}
279
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000280/*** end of list stuff ***/
281
282
Tim Peters19b74c72002-07-01 03:52:19 +0000283/* Set all gc_refs = ob_refcnt. After this, gc_refs is > 0 for all objects
284 * in containers, and is GC_REACHABLE for all tracked gc objects not in
285 * containers.
Tim Peters88396172002-06-30 17:56:40 +0000286 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000287static void
288update_refs(PyGC_Head *containers)
289{
Tim Peters9e4ca102001-10-11 18:31:31 +0000290 PyGC_Head *gc = containers->gc.gc_next;
Tim Petersea405632002-07-02 00:52:30 +0000291 for (; gc != containers; gc = gc->gc.gc_next) {
292 assert(gc->gc.gc_refs == GC_REACHABLE);
Christian Heimes90aa7642007-12-19 02:45:37 +0000293 gc->gc.gc_refs = Py_REFCNT(FROM_GC(gc));
Tim Peters780c4972003-11-14 00:01:17 +0000294 /* Python's cyclic gc should never see an incoming refcount
295 * of 0: if something decref'ed to 0, it should have been
296 * deallocated immediately at that time.
297 * Possible cause (if the assert triggers): a tp_dealloc
298 * routine left a gc-aware object tracked during its teardown
299 * phase, and did something-- or allowed something to happen --
300 * that called back into Python. gc can trigger then, and may
301 * see the still-tracked dying object. Before this assert
302 * was added, such mistakes went on to allow gc to try to
303 * delete the object again. In a debug build, that caused
304 * a mysterious segfault, when _Py_ForgetReference tried
305 * to remove the object from the doubly-linked list of all
306 * objects a second time. In a release build, an actual
307 * double deallocation occurred, which leads to corruption
308 * of the allocator's internal bookkeeping pointers. That's
309 * so serious that maybe this should be a release-build
310 * check instead of an assert?
311 */
312 assert(gc->gc.gc_refs != 0);
Tim Petersea405632002-07-02 00:52:30 +0000313 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000314}
315
Tim Peters19b74c72002-07-01 03:52:19 +0000316/* A traversal callback for subtract_refs. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000317static int
318visit_decref(PyObject *op, void *data)
319{
Tim Peters93cd83e2002-06-30 21:31:03 +0000320 assert(op != NULL);
Tim Peters19b74c72002-07-01 03:52:19 +0000321 if (PyObject_IS_GC(op)) {
322 PyGC_Head *gc = AS_GC(op);
323 /* We're only interested in gc_refs for objects in the
324 * generation being collected, which can be recognized
325 * because only they have positive gc_refs.
326 */
Tim Petersaab713b2002-07-02 22:15:28 +0000327 assert(gc->gc.gc_refs != 0); /* else refcount was too small */
Tim Peters19b74c72002-07-01 03:52:19 +0000328 if (gc->gc.gc_refs > 0)
329 gc->gc.gc_refs--;
330 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000331 return 0;
332}
333
Tim Peters19b74c72002-07-01 03:52:19 +0000334/* Subtract internal references from gc_refs. After this, gc_refs is >= 0
335 * for all objects in containers, and is GC_REACHABLE for all tracked gc
336 * objects not in containers. The ones with gc_refs > 0 are directly
337 * reachable from outside containers, and so can't be collected.
338 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000339static void
340subtract_refs(PyGC_Head *containers)
341{
342 traverseproc traverse;
Tim Peters9e4ca102001-10-11 18:31:31 +0000343 PyGC_Head *gc = containers->gc.gc_next;
344 for (; gc != containers; gc=gc->gc.gc_next) {
Christian Heimes90aa7642007-12-19 02:45:37 +0000345 traverse = Py_TYPE(FROM_GC(gc))->tp_traverse;
Neil Schemenauer43411b52001-08-30 00:05:51 +0000346 (void) traverse(FROM_GC(gc),
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000347 (visitproc)visit_decref,
348 NULL);
349 }
350}
351
Tim Peters19b74c72002-07-01 03:52:19 +0000352/* A traversal callback for move_unreachable. */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000353static int
Tim Peters19b74c72002-07-01 03:52:19 +0000354visit_reachable(PyObject *op, PyGC_Head *reachable)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000355{
Tim Petersea405632002-07-02 00:52:30 +0000356 if (PyObject_IS_GC(op)) {
Tim Peters19b74c72002-07-01 03:52:19 +0000357 PyGC_Head *gc = AS_GC(op);
Martin v. Löwis6db0e002006-03-01 16:56:25 +0000358 const Py_ssize_t gc_refs = gc->gc.gc_refs;
Tim Peters19b74c72002-07-01 03:52:19 +0000359
360 if (gc_refs == 0) {
361 /* This is in move_unreachable's 'young' list, but
362 * the traversal hasn't yet gotten to it. All
363 * we need to do is tell move_unreachable that it's
364 * reachable.
365 */
366 gc->gc.gc_refs = 1;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000367 }
Tim Peters19b74c72002-07-01 03:52:19 +0000368 else if (gc_refs == GC_TENTATIVELY_UNREACHABLE) {
369 /* This had gc_refs = 0 when move_unreachable got
370 * to it, but turns out it's reachable after all.
371 * Move it back to move_unreachable's 'young' list,
372 * and move_unreachable will eventually get to it
373 * again.
374 */
Tim Peterse2d59182004-11-01 01:39:08 +0000375 gc_list_move(gc, reachable);
Tim Peters19b74c72002-07-01 03:52:19 +0000376 gc->gc.gc_refs = 1;
377 }
378 /* Else there's nothing to do.
379 * If gc_refs > 0, it must be in move_unreachable's 'young'
380 * list, and move_unreachable will eventually get to it.
381 * If gc_refs == GC_REACHABLE, it's either in some other
382 * generation so we don't care about it, or move_unreachable
Tim Peters6fc13d92002-07-02 18:12:35 +0000383 * already dealt with it.
Tim Petersea405632002-07-02 00:52:30 +0000384 * If gc_refs == GC_UNTRACKED, it must be ignored.
Tim Peters19b74c72002-07-01 03:52:19 +0000385 */
Tim Petersea405632002-07-02 00:52:30 +0000386 else {
387 assert(gc_refs > 0
388 || gc_refs == GC_REACHABLE
389 || gc_refs == GC_UNTRACKED);
390 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000391 }
392 return 0;
393}
394
Tim Peters19b74c72002-07-01 03:52:19 +0000395/* Move the unreachable objects from young to unreachable. After this,
396 * all objects in young have gc_refs = GC_REACHABLE, and all objects in
397 * unreachable have gc_refs = GC_TENTATIVELY_UNREACHABLE. All tracked
398 * gc objects not in young or unreachable still have gc_refs = GC_REACHABLE.
399 * All objects in young after this are directly or indirectly reachable
400 * from outside the original young; and all objects in unreachable are
401 * not.
Tim Peters88396172002-06-30 17:56:40 +0000402 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000403static void
Tim Peters19b74c72002-07-01 03:52:19 +0000404move_unreachable(PyGC_Head *young, PyGC_Head *unreachable)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000405{
Tim Peters19b74c72002-07-01 03:52:19 +0000406 PyGC_Head *gc = young->gc.gc_next;
407
408 /* Invariants: all objects "to the left" of us in young have gc_refs
409 * = GC_REACHABLE, and are indeed reachable (directly or indirectly)
410 * from outside the young list as it was at entry. All other objects
411 * from the original young "to the left" of us are in unreachable now,
412 * and have gc_refs = GC_TENTATIVELY_UNREACHABLE. All objects to the
413 * left of us in 'young' now have been scanned, and no objects here
414 * or to the right have been scanned yet.
415 */
416
417 while (gc != young) {
418 PyGC_Head *next;
419
Tim Peters6fc13d92002-07-02 18:12:35 +0000420 if (gc->gc.gc_refs) {
421 /* gc is definitely reachable from outside the
422 * original 'young'. Mark it as such, and traverse
423 * its pointers to find any other objects that may
424 * be directly reachable from it. Note that the
425 * call to tp_traverse may append objects to young,
426 * so we have to wait until it returns to determine
427 * the next object to visit.
428 */
429 PyObject *op = FROM_GC(gc);
Christian Heimes90aa7642007-12-19 02:45:37 +0000430 traverseproc traverse = Py_TYPE(op)->tp_traverse;
Tim Peters6fc13d92002-07-02 18:12:35 +0000431 assert(gc->gc.gc_refs > 0);
432 gc->gc.gc_refs = GC_REACHABLE;
433 (void) traverse(op,
434 (visitproc)visit_reachable,
435 (void *)young);
436 next = gc->gc.gc_next;
437 }
438 else {
Tim Peters19b74c72002-07-01 03:52:19 +0000439 /* This *may* be unreachable. To make progress,
440 * assume it is. gc isn't directly reachable from
441 * any object we've already traversed, but may be
442 * reachable from an object we haven't gotten to yet.
443 * visit_reachable will eventually move gc back into
444 * young if that's so, and we'll see it again.
445 */
446 next = gc->gc.gc_next;
Tim Peterse2d59182004-11-01 01:39:08 +0000447 gc_list_move(gc, unreachable);
Tim Peters19b74c72002-07-01 03:52:19 +0000448 gc->gc.gc_refs = GC_TENTATIVELY_UNREACHABLE;
449 }
Tim Peters19b74c72002-07-01 03:52:19 +0000450 gc = next;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000451 }
452}
453
Amaury Forgeot d'Arcad8dcd52007-12-10 23:58:35 +0000454/* Return true if object has a finalization method. */
Neil Schemenauera765c122001-11-01 17:35:23 +0000455static int
456has_finalizer(PyObject *op)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000457{
Guido van Rossum50e9fb92006-08-17 05:42:55 +0000458 if (PyGen_CheckExact(op))
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000459 return PyGen_NeedsFinalizing((PyGenObject *)op);
460 else
Thomas Wouters3dfc3c12006-08-21 22:15:41 +0000461 return op->ob_type->tp_del != NULL;
Neil Schemenauera765c122001-11-01 17:35:23 +0000462}
463
Tim Petersead8b7a2004-10-30 23:09:22 +0000464/* Move the objects in unreachable with __del__ methods into `finalizers`.
465 * Objects moved into `finalizers` have gc_refs set to GC_REACHABLE; the
466 * objects remaining in unreachable are left at GC_TENTATIVELY_UNREACHABLE.
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000467 */
Neil Schemenauera765c122001-11-01 17:35:23 +0000468static void
Tim Petersead8b7a2004-10-30 23:09:22 +0000469move_finalizers(PyGC_Head *unreachable, PyGC_Head *finalizers)
Neil Schemenauera765c122001-11-01 17:35:23 +0000470{
Tim Petersead8b7a2004-10-30 23:09:22 +0000471 PyGC_Head *gc;
472 PyGC_Head *next;
Tim Petersf6b80452003-04-07 19:21:15 +0000473
Tim Petersead8b7a2004-10-30 23:09:22 +0000474 /* March over unreachable. Move objects with finalizers into
475 * `finalizers`.
476 */
477 for (gc = unreachable->gc.gc_next; gc != unreachable; gc = next) {
Neil Schemenauer43411b52001-08-30 00:05:51 +0000478 PyObject *op = FROM_GC(gc);
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000479
Tim Petersf6ae7a42003-04-05 18:40:50 +0000480 assert(IS_TENTATIVELY_UNREACHABLE(op));
Tim Petersead8b7a2004-10-30 23:09:22 +0000481 next = gc->gc.gc_next;
Tim Petersf6ae7a42003-04-05 18:40:50 +0000482
Tim Petersf6b80452003-04-07 19:21:15 +0000483 if (has_finalizer(op)) {
Tim Peterse2d59182004-11-01 01:39:08 +0000484 gc_list_move(gc, finalizers);
Tim Petersf6b80452003-04-07 19:21:15 +0000485 gc->gc.gc_refs = GC_REACHABLE;
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000486 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000487 }
488}
489
Tim Peters19b74c72002-07-01 03:52:19 +0000490/* A traversal callback for move_finalizer_reachable. */
491static int
492visit_move(PyObject *op, PyGC_Head *tolist)
493{
494 if (PyObject_IS_GC(op)) {
Tim Petersea405632002-07-02 00:52:30 +0000495 if (IS_TENTATIVELY_UNREACHABLE(op)) {
Tim Peters19b74c72002-07-01 03:52:19 +0000496 PyGC_Head *gc = AS_GC(op);
Tim Peterse2d59182004-11-01 01:39:08 +0000497 gc_list_move(gc, tolist);
Tim Peters19b74c72002-07-01 03:52:19 +0000498 gc->gc.gc_refs = GC_REACHABLE;
499 }
500 }
501 return 0;
502}
503
504/* Move objects that are reachable from finalizers, from the unreachable set
Tim Petersf6b80452003-04-07 19:21:15 +0000505 * into finalizers set.
Tim Peters19b74c72002-07-01 03:52:19 +0000506 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000507static void
Tim Petersf6b80452003-04-07 19:21:15 +0000508move_finalizer_reachable(PyGC_Head *finalizers)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000509{
510 traverseproc traverse;
Tim Peters9e4ca102001-10-11 18:31:31 +0000511 PyGC_Head *gc = finalizers->gc.gc_next;
Tim Petersbf384c22003-04-06 00:11:39 +0000512 for (; gc != finalizers; gc = gc->gc.gc_next) {
513 /* Note that the finalizers list may grow during this. */
Christian Heimes90aa7642007-12-19 02:45:37 +0000514 traverse = Py_TYPE(FROM_GC(gc))->tp_traverse;
Tim Peters88396172002-06-30 17:56:40 +0000515 (void) traverse(FROM_GC(gc),
Tim Petersbf384c22003-04-06 00:11:39 +0000516 (visitproc)visit_move,
Tim Petersf6b80452003-04-07 19:21:15 +0000517 (void *)finalizers);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000518 }
519}
520
Tim Petersead8b7a2004-10-30 23:09:22 +0000521/* Clear all weakrefs to unreachable objects, and if such a weakref has a
522 * callback, invoke it if necessary. Note that it's possible for such
523 * weakrefs to be outside the unreachable set -- indeed, those are precisely
524 * the weakrefs whose callbacks must be invoked. See gc_weakref.txt for
525 * overview & some details. Some weakrefs with callbacks may be reclaimed
526 * directly by this routine; the number reclaimed is the return value. Other
527 * weakrefs with callbacks may be moved into the `old` generation. Objects
528 * moved into `old` have gc_refs set to GC_REACHABLE; the objects remaining in
529 * unreachable are left at GC_TENTATIVELY_UNREACHABLE. When this returns,
530 * no object in `unreachable` is weakly referenced anymore.
Tim Peters403a2032003-11-20 21:21:46 +0000531 */
532static int
Tim Petersead8b7a2004-10-30 23:09:22 +0000533handle_weakrefs(PyGC_Head *unreachable, PyGC_Head *old)
Tim Peters403a2032003-11-20 21:21:46 +0000534{
Tim Petersead8b7a2004-10-30 23:09:22 +0000535 PyGC_Head *gc;
536 PyObject *op; /* generally FROM_GC(gc) */
537 PyWeakReference *wr; /* generally a cast of op */
Tim Petersead8b7a2004-10-30 23:09:22 +0000538 PyGC_Head wrcb_to_call; /* weakrefs with callbacks to call */
Tim Petersead8b7a2004-10-30 23:09:22 +0000539 PyGC_Head *next;
Tim Peters403a2032003-11-20 21:21:46 +0000540 int num_freed = 0;
541
Tim Petersead8b7a2004-10-30 23:09:22 +0000542 gc_list_init(&wrcb_to_call);
Tim Peters403a2032003-11-20 21:21:46 +0000543
Tim Petersead8b7a2004-10-30 23:09:22 +0000544 /* Clear all weakrefs to the objects in unreachable. If such a weakref
545 * also has a callback, move it into `wrcb_to_call` if the callback
Tim Peterscc2a8662004-10-31 22:12:43 +0000546 * needs to be invoked. Note that we cannot invoke any callbacks until
547 * all weakrefs to unreachable objects are cleared, lest the callback
548 * resurrect an unreachable object via a still-active weakref. We
549 * make another pass over wrcb_to_call, invoking callbacks, after this
550 * pass completes.
Tim Petersead8b7a2004-10-30 23:09:22 +0000551 */
552 for (gc = unreachable->gc.gc_next; gc != unreachable; gc = next) {
553 PyWeakReference **wrlist;
554
555 op = FROM_GC(gc);
556 assert(IS_TENTATIVELY_UNREACHABLE(op));
557 next = gc->gc.gc_next;
558
Christian Heimes90aa7642007-12-19 02:45:37 +0000559 if (! PyType_SUPPORTS_WEAKREFS(Py_TYPE(op)))
Tim Petersead8b7a2004-10-30 23:09:22 +0000560 continue;
561
562 /* It supports weakrefs. Does it have any? */
563 wrlist = (PyWeakReference **)
564 PyObject_GET_WEAKREFS_LISTPTR(op);
565
566 /* `op` may have some weakrefs. March over the list, clear
567 * all the weakrefs, and move the weakrefs with callbacks
Tim Peterscc2a8662004-10-31 22:12:43 +0000568 * that must be called into wrcb_to_call.
Tim Petersead8b7a2004-10-30 23:09:22 +0000569 */
570 for (wr = *wrlist; wr != NULL; wr = *wrlist) {
571 PyGC_Head *wrasgc; /* AS_GC(wr) */
572
573 /* _PyWeakref_ClearRef clears the weakref but leaves
574 * the callback pointer intact. Obscure: it also
575 * changes *wrlist.
576 */
577 assert(wr->wr_object == op);
578 _PyWeakref_ClearRef(wr);
579 assert(wr->wr_object == Py_None);
580 if (wr->wr_callback == NULL)
581 continue; /* no callback */
582
583 /* Headache time. `op` is going away, and is weakly referenced by
584 * `wr`, which has a callback. Should the callback be invoked? If wr
585 * is also trash, no:
586 *
587 * 1. There's no need to call it. The object and the weakref are
588 * both going away, so it's legitimate to pretend the weakref is
589 * going away first. The user has to ensure a weakref outlives its
590 * referent if they want a guarantee that the wr callback will get
591 * invoked.
592 *
593 * 2. It may be catastrophic to call it. If the callback is also in
594 * cyclic trash (CT), then although the CT is unreachable from
595 * outside the current generation, CT may be reachable from the
596 * callback. Then the callback could resurrect insane objects.
597 *
598 * Since the callback is never needed and may be unsafe in this case,
Tim Peterscc2a8662004-10-31 22:12:43 +0000599 * wr is simply left in the unreachable set. Note that because we
600 * already called _PyWeakref_ClearRef(wr), its callback will never
601 * trigger.
Tim Petersead8b7a2004-10-30 23:09:22 +0000602 *
603 * OTOH, if wr isn't part of CT, we should invoke the callback: the
604 * weakref outlived the trash. Note that since wr isn't CT in this
605 * case, its callback can't be CT either -- wr acted as an external
606 * root to this generation, and therefore its callback did too. So
607 * nothing in CT is reachable from the callback either, so it's hard
608 * to imagine how calling it later could create a problem for us. wr
609 * is moved to wrcb_to_call in this case.
Tim Petersead8b7a2004-10-30 23:09:22 +0000610 */
Tim Peterscc2a8662004-10-31 22:12:43 +0000611 if (IS_TENTATIVELY_UNREACHABLE(wr))
612 continue;
613 assert(IS_REACHABLE(wr));
614
Tim Petersead8b7a2004-10-30 23:09:22 +0000615 /* Create a new reference so that wr can't go away
616 * before we can process it again.
617 */
618 Py_INCREF(wr);
619
Tim Peterscc2a8662004-10-31 22:12:43 +0000620 /* Move wr to wrcb_to_call, for the next pass. */
Tim Petersead8b7a2004-10-30 23:09:22 +0000621 wrasgc = AS_GC(wr);
Tim Peterscc2a8662004-10-31 22:12:43 +0000622 assert(wrasgc != next); /* wrasgc is reachable, but
623 next isn't, so they can't
624 be the same */
Tim Peterse2d59182004-11-01 01:39:08 +0000625 gc_list_move(wrasgc, &wrcb_to_call);
Tim Petersead8b7a2004-10-30 23:09:22 +0000626 }
627 }
628
Tim Peterscc2a8662004-10-31 22:12:43 +0000629 /* Invoke the callbacks we decided to honor. It's safe to invoke them
630 * because they can't reference unreachable objects.
Tim Petersead8b7a2004-10-30 23:09:22 +0000631 */
632 while (! gc_list_is_empty(&wrcb_to_call)) {
633 PyObject *temp;
634 PyObject *callback;
635
636 gc = wrcb_to_call.gc.gc_next;
637 op = FROM_GC(gc);
638 assert(IS_REACHABLE(op));
639 assert(PyWeakref_Check(op));
640 wr = (PyWeakReference *)op;
641 callback = wr->wr_callback;
642 assert(callback != NULL);
643
644 /* copy-paste of weakrefobject.c's handle_callback() */
Thomas Wouters477c8d52006-05-27 19:21:47 +0000645 temp = PyObject_CallFunctionObjArgs(callback, wr, NULL);
Tim Petersead8b7a2004-10-30 23:09:22 +0000646 if (temp == NULL)
647 PyErr_WriteUnraisable(callback);
648 else
649 Py_DECREF(temp);
650
651 /* Give up the reference we created in the first pass. When
652 * op's refcount hits 0 (which it may or may not do right now),
Tim Peterscc2a8662004-10-31 22:12:43 +0000653 * op's tp_dealloc will decref op->wr_callback too. Note
654 * that the refcount probably will hit 0 now, and because this
655 * weakref was reachable to begin with, gc didn't already
656 * add it to its count of freed objects. Example: a reachable
657 * weak value dict maps some key to this reachable weakref.
658 * The callback removes this key->weakref mapping from the
659 * dict, leaving no other references to the weakref (excepting
660 * ours).
Tim Petersead8b7a2004-10-30 23:09:22 +0000661 */
662 Py_DECREF(op);
663 if (wrcb_to_call.gc.gc_next == gc) {
664 /* object is still alive -- move it */
Tim Peterse2d59182004-11-01 01:39:08 +0000665 gc_list_move(gc, old);
Tim Petersead8b7a2004-10-30 23:09:22 +0000666 }
667 else
668 ++num_freed;
669 }
670
Tim Peters403a2032003-11-20 21:21:46 +0000671 return num_freed;
672}
673
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000674static void
Jeremy Hylton06257772000-08-31 15:10:24 +0000675debug_cycle(char *msg, PyObject *op)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000676{
Amaury Forgeot d'Arcad8dcd52007-12-10 23:58:35 +0000677 PySys_WriteStderr("gc: %.100s <%.100s %p>\n",
Christian Heimes90aa7642007-12-19 02:45:37 +0000678 msg, Py_TYPE(op)->tp_name, op);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000679}
680
Tim Petersbf384c22003-04-06 00:11:39 +0000681/* Handle uncollectable garbage (cycles with finalizers, and stuff reachable
682 * only from such cycles).
Tim Petersf6b80452003-04-07 19:21:15 +0000683 * If DEBUG_SAVEALL, all objects in finalizers are appended to the module
684 * garbage list (a Python list), else only the objects in finalizers with
685 * __del__ methods are appended to garbage. All objects in finalizers are
686 * merged into the old list regardless.
Tim Peters259272b2003-04-06 19:41:39 +0000687 * Returns 0 if all OK, <0 on error (out of memory to grow the garbage list).
688 * The finalizers list is made empty on a successful return.
Tim Petersbf384c22003-04-06 00:11:39 +0000689 */
Tim Peters259272b2003-04-06 19:41:39 +0000690static int
Tim Petersf6b80452003-04-07 19:21:15 +0000691handle_finalizers(PyGC_Head *finalizers, PyGC_Head *old)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000692{
Tim Petersf6b80452003-04-07 19:21:15 +0000693 PyGC_Head *gc = finalizers->gc.gc_next;
694
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000695 if (garbage == NULL) {
696 garbage = PyList_New(0);
Tim Petersbf384c22003-04-06 00:11:39 +0000697 if (garbage == NULL)
698 Py_FatalError("gc couldn't create gc.garbage list");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000699 }
Tim Petersf6b80452003-04-07 19:21:15 +0000700 for (; gc != finalizers; gc = gc->gc.gc_next) {
701 PyObject *op = FROM_GC(gc);
702
703 if ((debug & DEBUG_SAVEALL) || has_finalizer(op)) {
704 if (PyList_Append(garbage, op) < 0)
705 return -1;
706 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000707 }
Tim Petersf6b80452003-04-07 19:21:15 +0000708
Tim Peters259272b2003-04-06 19:41:39 +0000709 gc_list_merge(finalizers, old);
710 return 0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000711}
712
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000713/* Break reference cycles by clearing the containers involved. This is
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000714 * tricky business as the lists can be changing and we don't know which
Tim Peters19b74c72002-07-01 03:52:19 +0000715 * objects may be freed. It is possible I screwed something up here.
716 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000717static void
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000718delete_garbage(PyGC_Head *collectable, PyGC_Head *old)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000719{
720 inquiry clear;
721
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000722 while (!gc_list_is_empty(collectable)) {
723 PyGC_Head *gc = collectable->gc.gc_next;
Neil Schemenauer43411b52001-08-30 00:05:51 +0000724 PyObject *op = FROM_GC(gc);
Tim Peters88396172002-06-30 17:56:40 +0000725
Tim Peters19b74c72002-07-01 03:52:19 +0000726 assert(IS_TENTATIVELY_UNREACHABLE(op));
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000727 if (debug & DEBUG_SAVEALL) {
728 PyList_Append(garbage, op);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000729 }
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000730 else {
Christian Heimes90aa7642007-12-19 02:45:37 +0000731 if ((clear = Py_TYPE(op)->tp_clear) != NULL) {
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000732 Py_INCREF(op);
Jeremy Hylton8a135182002-06-06 23:23:55 +0000733 clear(op);
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000734 Py_DECREF(op);
735 }
736 }
Jeremy Hyltonce136e92003-04-04 19:59:06 +0000737 if (collectable->gc.gc_next == gc) {
Neil Schemenauer544de1e2000-09-22 15:22:38 +0000738 /* object is still alive, move it, it may die later */
Tim Peterse2d59182004-11-01 01:39:08 +0000739 gc_list_move(gc, old);
Tim Peters19b74c72002-07-01 03:52:19 +0000740 gc->gc.gc_refs = GC_REACHABLE;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000741 }
742 }
743}
744
/* Clear all free lists.
 *
 * This is done during the collection of the highest generation.  Items
 * parked in a free list may keep a pymalloc arena occupied, so emptying
 * the free lists may give memory back to the OS earlier.
 *
 * The value returned by each clearing function is deliberately discarded.
 */
static void
clear_freelists(void)
{
    /* callables and frames */
    (void)PyMethod_ClearFreeList();
    (void)PyFrame_ClearFreeList();
    (void)PyCFunction_ClearFreeList();

    /* data objects */
    (void)PyTuple_ClearFreeList();
    (void)PyUnicode_ClearFreeList();
    (void)PyFloat_ClearFreeList();
}
760
Antoine Pitrou621601a2008-12-17 23:18:19 +0000761static double
762get_time(void)
763{
764 double result = 0;
765 if (tmod != NULL) {
766 PyObject *f = PyObject_CallMethod(tmod, "time", NULL);
767 if (f == NULL) {
768 PyErr_Clear();
769 }
770 else {
771 if (PyFloat_Check(f))
772 result = PyFloat_AsDouble(f);
773 Py_DECREF(f);
774 }
775 }
776 return result;
777}
778
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000779/* This is the main function. Read this to understand how the
780 * collection process works. */
Neal Norwitz7b216c52006-03-04 20:01:53 +0000781static Py_ssize_t
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000782collect(int generation)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000783{
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000784 int i;
Neal Norwitz7b216c52006-03-04 20:01:53 +0000785 Py_ssize_t m = 0; /* # objects collected */
786 Py_ssize_t n = 0; /* # unreachable objects that couldn't be collected */
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000787 PyGC_Head *young; /* the generation we are examining */
788 PyGC_Head *old; /* next older generation */
Tim Peters403a2032003-11-20 21:21:46 +0000789 PyGC_Head unreachable; /* non-problematic unreachable trash */
790 PyGC_Head finalizers; /* objects with, & reachable from, __del__ */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000791 PyGC_Head *gc;
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000792 double t1 = 0.0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000793
Tim Peters93ad66d2003-04-05 17:15:44 +0000794 if (delstr == NULL) {
Martin v. Löwis5b222132007-06-10 09:51:05 +0000795 delstr = PyUnicode_InternFromString("__del__");
Tim Peters93ad66d2003-04-05 17:15:44 +0000796 if (delstr == NULL)
797 Py_FatalError("gc couldn't allocate \"__del__\"");
798 }
799
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000800 if (debug & DEBUG_STATS) {
Antoine Pitrou621601a2008-12-17 23:18:19 +0000801 t1 = get_time();
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000802 PySys_WriteStderr("gc: collecting generation %d...\n",
803 generation);
804 PySys_WriteStderr("gc: objects in each generation:");
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000805 for (i = 0; i < NUM_GENERATIONS; i++)
806 PySys_WriteStderr(" %" PY_FORMAT_SIZE_T "d",
807 gc_list_size(GEN_HEAD(i)));
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000808 PySys_WriteStderr("\n");
809 }
810
811 /* update collection and allocation counters */
812 if (generation+1 < NUM_GENERATIONS)
813 generations[generation+1].count += 1;
814 for (i = 0; i <= generation; i++)
Neil Schemenauerc9051642002-06-28 19:16:04 +0000815 generations[i].count = 0;
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000816
817 /* merge younger generations with one we are currently collecting */
818 for (i = 0; i < generation; i++) {
819 gc_list_merge(GEN_HEAD(i), GEN_HEAD(generation));
820 }
821
822 /* handy references */
823 young = GEN_HEAD(generation);
Tim Peters19b74c72002-07-01 03:52:19 +0000824 if (generation < NUM_GENERATIONS-1)
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000825 old = GEN_HEAD(generation+1);
Tim Peters19b74c72002-07-01 03:52:19 +0000826 else
827 old = young;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000828
829 /* Using ob_refcnt and gc_refs, calculate which objects in the
Tim Petersead8b7a2004-10-30 23:09:22 +0000830 * container set are reachable from outside the set (i.e., have a
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000831 * refcount greater than 0 when all the references within the
Tim Petersead8b7a2004-10-30 23:09:22 +0000832 * set are taken into account).
Tim Peters19b74c72002-07-01 03:52:19 +0000833 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000834 update_refs(young);
835 subtract_refs(young);
836
Tim Peters19b74c72002-07-01 03:52:19 +0000837 /* Leave everything reachable from outside young in young, and move
838 * everything else (in young) to unreachable.
839 * NOTE: This used to move the reachable objects into a reachable
840 * set instead. But most things usually turn out to be reachable,
841 * so it's more efficient to move the unreachable things.
842 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000843 gc_list_init(&unreachable);
Tim Peters19b74c72002-07-01 03:52:19 +0000844 move_unreachable(young, &unreachable);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000845
Tim Peters19b74c72002-07-01 03:52:19 +0000846 /* Move reachable objects to next generation. */
Antoine Pitrou14b78f52009-01-09 22:27:08 +0000847 if (young != old) {
848 if (generation == NUM_GENERATIONS - 2) {
849 long_lived_pending += gc_list_size(young);
850 }
Tim Peters19b74c72002-07-01 03:52:19 +0000851 gc_list_merge(young, old);
Antoine Pitrou14b78f52009-01-09 22:27:08 +0000852 }
853 else {
854 long_lived_pending = 0;
855 long_lived_total = gc_list_size(young);
856 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000857
Tim Peters19b74c72002-07-01 03:52:19 +0000858 /* All objects in unreachable are trash, but objects reachable from
859 * finalizers can't safely be deleted. Python programmers should take
860 * care not to create such things. For Python, finalizers means
Tim Peters403a2032003-11-20 21:21:46 +0000861 * instance objects with __del__ methods. Weakrefs with callbacks
Tim Petersead8b7a2004-10-30 23:09:22 +0000862 * can also call arbitrary Python code but they will be dealt with by
863 * handle_weakrefs().
Tim Petersf6b80452003-04-07 19:21:15 +0000864 */
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000865 gc_list_init(&finalizers);
Tim Petersead8b7a2004-10-30 23:09:22 +0000866 move_finalizers(&unreachable, &finalizers);
Tim Petersbf384c22003-04-06 00:11:39 +0000867 /* finalizers contains the unreachable objects with a finalizer;
Tim Peters403a2032003-11-20 21:21:46 +0000868 * unreachable objects reachable *from* those are also uncollectable,
869 * and we move those into the finalizers list too.
Tim Petersbf384c22003-04-06 00:11:39 +0000870 */
Tim Petersf6b80452003-04-07 19:21:15 +0000871 move_finalizer_reachable(&finalizers);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000872
873 /* Collect statistics on collectable objects found and print
Tim Peters403a2032003-11-20 21:21:46 +0000874 * debugging information.
875 */
Tim Petersf6b80452003-04-07 19:21:15 +0000876 for (gc = unreachable.gc.gc_next; gc != &unreachable;
Tim Peters9e4ca102001-10-11 18:31:31 +0000877 gc = gc->gc.gc_next) {
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000878 m++;
Jeremy Hylton06257772000-08-31 15:10:24 +0000879 if (debug & DEBUG_COLLECTABLE) {
Neil Schemenauer43411b52001-08-30 00:05:51 +0000880 debug_cycle("collectable", FROM_GC(gc));
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000881 }
882 }
Tim Petersead8b7a2004-10-30 23:09:22 +0000883
884 /* Clear weakrefs and invoke callbacks as necessary. */
885 m += handle_weakrefs(&unreachable, old);
886
Tim Petersfb2ab4d2003-04-07 22:41:24 +0000887 /* Call tp_clear on objects in the unreachable set. This will cause
888 * the reference cycles to be broken. It may also cause some objects
889 * in finalizers to be freed.
890 */
Tim Petersf6b80452003-04-07 19:21:15 +0000891 delete_garbage(&unreachable, old);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000892
893 /* Collect statistics on uncollectable objects found and print
894 * debugging information. */
Tim Peters50c61d52003-04-06 01:50:50 +0000895 for (gc = finalizers.gc.gc_next;
Tim Petersbf384c22003-04-06 00:11:39 +0000896 gc != &finalizers;
897 gc = gc->gc.gc_next) {
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000898 n++;
Tim Petersbf384c22003-04-06 00:11:39 +0000899 if (debug & DEBUG_UNCOLLECTABLE)
Neil Schemenauer43411b52001-08-30 00:05:51 +0000900 debug_cycle("uncollectable", FROM_GC(gc));
Tim Petersbf384c22003-04-06 00:11:39 +0000901 }
Jeremy Hylton06257772000-08-31 15:10:24 +0000902 if (debug & DEBUG_STATS) {
Antoine Pitrou621601a2008-12-17 23:18:19 +0000903 double t2 = get_time();
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000904 if (m == 0 && n == 0)
Antoine Pitrou621601a2008-12-17 23:18:19 +0000905 PySys_WriteStderr("gc: done");
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000906 else
Neal Norwitze22373d2006-03-06 23:31:56 +0000907 PySys_WriteStderr(
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000908 "gc: done, "
909 "%" PY_FORMAT_SIZE_T "d unreachable, "
Antoine Pitrou621601a2008-12-17 23:18:19 +0000910 "%" PY_FORMAT_SIZE_T "d uncollectable",
Neal Norwitze22373d2006-03-06 23:31:56 +0000911 n+m, n);
Antoine Pitrou621601a2008-12-17 23:18:19 +0000912 if (t1 && t2) {
913 PySys_WriteStderr(", %.4fs elapsed", t2-t1);
914 }
915 PySys_WriteStderr(".\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000916 }
917
918 /* Append instances in the uncollectable set to a Python
919 * reachable list of garbage. The programmer has to deal with
Tim Petersbf384c22003-04-06 00:11:39 +0000920 * this if they insist on creating this type of structure.
921 */
Tim Petersf6b80452003-04-07 19:21:15 +0000922 (void)handle_finalizers(&finalizers, old);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000923
Christian Heimesa156e092008-02-16 07:38:31 +0000924 /* Clear free list only during the collection of the higest
925 * generation */
926 if (generation == NUM_GENERATIONS-1) {
927 clear_freelists();
928 }
929
Jeremy Hyltonb709df32000-09-01 02:47:25 +0000930 if (PyErr_Occurred()) {
Tim Petersf6b80452003-04-07 19:21:15 +0000931 if (gc_str == NULL)
Neal Norwitz53cbdaa2007-08-23 21:42:55 +0000932 gc_str = PyUnicode_FromString("garbage collection");
Jeremy Hyltonb709df32000-09-01 02:47:25 +0000933 PyErr_WriteUnraisable(gc_str);
934 Py_FatalError("unexpected exception during garbage collection");
935 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000936 return n+m;
937}
938
Neal Norwitz7b216c52006-03-04 20:01:53 +0000939static Py_ssize_t
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000940collect_generations(void)
941{
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000942 int i;
Neal Norwitz7b216c52006-03-04 20:01:53 +0000943 Py_ssize_t n = 0;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000944
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000945 /* Find the oldest generation (higest numbered) where the count
946 * exceeds the threshold. Objects in the that generation and
947 * generations younger than it will be collected. */
948 for (i = NUM_GENERATIONS-1; i >= 0; i--) {
949 if (generations[i].count > generations[i].threshold) {
Antoine Pitrou14b78f52009-01-09 22:27:08 +0000950 /* Avoid quadratic performance degradation in number
951 of tracked objects. See comments at the beginning
952 of this file, and issue #4074.
953 */
954 if (i == NUM_GENERATIONS - 1
955 && long_lived_pending < long_lived_total / 4)
956 continue;
Neil Schemenauer2880ae52002-05-04 05:35:20 +0000957 n = collect(i);
958 break;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000959 }
960 }
961 return n;
962}
963
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000964PyDoc_STRVAR(gc_enable__doc__,
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000965"enable() -> None\n"
966"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000967"Enable automatic garbage collection.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +0000968
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000969static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +0000970gc_enable(PyObject *self, PyObject *noargs)
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000971{
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000972 enabled = 1;
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000973 Py_INCREF(Py_None);
974 return Py_None;
975}
976
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000977PyDoc_STRVAR(gc_disable__doc__,
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000978"disable() -> None\n"
979"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000980"Disable automatic garbage collection.\n");
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000981
982static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +0000983gc_disable(PyObject *self, PyObject *noargs)
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000984{
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000985 enabled = 0;
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000986 Py_INCREF(Py_None);
987 return Py_None;
988}
989
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000990PyDoc_STRVAR(gc_isenabled__doc__,
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000991"isenabled() -> status\n"
992"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +0000993"Returns true if automatic garbage collection is enabled.\n");
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000994
995static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +0000996gc_isenabled(PyObject *self, PyObject *noargs)
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000997{
Raymond Hettinger674d56b2004-01-04 04:00:13 +0000998 return PyBool_FromLong((long)enabled);
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +0000999}
1000
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001001PyDoc_STRVAR(gc_collect__doc__,
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001002"collect([generation]) -> n\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001003"\n"
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001004"With no arguments, run a full collection. The optional argument\n"
1005"may be an integer specifying which generation to collect. A ValueError\n"
1006"is raised if the generation number is invalid.\n\n"
1007"The number of unreachable objects is returned.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001008
1009static PyObject *
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001010gc_collect(PyObject *self, PyObject *args, PyObject *kws)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001011{
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001012 static char *keywords[] = {"generation", NULL};
1013 int genarg = NUM_GENERATIONS - 1;
Neal Norwitz7b216c52006-03-04 20:01:53 +00001014 Py_ssize_t n;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001015
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001016 if (!PyArg_ParseTupleAndKeywords(args, kws, "|i", keywords, &genarg))
1017 return NULL;
1018
1019 else if (genarg < 0 || genarg >= NUM_GENERATIONS) {
1020 PyErr_SetString(PyExc_ValueError, "invalid generation");
1021 return NULL;
1022 }
1023
Tim Peters50c61d52003-04-06 01:50:50 +00001024 if (collecting)
Neil Schemenauere8c40cb2001-10-31 23:09:35 +00001025 n = 0; /* already collecting, don't do anything */
Neil Schemenauere8c40cb2001-10-31 23:09:35 +00001026 else {
1027 collecting = 1;
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001028 n = collect(genarg);
Neil Schemenauere8c40cb2001-10-31 23:09:35 +00001029 collecting = 0;
1030 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001031
Christian Heimes217cfd12007-12-02 14:31:20 +00001032 return PyLong_FromSsize_t(n);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001033}
1034
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001035PyDoc_STRVAR(gc_set_debug__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001036"set_debug(flags) -> None\n"
1037"\n"
1038"Set the garbage collection debugging flags. Debugging information is\n"
1039"written to sys.stderr.\n"
1040"\n"
1041"flags is an integer and can have the following bits turned on:\n"
1042"\n"
1043" DEBUG_STATS - Print statistics during collection.\n"
1044" DEBUG_COLLECTABLE - Print collectable objects found.\n"
1045" DEBUG_UNCOLLECTABLE - Print unreachable but uncollectable objects found.\n"
Neil Schemenauer544de1e2000-09-22 15:22:38 +00001046" DEBUG_SAVEALL - Save objects to gc.garbage rather than freeing them.\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001047" DEBUG_LEAK - Debug leaking programs (everything but STATS).\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001048
1049static PyObject *
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001050gc_set_debug(PyObject *self, PyObject *args)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001051{
Neil Schemenauer7760cff2000-09-22 22:35:36 +00001052 if (!PyArg_ParseTuple(args, "i:set_debug", &debug))
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001053 return NULL;
1054
1055 Py_INCREF(Py_None);
1056 return Py_None;
1057}
1058
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001059PyDoc_STRVAR(gc_get_debug__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001060"get_debug() -> flags\n"
1061"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001062"Get the garbage collection debugging flags.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001063
1064static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001065gc_get_debug(PyObject *self, PyObject *noargs)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001066{
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001067 return Py_BuildValue("i", debug);
1068}
1069
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001070PyDoc_STRVAR(gc_set_thresh__doc__,
Neal Norwitz2a47c0f2002-01-29 00:53:41 +00001071"set_threshold(threshold0, [threshold1, threshold2]) -> None\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001072"\n"
1073"Sets the collection thresholds. Setting threshold0 to zero disables\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001074"collection.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001075
1076static PyObject *
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001077gc_set_thresh(PyObject *self, PyObject *args)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001078{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001079 int i;
1080 if (!PyArg_ParseTuple(args, "i|ii:set_threshold",
1081 &generations[0].threshold,
1082 &generations[1].threshold,
1083 &generations[2].threshold))
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001084 return NULL;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001085 for (i = 2; i < NUM_GENERATIONS; i++) {
1086 /* generations higher than 2 get the same threshold */
1087 generations[i].threshold = generations[2].threshold;
1088 }
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001089
1090 Py_INCREF(Py_None);
1091 return Py_None;
1092}
1093
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001094PyDoc_STRVAR(gc_get_thresh__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001095"get_threshold() -> (threshold0, threshold1, threshold2)\n"
1096"\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001097"Return the current collection thresholds\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001098
1099static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001100gc_get_thresh(PyObject *self, PyObject *noargs)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001101{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001102 return Py_BuildValue("(iii)",
1103 generations[0].threshold,
1104 generations[1].threshold,
1105 generations[2].threshold);
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001106}
1107
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001108PyDoc_STRVAR(gc_get_count__doc__,
1109"get_count() -> (count0, count1, count2)\n"
1110"\n"
1111"Return the current collection counts\n");
1112
1113static PyObject *
1114gc_get_count(PyObject *self, PyObject *noargs)
1115{
1116 return Py_BuildValue("(iii)",
1117 generations[0].count,
1118 generations[1].count,
1119 generations[2].count);
1120}
1121
Neil Schemenauer48c70342001-08-09 15:38:31 +00001122static int
Martin v. Löwis560da622001-11-24 09:24:51 +00001123referrersvisit(PyObject* obj, PyObject *objs)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001124{
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001125 Py_ssize_t i;
Martin v. Löwisc8fe77b2001-11-29 18:08:31 +00001126 for (i = 0; i < PyTuple_GET_SIZE(objs); i++)
1127 if (PyTuple_GET_ITEM(objs, i) == obj)
1128 return 1;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001129 return 0;
1130}
1131
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001132static int
Martin v. Löwis560da622001-11-24 09:24:51 +00001133gc_referrers_for(PyObject *objs, PyGC_Head *list, PyObject *resultlist)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001134{
1135 PyGC_Head *gc;
1136 PyObject *obj;
1137 traverseproc traverse;
Tim Peters9e4ca102001-10-11 18:31:31 +00001138 for (gc = list->gc.gc_next; gc != list; gc = gc->gc.gc_next) {
Neil Schemenauer43411b52001-08-30 00:05:51 +00001139 obj = FROM_GC(gc);
Christian Heimes90aa7642007-12-19 02:45:37 +00001140 traverse = Py_TYPE(obj)->tp_traverse;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001141 if (obj == objs || obj == resultlist)
1142 continue;
Martin v. Löwis560da622001-11-24 09:24:51 +00001143 if (traverse(obj, (visitproc)referrersvisit, objs)) {
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001144 if (PyList_Append(resultlist, obj) < 0)
1145 return 0; /* error */
Neil Schemenauer48c70342001-08-09 15:38:31 +00001146 }
1147 }
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001148 return 1; /* no error */
Neil Schemenauer48c70342001-08-09 15:38:31 +00001149}
1150
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001151PyDoc_STRVAR(gc_get_referrers__doc__,
Martin v. Löwis560da622001-11-24 09:24:51 +00001152"get_referrers(*objs) -> list\n\
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001153Return the list of objects that directly refer to any of objs.");
Neil Schemenauer48c70342001-08-09 15:38:31 +00001154
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001155static PyObject *
Martin v. Löwis560da622001-11-24 09:24:51 +00001156gc_get_referrers(PyObject *self, PyObject *args)
Neil Schemenauer48c70342001-08-09 15:38:31 +00001157{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001158 int i;
Neil Schemenauer48c70342001-08-09 15:38:31 +00001159 PyObject *result = PyList_New(0);
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001160 if (!result) return NULL;
1161
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001162 for (i = 0; i < NUM_GENERATIONS; i++) {
1163 if (!(gc_referrers_for(args, GEN_HEAD(i), result))) {
1164 Py_DECREF(result);
1165 return NULL;
1166 }
Neil Schemenauer17e7be62001-08-10 14:46:47 +00001167 }
Neil Schemenauer48c70342001-08-09 15:38:31 +00001168 return result;
1169}
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001170
Tim Peters0f81ab62003-04-08 16:39:48 +00001171/* Append obj to list; return true if error (out of memory), false if OK. */
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001172static int
Tim Peters730f5532003-04-08 17:17:17 +00001173referentsvisit(PyObject *obj, PyObject *list)
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001174{
Tim Peters0f81ab62003-04-08 16:39:48 +00001175 return PyList_Append(list, obj) < 0;
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001176}
1177
Tim Peters730f5532003-04-08 17:17:17 +00001178PyDoc_STRVAR(gc_get_referents__doc__,
1179"get_referents(*objs) -> list\n\
Jeremy Hylton059b0942003-04-03 16:29:13 +00001180Return the list of objects that are directly referred to by objs.");
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001181
1182static PyObject *
Tim Peters730f5532003-04-08 17:17:17 +00001183gc_get_referents(PyObject *self, PyObject *args)
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001184{
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001185 Py_ssize_t i;
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001186 PyObject *result = PyList_New(0);
Tim Peters0f81ab62003-04-08 16:39:48 +00001187
1188 if (result == NULL)
1189 return NULL;
1190
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001191 for (i = 0; i < PyTuple_GET_SIZE(args); i++) {
Tim Peters0f81ab62003-04-08 16:39:48 +00001192 traverseproc traverse;
Tim Peters93ad66d2003-04-05 17:15:44 +00001193 PyObject *obj = PyTuple_GET_ITEM(args, i);
Tim Peters0f81ab62003-04-08 16:39:48 +00001194
1195 if (! PyObject_IS_GC(obj))
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001196 continue;
Christian Heimes90aa7642007-12-19 02:45:37 +00001197 traverse = Py_TYPE(obj)->tp_traverse;
Tim Peters0f81ab62003-04-08 16:39:48 +00001198 if (! traverse)
1199 continue;
Tim Peters730f5532003-04-08 17:17:17 +00001200 if (traverse(obj, (visitproc)referentsvisit, result)) {
Tim Peters0f81ab62003-04-08 16:39:48 +00001201 Py_DECREF(result);
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001202 return NULL;
Tim Peters0f81ab62003-04-08 16:39:48 +00001203 }
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001204 }
1205 return result;
1206}
1207
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001208PyDoc_STRVAR(gc_get_objects__doc__,
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001209"get_objects() -> [...]\n"
1210"\n"
1211"Return a list of objects tracked by the collector (excluding the list\n"
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001212"returned).\n");
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001213
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001214static PyObject *
Tim Peters50c61d52003-04-06 01:50:50 +00001215gc_get_objects(PyObject *self, PyObject *noargs)
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001216{
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001217 int i;
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001218 PyObject* result;
1219
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001220 result = PyList_New(0);
Tim Peters50c61d52003-04-06 01:50:50 +00001221 if (result == NULL)
Martin v. Löwisf8a6f242001-12-02 18:31:02 +00001222 return NULL;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001223 for (i = 0; i < NUM_GENERATIONS; i++) {
1224 if (append_objects(result, GEN_HEAD(i))) {
1225 Py_DECREF(result);
1226 return NULL;
1227 }
Martin v. Löwis155aad12001-12-02 12:21:34 +00001228 }
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001229 return result;
1230}
1231
1232
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00001233PyDoc_STRVAR(gc__doc__,
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001234"This module provides access to the garbage collector for reference cycles.\n"
1235"\n"
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001236"enable() -- Enable automatic garbage collection.\n"
1237"disable() -- Disable automatic garbage collection.\n"
1238"isenabled() -- Returns true if automatic collection is enabled.\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001239"collect() -- Do a full collection right now.\n"
Thomas Wouters89f507f2006-12-13 04:49:30 +00001240"get_count() -- Return the current collection counts.\n"
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001241"set_debug() -- Set debugging flags.\n"
1242"get_debug() -- Get debugging flags.\n"
1243"set_threshold() -- Set the collection thresholds.\n"
1244"get_threshold() -- Return the current the collection thresholds.\n"
Neil Schemenauerc7c8d8e2001-08-09 15:58:59 +00001245"get_objects() -- Return a list of all objects tracked by the collector.\n"
Jeremy Hylton5bd378b2003-04-03 16:28:38 +00001246"get_referrers() -- Return the list of objects that refer to an object.\n"
Tim Peters730f5532003-04-08 17:17:17 +00001247"get_referents() -- Return the list of objects that an object refers to.\n");
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001248
1249static PyMethodDef GcMethods[] = {
Tim Peters50c61d52003-04-06 01:50:50 +00001250 {"enable", gc_enable, METH_NOARGS, gc_enable__doc__},
1251 {"disable", gc_disable, METH_NOARGS, gc_disable__doc__},
1252 {"isenabled", gc_isenabled, METH_NOARGS, gc_isenabled__doc__},
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001253 {"set_debug", gc_set_debug, METH_VARARGS, gc_set_debug__doc__},
Tim Peters50c61d52003-04-06 01:50:50 +00001254 {"get_debug", gc_get_debug, METH_NOARGS, gc_get_debug__doc__},
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001255 {"get_count", gc_get_count, METH_NOARGS, gc_get_count__doc__},
Vladimir Marangozovf9d20c32000-08-06 22:45:31 +00001256 {"set_threshold", gc_set_thresh, METH_VARARGS, gc_set_thresh__doc__},
Tim Peters50c61d52003-04-06 01:50:50 +00001257 {"get_threshold", gc_get_thresh, METH_NOARGS, gc_get_thresh__doc__},
Barry Warsawd3c38ff2006-03-07 09:46:03 +00001258 {"collect", (PyCFunction)gc_collect,
1259 METH_VARARGS | METH_KEYWORDS, gc_collect__doc__},
Tim Peters50c61d52003-04-06 01:50:50 +00001260 {"get_objects", gc_get_objects,METH_NOARGS, gc_get_objects__doc__},
Martin v. Löwis560da622001-11-24 09:24:51 +00001261 {"get_referrers", gc_get_referrers, METH_VARARGS,
1262 gc_get_referrers__doc__},
Tim Peters730f5532003-04-08 17:17:17 +00001263 {"get_referents", gc_get_referents, METH_VARARGS,
1264 gc_get_referents__doc__},
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001265 {NULL, NULL} /* Sentinel */
1266};
1267
Martin v. Löwis1a214512008-06-11 05:26:20 +00001268static struct PyModuleDef gcmodule = {
1269 PyModuleDef_HEAD_INIT,
1270 "gc",
1271 gc__doc__,
1272 -1,
1273 GcMethods,
1274 NULL,
1275 NULL,
1276 NULL,
1277 NULL
1278};
1279
1280
Jason Tishler6bc06ec2003-09-04 11:59:50 +00001281PyMODINIT_FUNC
Martin v. Löwis1a214512008-06-11 05:26:20 +00001282PyInit_gc(void)
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001283{
1284 PyObject *m;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001285
Martin v. Löwis1a214512008-06-11 05:26:20 +00001286 m = PyModule_Create(&gcmodule);
1287
Neal Norwitz1ac754f2006-01-19 06:09:39 +00001288 if (m == NULL)
Martin v. Löwis1a214512008-06-11 05:26:20 +00001289 return NULL;
Tim Peters11558872003-04-06 23:30:52 +00001290
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001291 if (garbage == NULL) {
1292 garbage = PyList_New(0);
Tim Peters11558872003-04-06 23:30:52 +00001293 if (garbage == NULL)
Martin v. Löwis1a214512008-06-11 05:26:20 +00001294 return NULL;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001295 }
Neil Schemenauer3b1cbf92005-06-18 17:37:06 +00001296 Py_INCREF(garbage);
Tim Peters11558872003-04-06 23:30:52 +00001297 if (PyModule_AddObject(m, "garbage", garbage) < 0)
Martin v. Löwis1a214512008-06-11 05:26:20 +00001298 return NULL;
Thomas Wouters477c8d52006-05-27 19:21:47 +00001299
1300 /* Importing can't be done in collect() because collect()
1301 * can be called via PyGC_Collect() in Py_Finalize().
1302 * This wouldn't be a problem, except that <initialized> is
1303 * reset to 0 before calling collect which trips up
1304 * the import and triggers an assertion.
1305 */
1306 if (tmod == NULL) {
Christian Heimes072c0f12008-01-03 23:01:04 +00001307 tmod = PyImport_ImportModuleNoBlock("time");
Thomas Wouters477c8d52006-05-27 19:21:47 +00001308 if (tmod == NULL)
1309 PyErr_Clear();
1310 }
1311
Martin v. Löwis1a214512008-06-11 05:26:20 +00001312#define ADD_INT(NAME) if (PyModule_AddIntConstant(m, #NAME, NAME) < 0) return NULL
Tim Peters11558872003-04-06 23:30:52 +00001313 ADD_INT(DEBUG_STATS);
1314 ADD_INT(DEBUG_COLLECTABLE);
1315 ADD_INT(DEBUG_UNCOLLECTABLE);
Tim Peters11558872003-04-06 23:30:52 +00001316 ADD_INT(DEBUG_SAVEALL);
1317 ADD_INT(DEBUG_LEAK);
1318#undef ADD_INT
Martin v. Löwis1a214512008-06-11 05:26:20 +00001319 return m;
Jeremy Hyltonc5007aa2000-06-30 05:02:53 +00001320}
1321
Guido van Rossume13ddc92003-04-17 17:29:22 +00001322/* API to invoke gc.collect() from C */
Neal Norwitz7b216c52006-03-04 20:01:53 +00001323Py_ssize_t
Guido van Rossume13ddc92003-04-17 17:29:22 +00001324PyGC_Collect(void)
1325{
Neal Norwitz7b216c52006-03-04 20:01:53 +00001326 Py_ssize_t n;
Guido van Rossume13ddc92003-04-17 17:29:22 +00001327
1328 if (collecting)
1329 n = 0; /* already collecting, don't do anything */
1330 else {
1331 collecting = 1;
1332 n = collect(NUM_GENERATIONS - 1);
1333 collecting = 0;
1334 }
1335
1336 return n;
1337}
1338
Neil Schemenauer43411b52001-08-30 00:05:51 +00001339/* for debugging */
Guido van Rossume13ddc92003-04-17 17:29:22 +00001340void
1341_PyGC_Dump(PyGC_Head *g)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001342{
1343 _PyObject_Dump(FROM_GC(g));
1344}
1345
Neil Schemenauer43411b52001-08-30 00:05:51 +00001346/* extension modules might be compiled with GC support so these
1347 functions must always be available */
1348
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001349#undef PyObject_GC_Track
1350#undef PyObject_GC_UnTrack
1351#undef PyObject_GC_Del
1352#undef _PyObject_GC_Malloc
1353
/* Function form of the _PyObject_GC_TRACK macro, provided as a real
 * symbol so that extension modules can always link against it. */
void
PyObject_GC_Track(void *op)
{
    _PyObject_GC_TRACK(op);
}
1359
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001360/* for binary compatibility with 2.2 */
Neil Schemenauer43411b52001-08-30 00:05:51 +00001361void
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001362_PyObject_GC_Track(PyObject *op)
1363{
1364 PyObject_GC_Track(op);
1365}
1366
/* Stop tracking `op` if it is currently tracked; otherwise do nothing. */
void
PyObject_GC_UnTrack(void *op)
{
    /* Obscure: the Py_TRASHCAN mechanism requires that this function can
     * be called twice on the same object, so an already-untracked object
     * must be accepted silently.
     */
    if (!IS_TRACKED(op))
        return;
    _PyObject_GC_UNTRACK(op);
}
1376
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001377/* for binary compatibility with 2.2 */
1378void
1379_PyObject_GC_UnTrack(PyObject *op)
1380{
1381 PyObject_GC_UnTrack(op);
1382}
1383
Neil Schemenauer43411b52001-08-30 00:05:51 +00001384PyObject *
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001385_PyObject_GC_Malloc(size_t basicsize)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001386{
1387 PyObject *op;
Neal Norwitz3ce5d922008-08-24 07:08:55 +00001388 PyGC_Head *g;
1389 if (basicsize > PY_SSIZE_T_MAX - sizeof(PyGC_Head))
1390 return PyErr_NoMemory();
1391 g = (PyGC_Head *)PyObject_MALLOC(
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001392 sizeof(PyGC_Head) + basicsize);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001393 if (g == NULL)
Jeremy Hylton8a135182002-06-06 23:23:55 +00001394 return PyErr_NoMemory();
Tim Petersea405632002-07-02 00:52:30 +00001395 g->gc.gc_refs = GC_UNTRACKED;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001396 generations[0].count++; /* number of allocated GC objects */
1397 if (generations[0].count > generations[0].threshold &&
Neil Schemenauer43411b52001-08-30 00:05:51 +00001398 enabled &&
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001399 generations[0].threshold &&
Neil Schemenauer43411b52001-08-30 00:05:51 +00001400 !collecting &&
1401 !PyErr_Occurred()) {
1402 collecting = 1;
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001403 collect_generations();
Neil Schemenauer43411b52001-08-30 00:05:51 +00001404 collecting = 0;
1405 }
1406 op = FROM_GC(g);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001407 return op;
1408}
1409
1410PyObject *
1411_PyObject_GC_New(PyTypeObject *tp)
1412{
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001413 PyObject *op = _PyObject_GC_Malloc(_PyObject_SIZE(tp));
Tim Petersfa8efab2002-04-28 01:57:25 +00001414 if (op != NULL)
1415 op = PyObject_INIT(op, tp);
1416 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001417}
1418
1419PyVarObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +00001420_PyObject_GC_NewVar(PyTypeObject *tp, Py_ssize_t nitems)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001421{
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001422 const size_t size = _PyObject_VAR_SIZE(tp, nitems);
1423 PyVarObject *op = (PyVarObject *) _PyObject_GC_Malloc(size);
Tim Petersfa8efab2002-04-28 01:57:25 +00001424 if (op != NULL)
1425 op = PyObject_INIT_VAR(op, tp, nitems);
1426 return op;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001427}
1428
1429PyVarObject *
Martin v. Löwis41290682006-02-16 14:56:14 +00001430_PyObject_GC_Resize(PyVarObject *op, Py_ssize_t nitems)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001431{
Christian Heimes90aa7642007-12-19 02:45:37 +00001432 const size_t basicsize = _PyObject_VAR_SIZE(Py_TYPE(op), nitems);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001433 PyGC_Head *g = AS_GC(op);
Neal Norwitz3ce5d922008-08-24 07:08:55 +00001434 if (basicsize > PY_SSIZE_T_MAX - sizeof(PyGC_Head))
1435 return (PyVarObject *)PyErr_NoMemory();
Thomas Wouters49fd7fa2006-04-21 10:40:58 +00001436 g = (PyGC_Head *)PyObject_REALLOC(g, sizeof(PyGC_Head) + basicsize);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001437 if (g == NULL)
1438 return (PyVarObject *)PyErr_NoMemory();
1439 op = (PyVarObject *) FROM_GC(g);
Christian Heimes90aa7642007-12-19 02:45:37 +00001440 Py_SIZE(op) = nitems;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001441 return op;
1442}
1443
1444void
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001445PyObject_GC_Del(void *op)
Neil Schemenauer43411b52001-08-30 00:05:51 +00001446{
Neil Schemenauer43411b52001-08-30 00:05:51 +00001447 PyGC_Head *g = AS_GC(op);
Neil Schemenauera2b11ec2002-05-21 15:53:24 +00001448 if (IS_TRACKED(op))
Neil Schemenauer43411b52001-08-30 00:05:51 +00001449 gc_list_remove(g);
Neil Schemenauer2880ae52002-05-04 05:35:20 +00001450 if (generations[0].count > 0) {
1451 generations[0].count--;
Neil Schemenauer43411b52001-08-30 00:05:51 +00001452 }
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001453 PyObject_FREE(g);
Neil Schemenauer43411b52001-08-30 00:05:51 +00001454}
1455
Neil Schemenauerfec4eb12002-04-12 02:41:03 +00001456/* for binary compatibility with 2.2 */
1457#undef _PyObject_GC_Del
1458void
1459_PyObject_GC_Del(PyObject *op)
1460{
1461 PyObject_GC_Del(op);
1462}