blob: b02678591973fab574bb4267ae13452a53107d5e [file] [log] [blame]
Guido van Rossuma3309961993-07-28 09:05:47 +00001#ifndef Py_DICTOBJECT_H
2#define Py_DICTOBJECT_H
3#ifdef __cplusplus
4extern "C" {
5#endif
6
Guido van Rossumf70e43a1991-02-19 12:39:46 +00007
Guido van Rossum2ec90311997-05-13 21:23:32 +00008/* Dictionary object type -- mapping from hashable object to object */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00009
Raymond Hettinger930427b2003-05-03 06:51:59 +000010/* The distribution includes a separate file, Objects/dictnotes.txt,
Thomas Wouters4d70c3d2006-06-08 14:42:34 +000011 describing explorations into dictionary design and optimization.
Raymond Hettinger930427b2003-05-03 06:51:59 +000012 It covers typical dictionary use patterns, the parameters for
13 tuning dictionaries, and several ideas for possible optimizations.
14*/
15
Tim Peters6d6c1a32001-08-02 04:15:00 +000016/*
17There are three kinds of slots in the table:
18
191. Unused. me_key == me_value == NULL
20 Does not hold an active (key, value) pair now and never did. Unused can
21 transition to Active upon key insertion. This is the only case in which
22 me_key is NULL, and is each slot's initial state.
23
242. Active. me_key != NULL and me_key != dummy and me_value != NULL
25 Holds an active (key, value) pair. Active can transition to Dummy upon
26 key deletion. This is the only case in which me_value != NULL.
27
283. Dummy. me_key == dummy and me_value == NULL
29 Previously held an active (key, value) pair, but that was deleted and an
30 active pair has not yet overwritten the slot. Dummy can transition to
31 Active upon key insertion. Dummy slots cannot be made Unused again
32 (cannot have me_key set to NULL), else the probe sequence in case of
33 collision would have no way to know they were once active.
34
35Note: .popitem() abuses the me_hash field of an Unused or Dummy slot to
36hold a search finger. The me_hash field of Unused or Dummy slots has no
37meaning otherwise.
38*/
39
40/* PyDict_MINSIZE is the minimum size of a dictionary. This many slots are
41 * allocated directly in the dict object (in the ma_smalltable member).
42 * It must be a power of 2, and at least 4. 8 allows dicts with no more
43 * than 5 active entries to live in ma_smalltable (and so avoid an
44 * additional malloc); instrumentation suggested this suffices for the
45 * majority of dicts (consisting mostly of usually-small instance dicts and
46 * usually-small dicts created to pass keyword arguments).
47 */
Martin v. Löwis4d0d4712010-12-03 20:14:31 +000048#ifndef Py_LIMITED_API
Tim Peters6d6c1a32001-08-02 04:15:00 +000049#define PyDict_MINSIZE 8
50
51typedef struct {
Benjamin Peterson8f67d082010-10-17 20:54:53 +000052 /* Cached hash code of me_key. */
53 Py_hash_t me_hash;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000054 PyObject *me_key;
55 PyObject *me_value;
Tim Peters6d6c1a32001-08-02 04:15:00 +000056} PyDictEntry;
57
58/*
59To ensure the lookup algorithm terminates, there must be at least one Unused
60slot (NULL key) in the table.
61The value ma_fill is the number of non-NULL keys (sum of Active and Dummy);
62ma_used is the number of non-NULL, non-dummy keys (== the number of non-NULL
63values == the number of Active items).
64To avoid slowing down lookups on a near-full table, we resize the table when
65it's two-thirds full.
66*/
67typedef struct _dictobject PyDictObject;
68struct _dictobject {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000069 PyObject_HEAD
70 Py_ssize_t ma_fill; /* # Active + # Dummy */
71 Py_ssize_t ma_used; /* # Active */
Tim Peters6d6c1a32001-08-02 04:15:00 +000072
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000073 /* The table contains ma_mask + 1 slots, and that's a power of 2.
74 * We store the mask instead of the size because the mask is more
75 * frequently needed.
76 */
77 Py_ssize_t ma_mask;
Tim Peters6d6c1a32001-08-02 04:15:00 +000078
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000079 /* ma_table points to ma_smalltable for small tables, else to
80 * additional malloc'ed memory. ma_table is never NULL! This rule
81 * saves repeated runtime null-tests in the workhorse getitem and
82 * setitem calls.
83 */
84 PyDictEntry *ma_table;
Benjamin Peterson8f67d082010-10-17 20:54:53 +000085 PyDictEntry *(*ma_lookup)(PyDictObject *mp, PyObject *key, Py_hash_t hash);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +000086 PyDictEntry ma_smalltable[PyDict_MINSIZE];
Tim Peters6d6c1a32001-08-02 04:15:00 +000087};
Martin v. Löwis4d0d4712010-12-03 20:14:31 +000088#endif /* Py_LIMITED_API */
Tim Peters6d6c1a32001-08-02 04:15:00 +000089
Mark Hammond91a681d2002-08-12 07:21:58 +000090PyAPI_DATA(PyTypeObject) PyDict_Type;
Christian Heimesa22e8bd2007-11-29 22:35:39 +000091PyAPI_DATA(PyTypeObject) PyDictIterKey_Type;
92PyAPI_DATA(PyTypeObject) PyDictIterValue_Type;
93PyAPI_DATA(PyTypeObject) PyDictIterItem_Type;
94PyAPI_DATA(PyTypeObject) PyDictKeys_Type;
95PyAPI_DATA(PyTypeObject) PyDictItems_Type;
96PyAPI_DATA(PyTypeObject) PyDictValues_Type;
Guido van Rossum2ec90311997-05-13 21:23:32 +000097
Thomas Wouters27d517b2007-02-25 20:39:11 +000098#define PyDict_Check(op) \
Christian Heimes90aa7642007-12-19 02:45:37 +000099 PyType_FastSubclass(Py_TYPE(op), Py_TPFLAGS_DICT_SUBCLASS)
100#define PyDict_CheckExact(op) (Py_TYPE(op) == &PyDict_Type)
101#define PyDictKeys_Check(op) (Py_TYPE(op) == &PyDictKeys_Type)
102#define PyDictItems_Check(op) (Py_TYPE(op) == &PyDictItems_Type)
103#define PyDictValues_Check(op) (Py_TYPE(op) == &PyDictValues_Type)
Christian Heimesa22e8bd2007-11-29 22:35:39 +0000104/* This excludes Values, since they are not sets. */
105# define PyDictViewSet_Check(op) \
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000106 (PyDictKeys_Check(op) || PyDictItems_Check(op))
Christian Heimesa22e8bd2007-11-29 22:35:39 +0000107
Guido van Rossum2ec90311997-05-13 21:23:32 +0000108
Mark Hammond91a681d2002-08-12 07:21:58 +0000109PyAPI_FUNC(PyObject *) PyDict_New(void);
110PyAPI_FUNC(PyObject *) PyDict_GetItem(PyObject *mp, PyObject *key);
Alexandre Vassalotticb314332008-06-01 03:53:03 +0000111PyAPI_FUNC(PyObject *) PyDict_GetItemWithError(PyObject *mp, PyObject *key);
Mark Hammond91a681d2002-08-12 07:21:58 +0000112PyAPI_FUNC(int) PyDict_SetItem(PyObject *mp, PyObject *key, PyObject *item);
113PyAPI_FUNC(int) PyDict_DelItem(PyObject *mp, PyObject *key);
114PyAPI_FUNC(void) PyDict_Clear(PyObject *mp);
115PyAPI_FUNC(int) PyDict_Next(
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000116 PyObject *mp, Py_ssize_t *pos, PyObject **key, PyObject **value);
Martin v. Löwis4d0d4712010-12-03 20:14:31 +0000117#ifndef Py_LIMITED_API
Thomas Wouterscf297e42007-02-23 15:07:44 +0000118PyAPI_FUNC(int) _PyDict_Next(
Benjamin Peterson8f67d082010-10-17 20:54:53 +0000119 PyObject *mp, Py_ssize_t *pos, PyObject **key, PyObject **value, Py_hash_t *hash);
Martin v. Löwis4d0d4712010-12-03 20:14:31 +0000120#endif
Mark Hammond91a681d2002-08-12 07:21:58 +0000121PyAPI_FUNC(PyObject *) PyDict_Keys(PyObject *mp);
122PyAPI_FUNC(PyObject *) PyDict_Values(PyObject *mp);
123PyAPI_FUNC(PyObject *) PyDict_Items(PyObject *mp);
Martin v. Löwis18e16552006-02-15 17:27:45 +0000124PyAPI_FUNC(Py_ssize_t) PyDict_Size(PyObject *mp);
Mark Hammond91a681d2002-08-12 07:21:58 +0000125PyAPI_FUNC(PyObject *) PyDict_Copy(PyObject *mp);
Raymond Hettingerbc0f2ab2003-11-25 21:12:14 +0000126PyAPI_FUNC(int) PyDict_Contains(PyObject *mp, PyObject *key);
Martin v. Löwis4d0d4712010-12-03 20:14:31 +0000127#ifndef Py_LIMITED_API
Benjamin Peterson8f67d082010-10-17 20:54:53 +0000128PyAPI_FUNC(int) _PyDict_Contains(PyObject *mp, PyObject *key, Py_hash_t hash);
Christian Heimes99170a52007-12-19 02:07:34 +0000129PyAPI_FUNC(PyObject *) _PyDict_NewPresized(Py_ssize_t minused);
Antoine Pitrou3a652b12009-03-23 18:52:06 +0000130PyAPI_FUNC(void) _PyDict_MaybeUntrack(PyObject *mp);
Benjamin Petersonfb886362010-04-24 18:21:17 +0000131PyAPI_FUNC(int) _PyDict_HasOnlyStringKeys(PyObject *mp);
Martin v. Löwis4d0d4712010-12-03 20:14:31 +0000132#endif
Jeremy Hyltona12c7a72000-03-30 22:27:31 +0000133
Tim Petersf582b822001-12-11 18:51:08 +0000134/* PyDict_Update(mp, other) is equivalent to PyDict_Merge(mp, other, 1). */
Mark Hammond91a681d2002-08-12 07:21:58 +0000135PyAPI_FUNC(int) PyDict_Update(PyObject *mp, PyObject *other);
Tim Petersf582b822001-12-11 18:51:08 +0000136
137/* PyDict_Merge updates/merges from a mapping object (an object that
138 supports PyMapping_Keys() and PyObject_GetItem()). If override is true,
139 the last occurrence of a key wins, else the first. The Python
140 dict.update(other) is equivalent to PyDict_Merge(dict, other, 1).
141*/
Mark Hammond91a681d2002-08-12 07:21:58 +0000142PyAPI_FUNC(int) PyDict_Merge(PyObject *mp,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000143 PyObject *other,
144 int override);
Tim Petersf582b822001-12-11 18:51:08 +0000145
146/* PyDict_MergeFromSeq2 updates/merges from an iterable object producing
147 iterable objects of length 2. If override is true, the last occurrence
148 of a key wins, else the first. The Python dict constructor dict(seq2)
149 is equivalent to dict={}; PyDict_MergeFromSeq(dict, seq2, 1).
150*/
Mark Hammond91a681d2002-08-12 07:21:58 +0000151PyAPI_FUNC(int) PyDict_MergeFromSeq2(PyObject *d,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000152 PyObject *seq2,
153 int override);
Guido van Rossum2ec90311997-05-13 21:23:32 +0000154
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +0000155PyAPI_FUNC(PyObject *) PyDict_GetItemString(PyObject *dp, const char *key);
156PyAPI_FUNC(int) PyDict_SetItemString(PyObject *dp, const char *key, PyObject *item);
157PyAPI_FUNC(int) PyDict_DelItemString(PyObject *dp, const char *key);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000158
Guido van Rossuma3309961993-07-28 09:05:47 +0000159#ifdef __cplusplus
160}
161#endif
162#endif /* !Py_DICTOBJECT_H */