blob: 6a7e8319440a756f6ef12e2ef68c9aaf913c9eee [file] [log] [blame]
Guido van Rossum2bc13791999-03-24 19:06:42 +00001/* Dictionary object implementation using a hash table */
Guido van Rossum9bfef441993-03-29 10:43:31 +00002
Raymond Hettinger930427b2003-05-03 06:51:59 +00003/* The distribution includes a separate file, Objects/dictnotes.txt,
Tim Peters60b29962006-01-01 01:19:23 +00004 describing explorations into dictionary design and optimization.
Raymond Hettinger930427b2003-05-03 06:51:59 +00005 It covers typical dictionary use patterns, the parameters for
6 tuning dictionaries, and several ideas for possible optimizations.
7*/
8
Victor Stinner742da042016-09-07 17:40:12 -07009/* PyDictKeysObject
10
11This implements the dictionary's hashtable.
12
Raymond Hettingerb12785d2016-10-22 09:58:14 -070013As of Python 3.6, this is compact and ordered. Basic idea is described here:
14* https://mail.python.org/pipermail/python-dev/2012-December/123028.html
15* https://morepypy.blogspot.com/2015/01/faster-more-memory-efficient-and-more.html
Victor Stinner742da042016-09-07 17:40:12 -070016
17layout:
18
19+---------------+
20| dk_refcnt |
21| dk_size |
22| dk_lookup |
23| dk_usable |
24| dk_nentries |
25+---------------+
26| dk_indices |
27| |
28+---------------+
29| dk_entries |
30| |
31+---------------+
32
dk_indices is the actual hashtable. Each element holds an index into the
entries array, or DKIX_EMPTY(-1) or DKIX_DUMMY(-2).
The size of indices is dk_size. The type of each index varies with dk_size:
36
37* int8 for dk_size <= 128
38* int16 for 256 <= dk_size <= 2**15
39* int32 for 2**16 <= dk_size <= 2**31
40* int64 for 2**32 <= dk_size
41
dk_entries is an array of PyDictKeyEntry. Its size is USABLE_FRACTION(dk_size).
DK_ENTRIES(dk) can be used to get a pointer to the entries.
44
NOTE: Since negative values are used for DKIX_EMPTY and DKIX_DUMMY, the type
of a dk_indices element is a signed integer, and int16 is used for a table
whose dk_size == 256.
48*/
49
Benjamin Peterson7d95e402012-04-23 11:24:50 -040050
51/*
Benjamin Peterson7d95e402012-04-23 11:24:50 -040052The DictObject can be in one of two forms.
Victor Stinner742da042016-09-07 17:40:12 -070053
Benjamin Peterson7d95e402012-04-23 11:24:50 -040054Either:
55 A combined table:
56 ma_values == NULL, dk_refcnt == 1.
57 Values are stored in the me_value field of the PyDictKeysObject.
Benjamin Peterson7d95e402012-04-23 11:24:50 -040058Or:
59 A split table:
60 ma_values != NULL, dk_refcnt >= 1
61 Values are stored in the ma_values array.
    Only string (unicode) keys are allowed.
    All dicts sharing the same keys must have the same insertion order.
Benjamin Peterson7d95e402012-04-23 11:24:50 -040064
Victor Stinner742da042016-09-07 17:40:12 -070065There are four kinds of slots in the table (slot is index, and
66DK_ENTRIES(keys)[index] if index >= 0):
67
681. Unused. index == DKIX_EMPTY
69 Does not hold an active (key, value) pair now and never did. Unused can
70 transition to Active upon key insertion. This is each slot's initial state.
71
722. Active. index >= 0, me_key != NULL and me_value != NULL
73 Holds an active (key, value) pair. Active can transition to Dummy or
74 Pending upon key deletion (for combined and split tables respectively).
75 This is the only case in which me_value != NULL.
76
773. Dummy. index == DKIX_DUMMY (combined only)
78 Previously held an active (key, value) pair, but that was deleted and an
79 active pair has not yet overwritten the slot. Dummy can transition to
80 Active upon key insertion. Dummy slots cannot be made Unused again
81 else the probe sequence in case of collision would have no way to know
82 they were once active.
83
844. Pending. index >= 0, key != NULL, and value == NULL (split only)
85 Not yet inserted in split-table.
Benjamin Peterson7d95e402012-04-23 11:24:50 -040086*/
87
Victor Stinner742da042016-09-07 17:40:12 -070088/*
89Preserving insertion order
Benjamin Peterson7d95e402012-04-23 11:24:50 -040090
Victor Stinner742da042016-09-07 17:40:12 -070091It's simple for combined table. Since dk_entries is mostly append only, we can
92get insertion order by just iterating dk_entries.
93
One exception is .popitem(). It removes the last item in dk_entries and
decrements dk_nentries to achieve amortized O(1). Since a DKIX_DUMMY remains
in dk_indices, we can't increment dk_usable even though dk_nentries is
decremented.
98
In a split table, inserting into a pending entry is allowed only for
dk_entries[ix] where ix == mp->ma_used. Inserting at any other index, or
deleting an item, converts the dict to a combined table.
102*/
103
/* PyDict_MINSIZE is the starting size for any new dict.
 * 8 allows dicts with no more than 5 active entries; experiments suggested
 * this suffices for the majority of dicts (consisting mostly of usually-small
 * dicts created to pass keyword arguments).
 * Making this 8, rather than 4 reduces the number of resizes for most
 * dictionaries, without any significant extra memory use.
 *
 * The value must be a power of two: new_keys_object() asserts
 * IS_POWER_OF_2(size) and PyDict_New() passes PyDict_MINSIZE to it.
 * Key tables of exactly this size are the only ones recycled through
 * keys_free_list.
 */
#define PyDict_MINSIZE 8
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400112
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000113#include "Python.h"
Eric Snow96c6af92015-05-29 22:21:39 -0600114#include "dict-common.h"
Victor Stinner990397e2016-09-09 20:22:59 -0700115#include "stringlib/eq.h" /* to get unicode_eq() */
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000116
Larry Hastings61272b72014-01-07 12:41:53 -0800117/*[clinic input]
Larry Hastingsc2047262014-01-25 20:43:29 -0800118class dict "PyDictObject *" "&PyDict_Type"
Larry Hastings61272b72014-01-07 12:41:53 -0800119[clinic start generated code]*/
Larry Hastings581ee362014-01-28 05:00:08 -0800120/*[clinic end generated code: output=da39a3ee5e6b4b0d input=f157a5a0ce9589d6]*/
Larry Hastings44e2eaa2013-11-23 15:37:55 -0800121
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400122
123/*
To ensure the lookup algorithm terminates, there must be at least one Unused
slot (index == DKIX_EMPTY) in the table.
126To avoid slowing down lookups on a near-full table, we resize the table when
127it's USABLE_FRACTION (currently two-thirds) full.
128*/
Guido van Rossum16e93a81997-01-28 00:00:11 +0000129
/* Number of bits "perturb" is shifted right on every probe step; the
 * rationale for the value is given in the discussion that follows. */
#define PERTURB_SHIFT 5
131
Guido van Rossum16e93a81997-01-28 00:00:11 +0000132/*
Tim Peterseb28ef22001-06-02 05:27:19 +0000133Major subtleties ahead: Most hash schemes depend on having a "good" hash
134function, in the sense of simulating randomness. Python doesn't: its most
R David Murray537ad7a2016-07-10 12:33:18 -0400135important hash functions (for ints) are very regular in common
Tim Peterseb28ef22001-06-02 05:27:19 +0000136cases:
Tim Peters15d49292001-05-27 07:39:22 +0000137
R David Murray537ad7a2016-07-10 12:33:18 -0400138 >>>[hash(i) for i in range(4)]
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000139 [0, 1, 2, 3]
Tim Peters15d49292001-05-27 07:39:22 +0000140
Tim Peterseb28ef22001-06-02 05:27:19 +0000141This isn't necessarily bad! To the contrary, in a table of size 2**i, taking
142the low-order i bits as the initial table index is extremely fast, and there
R David Murray537ad7a2016-07-10 12:33:18 -0400143are no collisions at all for dicts indexed by a contiguous range of ints. So
144this gives better-than-random behavior in common cases, and that's very
145desirable.
Tim Peters15d49292001-05-27 07:39:22 +0000146
Tim Peterseb28ef22001-06-02 05:27:19 +0000147OTOH, when collisions occur, the tendency to fill contiguous slices of the
148hash table makes a good collision resolution strategy crucial. Taking only
149the last i bits of the hash code is also vulnerable: for example, consider
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000150the list [i << 16 for i in range(20000)] as a set of keys. Since ints are
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000151their own hash codes, and this fits in a dict of size 2**15, the last 15 bits
152 of every hash code are all 0: they *all* map to the same table index.
Tim Peters15d49292001-05-27 07:39:22 +0000153
Tim Peterseb28ef22001-06-02 05:27:19 +0000154But catering to unusual cases should not slow the usual ones, so we just take
155the last i bits anyway. It's up to collision resolution to do the rest. If
156we *usually* find the key we're looking for on the first try (and, it turns
157out, we usually do -- the table load factor is kept under 2/3, so the odds
158are solidly in our favor), then it makes best sense to keep the initial index
159computation dirt cheap.
Tim Peters15d49292001-05-27 07:39:22 +0000160
Tim Peterseb28ef22001-06-02 05:27:19 +0000161The first half of collision resolution is to visit table indices via this
162recurrence:
Tim Peters15d49292001-05-27 07:39:22 +0000163
Tim Peterseb28ef22001-06-02 05:27:19 +0000164 j = ((5*j) + 1) mod 2**i
Tim Peters15d49292001-05-27 07:39:22 +0000165
Tim Peterseb28ef22001-06-02 05:27:19 +0000166For any initial j in range(2**i), repeating that 2**i times generates each
167int in range(2**i) exactly once (see any text on random-number generation for
168proof). By itself, this doesn't help much: like linear probing (setting
169j += 1, or j -= 1, on each loop trip), it scans the table entries in a fixed
170order. This would be bad, except that's not the only thing we do, and it's
171actually *good* in the common cases where hash keys are consecutive. In an
172example that's really too small to make this entirely clear, for a table of
173size 2**3 the order of indices is:
Tim Peters15d49292001-05-27 07:39:22 +0000174
Tim Peterseb28ef22001-06-02 05:27:19 +0000175 0 -> 1 -> 6 -> 7 -> 4 -> 5 -> 2 -> 3 -> 0 [and here it's repeating]
176
177If two things come in at index 5, the first place we look after is index 2,
178not 6, so if another comes in at index 6 the collision at 5 didn't hurt it.
179Linear probing is deadly in this case because there the fixed probe order
180is the *same* as the order consecutive keys are likely to arrive. But it's
181extremely unlikely hash codes will follow a 5*j+1 recurrence by accident,
182and certain that consecutive hash codes do not.
183
184The other half of the strategy is to get the other bits of the hash code
185into play. This is done by initializing a (unsigned) vrbl "perturb" to the
186full hash code, and changing the recurrence to:
187
Tim Peterseb28ef22001-06-02 05:27:19 +0000188 perturb >>= PERTURB_SHIFT;
INADA Naoki267941c2016-10-06 15:19:07 +0900189 j = (5*j) + 1 + perturb;
Tim Peterseb28ef22001-06-02 05:27:19 +0000190 use j % 2**i as the next table index;
191
192Now the probe sequence depends (eventually) on every bit in the hash code,
193and the pseudo-scrambling property of recurring on 5*j+1 is more valuable,
194because it quickly magnifies small differences in the bits that didn't affect
195the initial index. Note that because perturb is unsigned, if the recurrence
196is executed often enough perturb eventually becomes and remains 0. At that
197point (very rarely reached) the recurrence is on (just) 5*j+1 again, and
198that's certain to find an empty slot eventually (since it generates every int
199in range(2**i), and we make sure there's always at least one empty slot).
200
201Selecting a good value for PERTURB_SHIFT is a balancing act. You want it
202small so that the high bits of the hash code continue to affect the probe
203sequence across iterations; but you want it large so that in really bad cases
204the high-order hash bits have an effect on early iterations. 5 was "the
205best" in minimizing total collisions across experiments Tim Peters ran (on
206both normal and pathological cases), but 4 and 6 weren't significantly worse.
207
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000208Historical: Reimer Behrends contributed the idea of using a polynomial-based
Tim Peterseb28ef22001-06-02 05:27:19 +0000209approach, using repeated multiplication by x in GF(2**n) where an irreducible
210polynomial for each table size was chosen such that x was a primitive root.
211Christian Tismer later extended that to use division by x instead, as an
212efficient way to get the high bits of the hash code into play. This scheme
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000213also gave excellent collision statistics, but was more expensive: two
214if-tests were required inside the loop; computing "the next" index took about
215the same number of operations but without as much potential parallelism
216(e.g., computing 5*j can go on at the same time as computing 1+perturb in the
217above, and then shifting perturb can be done while the table index is being
218masked); and the PyDictObject struct required a member to hold the table's
219polynomial. In Tim's experiments the current scheme ran faster, produced
220equally good collision statistics, needed less code & used less memory.
Thomas Wouters4d70c3d2006-06-08 14:42:34 +0000221
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000222*/
Tim Petersdea48ec2001-05-22 20:40:22 +0000223
Fred Drake1bff34a2000-08-31 19:31:38 +0000224/* forward declarations */
Victor Stinner742da042016-09-07 17:40:12 -0700225static Py_ssize_t lookdict(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900226 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700227 Py_ssize_t *hashpos);
228static Py_ssize_t lookdict_unicode(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900229 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700230 Py_ssize_t *hashpos);
231static Py_ssize_t
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400232lookdict_unicode_nodummy(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900233 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700234 Py_ssize_t *hashpos);
235static Py_ssize_t lookdict_split(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900236 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700237 Py_ssize_t *hashpos);
Fred Drake1bff34a2000-08-31 19:31:38 +0000238
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400239static int dictresize(PyDictObject *mp, Py_ssize_t minused);
Tim Petersdea48ec2001-05-22 20:40:22 +0000240
/* Counter shared by all dictionaries; its values are stored in the
 * ma_version_tag field. It advances each time a dictionary is created and
 * each time a dictionary is modified. */
static uint64_t pydict_global_version = 0;

/* Advance the shared counter and evaluate to the new (post-increment) value. */
#define DICT_NEXT_VERSION() (++pydict_global_version)
247
Victor Stinner742da042016-09-07 17:40:12 -0700248/* Dictionary reuse scheme to save calls to malloc and free */
Christian Heimes2202f872008-02-06 14:31:34 +0000249#ifndef PyDict_MAXFREELIST
250#define PyDict_MAXFREELIST 80
251#endif
252static PyDictObject *free_list[PyDict_MAXFREELIST];
253static int numfree = 0;
Victor Stinner742da042016-09-07 17:40:12 -0700254static PyDictKeysObject *keys_free_list[PyDict_MAXFREELIST];
255static int numfreekeys = 0;
Raymond Hettinger43442782004-03-17 21:55:03 +0000256
Serhiy Storchaka1009bf12015-04-03 23:53:51 +0300257#include "clinic/dictobject.c.h"
258
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100259int
260PyDict_ClearFreeList(void)
Christian Heimes77c02eb2008-02-09 02:18:51 +0000261{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000262 PyDictObject *op;
Victor Stinner742da042016-09-07 17:40:12 -0700263 int ret = numfree + numfreekeys;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000264 while (numfree) {
265 op = free_list[--numfree];
266 assert(PyDict_CheckExact(op));
267 PyObject_GC_Del(op);
268 }
Victor Stinner742da042016-09-07 17:40:12 -0700269 while (numfreekeys) {
270 PyObject_FREE(keys_free_list[--numfreekeys]);
271 }
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100272 return ret;
273}
274
David Malcolm49526f42012-06-22 14:55:41 -0400275/* Print summary info about the state of the optimized allocator */
276void
277_PyDict_DebugMallocStats(FILE *out)
278{
279 _PyDebugAllocatorStats(out,
280 "free PyDictObject", numfree, sizeof(PyDictObject));
281}
282
283
/* Finalization hook for this module: drops both free lists. The count
 * returned by PyDict_ClearFreeList() is not needed here. */
void
PyDict_Fini(void)
{
    (void)PyDict_ClearFreeList();
}
289
/* Number of slots in the index table of keys object `dk`. */
#define DK_SIZE(dk) ((dk)->dk_size)

/* Width, in bytes, of one element of dk_indices for the table size of `dk`.
 * The thresholds mirror the ones used by dk_get_index(), dk_set_index() and
 * new_keys_object(). The 8-byte width exists only when pointers are wider
 * than 4 bytes. */
#if SIZEOF_VOID_P > 4
#define DK_IXSIZE(dk)                       \
    (DK_SIZE(dk) <= 0xff ? 1                \
     : DK_SIZE(dk) <= 0xffff ? 2            \
     : DK_SIZE(dk) <= 0xffffffff ? 4        \
     : sizeof(int64_t))
#else
#define DK_IXSIZE(dk)                       \
    (DK_SIZE(dk) <= 0xff ? 1                \
     : DK_SIZE(dk) <= 0xffff ? 2            \
     : sizeof(int32_t))
#endif

/* Pointer to the first PyDictKeyEntry of `dk`. The entries start right after
 * the index table, i.e. DK_SIZE(dk) * DK_IXSIZE(dk) bytes past the start of
 * dk_indices. */
#define DK_ENTRIES(dk)                      \
    ((PyDictKeyEntry*)(                     \
        &(dk)->dk_indices.as_1[DK_SIZE(dk) * DK_IXSIZE(dk)]))
Victor Stinner742da042016-09-07 17:40:12 -0700305
/* Prefixes that also adjust the interpreter-wide reference total; what they
 * expand to is decided by _Py_INC_REFTOTAL / _Py_DEC_REFTOTAL /
 * _Py_REF_DEBUG_COMMA, which are defined outside this file. */
#define DK_DEBUG_INCREF _Py_INC_REFTOTAL _Py_REF_DEBUG_COMMA
#define DK_DEBUG_DECREF _Py_DEC_REFTOTAL _Py_REF_DEBUG_COMMA

/* Take one more reference to keys object `dk`. */
#define DK_INCREF(dk) (DK_DEBUG_INCREF ++(dk)->dk_refcnt)

/* Drop one reference to keys object `dk`; when the count reaches zero the
 * object is handed to free_keys_object(). Wrapped in do { } while (0) so the
 * macro is a single statement and is safe in an unbraced if/else.
 * NOTE: `dk` is evaluated more than once. */
#define DK_DECREF(dk)                                           \
    do {                                                        \
        if (DK_DEBUG_DECREF (--(dk)->dk_refcnt) == 0) {         \
            free_keys_object(dk);                               \
        }                                                       \
    } while (0)

/* Bit mask that reduces a hash/probe value to a valid slot number. */
#define DK_MASK(dk) (((dk)->dk_size)-1)

/* True when `x` has at most one bit set (so 0 also passes).
 * NOTE: `x` is evaluated twice. */
#define IS_POWER_OF_2(x) (((x) & ((x)-1)) == 0)
313
Victor Stinner742da042016-09-07 17:40:12 -0700314/* lookup indices. returns DKIX_EMPTY, DKIX_DUMMY, or ix >=0 */
Benjamin Peterson73222252016-09-08 09:58:47 -0700315static inline Py_ssize_t
Victor Stinner742da042016-09-07 17:40:12 -0700316dk_get_index(PyDictKeysObject *keys, Py_ssize_t i)
317{
318 Py_ssize_t s = DK_SIZE(keys);
Victor Stinner71211e32016-09-08 10:52:46 -0700319 Py_ssize_t ix;
320
Victor Stinner742da042016-09-07 17:40:12 -0700321 if (s <= 0xff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700322 int8_t *indices = keys->dk_indices.as_1;
Victor Stinner208857e2016-09-08 11:35:46 -0700323 ix = indices[i];
Victor Stinner742da042016-09-07 17:40:12 -0700324 }
325 else if (s <= 0xffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700326 int16_t *indices = keys->dk_indices.as_2;
Victor Stinner208857e2016-09-08 11:35:46 -0700327 ix = indices[i];
Victor Stinner742da042016-09-07 17:40:12 -0700328 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700329#if SIZEOF_VOID_P > 4
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300330 else if (s > 0xffffffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700331 int64_t *indices = keys->dk_indices.as_8;
Victor Stinner208857e2016-09-08 11:35:46 -0700332 ix = indices[i];
Victor Stinner742da042016-09-07 17:40:12 -0700333 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700334#endif
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300335 else {
336 int32_t *indices = keys->dk_indices.as_4;
337 ix = indices[i];
338 }
Victor Stinner71211e32016-09-08 10:52:46 -0700339 assert(ix >= DKIX_DUMMY);
340 return ix;
Victor Stinner742da042016-09-07 17:40:12 -0700341}
342
343/* write to indices. */
Benjamin Peterson73222252016-09-08 09:58:47 -0700344static inline void
Victor Stinner742da042016-09-07 17:40:12 -0700345dk_set_index(PyDictKeysObject *keys, Py_ssize_t i, Py_ssize_t ix)
346{
347 Py_ssize_t s = DK_SIZE(keys);
Victor Stinner71211e32016-09-08 10:52:46 -0700348
349 assert(ix >= DKIX_DUMMY);
350
Victor Stinner742da042016-09-07 17:40:12 -0700351 if (s <= 0xff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700352 int8_t *indices = keys->dk_indices.as_1;
Victor Stinner71211e32016-09-08 10:52:46 -0700353 assert(ix <= 0x7f);
Victor Stinner208857e2016-09-08 11:35:46 -0700354 indices[i] = (char)ix;
Victor Stinner742da042016-09-07 17:40:12 -0700355 }
356 else if (s <= 0xffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700357 int16_t *indices = keys->dk_indices.as_2;
Victor Stinner71211e32016-09-08 10:52:46 -0700358 assert(ix <= 0x7fff);
Victor Stinner208857e2016-09-08 11:35:46 -0700359 indices[i] = (int16_t)ix;
Victor Stinner742da042016-09-07 17:40:12 -0700360 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700361#if SIZEOF_VOID_P > 4
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300362 else if (s > 0xffffffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700363 int64_t *indices = keys->dk_indices.as_8;
Victor Stinner208857e2016-09-08 11:35:46 -0700364 indices[i] = ix;
Victor Stinner742da042016-09-07 17:40:12 -0700365 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700366#endif
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300367 else {
368 int32_t *indices = keys->dk_indices.as_4;
369 assert(ix <= 0x7fffffff);
370 indices[i] = (int32_t)ix;
371 }
Victor Stinner742da042016-09-07 17:40:12 -0700372}
373
374
/* USABLE_FRACTION(n): maximum number of entries a table with n slots may
 * hold, i.e. the maximum dictionary load.
 *
 * A larger ratio makes dictionaries denser and so causes more collisions.
 * A smaller ratio makes them sparser, at the price of spreading the indices
 * over more cache lines and of higher total memory use.
 *
 * Requirements:
 *   - (0 < USABLE_FRACTION(n) < n) for all n >= 2
 *   - it should be quick to calculate.
 * Fractions around 1/2 to 2/3 seem to work well in practice; the current
 * definition is two-thirds, rounded down.
 */
#define USABLE_FRACTION(n) \
    (((n) << 1)/3)

/* ESTIMATE_SIZE(n): reverse function of USABLE_FRACTION. It can be used to
 * reserve a table large enough to insert n entries without resizing.
 */
#define ESTIMATE_SIZE(n) \
    (((n)*3+1) >> 1)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400393
Victor Stinner742da042016-09-07 17:40:12 -0700394/* Alternative fraction that is otherwise close enough to 2n/3 to make
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400395 * little difference. 8 * 2/3 == 8 * 5/8 == 5. 16 * 2/3 == 16 * 5/8 == 10.
396 * 32 * 2/3 = 21, 32 * 5/8 = 20.
397 * Its advantage is that it is faster to compute on machines with slow division.
398 * #define USABLE_FRACTION(n) (((n) >> 1) + ((n) >> 2) - ((n) >> 3))
Victor Stinner742da042016-09-07 17:40:12 -0700399 */
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400400
/* GROWTH_RATE(d): size requested for dict `d` once it hits maximum load.
 *
 * Current formula: used*2 + capacity/2.
 * Dicts therefore double in size when they grow without deletions, and get
 * more head room when the number of deletions is on a par with the number
 * of insertions.
 * Raising this to used*4 doubles memory consumption depending on the size of
 * the dictionary, but halves the number of resizes (less resize effort).
 *
 * History:
 *   - used*4 up to version 3.2
 *   - used*2 in version 3.3.0
 */
#define GROWTH_RATE(d) \
    (((d)->ma_used*2) + ((d)->ma_keys->dk_size>>1))
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400413
/* If dict `d` currently uses the lookdict_unicode_nodummy lookup function,
 * switch its keys object to lookdict_unicode; every other lookup function is
 * left untouched. Wrapped in do { } while (0) so the macro is a single
 * statement and is safe in an unbraced if/else.
 * NOTE: `d` is evaluated more than once. */
#define ENSURE_ALLOWS_DELETIONS(d)                                      \
    do {                                                                \
        if ((d)->ma_keys->dk_lookup == lookdict_unicode_nodummy) {      \
            (d)->ma_keys->dk_lookup = lookdict_unicode;                 \
        }                                                               \
    } while (0)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400418
419/* This immutable, empty PyDictKeysObject is used for PyDict_Clear()
420 * (which cannot fail and thus can do no allocation).
421 */
422static PyDictKeysObject empty_keys_struct = {
Serhiy Storchaka97932e42016-09-26 23:01:23 +0300423 1, /* dk_refcnt */
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400424 1, /* dk_size */
425 lookdict_split, /* dk_lookup */
426 0, /* dk_usable (immutable) */
Victor Stinner742da042016-09-07 17:40:12 -0700427 0, /* dk_nentries */
Benjamin Peterson186122e2016-09-08 12:20:12 -0700428 .dk_indices = { .as_1 = {DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY,
429 DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY}},
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400430};
431
432static PyObject *empty_values[1] = { NULL };
433
434#define Py_EMPTY_KEYS &empty_keys_struct
435
Victor Stinner611b0fa2016-09-14 15:02:01 +0200436/* Uncomment to check the dict content in _PyDict_CheckConsistency() */
437/* #define DEBUG_PYDICT */
438
439
#ifdef Py_DEBUG
/* Debug-build sanity check of the invariants of dict `mp`.
 *
 * Every check is an assert(); the function itself always returns 1 so that
 * it can be used as `assert(_PyDict_CheckConsistency(mp))`.
 * The cheap checks on counters always run. The per-slot and per-entry checks
 * run only when DEBUG_PYDICT is defined.
 */
static int
_PyDict_CheckConsistency(PyDictObject *mp)
{
    PyDictKeysObject *dk = mp->ma_keys;
    const int is_split = _PyDict_HasSplitTable(mp);
    const Py_ssize_t capacity = USABLE_FRACTION(dk->dk_size);

    /* Counters must be non-negative and within the usable capacity. */
    assert(mp->ma_used >= 0);
    assert(mp->ma_used <= capacity);
    assert(IS_POWER_OF_2(dk->dk_size));
    assert(dk->dk_usable >= 0);
    assert(dk->dk_usable <= capacity);
    assert(dk->dk_nentries >= 0);
    assert(dk->dk_nentries <= capacity);
    assert(dk->dk_usable + dk->dk_nentries <= capacity);

    if (!is_split) {
        /* combined table: the keys object is not shared */
        assert(dk->dk_refcnt == 1);
    }

#ifdef DEBUG_PYDICT
    PyDictKeyEntry *entries = DK_ENTRIES(dk);

    /* Every stored index is a marker or lies within the capacity. */
    for (Py_ssize_t slot = 0; slot < dk->dk_size; slot++) {
        Py_ssize_t ix = dk_get_index(dk, slot);
        assert(DKIX_DUMMY <= ix && ix <= capacity);
    }

    for (Py_ssize_t n = 0; n < capacity; n++) {
        PyDictKeyEntry *ep = &entries[n];
        PyObject *key = ep->me_key;

        if (key != NULL) {
            if (PyUnicode_CheckExact(key)) {
                /* The cached hash must match the string's own hash. */
                Py_hash_t cached = ((PyASCIIObject *)key)->hash;
                assert(cached != -1);
                assert(ep->me_hash == cached);
            }
            else {
                /* test_dict fails if PyObject_Hash() is called again */
                assert(ep->me_hash != -1);
            }
            if (!is_split) {
                assert(ep->me_value != NULL);
            }
        }

        if (is_split) {
            /* split tables keep their values in ma_values instead */
            assert(ep->me_value == NULL);
        }
    }

    if (is_split) {
        /* splitted table: the first ma_used values must all be set */
        for (Py_ssize_t n = 0; n < mp->ma_used; n++) {
            assert(mp->ma_values[n] != NULL);
        }
    }
#endif

    return 1;
}
#endif
506
507
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400508static PyDictKeysObject *new_keys_object(Py_ssize_t size)
509{
510 PyDictKeysObject *dk;
Victor Stinner742da042016-09-07 17:40:12 -0700511 Py_ssize_t es, usable;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400512
Victor Stinner742da042016-09-07 17:40:12 -0700513 assert(size >= PyDict_MINSIZE);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400514 assert(IS_POWER_OF_2(size));
Victor Stinner742da042016-09-07 17:40:12 -0700515
516 usable = USABLE_FRACTION(size);
517 if (size <= 0xff) {
518 es = 1;
519 }
520 else if (size <= 0xffff) {
521 es = 2;
522 }
523#if SIZEOF_VOID_P > 4
524 else if (size <= 0xffffffff) {
525 es = 4;
526 }
527#endif
528 else {
529 es = sizeof(Py_ssize_t);
530 }
531
532 if (size == PyDict_MINSIZE && numfreekeys > 0) {
533 dk = keys_free_list[--numfreekeys];
534 }
535 else {
Victor Stinner98ee9d52016-09-08 09:33:56 -0700536 dk = PyObject_MALLOC(sizeof(PyDictKeysObject)
537 - Py_MEMBER_SIZE(PyDictKeysObject, dk_indices)
538 + es * size
539 + sizeof(PyDictKeyEntry) * usable);
Victor Stinner742da042016-09-07 17:40:12 -0700540 if (dk == NULL) {
541 PyErr_NoMemory();
542 return NULL;
543 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400544 }
Antoine Pitrou2d169b22012-05-12 23:43:44 +0200545 DK_DEBUG_INCREF dk->dk_refcnt = 1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400546 dk->dk_size = size;
Victor Stinner742da042016-09-07 17:40:12 -0700547 dk->dk_usable = usable;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400548 dk->dk_lookup = lookdict_unicode_nodummy;
Victor Stinner742da042016-09-07 17:40:12 -0700549 dk->dk_nentries = 0;
Benjamin Peterson186122e2016-09-08 12:20:12 -0700550 memset(&dk->dk_indices.as_1[0], 0xff, es * size);
Victor Stinner742da042016-09-07 17:40:12 -0700551 memset(DK_ENTRIES(dk), 0, sizeof(PyDictKeyEntry) * usable);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400552 return dk;
553}
554
555static void
556free_keys_object(PyDictKeysObject *keys)
557{
Victor Stinner742da042016-09-07 17:40:12 -0700558 PyDictKeyEntry *entries = DK_ENTRIES(keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400559 Py_ssize_t i, n;
Victor Stinner742da042016-09-07 17:40:12 -0700560 for (i = 0, n = keys->dk_nentries; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400561 Py_XDECREF(entries[i].me_key);
562 Py_XDECREF(entries[i].me_value);
563 }
Victor Stinner742da042016-09-07 17:40:12 -0700564 if (keys->dk_size == PyDict_MINSIZE && numfreekeys < PyDict_MAXFREELIST) {
565 keys_free_list[numfreekeys++] = keys;
566 return;
567 }
Raymond Hettingerce5179f2016-01-31 08:56:21 -0800568 PyObject_FREE(keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400569}
570
/* Allocate an uninitialized array of `size` PyObject pointers for a split
 * table. */
#define new_values(size) PyMem_NEW(PyObject *, (size))

/* Release an array obtained from new_values(). */
#define free_values(values) PyMem_FREE((values))
573
574/* Consumes a reference to the keys object */
575static PyObject *
576new_dict(PyDictKeysObject *keys, PyObject **values)
577{
578 PyDictObject *mp;
Victor Stinnerc9b7f512013-07-08 22:19:20 +0200579 assert(keys != NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000580 if (numfree) {
581 mp = free_list[--numfree];
582 assert (mp != NULL);
583 assert (Py_TYPE(mp) == &PyDict_Type);
584 _Py_NewReference((PyObject *)mp);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000585 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400586 else {
587 mp = PyObject_GC_New(PyDictObject, &PyDict_Type);
588 if (mp == NULL) {
589 DK_DECREF(keys);
590 free_values(values);
591 return NULL;
592 }
593 }
594 mp->ma_keys = keys;
595 mp->ma_values = values;
596 mp->ma_used = 0;
Victor Stinner3b6a6b42016-09-08 12:51:24 -0700597 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner611b0fa2016-09-14 15:02:01 +0200598 assert(_PyDict_CheckConsistency(mp));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000599 return (PyObject *)mp;
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000600}
601
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400602/* Consumes a reference to the keys object */
603static PyObject *
604new_dict_with_shared_keys(PyDictKeysObject *keys)
605{
606 PyObject **values;
607 Py_ssize_t i, size;
608
Victor Stinner742da042016-09-07 17:40:12 -0700609 size = USABLE_FRACTION(DK_SIZE(keys));
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400610 values = new_values(size);
611 if (values == NULL) {
612 DK_DECREF(keys);
613 return PyErr_NoMemory();
614 }
615 for (i = 0; i < size; i++) {
616 values[i] = NULL;
617 }
618 return new_dict(keys, values);
619}
620
621PyObject *
622PyDict_New(void)
623{
Victor Stinner742da042016-09-07 17:40:12 -0700624 PyDictKeysObject *keys = new_keys_object(PyDict_MINSIZE);
Victor Stinnerc9b7f512013-07-08 22:19:20 +0200625 if (keys == NULL)
626 return NULL;
627 return new_dict(keys, NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400628}
629
Victor Stinner742da042016-09-07 17:40:12 -0700630/* Search index of hash table from offset of entry table */
631static Py_ssize_t
632lookdict_index(PyDictKeysObject *k, Py_hash_t hash, Py_ssize_t index)
633{
INADA Naoki267941c2016-10-06 15:19:07 +0900634 size_t i;
Victor Stinner742da042016-09-07 17:40:12 -0700635 size_t mask = DK_MASK(k);
636 Py_ssize_t ix;
637
638 i = (size_t)hash & mask;
639 ix = dk_get_index(k, i);
640 if (ix == index) {
641 return i;
642 }
643 if (ix == DKIX_EMPTY) {
644 return DKIX_EMPTY;
645 }
646
INADA Naoki267941c2016-10-06 15:19:07 +0900647 for (size_t perturb = hash;;) {
648 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700649 i = mask & ((i << 2) + i + perturb + 1);
650 ix = dk_get_index(k, i);
651 if (ix == index) {
652 return i;
653 }
654 if (ix == DKIX_EMPTY) {
655 return DKIX_EMPTY;
656 }
657 }
658 assert(0); /* NOT REACHED */
659 return DKIX_ERROR;
660}
661
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000662/*
663The basic lookup function used by all operations.
Guido van Rossum16e93a81997-01-28 00:00:11 +0000664This is based on Algorithm D from Knuth Vol. 3, Sec. 6.4.
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000665Open addressing is preferred over chaining since the link overhead for
666chaining would be substantial (100% with typical malloc overhead).
667
Tim Peterseb28ef22001-06-02 05:27:19 +0000668The initial probe index is computed as hash mod the table size. Subsequent
669probe indices are computed as explained earlier.
Guido van Rossum2bc13791999-03-24 19:06:42 +0000670
671All arithmetic on hash should ignore overflow.
Guido van Rossum16e93a81997-01-28 00:00:11 +0000672
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000673The details in this version are due to Tim Peters, building on many past
Tim Peterseb28ef22001-06-02 05:27:19 +0000674contributions by Reimer Behrends, Jyrki Alakuijala, Vladimir Marangozov and
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000675Christian Tismer.
Fred Drake1bff34a2000-08-31 19:31:38 +0000676
Victor Stinner742da042016-09-07 17:40:12 -0700677lookdict() is general-purpose, and may return DKIX_ERROR if (and only if) a
Victor Stinnera4348cc2016-09-08 12:01:25 -0700678comparison raises an exception.
Guido van Rossum89d8c602007-09-18 17:26:56 +0000679lookdict_unicode() below is specialized to string keys, comparison of which can
Victor Stinner742da042016-09-07 17:40:12 -0700680never raise an exception; that function can never return DKIX_ERROR.
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400681lookdict_unicode_nodummy is further specialized for string keys that cannot be
682the <dummy> value.
Victor Stinner742da042016-09-07 17:40:12 -0700683For both, when the key isn't found a DKIX_EMPTY is returned. hashpos returns
684where the key index should be inserted.
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000685*/
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100686static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400687lookdict(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900688 Py_hash_t hash, PyObject **value_addr, Py_ssize_t *hashpos)
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000689{
INADA Naoki267941c2016-10-06 15:19:07 +0900690 size_t i, mask;
Victor Stinner742da042016-09-07 17:40:12 -0700691 Py_ssize_t ix, freeslot;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200692 int cmp;
Victor Stinner742da042016-09-07 17:40:12 -0700693 PyDictKeysObject *dk;
694 PyDictKeyEntry *ep0, *ep;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000695 PyObject *startkey;
Tim Peterseb28ef22001-06-02 05:27:19 +0000696
Antoine Pitrou9a234902012-05-13 20:48:01 +0200697top:
Victor Stinner742da042016-09-07 17:40:12 -0700698 dk = mp->ma_keys;
699 mask = DK_MASK(dk);
700 ep0 = DK_ENTRIES(dk);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000701 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700702
703 ix = dk_get_index(dk, i);
704 if (ix == DKIX_EMPTY) {
705 if (hashpos != NULL)
706 *hashpos = i;
707 *value_addr = NULL;
708 return DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400709 }
Victor Stinner742da042016-09-07 17:40:12 -0700710 if (ix == DKIX_DUMMY) {
711 freeslot = i;
712 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000713 else {
Victor Stinner742da042016-09-07 17:40:12 -0700714 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300715 assert(ep->me_key != NULL);
Victor Stinner742da042016-09-07 17:40:12 -0700716 if (ep->me_key == key) {
INADA Naokiba609772016-12-07 20:41:42 +0900717 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700718 if (hashpos != NULL)
719 *hashpos = i;
720 return ix;
721 }
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300722 if (ep->me_hash == hash) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000723 startkey = ep->me_key;
724 Py_INCREF(startkey);
725 cmp = PyObject_RichCompareBool(startkey, key, Py_EQ);
726 Py_DECREF(startkey);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +0200727 if (cmp < 0) {
728 *value_addr = NULL;
Victor Stinner742da042016-09-07 17:40:12 -0700729 return DKIX_ERROR;
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +0200730 }
Victor Stinner742da042016-09-07 17:40:12 -0700731 if (dk == mp->ma_keys && ep->me_key == startkey) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400732 if (cmp > 0) {
INADA Naokiba609772016-12-07 20:41:42 +0900733 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700734 if (hashpos != NULL)
735 *hashpos = i;
736 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400737 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000738 }
739 else {
Antoine Pitrou9a234902012-05-13 20:48:01 +0200740 /* The dict was mutated, restart */
741 goto top;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000742 }
743 }
Victor Stinner742da042016-09-07 17:40:12 -0700744 freeslot = -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000745 }
Tim Peters15d49292001-05-27 07:39:22 +0000746
INADA Naoki267941c2016-10-06 15:19:07 +0900747 for (size_t perturb = hash;;) {
748 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700749 i = ((i << 2) + i + perturb + 1) & mask;
750 ix = dk_get_index(dk, i);
751 if (ix == DKIX_EMPTY) {
752 if (hashpos != NULL) {
753 *hashpos = (freeslot == -1) ? (Py_ssize_t)i : freeslot;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400754 }
Victor Stinner742da042016-09-07 17:40:12 -0700755 *value_addr = NULL;
756 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400757 }
Victor Stinner742da042016-09-07 17:40:12 -0700758 if (ix == DKIX_DUMMY) {
759 if (freeslot == -1)
760 freeslot = i;
761 continue;
762 }
763 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300764 assert(ep->me_key != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400765 if (ep->me_key == key) {
Victor Stinner742da042016-09-07 17:40:12 -0700766 if (hashpos != NULL) {
767 *hashpos = i;
768 }
INADA Naokiba609772016-12-07 20:41:42 +0900769 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700770 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400771 }
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300772 if (ep->me_hash == hash) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000773 startkey = ep->me_key;
774 Py_INCREF(startkey);
775 cmp = PyObject_RichCompareBool(startkey, key, Py_EQ);
776 Py_DECREF(startkey);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400777 if (cmp < 0) {
778 *value_addr = NULL;
Victor Stinner742da042016-09-07 17:40:12 -0700779 return DKIX_ERROR;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400780 }
Victor Stinner742da042016-09-07 17:40:12 -0700781 if (dk == mp->ma_keys && ep->me_key == startkey) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400782 if (cmp > 0) {
Victor Stinner742da042016-09-07 17:40:12 -0700783 if (hashpos != NULL) {
784 *hashpos = i;
785 }
INADA Naokiba609772016-12-07 20:41:42 +0900786 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700787 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400788 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000789 }
790 else {
Antoine Pitrou9a234902012-05-13 20:48:01 +0200791 /* The dict was mutated, restart */
792 goto top;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000793 }
794 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000795 }
796 assert(0); /* NOT REACHED */
797 return 0;
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000798}
799
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400800/* Specialized version for string-only keys */
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100801static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400802lookdict_unicode(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900803 Py_hash_t hash, PyObject **value_addr, Py_ssize_t *hashpos)
Fred Drake1bff34a2000-08-31 19:31:38 +0000804{
INADA Naoki267941c2016-10-06 15:19:07 +0900805 size_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200806 size_t mask = DK_MASK(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -0700807 Py_ssize_t ix, freeslot;
808 PyDictKeyEntry *ep, *ep0 = DK_ENTRIES(mp->ma_keys);
Fred Drake1bff34a2000-08-31 19:31:38 +0000809
Victor Stinner742da042016-09-07 17:40:12 -0700810 assert(mp->ma_values == NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000811 /* Make sure this function doesn't have to handle non-unicode keys,
812 including subclasses of str; e.g., one reason to subclass
813 unicodes is to override __eq__, and for speed we don't cater to
814 that here. */
815 if (!PyUnicode_CheckExact(key)) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400816 mp->ma_keys->dk_lookup = lookdict;
Victor Stinner742da042016-09-07 17:40:12 -0700817 return lookdict(mp, key, hash, value_addr, hashpos);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000818 }
Mark Dickinson57e683e2011-09-24 18:18:40 +0100819 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700820 ix = dk_get_index(mp->ma_keys, i);
821 if (ix == DKIX_EMPTY) {
822 if (hashpos != NULL)
823 *hashpos = i;
824 *value_addr = NULL;
825 return DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400826 }
Victor Stinner742da042016-09-07 17:40:12 -0700827 if (ix == DKIX_DUMMY) {
828 freeslot = i;
829 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000830 else {
Victor Stinner742da042016-09-07 17:40:12 -0700831 ep = &ep0[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700832 assert(ep->me_key != NULL);
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300833 if (ep->me_key == key
834 || (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700835 if (hashpos != NULL)
836 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900837 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700838 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400839 }
Victor Stinner742da042016-09-07 17:40:12 -0700840 freeslot = -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000841 }
Tim Peters15d49292001-05-27 07:39:22 +0000842
INADA Naoki267941c2016-10-06 15:19:07 +0900843 for (size_t perturb = hash;;) {
844 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700845 i = mask & ((i << 2) + i + perturb + 1);
846 ix = dk_get_index(mp->ma_keys, i);
847 if (ix == DKIX_EMPTY) {
848 if (hashpos != NULL) {
849 *hashpos = (freeslot == -1) ? (Py_ssize_t)i : freeslot;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400850 }
Victor Stinner742da042016-09-07 17:40:12 -0700851 *value_addr = NULL;
852 return DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400853 }
Victor Stinner742da042016-09-07 17:40:12 -0700854 if (ix == DKIX_DUMMY) {
855 if (freeslot == -1)
856 freeslot = i;
857 continue;
858 }
859 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300860 assert(ep->me_key != NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000861 if (ep->me_key == key
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300862 || (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
INADA Naokiba609772016-12-07 20:41:42 +0900863 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700864 if (hashpos != NULL) {
865 *hashpos = i;
866 }
867 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400868 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000869 }
870 assert(0); /* NOT REACHED */
871 return 0;
Fred Drake1bff34a2000-08-31 19:31:38 +0000872}
873
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400874/* Faster version of lookdict_unicode when it is known that no <dummy> keys
875 * will be present. */
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100876static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400877lookdict_unicode_nodummy(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900878 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700879 Py_ssize_t *hashpos)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400880{
INADA Naoki267941c2016-10-06 15:19:07 +0900881 size_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200882 size_t mask = DK_MASK(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -0700883 Py_ssize_t ix;
884 PyDictKeyEntry *ep, *ep0 = DK_ENTRIES(mp->ma_keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400885
Victor Stinner742da042016-09-07 17:40:12 -0700886 assert(mp->ma_values == NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400887 /* Make sure this function doesn't have to handle non-unicode keys,
888 including subclasses of str; e.g., one reason to subclass
889 unicodes is to override __eq__, and for speed we don't cater to
890 that here. */
891 if (!PyUnicode_CheckExact(key)) {
892 mp->ma_keys->dk_lookup = lookdict;
Victor Stinner742da042016-09-07 17:40:12 -0700893 return lookdict(mp, key, hash, value_addr, hashpos);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400894 }
895 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700896 ix = dk_get_index(mp->ma_keys, i);
897 assert (ix != DKIX_DUMMY);
898 if (ix == DKIX_EMPTY) {
899 if (hashpos != NULL)
900 *hashpos = i;
901 *value_addr = NULL;
902 return DKIX_EMPTY;
903 }
904 ep = &ep0[ix];
Victor Stinnerdee6e252016-09-08 11:16:07 -0700905 assert(ep->me_key != NULL);
906 assert(PyUnicode_CheckExact(ep->me_key));
Victor Stinner742da042016-09-07 17:40:12 -0700907 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400908 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700909 if (hashpos != NULL)
910 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900911 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700912 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400913 }
INADA Naoki267941c2016-10-06 15:19:07 +0900914 for (size_t perturb = hash;;) {
915 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700916 i = mask & ((i << 2) + i + perturb + 1);
917 ix = dk_get_index(mp->ma_keys, i);
918 assert (ix != DKIX_DUMMY);
919 if (ix == DKIX_EMPTY) {
920 if (hashpos != NULL)
921 *hashpos = i;
922 *value_addr = NULL;
923 return DKIX_EMPTY;
924 }
925 ep = &ep0[ix];
926 assert(ep->me_key != NULL && PyUnicode_CheckExact(ep->me_key));
927 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400928 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700929 if (hashpos != NULL)
930 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900931 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700932 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400933 }
934 }
935 assert(0); /* NOT REACHED */
936 return 0;
937}
938
939/* Version of lookdict for split tables.
940 * All split tables and only split tables use this lookup function.
941 * Split tables only contain unicode keys and no dummy keys,
942 * so algorithm is the same as lookdict_unicode_nodummy.
943 */
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100944static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400945lookdict_split(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900946 Py_hash_t hash, PyObject **value_addr, Py_ssize_t *hashpos)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400947{
INADA Naoki267941c2016-10-06 15:19:07 +0900948 size_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200949 size_t mask = DK_MASK(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -0700950 Py_ssize_t ix;
951 PyDictKeyEntry *ep, *ep0 = DK_ENTRIES(mp->ma_keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400952
Victor Stinner742da042016-09-07 17:40:12 -0700953 /* mp must split table */
954 assert(mp->ma_values != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400955 if (!PyUnicode_CheckExact(key)) {
Victor Stinner742da042016-09-07 17:40:12 -0700956 ix = lookdict(mp, key, hash, value_addr, hashpos);
957 if (ix >= 0) {
INADA Naokiba609772016-12-07 20:41:42 +0900958 *value_addr = mp->ma_values[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700959 }
960 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400961 }
Victor Stinner742da042016-09-07 17:40:12 -0700962
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400963 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700964 ix = dk_get_index(mp->ma_keys, i);
965 if (ix == DKIX_EMPTY) {
966 if (hashpos != NULL)
967 *hashpos = i;
968 *value_addr = NULL;
969 return DKIX_EMPTY;
970 }
971 assert(ix >= 0);
972 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300973 assert(ep->me_key != NULL && PyUnicode_CheckExact(ep->me_key));
Victor Stinner742da042016-09-07 17:40:12 -0700974 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400975 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700976 if (hashpos != NULL)
977 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900978 *value_addr = mp->ma_values[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700979 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400980 }
INADA Naoki267941c2016-10-06 15:19:07 +0900981 for (size_t perturb = hash;;) {
982 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700983 i = mask & ((i << 2) + i + perturb + 1);
984 ix = dk_get_index(mp->ma_keys, i);
985 if (ix == DKIX_EMPTY) {
986 if (hashpos != NULL)
987 *hashpos = i;
988 *value_addr = NULL;
989 return DKIX_EMPTY;
990 }
991 assert(ix >= 0);
992 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300993 assert(ep->me_key != NULL && PyUnicode_CheckExact(ep->me_key));
Victor Stinner742da042016-09-07 17:40:12 -0700994 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400995 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700996 if (hashpos != NULL)
997 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900998 *value_addr = mp->ma_values[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700999 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001000 }
1001 }
1002 assert(0); /* NOT REACHED */
1003 return 0;
1004}
1005
Benjamin Petersonfb886362010-04-24 18:21:17 +00001006int
1007_PyDict_HasOnlyStringKeys(PyObject *dict)
1008{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001009 Py_ssize_t pos = 0;
1010 PyObject *key, *value;
Benjamin Petersonf6096542010-11-17 22:33:12 +00001011 assert(PyDict_Check(dict));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001012 /* Shortcut */
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001013 if (((PyDictObject *)dict)->ma_keys->dk_lookup != lookdict)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001014 return 1;
1015 while (PyDict_Next(dict, &pos, &key, &value))
1016 if (!PyUnicode_Check(key))
1017 return 0;
1018 return 1;
Benjamin Petersonfb886362010-04-24 18:21:17 +00001019}
1020
/* Start GC-tracking `mp` if it is not tracked yet and either `key` or
 * `value` may itself be tracked by the GC. */
#define MAINTAIN_TRACKING(mp, key, value) \
    do { \
        if (!_PyObject_GC_IS_TRACKED(mp) && \
            (_PyObject_GC_MAY_BE_TRACKED(key) || \
             _PyObject_GC_MAY_BE_TRACKED(value))) { \
            _PyObject_GC_TRACK(mp); \
        } \
    } while(0)
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001030
1031void
1032_PyDict_MaybeUntrack(PyObject *op)
1033{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001034 PyDictObject *mp;
1035 PyObject *value;
Victor Stinner742da042016-09-07 17:40:12 -07001036 Py_ssize_t i, numentries;
1037 PyDictKeyEntry *ep0;
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001038
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001039 if (!PyDict_CheckExact(op) || !_PyObject_GC_IS_TRACKED(op))
1040 return;
1041
1042 mp = (PyDictObject *) op;
Victor Stinner742da042016-09-07 17:40:12 -07001043 ep0 = DK_ENTRIES(mp->ma_keys);
1044 numentries = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001045 if (_PyDict_HasSplitTable(mp)) {
Victor Stinner742da042016-09-07 17:40:12 -07001046 for (i = 0; i < numentries; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001047 if ((value = mp->ma_values[i]) == NULL)
1048 continue;
1049 if (_PyObject_GC_MAY_BE_TRACKED(value)) {
Victor Stinner742da042016-09-07 17:40:12 -07001050 assert(!_PyObject_GC_MAY_BE_TRACKED(ep0[i].me_key));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001051 return;
1052 }
1053 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001054 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001055 else {
Victor Stinner742da042016-09-07 17:40:12 -07001056 for (i = 0; i < numentries; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001057 if ((value = ep0[i].me_value) == NULL)
1058 continue;
1059 if (_PyObject_GC_MAY_BE_TRACKED(value) ||
1060 _PyObject_GC_MAY_BE_TRACKED(ep0[i].me_key))
1061 return;
1062 }
1063 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001064 _PyObject_GC_UNTRACK(op);
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001065}
1066
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001067/* Internal function to find slot for an item from its hash
Victor Stinner3c336c52016-09-12 14:17:40 +02001068 when it is known that the key is not present in the dict.
1069
1070 The dict must be combined. */
INADA Naokiba609772016-12-07 20:41:42 +09001071static Py_ssize_t
1072find_empty_slot(PyDictKeysObject *keys, PyObject *key, Py_hash_t hash)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001073{
INADA Naoki267941c2016-10-06 15:19:07 +09001074 size_t i;
INADA Naokiba609772016-12-07 20:41:42 +09001075 size_t mask = DK_MASK(keys);
Victor Stinner742da042016-09-07 17:40:12 -07001076 Py_ssize_t ix;
Tim Peters6d6c1a32001-08-02 04:15:00 +00001077
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001078 assert(key != NULL);
Victor Stinner3c336c52016-09-12 14:17:40 +02001079
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001080 i = hash & mask;
INADA Naokiba609772016-12-07 20:41:42 +09001081 ix = dk_get_index(keys, i);
INADA Naoki267941c2016-10-06 15:19:07 +09001082 for (size_t perturb = hash; ix != DKIX_EMPTY;) {
1083 perturb >>= PERTURB_SHIFT;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001084 i = (i << 2) + i + perturb + 1;
INADA Naokiba609772016-12-07 20:41:42 +09001085 ix = dk_get_index(keys, i & mask);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001086 }
INADA Naokiba609772016-12-07 20:41:42 +09001087 assert(DK_ENTRIES(keys)[keys->dk_nentries].me_value == NULL);
1088 return i & mask;
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001089}
1090
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001091static int
1092insertion_resize(PyDictObject *mp)
1093{
Raymond Hettinger36f74aa2013-05-17 03:01:13 -07001094 return dictresize(mp, GROWTH_RATE(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001095}
Antoine Pitroue965d972012-02-27 00:45:12 +01001096
1097/*
1098Internal routine to insert a new item into the table.
1099Used both by the internal resize routine and by the public insert routine.
Antoine Pitroue965d972012-02-27 00:45:12 +01001100Returns -1 if an error occurred, or 0 on success.
1101*/
1102static int
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001103insertdict(PyDictObject *mp, PyObject *key, Py_hash_t hash, PyObject *value)
Antoine Pitroue965d972012-02-27 00:45:12 +01001104{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001105 PyObject *old_value;
INADA Naokiba609772016-12-07 20:41:42 +09001106 PyDictKeyEntry *ep;
Victor Stinner742da042016-09-07 17:40:12 -07001107 Py_ssize_t hashpos, ix;
Antoine Pitroue965d972012-02-27 00:45:12 +01001108
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001109 if (mp->ma_values != NULL && !PyUnicode_CheckExact(key)) {
1110 if (insertion_resize(mp) < 0)
1111 return -1;
1112 }
1113
INADA Naokiba609772016-12-07 20:41:42 +09001114 ix = mp->ma_keys->dk_lookup(mp, key, hash, &old_value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07001115 if (ix == DKIX_ERROR) {
Antoine Pitroue965d972012-02-27 00:45:12 +01001116 return -1;
1117 }
Victor Stinner742da042016-09-07 17:40:12 -07001118
Antoine Pitroud6967322014-10-18 00:35:00 +02001119 assert(PyUnicode_CheckExact(key) || mp->ma_keys->dk_lookup == lookdict);
Benjamin Petersona6f195e2012-04-30 10:23:40 -04001120 Py_INCREF(value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001121 MAINTAIN_TRACKING(mp, key, value);
Victor Stinner742da042016-09-07 17:40:12 -07001122
1123 /* When insertion order is different from shared key, we can't share
1124 * the key anymore. Convert this instance to combine table.
1125 */
1126 if (_PyDict_HasSplitTable(mp) &&
INADA Naokiba609772016-12-07 20:41:42 +09001127 ((ix >= 0 && old_value == NULL && mp->ma_used != ix) ||
Victor Stinner742da042016-09-07 17:40:12 -07001128 (ix == DKIX_EMPTY && mp->ma_used != mp->ma_keys->dk_nentries))) {
1129 if (insertion_resize(mp) < 0) {
1130 Py_DECREF(value);
1131 return -1;
1132 }
INADA Naokiba609772016-12-07 20:41:42 +09001133 hashpos = find_empty_slot(mp->ma_keys, key, hash);
Victor Stinner742da042016-09-07 17:40:12 -07001134 ix = DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001135 }
Victor Stinner742da042016-09-07 17:40:12 -07001136
1137 if (ix == DKIX_EMPTY) {
1138 /* Insert into new slot. */
INADA Naokiba609772016-12-07 20:41:42 +09001139 assert(old_value == NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001140 if (mp->ma_keys->dk_usable <= 0) {
1141 /* Need to resize. */
1142 if (insertion_resize(mp) < 0) {
1143 Py_DECREF(value);
1144 return -1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001145 }
INADA Naokiba609772016-12-07 20:41:42 +09001146 hashpos = find_empty_slot(mp->ma_keys, key, hash);
Victor Stinner742da042016-09-07 17:40:12 -07001147 }
INADA Naokiba609772016-12-07 20:41:42 +09001148 ep = &DK_ENTRIES(mp->ma_keys)[mp->ma_keys->dk_nentries];
Victor Stinner742da042016-09-07 17:40:12 -07001149 dk_set_index(mp->ma_keys, hashpos, mp->ma_keys->dk_nentries);
1150 Py_INCREF(key);
1151 ep->me_key = key;
1152 ep->me_hash = hash;
1153 if (mp->ma_values) {
1154 assert (mp->ma_values[mp->ma_keys->dk_nentries] == NULL);
1155 mp->ma_values[mp->ma_keys->dk_nentries] = value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001156 }
1157 else {
Victor Stinner742da042016-09-07 17:40:12 -07001158 ep->me_value = value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001159 }
1160 mp->ma_used++;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001161 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner742da042016-09-07 17:40:12 -07001162 mp->ma_keys->dk_usable--;
1163 mp->ma_keys->dk_nentries++;
1164 assert(mp->ma_keys->dk_usable >= 0);
Victor Stinner611b0fa2016-09-14 15:02:01 +02001165 assert(_PyDict_CheckConsistency(mp));
Victor Stinner742da042016-09-07 17:40:12 -07001166 return 0;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001167 }
Victor Stinner742da042016-09-07 17:40:12 -07001168
INADA Naokiba609772016-12-07 20:41:42 +09001169 if (_PyDict_HasSplitTable(mp)) {
1170 mp->ma_values[ix] = value;
1171 if (old_value == NULL) {
1172 /* pending state */
1173 assert(ix == mp->ma_used);
1174 mp->ma_used++;
1175 }
1176 }
1177 else {
1178 assert(old_value != NULL);
1179 DK_ENTRIES(mp->ma_keys)[ix].me_value = value;
Victor Stinner742da042016-09-07 17:40:12 -07001180 }
1181
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001182 mp->ma_version_tag = DICT_NEXT_VERSION();
INADA Naokiba609772016-12-07 20:41:42 +09001183 Py_XDECREF(old_value); /* which **CAN** re-enter (see issue #22653) */
Victor Stinner611b0fa2016-09-14 15:02:01 +02001184 assert(_PyDict_CheckConsistency(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001185 return 0;
Antoine Pitroue965d972012-02-27 00:45:12 +01001186}
1187
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001188/*
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001189Internal routine used by dictresize() to buid a hashtable of entries.
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001190*/
1191static void
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001192build_indices(PyDictKeysObject *keys, PyDictKeyEntry *ep, Py_ssize_t n)
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001193{
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001194 size_t mask = (size_t)DK_SIZE(keys) - 1;
1195 for (Py_ssize_t ix = 0; ix != n; ix++, ep++) {
1196 Py_hash_t hash = ep->me_hash;
1197 size_t i = hash & mask;
1198 for (size_t perturb = hash; dk_get_index(keys, i) != DKIX_EMPTY;) {
1199 perturb >>= PERTURB_SHIFT;
1200 i = mask & ((i << 2) + i + perturb + 1);
1201 }
1202 dk_set_index(keys, i, ix);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001203 }
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001204}
1205
1206/*
1207Restructure the table by allocating a new table and reinserting all
1208items again. When entries have been deleted, the new table may
1209actually be smaller than the old one.
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001210If a table is split (its keys and hashes are shared, its values are not),
1211then the values are temporarily copied into the table, it is resized as
1212a combined table, then the me_value slots in the old table are NULLed out.
1213After resizing a table is always combined,
1214but can be resplit by make_keys_shared().
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001215*/
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001216static int
Victor Stinner3d3f2642016-12-15 17:21:23 +01001217dictresize(PyDictObject *mp, Py_ssize_t minsize)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001218{
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001219 Py_ssize_t newsize, numentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001220 PyDictKeysObject *oldkeys;
1221 PyObject **oldvalues;
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001222 PyDictKeyEntry *oldentries, *newentries;
Tim Peters91a364d2001-05-19 07:04:38 +00001223
Victor Stinner742da042016-09-07 17:40:12 -07001224 /* Find the smallest table size > minused. */
1225 for (newsize = PyDict_MINSIZE;
Victor Stinner3d3f2642016-12-15 17:21:23 +01001226 newsize < minsize && newsize > 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001227 newsize <<= 1)
1228 ;
1229 if (newsize <= 0) {
1230 PyErr_NoMemory();
1231 return -1;
1232 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001233
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001234 oldkeys = mp->ma_keys;
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001235
1236 /* NOTE: Current odict checks mp->ma_keys to detect resize happen.
1237 * So we can't reuse oldkeys even if oldkeys->dk_size == newsize.
1238 * TODO: Try reusing oldkeys when reimplement odict.
1239 */
1240
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001241 /* Allocate a new table. */
1242 mp->ma_keys = new_keys_object(newsize);
1243 if (mp->ma_keys == NULL) {
1244 mp->ma_keys = oldkeys;
1245 return -1;
1246 }
Victor Stinner3d3f2642016-12-15 17:21:23 +01001247 // New table must be large enough.
1248 assert(mp->ma_keys->dk_usable >= mp->ma_used);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001249 if (oldkeys->dk_lookup == lookdict)
1250 mp->ma_keys->dk_lookup = lookdict;
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001251
1252 numentries = mp->ma_used;
1253 oldentries = DK_ENTRIES(oldkeys);
1254 newentries = DK_ENTRIES(mp->ma_keys);
1255 oldvalues = mp->ma_values;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001256 if (oldvalues != NULL) {
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001257 /* Convert split table into new combined table.
1258 * We must incref keys; we can transfer values.
1259 * Note that values of split table is always dense.
1260 */
1261 for (Py_ssize_t i = 0; i < numentries; i++) {
1262 assert(oldvalues[i] != NULL);
1263 PyDictKeyEntry *ep = &oldentries[i];
1264 PyObject *key = ep->me_key;
1265 Py_INCREF(key);
1266 newentries[i].me_key = key;
1267 newentries[i].me_hash = ep->me_hash;
1268 newentries[i].me_value = oldvalues[i];
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001269 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001270
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001271 DK_DECREF(oldkeys);
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001272 mp->ma_values = NULL;
Victor Stinner742da042016-09-07 17:40:12 -07001273 if (oldvalues != empty_values) {
1274 free_values(oldvalues);
1275 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001276 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001277 else { // combined table.
1278 if (oldkeys->dk_nentries == numentries) {
1279 memcpy(newentries, oldentries, numentries * sizeof(PyDictKeyEntry));
1280 }
1281 else {
1282 PyDictKeyEntry *ep = oldentries;
1283 for (Py_ssize_t i = 0; i < numentries; i++) {
1284 while (ep->me_value == NULL)
1285 ep++;
1286 newentries[i] = *ep++;
1287 }
1288 }
1289
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001290 assert(oldkeys->dk_lookup != lookdict_split);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001291 assert(oldkeys->dk_refcnt == 1);
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001292 if (oldkeys->dk_size == PyDict_MINSIZE &&
1293 numfreekeys < PyDict_MAXFREELIST) {
1294 DK_DEBUG_DECREF keys_free_list[numfreekeys++] = oldkeys;
1295 }
1296 else {
1297 DK_DEBUG_DECREF PyObject_FREE(oldkeys);
1298 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001299 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001300
1301 build_indices(mp->ma_keys, newentries, numentries);
1302 mp->ma_keys->dk_usable -= numentries;
1303 mp->ma_keys->dk_nentries = numentries;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001304 return 0;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001305}
1306
Benjamin Peterson15ee8212012-04-24 14:44:18 -04001307/* Returns NULL if unable to split table.
1308 * A NULL return does not necessarily indicate an error */
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001309static PyDictKeysObject *
1310make_keys_shared(PyObject *op)
1311{
1312 Py_ssize_t i;
1313 Py_ssize_t size;
1314 PyDictObject *mp = (PyDictObject *)op;
1315
Benjamin Peterson15ee8212012-04-24 14:44:18 -04001316 if (!PyDict_CheckExact(op))
1317 return NULL;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001318 if (!_PyDict_HasSplitTable(mp)) {
1319 PyDictKeyEntry *ep0;
1320 PyObject **values;
1321 assert(mp->ma_keys->dk_refcnt == 1);
1322 if (mp->ma_keys->dk_lookup == lookdict) {
1323 return NULL;
1324 }
1325 else if (mp->ma_keys->dk_lookup == lookdict_unicode) {
1326 /* Remove dummy keys */
1327 if (dictresize(mp, DK_SIZE(mp->ma_keys)))
1328 return NULL;
1329 }
1330 assert(mp->ma_keys->dk_lookup == lookdict_unicode_nodummy);
1331 /* Copy values into a new array */
Victor Stinner742da042016-09-07 17:40:12 -07001332 ep0 = DK_ENTRIES(mp->ma_keys);
1333 size = USABLE_FRACTION(DK_SIZE(mp->ma_keys));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001334 values = new_values(size);
1335 if (values == NULL) {
1336 PyErr_SetString(PyExc_MemoryError,
1337 "Not enough memory to allocate new values array");
1338 return NULL;
1339 }
1340 for (i = 0; i < size; i++) {
1341 values[i] = ep0[i].me_value;
1342 ep0[i].me_value = NULL;
1343 }
1344 mp->ma_keys->dk_lookup = lookdict_split;
1345 mp->ma_values = values;
1346 }
1347 DK_INCREF(mp->ma_keys);
1348 return mp->ma_keys;
1349}
Christian Heimes99170a52007-12-19 02:07:34 +00001350
1351PyObject *
1352_PyDict_NewPresized(Py_ssize_t minused)
1353{
INADA Naoki92c50ee2016-11-22 00:57:02 +09001354 const Py_ssize_t max_presize = 128 * 1024;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001355 Py_ssize_t newsize;
1356 PyDictKeysObject *new_keys;
INADA Naoki92c50ee2016-11-22 00:57:02 +09001357
1358 /* There are no strict guarantee that returned dict can contain minused
1359 * items without resize. So we create medium size dict instead of very
1360 * large dict or MemoryError.
1361 */
1362 if (minused > USABLE_FRACTION(max_presize)) {
1363 newsize = max_presize;
1364 }
1365 else {
1366 Py_ssize_t minsize = ESTIMATE_SIZE(minused);
1367 newsize = PyDict_MINSIZE;
1368 while (newsize < minsize) {
1369 newsize <<= 1;
1370 }
1371 }
1372 assert(IS_POWER_OF_2(newsize));
1373
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001374 new_keys = new_keys_object(newsize);
1375 if (new_keys == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001376 return NULL;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001377 return new_dict(new_keys, NULL);
Christian Heimes99170a52007-12-19 02:07:34 +00001378}
1379
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001380/* Note that, for historical reasons, PyDict_GetItem() suppresses all errors
1381 * that may occur (originally dicts supported only string keys, and exceptions
1382 * weren't possible). So, while the original intent was that a NULL return
Thomas Wouters0e3f5912006-08-11 14:57:12 +00001383 * meant the key wasn't present, in reality it can mean that, or that an error
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001384 * (suppressed) occurred while computing the key's hash, or that some error
1385 * (suppressed) occurred when comparing keys in the dict's internal probe
1386 * sequence. A nasty example of the latter is when a Python-coded comparison
1387 * function hits a stack-depth error, which can cause this to return NULL
1388 * even if the key is present.
1389 */
Guido van Rossumc0b618a1997-05-02 03:12:38 +00001390PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00001391PyDict_GetItem(PyObject *op, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001392{
Benjamin Peterson8f67d082010-10-17 20:54:53 +00001393 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07001394 Py_ssize_t ix;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001395 PyDictObject *mp = (PyDictObject *)op;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001396 PyThreadState *tstate;
INADA Naokiba609772016-12-07 20:41:42 +09001397 PyObject *value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001398
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001399 if (!PyDict_Check(op))
1400 return NULL;
1401 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02001402 (hash = ((PyASCIIObject *) key)->hash) == -1)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001403 {
1404 hash = PyObject_Hash(key);
1405 if (hash == -1) {
1406 PyErr_Clear();
1407 return NULL;
1408 }
1409 }
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001410
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001411 /* We can arrive here with a NULL tstate during initialization: try
1412 running "python -Wi" for an example related to string interning.
1413 Let's just hope that no exception occurs then... This must be
1414 _PyThreadState_Current and not PyThreadState_GET() because in debug
1415 mode, the latter complains if tstate is NULL. */
Victor Stinner0cae6092016-11-11 01:43:56 +01001416 tstate = PyThreadState_GET();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001417 if (tstate != NULL && tstate->curexc_type != NULL) {
1418 /* preserve the existing exception */
1419 PyObject *err_type, *err_value, *err_tb;
1420 PyErr_Fetch(&err_type, &err_value, &err_tb);
INADA Naokiba609772016-12-07 20:41:42 +09001421 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001422 /* ignore errors */
1423 PyErr_Restore(err_type, err_value, err_tb);
Victor Stinner742da042016-09-07 17:40:12 -07001424 if (ix < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001425 return NULL;
1426 }
1427 else {
INADA Naokiba609772016-12-07 20:41:42 +09001428 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001429 if (ix < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001430 PyErr_Clear();
1431 return NULL;
1432 }
1433 }
INADA Naokiba609772016-12-07 20:41:42 +09001434 return value;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001435}
1436
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001437/* Same as PyDict_GetItemWithError() but with hash supplied by caller.
1438 This returns NULL *with* an exception set if an exception occurred.
1439 It returns NULL *without* an exception set if the key wasn't present.
1440*/
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001441PyObject *
1442_PyDict_GetItem_KnownHash(PyObject *op, PyObject *key, Py_hash_t hash)
1443{
Victor Stinner742da042016-09-07 17:40:12 -07001444 Py_ssize_t ix;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001445 PyDictObject *mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09001446 PyObject *value;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001447
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001448 if (!PyDict_Check(op)) {
1449 PyErr_BadInternalCall();
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001450 return NULL;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001451 }
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001452
INADA Naokiba609772016-12-07 20:41:42 +09001453 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001454 if (ix < 0) {
1455 return NULL;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001456 }
INADA Naokiba609772016-12-07 20:41:42 +09001457 return value;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001458}
1459
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001460/* Variant of PyDict_GetItem() that doesn't suppress exceptions.
1461 This returns NULL *with* an exception set if an exception occurred.
1462 It returns NULL *without* an exception set if the key wasn't present.
1463*/
1464PyObject *
1465PyDict_GetItemWithError(PyObject *op, PyObject *key)
1466{
Victor Stinner742da042016-09-07 17:40:12 -07001467 Py_ssize_t ix;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00001468 Py_hash_t hash;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001469 PyDictObject*mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09001470 PyObject *value;
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001471
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001472 if (!PyDict_Check(op)) {
1473 PyErr_BadInternalCall();
1474 return NULL;
1475 }
1476 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02001477 (hash = ((PyASCIIObject *) key)->hash) == -1)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001478 {
1479 hash = PyObject_Hash(key);
1480 if (hash == -1) {
1481 return NULL;
1482 }
1483 }
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001484
INADA Naokiba609772016-12-07 20:41:42 +09001485 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001486 if (ix < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001487 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001488 return value;
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001489}
1490
Brett Cannonfd074152012-04-14 14:10:13 -04001491PyObject *
1492_PyDict_GetItemIdWithError(PyObject *dp, struct _Py_Identifier *key)
1493{
1494 PyObject *kv;
1495 kv = _PyUnicode_FromId(key); /* borrowed */
1496 if (kv == NULL)
1497 return NULL;
1498 return PyDict_GetItemWithError(dp, kv);
1499}
1500
Victor Stinnerb4efc962015-11-20 09:24:02 +01001501/* Fast version of global value lookup (LOAD_GLOBAL).
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001502 * Lookup in globals, then builtins.
Victor Stinnerb4efc962015-11-20 09:24:02 +01001503 *
1504 * Raise an exception and return NULL if an error occurred (ex: computing the
1505 * key hash failed, key comparison failed, ...). Return NULL if the key doesn't
1506 * exist. Return the value if the key exists.
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001507 */
1508PyObject *
1509_PyDict_LoadGlobal(PyDictObject *globals, PyDictObject *builtins, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001510{
Victor Stinner742da042016-09-07 17:40:12 -07001511 Py_ssize_t ix;
Victor Stinnerb4efc962015-11-20 09:24:02 +01001512 Py_hash_t hash;
INADA Naokiba609772016-12-07 20:41:42 +09001513 PyObject *value;
Victor Stinnerb4efc962015-11-20 09:24:02 +01001514
1515 if (!PyUnicode_CheckExact(key) ||
1516 (hash = ((PyASCIIObject *) key)->hash) == -1)
1517 {
1518 hash = PyObject_Hash(key);
1519 if (hash == -1)
1520 return NULL;
Antoine Pitroue965d972012-02-27 00:45:12 +01001521 }
Victor Stinnerb4efc962015-11-20 09:24:02 +01001522
1523 /* namespace 1: globals */
INADA Naokiba609772016-12-07 20:41:42 +09001524 ix = globals->ma_keys->dk_lookup(globals, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001525 if (ix == DKIX_ERROR)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001526 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001527 if (ix != DKIX_EMPTY && value != NULL)
1528 return value;
Victor Stinnerb4efc962015-11-20 09:24:02 +01001529
1530 /* namespace 2: builtins */
INADA Naokiba609772016-12-07 20:41:42 +09001531 ix = builtins->ma_keys->dk_lookup(builtins, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001532 if (ix < 0)
Victor Stinnerb4efc962015-11-20 09:24:02 +01001533 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001534 return value;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001535}
1536
Antoine Pitroue965d972012-02-27 00:45:12 +01001537/* CAUTION: PyDict_SetItem() must guarantee that it won't resize the
1538 * dictionary if it's merely replacing the value for an existing key.
1539 * This means that it's safe to loop over a dictionary with PyDict_Next()
1540 * and occasionally replace a value -- but you can't insert new keys or
1541 * remove them.
1542 */
1543int
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001544PyDict_SetItem(PyObject *op, PyObject *key, PyObject *value)
Antoine Pitroue965d972012-02-27 00:45:12 +01001545{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001546 PyDictObject *mp;
1547 Py_hash_t hash;
Antoine Pitroue965d972012-02-27 00:45:12 +01001548 if (!PyDict_Check(op)) {
1549 PyErr_BadInternalCall();
1550 return -1;
1551 }
1552 assert(key);
1553 assert(value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001554 mp = (PyDictObject *)op;
1555 if (!PyUnicode_CheckExact(key) ||
1556 (hash = ((PyASCIIObject *) key)->hash) == -1)
1557 {
Antoine Pitroue965d972012-02-27 00:45:12 +01001558 hash = PyObject_Hash(key);
1559 if (hash == -1)
1560 return -1;
1561 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001562
1563 /* insertdict() handles any resizing that might be necessary */
1564 return insertdict(mp, key, hash, value);
Antoine Pitroue965d972012-02-27 00:45:12 +01001565}
1566
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001567int
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001568_PyDict_SetItem_KnownHash(PyObject *op, PyObject *key, PyObject *value,
1569 Py_hash_t hash)
1570{
1571 PyDictObject *mp;
1572
1573 if (!PyDict_Check(op)) {
1574 PyErr_BadInternalCall();
1575 return -1;
1576 }
1577 assert(key);
1578 assert(value);
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001579 assert(hash != -1);
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001580 mp = (PyDictObject *)op;
1581
1582 /* insertdict() handles any resizing that might be necessary */
1583 return insertdict(mp, key, hash, value);
1584}
1585
1586int
Tim Peters1f5871e2000-07-04 17:44:48 +00001587PyDict_DelItem(PyObject *op, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001588{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001589 Py_hash_t hash;
Guido van Rossumd7047b31995-01-02 19:07:15 +00001590
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001591 assert(key);
1592 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02001593 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001594 hash = PyObject_Hash(key);
1595 if (hash == -1)
1596 return -1;
1597 }
Victor Stinner742da042016-09-07 17:40:12 -07001598
1599 return _PyDict_DelItem_KnownHash(op, key, hash);
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001600}
1601
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001602int
1603_PyDict_DelItem_KnownHash(PyObject *op, PyObject *key, Py_hash_t hash)
1604{
Victor Stinner742da042016-09-07 17:40:12 -07001605 Py_ssize_t hashpos, ix;
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001606 PyDictObject *mp;
1607 PyDictKeyEntry *ep;
1608 PyObject *old_key, *old_value;
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001609
1610 if (!PyDict_Check(op)) {
1611 PyErr_BadInternalCall();
1612 return -1;
1613 }
1614 assert(key);
1615 assert(hash != -1);
1616 mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09001617 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07001618 if (ix == DKIX_ERROR)
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001619 return -1;
INADA Naokiba609772016-12-07 20:41:42 +09001620 if (ix == DKIX_EMPTY || old_value == NULL) {
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001621 _PyErr_SetKeyError(key);
1622 return -1;
1623 }
Victor Stinner742da042016-09-07 17:40:12 -07001624 assert(dk_get_index(mp->ma_keys, hashpos) == ix);
Victor Stinner78601a32016-09-09 19:28:36 -07001625
1626 // Split table doesn't allow deletion. Combine it.
1627 if (_PyDict_HasSplitTable(mp)) {
1628 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
1629 return -1;
1630 }
INADA Naokiba609772016-12-07 20:41:42 +09001631 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner78601a32016-09-09 19:28:36 -07001632 assert(ix >= 0);
1633 }
1634
Victor Stinner78601a32016-09-09 19:28:36 -07001635 assert(old_value != NULL);
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001636 mp->ma_used--;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001637 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner78601a32016-09-09 19:28:36 -07001638 ep = &DK_ENTRIES(mp->ma_keys)[ix];
1639 dk_set_index(mp->ma_keys, hashpos, DKIX_DUMMY);
1640 ENSURE_ALLOWS_DELETIONS(mp);
1641 old_key = ep->me_key;
1642 ep->me_key = NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001643 ep->me_value = NULL;
Victor Stinner78601a32016-09-09 19:28:36 -07001644 Py_DECREF(old_key);
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001645 Py_DECREF(old_value);
Victor Stinner611b0fa2016-09-14 15:02:01 +02001646
1647 assert(_PyDict_CheckConsistency(mp));
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001648 return 0;
1649}
1650
Guido van Rossum25831651993-05-19 14:50:45 +00001651void
Tim Peters1f5871e2000-07-04 17:44:48 +00001652PyDict_Clear(PyObject *op)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001653{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001654 PyDictObject *mp;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001655 PyDictKeysObject *oldkeys;
1656 PyObject **oldvalues;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001657 Py_ssize_t i, n;
Tim Petersdea48ec2001-05-22 20:40:22 +00001658
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001659 if (!PyDict_Check(op))
1660 return;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001661 mp = ((PyDictObject *)op);
1662 oldkeys = mp->ma_keys;
1663 oldvalues = mp->ma_values;
1664 if (oldvalues == empty_values)
1665 return;
1666 /* Empty the dict... */
1667 DK_INCREF(Py_EMPTY_KEYS);
1668 mp->ma_keys = Py_EMPTY_KEYS;
1669 mp->ma_values = empty_values;
1670 mp->ma_used = 0;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001671 mp->ma_version_tag = DICT_NEXT_VERSION();
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001672 /* ...then clear the keys and values */
1673 if (oldvalues != NULL) {
Victor Stinner742da042016-09-07 17:40:12 -07001674 n = oldkeys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001675 for (i = 0; i < n; i++)
1676 Py_CLEAR(oldvalues[i]);
1677 free_values(oldvalues);
1678 DK_DECREF(oldkeys);
1679 }
1680 else {
1681 assert(oldkeys->dk_refcnt == 1);
Antoine Pitrou2d169b22012-05-12 23:43:44 +02001682 DK_DECREF(oldkeys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001683 }
Victor Stinner611b0fa2016-09-14 15:02:01 +02001684 assert(_PyDict_CheckConsistency(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001685}
1686
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001687/* Internal version of PyDict_Next that returns a hash value in addition
1688 * to the key and value.
1689 * Return 1 on success, return 0 when the reached the end of the dictionary
1690 * (or if op is not a dictionary)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001691 */
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001692int
1693_PyDict_Next(PyObject *op, Py_ssize_t *ppos, PyObject **pkey,
1694 PyObject **pvalue, Py_hash_t *phash)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001695{
INADA Naokica2d8be2016-11-04 16:59:10 +09001696 Py_ssize_t i;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001697 PyDictObject *mp;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001698 PyDictKeyEntry *entry_ptr;
1699 PyObject *value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001700
1701 if (!PyDict_Check(op))
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001702 return 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001703 mp = (PyDictObject *)op;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001704 i = *ppos;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001705 if (mp->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09001706 if (i < 0 || i >= mp->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001707 return 0;
INADA Naokica2d8be2016-11-04 16:59:10 +09001708 /* values of split table is always dense */
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001709 entry_ptr = &DK_ENTRIES(mp->ma_keys)[i];
INADA Naokica2d8be2016-11-04 16:59:10 +09001710 value = mp->ma_values[i];
1711 assert(value != NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001712 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001713 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09001714 Py_ssize_t n = mp->ma_keys->dk_nentries;
1715 if (i < 0 || i >= n)
1716 return 0;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001717 entry_ptr = &DK_ENTRIES(mp->ma_keys)[i];
1718 while (i < n && entry_ptr->me_value == NULL) {
1719 entry_ptr++;
1720 i++;
Victor Stinner742da042016-09-07 17:40:12 -07001721 }
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001722 if (i >= n)
1723 return 0;
1724 value = entry_ptr->me_value;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001725 }
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001726 *ppos = i+1;
1727 if (pkey)
1728 *pkey = entry_ptr->me_key;
1729 if (phash)
1730 *phash = entry_ptr->me_hash;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001731 if (pvalue)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001732 *pvalue = value;
1733 return 1;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001734}
1735
Tim Peters080c88b2003-02-15 03:01:11 +00001736/*
1737 * Iterate over a dict. Use like so:
1738 *
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001739 * Py_ssize_t i;
Tim Peters080c88b2003-02-15 03:01:11 +00001740 * PyObject *key, *value;
1741 * i = 0; # important! i should not otherwise be changed by you
Neal Norwitz07323012003-02-15 14:45:12 +00001742 * while (PyDict_Next(yourdict, &i, &key, &value)) {
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001743 * Refer to borrowed references in key and value.
Tim Peters080c88b2003-02-15 03:01:11 +00001744 * }
1745 *
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001746 * Return 1 on success, return 0 when the reached the end of the dictionary
1747 * (or if op is not a dictionary)
1748 *
Tim Peters080c88b2003-02-15 03:01:11 +00001749 * CAUTION: In general, it isn't safe to use PyDict_Next in a loop that
Tim Peters67830702001-03-21 19:23:56 +00001750 * mutates the dict. One exception: it is safe if the loop merely changes
1751 * the values associated with the keys (but doesn't insert new keys or
1752 * delete keys), via PyDict_SetItem().
1753 */
Guido van Rossum25831651993-05-19 14:50:45 +00001754int
Martin v. Löwis18e16552006-02-15 17:27:45 +00001755PyDict_Next(PyObject *op, Py_ssize_t *ppos, PyObject **pkey, PyObject **pvalue)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001756{
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001757 return _PyDict_Next(op, ppos, pkey, pvalue, NULL);
Thomas Wouterscf297e42007-02-23 15:07:44 +00001758}
1759
Eric Snow96c6af92015-05-29 22:21:39 -06001760/* Internal version of dict.pop(). */
1761PyObject *
Yury Selivanov684ef2c2016-10-28 19:01:21 -04001762_PyDict_Pop(PyObject *dict, PyObject *key, PyObject *deflt)
Eric Snow96c6af92015-05-29 22:21:39 -06001763{
1764 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07001765 Py_ssize_t ix, hashpos;
Eric Snow96c6af92015-05-29 22:21:39 -06001766 PyObject *old_value, *old_key;
1767 PyDictKeyEntry *ep;
Yury Selivanov684ef2c2016-10-28 19:01:21 -04001768 PyDictObject *mp;
1769
1770 assert(PyDict_Check(dict));
1771 mp = (PyDictObject *)dict;
Eric Snow96c6af92015-05-29 22:21:39 -06001772
1773 if (mp->ma_used == 0) {
1774 if (deflt) {
1775 Py_INCREF(deflt);
1776 return deflt;
1777 }
1778 _PyErr_SetKeyError(key);
1779 return NULL;
1780 }
1781 if (!PyUnicode_CheckExact(key) ||
1782 (hash = ((PyASCIIObject *) key)->hash) == -1) {
1783 hash = PyObject_Hash(key);
1784 if (hash == -1)
1785 return NULL;
1786 }
INADA Naokiba609772016-12-07 20:41:42 +09001787 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07001788 if (ix == DKIX_ERROR)
Eric Snow96c6af92015-05-29 22:21:39 -06001789 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001790 if (ix == DKIX_EMPTY || old_value == NULL) {
Eric Snow96c6af92015-05-29 22:21:39 -06001791 if (deflt) {
1792 Py_INCREF(deflt);
1793 return deflt;
1794 }
1795 _PyErr_SetKeyError(key);
1796 return NULL;
1797 }
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001798
Victor Stinner78601a32016-09-09 19:28:36 -07001799 // Split table doesn't allow deletion. Combine it.
1800 if (_PyDict_HasSplitTable(mp)) {
1801 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
1802 return NULL;
1803 }
INADA Naokiba609772016-12-07 20:41:42 +09001804 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner78601a32016-09-09 19:28:36 -07001805 assert(ix >= 0);
1806 }
1807
Victor Stinner78601a32016-09-09 19:28:36 -07001808 assert(old_value != NULL);
Eric Snow96c6af92015-05-29 22:21:39 -06001809 mp->ma_used--;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001810 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner78601a32016-09-09 19:28:36 -07001811 dk_set_index(mp->ma_keys, hashpos, DKIX_DUMMY);
1812 ep = &DK_ENTRIES(mp->ma_keys)[ix];
1813 ENSURE_ALLOWS_DELETIONS(mp);
1814 old_key = ep->me_key;
1815 ep->me_key = NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001816 ep->me_value = NULL;
Victor Stinner78601a32016-09-09 19:28:36 -07001817 Py_DECREF(old_key);
Victor Stinner611b0fa2016-09-14 15:02:01 +02001818
1819 assert(_PyDict_CheckConsistency(mp));
Eric Snow96c6af92015-05-29 22:21:39 -06001820 return old_value;
1821}
1822
1823/* Internal version of dict.from_keys(). It is subclass-friendly. */
1824PyObject *
1825_PyDict_FromKeys(PyObject *cls, PyObject *iterable, PyObject *value)
1826{
1827 PyObject *it; /* iter(iterable) */
1828 PyObject *key;
1829 PyObject *d;
1830 int status;
1831
Victor Stinnera5ed5f02016-12-06 18:45:50 +01001832 d = _PyObject_CallNoArg(cls);
Eric Snow96c6af92015-05-29 22:21:39 -06001833 if (d == NULL)
1834 return NULL;
1835
1836 if (PyDict_CheckExact(d) && ((PyDictObject *)d)->ma_used == 0) {
1837 if (PyDict_CheckExact(iterable)) {
1838 PyDictObject *mp = (PyDictObject *)d;
1839 PyObject *oldvalue;
1840 Py_ssize_t pos = 0;
1841 PyObject *key;
1842 Py_hash_t hash;
1843
Victor Stinner742da042016-09-07 17:40:12 -07001844 if (dictresize(mp, ESTIMATE_SIZE(Py_SIZE(iterable)))) {
Eric Snow96c6af92015-05-29 22:21:39 -06001845 Py_DECREF(d);
1846 return NULL;
1847 }
1848
1849 while (_PyDict_Next(iterable, &pos, &key, &oldvalue, &hash)) {
1850 if (insertdict(mp, key, hash, value)) {
1851 Py_DECREF(d);
1852 return NULL;
1853 }
1854 }
1855 return d;
1856 }
1857 if (PyAnySet_CheckExact(iterable)) {
1858 PyDictObject *mp = (PyDictObject *)d;
1859 Py_ssize_t pos = 0;
1860 PyObject *key;
1861 Py_hash_t hash;
1862
Victor Stinner742da042016-09-07 17:40:12 -07001863 if (dictresize(mp, ESTIMATE_SIZE(PySet_GET_SIZE(iterable)))) {
Eric Snow96c6af92015-05-29 22:21:39 -06001864 Py_DECREF(d);
1865 return NULL;
1866 }
1867
1868 while (_PySet_NextEntry(iterable, &pos, &key, &hash)) {
1869 if (insertdict(mp, key, hash, value)) {
1870 Py_DECREF(d);
1871 return NULL;
1872 }
1873 }
1874 return d;
1875 }
1876 }
1877
1878 it = PyObject_GetIter(iterable);
1879 if (it == NULL){
1880 Py_DECREF(d);
1881 return NULL;
1882 }
1883
1884 if (PyDict_CheckExact(d)) {
1885 while ((key = PyIter_Next(it)) != NULL) {
1886 status = PyDict_SetItem(d, key, value);
1887 Py_DECREF(key);
1888 if (status < 0)
1889 goto Fail;
1890 }
1891 } else {
1892 while ((key = PyIter_Next(it)) != NULL) {
1893 status = PyObject_SetItem(d, key, value);
1894 Py_DECREF(key);
1895 if (status < 0)
1896 goto Fail;
1897 }
1898 }
1899
1900 if (PyErr_Occurred())
1901 goto Fail;
1902 Py_DECREF(it);
1903 return d;
1904
1905Fail:
1906 Py_DECREF(it);
1907 Py_DECREF(d);
1908 return NULL;
1909}
1910
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001911/* Methods */
1912
1913static void
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001914dict_dealloc(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001915{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001916 PyObject **values = mp->ma_values;
1917 PyDictKeysObject *keys = mp->ma_keys;
1918 Py_ssize_t i, n;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001919 PyObject_GC_UnTrack(mp);
1920 Py_TRASHCAN_SAFE_BEGIN(mp)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001921 if (values != NULL) {
1922 if (values != empty_values) {
Victor Stinner742da042016-09-07 17:40:12 -07001923 for (i = 0, n = mp->ma_keys->dk_nentries; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001924 Py_XDECREF(values[i]);
1925 }
1926 free_values(values);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001927 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001928 DK_DECREF(keys);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001929 }
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02001930 else if (keys != NULL) {
Antoine Pitrou2d169b22012-05-12 23:43:44 +02001931 assert(keys->dk_refcnt == 1);
1932 DK_DECREF(keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001933 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001934 if (numfree < PyDict_MAXFREELIST && Py_TYPE(mp) == &PyDict_Type)
1935 free_list[numfree++] = mp;
1936 else
1937 Py_TYPE(mp)->tp_free((PyObject *)mp);
1938 Py_TRASHCAN_SAFE_END(mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001939}
1940
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001941
Guido van Rossumc0b618a1997-05-02 03:12:38 +00001942static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00001943dict_repr(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001944{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001945 Py_ssize_t i;
Victor Stinnerf91929b2013-11-19 13:07:38 +01001946 PyObject *key = NULL, *value = NULL;
1947 _PyUnicodeWriter writer;
1948 int first;
Guido van Rossum255443b1998-04-10 22:47:14 +00001949
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001950 i = Py_ReprEnter((PyObject *)mp);
1951 if (i != 0) {
1952 return i > 0 ? PyUnicode_FromString("{...}") : NULL;
1953 }
Guido van Rossum255443b1998-04-10 22:47:14 +00001954
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001955 if (mp->ma_used == 0) {
Victor Stinnerf91929b2013-11-19 13:07:38 +01001956 Py_ReprLeave((PyObject *)mp);
1957 return PyUnicode_FromString("{}");
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001958 }
Tim Petersa7259592001-06-16 05:11:17 +00001959
Victor Stinnerf91929b2013-11-19 13:07:38 +01001960 _PyUnicodeWriter_Init(&writer);
1961 writer.overallocate = 1;
1962 /* "{" + "1: 2" + ", 3: 4" * (len - 1) + "}" */
1963 writer.min_length = 1 + 4 + (2 + 4) * (mp->ma_used - 1) + 1;
Tim Petersa7259592001-06-16 05:11:17 +00001964
Victor Stinnerf91929b2013-11-19 13:07:38 +01001965 if (_PyUnicodeWriter_WriteChar(&writer, '{') < 0)
1966 goto error;
Tim Petersa7259592001-06-16 05:11:17 +00001967
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001968 /* Do repr() on each key+value pair, and insert ": " between them.
1969 Note that repr may mutate the dict. */
1970 i = 0;
Victor Stinnerf91929b2013-11-19 13:07:38 +01001971 first = 1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001972 while (PyDict_Next((PyObject *)mp, &i, &key, &value)) {
Victor Stinnerf91929b2013-11-19 13:07:38 +01001973 PyObject *s;
1974 int res;
1975
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001976 /* Prevent repr from deleting key or value during key format. */
1977 Py_INCREF(key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001978 Py_INCREF(value);
Victor Stinnerf97dfd72013-07-18 01:00:45 +02001979
Victor Stinnerf91929b2013-11-19 13:07:38 +01001980 if (!first) {
1981 if (_PyUnicodeWriter_WriteASCIIString(&writer, ", ", 2) < 0)
1982 goto error;
1983 }
1984 first = 0;
1985
1986 s = PyObject_Repr(key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001987 if (s == NULL)
Victor Stinnerf91929b2013-11-19 13:07:38 +01001988 goto error;
1989 res = _PyUnicodeWriter_WriteStr(&writer, s);
1990 Py_DECREF(s);
1991 if (res < 0)
1992 goto error;
1993
1994 if (_PyUnicodeWriter_WriteASCIIString(&writer, ": ", 2) < 0)
1995 goto error;
1996
1997 s = PyObject_Repr(value);
1998 if (s == NULL)
1999 goto error;
2000 res = _PyUnicodeWriter_WriteStr(&writer, s);
2001 Py_DECREF(s);
2002 if (res < 0)
2003 goto error;
2004
2005 Py_CLEAR(key);
2006 Py_CLEAR(value);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002007 }
Tim Petersa7259592001-06-16 05:11:17 +00002008
Victor Stinnerf91929b2013-11-19 13:07:38 +01002009 writer.overallocate = 0;
2010 if (_PyUnicodeWriter_WriteChar(&writer, '}') < 0)
2011 goto error;
Tim Petersa7259592001-06-16 05:11:17 +00002012
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002013 Py_ReprLeave((PyObject *)mp);
Victor Stinnerf91929b2013-11-19 13:07:38 +01002014
2015 return _PyUnicodeWriter_Finish(&writer);
2016
2017error:
2018 Py_ReprLeave((PyObject *)mp);
2019 _PyUnicodeWriter_Dealloc(&writer);
2020 Py_XDECREF(key);
2021 Py_XDECREF(value);
2022 return NULL;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002023}
2024
Martin v. Löwis18e16552006-02-15 17:27:45 +00002025static Py_ssize_t
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002026dict_length(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002027{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002028 return mp->ma_used;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002029}
2030
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002031static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002032dict_subscript(PyDictObject *mp, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002033{
Victor Stinner742da042016-09-07 17:40:12 -07002034 Py_ssize_t ix;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002035 Py_hash_t hash;
INADA Naokiba609772016-12-07 20:41:42 +09002036 PyObject *value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002037
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002038 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002039 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002040 hash = PyObject_Hash(key);
2041 if (hash == -1)
2042 return NULL;
2043 }
INADA Naokiba609772016-12-07 20:41:42 +09002044 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07002045 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002046 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09002047 if (ix == DKIX_EMPTY || value == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002048 if (!PyDict_CheckExact(mp)) {
2049 /* Look up __missing__ method if we're a subclass. */
2050 PyObject *missing, *res;
Benjamin Petersonce798522012-01-22 11:24:29 -05002051 _Py_IDENTIFIER(__missing__);
2052 missing = _PyObject_LookupSpecial((PyObject *)mp, &PyId___missing__);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002053 if (missing != NULL) {
Victor Stinnerde4ae3d2016-12-04 22:59:09 +01002054 res = PyObject_CallFunctionObjArgs(missing,
2055 key, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002056 Py_DECREF(missing);
2057 return res;
2058 }
2059 else if (PyErr_Occurred())
2060 return NULL;
2061 }
Raymond Hettinger69492da2013-09-02 15:59:26 -07002062 _PyErr_SetKeyError(key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002063 return NULL;
2064 }
INADA Naokiba609772016-12-07 20:41:42 +09002065 Py_INCREF(value);
2066 return value;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002067}
2068
2069static int
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002070dict_ass_sub(PyDictObject *mp, PyObject *v, PyObject *w)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002071{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002072 if (w == NULL)
2073 return PyDict_DelItem((PyObject *)mp, v);
2074 else
2075 return PyDict_SetItem((PyObject *)mp, v, w);
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002076}
2077
/* Mapping-protocol slot table for dict: len(d), d[key], and
 * d[key] = value / del d[key] (both handled by dict_ass_sub).
 */
static PyMappingMethods dict_as_mapping = {
    (lenfunc)dict_length, /* mp_length */
    (binaryfunc)dict_subscript, /* mp_subscript */
    (objobjargproc)dict_ass_sub, /* mp_ass_subscript */
};
2083
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002084static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002085dict_keys(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002086{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002087 PyObject *v;
2088 Py_ssize_t i, j;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002089 PyDictKeyEntry *ep;
2090 Py_ssize_t size, n, offset;
2091 PyObject **value_ptr;
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002092
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002093 again:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002094 n = mp->ma_used;
2095 v = PyList_New(n);
2096 if (v == NULL)
2097 return NULL;
2098 if (n != mp->ma_used) {
2099 /* Durnit. The allocations caused the dict to resize.
2100 * Just start over, this shouldn't normally happen.
2101 */
2102 Py_DECREF(v);
2103 goto again;
2104 }
Victor Stinner742da042016-09-07 17:40:12 -07002105 ep = DK_ENTRIES(mp->ma_keys);
2106 size = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002107 if (mp->ma_values) {
2108 value_ptr = mp->ma_values;
2109 offset = sizeof(PyObject *);
2110 }
2111 else {
2112 value_ptr = &ep[0].me_value;
2113 offset = sizeof(PyDictKeyEntry);
2114 }
2115 for (i = 0, j = 0; i < size; i++) {
2116 if (*value_ptr != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002117 PyObject *key = ep[i].me_key;
2118 Py_INCREF(key);
2119 PyList_SET_ITEM(v, j, key);
2120 j++;
2121 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002122 value_ptr = (PyObject **)(((char *)value_ptr) + offset);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002123 }
2124 assert(j == n);
2125 return v;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002126}
2127
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002128static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002129dict_values(PyDictObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002130{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002131 PyObject *v;
2132 Py_ssize_t i, j;
Benjamin Petersonf0acae22016-09-08 09:50:08 -07002133 PyDictKeyEntry *ep;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002134 Py_ssize_t size, n, offset;
2135 PyObject **value_ptr;
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002136
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002137 again:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002138 n = mp->ma_used;
2139 v = PyList_New(n);
2140 if (v == NULL)
2141 return NULL;
2142 if (n != mp->ma_used) {
2143 /* Durnit. The allocations caused the dict to resize.
2144 * Just start over, this shouldn't normally happen.
2145 */
2146 Py_DECREF(v);
2147 goto again;
2148 }
Benjamin Petersonf0acae22016-09-08 09:50:08 -07002149 ep = DK_ENTRIES(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -07002150 size = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002151 if (mp->ma_values) {
2152 value_ptr = mp->ma_values;
2153 offset = sizeof(PyObject *);
2154 }
2155 else {
Benjamin Petersonf0acae22016-09-08 09:50:08 -07002156 value_ptr = &ep[0].me_value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002157 offset = sizeof(PyDictKeyEntry);
2158 }
2159 for (i = 0, j = 0; i < size; i++) {
2160 PyObject *value = *value_ptr;
2161 value_ptr = (PyObject **)(((char *)value_ptr) + offset);
2162 if (value != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002163 Py_INCREF(value);
2164 PyList_SET_ITEM(v, j, value);
2165 j++;
2166 }
2167 }
2168 assert(j == n);
2169 return v;
Guido van Rossum25831651993-05-19 14:50:45 +00002170}
2171
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002172static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002173dict_items(PyDictObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002174{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002175 PyObject *v;
2176 Py_ssize_t i, j, n;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002177 Py_ssize_t size, offset;
2178 PyObject *item, *key;
2179 PyDictKeyEntry *ep;
2180 PyObject **value_ptr;
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002181
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002182 /* Preallocate the list of tuples, to avoid allocations during
2183 * the loop over the items, which could trigger GC, which
2184 * could resize the dict. :-(
2185 */
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002186 again:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002187 n = mp->ma_used;
2188 v = PyList_New(n);
2189 if (v == NULL)
2190 return NULL;
2191 for (i = 0; i < n; i++) {
2192 item = PyTuple_New(2);
2193 if (item == NULL) {
2194 Py_DECREF(v);
2195 return NULL;
2196 }
2197 PyList_SET_ITEM(v, i, item);
2198 }
2199 if (n != mp->ma_used) {
2200 /* Durnit. The allocations caused the dict to resize.
2201 * Just start over, this shouldn't normally happen.
2202 */
2203 Py_DECREF(v);
2204 goto again;
2205 }
2206 /* Nothing we do below makes any function calls. */
Victor Stinner742da042016-09-07 17:40:12 -07002207 ep = DK_ENTRIES(mp->ma_keys);
2208 size = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002209 if (mp->ma_values) {
2210 value_ptr = mp->ma_values;
2211 offset = sizeof(PyObject *);
2212 }
2213 else {
2214 value_ptr = &ep[0].me_value;
2215 offset = sizeof(PyDictKeyEntry);
2216 }
2217 for (i = 0, j = 0; i < size; i++) {
2218 PyObject *value = *value_ptr;
2219 value_ptr = (PyObject **)(((char *)value_ptr) + offset);
2220 if (value != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002221 key = ep[i].me_key;
2222 item = PyList_GET_ITEM(v, j);
2223 Py_INCREF(key);
2224 PyTuple_SET_ITEM(item, 0, key);
2225 Py_INCREF(value);
2226 PyTuple_SET_ITEM(item, 1, value);
2227 j++;
2228 }
2229 }
2230 assert(j == n);
2231 return v;
Guido van Rossum25831651993-05-19 14:50:45 +00002232}
2233
Larry Hastings5c661892014-01-24 06:17:25 -08002234/*[clinic input]
2235@classmethod
2236dict.fromkeys
Larry Hastings5c661892014-01-24 06:17:25 -08002237 iterable: object
2238 value: object=None
2239 /
2240
2241Returns a new dict with keys from iterable and values equal to value.
2242[clinic start generated code]*/
2243
Larry Hastings5c661892014-01-24 06:17:25 -08002244static PyObject *
2245dict_fromkeys_impl(PyTypeObject *type, PyObject *iterable, PyObject *value)
Serhiy Storchaka1009bf12015-04-03 23:53:51 +03002246/*[clinic end generated code: output=8fb98e4b10384999 input=b85a667f9bf4669d]*/
Larry Hastings5c661892014-01-24 06:17:25 -08002247{
Eric Snow96c6af92015-05-29 22:21:39 -06002248 return _PyDict_FromKeys((PyObject *)type, iterable, value);
Raymond Hettingere33d3df2002-11-27 07:29:33 +00002249}
2250
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002251static int
Victor Stinner742da042016-09-07 17:40:12 -07002252dict_update_common(PyObject *self, PyObject *args, PyObject *kwds,
2253 const char *methname)
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002254{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002255 PyObject *arg = NULL;
2256 int result = 0;
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002257
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002258 if (!PyArg_UnpackTuple(args, methname, 0, 1, &arg))
2259 result = -1;
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002260
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002261 else if (arg != NULL) {
Martin v. Löwis1c67dd92011-10-14 15:16:45 +02002262 _Py_IDENTIFIER(keys);
2263 if (_PyObject_HasAttrId(arg, &PyId_keys))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002264 result = PyDict_Merge(self, arg, 1);
2265 else
2266 result = PyDict_MergeFromSeq2(self, arg, 1);
2267 }
2268 if (result == 0 && kwds != NULL) {
2269 if (PyArg_ValidateKeywordArguments(kwds))
2270 result = PyDict_Merge(self, kwds, 1);
2271 else
2272 result = -1;
2273 }
2274 return result;
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002275}
2276
2277static PyObject *
2278dict_update(PyObject *self, PyObject *args, PyObject *kwds)
2279{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002280 if (dict_update_common(self, args, kwds, "update") != -1)
2281 Py_RETURN_NONE;
2282 return NULL;
Tim Peters6d6c1a32001-08-02 04:15:00 +00002283}
2284
Guido van Rossum05ac6de2001-08-10 20:28:28 +00002285/* Update unconditionally replaces existing items.
2286 Merge has a 3rd argument 'override'; if set, it acts like Update,
Tim Peters1fc240e2001-10-26 05:06:50 +00002287 otherwise it leaves existing items unchanged.
2288
2289 PyDict_{Update,Merge} update/merge from a mapping object.
2290
Tim Petersf582b822001-12-11 18:51:08 +00002291 PyDict_MergeFromSeq2 updates/merges from any iterable object
Tim Peters1fc240e2001-10-26 05:06:50 +00002292 producing iterable objects of length 2.
2293*/
2294
Tim Petersf582b822001-12-11 18:51:08 +00002295int
Tim Peters1fc240e2001-10-26 05:06:50 +00002296PyDict_MergeFromSeq2(PyObject *d, PyObject *seq2, int override)
2297{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002298 PyObject *it; /* iter(seq2) */
2299 Py_ssize_t i; /* index into seq2 of current element */
2300 PyObject *item; /* seq2[i] */
2301 PyObject *fast; /* item as a 2-tuple or 2-list */
Tim Peters1fc240e2001-10-26 05:06:50 +00002302
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002303 assert(d != NULL);
2304 assert(PyDict_Check(d));
2305 assert(seq2 != NULL);
Tim Peters1fc240e2001-10-26 05:06:50 +00002306
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002307 it = PyObject_GetIter(seq2);
2308 if (it == NULL)
2309 return -1;
Tim Peters1fc240e2001-10-26 05:06:50 +00002310
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002311 for (i = 0; ; ++i) {
2312 PyObject *key, *value;
2313 Py_ssize_t n;
Tim Peters1fc240e2001-10-26 05:06:50 +00002314
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002315 fast = NULL;
2316 item = PyIter_Next(it);
2317 if (item == NULL) {
2318 if (PyErr_Occurred())
2319 goto Fail;
2320 break;
2321 }
Tim Peters1fc240e2001-10-26 05:06:50 +00002322
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002323 /* Convert item to sequence, and verify length 2. */
2324 fast = PySequence_Fast(item, "");
2325 if (fast == NULL) {
2326 if (PyErr_ExceptionMatches(PyExc_TypeError))
2327 PyErr_Format(PyExc_TypeError,
2328 "cannot convert dictionary update "
2329 "sequence element #%zd to a sequence",
2330 i);
2331 goto Fail;
2332 }
2333 n = PySequence_Fast_GET_SIZE(fast);
2334 if (n != 2) {
2335 PyErr_Format(PyExc_ValueError,
2336 "dictionary update sequence element #%zd "
2337 "has length %zd; 2 is required",
2338 i, n);
2339 goto Fail;
2340 }
Tim Peters1fc240e2001-10-26 05:06:50 +00002341
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002342 /* Update/merge with this (key, value) pair. */
2343 key = PySequence_Fast_GET_ITEM(fast, 0);
2344 value = PySequence_Fast_GET_ITEM(fast, 1);
2345 if (override || PyDict_GetItem(d, key) == NULL) {
2346 int status = PyDict_SetItem(d, key, value);
2347 if (status < 0)
2348 goto Fail;
2349 }
2350 Py_DECREF(fast);
2351 Py_DECREF(item);
2352 }
Tim Peters1fc240e2001-10-26 05:06:50 +00002353
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002354 i = 0;
Victor Stinner611b0fa2016-09-14 15:02:01 +02002355 assert(_PyDict_CheckConsistency((PyDictObject *)d));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002356 goto Return;
Tim Peters1fc240e2001-10-26 05:06:50 +00002357Fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002358 Py_XDECREF(item);
2359 Py_XDECREF(fast);
2360 i = -1;
Tim Peters1fc240e2001-10-26 05:06:50 +00002361Return:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002362 Py_DECREF(it);
2363 return Py_SAFE_DOWNCAST(i, Py_ssize_t, int);
Tim Peters1fc240e2001-10-26 05:06:50 +00002364}
2365
/* Merge the items of mapping `b` into dict `a`.
 *
 * `override` selects what happens when a key of `b` is already in `a`:
 *   0 -- the existing item in `a` is left unchanged;
 *   1 -- the item is replaced by the one from `b`;
 *   2 -- KeyError is set for that key and the merge fails.
 *
 * Returns 0 on success and -1 with an exception set on failure.  Items
 * stored before a failure stay in `a`.
 */
static int
dict_merge(PyObject *a, PyObject *b, int override)
{
    PyDictObject *mp, *other;
    Py_ssize_t i, n;
    PyDictKeyEntry *entry, *ep0;

    assert(0 <= override && override <= 2);

    /* We accept for the argument either a concrete dictionary object,
     * or an abstract "mapping" object. For the former, we can do
     * things quite efficiently. For the latter, we only require that
     * PyMapping_Keys() and PyObject_GetItem() be supported.
     */
    if (a == NULL || !PyDict_Check(a) || b == NULL) {
        PyErr_BadInternalCall();
        return -1;
    }
    mp = (PyDictObject*)a;
    if (PyDict_Check(b)) {
        /* Fast path: walk the entry table of `b` directly. */
        other = (PyDictObject*)b;
        if (other == mp || other->ma_used == 0)
            /* a.update(a) or a.update({}); nothing to do */
            return 0;
        if (mp->ma_used == 0)
            /* Since the target dict is empty, PyDict_GetItem()
             * always returns NULL. Setting override to 1
             * skips the unnecessary test.
             */
            override = 1;
        /* Do one big resize at the start, rather than
         * incrementally resizing as we insert new items. Expect
         * that there will be no (or few) overlapping keys.
         */
        if (USABLE_FRACTION(mp->ma_keys->dk_size) < other->ma_used) {
            if (dictresize(mp, ESTIMATE_SIZE(mp->ma_used + other->ma_used))) {
               return -1;
            }
        }
        ep0 = DK_ENTRIES(other->ma_keys);
        /* n snapshots the entry count of `b`; it is re-checked after
           every processed item to detect mutation of `b`. */
        for (i = 0, n = other->ma_keys->dk_nentries; i < n; i++) {
            PyObject *key, *value;
            Py_hash_t hash;
            entry = &ep0[i];
            key = entry->me_key;
            hash = entry->me_hash;
            /* The value lives in ma_values when that array is set,
               otherwise in the entry itself. */
            if (other->ma_values)
                value = other->ma_values[i];
            else
                value = entry->me_value;

            /* Slots with a NULL value hold no item and are skipped. */
            if (value != NULL) {
                int err = 0;
                /* Hold key and value across the calls below. */
                Py_INCREF(key);
                Py_INCREF(value);
                if (override == 1)
                    err = insertdict(mp, key, hash, value);
                else if (_PyDict_GetItem_KnownHash(a, key, hash) == NULL) {
                    /* NULL means either "not present" or "lookup
                       failed"; only the former leads to an insert. */
                    if (PyErr_Occurred()) {
                        Py_DECREF(value);
                        Py_DECREF(key);
                        return -1;
                    }
                    err = insertdict(mp, key, hash, value);
                }
                else if (override != 0) {
                    /* Key already present and duplicates are errors. */
                    _PyErr_SetKeyError(key);
                    Py_DECREF(value);
                    Py_DECREF(key);
                    return -1;
                }
                Py_DECREF(value);
                Py_DECREF(key);
                if (err != 0)
                    return -1;

                /* The entry count of `b` changed while this item was
                   being processed: give up rather than keep walking
                   the table. */
                if (n != other->ma_keys->dk_nentries) {
                    PyErr_SetString(PyExc_RuntimeError,
                                    "dict mutated during update");
                    return -1;
                }
            }
        }
    }
    else {
        /* Do it the generic, slower way */
        PyObject *keys = PyMapping_Keys(b);
        PyObject *iter;
        PyObject *key, *value;
        int status;

        if (keys == NULL)
            /* Docstring says this is equivalent to E.keys() so
             * if E doesn't have a .keys() method we want
             * AttributeError to percolate up. Might as well
             * do the same for any other error.
             */
            return -1;

        iter = PyObject_GetIter(keys);
        Py_DECREF(keys);
        if (iter == NULL)
            return -1;

        for (key = PyIter_Next(iter); key; key = PyIter_Next(iter)) {
            /* Key already present and not overriding: either fail
               (override == 2) or leave the existing item alone. */
            if (override != 1 && PyDict_GetItem(a, key) != NULL) {
                if (override != 0) {
                    _PyErr_SetKeyError(key);
                    Py_DECREF(key);
                    Py_DECREF(iter);
                    return -1;
                }
                Py_DECREF(key);
                continue;
            }
            value = PyObject_GetItem(b, key);
            if (value == NULL) {
                Py_DECREF(iter);
                Py_DECREF(key);
                return -1;
            }
            status = PyDict_SetItem(a, key, value);
            Py_DECREF(key);
            Py_DECREF(value);
            if (status < 0) {
                Py_DECREF(iter);
                return -1;
            }
        }
        Py_DECREF(iter);
        /* PyIter_Next() returns NULL both at exhaustion and on error;
           tell the two apart here. */
        if (PyErr_Occurred())
            /* Iterator completed, via error */
            return -1;
    }
    assert(_PyDict_CheckConsistency((PyDictObject *)a));
    return 0;
}
2503
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002504int
2505PyDict_Update(PyObject *a, PyObject *b)
2506{
2507 return dict_merge(a, b, 1);
2508}
2509
2510int
2511PyDict_Merge(PyObject *a, PyObject *b, int override)
2512{
2513 /* XXX Deprecate override not in (0, 1). */
2514 return dict_merge(a, b, override != 0);
2515}
2516
2517int
2518_PyDict_MergeEx(PyObject *a, PyObject *b, int override)
2519{
2520 return dict_merge(a, b, override);
2521}
2522
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002523static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002524dict_copy(PyDictObject *mp)
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002525{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002526 return PyDict_Copy((PyObject*)mp);
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00002527}
2528
2529PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002530PyDict_Copy(PyObject *o)
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00002531{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002532 PyObject *copy;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002533 PyDictObject *mp;
2534 Py_ssize_t i, n;
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00002535
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002536 if (o == NULL || !PyDict_Check(o)) {
2537 PyErr_BadInternalCall();
2538 return NULL;
2539 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002540 mp = (PyDictObject *)o;
2541 if (_PyDict_HasSplitTable(mp)) {
2542 PyDictObject *split_copy;
Victor Stinner742da042016-09-07 17:40:12 -07002543 Py_ssize_t size = USABLE_FRACTION(DK_SIZE(mp->ma_keys));
2544 PyObject **newvalues;
2545 newvalues = new_values(size);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002546 if (newvalues == NULL)
2547 return PyErr_NoMemory();
2548 split_copy = PyObject_GC_New(PyDictObject, &PyDict_Type);
2549 if (split_copy == NULL) {
2550 free_values(newvalues);
2551 return NULL;
2552 }
2553 split_copy->ma_values = newvalues;
2554 split_copy->ma_keys = mp->ma_keys;
2555 split_copy->ma_used = mp->ma_used;
2556 DK_INCREF(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -07002557 for (i = 0, n = size; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002558 PyObject *value = mp->ma_values[i];
2559 Py_XINCREF(value);
2560 split_copy->ma_values[i] = value;
2561 }
Benjamin Peterson7ce67e42012-04-24 10:32:57 -04002562 if (_PyObject_GC_IS_TRACKED(mp))
2563 _PyObject_GC_TRACK(split_copy);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002564 return (PyObject *)split_copy;
2565 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002566 copy = PyDict_New();
2567 if (copy == NULL)
2568 return NULL;
2569 if (PyDict_Merge(copy, o, 1) == 0)
2570 return copy;
2571 Py_DECREF(copy);
2572 return NULL;
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002573}
2574
Martin v. Löwis18e16552006-02-15 17:27:45 +00002575Py_ssize_t
Tim Peters1f5871e2000-07-04 17:44:48 +00002576PyDict_Size(PyObject *mp)
Guido van Rossum4199fac1993-11-05 10:18:44 +00002577{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002578 if (mp == NULL || !PyDict_Check(mp)) {
2579 PyErr_BadInternalCall();
2580 return -1;
2581 }
2582 return ((PyDictObject *)mp)->ma_used;
Guido van Rossum4199fac1993-11-05 10:18:44 +00002583}
2584
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002585PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002586PyDict_Keys(PyObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002587{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002588 if (mp == NULL || !PyDict_Check(mp)) {
2589 PyErr_BadInternalCall();
2590 return NULL;
2591 }
2592 return dict_keys((PyDictObject *)mp);
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002593}
2594
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002595PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002596PyDict_Values(PyObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002597{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002598 if (mp == NULL || !PyDict_Check(mp)) {
2599 PyErr_BadInternalCall();
2600 return NULL;
2601 }
2602 return dict_values((PyDictObject *)mp);
Guido van Rossum25831651993-05-19 14:50:45 +00002603}
2604
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002605PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002606PyDict_Items(PyObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002607{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002608 if (mp == NULL || !PyDict_Check(mp)) {
2609 PyErr_BadInternalCall();
2610 return NULL;
2611 }
2612 return dict_items((PyDictObject *)mp);
Guido van Rossum25831651993-05-19 14:50:45 +00002613}
2614
Tim Peterse63415e2001-05-08 04:38:29 +00002615/* Return 1 if dicts equal, 0 if not, -1 if error.
2616 * Gets out as soon as any difference is detected.
2617 * Uses only Py_EQ comparison.
2618 */
2619static int
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002620dict_equal(PyDictObject *a, PyDictObject *b)
Tim Peterse63415e2001-05-08 04:38:29 +00002621{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002622 Py_ssize_t i;
Tim Peterse63415e2001-05-08 04:38:29 +00002623
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002624 if (a->ma_used != b->ma_used)
2625 /* can't be equal if # of entries differ */
2626 return 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002627 /* Same # of entries -- check all of 'em. Exit early on any diff. */
Victor Stinner742da042016-09-07 17:40:12 -07002628 for (i = 0; i < a->ma_keys->dk_nentries; i++) {
2629 PyDictKeyEntry *ep = &DK_ENTRIES(a->ma_keys)[i];
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002630 PyObject *aval;
2631 if (a->ma_values)
2632 aval = a->ma_values[i];
2633 else
2634 aval = ep->me_value;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002635 if (aval != NULL) {
2636 int cmp;
2637 PyObject *bval;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002638 PyObject *key = ep->me_key;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002639 /* temporarily bump aval's refcount to ensure it stays
2640 alive until we're done with it */
2641 Py_INCREF(aval);
2642 /* ditto for key */
2643 Py_INCREF(key);
Antoine Pitrou0e9958b2012-12-02 19:10:07 +01002644 /* reuse the known hash value */
INADA Naokiba609772016-12-07 20:41:42 +09002645 b->ma_keys->dk_lookup(b, key, ep->me_hash, &bval, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002646 Py_DECREF(key);
2647 if (bval == NULL) {
2648 Py_DECREF(aval);
2649 if (PyErr_Occurred())
2650 return -1;
2651 return 0;
2652 }
2653 cmp = PyObject_RichCompareBool(aval, bval, Py_EQ);
2654 Py_DECREF(aval);
2655 if (cmp <= 0) /* error or not equal */
2656 return cmp;
2657 }
2658 }
2659 return 1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002660}
Tim Peterse63415e2001-05-08 04:38:29 +00002661
2662static PyObject *
2663dict_richcompare(PyObject *v, PyObject *w, int op)
2664{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002665 int cmp;
2666 PyObject *res;
Tim Peterse63415e2001-05-08 04:38:29 +00002667
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002668 if (!PyDict_Check(v) || !PyDict_Check(w)) {
2669 res = Py_NotImplemented;
2670 }
2671 else if (op == Py_EQ || op == Py_NE) {
2672 cmp = dict_equal((PyDictObject *)v, (PyDictObject *)w);
2673 if (cmp < 0)
2674 return NULL;
2675 res = (cmp == (op == Py_EQ)) ? Py_True : Py_False;
2676 }
2677 else
2678 res = Py_NotImplemented;
2679 Py_INCREF(res);
2680 return res;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002681}
Tim Peterse63415e2001-05-08 04:38:29 +00002682
Larry Hastings61272b72014-01-07 12:41:53 -08002683/*[clinic input]
Larry Hastings31826802013-10-19 00:09:25 -07002684
2685@coexist
2686dict.__contains__
2687
2688 key: object
2689 /
2690
Meador Ingee02de8c2014-01-14 16:48:31 -06002691True if D has a key k, else False.
Larry Hastings61272b72014-01-07 12:41:53 -08002692[clinic start generated code]*/
Larry Hastings31826802013-10-19 00:09:25 -07002693
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002694static PyObject *
Larry Hastingsc2047262014-01-25 20:43:29 -08002695dict___contains__(PyDictObject *self, PyObject *key)
Serhiy Storchaka1009bf12015-04-03 23:53:51 +03002696/*[clinic end generated code: output=a3d03db709ed6e6b input=b852b2a19b51ab24]*/
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002697{
Larry Hastingsc2047262014-01-25 20:43:29 -08002698 register PyDictObject *mp = self;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002699 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002700 Py_ssize_t ix;
INADA Naokiba609772016-12-07 20:41:42 +09002701 PyObject *value;
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00002702
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002703 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002704 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002705 hash = PyObject_Hash(key);
2706 if (hash == -1)
2707 return NULL;
2708 }
INADA Naokiba609772016-12-07 20:41:42 +09002709 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07002710 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002711 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09002712 if (ix == DKIX_EMPTY || value == NULL)
Victor Stinner742da042016-09-07 17:40:12 -07002713 Py_RETURN_FALSE;
2714 Py_RETURN_TRUE;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002715}
2716
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002717static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002718dict_get(PyDictObject *mp, PyObject *args)
Barry Warsawc38c5da1997-10-06 17:49:20 +00002719{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002720 PyObject *key;
2721 PyObject *failobj = Py_None;
2722 PyObject *val = NULL;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002723 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002724 Py_ssize_t ix;
Barry Warsawc38c5da1997-10-06 17:49:20 +00002725
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002726 if (!PyArg_UnpackTuple(args, "get", 1, 2, &key, &failobj))
2727 return NULL;
Barry Warsawc38c5da1997-10-06 17:49:20 +00002728
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002729 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002730 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002731 hash = PyObject_Hash(key);
2732 if (hash == -1)
2733 return NULL;
2734 }
INADA Naokiba609772016-12-07 20:41:42 +09002735 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &val, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07002736 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002737 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09002738 if (ix == DKIX_EMPTY || val == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002739 val = failobj;
INADA Naokiba609772016-12-07 20:41:42 +09002740 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002741 Py_INCREF(val);
2742 return val;
Barry Warsawc38c5da1997-10-06 17:49:20 +00002743}
2744
Benjamin Peterson00e98862013-03-07 22:16:29 -05002745PyObject *
2746PyDict_SetDefault(PyObject *d, PyObject *key, PyObject *defaultobj)
Guido van Rossum164452c2000-08-08 16:12:54 +00002747{
Benjamin Peterson00e98862013-03-07 22:16:29 -05002748 PyDictObject *mp = (PyDictObject *)d;
INADA Naoki93f26f72016-11-02 18:45:16 +09002749 PyObject *value;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002750 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002751 Py_ssize_t hashpos, ix;
Guido van Rossum164452c2000-08-08 16:12:54 +00002752
Benjamin Peterson00e98862013-03-07 22:16:29 -05002753 if (!PyDict_Check(d)) {
2754 PyErr_BadInternalCall();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002755 return NULL;
Benjamin Peterson00e98862013-03-07 22:16:29 -05002756 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002757
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002758 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002759 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002760 hash = PyObject_Hash(key);
2761 if (hash == -1)
2762 return NULL;
2763 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002764
2765 if (mp->ma_values != NULL && !PyUnicode_CheckExact(key)) {
2766 if (insertion_resize(mp) < 0)
2767 return NULL;
2768 }
2769
INADA Naokiba609772016-12-07 20:41:42 +09002770 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07002771 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002772 return NULL;
INADA Naoki93f26f72016-11-02 18:45:16 +09002773
2774 if (_PyDict_HasSplitTable(mp) &&
INADA Naokiba609772016-12-07 20:41:42 +09002775 ((ix >= 0 && value == NULL && mp->ma_used != ix) ||
INADA Naoki93f26f72016-11-02 18:45:16 +09002776 (ix == DKIX_EMPTY && mp->ma_used != mp->ma_keys->dk_nentries))) {
2777 if (insertion_resize(mp) < 0) {
2778 return NULL;
2779 }
INADA Naokiba609772016-12-07 20:41:42 +09002780 hashpos = find_empty_slot(mp->ma_keys, key, hash);
INADA Naoki93f26f72016-11-02 18:45:16 +09002781 ix = DKIX_EMPTY;
2782 }
2783
2784 if (ix == DKIX_EMPTY) {
2785 PyDictKeyEntry *ep, *ep0;
2786 value = defaultobj;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002787 if (mp->ma_keys->dk_usable <= 0) {
Victor Stinner3c336c52016-09-12 14:17:40 +02002788 if (insertion_resize(mp) < 0) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002789 return NULL;
Victor Stinner3c336c52016-09-12 14:17:40 +02002790 }
INADA Naokiba609772016-12-07 20:41:42 +09002791 hashpos = find_empty_slot(mp->ma_keys, key, hash);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002792 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002793 ep0 = DK_ENTRIES(mp->ma_keys);
2794 ep = &ep0[mp->ma_keys->dk_nentries];
2795 dk_set_index(mp->ma_keys, hashpos, mp->ma_keys->dk_nentries);
Benjamin Petersonb1efa532013-03-04 09:47:50 -05002796 Py_INCREF(key);
INADA Naoki93f26f72016-11-02 18:45:16 +09002797 Py_INCREF(value);
2798 MAINTAIN_TRACKING(mp, key, value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002799 ep->me_key = key;
2800 ep->me_hash = hash;
INADA Naokiba609772016-12-07 20:41:42 +09002801 if (_PyDict_HasSplitTable(mp)) {
INADA Naoki93f26f72016-11-02 18:45:16 +09002802 assert(mp->ma_values[mp->ma_keys->dk_nentries] == NULL);
2803 mp->ma_values[mp->ma_keys->dk_nentries] = value;
Victor Stinner742da042016-09-07 17:40:12 -07002804 }
2805 else {
INADA Naoki93f26f72016-11-02 18:45:16 +09002806 ep->me_value = value;
Victor Stinner742da042016-09-07 17:40:12 -07002807 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002808 mp->ma_used++;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07002809 mp->ma_version_tag = DICT_NEXT_VERSION();
INADA Naoki93f26f72016-11-02 18:45:16 +09002810 mp->ma_keys->dk_usable--;
2811 mp->ma_keys->dk_nentries++;
2812 assert(mp->ma_keys->dk_usable >= 0);
2813 }
INADA Naokiba609772016-12-07 20:41:42 +09002814 else if (value == NULL) {
INADA Naoki93f26f72016-11-02 18:45:16 +09002815 value = defaultobj;
2816 assert(_PyDict_HasSplitTable(mp));
2817 assert(ix == mp->ma_used);
2818 Py_INCREF(value);
2819 MAINTAIN_TRACKING(mp, key, value);
INADA Naokiba609772016-12-07 20:41:42 +09002820 mp->ma_values[ix] = value;
INADA Naoki93f26f72016-11-02 18:45:16 +09002821 mp->ma_used++;
2822 mp->ma_version_tag = DICT_NEXT_VERSION();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002823 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002824
2825 assert(_PyDict_CheckConsistency(mp));
2826 return value;
Guido van Rossum164452c2000-08-08 16:12:54 +00002827}
2828
Benjamin Peterson00e98862013-03-07 22:16:29 -05002829static PyObject *
2830dict_setdefault(PyDictObject *mp, PyObject *args)
2831{
2832 PyObject *key, *val;
2833 PyObject *defaultobj = Py_None;
2834
2835 if (!PyArg_UnpackTuple(args, "setdefault", 1, 2, &key, &defaultobj))
2836 return NULL;
2837
Benjamin Peterson55898502013-03-08 08:36:49 -05002838 val = PyDict_SetDefault((PyObject *)mp, key, defaultobj);
Benjamin Peterson00e98862013-03-07 22:16:29 -05002839 Py_XINCREF(val);
2840 return val;
2841}
Guido van Rossum164452c2000-08-08 16:12:54 +00002842
2843static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002844dict_clear(PyDictObject *mp)
Guido van Rossumfb8f1ca1997-03-21 21:55:12 +00002845{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002846 PyDict_Clear((PyObject *)mp);
2847 Py_RETURN_NONE;
Guido van Rossumfb8f1ca1997-03-21 21:55:12 +00002848}
2849
Guido van Rossumba6ab842000-12-12 22:02:18 +00002850static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002851dict_pop(PyDictObject *mp, PyObject *args)
Guido van Rossume027d982002-04-12 15:11:59 +00002852{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002853 PyObject *key, *deflt = NULL;
Guido van Rossume027d982002-04-12 15:11:59 +00002854
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002855 if(!PyArg_UnpackTuple(args, "pop", 1, 2, &key, &deflt))
2856 return NULL;
Eric Snow96c6af92015-05-29 22:21:39 -06002857
Yury Selivanov684ef2c2016-10-28 19:01:21 -04002858 return _PyDict_Pop((PyObject*)mp, key, deflt);
Guido van Rossume027d982002-04-12 15:11:59 +00002859}
2860
2861static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002862dict_popitem(PyDictObject *mp)
Guido van Rossumba6ab842000-12-12 22:02:18 +00002863{
Victor Stinner742da042016-09-07 17:40:12 -07002864 Py_ssize_t i, j;
2865 PyDictKeyEntry *ep0, *ep;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002866 PyObject *res;
Guido van Rossumba6ab842000-12-12 22:02:18 +00002867
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002868 /* Allocate the result tuple before checking the size. Believe it
2869 * or not, this allocation could trigger a garbage collection which
2870 * could empty the dict, so if we checked the size first and that
2871 * happened, the result would be an infinite loop (searching for an
2872 * entry that no longer exists). Note that the usual popitem()
2873 * idiom is "while d: k, v = d.popitem()". so needing to throw the
2874 * tuple away if the dict *is* empty isn't a significant
2875 * inefficiency -- possible, but unlikely in practice.
2876 */
2877 res = PyTuple_New(2);
2878 if (res == NULL)
2879 return NULL;
2880 if (mp->ma_used == 0) {
2881 Py_DECREF(res);
2882 PyErr_SetString(PyExc_KeyError,
2883 "popitem(): dictionary is empty");
2884 return NULL;
2885 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002886 /* Convert split table to combined table */
2887 if (mp->ma_keys->dk_lookup == lookdict_split) {
2888 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
2889 Py_DECREF(res);
2890 return NULL;
2891 }
2892 }
2893 ENSURE_ALLOWS_DELETIONS(mp);
Victor Stinner742da042016-09-07 17:40:12 -07002894
2895 /* Pop last item */
2896 ep0 = DK_ENTRIES(mp->ma_keys);
2897 i = mp->ma_keys->dk_nentries - 1;
2898 while (i >= 0 && ep0[i].me_value == NULL) {
2899 i--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002900 }
Victor Stinner742da042016-09-07 17:40:12 -07002901 assert(i >= 0);
2902
2903 ep = &ep0[i];
2904 j = lookdict_index(mp->ma_keys, ep->me_hash, i);
2905 assert(j >= 0);
2906 assert(dk_get_index(mp->ma_keys, j) == i);
2907 dk_set_index(mp->ma_keys, j, DKIX_DUMMY);
2908
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002909 PyTuple_SET_ITEM(res, 0, ep->me_key);
2910 PyTuple_SET_ITEM(res, 1, ep->me_value);
Victor Stinner742da042016-09-07 17:40:12 -07002911 ep->me_key = NULL;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002912 ep->me_value = NULL;
Victor Stinner742da042016-09-07 17:40:12 -07002913 /* We can't dk_usable++ since there is DKIX_DUMMY in indices */
2914 mp->ma_keys->dk_nentries = i;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002915 mp->ma_used--;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07002916 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner611b0fa2016-09-14 15:02:01 +02002917 assert(_PyDict_CheckConsistency(mp));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002918 return res;
Guido van Rossumba6ab842000-12-12 22:02:18 +00002919}
2920
Jeremy Hylton8caad492000-06-23 14:18:11 +00002921static int
2922dict_traverse(PyObject *op, visitproc visit, void *arg)
2923{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002924 PyDictObject *mp = (PyDictObject *)op;
Benjamin Peterson55f44522016-09-05 12:12:59 -07002925 PyDictKeysObject *keys = mp->ma_keys;
Serhiy Storchaka46825d22016-09-26 21:29:34 +03002926 PyDictKeyEntry *entries = DK_ENTRIES(keys);
Victor Stinner742da042016-09-07 17:40:12 -07002927 Py_ssize_t i, n = keys->dk_nentries;
2928
Benjamin Peterson55f44522016-09-05 12:12:59 -07002929 if (keys->dk_lookup == lookdict) {
2930 for (i = 0; i < n; i++) {
2931 if (entries[i].me_value != NULL) {
2932 Py_VISIT(entries[i].me_value);
2933 Py_VISIT(entries[i].me_key);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002934 }
2935 }
Victor Stinner742da042016-09-07 17:40:12 -07002936 }
2937 else {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002938 if (mp->ma_values != NULL) {
Benjamin Peterson55f44522016-09-05 12:12:59 -07002939 for (i = 0; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002940 Py_VISIT(mp->ma_values[i]);
2941 }
2942 }
2943 else {
Benjamin Peterson55f44522016-09-05 12:12:59 -07002944 for (i = 0; i < n; i++) {
2945 Py_VISIT(entries[i].me_value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002946 }
2947 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002948 }
2949 return 0;
Jeremy Hylton8caad492000-06-23 14:18:11 +00002950}
2951
2952static int
2953dict_tp_clear(PyObject *op)
2954{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002955 PyDict_Clear(op);
2956 return 0;
Jeremy Hylton8caad492000-06-23 14:18:11 +00002957}
2958
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002959static PyObject *dictiter_new(PyDictObject *, PyTypeObject *);
Guido van Rossum09e563a2001-05-01 12:10:21 +00002960
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02002961Py_ssize_t
Eric Snow96c6af92015-05-29 22:21:39 -06002962_PyDict_SizeOf(PyDictObject *mp)
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002963{
Victor Stinner742da042016-09-07 17:40:12 -07002964 Py_ssize_t size, usable, res;
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002965
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002966 size = DK_SIZE(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -07002967 usable = USABLE_FRACTION(size);
2968
Serhiy Storchaka5c4064e2015-12-19 20:05:25 +02002969 res = _PyObject_SIZE(Py_TYPE(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002970 if (mp->ma_values)
Victor Stinner742da042016-09-07 17:40:12 -07002971 res += usable * sizeof(PyObject*);
Martin v. Loewis4f2f3b62012-04-24 19:13:57 +02002972 /* If the dictionary is split, the keys portion is accounted-for
2973 in the type object. */
2974 if (mp->ma_keys->dk_refcnt == 1)
Victor Stinner98ee9d52016-09-08 09:33:56 -07002975 res += (sizeof(PyDictKeysObject)
2976 - Py_MEMBER_SIZE(PyDictKeysObject, dk_indices)
2977 + DK_IXSIZE(mp->ma_keys) * size
2978 + sizeof(PyDictKeyEntry) * usable);
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02002979 return res;
Martin v. Loewis4f2f3b62012-04-24 19:13:57 +02002980}
2981
2982Py_ssize_t
2983_PyDict_KeysSize(PyDictKeysObject *keys)
2984{
Victor Stinner98ee9d52016-09-08 09:33:56 -07002985 return (sizeof(PyDictKeysObject)
2986 - Py_MEMBER_SIZE(PyDictKeysObject, dk_indices)
2987 + DK_IXSIZE(keys) * DK_SIZE(keys)
2988 + USABLE_FRACTION(DK_SIZE(keys)) * sizeof(PyDictKeyEntry));
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002989}
2990
doko@ubuntu.com17210f52016-01-14 14:04:59 +01002991static PyObject *
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02002992dict_sizeof(PyDictObject *mp)
2993{
2994 return PyLong_FromSsize_t(_PyDict_SizeOf(mp));
2995}
2996
Raymond Hettinger8f5cdaa2003-12-13 11:26:12 +00002997PyDoc_STRVAR(getitem__doc__, "x.__getitem__(y) <==> x[y]");
2998
Martin v. Löwis00709aa2008-06-04 14:18:43 +00002999PyDoc_STRVAR(sizeof__doc__,
3000"D.__sizeof__() -> size of D in memory, in bytes");
3001
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003002PyDoc_STRVAR(get__doc__,
Guido van Rossumefae8862002-09-04 11:29:45 +00003003"D.get(k[,d]) -> D[k] if k in D, else d. d defaults to None.");
Tim Petersf7f88b12000-12-13 23:18:45 +00003004
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003005PyDoc_STRVAR(setdefault_doc__,
Guido van Rossumefae8862002-09-04 11:29:45 +00003006"D.setdefault(k[,d]) -> D.get(k,d), also set D[k]=d if k not in D");
Tim Petersf7f88b12000-12-13 23:18:45 +00003007
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003008PyDoc_STRVAR(pop__doc__,
Benjamin Petersonf10a79a2008-10-11 00:49:57 +00003009"D.pop(k[,d]) -> v, remove specified key and return the corresponding value.\n\
Raymond Hettingera3e1e4c2003-03-06 23:54:28 +00003010If key is not found, d is returned if given, otherwise KeyError is raised");
Guido van Rossume027d982002-04-12 15:11:59 +00003011
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003012PyDoc_STRVAR(popitem__doc__,
Tim Petersf7f88b12000-12-13 23:18:45 +00003013"D.popitem() -> (k, v), remove and return some (key, value) pair as a\n\
Benjamin Petersonf10a79a2008-10-11 00:49:57 +000030142-tuple; but raise KeyError if D is empty.");
Tim Petersf7f88b12000-12-13 23:18:45 +00003015
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003016PyDoc_STRVAR(update__doc__,
Brett Cannonf2754162013-05-11 14:46:48 -04003017"D.update([E, ]**F) -> None. Update D from dict/iterable E and F.\n\
3018If E is present and has a .keys() method, then does: for k in E: D[k] = E[k]\n\
3019If E is present and lacks a .keys() method, then does: for k, v in E: D[k] = v\n\
3020In either case, this is followed by: for k in F: D[k] = F[k]");
Tim Petersf7f88b12000-12-13 23:18:45 +00003021
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003022PyDoc_STRVAR(clear__doc__,
3023"D.clear() -> None. Remove all items from D.");
Tim Petersf7f88b12000-12-13 23:18:45 +00003024
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003025PyDoc_STRVAR(copy__doc__,
3026"D.copy() -> a shallow copy of D");
Tim Petersf7f88b12000-12-13 23:18:45 +00003027
Guido van Rossumb90c8482007-02-10 01:11:45 +00003028/* Forward */
3029static PyObject *dictkeys_new(PyObject *);
3030static PyObject *dictitems_new(PyObject *);
3031static PyObject *dictvalues_new(PyObject *);
3032
Guido van Rossum45c85d12007-07-27 16:31:40 +00003033PyDoc_STRVAR(keys__doc__,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003034 "D.keys() -> a set-like object providing a view on D's keys");
Guido van Rossum45c85d12007-07-27 16:31:40 +00003035PyDoc_STRVAR(items__doc__,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003036 "D.items() -> a set-like object providing a view on D's items");
Guido van Rossum45c85d12007-07-27 16:31:40 +00003037PyDoc_STRVAR(values__doc__,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003038 "D.values() -> an object providing a view on D's values");
Guido van Rossumb90c8482007-02-10 01:11:45 +00003039
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003040static PyMethodDef mapp_methods[] = {
Larry Hastings31826802013-10-19 00:09:25 -07003041 DICT___CONTAINS___METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003042 {"__getitem__", (PyCFunction)dict_subscript, METH_O | METH_COEXIST,
3043 getitem__doc__},
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02003044 {"__sizeof__", (PyCFunction)dict_sizeof, METH_NOARGS,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003045 sizeof__doc__},
3046 {"get", (PyCFunction)dict_get, METH_VARARGS,
3047 get__doc__},
3048 {"setdefault", (PyCFunction)dict_setdefault, METH_VARARGS,
3049 setdefault_doc__},
3050 {"pop", (PyCFunction)dict_pop, METH_VARARGS,
3051 pop__doc__},
3052 {"popitem", (PyCFunction)dict_popitem, METH_NOARGS,
3053 popitem__doc__},
3054 {"keys", (PyCFunction)dictkeys_new, METH_NOARGS,
3055 keys__doc__},
3056 {"items", (PyCFunction)dictitems_new, METH_NOARGS,
3057 items__doc__},
3058 {"values", (PyCFunction)dictvalues_new, METH_NOARGS,
3059 values__doc__},
3060 {"update", (PyCFunction)dict_update, METH_VARARGS | METH_KEYWORDS,
3061 update__doc__},
Larry Hastings5c661892014-01-24 06:17:25 -08003062 DICT_FROMKEYS_METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003063 {"clear", (PyCFunction)dict_clear, METH_NOARGS,
3064 clear__doc__},
3065 {"copy", (PyCFunction)dict_copy, METH_NOARGS,
3066 copy__doc__},
3067 {NULL, NULL} /* sentinel */
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003068};
3069
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00003070/* Return 1 if `key` is in dict `op`, 0 if not, and -1 on error. */
Raymond Hettingerbc0f2ab2003-11-25 21:12:14 +00003071int
3072PyDict_Contains(PyObject *op, PyObject *key)
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003073{
Benjamin Peterson8f67d082010-10-17 20:54:53 +00003074 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07003075 Py_ssize_t ix;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003076 PyDictObject *mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09003077 PyObject *value;
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003078
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003079 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02003080 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003081 hash = PyObject_Hash(key);
3082 if (hash == -1)
3083 return -1;
3084 }
INADA Naokiba609772016-12-07 20:41:42 +09003085 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07003086 if (ix == DKIX_ERROR)
3087 return -1;
INADA Naokiba609772016-12-07 20:41:42 +09003088 return (ix != DKIX_EMPTY && value != NULL);
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003089}
3090
Thomas Wouterscf297e42007-02-23 15:07:44 +00003091/* Internal version of PyDict_Contains used when the hash value is already known */
3092int
Benjamin Peterson8f67d082010-10-17 20:54:53 +00003093_PyDict_Contains(PyObject *op, PyObject *key, Py_hash_t hash)
Thomas Wouterscf297e42007-02-23 15:07:44 +00003094{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003095 PyDictObject *mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09003096 PyObject *value;
Victor Stinner742da042016-09-07 17:40:12 -07003097 Py_ssize_t ix;
Thomas Wouterscf297e42007-02-23 15:07:44 +00003098
INADA Naokiba609772016-12-07 20:41:42 +09003099 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07003100 if (ix == DKIX_ERROR)
3101 return -1;
INADA Naokiba609772016-12-07 20:41:42 +09003102 return (ix != DKIX_EMPTY && value != NULL);
Thomas Wouterscf297e42007-02-23 15:07:44 +00003103}
3104
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003105/* Hack to implement "key in dict" */
3106static PySequenceMethods dict_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003107 0, /* sq_length */
3108 0, /* sq_concat */
3109 0, /* sq_repeat */
3110 0, /* sq_item */
3111 0, /* sq_slice */
3112 0, /* sq_ass_item */
3113 0, /* sq_ass_slice */
3114 PyDict_Contains, /* sq_contains */
3115 0, /* sq_inplace_concat */
3116 0, /* sq_inplace_repeat */
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003117};
3118
Guido van Rossum09e563a2001-05-01 12:10:21 +00003119static PyObject *
Tim Peters6d6c1a32001-08-02 04:15:00 +00003120dict_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
3121{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003122 PyObject *self;
Victor Stinnera9f61a52013-07-16 22:17:26 +02003123 PyDictObject *d;
Tim Peters6d6c1a32001-08-02 04:15:00 +00003124
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003125 assert(type != NULL && type->tp_alloc != NULL);
3126 self = type->tp_alloc(type, 0);
Victor Stinnera9f61a52013-07-16 22:17:26 +02003127 if (self == NULL)
3128 return NULL;
Victor Stinnera9f61a52013-07-16 22:17:26 +02003129 d = (PyDictObject *)self;
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02003130
Victor Stinnera9f61a52013-07-16 22:17:26 +02003131 /* The object has been implicitly tracked by tp_alloc */
3132 if (type == &PyDict_Type)
3133 _PyObject_GC_UNTRACK(d);
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02003134
3135 d->ma_used = 0;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07003136 d->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner742da042016-09-07 17:40:12 -07003137 d->ma_keys = new_keys_object(PyDict_MINSIZE);
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02003138 if (d->ma_keys == NULL) {
3139 Py_DECREF(self);
3140 return NULL;
3141 }
Victor Stinner611b0fa2016-09-14 15:02:01 +02003142 assert(_PyDict_CheckConsistency(d));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003143 return self;
Tim Peters6d6c1a32001-08-02 04:15:00 +00003144}
3145
Tim Peters25786c02001-09-02 08:22:48 +00003146static int
3147dict_init(PyObject *self, PyObject *args, PyObject *kwds)
3148{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003149 return dict_update_common(self, args, kwds, "dict");
Tim Peters25786c02001-09-02 08:22:48 +00003150}
3151
Tim Peters6d6c1a32001-08-02 04:15:00 +00003152static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00003153dict_iter(PyDictObject *dict)
Guido van Rossum09e563a2001-05-01 12:10:21 +00003154{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003155 return dictiter_new(dict, &PyDictIterKey_Type);
Guido van Rossum09e563a2001-05-01 12:10:21 +00003156}
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003157
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003158PyDoc_STRVAR(dictionary_doc,
Ezio Melotti7f807b72010-03-01 04:08:34 +00003159"dict() -> new empty dictionary\n"
Tim Petersa427a2b2001-10-29 22:25:45 +00003160"dict(mapping) -> new dictionary initialized from a mapping object's\n"
Ezio Melotti7f807b72010-03-01 04:08:34 +00003161" (key, value) pairs\n"
3162"dict(iterable) -> new dictionary initialized as if via:\n"
Tim Peters4d859532001-10-27 18:27:48 +00003163" d = {}\n"
Ezio Melotti7f807b72010-03-01 04:08:34 +00003164" for k, v in iterable:\n"
Just van Rossuma797d812002-11-23 09:45:04 +00003165" d[k] = v\n"
3166"dict(**kwargs) -> new dictionary initialized with the name=value pairs\n"
3167" in the keyword argument list. For example: dict(one=1, two=2)");
Tim Peters25786c02001-09-02 08:22:48 +00003168
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003169PyTypeObject PyDict_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003170 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3171 "dict",
3172 sizeof(PyDictObject),
3173 0,
3174 (destructor)dict_dealloc, /* tp_dealloc */
3175 0, /* tp_print */
3176 0, /* tp_getattr */
3177 0, /* tp_setattr */
3178 0, /* tp_reserved */
3179 (reprfunc)dict_repr, /* tp_repr */
3180 0, /* tp_as_number */
3181 &dict_as_sequence, /* tp_as_sequence */
3182 &dict_as_mapping, /* tp_as_mapping */
Georg Brandl00da4e02010-10-18 07:32:48 +00003183 PyObject_HashNotImplemented, /* tp_hash */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003184 0, /* tp_call */
3185 0, /* tp_str */
3186 PyObject_GenericGetAttr, /* tp_getattro */
3187 0, /* tp_setattro */
3188 0, /* tp_as_buffer */
3189 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
3190 Py_TPFLAGS_BASETYPE | Py_TPFLAGS_DICT_SUBCLASS, /* tp_flags */
3191 dictionary_doc, /* tp_doc */
3192 dict_traverse, /* tp_traverse */
3193 dict_tp_clear, /* tp_clear */
3194 dict_richcompare, /* tp_richcompare */
3195 0, /* tp_weaklistoffset */
3196 (getiterfunc)dict_iter, /* tp_iter */
3197 0, /* tp_iternext */
3198 mapp_methods, /* tp_methods */
3199 0, /* tp_members */
3200 0, /* tp_getset */
3201 0, /* tp_base */
3202 0, /* tp_dict */
3203 0, /* tp_descr_get */
3204 0, /* tp_descr_set */
3205 0, /* tp_dictoffset */
3206 dict_init, /* tp_init */
3207 PyType_GenericAlloc, /* tp_alloc */
3208 dict_new, /* tp_new */
3209 PyObject_GC_Del, /* tp_free */
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003210};
3211
Victor Stinner3c1e4812012-03-26 22:10:51 +02003212PyObject *
3213_PyDict_GetItemId(PyObject *dp, struct _Py_Identifier *key)
3214{
3215 PyObject *kv;
3216 kv = _PyUnicode_FromId(key); /* borrowed */
Victor Stinner5b3b1002013-07-22 23:50:57 +02003217 if (kv == NULL) {
3218 PyErr_Clear();
Victor Stinner3c1e4812012-03-26 22:10:51 +02003219 return NULL;
Victor Stinner5b3b1002013-07-22 23:50:57 +02003220 }
Victor Stinner3c1e4812012-03-26 22:10:51 +02003221 return PyDict_GetItem(dp, kv);
3222}
3223
Guido van Rossum3cca2451997-05-16 14:23:33 +00003224/* For backward compatibility with old dictionary interface */
3225
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003226PyObject *
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +00003227PyDict_GetItemString(PyObject *v, const char *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003228{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003229 PyObject *kv, *rv;
3230 kv = PyUnicode_FromString(key);
Victor Stinnerfdcbab92013-07-16 22:16:05 +02003231 if (kv == NULL) {
3232 PyErr_Clear();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003233 return NULL;
Victor Stinnerfdcbab92013-07-16 22:16:05 +02003234 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003235 rv = PyDict_GetItem(v, kv);
3236 Py_DECREF(kv);
3237 return rv;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003238}
3239
3240int
Victor Stinner3c1e4812012-03-26 22:10:51 +02003241_PyDict_SetItemId(PyObject *v, struct _Py_Identifier *key, PyObject *item)
3242{
3243 PyObject *kv;
3244 kv = _PyUnicode_FromId(key); /* borrowed */
3245 if (kv == NULL)
3246 return -1;
3247 return PyDict_SetItem(v, kv, item);
3248}
3249
3250int
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +00003251PyDict_SetItemString(PyObject *v, const char *key, PyObject *item)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003252{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003253 PyObject *kv;
3254 int err;
3255 kv = PyUnicode_FromString(key);
3256 if (kv == NULL)
3257 return -1;
3258 PyUnicode_InternInPlace(&kv); /* XXX Should we really? */
3259 err = PyDict_SetItem(v, kv, item);
3260 Py_DECREF(kv);
3261 return err;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003262}
3263
3264int
Victor Stinner5fd2e5a2013-11-06 18:58:22 +01003265_PyDict_DelItemId(PyObject *v, _Py_Identifier *key)
3266{
3267 PyObject *kv = _PyUnicode_FromId(key); /* borrowed */
3268 if (kv == NULL)
3269 return -1;
3270 return PyDict_DelItem(v, kv);
3271}
3272
3273int
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +00003274PyDict_DelItemString(PyObject *v, const char *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003275{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003276 PyObject *kv;
3277 int err;
3278 kv = PyUnicode_FromString(key);
3279 if (kv == NULL)
3280 return -1;
3281 err = PyDict_DelItem(v, kv);
3282 Py_DECREF(kv);
3283 return err;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003284}
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003285
Raymond Hettinger019a1482004-03-18 02:41:19 +00003286/* Dictionary iterator types */
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003287
3288typedef struct {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003289 PyObject_HEAD
3290 PyDictObject *di_dict; /* Set to NULL when iterator is exhausted */
3291 Py_ssize_t di_used;
3292 Py_ssize_t di_pos;
3293 PyObject* di_result; /* reusable result tuple for iteritems */
3294 Py_ssize_t len;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003295} dictiterobject;
3296
3297static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00003298dictiter_new(PyDictObject *dict, PyTypeObject *itertype)
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003299{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003300 dictiterobject *di;
3301 di = PyObject_GC_New(dictiterobject, itertype);
3302 if (di == NULL)
3303 return NULL;
3304 Py_INCREF(dict);
3305 di->di_dict = dict;
3306 di->di_used = dict->ma_used;
3307 di->di_pos = 0;
3308 di->len = dict->ma_used;
3309 if (itertype == &PyDictIterItem_Type) {
3310 di->di_result = PyTuple_Pack(2, Py_None, Py_None);
3311 if (di->di_result == NULL) {
3312 Py_DECREF(di);
3313 return NULL;
3314 }
3315 }
3316 else
3317 di->di_result = NULL;
3318 _PyObject_GC_TRACK(di);
3319 return (PyObject *)di;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003320}
3321
3322static void
3323dictiter_dealloc(dictiterobject *di)
3324{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003325 Py_XDECREF(di->di_dict);
3326 Py_XDECREF(di->di_result);
3327 PyObject_GC_Del(di);
Antoine Pitrou7ddda782009-01-01 15:35:33 +00003328}
3329
3330static int
3331dictiter_traverse(dictiterobject *di, visitproc visit, void *arg)
3332{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003333 Py_VISIT(di->di_dict);
3334 Py_VISIT(di->di_result);
3335 return 0;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003336}
3337
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00003338static PyObject *
Raymond Hettinger0ce6dc82004-03-18 08:38:00 +00003339dictiter_len(dictiterobject *di)
3340{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003341 Py_ssize_t len = 0;
3342 if (di->di_dict != NULL && di->di_used == di->di_dict->ma_used)
3343 len = di->len;
3344 return PyLong_FromSize_t(len);
Raymond Hettinger0ce6dc82004-03-18 08:38:00 +00003345}
3346
Guido van Rossumb90c8482007-02-10 01:11:45 +00003347PyDoc_STRVAR(length_hint_doc,
3348 "Private method returning an estimate of len(list(it)).");
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00003349
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003350static PyObject *
3351dictiter_reduce(dictiterobject *di);
3352
3353PyDoc_STRVAR(reduce_doc, "Return state information for pickling.");
3354
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00003355static PyMethodDef dictiter_methods[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003356 {"__length_hint__", (PyCFunction)dictiter_len, METH_NOARGS,
3357 length_hint_doc},
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003358 {"__reduce__", (PyCFunction)dictiter_reduce, METH_NOARGS,
3359 reduce_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003360 {NULL, NULL} /* sentinel */
Raymond Hettinger0ce6dc82004-03-18 08:38:00 +00003361};
3362
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003363static PyObject*
3364dictiter_iternextkey(dictiterobject *di)
Guido van Rossum213c7a62001-04-23 14:08:49 +00003365{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003366 PyObject *key;
INADA Naokica2d8be2016-11-04 16:59:10 +09003367 Py_ssize_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02003368 PyDictKeysObject *k;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003369 PyDictObject *d = di->di_dict;
Guido van Rossum213c7a62001-04-23 14:08:49 +00003370
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003371 if (d == NULL)
3372 return NULL;
3373 assert (PyDict_Check(d));
Guido van Rossum2147df72002-07-16 20:30:22 +00003374
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003375 if (di->di_used != d->ma_used) {
3376 PyErr_SetString(PyExc_RuntimeError,
3377 "dictionary changed size during iteration");
3378 di->di_used = -1; /* Make this state sticky */
3379 return NULL;
3380 }
Guido van Rossum2147df72002-07-16 20:30:22 +00003381
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003382 i = di->di_pos;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003383 k = d->ma_keys;
INADA Naokica2d8be2016-11-04 16:59:10 +09003384 assert(i >= 0);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003385 if (d->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09003386 if (i >= d->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003387 goto fail;
3388 key = DK_ENTRIES(k)[i].me_key;
INADA Naokica2d8be2016-11-04 16:59:10 +09003389 assert(d->ma_values[i] != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003390 }
3391 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09003392 Py_ssize_t n = k->dk_nentries;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003393 PyDictKeyEntry *entry_ptr = &DK_ENTRIES(k)[i];
3394 while (i < n && entry_ptr->me_value == NULL) {
3395 entry_ptr++;
3396 i++;
3397 }
3398 if (i >= n)
3399 goto fail;
3400 key = entry_ptr->me_key;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003401 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003402 di->di_pos = i+1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003403 di->len--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003404 Py_INCREF(key);
3405 return key;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003406
3407fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003408 di->di_dict = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003409 Py_DECREF(d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003410 return NULL;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003411}
3412
Raymond Hettinger019a1482004-03-18 02:41:19 +00003413PyTypeObject PyDictIterKey_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003414 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3415 "dict_keyiterator", /* tp_name */
3416 sizeof(dictiterobject), /* tp_basicsize */
3417 0, /* tp_itemsize */
3418 /* methods */
3419 (destructor)dictiter_dealloc, /* tp_dealloc */
3420 0, /* tp_print */
3421 0, /* tp_getattr */
3422 0, /* tp_setattr */
3423 0, /* tp_reserved */
3424 0, /* tp_repr */
3425 0, /* tp_as_number */
3426 0, /* tp_as_sequence */
3427 0, /* tp_as_mapping */
3428 0, /* tp_hash */
3429 0, /* tp_call */
3430 0, /* tp_str */
3431 PyObject_GenericGetAttr, /* tp_getattro */
3432 0, /* tp_setattro */
3433 0, /* tp_as_buffer */
3434 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3435 0, /* tp_doc */
3436 (traverseproc)dictiter_traverse, /* tp_traverse */
3437 0, /* tp_clear */
3438 0, /* tp_richcompare */
3439 0, /* tp_weaklistoffset */
3440 PyObject_SelfIter, /* tp_iter */
3441 (iternextfunc)dictiter_iternextkey, /* tp_iternext */
3442 dictiter_methods, /* tp_methods */
3443 0,
Raymond Hettinger019a1482004-03-18 02:41:19 +00003444};
3445
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003446static PyObject *
3447dictiter_iternextvalue(dictiterobject *di)
Raymond Hettinger019a1482004-03-18 02:41:19 +00003448{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003449 PyObject *value;
INADA Naokica2d8be2016-11-04 16:59:10 +09003450 Py_ssize_t i;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003451 PyDictObject *d = di->di_dict;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003452
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003453 if (d == NULL)
3454 return NULL;
3455 assert (PyDict_Check(d));
Raymond Hettinger019a1482004-03-18 02:41:19 +00003456
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003457 if (di->di_used != d->ma_used) {
3458 PyErr_SetString(PyExc_RuntimeError,
3459 "dictionary changed size during iteration");
3460 di->di_used = -1; /* Make this state sticky */
3461 return NULL;
3462 }
Raymond Hettinger019a1482004-03-18 02:41:19 +00003463
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003464 i = di->di_pos;
INADA Naokica2d8be2016-11-04 16:59:10 +09003465 assert(i >= 0);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003466 if (d->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09003467 if (i >= d->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003468 goto fail;
INADA Naokica2d8be2016-11-04 16:59:10 +09003469 value = d->ma_values[i];
3470 assert(value != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003471 }
3472 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09003473 Py_ssize_t n = d->ma_keys->dk_nentries;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003474 PyDictKeyEntry *entry_ptr = &DK_ENTRIES(d->ma_keys)[i];
3475 while (i < n && entry_ptr->me_value == NULL) {
3476 entry_ptr++;
3477 i++;
3478 }
3479 if (i >= n)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003480 goto fail;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003481 value = entry_ptr->me_value;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003482 }
3483 di->di_pos = i+1;
3484 di->len--;
3485 Py_INCREF(value);
3486 return value;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003487
3488fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003489 di->di_dict = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003490 Py_DECREF(d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003491 return NULL;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003492}
3493
3494PyTypeObject PyDictIterValue_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003495 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3496 "dict_valueiterator", /* tp_name */
3497 sizeof(dictiterobject), /* tp_basicsize */
3498 0, /* tp_itemsize */
3499 /* methods */
3500 (destructor)dictiter_dealloc, /* tp_dealloc */
3501 0, /* tp_print */
3502 0, /* tp_getattr */
3503 0, /* tp_setattr */
3504 0, /* tp_reserved */
3505 0, /* tp_repr */
3506 0, /* tp_as_number */
3507 0, /* tp_as_sequence */
3508 0, /* tp_as_mapping */
3509 0, /* tp_hash */
3510 0, /* tp_call */
3511 0, /* tp_str */
3512 PyObject_GenericGetAttr, /* tp_getattro */
3513 0, /* tp_setattro */
3514 0, /* tp_as_buffer */
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003515 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC, /* tp_flags */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003516 0, /* tp_doc */
3517 (traverseproc)dictiter_traverse, /* tp_traverse */
3518 0, /* tp_clear */
3519 0, /* tp_richcompare */
3520 0, /* tp_weaklistoffset */
3521 PyObject_SelfIter, /* tp_iter */
3522 (iternextfunc)dictiter_iternextvalue, /* tp_iternext */
3523 dictiter_methods, /* tp_methods */
3524 0,
Raymond Hettinger019a1482004-03-18 02:41:19 +00003525};
3526
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003527static PyObject *
3528dictiter_iternextitem(dictiterobject *di)
Raymond Hettinger019a1482004-03-18 02:41:19 +00003529{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003530 PyObject *key, *value, *result = di->di_result;
INADA Naokica2d8be2016-11-04 16:59:10 +09003531 Py_ssize_t i;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003532 PyDictObject *d = di->di_dict;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003533
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003534 if (d == NULL)
3535 return NULL;
3536 assert (PyDict_Check(d));
Raymond Hettinger019a1482004-03-18 02:41:19 +00003537
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003538 if (di->di_used != d->ma_used) {
3539 PyErr_SetString(PyExc_RuntimeError,
3540 "dictionary changed size during iteration");
3541 di->di_used = -1; /* Make this state sticky */
3542 return NULL;
3543 }
Raymond Hettinger019a1482004-03-18 02:41:19 +00003544
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003545 i = di->di_pos;
INADA Naokica2d8be2016-11-04 16:59:10 +09003546 assert(i >= 0);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003547 if (d->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09003548 if (i >= d->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003549 goto fail;
3550 key = DK_ENTRIES(d->ma_keys)[i].me_key;
INADA Naokica2d8be2016-11-04 16:59:10 +09003551 value = d->ma_values[i];
3552 assert(value != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003553 }
3554 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09003555 Py_ssize_t n = d->ma_keys->dk_nentries;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003556 PyDictKeyEntry *entry_ptr = &DK_ENTRIES(d->ma_keys)[i];
3557 while (i < n && entry_ptr->me_value == NULL) {
3558 entry_ptr++;
3559 i++;
3560 }
3561 if (i >= n)
3562 goto fail;
3563 key = entry_ptr->me_key;
3564 value = entry_ptr->me_value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003565 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003566 di->di_pos = i+1;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003567 di->len--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003568 if (result->ob_refcnt == 1) {
3569 Py_INCREF(result);
3570 Py_DECREF(PyTuple_GET_ITEM(result, 0));
3571 Py_DECREF(PyTuple_GET_ITEM(result, 1));
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003572 }
3573 else {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003574 result = PyTuple_New(2);
3575 if (result == NULL)
3576 return NULL;
3577 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003578 Py_INCREF(key);
3579 Py_INCREF(value);
Eric Snow96c6af92015-05-29 22:21:39 -06003580 PyTuple_SET_ITEM(result, 0, key); /* steals reference */
3581 PyTuple_SET_ITEM(result, 1, value); /* steals reference */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003582 return result;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003583
3584fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003585 di->di_dict = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003586 Py_DECREF(d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003587 return NULL;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003588}
3589
3590PyTypeObject PyDictIterItem_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003591 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3592 "dict_itemiterator", /* tp_name */
3593 sizeof(dictiterobject), /* tp_basicsize */
3594 0, /* tp_itemsize */
3595 /* methods */
3596 (destructor)dictiter_dealloc, /* tp_dealloc */
3597 0, /* tp_print */
3598 0, /* tp_getattr */
3599 0, /* tp_setattr */
3600 0, /* tp_reserved */
3601 0, /* tp_repr */
3602 0, /* tp_as_number */
3603 0, /* tp_as_sequence */
3604 0, /* tp_as_mapping */
3605 0, /* tp_hash */
3606 0, /* tp_call */
3607 0, /* tp_str */
3608 PyObject_GenericGetAttr, /* tp_getattro */
3609 0, /* tp_setattro */
3610 0, /* tp_as_buffer */
3611 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3612 0, /* tp_doc */
3613 (traverseproc)dictiter_traverse, /* tp_traverse */
3614 0, /* tp_clear */
3615 0, /* tp_richcompare */
3616 0, /* tp_weaklistoffset */
3617 PyObject_SelfIter, /* tp_iter */
3618 (iternextfunc)dictiter_iternextitem, /* tp_iternext */
3619 dictiter_methods, /* tp_methods */
3620 0,
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003621};
Guido van Rossumb90c8482007-02-10 01:11:45 +00003622
3623
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003624static PyObject *
3625dictiter_reduce(dictiterobject *di)
3626{
3627 PyObject *list;
3628 dictiterobject tmp;
3629
3630 list = PyList_New(0);
3631 if (!list)
3632 return NULL;
3633
3634 /* copy the itertor state */
3635 tmp = *di;
3636 Py_XINCREF(tmp.di_dict);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003637
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003638 /* iterate the temporary into a list */
3639 for(;;) {
3640 PyObject *element = 0;
3641 if (Py_TYPE(di) == &PyDictIterItem_Type)
3642 element = dictiter_iternextitem(&tmp);
3643 else if (Py_TYPE(di) == &PyDictIterKey_Type)
3644 element = dictiter_iternextkey(&tmp);
3645 else if (Py_TYPE(di) == &PyDictIterValue_Type)
3646 element = dictiter_iternextvalue(&tmp);
3647 else
3648 assert(0);
3649 if (element) {
3650 if (PyList_Append(list, element)) {
3651 Py_DECREF(element);
3652 Py_DECREF(list);
3653 Py_XDECREF(tmp.di_dict);
3654 return NULL;
3655 }
3656 Py_DECREF(element);
3657 } else
3658 break;
3659 }
3660 Py_XDECREF(tmp.di_dict);
3661 /* check for error */
3662 if (tmp.di_dict != NULL) {
3663 /* we have an error */
3664 Py_DECREF(list);
3665 return NULL;
3666 }
Antoine Pitroua7013882012-04-05 00:04:20 +02003667 return Py_BuildValue("N(N)", _PyObject_GetBuiltin("iter"), list);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003668}
3669
Guido van Rossum3ac67412007-02-10 18:55:06 +00003670/***********************************************/
Guido van Rossumb90c8482007-02-10 01:11:45 +00003671/* View objects for keys(), items(), values(). */
Guido van Rossum3ac67412007-02-10 18:55:06 +00003672/***********************************************/
3673
Guido van Rossumb90c8482007-02-10 01:11:45 +00003674/* The instance lay-out is the same for all three; but the type differs. */
3675
Guido van Rossumb90c8482007-02-10 01:11:45 +00003676static void
Eric Snow96c6af92015-05-29 22:21:39 -06003677dictview_dealloc(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003678{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003679 Py_XDECREF(dv->dv_dict);
3680 PyObject_GC_Del(dv);
Antoine Pitrou7ddda782009-01-01 15:35:33 +00003681}
3682
3683static int
Eric Snow96c6af92015-05-29 22:21:39 -06003684dictview_traverse(_PyDictViewObject *dv, visitproc visit, void *arg)
Antoine Pitrou7ddda782009-01-01 15:35:33 +00003685{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003686 Py_VISIT(dv->dv_dict);
3687 return 0;
Guido van Rossumb90c8482007-02-10 01:11:45 +00003688}
3689
Guido van Rossum83825ac2007-02-10 04:54:19 +00003690static Py_ssize_t
Eric Snow96c6af92015-05-29 22:21:39 -06003691dictview_len(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003692{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003693 Py_ssize_t len = 0;
3694 if (dv->dv_dict != NULL)
3695 len = dv->dv_dict->ma_used;
3696 return len;
Guido van Rossumb90c8482007-02-10 01:11:45 +00003697}
3698
Eric Snow96c6af92015-05-29 22:21:39 -06003699PyObject *
3700_PyDictView_New(PyObject *dict, PyTypeObject *type)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003701{
Eric Snow96c6af92015-05-29 22:21:39 -06003702 _PyDictViewObject *dv;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003703 if (dict == NULL) {
3704 PyErr_BadInternalCall();
3705 return NULL;
3706 }
3707 if (!PyDict_Check(dict)) {
3708 /* XXX Get rid of this restriction later */
3709 PyErr_Format(PyExc_TypeError,
3710 "%s() requires a dict argument, not '%s'",
3711 type->tp_name, dict->ob_type->tp_name);
3712 return NULL;
3713 }
Eric Snow96c6af92015-05-29 22:21:39 -06003714 dv = PyObject_GC_New(_PyDictViewObject, type);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003715 if (dv == NULL)
3716 return NULL;
3717 Py_INCREF(dict);
3718 dv->dv_dict = (PyDictObject *)dict;
3719 _PyObject_GC_TRACK(dv);
3720 return (PyObject *)dv;
Guido van Rossumb90c8482007-02-10 01:11:45 +00003721}
3722
Neal Norwitze36f2ba2007-02-26 23:12:28 +00003723/* TODO(guido): The views objects are not complete:
3724
3725 * support more set operations
3726 * support arbitrary mappings?
3727 - either these should be static or exported in dictobject.h
3728 - if public then they should probably be in builtins
3729*/
3730
Guido van Rossumaac530c2007-08-24 22:33:45 +00003731/* Return 1 if self is a subset of other, iterating over self;
3732 0 if not; -1 if an error occurred. */
Guido van Rossumd9214d12007-02-12 02:23:40 +00003733static int
3734all_contained_in(PyObject *self, PyObject *other)
3735{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003736 PyObject *iter = PyObject_GetIter(self);
3737 int ok = 1;
Guido van Rossumd9214d12007-02-12 02:23:40 +00003738
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003739 if (iter == NULL)
3740 return -1;
3741 for (;;) {
3742 PyObject *next = PyIter_Next(iter);
3743 if (next == NULL) {
3744 if (PyErr_Occurred())
3745 ok = -1;
3746 break;
3747 }
3748 ok = PySequence_Contains(other, next);
3749 Py_DECREF(next);
3750 if (ok <= 0)
3751 break;
3752 }
3753 Py_DECREF(iter);
3754 return ok;
Guido van Rossumd9214d12007-02-12 02:23:40 +00003755}
3756
3757static PyObject *
3758dictview_richcompare(PyObject *self, PyObject *other, int op)
3759{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003760 Py_ssize_t len_self, len_other;
3761 int ok;
3762 PyObject *result;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003763
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003764 assert(self != NULL);
3765 assert(PyDictViewSet_Check(self));
3766 assert(other != NULL);
Guido van Rossumd9214d12007-02-12 02:23:40 +00003767
Brian Curtindfc80e32011-08-10 20:28:54 -05003768 if (!PyAnySet_Check(other) && !PyDictViewSet_Check(other))
3769 Py_RETURN_NOTIMPLEMENTED;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003770
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003771 len_self = PyObject_Size(self);
3772 if (len_self < 0)
3773 return NULL;
3774 len_other = PyObject_Size(other);
3775 if (len_other < 0)
3776 return NULL;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003777
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003778 ok = 0;
3779 switch(op) {
Guido van Rossumaac530c2007-08-24 22:33:45 +00003780
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003781 case Py_NE:
3782 case Py_EQ:
3783 if (len_self == len_other)
3784 ok = all_contained_in(self, other);
3785 if (op == Py_NE && ok >= 0)
3786 ok = !ok;
3787 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003788
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003789 case Py_LT:
3790 if (len_self < len_other)
3791 ok = all_contained_in(self, other);
3792 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003793
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003794 case Py_LE:
3795 if (len_self <= len_other)
3796 ok = all_contained_in(self, other);
3797 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003798
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003799 case Py_GT:
3800 if (len_self > len_other)
3801 ok = all_contained_in(other, self);
3802 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003803
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003804 case Py_GE:
3805 if (len_self >= len_other)
3806 ok = all_contained_in(other, self);
3807 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003808
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003809 }
3810 if (ok < 0)
3811 return NULL;
3812 result = ok ? Py_True : Py_False;
3813 Py_INCREF(result);
3814 return result;
Guido van Rossumd9214d12007-02-12 02:23:40 +00003815}
3816
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003817static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06003818dictview_repr(_PyDictViewObject *dv)
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003819{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003820 PyObject *seq;
3821 PyObject *result;
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003822
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003823 seq = PySequence_List((PyObject *)dv);
3824 if (seq == NULL)
3825 return NULL;
3826
3827 result = PyUnicode_FromFormat("%s(%R)", Py_TYPE(dv)->tp_name, seq);
3828 Py_DECREF(seq);
3829 return result;
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003830}
3831
Guido van Rossum3ac67412007-02-10 18:55:06 +00003832/*** dict_keys ***/
Guido van Rossumb90c8482007-02-10 01:11:45 +00003833
3834static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06003835dictkeys_iter(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003836{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003837 if (dv->dv_dict == NULL) {
3838 Py_RETURN_NONE;
3839 }
3840 return dictiter_new(dv->dv_dict, &PyDictIterKey_Type);
Guido van Rossum3ac67412007-02-10 18:55:06 +00003841}
3842
3843static int
Eric Snow96c6af92015-05-29 22:21:39 -06003844dictkeys_contains(_PyDictViewObject *dv, PyObject *obj)
Guido van Rossum3ac67412007-02-10 18:55:06 +00003845{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003846 if (dv->dv_dict == NULL)
3847 return 0;
3848 return PyDict_Contains((PyObject *)dv->dv_dict, obj);
Guido van Rossumb90c8482007-02-10 01:11:45 +00003849}
3850
Guido van Rossum83825ac2007-02-10 04:54:19 +00003851static PySequenceMethods dictkeys_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003852 (lenfunc)dictview_len, /* sq_length */
3853 0, /* sq_concat */
3854 0, /* sq_repeat */
3855 0, /* sq_item */
3856 0, /* sq_slice */
3857 0, /* sq_ass_item */
3858 0, /* sq_ass_slice */
3859 (objobjproc)dictkeys_contains, /* sq_contains */
Guido van Rossum83825ac2007-02-10 04:54:19 +00003860};
3861
Guido van Rossum523259b2007-08-24 23:41:22 +00003862static PyObject*
3863dictviews_sub(PyObject* self, PyObject *other)
3864{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003865 PyObject *result = PySet_New(self);
3866 PyObject *tmp;
Martin v. Löwisbd928fe2011-10-14 10:20:37 +02003867 _Py_IDENTIFIER(difference_update);
Martin v. Löwisafe55bb2011-10-09 10:38:36 +02003868
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003869 if (result == NULL)
3870 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003871
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003872 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_difference_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003873 if (tmp == NULL) {
3874 Py_DECREF(result);
3875 return NULL;
3876 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003877
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003878 Py_DECREF(tmp);
3879 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003880}
3881
Benjamin Peterson025e9eb2015-05-05 20:16:41 -04003882PyObject*
3883_PyDictView_Intersect(PyObject* self, PyObject *other)
Guido van Rossum523259b2007-08-24 23:41:22 +00003884{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003885 PyObject *result = PySet_New(self);
3886 PyObject *tmp;
Martin v. Löwisbd928fe2011-10-14 10:20:37 +02003887 _Py_IDENTIFIER(intersection_update);
Martin v. Löwisafe55bb2011-10-09 10:38:36 +02003888
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003889 if (result == NULL)
3890 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003891
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003892 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_intersection_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003893 if (tmp == NULL) {
3894 Py_DECREF(result);
3895 return NULL;
3896 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003897
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003898 Py_DECREF(tmp);
3899 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003900}
3901
3902static PyObject*
3903dictviews_or(PyObject* self, PyObject *other)
3904{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003905 PyObject *result = PySet_New(self);
3906 PyObject *tmp;
Martin v. Löwis1c67dd92011-10-14 15:16:45 +02003907 _Py_IDENTIFIER(update);
Victor Stinnerd1a9cc22011-10-13 22:51:17 +02003908
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003909 if (result == NULL)
3910 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003911
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003912 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003913 if (tmp == NULL) {
3914 Py_DECREF(result);
3915 return NULL;
3916 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003917
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003918 Py_DECREF(tmp);
3919 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003920}
3921
3922static PyObject*
3923dictviews_xor(PyObject* self, PyObject *other)
3924{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003925 PyObject *result = PySet_New(self);
3926 PyObject *tmp;
Martin v. Löwisbd928fe2011-10-14 10:20:37 +02003927 _Py_IDENTIFIER(symmetric_difference_update);
Martin v. Löwisafe55bb2011-10-09 10:38:36 +02003928
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003929 if (result == NULL)
3930 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003931
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003932 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_symmetric_difference_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003933 if (tmp == NULL) {
3934 Py_DECREF(result);
3935 return NULL;
3936 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003937
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003938 Py_DECREF(tmp);
3939 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003940}
3941
3942static PyNumberMethods dictviews_as_number = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003943 0, /*nb_add*/
3944 (binaryfunc)dictviews_sub, /*nb_subtract*/
3945 0, /*nb_multiply*/
3946 0, /*nb_remainder*/
3947 0, /*nb_divmod*/
3948 0, /*nb_power*/
3949 0, /*nb_negative*/
3950 0, /*nb_positive*/
3951 0, /*nb_absolute*/
3952 0, /*nb_bool*/
3953 0, /*nb_invert*/
3954 0, /*nb_lshift*/
3955 0, /*nb_rshift*/
Benjamin Peterson025e9eb2015-05-05 20:16:41 -04003956 (binaryfunc)_PyDictView_Intersect, /*nb_and*/
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003957 (binaryfunc)dictviews_xor, /*nb_xor*/
3958 (binaryfunc)dictviews_or, /*nb_or*/
Guido van Rossum523259b2007-08-24 23:41:22 +00003959};
3960
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00003961static PyObject*
3962dictviews_isdisjoint(PyObject *self, PyObject *other)
3963{
3964 PyObject *it;
3965 PyObject *item = NULL;
3966
3967 if (self == other) {
Eric Snow96c6af92015-05-29 22:21:39 -06003968 if (dictview_len((_PyDictViewObject *)self) == 0)
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00003969 Py_RETURN_TRUE;
3970 else
3971 Py_RETURN_FALSE;
3972 }
3973
3974 /* Iterate over the shorter object (only if other is a set,
3975 * because PySequence_Contains may be expensive otherwise): */
3976 if (PyAnySet_Check(other) || PyDictViewSet_Check(other)) {
Eric Snow96c6af92015-05-29 22:21:39 -06003977 Py_ssize_t len_self = dictview_len((_PyDictViewObject *)self);
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00003978 Py_ssize_t len_other = PyObject_Size(other);
3979 if (len_other == -1)
3980 return NULL;
3981
3982 if ((len_other > len_self)) {
3983 PyObject *tmp = other;
3984 other = self;
3985 self = tmp;
3986 }
3987 }
3988
3989 it = PyObject_GetIter(other);
3990 if (it == NULL)
3991 return NULL;
3992
3993 while ((item = PyIter_Next(it)) != NULL) {
3994 int contains = PySequence_Contains(self, item);
3995 Py_DECREF(item);
3996 if (contains == -1) {
3997 Py_DECREF(it);
3998 return NULL;
3999 }
4000
4001 if (contains) {
4002 Py_DECREF(it);
4003 Py_RETURN_FALSE;
4004 }
4005 }
4006 Py_DECREF(it);
4007 if (PyErr_Occurred())
4008 return NULL; /* PyIter_Next raised an exception. */
4009 Py_RETURN_TRUE;
4010}
4011
4012PyDoc_STRVAR(isdisjoint_doc,
4013"Return True if the view and the given iterable have a null intersection.");
4014
Guido van Rossumb90c8482007-02-10 01:11:45 +00004015static PyMethodDef dictkeys_methods[] = {
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004016 {"isdisjoint", (PyCFunction)dictviews_isdisjoint, METH_O,
4017 isdisjoint_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004018 {NULL, NULL} /* sentinel */
Guido van Rossumb90c8482007-02-10 01:11:45 +00004019};
4020
4021PyTypeObject PyDictKeys_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004022 PyVarObject_HEAD_INIT(&PyType_Type, 0)
4023 "dict_keys", /* tp_name */
Eric Snow96c6af92015-05-29 22:21:39 -06004024 sizeof(_PyDictViewObject), /* tp_basicsize */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004025 0, /* tp_itemsize */
4026 /* methods */
4027 (destructor)dictview_dealloc, /* tp_dealloc */
4028 0, /* tp_print */
4029 0, /* tp_getattr */
4030 0, /* tp_setattr */
4031 0, /* tp_reserved */
4032 (reprfunc)dictview_repr, /* tp_repr */
4033 &dictviews_as_number, /* tp_as_number */
4034 &dictkeys_as_sequence, /* tp_as_sequence */
4035 0, /* tp_as_mapping */
4036 0, /* tp_hash */
4037 0, /* tp_call */
4038 0, /* tp_str */
4039 PyObject_GenericGetAttr, /* tp_getattro */
4040 0, /* tp_setattro */
4041 0, /* tp_as_buffer */
4042 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4043 0, /* tp_doc */
4044 (traverseproc)dictview_traverse, /* tp_traverse */
4045 0, /* tp_clear */
4046 dictview_richcompare, /* tp_richcompare */
4047 0, /* tp_weaklistoffset */
4048 (getiterfunc)dictkeys_iter, /* tp_iter */
4049 0, /* tp_iternext */
4050 dictkeys_methods, /* tp_methods */
4051 0,
Guido van Rossumb90c8482007-02-10 01:11:45 +00004052};
4053
4054static PyObject *
4055dictkeys_new(PyObject *dict)
4056{
Eric Snow96c6af92015-05-29 22:21:39 -06004057 return _PyDictView_New(dict, &PyDictKeys_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004058}
4059
Guido van Rossum3ac67412007-02-10 18:55:06 +00004060/*** dict_items ***/
Guido van Rossumb90c8482007-02-10 01:11:45 +00004061
4062static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06004063dictitems_iter(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00004064{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004065 if (dv->dv_dict == NULL) {
4066 Py_RETURN_NONE;
4067 }
4068 return dictiter_new(dv->dv_dict, &PyDictIterItem_Type);
Guido van Rossum3ac67412007-02-10 18:55:06 +00004069}
4070
4071static int
Eric Snow96c6af92015-05-29 22:21:39 -06004072dictitems_contains(_PyDictViewObject *dv, PyObject *obj)
Guido van Rossum3ac67412007-02-10 18:55:06 +00004073{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004074 PyObject *key, *value, *found;
4075 if (dv->dv_dict == NULL)
4076 return 0;
4077 if (!PyTuple_Check(obj) || PyTuple_GET_SIZE(obj) != 2)
4078 return 0;
4079 key = PyTuple_GET_ITEM(obj, 0);
4080 value = PyTuple_GET_ITEM(obj, 1);
Raymond Hettinger6692f012016-09-18 21:46:08 -07004081 found = PyDict_GetItemWithError((PyObject *)dv->dv_dict, key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004082 if (found == NULL) {
4083 if (PyErr_Occurred())
4084 return -1;
4085 return 0;
4086 }
4087 return PyObject_RichCompareBool(value, found, Py_EQ);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004088}
4089
Guido van Rossum83825ac2007-02-10 04:54:19 +00004090static PySequenceMethods dictitems_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004091 (lenfunc)dictview_len, /* sq_length */
4092 0, /* sq_concat */
4093 0, /* sq_repeat */
4094 0, /* sq_item */
4095 0, /* sq_slice */
4096 0, /* sq_ass_item */
4097 0, /* sq_ass_slice */
4098 (objobjproc)dictitems_contains, /* sq_contains */
Guido van Rossum83825ac2007-02-10 04:54:19 +00004099};
4100
Guido van Rossumb90c8482007-02-10 01:11:45 +00004101static PyMethodDef dictitems_methods[] = {
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004102 {"isdisjoint", (PyCFunction)dictviews_isdisjoint, METH_O,
4103 isdisjoint_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004104 {NULL, NULL} /* sentinel */
Guido van Rossumb90c8482007-02-10 01:11:45 +00004105};
4106
4107PyTypeObject PyDictItems_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004108 PyVarObject_HEAD_INIT(&PyType_Type, 0)
4109 "dict_items", /* tp_name */
Eric Snow96c6af92015-05-29 22:21:39 -06004110 sizeof(_PyDictViewObject), /* tp_basicsize */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004111 0, /* tp_itemsize */
4112 /* methods */
4113 (destructor)dictview_dealloc, /* tp_dealloc */
4114 0, /* tp_print */
4115 0, /* tp_getattr */
4116 0, /* tp_setattr */
4117 0, /* tp_reserved */
4118 (reprfunc)dictview_repr, /* tp_repr */
4119 &dictviews_as_number, /* tp_as_number */
4120 &dictitems_as_sequence, /* tp_as_sequence */
4121 0, /* tp_as_mapping */
4122 0, /* tp_hash */
4123 0, /* tp_call */
4124 0, /* tp_str */
4125 PyObject_GenericGetAttr, /* tp_getattro */
4126 0, /* tp_setattro */
4127 0, /* tp_as_buffer */
4128 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4129 0, /* tp_doc */
4130 (traverseproc)dictview_traverse, /* tp_traverse */
4131 0, /* tp_clear */
4132 dictview_richcompare, /* tp_richcompare */
4133 0, /* tp_weaklistoffset */
4134 (getiterfunc)dictitems_iter, /* tp_iter */
4135 0, /* tp_iternext */
4136 dictitems_methods, /* tp_methods */
4137 0,
Guido van Rossumb90c8482007-02-10 01:11:45 +00004138};
4139
4140static PyObject *
4141dictitems_new(PyObject *dict)
4142{
Eric Snow96c6af92015-05-29 22:21:39 -06004143 return _PyDictView_New(dict, &PyDictItems_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004144}
4145
Guido van Rossum3ac67412007-02-10 18:55:06 +00004146/*** dict_values ***/
Guido van Rossumb90c8482007-02-10 01:11:45 +00004147
4148static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06004149dictvalues_iter(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00004150{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004151 if (dv->dv_dict == NULL) {
4152 Py_RETURN_NONE;
4153 }
4154 return dictiter_new(dv->dv_dict, &PyDictIterValue_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004155}
4156
Guido van Rossum83825ac2007-02-10 04:54:19 +00004157static PySequenceMethods dictvalues_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004158 (lenfunc)dictview_len, /* sq_length */
4159 0, /* sq_concat */
4160 0, /* sq_repeat */
4161 0, /* sq_item */
4162 0, /* sq_slice */
4163 0, /* sq_ass_item */
4164 0, /* sq_ass_slice */
4165 (objobjproc)0, /* sq_contains */
Guido van Rossum83825ac2007-02-10 04:54:19 +00004166};
4167
Guido van Rossumb90c8482007-02-10 01:11:45 +00004168static PyMethodDef dictvalues_methods[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004169 {NULL, NULL} /* sentinel */
Guido van Rossumb90c8482007-02-10 01:11:45 +00004170};
4171
4172PyTypeObject PyDictValues_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004173 PyVarObject_HEAD_INIT(&PyType_Type, 0)
4174 "dict_values", /* tp_name */
Eric Snow96c6af92015-05-29 22:21:39 -06004175 sizeof(_PyDictViewObject), /* tp_basicsize */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004176 0, /* tp_itemsize */
4177 /* methods */
4178 (destructor)dictview_dealloc, /* tp_dealloc */
4179 0, /* tp_print */
4180 0, /* tp_getattr */
4181 0, /* tp_setattr */
4182 0, /* tp_reserved */
4183 (reprfunc)dictview_repr, /* tp_repr */
4184 0, /* tp_as_number */
4185 &dictvalues_as_sequence, /* tp_as_sequence */
4186 0, /* tp_as_mapping */
4187 0, /* tp_hash */
4188 0, /* tp_call */
4189 0, /* tp_str */
4190 PyObject_GenericGetAttr, /* tp_getattro */
4191 0, /* tp_setattro */
4192 0, /* tp_as_buffer */
4193 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4194 0, /* tp_doc */
4195 (traverseproc)dictview_traverse, /* tp_traverse */
4196 0, /* tp_clear */
4197 0, /* tp_richcompare */
4198 0, /* tp_weaklistoffset */
4199 (getiterfunc)dictvalues_iter, /* tp_iter */
4200 0, /* tp_iternext */
4201 dictvalues_methods, /* tp_methods */
4202 0,
Guido van Rossumb90c8482007-02-10 01:11:45 +00004203};
4204
4205static PyObject *
4206dictvalues_new(PyObject *dict)
4207{
Eric Snow96c6af92015-05-29 22:21:39 -06004208 return _PyDictView_New(dict, &PyDictValues_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004209}
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004210
4211/* Returns NULL if cannot allocate a new PyDictKeysObject,
4212 but does not set an error */
4213PyDictKeysObject *
4214_PyDict_NewKeysForClass(void)
4215{
Victor Stinner742da042016-09-07 17:40:12 -07004216 PyDictKeysObject *keys = new_keys_object(PyDict_MINSIZE);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004217 if (keys == NULL)
4218 PyErr_Clear();
4219 else
4220 keys->dk_lookup = lookdict_split;
4221 return keys;
4222}
4223
/* Access the ht_cached_keys member of a type, viewed as a
 * PyHeapTypeObject.  Expands to an lvalue, so it can be assigned to.
 * The argument is parenthesized so that the cast applies to the whole
 * argument expression rather than only to its first operand. */
#define CACHED_KEYS(tp) (((PyHeapTypeObject*)(tp))->ht_cached_keys)
4225
4226PyObject *
4227PyObject_GenericGetDict(PyObject *obj, void *context)
4228{
4229 PyObject *dict, **dictptr = _PyObject_GetDictPtr(obj);
4230 if (dictptr == NULL) {
4231 PyErr_SetString(PyExc_AttributeError,
4232 "This object has no __dict__");
4233 return NULL;
4234 }
4235 dict = *dictptr;
4236 if (dict == NULL) {
4237 PyTypeObject *tp = Py_TYPE(obj);
4238 if ((tp->tp_flags & Py_TPFLAGS_HEAPTYPE) && CACHED_KEYS(tp)) {
4239 DK_INCREF(CACHED_KEYS(tp));
4240 *dictptr = dict = new_dict_with_shared_keys(CACHED_KEYS(tp));
4241 }
4242 else {
4243 *dictptr = dict = PyDict_New();
4244 }
4245 }
4246 Py_XINCREF(dict);
4247 return dict;
4248}
4249
4250int
4251_PyObjectDict_SetItem(PyTypeObject *tp, PyObject **dictptr,
Victor Stinner742da042016-09-07 17:40:12 -07004252 PyObject *key, PyObject *value)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004253{
4254 PyObject *dict;
4255 int res;
4256 PyDictKeysObject *cached;
4257
4258 assert(dictptr != NULL);
4259 if ((tp->tp_flags & Py_TPFLAGS_HEAPTYPE) && (cached = CACHED_KEYS(tp))) {
4260 assert(dictptr != NULL);
4261 dict = *dictptr;
4262 if (dict == NULL) {
4263 DK_INCREF(cached);
4264 dict = new_dict_with_shared_keys(cached);
4265 if (dict == NULL)
4266 return -1;
4267 *dictptr = dict;
4268 }
4269 if (value == NULL) {
4270 res = PyDict_DelItem(dict, key);
4271 if (cached != ((PyDictObject *)dict)->ma_keys) {
4272 CACHED_KEYS(tp) = NULL;
4273 DK_DECREF(cached);
4274 }
Victor Stinner3d3f2642016-12-15 17:21:23 +01004275 }
4276 else {
4277 int was_shared = cached == ((PyDictObject *)dict)->ma_keys;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004278 res = PyDict_SetItem(dict, key, value);
Victor Stinner3d3f2642016-12-15 17:21:23 +01004279 if (was_shared && cached != ((PyDictObject *)dict)->ma_keys) {
4280 /* PyDict_SetItem() may call dictresize and convert split table
4281 * into combined table. In such case, convert it to split
4282 * table again and update type's shared key only when this is
4283 * the only dict sharing key with the type.
4284 *
4285 * This is to allow using shared key in class like this:
4286 *
4287 * class C:
4288 * def __init__(self):
4289 * # one dict resize happens
4290 * self.a, self.b, self.c = 1, 2, 3
4291 * self.d, self.e, self.f = 4, 5, 6
4292 * a = C()
4293 */
Benjamin Peterson15ee8212012-04-24 14:44:18 -04004294 if (cached->dk_refcnt == 1) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004295 CACHED_KEYS(tp) = make_keys_shared(dict);
Victor Stinner742da042016-09-07 17:40:12 -07004296 }
4297 else {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004298 CACHED_KEYS(tp) = NULL;
4299 }
4300 DK_DECREF(cached);
Benjamin Peterson15ee8212012-04-24 14:44:18 -04004301 if (CACHED_KEYS(tp) == NULL && PyErr_Occurred())
4302 return -1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004303 }
4304 }
4305 } else {
4306 dict = *dictptr;
4307 if (dict == NULL) {
4308 dict = PyDict_New();
4309 if (dict == NULL)
4310 return -1;
4311 *dictptr = dict;
4312 }
4313 if (value == NULL) {
4314 res = PyDict_DelItem(dict, key);
4315 } else {
4316 res = PyDict_SetItem(dict, key, value);
4317 }
4318 }
4319 return res;
4320}
4321
4322void
4323_PyDictKeys_DecRef(PyDictKeysObject *keys)
4324{
4325 DK_DECREF(keys);
4326}