blob: 9950f50896a6f49a4055a9ad79356a6d17ed3e7f [file] [log] [blame]
Guido van Rossum2bc13791999-03-24 19:06:42 +00001/* Dictionary object implementation using a hash table */
Guido van Rossum9bfef441993-03-29 10:43:31 +00002
Raymond Hettinger930427b2003-05-03 06:51:59 +00003/* The distribution includes a separate file, Objects/dictnotes.txt,
Tim Peters60b29962006-01-01 01:19:23 +00004 describing explorations into dictionary design and optimization.
Raymond Hettinger930427b2003-05-03 06:51:59 +00005 It covers typical dictionary use patterns, the parameters for
6 tuning dictionaries, and several ideas for possible optimizations.
7*/
8
Victor Stinner742da042016-09-07 17:40:12 -07009/* PyDictKeysObject
10
11This implements the dictionary's hashtable.
12
Raymond Hettingerb12785d2016-10-22 09:58:14 -070013As of Python 3.6, this is compact and ordered. Basic idea is described here:
14* https://mail.python.org/pipermail/python-dev/2012-December/123028.html
15* https://morepypy.blogspot.com/2015/01/faster-more-memory-efficient-and-more.html
Victor Stinner742da042016-09-07 17:40:12 -070016
17layout:
18
19+---------------+
20| dk_refcnt |
21| dk_size |
22| dk_lookup |
23| dk_usable |
24| dk_nentries |
25+---------------+
26| dk_indices |
27| |
28+---------------+
29| dk_entries |
30| |
31+---------------+
32
dk_indices is the actual hashtable. Each slot holds an index into dk_entries,
or DKIX_EMPTY(-1) or DKIX_DUMMY(-2).
The number of slots is dk_size. The integer type of each slot depends on dk_size:
36
37* int8 for dk_size <= 128
38* int16 for 256 <= dk_size <= 2**15
39* int32 for 2**16 <= dk_size <= 2**31
40* int64 for 2**32 <= dk_size
41
dk_entries is an array of PyDictKeyEntry. Its size is USABLE_FRACTION(dk_size).
DK_ENTRIES(dk) can be used to get a pointer to the entries.
44
NOTE: Since negative values are used for DKIX_EMPTY and DKIX_DUMMY, the type of
a dk_indices entry is a signed integer, and int16 is used for a table whose
dk_size == 256.
48*/
49
Benjamin Peterson7d95e402012-04-23 11:24:50 -040050
51/*
Benjamin Peterson7d95e402012-04-23 11:24:50 -040052The DictObject can be in one of two forms.
Victor Stinner742da042016-09-07 17:40:12 -070053
Benjamin Peterson7d95e402012-04-23 11:24:50 -040054Either:
55 A combined table:
56 ma_values == NULL, dk_refcnt == 1.
57 Values are stored in the me_value field of the PyDictKeysObject.
Benjamin Peterson7d95e402012-04-23 11:24:50 -040058Or:
59 A split table:
60 ma_values != NULL, dk_refcnt >= 1
61 Values are stored in the ma_values array.
Victor Stinner742da042016-09-07 17:40:12 -070062 Only string (unicode) keys are allowed.
63 All dicts sharing same key must have same insertion order.
Benjamin Peterson7d95e402012-04-23 11:24:50 -040064
Victor Stinner742da042016-09-07 17:40:12 -070065There are four kinds of slots in the table (slot is index, and
66DK_ENTRIES(keys)[index] if index >= 0):
67
681. Unused. index == DKIX_EMPTY
69 Does not hold an active (key, value) pair now and never did. Unused can
70 transition to Active upon key insertion. This is each slot's initial state.
71
722. Active. index >= 0, me_key != NULL and me_value != NULL
73 Holds an active (key, value) pair. Active can transition to Dummy or
74 Pending upon key deletion (for combined and split tables respectively).
75 This is the only case in which me_value != NULL.
76
773. Dummy. index == DKIX_DUMMY (combined only)
78 Previously held an active (key, value) pair, but that was deleted and an
79 active pair has not yet overwritten the slot. Dummy can transition to
80 Active upon key insertion. Dummy slots cannot be made Unused again
81 else the probe sequence in case of collision would have no way to know
82 they were once active.
83
844. Pending. index >= 0, key != NULL, and value == NULL (split only)
85 Not yet inserted in split-table.
Benjamin Peterson7d95e402012-04-23 11:24:50 -040086*/
87
Victor Stinner742da042016-09-07 17:40:12 -070088/*
89Preserving insertion order
Benjamin Peterson7d95e402012-04-23 11:24:50 -040090
Victor Stinner742da042016-09-07 17:40:12 -070091It's simple for combined table. Since dk_entries is mostly append only, we can
92get insertion order by just iterating dk_entries.
93
One exception is .popitem(). It removes the last item in dk_entries and
decrements dk_nentries to achieve amortized O(1). Since DKIX_DUMMY entries
remain in dk_indices, we can't increment dk_usable even though dk_nentries is
decremented.
98
In a split table, inserting into a pending entry is allowed only for
dk_entries[ix] where ix == mp->ma_used. Inserting at any other index, or
deleting an item, converts the dict to a combined table.
102*/
103
/* PyDict_MINSIZE is the hash-table size every new dict starts with.
 *
 * A table of 8 slots holds at most 5 active entries.  Experiments suggested
 * that this covers the majority of dicts, which are mostly the usually-small
 * dicts created to pass keyword arguments.
 * Choosing 8 instead of 4 cuts the number of resizes for most dictionaries
 * without any significant extra memory use.
 */
#define PyDict_MINSIZE 8
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400112
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000113#include "Python.h"
Eric Snow96c6af92015-05-29 22:21:39 -0600114#include "dict-common.h"
Victor Stinner990397e2016-09-09 20:22:59 -0700115#include "stringlib/eq.h" /* to get unicode_eq() */
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000116
Larry Hastings61272b72014-01-07 12:41:53 -0800117/*[clinic input]
Larry Hastingsc2047262014-01-25 20:43:29 -0800118class dict "PyDictObject *" "&PyDict_Type"
Larry Hastings61272b72014-01-07 12:41:53 -0800119[clinic start generated code]*/
Larry Hastings581ee362014-01-28 05:00:08 -0800120/*[clinic end generated code: output=da39a3ee5e6b4b0d input=f157a5a0ce9589d6]*/
Larry Hastings44e2eaa2013-11-23 15:37:55 -0800121
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400122
123/*
To ensure the lookup algorithm terminates, there must be at least one Unused
slot (index == DKIX_EMPTY) in the table.
126To avoid slowing down lookups on a near-full table, we resize the table when
127it's USABLE_FRACTION (currently two-thirds) full.
128*/
Guido van Rossum16e93a81997-01-28 00:00:11 +0000129
/* Number of bits "perturb" is shifted right on every probe step
 * (see lookdict_index(): perturb >>= PERTURB_SHIFT). */
#define PERTURB_SHIFT 5
131
Guido van Rossum16e93a81997-01-28 00:00:11 +0000132/*
Tim Peterseb28ef22001-06-02 05:27:19 +0000133Major subtleties ahead: Most hash schemes depend on having a "good" hash
134function, in the sense of simulating randomness. Python doesn't: its most
R David Murray537ad7a2016-07-10 12:33:18 -0400135important hash functions (for ints) are very regular in common
Tim Peterseb28ef22001-06-02 05:27:19 +0000136cases:
Tim Peters15d49292001-05-27 07:39:22 +0000137
R David Murray537ad7a2016-07-10 12:33:18 -0400138 >>>[hash(i) for i in range(4)]
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000139 [0, 1, 2, 3]
Tim Peters15d49292001-05-27 07:39:22 +0000140
Tim Peterseb28ef22001-06-02 05:27:19 +0000141This isn't necessarily bad! To the contrary, in a table of size 2**i, taking
142the low-order i bits as the initial table index is extremely fast, and there
R David Murray537ad7a2016-07-10 12:33:18 -0400143are no collisions at all for dicts indexed by a contiguous range of ints. So
144this gives better-than-random behavior in common cases, and that's very
145desirable.
Tim Peters15d49292001-05-27 07:39:22 +0000146
Tim Peterseb28ef22001-06-02 05:27:19 +0000147OTOH, when collisions occur, the tendency to fill contiguous slices of the
148hash table makes a good collision resolution strategy crucial. Taking only
149the last i bits of the hash code is also vulnerable: for example, consider
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000150the list [i << 16 for i in range(20000)] as a set of keys. Since ints are
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000151their own hash codes, and this fits in a dict of size 2**15, the last 15 bits
152 of every hash code are all 0: they *all* map to the same table index.
Tim Peters15d49292001-05-27 07:39:22 +0000153
Tim Peterseb28ef22001-06-02 05:27:19 +0000154But catering to unusual cases should not slow the usual ones, so we just take
155the last i bits anyway. It's up to collision resolution to do the rest. If
156we *usually* find the key we're looking for on the first try (and, it turns
157out, we usually do -- the table load factor is kept under 2/3, so the odds
158are solidly in our favor), then it makes best sense to keep the initial index
159computation dirt cheap.
Tim Peters15d49292001-05-27 07:39:22 +0000160
Tim Peterseb28ef22001-06-02 05:27:19 +0000161The first half of collision resolution is to visit table indices via this
162recurrence:
Tim Peters15d49292001-05-27 07:39:22 +0000163
Tim Peterseb28ef22001-06-02 05:27:19 +0000164 j = ((5*j) + 1) mod 2**i
Tim Peters15d49292001-05-27 07:39:22 +0000165
Tim Peterseb28ef22001-06-02 05:27:19 +0000166For any initial j in range(2**i), repeating that 2**i times generates each
167int in range(2**i) exactly once (see any text on random-number generation for
168proof). By itself, this doesn't help much: like linear probing (setting
169j += 1, or j -= 1, on each loop trip), it scans the table entries in a fixed
170order. This would be bad, except that's not the only thing we do, and it's
171actually *good* in the common cases where hash keys are consecutive. In an
172example that's really too small to make this entirely clear, for a table of
173size 2**3 the order of indices is:
Tim Peters15d49292001-05-27 07:39:22 +0000174
Tim Peterseb28ef22001-06-02 05:27:19 +0000175 0 -> 1 -> 6 -> 7 -> 4 -> 5 -> 2 -> 3 -> 0 [and here it's repeating]
176
177If two things come in at index 5, the first place we look after is index 2,
178not 6, so if another comes in at index 6 the collision at 5 didn't hurt it.
179Linear probing is deadly in this case because there the fixed probe order
180is the *same* as the order consecutive keys are likely to arrive. But it's
181extremely unlikely hash codes will follow a 5*j+1 recurrence by accident,
182and certain that consecutive hash codes do not.
183
184The other half of the strategy is to get the other bits of the hash code
185into play. This is done by initializing a (unsigned) vrbl "perturb" to the
186full hash code, and changing the recurrence to:
187
Tim Peterseb28ef22001-06-02 05:27:19 +0000188 perturb >>= PERTURB_SHIFT;
INADA Naoki267941c2016-10-06 15:19:07 +0900189 j = (5*j) + 1 + perturb;
Tim Peterseb28ef22001-06-02 05:27:19 +0000190 use j % 2**i as the next table index;
191
192Now the probe sequence depends (eventually) on every bit in the hash code,
193and the pseudo-scrambling property of recurring on 5*j+1 is more valuable,
194because it quickly magnifies small differences in the bits that didn't affect
195the initial index. Note that because perturb is unsigned, if the recurrence
196is executed often enough perturb eventually becomes and remains 0. At that
197point (very rarely reached) the recurrence is on (just) 5*j+1 again, and
198that's certain to find an empty slot eventually (since it generates every int
199in range(2**i), and we make sure there's always at least one empty slot).
200
201Selecting a good value for PERTURB_SHIFT is a balancing act. You want it
202small so that the high bits of the hash code continue to affect the probe
203sequence across iterations; but you want it large so that in really bad cases
204the high-order hash bits have an effect on early iterations. 5 was "the
205best" in minimizing total collisions across experiments Tim Peters ran (on
206both normal and pathological cases), but 4 and 6 weren't significantly worse.
207
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000208Historical: Reimer Behrends contributed the idea of using a polynomial-based
Tim Peterseb28ef22001-06-02 05:27:19 +0000209approach, using repeated multiplication by x in GF(2**n) where an irreducible
210polynomial for each table size was chosen such that x was a primitive root.
211Christian Tismer later extended that to use division by x instead, as an
212efficient way to get the high bits of the hash code into play. This scheme
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000213also gave excellent collision statistics, but was more expensive: two
214if-tests were required inside the loop; computing "the next" index took about
215the same number of operations but without as much potential parallelism
216(e.g., computing 5*j can go on at the same time as computing 1+perturb in the
217above, and then shifting perturb can be done while the table index is being
218masked); and the PyDictObject struct required a member to hold the table's
219polynomial. In Tim's experiments the current scheme ran faster, produced
220equally good collision statistics, needed less code & used less memory.
Thomas Wouters4d70c3d2006-06-08 14:42:34 +0000221
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000222*/
Tim Petersdea48ec2001-05-22 20:40:22 +0000223
Fred Drake1bff34a2000-08-31 19:31:38 +0000224/* forward declarations */
Victor Stinner742da042016-09-07 17:40:12 -0700225static Py_ssize_t lookdict(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900226 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700227 Py_ssize_t *hashpos);
228static Py_ssize_t lookdict_unicode(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900229 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700230 Py_ssize_t *hashpos);
231static Py_ssize_t
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400232lookdict_unicode_nodummy(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900233 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700234 Py_ssize_t *hashpos);
235static Py_ssize_t lookdict_split(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900236 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700237 Py_ssize_t *hashpos);
Fred Drake1bff34a2000-08-31 19:31:38 +0000238
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400239static int dictresize(PyDictObject *mp, Py_ssize_t minused);
Tim Petersdea48ec2001-05-22 20:40:22 +0000240
/* Process-wide counter that feeds the ma_version_tag field of dictionaries.
 * It is bumped every time a dictionary is created and every time a
 * dictionary is modified.  As a static object it starts out at zero. */
static uint64_t pydict_global_version;

/* Advance the global counter and yield the new (post-increment) value. */
#define DICT_NEXT_VERSION() (pydict_global_version += 1)
247
Victor Stinner742da042016-09-07 17:40:12 -0700248/* Dictionary reuse scheme to save calls to malloc and free */
Christian Heimes2202f872008-02-06 14:31:34 +0000249#ifndef PyDict_MAXFREELIST
250#define PyDict_MAXFREELIST 80
251#endif
252static PyDictObject *free_list[PyDict_MAXFREELIST];
253static int numfree = 0;
Victor Stinner742da042016-09-07 17:40:12 -0700254static PyDictKeysObject *keys_free_list[PyDict_MAXFREELIST];
255static int numfreekeys = 0;
Raymond Hettinger43442782004-03-17 21:55:03 +0000256
Serhiy Storchaka1009bf12015-04-03 23:53:51 +0300257#include "clinic/dictobject.c.h"
258
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100259int
260PyDict_ClearFreeList(void)
Christian Heimes77c02eb2008-02-09 02:18:51 +0000261{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000262 PyDictObject *op;
Victor Stinner742da042016-09-07 17:40:12 -0700263 int ret = numfree + numfreekeys;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000264 while (numfree) {
265 op = free_list[--numfree];
266 assert(PyDict_CheckExact(op));
267 PyObject_GC_Del(op);
268 }
Victor Stinner742da042016-09-07 17:40:12 -0700269 while (numfreekeys) {
270 PyObject_FREE(keys_free_list[--numfreekeys]);
271 }
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100272 return ret;
273}
274
David Malcolm49526f42012-06-22 14:55:41 -0400275/* Print summary info about the state of the optimized allocator */
276void
277_PyDict_DebugMallocStats(FILE *out)
278{
279 _PyDebugAllocatorStats(out,
280 "free PyDictObject", numfree, sizeof(PyDictObject));
281}
282
283
/* Finalization hook for the dict type: empties both free lists. */
void
PyDict_Fini(void)
{
    /* The count returned by PyDict_ClearFreeList() is not needed here. */
    (void)PyDict_ClearFreeList();
}
289
/* Number of slots in the hash table of keys object `dk`. */
#define DK_SIZE(dk) ((dk)->dk_size)

/* Width in bytes of one hash-table slot.  The width grows with the table:
 * 1 byte up to 0xff slots, 2 bytes up to 0xffff, then 4 bytes; tables larger
 * than 0xffffffff slots (only possible with pointers wider than 4 bytes)
 * use 8-byte slots. */
#if SIZEOF_VOID_P > 4
#define DK_IXSIZE(dk)                                               \
    (DK_SIZE(dk) > 0xffff                                           \
         ? (DK_SIZE(dk) > 0xffffffff ? sizeof(int64_t) : 4)         \
         : (DK_SIZE(dk) > 0xff ? 2 : 1))
#else
#define DK_IXSIZE(dk)                                               \
    (DK_SIZE(dk) > 0xffff                                           \
         ? sizeof(int32_t)                                          \
         : (DK_SIZE(dk) > 0xff ? 2 : 1))
#endif

/* Pointer to the entry array, which is laid out directly behind the
 * DK_SIZE(dk) * DK_IXSIZE(dk) bytes of hash-table slots. */
#define DK_ENTRIES(dk) \
    ((PyDictKeyEntry *)((dk)->dk_indices.as_1 + DK_SIZE(dk) * DK_IXSIZE(dk)))
Victor Stinner742da042016-09-07 17:40:12 -0700305
/* Hooks that keep the interpreter-wide reference total in step with the
 * keys-object refcount.  They expand to whatever _Py_INC_REFTOTAL /
 * _Py_DEC_REFTOTAL and _Py_REF_DEBUG_COMMA are defined as
 * (presumably nothing outside reference-debugging builds -- confirm in
 * the object headers). */
#define DK_DEBUG_INCREF _Py_INC_REFTOTAL _Py_REF_DEBUG_COMMA
#define DK_DEBUG_DECREF _Py_DEC_REFTOTAL _Py_REF_DEBUG_COMMA

/* Take one more reference to keys object `dk`. */
#define DK_INCREF(dk) (DK_DEBUG_INCREF ++(dk)->dk_refcnt)

/* Drop one reference to keys object `dk`; when the count reaches zero the
 * keys object is handed to free_keys_object().
 *
 * The body is wrapped in do { ... } while (0) so the macro behaves as a
 * single statement: a bare `if` here would capture the `else` of a caller
 * that writes `if (c) DK_DECREF(k); else ...`. */
#define DK_DECREF(dk)                                       \
    do {                                                    \
        if (DK_DEBUG_DECREF (--(dk)->dk_refcnt) == 0) {     \
            free_keys_object(dk);                           \
        }                                                   \
    } while (0)
/* Bit mask that reduces a hash to a slot position; relies on dk_size being
 * a power of two. */
#define DK_MASK(dk) (((dk)->dk_size)-1)

/* True when `x` has at most one bit set.  Note that this also accepts 0.
 * Every use of the argument is parenthesized so that an expression argument
 * such as `a | b` is evaluated as a whole before 1 is subtracted. */
#define IS_POWER_OF_2(x) (((x) & ((x) - 1)) == 0)
313
Victor Stinner742da042016-09-07 17:40:12 -0700314/* lookup indices. returns DKIX_EMPTY, DKIX_DUMMY, or ix >=0 */
Benjamin Peterson73222252016-09-08 09:58:47 -0700315static inline Py_ssize_t
Victor Stinner742da042016-09-07 17:40:12 -0700316dk_get_index(PyDictKeysObject *keys, Py_ssize_t i)
317{
318 Py_ssize_t s = DK_SIZE(keys);
Victor Stinner71211e32016-09-08 10:52:46 -0700319 Py_ssize_t ix;
320
Victor Stinner742da042016-09-07 17:40:12 -0700321 if (s <= 0xff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700322 int8_t *indices = keys->dk_indices.as_1;
Victor Stinner208857e2016-09-08 11:35:46 -0700323 ix = indices[i];
Victor Stinner742da042016-09-07 17:40:12 -0700324 }
325 else if (s <= 0xffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700326 int16_t *indices = keys->dk_indices.as_2;
Victor Stinner208857e2016-09-08 11:35:46 -0700327 ix = indices[i];
Victor Stinner742da042016-09-07 17:40:12 -0700328 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700329#if SIZEOF_VOID_P > 4
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300330 else if (s > 0xffffffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700331 int64_t *indices = keys->dk_indices.as_8;
Victor Stinner208857e2016-09-08 11:35:46 -0700332 ix = indices[i];
Victor Stinner742da042016-09-07 17:40:12 -0700333 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700334#endif
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300335 else {
336 int32_t *indices = keys->dk_indices.as_4;
337 ix = indices[i];
338 }
Victor Stinner71211e32016-09-08 10:52:46 -0700339 assert(ix >= DKIX_DUMMY);
340 return ix;
Victor Stinner742da042016-09-07 17:40:12 -0700341}
342
343/* write to indices. */
Benjamin Peterson73222252016-09-08 09:58:47 -0700344static inline void
Victor Stinner742da042016-09-07 17:40:12 -0700345dk_set_index(PyDictKeysObject *keys, Py_ssize_t i, Py_ssize_t ix)
346{
347 Py_ssize_t s = DK_SIZE(keys);
Victor Stinner71211e32016-09-08 10:52:46 -0700348
349 assert(ix >= DKIX_DUMMY);
350
Victor Stinner742da042016-09-07 17:40:12 -0700351 if (s <= 0xff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700352 int8_t *indices = keys->dk_indices.as_1;
Victor Stinner71211e32016-09-08 10:52:46 -0700353 assert(ix <= 0x7f);
Victor Stinner208857e2016-09-08 11:35:46 -0700354 indices[i] = (char)ix;
Victor Stinner742da042016-09-07 17:40:12 -0700355 }
356 else if (s <= 0xffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700357 int16_t *indices = keys->dk_indices.as_2;
Victor Stinner71211e32016-09-08 10:52:46 -0700358 assert(ix <= 0x7fff);
Victor Stinner208857e2016-09-08 11:35:46 -0700359 indices[i] = (int16_t)ix;
Victor Stinner742da042016-09-07 17:40:12 -0700360 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700361#if SIZEOF_VOID_P > 4
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300362 else if (s > 0xffffffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700363 int64_t *indices = keys->dk_indices.as_8;
Victor Stinner208857e2016-09-08 11:35:46 -0700364 indices[i] = ix;
Victor Stinner742da042016-09-07 17:40:12 -0700365 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700366#endif
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300367 else {
368 int32_t *indices = keys->dk_indices.as_4;
369 assert(ix <= 0x7fffffff);
370 indices[i] = (int32_t)ix;
371 }
Victor Stinner742da042016-09-07 17:40:12 -0700372}
373
374
/* USABLE_FRACTION(n) is the maximum number of entries a table of n slots
 * may hold, i.e. the maximum dictionary load.
 *
 * A higher ratio packs dictionaries more densely and so causes more
 * collisions.  A lower ratio makes them sparser, at the price of spreading
 * the indices over more cache lines and of higher total memory use.
 *
 * Requirements:
 *     0 < USABLE_FRACTION(n) < n   for all n >= 2
 *     USABLE_FRACTION should be quick to calculate.
 *
 * Fractions around 1/2 to 2/3 seem to work well in practice.
 */
#define USABLE_FRACTION(n) (((n) * 2) / 3)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400387
/* ESTIMATE_SIZE(n) is the reverse of USABLE_FRACTION: it gives a table size
 * to reserve so that n entries can be inserted without a resize.
 */
#define ESTIMATE_SIZE(n) ((3 * (n) + 1) >> 1)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400393
Victor Stinner742da042016-09-07 17:40:12 -0700394/* Alternative fraction that is otherwise close enough to 2n/3 to make
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400395 * little difference. 8 * 2/3 == 8 * 5/8 == 5. 16 * 2/3 == 16 * 5/8 == 10.
396 * 32 * 2/3 = 21, 32 * 5/8 = 20.
397 * Its advantage is that it is faster to compute on machines with slow division.
398 * #define USABLE_FRACTION(n) (((n) >> 1) + ((n) >> 2) - ((n) >> 3))
Victor Stinner742da042016-09-07 17:40:12 -0700399 */
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400400
/* GROWTH_RATE(d): size requested for dict `d` once it hits maximum load.
 *
 * Currently used*2 + capacity/2.  A dict that only grows therefore doubles
 * in size, while a dict whose deletions are on a par with its insertions
 * gets more head room.
 *
 * Raising this to used*4 doubles memory consumption depending on the size
 * of the dictionary, but halves the number of resizes and so the effort
 * spent resizing.
 *
 * History:
 *   up to version 3.2   used*4
 *   version 3.3.0       used*2
 */
#define GROWTH_RATE(d) (((d)->ma_keys->dk_size >> 1) + ((d)->ma_used * 2))
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400413
/* If dict `d` still uses the lookdict_unicode_nodummy lookup routine, switch
 * it to lookdict_unicode; any other lookup routine is left untouched.
 *
 * Wrapped in do { ... } while (0) so the macro is a single statement and
 * can be followed by `;` anywhere a statement is allowed, including directly
 * before an `else`. */
#define ENSURE_ALLOWS_DELETIONS(d)                                      \
    do {                                                                \
        if ((d)->ma_keys->dk_lookup == lookdict_unicode_nodummy) {      \
            (d)->ma_keys->dk_lookup = lookdict_unicode;                 \
        }                                                               \
    } while (0)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400418
419/* This immutable, empty PyDictKeysObject is used for PyDict_Clear()
420 * (which cannot fail and thus can do no allocation).
421 */
422static PyDictKeysObject empty_keys_struct = {
Serhiy Storchaka97932e42016-09-26 23:01:23 +0300423 1, /* dk_refcnt */
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400424 1, /* dk_size */
425 lookdict_split, /* dk_lookup */
426 0, /* dk_usable (immutable) */
Victor Stinner742da042016-09-07 17:40:12 -0700427 0, /* dk_nentries */
Benjamin Peterson186122e2016-09-08 12:20:12 -0700428 .dk_indices = { .as_1 = {DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY,
429 DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY}},
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400430};
431
432static PyObject *empty_values[1] = { NULL };
433
/* Pointer to the shared empty keys object.  The expansion is parenthesized
 * so that postfix operators applied to the macro (e.g. Py_EMPTY_KEYS->field)
 * act on the pointer rather than binding tighter than the `&`. */
#define Py_EMPTY_KEYS (&empty_keys_struct)
435
Victor Stinner611b0fa2016-09-14 15:02:01 +0200436/* Uncomment to check the dict content in _PyDict_CheckConsistency() */
437/* #define DEBUG_PYDICT */
438
439
#ifdef Py_DEBUG
/* Sanity-check the bookkeeping of dict `mp` (Py_DEBUG builds only).
 *
 * Every check is an assert(); the function itself always returns 1 so that
 * the call can be placed inside an assert() by callers.  The per-slot and
 * per-entry scans are compiled in only when DEBUG_PYDICT is defined.
 */
static int
_PyDict_CheckConsistency(PyDictObject *mp)
{
    PyDictKeysObject *keys = mp->ma_keys;
    const int is_split = _PyDict_HasSplitTable(mp);
    const Py_ssize_t usable = USABLE_FRACTION(keys->dk_size);
#ifdef DEBUG_PYDICT
    PyDictKeyEntry *entries = DK_ENTRIES(keys);
#endif

    /* Counters must stay within the capacity implied by the table size. */
    assert(0 <= mp->ma_used && mp->ma_used <= usable);
    assert(IS_POWER_OF_2(keys->dk_size));
    assert(0 <= keys->dk_usable
           && keys->dk_usable <= usable);
    assert(0 <= keys->dk_nentries
           && keys->dk_nentries <= usable);
    assert(keys->dk_usable + keys->dk_nentries <= usable);

    /* A combined table owns its keys object exclusively. */
    assert(is_split || keys->dk_refcnt == 1);

#ifdef DEBUG_PYDICT
    /* Every hash-table slot holds a marker or an in-range entry index. */
    for (Py_ssize_t slot = 0; slot < keys->dk_size; slot++) {
        Py_ssize_t ix = dk_get_index(keys, slot);
        assert(DKIX_DUMMY <= ix && ix <= usable);
    }

    for (Py_ssize_t n = 0; n < usable; n++) {
        PyDictKeyEntry *entry = entries + n;
        PyObject *key = entry->me_key;

        /* Split tables never store values inside the entries. */
        if (is_split) {
            assert(entry->me_value == NULL);
        }
        if (key == NULL) {
            continue;
        }

        if (!PyUnicode_CheckExact(key)) {
            /* test_dict fails if PyObject_Hash() is called again */
            assert(entry->me_hash != -1);
        }
        else {
            /* Exact str keys cache their hash; it must match the entry. */
            Py_hash_t hash = ((PyASCIIObject *)key)->hash;
            assert(hash != -1);
            assert(entry->me_hash == hash);
        }
        if (!is_split) {
            assert(entry->me_value != NULL);
        }
    }

    if (is_split) {
        /* The first ma_used value slots of a split table are all set. */
        for (Py_ssize_t n = 0; n < mp->ma_used; n++) {
            assert(mp->ma_values[n] != NULL);
        }
    }
#endif

    return 1;
}
#endif
506
507
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400508static PyDictKeysObject *new_keys_object(Py_ssize_t size)
509{
510 PyDictKeysObject *dk;
Victor Stinner742da042016-09-07 17:40:12 -0700511 Py_ssize_t es, usable;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400512
Victor Stinner742da042016-09-07 17:40:12 -0700513 assert(size >= PyDict_MINSIZE);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400514 assert(IS_POWER_OF_2(size));
Victor Stinner742da042016-09-07 17:40:12 -0700515
516 usable = USABLE_FRACTION(size);
517 if (size <= 0xff) {
518 es = 1;
519 }
520 else if (size <= 0xffff) {
521 es = 2;
522 }
523#if SIZEOF_VOID_P > 4
524 else if (size <= 0xffffffff) {
525 es = 4;
526 }
527#endif
528 else {
529 es = sizeof(Py_ssize_t);
530 }
531
532 if (size == PyDict_MINSIZE && numfreekeys > 0) {
533 dk = keys_free_list[--numfreekeys];
534 }
535 else {
Victor Stinner98ee9d52016-09-08 09:33:56 -0700536 dk = PyObject_MALLOC(sizeof(PyDictKeysObject)
537 - Py_MEMBER_SIZE(PyDictKeysObject, dk_indices)
538 + es * size
539 + sizeof(PyDictKeyEntry) * usable);
Victor Stinner742da042016-09-07 17:40:12 -0700540 if (dk == NULL) {
541 PyErr_NoMemory();
542 return NULL;
543 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400544 }
Antoine Pitrou2d169b22012-05-12 23:43:44 +0200545 DK_DEBUG_INCREF dk->dk_refcnt = 1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400546 dk->dk_size = size;
Victor Stinner742da042016-09-07 17:40:12 -0700547 dk->dk_usable = usable;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400548 dk->dk_lookup = lookdict_unicode_nodummy;
Victor Stinner742da042016-09-07 17:40:12 -0700549 dk->dk_nentries = 0;
Benjamin Peterson186122e2016-09-08 12:20:12 -0700550 memset(&dk->dk_indices.as_1[0], 0xff, es * size);
Victor Stinner742da042016-09-07 17:40:12 -0700551 memset(DK_ENTRIES(dk), 0, sizeof(PyDictKeyEntry) * usable);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400552 return dk;
553}
554
555static void
556free_keys_object(PyDictKeysObject *keys)
557{
Victor Stinner742da042016-09-07 17:40:12 -0700558 PyDictKeyEntry *entries = DK_ENTRIES(keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400559 Py_ssize_t i, n;
Victor Stinner742da042016-09-07 17:40:12 -0700560 for (i = 0, n = keys->dk_nentries; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400561 Py_XDECREF(entries[i].me_key);
562 Py_XDECREF(entries[i].me_value);
563 }
Victor Stinner742da042016-09-07 17:40:12 -0700564 if (keys->dk_size == PyDict_MINSIZE && numfreekeys < PyDict_MAXFREELIST) {
565 keys_free_list[numfreekeys++] = keys;
566 return;
567 }
Raymond Hettingerce5179f2016-01-31 08:56:21 -0800568 PyObject_FREE(keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400569}
570
/* Allocate an array of `size` PyObject pointers via PyMem_NEW. */
#define new_values(size) PyMem_NEW(PyObject *, (size))
/* Release an array obtained from new_values(). */
#define free_values(values) PyMem_FREE(values)
573
574/* Consumes a reference to the keys object */
575static PyObject *
576new_dict(PyDictKeysObject *keys, PyObject **values)
577{
578 PyDictObject *mp;
Victor Stinnerc9b7f512013-07-08 22:19:20 +0200579 assert(keys != NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000580 if (numfree) {
581 mp = free_list[--numfree];
582 assert (mp != NULL);
583 assert (Py_TYPE(mp) == &PyDict_Type);
584 _Py_NewReference((PyObject *)mp);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000585 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400586 else {
587 mp = PyObject_GC_New(PyDictObject, &PyDict_Type);
588 if (mp == NULL) {
589 DK_DECREF(keys);
590 free_values(values);
591 return NULL;
592 }
593 }
594 mp->ma_keys = keys;
595 mp->ma_values = values;
596 mp->ma_used = 0;
Victor Stinner3b6a6b42016-09-08 12:51:24 -0700597 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner611b0fa2016-09-14 15:02:01 +0200598 assert(_PyDict_CheckConsistency(mp));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000599 return (PyObject *)mp;
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000600}
601
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400602/* Consumes a reference to the keys object */
603static PyObject *
604new_dict_with_shared_keys(PyDictKeysObject *keys)
605{
606 PyObject **values;
607 Py_ssize_t i, size;
608
Victor Stinner742da042016-09-07 17:40:12 -0700609 size = USABLE_FRACTION(DK_SIZE(keys));
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400610 values = new_values(size);
611 if (values == NULL) {
612 DK_DECREF(keys);
613 return PyErr_NoMemory();
614 }
615 for (i = 0; i < size; i++) {
616 values[i] = NULL;
617 }
618 return new_dict(keys, values);
619}
620
621PyObject *
622PyDict_New(void)
623{
Victor Stinner742da042016-09-07 17:40:12 -0700624 PyDictKeysObject *keys = new_keys_object(PyDict_MINSIZE);
Victor Stinnerc9b7f512013-07-08 22:19:20 +0200625 if (keys == NULL)
626 return NULL;
627 return new_dict(keys, NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400628}
629
Victor Stinner742da042016-09-07 17:40:12 -0700630/* Search index of hash table from offset of entry table */
631static Py_ssize_t
632lookdict_index(PyDictKeysObject *k, Py_hash_t hash, Py_ssize_t index)
633{
INADA Naoki267941c2016-10-06 15:19:07 +0900634 size_t i;
Victor Stinner742da042016-09-07 17:40:12 -0700635 size_t mask = DK_MASK(k);
636 Py_ssize_t ix;
637
638 i = (size_t)hash & mask;
639 ix = dk_get_index(k, i);
640 if (ix == index) {
641 return i;
642 }
643 if (ix == DKIX_EMPTY) {
644 return DKIX_EMPTY;
645 }
646
INADA Naoki267941c2016-10-06 15:19:07 +0900647 for (size_t perturb = hash;;) {
648 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700649 i = mask & ((i << 2) + i + perturb + 1);
650 ix = dk_get_index(k, i);
651 if (ix == index) {
652 return i;
653 }
654 if (ix == DKIX_EMPTY) {
655 return DKIX_EMPTY;
656 }
657 }
658 assert(0); /* NOT REACHED */
659 return DKIX_ERROR;
660}
661
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000662/*
663The basic lookup function used by all operations.
Guido van Rossum16e93a81997-01-28 00:00:11 +0000664This is based on Algorithm D from Knuth Vol. 3, Sec. 6.4.
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000665Open addressing is preferred over chaining since the link overhead for
666chaining would be substantial (100% with typical malloc overhead).
667
Tim Peterseb28ef22001-06-02 05:27:19 +0000668The initial probe index is computed as hash mod the table size. Subsequent
669probe indices are computed as explained earlier.
Guido van Rossum2bc13791999-03-24 19:06:42 +0000670
671All arithmetic on hash should ignore overflow.
Guido van Rossum16e93a81997-01-28 00:00:11 +0000672
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000673The details in this version are due to Tim Peters, building on many past
Tim Peterseb28ef22001-06-02 05:27:19 +0000674contributions by Reimer Behrends, Jyrki Alakuijala, Vladimir Marangozov and
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000675Christian Tismer.
Fred Drake1bff34a2000-08-31 19:31:38 +0000676
Victor Stinner742da042016-09-07 17:40:12 -0700677lookdict() is general-purpose, and may return DKIX_ERROR if (and only if) a
Victor Stinnera4348cc2016-09-08 12:01:25 -0700678comparison raises an exception.
Guido van Rossum89d8c602007-09-18 17:26:56 +0000679lookdict_unicode() below is specialized to string keys, comparison of which can
Victor Stinner742da042016-09-07 17:40:12 -0700680never raise an exception; that function can never return DKIX_ERROR.
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400681lookdict_unicode_nodummy is further specialized for string keys that cannot be
682the <dummy> value.
Victor Stinner742da042016-09-07 17:40:12 -0700683For both, when the key isn't found a DKIX_EMPTY is returned. hashpos returns
684where the key index should be inserted.
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000685*/
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100686static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400687lookdict(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900688 Py_hash_t hash, PyObject **value_addr, Py_ssize_t *hashpos)
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000689{
INADA Naoki267941c2016-10-06 15:19:07 +0900690 size_t i, mask;
Victor Stinner742da042016-09-07 17:40:12 -0700691 Py_ssize_t ix, freeslot;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200692 int cmp;
Victor Stinner742da042016-09-07 17:40:12 -0700693 PyDictKeysObject *dk;
694 PyDictKeyEntry *ep0, *ep;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000695 PyObject *startkey;
Tim Peterseb28ef22001-06-02 05:27:19 +0000696
Antoine Pitrou9a234902012-05-13 20:48:01 +0200697top:
Victor Stinner742da042016-09-07 17:40:12 -0700698 dk = mp->ma_keys;
699 mask = DK_MASK(dk);
700 ep0 = DK_ENTRIES(dk);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000701 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700702
703 ix = dk_get_index(dk, i);
704 if (ix == DKIX_EMPTY) {
705 if (hashpos != NULL)
706 *hashpos = i;
707 *value_addr = NULL;
708 return DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400709 }
Victor Stinner742da042016-09-07 17:40:12 -0700710 if (ix == DKIX_DUMMY) {
711 freeslot = i;
712 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000713 else {
Victor Stinner742da042016-09-07 17:40:12 -0700714 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300715 assert(ep->me_key != NULL);
Victor Stinner742da042016-09-07 17:40:12 -0700716 if (ep->me_key == key) {
INADA Naokiba609772016-12-07 20:41:42 +0900717 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700718 if (hashpos != NULL)
719 *hashpos = i;
720 return ix;
721 }
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300722 if (ep->me_hash == hash) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000723 startkey = ep->me_key;
724 Py_INCREF(startkey);
725 cmp = PyObject_RichCompareBool(startkey, key, Py_EQ);
726 Py_DECREF(startkey);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +0200727 if (cmp < 0) {
728 *value_addr = NULL;
Victor Stinner742da042016-09-07 17:40:12 -0700729 return DKIX_ERROR;
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +0200730 }
Victor Stinner742da042016-09-07 17:40:12 -0700731 if (dk == mp->ma_keys && ep->me_key == startkey) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400732 if (cmp > 0) {
INADA Naokiba609772016-12-07 20:41:42 +0900733 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700734 if (hashpos != NULL)
735 *hashpos = i;
736 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400737 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000738 }
739 else {
Antoine Pitrou9a234902012-05-13 20:48:01 +0200740 /* The dict was mutated, restart */
741 goto top;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000742 }
743 }
Victor Stinner742da042016-09-07 17:40:12 -0700744 freeslot = -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000745 }
Tim Peters15d49292001-05-27 07:39:22 +0000746
INADA Naoki267941c2016-10-06 15:19:07 +0900747 for (size_t perturb = hash;;) {
748 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700749 i = ((i << 2) + i + perturb + 1) & mask;
750 ix = dk_get_index(dk, i);
751 if (ix == DKIX_EMPTY) {
752 if (hashpos != NULL) {
753 *hashpos = (freeslot == -1) ? (Py_ssize_t)i : freeslot;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400754 }
Victor Stinner742da042016-09-07 17:40:12 -0700755 *value_addr = NULL;
756 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400757 }
Victor Stinner742da042016-09-07 17:40:12 -0700758 if (ix == DKIX_DUMMY) {
759 if (freeslot == -1)
760 freeslot = i;
761 continue;
762 }
763 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300764 assert(ep->me_key != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400765 if (ep->me_key == key) {
Victor Stinner742da042016-09-07 17:40:12 -0700766 if (hashpos != NULL) {
767 *hashpos = i;
768 }
INADA Naokiba609772016-12-07 20:41:42 +0900769 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700770 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400771 }
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300772 if (ep->me_hash == hash) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000773 startkey = ep->me_key;
774 Py_INCREF(startkey);
775 cmp = PyObject_RichCompareBool(startkey, key, Py_EQ);
776 Py_DECREF(startkey);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400777 if (cmp < 0) {
778 *value_addr = NULL;
Victor Stinner742da042016-09-07 17:40:12 -0700779 return DKIX_ERROR;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400780 }
Victor Stinner742da042016-09-07 17:40:12 -0700781 if (dk == mp->ma_keys && ep->me_key == startkey) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400782 if (cmp > 0) {
Victor Stinner742da042016-09-07 17:40:12 -0700783 if (hashpos != NULL) {
784 *hashpos = i;
785 }
INADA Naokiba609772016-12-07 20:41:42 +0900786 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700787 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400788 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000789 }
790 else {
Antoine Pitrou9a234902012-05-13 20:48:01 +0200791 /* The dict was mutated, restart */
792 goto top;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000793 }
794 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000795 }
796 assert(0); /* NOT REACHED */
797 return 0;
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000798}
799
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400800/* Specialized version for string-only keys */
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100801static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400802lookdict_unicode(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900803 Py_hash_t hash, PyObject **value_addr, Py_ssize_t *hashpos)
Fred Drake1bff34a2000-08-31 19:31:38 +0000804{
INADA Naoki267941c2016-10-06 15:19:07 +0900805 size_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200806 size_t mask = DK_MASK(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -0700807 Py_ssize_t ix, freeslot;
808 PyDictKeyEntry *ep, *ep0 = DK_ENTRIES(mp->ma_keys);
Fred Drake1bff34a2000-08-31 19:31:38 +0000809
Victor Stinner742da042016-09-07 17:40:12 -0700810 assert(mp->ma_values == NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000811 /* Make sure this function doesn't have to handle non-unicode keys,
812 including subclasses of str; e.g., one reason to subclass
813 unicodes is to override __eq__, and for speed we don't cater to
814 that here. */
815 if (!PyUnicode_CheckExact(key)) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400816 mp->ma_keys->dk_lookup = lookdict;
Victor Stinner742da042016-09-07 17:40:12 -0700817 return lookdict(mp, key, hash, value_addr, hashpos);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000818 }
Mark Dickinson57e683e2011-09-24 18:18:40 +0100819 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700820 ix = dk_get_index(mp->ma_keys, i);
821 if (ix == DKIX_EMPTY) {
822 if (hashpos != NULL)
823 *hashpos = i;
824 *value_addr = NULL;
825 return DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400826 }
Victor Stinner742da042016-09-07 17:40:12 -0700827 if (ix == DKIX_DUMMY) {
828 freeslot = i;
829 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000830 else {
Victor Stinner742da042016-09-07 17:40:12 -0700831 ep = &ep0[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700832 assert(ep->me_key != NULL);
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300833 if (ep->me_key == key
834 || (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700835 if (hashpos != NULL)
836 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900837 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700838 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400839 }
Victor Stinner742da042016-09-07 17:40:12 -0700840 freeslot = -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000841 }
Tim Peters15d49292001-05-27 07:39:22 +0000842
INADA Naoki267941c2016-10-06 15:19:07 +0900843 for (size_t perturb = hash;;) {
844 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700845 i = mask & ((i << 2) + i + perturb + 1);
846 ix = dk_get_index(mp->ma_keys, i);
847 if (ix == DKIX_EMPTY) {
848 if (hashpos != NULL) {
849 *hashpos = (freeslot == -1) ? (Py_ssize_t)i : freeslot;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400850 }
Victor Stinner742da042016-09-07 17:40:12 -0700851 *value_addr = NULL;
852 return DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400853 }
Victor Stinner742da042016-09-07 17:40:12 -0700854 if (ix == DKIX_DUMMY) {
855 if (freeslot == -1)
856 freeslot = i;
857 continue;
858 }
859 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300860 assert(ep->me_key != NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000861 if (ep->me_key == key
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300862 || (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
INADA Naokiba609772016-12-07 20:41:42 +0900863 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700864 if (hashpos != NULL) {
865 *hashpos = i;
866 }
867 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400868 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000869 }
870 assert(0); /* NOT REACHED */
871 return 0;
Fred Drake1bff34a2000-08-31 19:31:38 +0000872}
873
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400874/* Faster version of lookdict_unicode when it is known that no <dummy> keys
875 * will be present. */
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100876static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400877lookdict_unicode_nodummy(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900878 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700879 Py_ssize_t *hashpos)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400880{
INADA Naoki267941c2016-10-06 15:19:07 +0900881 size_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200882 size_t mask = DK_MASK(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -0700883 Py_ssize_t ix;
884 PyDictKeyEntry *ep, *ep0 = DK_ENTRIES(mp->ma_keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400885
Victor Stinner742da042016-09-07 17:40:12 -0700886 assert(mp->ma_values == NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400887 /* Make sure this function doesn't have to handle non-unicode keys,
888 including subclasses of str; e.g., one reason to subclass
889 unicodes is to override __eq__, and for speed we don't cater to
890 that here. */
891 if (!PyUnicode_CheckExact(key)) {
892 mp->ma_keys->dk_lookup = lookdict;
Victor Stinner742da042016-09-07 17:40:12 -0700893 return lookdict(mp, key, hash, value_addr, hashpos);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400894 }
895 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700896 ix = dk_get_index(mp->ma_keys, i);
897 assert (ix != DKIX_DUMMY);
898 if (ix == DKIX_EMPTY) {
899 if (hashpos != NULL)
900 *hashpos = i;
901 *value_addr = NULL;
902 return DKIX_EMPTY;
903 }
904 ep = &ep0[ix];
Victor Stinnerdee6e252016-09-08 11:16:07 -0700905 assert(ep->me_key != NULL);
906 assert(PyUnicode_CheckExact(ep->me_key));
Victor Stinner742da042016-09-07 17:40:12 -0700907 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400908 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700909 if (hashpos != NULL)
910 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900911 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700912 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400913 }
INADA Naoki267941c2016-10-06 15:19:07 +0900914 for (size_t perturb = hash;;) {
915 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700916 i = mask & ((i << 2) + i + perturb + 1);
917 ix = dk_get_index(mp->ma_keys, i);
918 assert (ix != DKIX_DUMMY);
919 if (ix == DKIX_EMPTY) {
920 if (hashpos != NULL)
921 *hashpos = i;
922 *value_addr = NULL;
923 return DKIX_EMPTY;
924 }
925 ep = &ep0[ix];
926 assert(ep->me_key != NULL && PyUnicode_CheckExact(ep->me_key));
927 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400928 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700929 if (hashpos != NULL)
930 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900931 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700932 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400933 }
934 }
935 assert(0); /* NOT REACHED */
936 return 0;
937}
938
939/* Version of lookdict for split tables.
940 * All split tables and only split tables use this lookup function.
941 * Split tables only contain unicode keys and no dummy keys,
942 * so algorithm is the same as lookdict_unicode_nodummy.
943 */
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100944static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400945lookdict_split(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900946 Py_hash_t hash, PyObject **value_addr, Py_ssize_t *hashpos)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400947{
INADA Naoki267941c2016-10-06 15:19:07 +0900948 size_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200949 size_t mask = DK_MASK(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -0700950 Py_ssize_t ix;
951 PyDictKeyEntry *ep, *ep0 = DK_ENTRIES(mp->ma_keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400952
Victor Stinner742da042016-09-07 17:40:12 -0700953 /* mp must split table */
954 assert(mp->ma_values != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400955 if (!PyUnicode_CheckExact(key)) {
Victor Stinner742da042016-09-07 17:40:12 -0700956 ix = lookdict(mp, key, hash, value_addr, hashpos);
957 if (ix >= 0) {
INADA Naokiba609772016-12-07 20:41:42 +0900958 *value_addr = mp->ma_values[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700959 }
960 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400961 }
Victor Stinner742da042016-09-07 17:40:12 -0700962
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400963 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700964 ix = dk_get_index(mp->ma_keys, i);
965 if (ix == DKIX_EMPTY) {
966 if (hashpos != NULL)
967 *hashpos = i;
968 *value_addr = NULL;
969 return DKIX_EMPTY;
970 }
971 assert(ix >= 0);
972 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300973 assert(ep->me_key != NULL && PyUnicode_CheckExact(ep->me_key));
Victor Stinner742da042016-09-07 17:40:12 -0700974 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400975 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700976 if (hashpos != NULL)
977 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900978 *value_addr = mp->ma_values[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700979 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400980 }
INADA Naoki267941c2016-10-06 15:19:07 +0900981 for (size_t perturb = hash;;) {
982 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700983 i = mask & ((i << 2) + i + perturb + 1);
984 ix = dk_get_index(mp->ma_keys, i);
985 if (ix == DKIX_EMPTY) {
986 if (hashpos != NULL)
987 *hashpos = i;
988 *value_addr = NULL;
989 return DKIX_EMPTY;
990 }
991 assert(ix >= 0);
992 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300993 assert(ep->me_key != NULL && PyUnicode_CheckExact(ep->me_key));
Victor Stinner742da042016-09-07 17:40:12 -0700994 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400995 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700996 if (hashpos != NULL)
997 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900998 *value_addr = mp->ma_values[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700999 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001000 }
1001 }
1002 assert(0); /* NOT REACHED */
1003 return 0;
1004}
1005
Benjamin Petersonfb886362010-04-24 18:21:17 +00001006int
1007_PyDict_HasOnlyStringKeys(PyObject *dict)
1008{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001009 Py_ssize_t pos = 0;
1010 PyObject *key, *value;
Benjamin Petersonf6096542010-11-17 22:33:12 +00001011 assert(PyDict_Check(dict));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001012 /* Shortcut */
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001013 if (((PyDictObject *)dict)->ma_keys->dk_lookup != lookdict)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001014 return 1;
1015 while (PyDict_Next(dict, &pos, &key, &value))
1016 if (!PyUnicode_Check(key))
1017 return 0;
1018 return 1;
Benjamin Petersonfb886362010-04-24 18:21:17 +00001019}
1020
/* Start GC-tracking `mp` if it is not tracked yet and `key` or `value`
 * may itself be tracked by the GC.  `key` and `value` are not evaluated
 * when `mp` is already tracked. */
#define MAINTAIN_TRACKING(mp, key, value) \
    do { \
        if (!_PyObject_GC_IS_TRACKED(mp) && \
            (_PyObject_GC_MAY_BE_TRACKED(key) || \
             _PyObject_GC_MAY_BE_TRACKED(value))) { \
            _PyObject_GC_TRACK(mp); \
        } \
    } while(0)
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001030
1031void
1032_PyDict_MaybeUntrack(PyObject *op)
1033{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001034 PyDictObject *mp;
1035 PyObject *value;
Victor Stinner742da042016-09-07 17:40:12 -07001036 Py_ssize_t i, numentries;
1037 PyDictKeyEntry *ep0;
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001038
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001039 if (!PyDict_CheckExact(op) || !_PyObject_GC_IS_TRACKED(op))
1040 return;
1041
1042 mp = (PyDictObject *) op;
Victor Stinner742da042016-09-07 17:40:12 -07001043 ep0 = DK_ENTRIES(mp->ma_keys);
1044 numentries = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001045 if (_PyDict_HasSplitTable(mp)) {
Victor Stinner742da042016-09-07 17:40:12 -07001046 for (i = 0; i < numentries; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001047 if ((value = mp->ma_values[i]) == NULL)
1048 continue;
1049 if (_PyObject_GC_MAY_BE_TRACKED(value)) {
Victor Stinner742da042016-09-07 17:40:12 -07001050 assert(!_PyObject_GC_MAY_BE_TRACKED(ep0[i].me_key));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001051 return;
1052 }
1053 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001054 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001055 else {
Victor Stinner742da042016-09-07 17:40:12 -07001056 for (i = 0; i < numentries; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001057 if ((value = ep0[i].me_value) == NULL)
1058 continue;
1059 if (_PyObject_GC_MAY_BE_TRACKED(value) ||
1060 _PyObject_GC_MAY_BE_TRACKED(ep0[i].me_key))
1061 return;
1062 }
1063 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001064 _PyObject_GC_UNTRACK(op);
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001065}
1066
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001067/* Internal function to find slot for an item from its hash
Victor Stinner3c336c52016-09-12 14:17:40 +02001068 when it is known that the key is not present in the dict.
1069
1070 The dict must be combined. */
INADA Naokiba609772016-12-07 20:41:42 +09001071static Py_ssize_t
1072find_empty_slot(PyDictKeysObject *keys, PyObject *key, Py_hash_t hash)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001073{
INADA Naoki267941c2016-10-06 15:19:07 +09001074 size_t i;
INADA Naokiba609772016-12-07 20:41:42 +09001075 size_t mask = DK_MASK(keys);
Victor Stinner742da042016-09-07 17:40:12 -07001076 Py_ssize_t ix;
Tim Peters6d6c1a32001-08-02 04:15:00 +00001077
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001078 assert(key != NULL);
Victor Stinner3c336c52016-09-12 14:17:40 +02001079
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001080 i = hash & mask;
INADA Naokiba609772016-12-07 20:41:42 +09001081 ix = dk_get_index(keys, i);
INADA Naoki267941c2016-10-06 15:19:07 +09001082 for (size_t perturb = hash; ix != DKIX_EMPTY;) {
1083 perturb >>= PERTURB_SHIFT;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001084 i = (i << 2) + i + perturb + 1;
INADA Naokiba609772016-12-07 20:41:42 +09001085 ix = dk_get_index(keys, i & mask);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001086 }
INADA Naokiba609772016-12-07 20:41:42 +09001087 assert(DK_ENTRIES(keys)[keys->dk_nentries].me_value == NULL);
1088 return i & mask;
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001089}
1090
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001091static int
1092insertion_resize(PyDictObject *mp)
1093{
Raymond Hettinger36f74aa2013-05-17 03:01:13 -07001094 return dictresize(mp, GROWTH_RATE(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001095}
Antoine Pitroue965d972012-02-27 00:45:12 +01001096
1097/*
1098Internal routine to insert a new item into the table.
1099Used both by the internal resize routine and by the public insert routine.
Antoine Pitroue965d972012-02-27 00:45:12 +01001100Returns -1 if an error occurred, or 0 on success.
1101*/
1102static int
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001103insertdict(PyDictObject *mp, PyObject *key, Py_hash_t hash, PyObject *value)
Antoine Pitroue965d972012-02-27 00:45:12 +01001104{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001105 PyObject *old_value;
INADA Naokiba609772016-12-07 20:41:42 +09001106 PyDictKeyEntry *ep;
Victor Stinner742da042016-09-07 17:40:12 -07001107 Py_ssize_t hashpos, ix;
Antoine Pitroue965d972012-02-27 00:45:12 +01001108
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001109 if (mp->ma_values != NULL && !PyUnicode_CheckExact(key)) {
1110 if (insertion_resize(mp) < 0)
1111 return -1;
1112 }
1113
INADA Naokiba609772016-12-07 20:41:42 +09001114 ix = mp->ma_keys->dk_lookup(mp, key, hash, &old_value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07001115 if (ix == DKIX_ERROR) {
Antoine Pitroue965d972012-02-27 00:45:12 +01001116 return -1;
1117 }
Victor Stinner742da042016-09-07 17:40:12 -07001118
Antoine Pitroud6967322014-10-18 00:35:00 +02001119 assert(PyUnicode_CheckExact(key) || mp->ma_keys->dk_lookup == lookdict);
Benjamin Petersona6f195e2012-04-30 10:23:40 -04001120 Py_INCREF(value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001121 MAINTAIN_TRACKING(mp, key, value);
Victor Stinner742da042016-09-07 17:40:12 -07001122
1123 /* When insertion order is different from shared key, we can't share
1124 * the key anymore. Convert this instance to combine table.
1125 */
1126 if (_PyDict_HasSplitTable(mp) &&
INADA Naokiba609772016-12-07 20:41:42 +09001127 ((ix >= 0 && old_value == NULL && mp->ma_used != ix) ||
Victor Stinner742da042016-09-07 17:40:12 -07001128 (ix == DKIX_EMPTY && mp->ma_used != mp->ma_keys->dk_nentries))) {
1129 if (insertion_resize(mp) < 0) {
1130 Py_DECREF(value);
1131 return -1;
1132 }
INADA Naokiba609772016-12-07 20:41:42 +09001133 hashpos = find_empty_slot(mp->ma_keys, key, hash);
Victor Stinner742da042016-09-07 17:40:12 -07001134 ix = DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001135 }
Victor Stinner742da042016-09-07 17:40:12 -07001136
1137 if (ix == DKIX_EMPTY) {
1138 /* Insert into new slot. */
INADA Naokiba609772016-12-07 20:41:42 +09001139 assert(old_value == NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001140 if (mp->ma_keys->dk_usable <= 0) {
1141 /* Need to resize. */
1142 if (insertion_resize(mp) < 0) {
1143 Py_DECREF(value);
1144 return -1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001145 }
INADA Naokiba609772016-12-07 20:41:42 +09001146 hashpos = find_empty_slot(mp->ma_keys, key, hash);
Victor Stinner742da042016-09-07 17:40:12 -07001147 }
INADA Naokiba609772016-12-07 20:41:42 +09001148 ep = &DK_ENTRIES(mp->ma_keys)[mp->ma_keys->dk_nentries];
Victor Stinner742da042016-09-07 17:40:12 -07001149 dk_set_index(mp->ma_keys, hashpos, mp->ma_keys->dk_nentries);
1150 Py_INCREF(key);
1151 ep->me_key = key;
1152 ep->me_hash = hash;
1153 if (mp->ma_values) {
1154 assert (mp->ma_values[mp->ma_keys->dk_nentries] == NULL);
1155 mp->ma_values[mp->ma_keys->dk_nentries] = value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001156 }
1157 else {
Victor Stinner742da042016-09-07 17:40:12 -07001158 ep->me_value = value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001159 }
1160 mp->ma_used++;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001161 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner742da042016-09-07 17:40:12 -07001162 mp->ma_keys->dk_usable--;
1163 mp->ma_keys->dk_nentries++;
1164 assert(mp->ma_keys->dk_usable >= 0);
Victor Stinner611b0fa2016-09-14 15:02:01 +02001165 assert(_PyDict_CheckConsistency(mp));
Victor Stinner742da042016-09-07 17:40:12 -07001166 return 0;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001167 }
Victor Stinner742da042016-09-07 17:40:12 -07001168
INADA Naokiba609772016-12-07 20:41:42 +09001169 if (_PyDict_HasSplitTable(mp)) {
1170 mp->ma_values[ix] = value;
1171 if (old_value == NULL) {
1172 /* pending state */
1173 assert(ix == mp->ma_used);
1174 mp->ma_used++;
1175 }
1176 }
1177 else {
1178 assert(old_value != NULL);
1179 DK_ENTRIES(mp->ma_keys)[ix].me_value = value;
Victor Stinner742da042016-09-07 17:40:12 -07001180 }
1181
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001182 mp->ma_version_tag = DICT_NEXT_VERSION();
INADA Naokiba609772016-12-07 20:41:42 +09001183 Py_XDECREF(old_value); /* which **CAN** re-enter (see issue #22653) */
Victor Stinner611b0fa2016-09-14 15:02:01 +02001184 assert(_PyDict_CheckConsistency(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001185 return 0;
Antoine Pitroue965d972012-02-27 00:45:12 +01001186}
1187
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001188/*
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001189Internal routine used by dictresize() to buid a hashtable of entries.
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001190*/
1191static void
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001192build_indices(PyDictKeysObject *keys, PyDictKeyEntry *ep, Py_ssize_t n)
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001193{
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001194 size_t mask = (size_t)DK_SIZE(keys) - 1;
1195 for (Py_ssize_t ix = 0; ix != n; ix++, ep++) {
1196 Py_hash_t hash = ep->me_hash;
1197 size_t i = hash & mask;
1198 for (size_t perturb = hash; dk_get_index(keys, i) != DKIX_EMPTY;) {
1199 perturb >>= PERTURB_SHIFT;
1200 i = mask & ((i << 2) + i + perturb + 1);
1201 }
1202 dk_set_index(keys, i, ix);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001203 }
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001204}
1205
1206/*
1207Restructure the table by allocating a new table and reinserting all
1208items again. When entries have been deleted, the new table may
1209actually be smaller than the old one.
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001210If a table is split (its keys and hashes are shared, its values are not),
1211then the values are temporarily copied into the table, it is resized as
1212a combined table, then the me_value slots in the old table are NULLed out.
1213After resizing a table is always combined,
1214but can be resplit by make_keys_shared().
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001215*/
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001216static int
Victor Stinner3d3f2642016-12-15 17:21:23 +01001217dictresize(PyDictObject *mp, Py_ssize_t minsize)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001218{
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001219 Py_ssize_t newsize, numentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001220 PyDictKeysObject *oldkeys;
1221 PyObject **oldvalues;
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001222 PyDictKeyEntry *oldentries, *newentries;
Tim Peters91a364d2001-05-19 07:04:38 +00001223
Victor Stinner742da042016-09-07 17:40:12 -07001224 /* Find the smallest table size > minused. */
1225 for (newsize = PyDict_MINSIZE;
Victor Stinner3d3f2642016-12-15 17:21:23 +01001226 newsize < minsize && newsize > 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001227 newsize <<= 1)
1228 ;
1229 if (newsize <= 0) {
1230 PyErr_NoMemory();
1231 return -1;
1232 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001233
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001234 oldkeys = mp->ma_keys;
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001235
1236 /* NOTE: Current odict checks mp->ma_keys to detect resize happen.
1237 * So we can't reuse oldkeys even if oldkeys->dk_size == newsize.
1238 * TODO: Try reusing oldkeys when reimplement odict.
1239 */
1240
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001241 /* Allocate a new table. */
1242 mp->ma_keys = new_keys_object(newsize);
1243 if (mp->ma_keys == NULL) {
1244 mp->ma_keys = oldkeys;
1245 return -1;
1246 }
Victor Stinner3d3f2642016-12-15 17:21:23 +01001247 // New table must be large enough.
1248 assert(mp->ma_keys->dk_usable >= mp->ma_used);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001249 if (oldkeys->dk_lookup == lookdict)
1250 mp->ma_keys->dk_lookup = lookdict;
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001251
1252 numentries = mp->ma_used;
1253 oldentries = DK_ENTRIES(oldkeys);
1254 newentries = DK_ENTRIES(mp->ma_keys);
1255 oldvalues = mp->ma_values;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001256 if (oldvalues != NULL) {
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001257 /* Convert split table into new combined table.
1258 * We must incref keys; we can transfer values.
1259 * Note that values of split table is always dense.
1260 */
1261 for (Py_ssize_t i = 0; i < numentries; i++) {
1262 assert(oldvalues[i] != NULL);
1263 PyDictKeyEntry *ep = &oldentries[i];
1264 PyObject *key = ep->me_key;
1265 Py_INCREF(key);
1266 newentries[i].me_key = key;
1267 newentries[i].me_hash = ep->me_hash;
1268 newentries[i].me_value = oldvalues[i];
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001269 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001270
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001271 DK_DECREF(oldkeys);
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001272 mp->ma_values = NULL;
Victor Stinner742da042016-09-07 17:40:12 -07001273 if (oldvalues != empty_values) {
1274 free_values(oldvalues);
1275 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001276 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001277 else { // combined table.
1278 if (oldkeys->dk_nentries == numentries) {
1279 memcpy(newentries, oldentries, numentries * sizeof(PyDictKeyEntry));
1280 }
1281 else {
1282 PyDictKeyEntry *ep = oldentries;
1283 for (Py_ssize_t i = 0; i < numentries; i++) {
1284 while (ep->me_value == NULL)
1285 ep++;
1286 newentries[i] = *ep++;
1287 }
1288 }
1289
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001290 assert(oldkeys->dk_lookup != lookdict_split);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001291 assert(oldkeys->dk_refcnt == 1);
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001292 if (oldkeys->dk_size == PyDict_MINSIZE &&
1293 numfreekeys < PyDict_MAXFREELIST) {
1294 DK_DEBUG_DECREF keys_free_list[numfreekeys++] = oldkeys;
1295 }
1296 else {
1297 DK_DEBUG_DECREF PyObject_FREE(oldkeys);
1298 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001299 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001300
1301 build_indices(mp->ma_keys, newentries, numentries);
1302 mp->ma_keys->dk_usable -= numentries;
1303 mp->ma_keys->dk_nentries = numentries;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001304 return 0;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001305}
1306
Benjamin Peterson15ee8212012-04-24 14:44:18 -04001307/* Returns NULL if unable to split table.
1308 * A NULL return does not necessarily indicate an error */
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001309static PyDictKeysObject *
1310make_keys_shared(PyObject *op)
1311{
1312 Py_ssize_t i;
1313 Py_ssize_t size;
1314 PyDictObject *mp = (PyDictObject *)op;
1315
Benjamin Peterson15ee8212012-04-24 14:44:18 -04001316 if (!PyDict_CheckExact(op))
1317 return NULL;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001318 if (!_PyDict_HasSplitTable(mp)) {
1319 PyDictKeyEntry *ep0;
1320 PyObject **values;
1321 assert(mp->ma_keys->dk_refcnt == 1);
1322 if (mp->ma_keys->dk_lookup == lookdict) {
1323 return NULL;
1324 }
1325 else if (mp->ma_keys->dk_lookup == lookdict_unicode) {
1326 /* Remove dummy keys */
1327 if (dictresize(mp, DK_SIZE(mp->ma_keys)))
1328 return NULL;
1329 }
1330 assert(mp->ma_keys->dk_lookup == lookdict_unicode_nodummy);
1331 /* Copy values into a new array */
Victor Stinner742da042016-09-07 17:40:12 -07001332 ep0 = DK_ENTRIES(mp->ma_keys);
1333 size = USABLE_FRACTION(DK_SIZE(mp->ma_keys));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001334 values = new_values(size);
1335 if (values == NULL) {
1336 PyErr_SetString(PyExc_MemoryError,
1337 "Not enough memory to allocate new values array");
1338 return NULL;
1339 }
1340 for (i = 0; i < size; i++) {
1341 values[i] = ep0[i].me_value;
1342 ep0[i].me_value = NULL;
1343 }
1344 mp->ma_keys->dk_lookup = lookdict_split;
1345 mp->ma_values = values;
1346 }
1347 DK_INCREF(mp->ma_keys);
1348 return mp->ma_keys;
1349}
Christian Heimes99170a52007-12-19 02:07:34 +00001350
1351PyObject *
1352_PyDict_NewPresized(Py_ssize_t minused)
1353{
INADA Naoki92c50ee2016-11-22 00:57:02 +09001354 const Py_ssize_t max_presize = 128 * 1024;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001355 Py_ssize_t newsize;
1356 PyDictKeysObject *new_keys;
INADA Naoki92c50ee2016-11-22 00:57:02 +09001357
1358 /* There are no strict guarantee that returned dict can contain minused
1359 * items without resize. So we create medium size dict instead of very
1360 * large dict or MemoryError.
1361 */
1362 if (minused > USABLE_FRACTION(max_presize)) {
1363 newsize = max_presize;
1364 }
1365 else {
1366 Py_ssize_t minsize = ESTIMATE_SIZE(minused);
1367 newsize = PyDict_MINSIZE;
1368 while (newsize < minsize) {
1369 newsize <<= 1;
1370 }
1371 }
1372 assert(IS_POWER_OF_2(newsize));
1373
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001374 new_keys = new_keys_object(newsize);
1375 if (new_keys == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001376 return NULL;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001377 return new_dict(new_keys, NULL);
Christian Heimes99170a52007-12-19 02:07:34 +00001378}
1379
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001380/* Note that, for historical reasons, PyDict_GetItem() suppresses all errors
1381 * that may occur (originally dicts supported only string keys, and exceptions
1382 * weren't possible). So, while the original intent was that a NULL return
Thomas Wouters0e3f5912006-08-11 14:57:12 +00001383 * meant the key wasn't present, in reality it can mean that, or that an error
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001384 * (suppressed) occurred while computing the key's hash, or that some error
1385 * (suppressed) occurred when comparing keys in the dict's internal probe
1386 * sequence. A nasty example of the latter is when a Python-coded comparison
1387 * function hits a stack-depth error, which can cause this to return NULL
1388 * even if the key is present.
1389 */
Guido van Rossumc0b618a1997-05-02 03:12:38 +00001390PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00001391PyDict_GetItem(PyObject *op, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001392{
Benjamin Peterson8f67d082010-10-17 20:54:53 +00001393 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07001394 Py_ssize_t ix;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001395 PyDictObject *mp = (PyDictObject *)op;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001396 PyThreadState *tstate;
INADA Naokiba609772016-12-07 20:41:42 +09001397 PyObject *value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001398
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001399 if (!PyDict_Check(op))
1400 return NULL;
1401 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02001402 (hash = ((PyASCIIObject *) key)->hash) == -1)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001403 {
1404 hash = PyObject_Hash(key);
1405 if (hash == -1) {
1406 PyErr_Clear();
1407 return NULL;
1408 }
1409 }
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001410
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001411 /* We can arrive here with a NULL tstate during initialization: try
1412 running "python -Wi" for an example related to string interning.
1413 Let's just hope that no exception occurs then... This must be
1414 _PyThreadState_Current and not PyThreadState_GET() because in debug
1415 mode, the latter complains if tstate is NULL. */
Victor Stinner0cae6092016-11-11 01:43:56 +01001416 tstate = PyThreadState_GET();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001417 if (tstate != NULL && tstate->curexc_type != NULL) {
1418 /* preserve the existing exception */
1419 PyObject *err_type, *err_value, *err_tb;
1420 PyErr_Fetch(&err_type, &err_value, &err_tb);
INADA Naokiba609772016-12-07 20:41:42 +09001421 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001422 /* ignore errors */
1423 PyErr_Restore(err_type, err_value, err_tb);
Victor Stinner742da042016-09-07 17:40:12 -07001424 if (ix < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001425 return NULL;
1426 }
1427 else {
INADA Naokiba609772016-12-07 20:41:42 +09001428 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001429 if (ix < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001430 PyErr_Clear();
1431 return NULL;
1432 }
1433 }
INADA Naokiba609772016-12-07 20:41:42 +09001434 return value;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001435}
1436
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001437/* Same as PyDict_GetItemWithError() but with hash supplied by caller.
1438 This returns NULL *with* an exception set if an exception occurred.
1439 It returns NULL *without* an exception set if the key wasn't present.
1440*/
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001441PyObject *
1442_PyDict_GetItem_KnownHash(PyObject *op, PyObject *key, Py_hash_t hash)
1443{
Victor Stinner742da042016-09-07 17:40:12 -07001444 Py_ssize_t ix;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001445 PyDictObject *mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09001446 PyObject *value;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001447
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001448 if (!PyDict_Check(op)) {
1449 PyErr_BadInternalCall();
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001450 return NULL;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001451 }
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001452
INADA Naokiba609772016-12-07 20:41:42 +09001453 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001454 if (ix < 0) {
1455 return NULL;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001456 }
INADA Naokiba609772016-12-07 20:41:42 +09001457 return value;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001458}
1459
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001460/* Variant of PyDict_GetItem() that doesn't suppress exceptions.
1461 This returns NULL *with* an exception set if an exception occurred.
1462 It returns NULL *without* an exception set if the key wasn't present.
1463*/
1464PyObject *
1465PyDict_GetItemWithError(PyObject *op, PyObject *key)
1466{
Victor Stinner742da042016-09-07 17:40:12 -07001467 Py_ssize_t ix;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00001468 Py_hash_t hash;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001469 PyDictObject*mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09001470 PyObject *value;
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001471
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001472 if (!PyDict_Check(op)) {
1473 PyErr_BadInternalCall();
1474 return NULL;
1475 }
1476 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02001477 (hash = ((PyASCIIObject *) key)->hash) == -1)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001478 {
1479 hash = PyObject_Hash(key);
1480 if (hash == -1) {
1481 return NULL;
1482 }
1483 }
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001484
INADA Naokiba609772016-12-07 20:41:42 +09001485 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001486 if (ix < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001487 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001488 return value;
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001489}
1490
Brett Cannonfd074152012-04-14 14:10:13 -04001491PyObject *
1492_PyDict_GetItemIdWithError(PyObject *dp, struct _Py_Identifier *key)
1493{
1494 PyObject *kv;
1495 kv = _PyUnicode_FromId(key); /* borrowed */
1496 if (kv == NULL)
1497 return NULL;
1498 return PyDict_GetItemWithError(dp, kv);
1499}
1500
Victor Stinnerb4efc962015-11-20 09:24:02 +01001501/* Fast version of global value lookup (LOAD_GLOBAL).
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001502 * Lookup in globals, then builtins.
Victor Stinnerb4efc962015-11-20 09:24:02 +01001503 *
1504 * Raise an exception and return NULL if an error occurred (ex: computing the
1505 * key hash failed, key comparison failed, ...). Return NULL if the key doesn't
1506 * exist. Return the value if the key exists.
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001507 */
1508PyObject *
1509_PyDict_LoadGlobal(PyDictObject *globals, PyDictObject *builtins, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001510{
Victor Stinner742da042016-09-07 17:40:12 -07001511 Py_ssize_t ix;
Victor Stinnerb4efc962015-11-20 09:24:02 +01001512 Py_hash_t hash;
INADA Naokiba609772016-12-07 20:41:42 +09001513 PyObject *value;
Victor Stinnerb4efc962015-11-20 09:24:02 +01001514
1515 if (!PyUnicode_CheckExact(key) ||
1516 (hash = ((PyASCIIObject *) key)->hash) == -1)
1517 {
1518 hash = PyObject_Hash(key);
1519 if (hash == -1)
1520 return NULL;
Antoine Pitroue965d972012-02-27 00:45:12 +01001521 }
Victor Stinnerb4efc962015-11-20 09:24:02 +01001522
1523 /* namespace 1: globals */
INADA Naokiba609772016-12-07 20:41:42 +09001524 ix = globals->ma_keys->dk_lookup(globals, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001525 if (ix == DKIX_ERROR)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001526 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001527 if (ix != DKIX_EMPTY && value != NULL)
1528 return value;
Victor Stinnerb4efc962015-11-20 09:24:02 +01001529
1530 /* namespace 2: builtins */
INADA Naokiba609772016-12-07 20:41:42 +09001531 ix = builtins->ma_keys->dk_lookup(builtins, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001532 if (ix < 0)
Victor Stinnerb4efc962015-11-20 09:24:02 +01001533 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001534 return value;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001535}
1536
Antoine Pitroue965d972012-02-27 00:45:12 +01001537/* CAUTION: PyDict_SetItem() must guarantee that it won't resize the
1538 * dictionary if it's merely replacing the value for an existing key.
1539 * This means that it's safe to loop over a dictionary with PyDict_Next()
1540 * and occasionally replace a value -- but you can't insert new keys or
1541 * remove them.
1542 */
1543int
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001544PyDict_SetItem(PyObject *op, PyObject *key, PyObject *value)
Antoine Pitroue965d972012-02-27 00:45:12 +01001545{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001546 PyDictObject *mp;
1547 Py_hash_t hash;
Antoine Pitroue965d972012-02-27 00:45:12 +01001548 if (!PyDict_Check(op)) {
1549 PyErr_BadInternalCall();
1550 return -1;
1551 }
1552 assert(key);
1553 assert(value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001554 mp = (PyDictObject *)op;
1555 if (!PyUnicode_CheckExact(key) ||
1556 (hash = ((PyASCIIObject *) key)->hash) == -1)
1557 {
Antoine Pitroue965d972012-02-27 00:45:12 +01001558 hash = PyObject_Hash(key);
1559 if (hash == -1)
1560 return -1;
1561 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001562
1563 /* insertdict() handles any resizing that might be necessary */
1564 return insertdict(mp, key, hash, value);
Antoine Pitroue965d972012-02-27 00:45:12 +01001565}
1566
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001567int
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001568_PyDict_SetItem_KnownHash(PyObject *op, PyObject *key, PyObject *value,
1569 Py_hash_t hash)
1570{
1571 PyDictObject *mp;
1572
1573 if (!PyDict_Check(op)) {
1574 PyErr_BadInternalCall();
1575 return -1;
1576 }
1577 assert(key);
1578 assert(value);
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001579 assert(hash != -1);
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001580 mp = (PyDictObject *)op;
1581
1582 /* insertdict() handles any resizing that might be necessary */
1583 return insertdict(mp, key, hash, value);
1584}
1585
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001586static int
Antoine Pitroud741ed42016-12-27 14:23:43 +01001587delitem_common(PyDictObject *mp, Py_ssize_t hashpos, Py_ssize_t ix,
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001588 PyObject *old_value)
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001589{
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001590 PyObject *old_key;
Antoine Pitroud741ed42016-12-27 14:23:43 +01001591 PyDictKeyEntry *ep;
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001592
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001593 mp->ma_used--;
Antoine Pitroud741ed42016-12-27 14:23:43 +01001594 mp->ma_version_tag = DICT_NEXT_VERSION();
1595 ep = &DK_ENTRIES(mp->ma_keys)[ix];
1596 dk_set_index(mp->ma_keys, hashpos, DKIX_DUMMY);
1597 ENSURE_ALLOWS_DELETIONS(mp);
1598 old_key = ep->me_key;
1599 ep->me_key = NULL;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001600 ep->me_value = NULL;
Antoine Pitroud741ed42016-12-27 14:23:43 +01001601 Py_DECREF(old_key);
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001602 Py_DECREF(old_value);
Antoine Pitroud741ed42016-12-27 14:23:43 +01001603
1604 assert(_PyDict_CheckConsistency(mp));
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001605 return 0;
1606}
1607
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001608int
Tim Peters1f5871e2000-07-04 17:44:48 +00001609PyDict_DelItem(PyObject *op, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001610{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001611 Py_hash_t hash;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001612 assert(key);
1613 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02001614 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001615 hash = PyObject_Hash(key);
1616 if (hash == -1)
1617 return -1;
1618 }
Victor Stinner742da042016-09-07 17:40:12 -07001619
1620 return _PyDict_DelItem_KnownHash(op, key, hash);
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001621}
1622
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001623int
1624_PyDict_DelItem_KnownHash(PyObject *op, PyObject *key, Py_hash_t hash)
1625{
Victor Stinner742da042016-09-07 17:40:12 -07001626 Py_ssize_t hashpos, ix;
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001627 PyDictObject *mp;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001628 PyObject *old_value;
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001629
1630 if (!PyDict_Check(op)) {
1631 PyErr_BadInternalCall();
1632 return -1;
1633 }
1634 assert(key);
1635 assert(hash != -1);
1636 mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09001637 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07001638 if (ix == DKIX_ERROR)
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001639 return -1;
INADA Naokiba609772016-12-07 20:41:42 +09001640 if (ix == DKIX_EMPTY || old_value == NULL) {
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001641 _PyErr_SetKeyError(key);
1642 return -1;
1643 }
Victor Stinner742da042016-09-07 17:40:12 -07001644 assert(dk_get_index(mp->ma_keys, hashpos) == ix);
Victor Stinner78601a32016-09-09 19:28:36 -07001645
1646 // Split table doesn't allow deletion. Combine it.
1647 if (_PyDict_HasSplitTable(mp)) {
1648 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
1649 return -1;
1650 }
INADA Naokiba609772016-12-07 20:41:42 +09001651 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner78601a32016-09-09 19:28:36 -07001652 assert(ix >= 0);
1653 }
1654
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001655 return delitem_common(mp, hashpos, ix, old_value);
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001656}
1657
Antoine Pitroud741ed42016-12-27 14:23:43 +01001658/* This function promises that the predicate -> deletion sequence is atomic
1659 * (i.e. protected by the GIL), assuming the predicate itself doesn't
1660 * release the GIL.
1661 */
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001662int
1663_PyDict_DelItemIf(PyObject *op, PyObject *key,
1664 int (*predicate)(PyObject *value))
1665{
Antoine Pitroud741ed42016-12-27 14:23:43 +01001666 Py_ssize_t hashpos, ix;
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001667 PyDictObject *mp;
1668 Py_hash_t hash;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001669 PyObject *old_value;
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001670 int res;
1671
1672 if (!PyDict_Check(op)) {
1673 PyErr_BadInternalCall();
1674 return -1;
1675 }
1676 assert(key);
1677 hash = PyObject_Hash(key);
1678 if (hash == -1)
1679 return -1;
1680 mp = (PyDictObject *)op;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001681 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Antoine Pitroud741ed42016-12-27 14:23:43 +01001682 if (ix == DKIX_ERROR)
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001683 return -1;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001684 if (ix == DKIX_EMPTY || old_value == NULL) {
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001685 _PyErr_SetKeyError(key);
1686 return -1;
1687 }
Antoine Pitroud741ed42016-12-27 14:23:43 +01001688 assert(dk_get_index(mp->ma_keys, hashpos) == ix);
1689
1690 // Split table doesn't allow deletion. Combine it.
1691 if (_PyDict_HasSplitTable(mp)) {
1692 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
1693 return -1;
1694 }
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001695 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Antoine Pitroud741ed42016-12-27 14:23:43 +01001696 assert(ix >= 0);
1697 }
1698
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001699 res = predicate(old_value);
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001700 if (res == -1)
1701 return -1;
1702 if (res > 0)
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001703 return delitem_common(mp, hashpos, ix, old_value);
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001704 else
1705 return 0;
1706}
1707
1708
Guido van Rossum25831651993-05-19 14:50:45 +00001709void
Tim Peters1f5871e2000-07-04 17:44:48 +00001710PyDict_Clear(PyObject *op)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001711{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001712 PyDictObject *mp;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001713 PyDictKeysObject *oldkeys;
1714 PyObject **oldvalues;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001715 Py_ssize_t i, n;
Tim Petersdea48ec2001-05-22 20:40:22 +00001716
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001717 if (!PyDict_Check(op))
1718 return;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001719 mp = ((PyDictObject *)op);
1720 oldkeys = mp->ma_keys;
1721 oldvalues = mp->ma_values;
1722 if (oldvalues == empty_values)
1723 return;
1724 /* Empty the dict... */
1725 DK_INCREF(Py_EMPTY_KEYS);
1726 mp->ma_keys = Py_EMPTY_KEYS;
1727 mp->ma_values = empty_values;
1728 mp->ma_used = 0;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001729 mp->ma_version_tag = DICT_NEXT_VERSION();
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001730 /* ...then clear the keys and values */
1731 if (oldvalues != NULL) {
Victor Stinner742da042016-09-07 17:40:12 -07001732 n = oldkeys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001733 for (i = 0; i < n; i++)
1734 Py_CLEAR(oldvalues[i]);
1735 free_values(oldvalues);
1736 DK_DECREF(oldkeys);
1737 }
1738 else {
1739 assert(oldkeys->dk_refcnt == 1);
Antoine Pitrou2d169b22012-05-12 23:43:44 +02001740 DK_DECREF(oldkeys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001741 }
Victor Stinner611b0fa2016-09-14 15:02:01 +02001742 assert(_PyDict_CheckConsistency(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001743}
1744
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001745/* Internal version of PyDict_Next that returns a hash value in addition
1746 * to the key and value.
1747 * Return 1 on success, return 0 when the reached the end of the dictionary
1748 * (or if op is not a dictionary)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001749 */
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001750int
1751_PyDict_Next(PyObject *op, Py_ssize_t *ppos, PyObject **pkey,
1752 PyObject **pvalue, Py_hash_t *phash)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001753{
INADA Naokica2d8be2016-11-04 16:59:10 +09001754 Py_ssize_t i;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001755 PyDictObject *mp;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001756 PyDictKeyEntry *entry_ptr;
1757 PyObject *value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001758
1759 if (!PyDict_Check(op))
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001760 return 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001761 mp = (PyDictObject *)op;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001762 i = *ppos;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001763 if (mp->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09001764 if (i < 0 || i >= mp->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001765 return 0;
INADA Naokica2d8be2016-11-04 16:59:10 +09001766 /* values of split table is always dense */
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001767 entry_ptr = &DK_ENTRIES(mp->ma_keys)[i];
INADA Naokica2d8be2016-11-04 16:59:10 +09001768 value = mp->ma_values[i];
1769 assert(value != NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001770 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001771 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09001772 Py_ssize_t n = mp->ma_keys->dk_nentries;
1773 if (i < 0 || i >= n)
1774 return 0;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001775 entry_ptr = &DK_ENTRIES(mp->ma_keys)[i];
1776 while (i < n && entry_ptr->me_value == NULL) {
1777 entry_ptr++;
1778 i++;
Victor Stinner742da042016-09-07 17:40:12 -07001779 }
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001780 if (i >= n)
1781 return 0;
1782 value = entry_ptr->me_value;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001783 }
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001784 *ppos = i+1;
1785 if (pkey)
1786 *pkey = entry_ptr->me_key;
1787 if (phash)
1788 *phash = entry_ptr->me_hash;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001789 if (pvalue)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001790 *pvalue = value;
1791 return 1;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001792}
1793
Tim Peters080c88b2003-02-15 03:01:11 +00001794/*
1795 * Iterate over a dict. Use like so:
1796 *
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001797 * Py_ssize_t i;
Tim Peters080c88b2003-02-15 03:01:11 +00001798 * PyObject *key, *value;
1799 * i = 0; # important! i should not otherwise be changed by you
Neal Norwitz07323012003-02-15 14:45:12 +00001800 * while (PyDict_Next(yourdict, &i, &key, &value)) {
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001801 * Refer to borrowed references in key and value.
Tim Peters080c88b2003-02-15 03:01:11 +00001802 * }
1803 *
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001804 * Return 1 on success, return 0 when the reached the end of the dictionary
1805 * (or if op is not a dictionary)
1806 *
Tim Peters080c88b2003-02-15 03:01:11 +00001807 * CAUTION: In general, it isn't safe to use PyDict_Next in a loop that
Tim Peters67830702001-03-21 19:23:56 +00001808 * mutates the dict. One exception: it is safe if the loop merely changes
1809 * the values associated with the keys (but doesn't insert new keys or
1810 * delete keys), via PyDict_SetItem().
1811 */
Guido van Rossum25831651993-05-19 14:50:45 +00001812int
Martin v. Löwis18e16552006-02-15 17:27:45 +00001813PyDict_Next(PyObject *op, Py_ssize_t *ppos, PyObject **pkey, PyObject **pvalue)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001814{
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001815 return _PyDict_Next(op, ppos, pkey, pvalue, NULL);
Thomas Wouterscf297e42007-02-23 15:07:44 +00001816}
1817
Eric Snow96c6af92015-05-29 22:21:39 -06001818/* Internal version of dict.pop(). */
1819PyObject *
Serhiy Storchaka42e1ea92017-01-12 19:12:21 +02001820_PyDict_Pop_KnownHash(PyObject *dict, PyObject *key, Py_hash_t hash, PyObject *deflt)
Eric Snow96c6af92015-05-29 22:21:39 -06001821{
Victor Stinner742da042016-09-07 17:40:12 -07001822 Py_ssize_t ix, hashpos;
Eric Snow96c6af92015-05-29 22:21:39 -06001823 PyObject *old_value, *old_key;
1824 PyDictKeyEntry *ep;
Yury Selivanov684ef2c2016-10-28 19:01:21 -04001825 PyDictObject *mp;
1826
1827 assert(PyDict_Check(dict));
1828 mp = (PyDictObject *)dict;
Eric Snow96c6af92015-05-29 22:21:39 -06001829
1830 if (mp->ma_used == 0) {
1831 if (deflt) {
1832 Py_INCREF(deflt);
1833 return deflt;
1834 }
1835 _PyErr_SetKeyError(key);
1836 return NULL;
1837 }
INADA Naokiba609772016-12-07 20:41:42 +09001838 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07001839 if (ix == DKIX_ERROR)
Eric Snow96c6af92015-05-29 22:21:39 -06001840 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001841 if (ix == DKIX_EMPTY || old_value == NULL) {
Eric Snow96c6af92015-05-29 22:21:39 -06001842 if (deflt) {
1843 Py_INCREF(deflt);
1844 return deflt;
1845 }
1846 _PyErr_SetKeyError(key);
1847 return NULL;
1848 }
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001849
Victor Stinner78601a32016-09-09 19:28:36 -07001850 // Split table doesn't allow deletion. Combine it.
1851 if (_PyDict_HasSplitTable(mp)) {
1852 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
1853 return NULL;
1854 }
INADA Naokiba609772016-12-07 20:41:42 +09001855 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner78601a32016-09-09 19:28:36 -07001856 assert(ix >= 0);
1857 }
1858
Victor Stinner78601a32016-09-09 19:28:36 -07001859 assert(old_value != NULL);
Eric Snow96c6af92015-05-29 22:21:39 -06001860 mp->ma_used--;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001861 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner78601a32016-09-09 19:28:36 -07001862 dk_set_index(mp->ma_keys, hashpos, DKIX_DUMMY);
1863 ep = &DK_ENTRIES(mp->ma_keys)[ix];
1864 ENSURE_ALLOWS_DELETIONS(mp);
1865 old_key = ep->me_key;
1866 ep->me_key = NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001867 ep->me_value = NULL;
Victor Stinner78601a32016-09-09 19:28:36 -07001868 Py_DECREF(old_key);
Victor Stinner611b0fa2016-09-14 15:02:01 +02001869
1870 assert(_PyDict_CheckConsistency(mp));
Eric Snow96c6af92015-05-29 22:21:39 -06001871 return old_value;
1872}
1873
Serhiy Storchaka67796522017-01-12 18:34:33 +02001874PyObject *
Serhiy Storchaka42e1ea92017-01-12 19:12:21 +02001875_PyDict_Pop(PyObject *dict, PyObject *key, PyObject *deflt)
Serhiy Storchaka67796522017-01-12 18:34:33 +02001876{
1877 Py_hash_t hash;
1878
Serhiy Storchaka42e1ea92017-01-12 19:12:21 +02001879 if (((PyDictObject *)dict)->ma_used == 0) {
Serhiy Storchaka67796522017-01-12 18:34:33 +02001880 if (deflt) {
1881 Py_INCREF(deflt);
1882 return deflt;
1883 }
1884 _PyErr_SetKeyError(key);
1885 return NULL;
1886 }
1887 if (!PyUnicode_CheckExact(key) ||
1888 (hash = ((PyASCIIObject *) key)->hash) == -1) {
1889 hash = PyObject_Hash(key);
1890 if (hash == -1)
1891 return NULL;
1892 }
Serhiy Storchaka42e1ea92017-01-12 19:12:21 +02001893 return _PyDict_Pop_KnownHash(dict, key, hash, deflt);
Serhiy Storchaka67796522017-01-12 18:34:33 +02001894}
1895
Eric Snow96c6af92015-05-29 22:21:39 -06001896/* Internal version of dict.from_keys(). It is subclass-friendly. */
1897PyObject *
1898_PyDict_FromKeys(PyObject *cls, PyObject *iterable, PyObject *value)
1899{
1900 PyObject *it; /* iter(iterable) */
1901 PyObject *key;
1902 PyObject *d;
1903 int status;
1904
Victor Stinnera5ed5f02016-12-06 18:45:50 +01001905 d = _PyObject_CallNoArg(cls);
Eric Snow96c6af92015-05-29 22:21:39 -06001906 if (d == NULL)
1907 return NULL;
1908
1909 if (PyDict_CheckExact(d) && ((PyDictObject *)d)->ma_used == 0) {
1910 if (PyDict_CheckExact(iterable)) {
1911 PyDictObject *mp = (PyDictObject *)d;
1912 PyObject *oldvalue;
1913 Py_ssize_t pos = 0;
1914 PyObject *key;
1915 Py_hash_t hash;
1916
Victor Stinner742da042016-09-07 17:40:12 -07001917 if (dictresize(mp, ESTIMATE_SIZE(Py_SIZE(iterable)))) {
Eric Snow96c6af92015-05-29 22:21:39 -06001918 Py_DECREF(d);
1919 return NULL;
1920 }
1921
1922 while (_PyDict_Next(iterable, &pos, &key, &oldvalue, &hash)) {
1923 if (insertdict(mp, key, hash, value)) {
1924 Py_DECREF(d);
1925 return NULL;
1926 }
1927 }
1928 return d;
1929 }
1930 if (PyAnySet_CheckExact(iterable)) {
1931 PyDictObject *mp = (PyDictObject *)d;
1932 Py_ssize_t pos = 0;
1933 PyObject *key;
1934 Py_hash_t hash;
1935
Victor Stinner742da042016-09-07 17:40:12 -07001936 if (dictresize(mp, ESTIMATE_SIZE(PySet_GET_SIZE(iterable)))) {
Eric Snow96c6af92015-05-29 22:21:39 -06001937 Py_DECREF(d);
1938 return NULL;
1939 }
1940
1941 while (_PySet_NextEntry(iterable, &pos, &key, &hash)) {
1942 if (insertdict(mp, key, hash, value)) {
1943 Py_DECREF(d);
1944 return NULL;
1945 }
1946 }
1947 return d;
1948 }
1949 }
1950
1951 it = PyObject_GetIter(iterable);
1952 if (it == NULL){
1953 Py_DECREF(d);
1954 return NULL;
1955 }
1956
1957 if (PyDict_CheckExact(d)) {
1958 while ((key = PyIter_Next(it)) != NULL) {
1959 status = PyDict_SetItem(d, key, value);
1960 Py_DECREF(key);
1961 if (status < 0)
1962 goto Fail;
1963 }
1964 } else {
1965 while ((key = PyIter_Next(it)) != NULL) {
1966 status = PyObject_SetItem(d, key, value);
1967 Py_DECREF(key);
1968 if (status < 0)
1969 goto Fail;
1970 }
1971 }
1972
1973 if (PyErr_Occurred())
1974 goto Fail;
1975 Py_DECREF(it);
1976 return d;
1977
1978Fail:
1979 Py_DECREF(it);
1980 Py_DECREF(d);
1981 return NULL;
1982}
1983
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001984/* Methods */
1985
1986static void
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001987dict_dealloc(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001988{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001989 PyObject **values = mp->ma_values;
1990 PyDictKeysObject *keys = mp->ma_keys;
1991 Py_ssize_t i, n;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001992 PyObject_GC_UnTrack(mp);
1993 Py_TRASHCAN_SAFE_BEGIN(mp)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001994 if (values != NULL) {
1995 if (values != empty_values) {
Victor Stinner742da042016-09-07 17:40:12 -07001996 for (i = 0, n = mp->ma_keys->dk_nentries; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001997 Py_XDECREF(values[i]);
1998 }
1999 free_values(values);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002000 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002001 DK_DECREF(keys);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002002 }
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02002003 else if (keys != NULL) {
Antoine Pitrou2d169b22012-05-12 23:43:44 +02002004 assert(keys->dk_refcnt == 1);
2005 DK_DECREF(keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002006 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002007 if (numfree < PyDict_MAXFREELIST && Py_TYPE(mp) == &PyDict_Type)
2008 free_list[numfree++] = mp;
2009 else
2010 Py_TYPE(mp)->tp_free((PyObject *)mp);
2011 Py_TRASHCAN_SAFE_END(mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002012}
2013
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002014
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002015static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002016dict_repr(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002017{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002018 Py_ssize_t i;
Victor Stinnerf91929b2013-11-19 13:07:38 +01002019 PyObject *key = NULL, *value = NULL;
2020 _PyUnicodeWriter writer;
2021 int first;
Guido van Rossum255443b1998-04-10 22:47:14 +00002022
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002023 i = Py_ReprEnter((PyObject *)mp);
2024 if (i != 0) {
2025 return i > 0 ? PyUnicode_FromString("{...}") : NULL;
2026 }
Guido van Rossum255443b1998-04-10 22:47:14 +00002027
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002028 if (mp->ma_used == 0) {
Victor Stinnerf91929b2013-11-19 13:07:38 +01002029 Py_ReprLeave((PyObject *)mp);
2030 return PyUnicode_FromString("{}");
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002031 }
Tim Petersa7259592001-06-16 05:11:17 +00002032
Victor Stinnerf91929b2013-11-19 13:07:38 +01002033 _PyUnicodeWriter_Init(&writer);
2034 writer.overallocate = 1;
2035 /* "{" + "1: 2" + ", 3: 4" * (len - 1) + "}" */
2036 writer.min_length = 1 + 4 + (2 + 4) * (mp->ma_used - 1) + 1;
Tim Petersa7259592001-06-16 05:11:17 +00002037
Victor Stinnerf91929b2013-11-19 13:07:38 +01002038 if (_PyUnicodeWriter_WriteChar(&writer, '{') < 0)
2039 goto error;
Tim Petersa7259592001-06-16 05:11:17 +00002040
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002041 /* Do repr() on each key+value pair, and insert ": " between them.
2042 Note that repr may mutate the dict. */
2043 i = 0;
Victor Stinnerf91929b2013-11-19 13:07:38 +01002044 first = 1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002045 while (PyDict_Next((PyObject *)mp, &i, &key, &value)) {
Victor Stinnerf91929b2013-11-19 13:07:38 +01002046 PyObject *s;
2047 int res;
2048
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002049 /* Prevent repr from deleting key or value during key format. */
2050 Py_INCREF(key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002051 Py_INCREF(value);
Victor Stinnerf97dfd72013-07-18 01:00:45 +02002052
Victor Stinnerf91929b2013-11-19 13:07:38 +01002053 if (!first) {
2054 if (_PyUnicodeWriter_WriteASCIIString(&writer, ", ", 2) < 0)
2055 goto error;
2056 }
2057 first = 0;
2058
2059 s = PyObject_Repr(key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002060 if (s == NULL)
Victor Stinnerf91929b2013-11-19 13:07:38 +01002061 goto error;
2062 res = _PyUnicodeWriter_WriteStr(&writer, s);
2063 Py_DECREF(s);
2064 if (res < 0)
2065 goto error;
2066
2067 if (_PyUnicodeWriter_WriteASCIIString(&writer, ": ", 2) < 0)
2068 goto error;
2069
2070 s = PyObject_Repr(value);
2071 if (s == NULL)
2072 goto error;
2073 res = _PyUnicodeWriter_WriteStr(&writer, s);
2074 Py_DECREF(s);
2075 if (res < 0)
2076 goto error;
2077
2078 Py_CLEAR(key);
2079 Py_CLEAR(value);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002080 }
Tim Petersa7259592001-06-16 05:11:17 +00002081
Victor Stinnerf91929b2013-11-19 13:07:38 +01002082 writer.overallocate = 0;
2083 if (_PyUnicodeWriter_WriteChar(&writer, '}') < 0)
2084 goto error;
Tim Petersa7259592001-06-16 05:11:17 +00002085
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002086 Py_ReprLeave((PyObject *)mp);
Victor Stinnerf91929b2013-11-19 13:07:38 +01002087
2088 return _PyUnicodeWriter_Finish(&writer);
2089
2090error:
2091 Py_ReprLeave((PyObject *)mp);
2092 _PyUnicodeWriter_Dealloc(&writer);
2093 Py_XDECREF(key);
2094 Py_XDECREF(value);
2095 return NULL;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002096}
2097
Martin v. Löwis18e16552006-02-15 17:27:45 +00002098static Py_ssize_t
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002099dict_length(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002100{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002101 return mp->ma_used;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002102}
2103
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002104static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002105dict_subscript(PyDictObject *mp, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002106{
Victor Stinner742da042016-09-07 17:40:12 -07002107 Py_ssize_t ix;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002108 Py_hash_t hash;
INADA Naokiba609772016-12-07 20:41:42 +09002109 PyObject *value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002110
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002111 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002112 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002113 hash = PyObject_Hash(key);
2114 if (hash == -1)
2115 return NULL;
2116 }
INADA Naokiba609772016-12-07 20:41:42 +09002117 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07002118 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002119 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09002120 if (ix == DKIX_EMPTY || value == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002121 if (!PyDict_CheckExact(mp)) {
2122 /* Look up __missing__ method if we're a subclass. */
2123 PyObject *missing, *res;
Benjamin Petersonce798522012-01-22 11:24:29 -05002124 _Py_IDENTIFIER(__missing__);
2125 missing = _PyObject_LookupSpecial((PyObject *)mp, &PyId___missing__);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002126 if (missing != NULL) {
Victor Stinnerde4ae3d2016-12-04 22:59:09 +01002127 res = PyObject_CallFunctionObjArgs(missing,
2128 key, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002129 Py_DECREF(missing);
2130 return res;
2131 }
2132 else if (PyErr_Occurred())
2133 return NULL;
2134 }
Raymond Hettinger69492da2013-09-02 15:59:26 -07002135 _PyErr_SetKeyError(key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002136 return NULL;
2137 }
INADA Naokiba609772016-12-07 20:41:42 +09002138 Py_INCREF(value);
2139 return value;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002140}
2141
2142static int
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002143dict_ass_sub(PyDictObject *mp, PyObject *v, PyObject *w)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002144{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002145 if (w == NULL)
2146 return PyDict_DelItem((PyObject *)mp, v);
2147 else
2148 return PyDict_SetItem((PyObject *)mp, v, w);
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002149}
2150
Guido van Rossuma9e7a811997-05-13 21:02:11 +00002151static PyMappingMethods dict_as_mapping = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002152 (lenfunc)dict_length, /*mp_length*/
2153 (binaryfunc)dict_subscript, /*mp_subscript*/
2154 (objobjargproc)dict_ass_sub, /*mp_ass_subscript*/
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002155};
2156
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002157static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002158dict_keys(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002159{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002160 PyObject *v;
2161 Py_ssize_t i, j;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002162 PyDictKeyEntry *ep;
2163 Py_ssize_t size, n, offset;
2164 PyObject **value_ptr;
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002165
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002166 again:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002167 n = mp->ma_used;
2168 v = PyList_New(n);
2169 if (v == NULL)
2170 return NULL;
2171 if (n != mp->ma_used) {
2172 /* Durnit. The allocations caused the dict to resize.
2173 * Just start over, this shouldn't normally happen.
2174 */
2175 Py_DECREF(v);
2176 goto again;
2177 }
Victor Stinner742da042016-09-07 17:40:12 -07002178 ep = DK_ENTRIES(mp->ma_keys);
2179 size = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002180 if (mp->ma_values) {
2181 value_ptr = mp->ma_values;
2182 offset = sizeof(PyObject *);
2183 }
2184 else {
2185 value_ptr = &ep[0].me_value;
2186 offset = sizeof(PyDictKeyEntry);
2187 }
2188 for (i = 0, j = 0; i < size; i++) {
2189 if (*value_ptr != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002190 PyObject *key = ep[i].me_key;
2191 Py_INCREF(key);
2192 PyList_SET_ITEM(v, j, key);
2193 j++;
2194 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002195 value_ptr = (PyObject **)(((char *)value_ptr) + offset);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002196 }
2197 assert(j == n);
2198 return v;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002199}
2200
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002201static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002202dict_values(PyDictObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002203{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002204 PyObject *v;
2205 Py_ssize_t i, j;
Benjamin Petersonf0acae22016-09-08 09:50:08 -07002206 PyDictKeyEntry *ep;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002207 Py_ssize_t size, n, offset;
2208 PyObject **value_ptr;
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002209
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002210 again:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002211 n = mp->ma_used;
2212 v = PyList_New(n);
2213 if (v == NULL)
2214 return NULL;
2215 if (n != mp->ma_used) {
2216 /* Durnit. The allocations caused the dict to resize.
2217 * Just start over, this shouldn't normally happen.
2218 */
2219 Py_DECREF(v);
2220 goto again;
2221 }
Benjamin Petersonf0acae22016-09-08 09:50:08 -07002222 ep = DK_ENTRIES(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -07002223 size = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002224 if (mp->ma_values) {
2225 value_ptr = mp->ma_values;
2226 offset = sizeof(PyObject *);
2227 }
2228 else {
Benjamin Petersonf0acae22016-09-08 09:50:08 -07002229 value_ptr = &ep[0].me_value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002230 offset = sizeof(PyDictKeyEntry);
2231 }
2232 for (i = 0, j = 0; i < size; i++) {
2233 PyObject *value = *value_ptr;
2234 value_ptr = (PyObject **)(((char *)value_ptr) + offset);
2235 if (value != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002236 Py_INCREF(value);
2237 PyList_SET_ITEM(v, j, value);
2238 j++;
2239 }
2240 }
2241 assert(j == n);
2242 return v;
Guido van Rossum25831651993-05-19 14:50:45 +00002243}
2244
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002245static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002246dict_items(PyDictObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002247{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002248 PyObject *v;
2249 Py_ssize_t i, j, n;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002250 Py_ssize_t size, offset;
2251 PyObject *item, *key;
2252 PyDictKeyEntry *ep;
2253 PyObject **value_ptr;
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002254
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002255 /* Preallocate the list of tuples, to avoid allocations during
2256 * the loop over the items, which could trigger GC, which
2257 * could resize the dict. :-(
2258 */
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002259 again:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002260 n = mp->ma_used;
2261 v = PyList_New(n);
2262 if (v == NULL)
2263 return NULL;
2264 for (i = 0; i < n; i++) {
2265 item = PyTuple_New(2);
2266 if (item == NULL) {
2267 Py_DECREF(v);
2268 return NULL;
2269 }
2270 PyList_SET_ITEM(v, i, item);
2271 }
2272 if (n != mp->ma_used) {
2273 /* Durnit. The allocations caused the dict to resize.
2274 * Just start over, this shouldn't normally happen.
2275 */
2276 Py_DECREF(v);
2277 goto again;
2278 }
2279 /* Nothing we do below makes any function calls. */
Victor Stinner742da042016-09-07 17:40:12 -07002280 ep = DK_ENTRIES(mp->ma_keys);
2281 size = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002282 if (mp->ma_values) {
2283 value_ptr = mp->ma_values;
2284 offset = sizeof(PyObject *);
2285 }
2286 else {
2287 value_ptr = &ep[0].me_value;
2288 offset = sizeof(PyDictKeyEntry);
2289 }
2290 for (i = 0, j = 0; i < size; i++) {
2291 PyObject *value = *value_ptr;
2292 value_ptr = (PyObject **)(((char *)value_ptr) + offset);
2293 if (value != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002294 key = ep[i].me_key;
2295 item = PyList_GET_ITEM(v, j);
2296 Py_INCREF(key);
2297 PyTuple_SET_ITEM(item, 0, key);
2298 Py_INCREF(value);
2299 PyTuple_SET_ITEM(item, 1, value);
2300 j++;
2301 }
2302 }
2303 assert(j == n);
2304 return v;
Guido van Rossum25831651993-05-19 14:50:45 +00002305}
2306
Larry Hastings5c661892014-01-24 06:17:25 -08002307/*[clinic input]
2308@classmethod
2309dict.fromkeys
Larry Hastings5c661892014-01-24 06:17:25 -08002310 iterable: object
2311 value: object=None
2312 /
2313
2314Returns a new dict with keys from iterable and values equal to value.
2315[clinic start generated code]*/
2316
Larry Hastings5c661892014-01-24 06:17:25 -08002317static PyObject *
2318dict_fromkeys_impl(PyTypeObject *type, PyObject *iterable, PyObject *value)
Serhiy Storchaka1009bf12015-04-03 23:53:51 +03002319/*[clinic end generated code: output=8fb98e4b10384999 input=b85a667f9bf4669d]*/
Larry Hastings5c661892014-01-24 06:17:25 -08002320{
Eric Snow96c6af92015-05-29 22:21:39 -06002321 return _PyDict_FromKeys((PyObject *)type, iterable, value);
Raymond Hettingere33d3df2002-11-27 07:29:33 +00002322}
2323
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002324static int
Victor Stinner742da042016-09-07 17:40:12 -07002325dict_update_common(PyObject *self, PyObject *args, PyObject *kwds,
2326 const char *methname)
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002327{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002328 PyObject *arg = NULL;
2329 int result = 0;
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002330
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002331 if (!PyArg_UnpackTuple(args, methname, 0, 1, &arg))
2332 result = -1;
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002333
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002334 else if (arg != NULL) {
Martin v. Löwis1c67dd92011-10-14 15:16:45 +02002335 _Py_IDENTIFIER(keys);
2336 if (_PyObject_HasAttrId(arg, &PyId_keys))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002337 result = PyDict_Merge(self, arg, 1);
2338 else
2339 result = PyDict_MergeFromSeq2(self, arg, 1);
2340 }
2341 if (result == 0 && kwds != NULL) {
2342 if (PyArg_ValidateKeywordArguments(kwds))
2343 result = PyDict_Merge(self, kwds, 1);
2344 else
2345 result = -1;
2346 }
2347 return result;
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002348}
2349
2350static PyObject *
2351dict_update(PyObject *self, PyObject *args, PyObject *kwds)
2352{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002353 if (dict_update_common(self, args, kwds, "update") != -1)
2354 Py_RETURN_NONE;
2355 return NULL;
Tim Peters6d6c1a32001-08-02 04:15:00 +00002356}
2357
Guido van Rossum05ac6de2001-08-10 20:28:28 +00002358/* Update unconditionally replaces existing items.
2359 Merge has a 3rd argument 'override'; if set, it acts like Update,
Tim Peters1fc240e2001-10-26 05:06:50 +00002360 otherwise it leaves existing items unchanged.
2361
2362 PyDict_{Update,Merge} update/merge from a mapping object.
2363
Tim Petersf582b822001-12-11 18:51:08 +00002364 PyDict_MergeFromSeq2 updates/merges from any iterable object
Tim Peters1fc240e2001-10-26 05:06:50 +00002365 producing iterable objects of length 2.
2366*/
2367
Tim Petersf582b822001-12-11 18:51:08 +00002368int
Tim Peters1fc240e2001-10-26 05:06:50 +00002369PyDict_MergeFromSeq2(PyObject *d, PyObject *seq2, int override)
2370{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002371 PyObject *it; /* iter(seq2) */
2372 Py_ssize_t i; /* index into seq2 of current element */
2373 PyObject *item; /* seq2[i] */
2374 PyObject *fast; /* item as a 2-tuple or 2-list */
Tim Peters1fc240e2001-10-26 05:06:50 +00002375
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002376 assert(d != NULL);
2377 assert(PyDict_Check(d));
2378 assert(seq2 != NULL);
Tim Peters1fc240e2001-10-26 05:06:50 +00002379
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002380 it = PyObject_GetIter(seq2);
2381 if (it == NULL)
2382 return -1;
Tim Peters1fc240e2001-10-26 05:06:50 +00002383
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002384 for (i = 0; ; ++i) {
2385 PyObject *key, *value;
2386 Py_ssize_t n;
Tim Peters1fc240e2001-10-26 05:06:50 +00002387
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002388 fast = NULL;
2389 item = PyIter_Next(it);
2390 if (item == NULL) {
2391 if (PyErr_Occurred())
2392 goto Fail;
2393 break;
2394 }
Tim Peters1fc240e2001-10-26 05:06:50 +00002395
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002396 /* Convert item to sequence, and verify length 2. */
2397 fast = PySequence_Fast(item, "");
2398 if (fast == NULL) {
2399 if (PyErr_ExceptionMatches(PyExc_TypeError))
2400 PyErr_Format(PyExc_TypeError,
2401 "cannot convert dictionary update "
2402 "sequence element #%zd to a sequence",
2403 i);
2404 goto Fail;
2405 }
2406 n = PySequence_Fast_GET_SIZE(fast);
2407 if (n != 2) {
2408 PyErr_Format(PyExc_ValueError,
2409 "dictionary update sequence element #%zd "
2410 "has length %zd; 2 is required",
2411 i, n);
2412 goto Fail;
2413 }
Tim Peters1fc240e2001-10-26 05:06:50 +00002414
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002415 /* Update/merge with this (key, value) pair. */
2416 key = PySequence_Fast_GET_ITEM(fast, 0);
2417 value = PySequence_Fast_GET_ITEM(fast, 1);
2418 if (override || PyDict_GetItem(d, key) == NULL) {
2419 int status = PyDict_SetItem(d, key, value);
2420 if (status < 0)
2421 goto Fail;
2422 }
2423 Py_DECREF(fast);
2424 Py_DECREF(item);
2425 }
Tim Peters1fc240e2001-10-26 05:06:50 +00002426
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002427 i = 0;
Victor Stinner611b0fa2016-09-14 15:02:01 +02002428 assert(_PyDict_CheckConsistency((PyDictObject *)d));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002429 goto Return;
Tim Peters1fc240e2001-10-26 05:06:50 +00002430Fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002431 Py_XDECREF(item);
2432 Py_XDECREF(fast);
2433 i = -1;
Tim Peters1fc240e2001-10-26 05:06:50 +00002434Return:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002435 Py_DECREF(it);
2436 return Py_SAFE_DOWNCAST(i, Py_ssize_t, int);
Tim Peters1fc240e2001-10-26 05:06:50 +00002437}
2438
doko@ubuntu.comc96df682016-10-11 08:04:02 +02002439static int
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002440dict_merge(PyObject *a, PyObject *b, int override)
Guido van Rossum05ac6de2001-08-10 20:28:28 +00002441{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002442 PyDictObject *mp, *other;
2443 Py_ssize_t i, n;
Victor Stinner742da042016-09-07 17:40:12 -07002444 PyDictKeyEntry *entry, *ep0;
Tim Peters6d6c1a32001-08-02 04:15:00 +00002445
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002446 assert(0 <= override && override <= 2);
2447
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002448 /* We accept for the argument either a concrete dictionary object,
2449 * or an abstract "mapping" object. For the former, we can do
2450 * things quite efficiently. For the latter, we only require that
2451 * PyMapping_Keys() and PyObject_GetItem() be supported.
2452 */
2453 if (a == NULL || !PyDict_Check(a) || b == NULL) {
2454 PyErr_BadInternalCall();
2455 return -1;
2456 }
2457 mp = (PyDictObject*)a;
2458 if (PyDict_Check(b)) {
2459 other = (PyDictObject*)b;
2460 if (other == mp || other->ma_used == 0)
2461 /* a.update(a) or a.update({}); nothing to do */
2462 return 0;
2463 if (mp->ma_used == 0)
2464 /* Since the target dict is empty, PyDict_GetItem()
2465 * always returns NULL. Setting override to 1
2466 * skips the unnecessary test.
2467 */
2468 override = 1;
2469 /* Do one big resize at the start, rather than
2470 * incrementally resizing as we insert new items. Expect
2471 * that there will be no (or few) overlapping keys.
2472 */
INADA Naokib1152be2016-10-27 19:26:50 +09002473 if (USABLE_FRACTION(mp->ma_keys->dk_size) < other->ma_used) {
2474 if (dictresize(mp, ESTIMATE_SIZE(mp->ma_used + other->ma_used))) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002475 return -1;
INADA Naokib1152be2016-10-27 19:26:50 +09002476 }
2477 }
Victor Stinner742da042016-09-07 17:40:12 -07002478 ep0 = DK_ENTRIES(other->ma_keys);
2479 for (i = 0, n = other->ma_keys->dk_nentries; i < n; i++) {
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002480 PyObject *key, *value;
2481 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002482 entry = &ep0[i];
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002483 key = entry->me_key;
2484 hash = entry->me_hash;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002485 if (other->ma_values)
2486 value = other->ma_values[i];
2487 else
2488 value = entry->me_value;
2489
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002490 if (value != NULL) {
2491 int err = 0;
2492 Py_INCREF(key);
2493 Py_INCREF(value);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02002494 if (override == 1)
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002495 err = insertdict(mp, key, hash, value);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02002496 else if (_PyDict_GetItem_KnownHash(a, key, hash) == NULL) {
2497 if (PyErr_Occurred()) {
2498 Py_DECREF(value);
2499 Py_DECREF(key);
2500 return -1;
2501 }
2502 err = insertdict(mp, key, hash, value);
2503 }
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002504 else if (override != 0) {
2505 _PyErr_SetKeyError(key);
2506 Py_DECREF(value);
2507 Py_DECREF(key);
2508 return -1;
2509 }
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002510 Py_DECREF(value);
2511 Py_DECREF(key);
2512 if (err != 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002513 return -1;
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002514
Victor Stinner742da042016-09-07 17:40:12 -07002515 if (n != other->ma_keys->dk_nentries) {
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002516 PyErr_SetString(PyExc_RuntimeError,
2517 "dict mutated during update");
2518 return -1;
2519 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002520 }
2521 }
2522 }
2523 else {
2524 /* Do it the generic, slower way */
2525 PyObject *keys = PyMapping_Keys(b);
2526 PyObject *iter;
2527 PyObject *key, *value;
2528 int status;
Barry Warsaw66a0d1d2001-06-26 20:08:32 +00002529
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002530 if (keys == NULL)
2531 /* Docstring says this is equivalent to E.keys() so
2532 * if E doesn't have a .keys() method we want
2533 * AttributeError to percolate up. Might as well
2534 * do the same for any other error.
2535 */
2536 return -1;
Barry Warsaw66a0d1d2001-06-26 20:08:32 +00002537
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002538 iter = PyObject_GetIter(keys);
2539 Py_DECREF(keys);
2540 if (iter == NULL)
2541 return -1;
Barry Warsaw66a0d1d2001-06-26 20:08:32 +00002542
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002543 for (key = PyIter_Next(iter); key; key = PyIter_Next(iter)) {
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002544 if (override != 1 && PyDict_GetItem(a, key) != NULL) {
2545 if (override != 0) {
2546 _PyErr_SetKeyError(key);
2547 Py_DECREF(key);
2548 Py_DECREF(iter);
2549 return -1;
2550 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002551 Py_DECREF(key);
2552 continue;
2553 }
2554 value = PyObject_GetItem(b, key);
2555 if (value == NULL) {
2556 Py_DECREF(iter);
2557 Py_DECREF(key);
2558 return -1;
2559 }
2560 status = PyDict_SetItem(a, key, value);
2561 Py_DECREF(key);
2562 Py_DECREF(value);
2563 if (status < 0) {
2564 Py_DECREF(iter);
2565 return -1;
2566 }
2567 }
2568 Py_DECREF(iter);
2569 if (PyErr_Occurred())
2570 /* Iterator completed, via error */
2571 return -1;
2572 }
Victor Stinner611b0fa2016-09-14 15:02:01 +02002573 assert(_PyDict_CheckConsistency((PyDictObject *)a));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002574 return 0;
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002575}
2576
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002577int
2578PyDict_Update(PyObject *a, PyObject *b)
2579{
2580 return dict_merge(a, b, 1);
2581}
2582
2583int
2584PyDict_Merge(PyObject *a, PyObject *b, int override)
2585{
2586 /* XXX Deprecate override not in (0, 1). */
2587 return dict_merge(a, b, override != 0);
2588}
2589
2590int
2591_PyDict_MergeEx(PyObject *a, PyObject *b, int override)
2592{
2593 return dict_merge(a, b, override);
2594}
2595
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002596static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002597dict_copy(PyDictObject *mp)
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002598{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002599 return PyDict_Copy((PyObject*)mp);
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00002600}
2601
2602PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002603PyDict_Copy(PyObject *o)
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00002604{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002605 PyObject *copy;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002606 PyDictObject *mp;
2607 Py_ssize_t i, n;
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00002608
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002609 if (o == NULL || !PyDict_Check(o)) {
2610 PyErr_BadInternalCall();
2611 return NULL;
2612 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002613 mp = (PyDictObject *)o;
2614 if (_PyDict_HasSplitTable(mp)) {
2615 PyDictObject *split_copy;
Victor Stinner742da042016-09-07 17:40:12 -07002616 Py_ssize_t size = USABLE_FRACTION(DK_SIZE(mp->ma_keys));
2617 PyObject **newvalues;
2618 newvalues = new_values(size);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002619 if (newvalues == NULL)
2620 return PyErr_NoMemory();
2621 split_copy = PyObject_GC_New(PyDictObject, &PyDict_Type);
2622 if (split_copy == NULL) {
2623 free_values(newvalues);
2624 return NULL;
2625 }
2626 split_copy->ma_values = newvalues;
2627 split_copy->ma_keys = mp->ma_keys;
2628 split_copy->ma_used = mp->ma_used;
2629 DK_INCREF(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -07002630 for (i = 0, n = size; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002631 PyObject *value = mp->ma_values[i];
2632 Py_XINCREF(value);
2633 split_copy->ma_values[i] = value;
2634 }
Benjamin Peterson7ce67e42012-04-24 10:32:57 -04002635 if (_PyObject_GC_IS_TRACKED(mp))
2636 _PyObject_GC_TRACK(split_copy);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002637 return (PyObject *)split_copy;
2638 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002639 copy = PyDict_New();
2640 if (copy == NULL)
2641 return NULL;
2642 if (PyDict_Merge(copy, o, 1) == 0)
2643 return copy;
2644 Py_DECREF(copy);
2645 return NULL;
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002646}
2647
Martin v. Löwis18e16552006-02-15 17:27:45 +00002648Py_ssize_t
Tim Peters1f5871e2000-07-04 17:44:48 +00002649PyDict_Size(PyObject *mp)
Guido van Rossum4199fac1993-11-05 10:18:44 +00002650{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002651 if (mp == NULL || !PyDict_Check(mp)) {
2652 PyErr_BadInternalCall();
2653 return -1;
2654 }
2655 return ((PyDictObject *)mp)->ma_used;
Guido van Rossum4199fac1993-11-05 10:18:44 +00002656}
2657
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002658PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002659PyDict_Keys(PyObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002660{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002661 if (mp == NULL || !PyDict_Check(mp)) {
2662 PyErr_BadInternalCall();
2663 return NULL;
2664 }
2665 return dict_keys((PyDictObject *)mp);
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002666}
2667
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002668PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002669PyDict_Values(PyObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002670{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002671 if (mp == NULL || !PyDict_Check(mp)) {
2672 PyErr_BadInternalCall();
2673 return NULL;
2674 }
2675 return dict_values((PyDictObject *)mp);
Guido van Rossum25831651993-05-19 14:50:45 +00002676}
2677
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002678PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002679PyDict_Items(PyObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002680{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002681 if (mp == NULL || !PyDict_Check(mp)) {
2682 PyErr_BadInternalCall();
2683 return NULL;
2684 }
2685 return dict_items((PyDictObject *)mp);
Guido van Rossum25831651993-05-19 14:50:45 +00002686}
2687
Tim Peterse63415e2001-05-08 04:38:29 +00002688/* Return 1 if dicts equal, 0 if not, -1 if error.
2689 * Gets out as soon as any difference is detected.
2690 * Uses only Py_EQ comparison.
2691 */
2692static int
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002693dict_equal(PyDictObject *a, PyDictObject *b)
Tim Peterse63415e2001-05-08 04:38:29 +00002694{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002695 Py_ssize_t i;
Tim Peterse63415e2001-05-08 04:38:29 +00002696
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002697 if (a->ma_used != b->ma_used)
2698 /* can't be equal if # of entries differ */
2699 return 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002700 /* Same # of entries -- check all of 'em. Exit early on any diff. */
Victor Stinner742da042016-09-07 17:40:12 -07002701 for (i = 0; i < a->ma_keys->dk_nentries; i++) {
2702 PyDictKeyEntry *ep = &DK_ENTRIES(a->ma_keys)[i];
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002703 PyObject *aval;
2704 if (a->ma_values)
2705 aval = a->ma_values[i];
2706 else
2707 aval = ep->me_value;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002708 if (aval != NULL) {
2709 int cmp;
2710 PyObject *bval;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002711 PyObject *key = ep->me_key;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002712 /* temporarily bump aval's refcount to ensure it stays
2713 alive until we're done with it */
2714 Py_INCREF(aval);
2715 /* ditto for key */
2716 Py_INCREF(key);
Antoine Pitrou0e9958b2012-12-02 19:10:07 +01002717 /* reuse the known hash value */
INADA Naokiba609772016-12-07 20:41:42 +09002718 b->ma_keys->dk_lookup(b, key, ep->me_hash, &bval, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002719 Py_DECREF(key);
2720 if (bval == NULL) {
2721 Py_DECREF(aval);
2722 if (PyErr_Occurred())
2723 return -1;
2724 return 0;
2725 }
2726 cmp = PyObject_RichCompareBool(aval, bval, Py_EQ);
2727 Py_DECREF(aval);
2728 if (cmp <= 0) /* error or not equal */
2729 return cmp;
2730 }
2731 }
2732 return 1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002733}
Tim Peterse63415e2001-05-08 04:38:29 +00002734
2735static PyObject *
2736dict_richcompare(PyObject *v, PyObject *w, int op)
2737{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002738 int cmp;
2739 PyObject *res;
Tim Peterse63415e2001-05-08 04:38:29 +00002740
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002741 if (!PyDict_Check(v) || !PyDict_Check(w)) {
2742 res = Py_NotImplemented;
2743 }
2744 else if (op == Py_EQ || op == Py_NE) {
2745 cmp = dict_equal((PyDictObject *)v, (PyDictObject *)w);
2746 if (cmp < 0)
2747 return NULL;
2748 res = (cmp == (op == Py_EQ)) ? Py_True : Py_False;
2749 }
2750 else
2751 res = Py_NotImplemented;
2752 Py_INCREF(res);
2753 return res;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002754}
Tim Peterse63415e2001-05-08 04:38:29 +00002755
Larry Hastings61272b72014-01-07 12:41:53 -08002756/*[clinic input]
Larry Hastings31826802013-10-19 00:09:25 -07002757
2758@coexist
2759dict.__contains__
2760
2761 key: object
2762 /
2763
Meador Ingee02de8c2014-01-14 16:48:31 -06002764True if D has a key k, else False.
Larry Hastings61272b72014-01-07 12:41:53 -08002765[clinic start generated code]*/
Larry Hastings31826802013-10-19 00:09:25 -07002766
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002767static PyObject *
Larry Hastingsc2047262014-01-25 20:43:29 -08002768dict___contains__(PyDictObject *self, PyObject *key)
Serhiy Storchaka1009bf12015-04-03 23:53:51 +03002769/*[clinic end generated code: output=a3d03db709ed6e6b input=b852b2a19b51ab24]*/
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002770{
Larry Hastingsc2047262014-01-25 20:43:29 -08002771 register PyDictObject *mp = self;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002772 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002773 Py_ssize_t ix;
INADA Naokiba609772016-12-07 20:41:42 +09002774 PyObject *value;
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00002775
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002776 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002777 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002778 hash = PyObject_Hash(key);
2779 if (hash == -1)
2780 return NULL;
2781 }
INADA Naokiba609772016-12-07 20:41:42 +09002782 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07002783 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002784 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09002785 if (ix == DKIX_EMPTY || value == NULL)
Victor Stinner742da042016-09-07 17:40:12 -07002786 Py_RETURN_FALSE;
2787 Py_RETURN_TRUE;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002788}
2789
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002790static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002791dict_get(PyDictObject *mp, PyObject *args)
Barry Warsawc38c5da1997-10-06 17:49:20 +00002792{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002793 PyObject *key;
2794 PyObject *failobj = Py_None;
2795 PyObject *val = NULL;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002796 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002797 Py_ssize_t ix;
Barry Warsawc38c5da1997-10-06 17:49:20 +00002798
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002799 if (!PyArg_UnpackTuple(args, "get", 1, 2, &key, &failobj))
2800 return NULL;
Barry Warsawc38c5da1997-10-06 17:49:20 +00002801
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002802 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002803 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002804 hash = PyObject_Hash(key);
2805 if (hash == -1)
2806 return NULL;
2807 }
INADA Naokiba609772016-12-07 20:41:42 +09002808 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &val, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07002809 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002810 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09002811 if (ix == DKIX_EMPTY || val == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002812 val = failobj;
INADA Naokiba609772016-12-07 20:41:42 +09002813 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002814 Py_INCREF(val);
2815 return val;
Barry Warsawc38c5da1997-10-06 17:49:20 +00002816}
2817
Benjamin Peterson00e98862013-03-07 22:16:29 -05002818PyObject *
2819PyDict_SetDefault(PyObject *d, PyObject *key, PyObject *defaultobj)
Guido van Rossum164452c2000-08-08 16:12:54 +00002820{
Benjamin Peterson00e98862013-03-07 22:16:29 -05002821 PyDictObject *mp = (PyDictObject *)d;
INADA Naoki93f26f72016-11-02 18:45:16 +09002822 PyObject *value;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002823 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002824 Py_ssize_t hashpos, ix;
Guido van Rossum164452c2000-08-08 16:12:54 +00002825
Benjamin Peterson00e98862013-03-07 22:16:29 -05002826 if (!PyDict_Check(d)) {
2827 PyErr_BadInternalCall();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002828 return NULL;
Benjamin Peterson00e98862013-03-07 22:16:29 -05002829 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002830
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002831 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002832 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002833 hash = PyObject_Hash(key);
2834 if (hash == -1)
2835 return NULL;
2836 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002837
2838 if (mp->ma_values != NULL && !PyUnicode_CheckExact(key)) {
2839 if (insertion_resize(mp) < 0)
2840 return NULL;
2841 }
2842
INADA Naokiba609772016-12-07 20:41:42 +09002843 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07002844 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002845 return NULL;
INADA Naoki93f26f72016-11-02 18:45:16 +09002846
2847 if (_PyDict_HasSplitTable(mp) &&
INADA Naokiba609772016-12-07 20:41:42 +09002848 ((ix >= 0 && value == NULL && mp->ma_used != ix) ||
INADA Naoki93f26f72016-11-02 18:45:16 +09002849 (ix == DKIX_EMPTY && mp->ma_used != mp->ma_keys->dk_nentries))) {
2850 if (insertion_resize(mp) < 0) {
2851 return NULL;
2852 }
INADA Naokiba609772016-12-07 20:41:42 +09002853 hashpos = find_empty_slot(mp->ma_keys, key, hash);
INADA Naoki93f26f72016-11-02 18:45:16 +09002854 ix = DKIX_EMPTY;
2855 }
2856
2857 if (ix == DKIX_EMPTY) {
2858 PyDictKeyEntry *ep, *ep0;
2859 value = defaultobj;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002860 if (mp->ma_keys->dk_usable <= 0) {
Victor Stinner3c336c52016-09-12 14:17:40 +02002861 if (insertion_resize(mp) < 0) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002862 return NULL;
Victor Stinner3c336c52016-09-12 14:17:40 +02002863 }
INADA Naokiba609772016-12-07 20:41:42 +09002864 hashpos = find_empty_slot(mp->ma_keys, key, hash);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002865 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002866 ep0 = DK_ENTRIES(mp->ma_keys);
2867 ep = &ep0[mp->ma_keys->dk_nentries];
2868 dk_set_index(mp->ma_keys, hashpos, mp->ma_keys->dk_nentries);
Benjamin Petersonb1efa532013-03-04 09:47:50 -05002869 Py_INCREF(key);
INADA Naoki93f26f72016-11-02 18:45:16 +09002870 Py_INCREF(value);
2871 MAINTAIN_TRACKING(mp, key, value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002872 ep->me_key = key;
2873 ep->me_hash = hash;
INADA Naokiba609772016-12-07 20:41:42 +09002874 if (_PyDict_HasSplitTable(mp)) {
INADA Naoki93f26f72016-11-02 18:45:16 +09002875 assert(mp->ma_values[mp->ma_keys->dk_nentries] == NULL);
2876 mp->ma_values[mp->ma_keys->dk_nentries] = value;
Victor Stinner742da042016-09-07 17:40:12 -07002877 }
2878 else {
INADA Naoki93f26f72016-11-02 18:45:16 +09002879 ep->me_value = value;
Victor Stinner742da042016-09-07 17:40:12 -07002880 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002881 mp->ma_used++;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07002882 mp->ma_version_tag = DICT_NEXT_VERSION();
INADA Naoki93f26f72016-11-02 18:45:16 +09002883 mp->ma_keys->dk_usable--;
2884 mp->ma_keys->dk_nentries++;
2885 assert(mp->ma_keys->dk_usable >= 0);
2886 }
INADA Naokiba609772016-12-07 20:41:42 +09002887 else if (value == NULL) {
INADA Naoki93f26f72016-11-02 18:45:16 +09002888 value = defaultobj;
2889 assert(_PyDict_HasSplitTable(mp));
2890 assert(ix == mp->ma_used);
2891 Py_INCREF(value);
2892 MAINTAIN_TRACKING(mp, key, value);
INADA Naokiba609772016-12-07 20:41:42 +09002893 mp->ma_values[ix] = value;
INADA Naoki93f26f72016-11-02 18:45:16 +09002894 mp->ma_used++;
2895 mp->ma_version_tag = DICT_NEXT_VERSION();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002896 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002897
2898 assert(_PyDict_CheckConsistency(mp));
2899 return value;
Guido van Rossum164452c2000-08-08 16:12:54 +00002900}
2901
Benjamin Peterson00e98862013-03-07 22:16:29 -05002902static PyObject *
2903dict_setdefault(PyDictObject *mp, PyObject *args)
2904{
2905 PyObject *key, *val;
2906 PyObject *defaultobj = Py_None;
2907
2908 if (!PyArg_UnpackTuple(args, "setdefault", 1, 2, &key, &defaultobj))
2909 return NULL;
2910
Benjamin Peterson55898502013-03-08 08:36:49 -05002911 val = PyDict_SetDefault((PyObject *)mp, key, defaultobj);
Benjamin Peterson00e98862013-03-07 22:16:29 -05002912 Py_XINCREF(val);
2913 return val;
2914}
Guido van Rossum164452c2000-08-08 16:12:54 +00002915
2916static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002917dict_clear(PyDictObject *mp)
Guido van Rossumfb8f1ca1997-03-21 21:55:12 +00002918{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002919 PyDict_Clear((PyObject *)mp);
2920 Py_RETURN_NONE;
Guido van Rossumfb8f1ca1997-03-21 21:55:12 +00002921}
2922
Guido van Rossumba6ab842000-12-12 22:02:18 +00002923static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002924dict_pop(PyDictObject *mp, PyObject *args)
Guido van Rossume027d982002-04-12 15:11:59 +00002925{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002926 PyObject *key, *deflt = NULL;
Guido van Rossume027d982002-04-12 15:11:59 +00002927
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002928 if(!PyArg_UnpackTuple(args, "pop", 1, 2, &key, &deflt))
2929 return NULL;
Eric Snow96c6af92015-05-29 22:21:39 -06002930
Yury Selivanov684ef2c2016-10-28 19:01:21 -04002931 return _PyDict_Pop((PyObject*)mp, key, deflt);
Guido van Rossume027d982002-04-12 15:11:59 +00002932}
2933
2934static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002935dict_popitem(PyDictObject *mp)
Guido van Rossumba6ab842000-12-12 22:02:18 +00002936{
Victor Stinner742da042016-09-07 17:40:12 -07002937 Py_ssize_t i, j;
2938 PyDictKeyEntry *ep0, *ep;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002939 PyObject *res;
Guido van Rossumba6ab842000-12-12 22:02:18 +00002940
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002941 /* Allocate the result tuple before checking the size. Believe it
2942 * or not, this allocation could trigger a garbage collection which
2943 * could empty the dict, so if we checked the size first and that
2944 * happened, the result would be an infinite loop (searching for an
2945 * entry that no longer exists). Note that the usual popitem()
2946 * idiom is "while d: k, v = d.popitem()". so needing to throw the
2947 * tuple away if the dict *is* empty isn't a significant
2948 * inefficiency -- possible, but unlikely in practice.
2949 */
2950 res = PyTuple_New(2);
2951 if (res == NULL)
2952 return NULL;
2953 if (mp->ma_used == 0) {
2954 Py_DECREF(res);
2955 PyErr_SetString(PyExc_KeyError,
2956 "popitem(): dictionary is empty");
2957 return NULL;
2958 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002959 /* Convert split table to combined table */
2960 if (mp->ma_keys->dk_lookup == lookdict_split) {
2961 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
2962 Py_DECREF(res);
2963 return NULL;
2964 }
2965 }
2966 ENSURE_ALLOWS_DELETIONS(mp);
Victor Stinner742da042016-09-07 17:40:12 -07002967
2968 /* Pop last item */
2969 ep0 = DK_ENTRIES(mp->ma_keys);
2970 i = mp->ma_keys->dk_nentries - 1;
2971 while (i >= 0 && ep0[i].me_value == NULL) {
2972 i--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002973 }
Victor Stinner742da042016-09-07 17:40:12 -07002974 assert(i >= 0);
2975
2976 ep = &ep0[i];
2977 j = lookdict_index(mp->ma_keys, ep->me_hash, i);
2978 assert(j >= 0);
2979 assert(dk_get_index(mp->ma_keys, j) == i);
2980 dk_set_index(mp->ma_keys, j, DKIX_DUMMY);
2981
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002982 PyTuple_SET_ITEM(res, 0, ep->me_key);
2983 PyTuple_SET_ITEM(res, 1, ep->me_value);
Victor Stinner742da042016-09-07 17:40:12 -07002984 ep->me_key = NULL;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002985 ep->me_value = NULL;
Victor Stinner742da042016-09-07 17:40:12 -07002986 /* We can't dk_usable++ since there is DKIX_DUMMY in indices */
2987 mp->ma_keys->dk_nentries = i;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002988 mp->ma_used--;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07002989 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner611b0fa2016-09-14 15:02:01 +02002990 assert(_PyDict_CheckConsistency(mp));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002991 return res;
Guido van Rossumba6ab842000-12-12 22:02:18 +00002992}
2993
Jeremy Hylton8caad492000-06-23 14:18:11 +00002994static int
2995dict_traverse(PyObject *op, visitproc visit, void *arg)
2996{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002997 PyDictObject *mp = (PyDictObject *)op;
Benjamin Peterson55f44522016-09-05 12:12:59 -07002998 PyDictKeysObject *keys = mp->ma_keys;
Serhiy Storchaka46825d22016-09-26 21:29:34 +03002999 PyDictKeyEntry *entries = DK_ENTRIES(keys);
Victor Stinner742da042016-09-07 17:40:12 -07003000 Py_ssize_t i, n = keys->dk_nentries;
3001
Benjamin Peterson55f44522016-09-05 12:12:59 -07003002 if (keys->dk_lookup == lookdict) {
3003 for (i = 0; i < n; i++) {
3004 if (entries[i].me_value != NULL) {
3005 Py_VISIT(entries[i].me_value);
3006 Py_VISIT(entries[i].me_key);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003007 }
3008 }
Victor Stinner742da042016-09-07 17:40:12 -07003009 }
3010 else {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003011 if (mp->ma_values != NULL) {
Benjamin Peterson55f44522016-09-05 12:12:59 -07003012 for (i = 0; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003013 Py_VISIT(mp->ma_values[i]);
3014 }
3015 }
3016 else {
Benjamin Peterson55f44522016-09-05 12:12:59 -07003017 for (i = 0; i < n; i++) {
3018 Py_VISIT(entries[i].me_value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003019 }
3020 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003021 }
3022 return 0;
Jeremy Hylton8caad492000-06-23 14:18:11 +00003023}
3024
3025static int
3026dict_tp_clear(PyObject *op)
3027{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003028 PyDict_Clear(op);
3029 return 0;
Jeremy Hylton8caad492000-06-23 14:18:11 +00003030}
3031
Guido van Rossum8ce8a782007-11-01 19:42:39 +00003032static PyObject *dictiter_new(PyDictObject *, PyTypeObject *);
Guido van Rossum09e563a2001-05-01 12:10:21 +00003033
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02003034Py_ssize_t
Eric Snow96c6af92015-05-29 22:21:39 -06003035_PyDict_SizeOf(PyDictObject *mp)
Martin v. Löwis00709aa2008-06-04 14:18:43 +00003036{
Victor Stinner742da042016-09-07 17:40:12 -07003037 Py_ssize_t size, usable, res;
Martin v. Löwis00709aa2008-06-04 14:18:43 +00003038
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003039 size = DK_SIZE(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -07003040 usable = USABLE_FRACTION(size);
3041
Serhiy Storchaka5c4064e2015-12-19 20:05:25 +02003042 res = _PyObject_SIZE(Py_TYPE(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003043 if (mp->ma_values)
Victor Stinner742da042016-09-07 17:40:12 -07003044 res += usable * sizeof(PyObject*);
Martin v. Loewis4f2f3b62012-04-24 19:13:57 +02003045 /* If the dictionary is split, the keys portion is accounted-for
3046 in the type object. */
3047 if (mp->ma_keys->dk_refcnt == 1)
Victor Stinner98ee9d52016-09-08 09:33:56 -07003048 res += (sizeof(PyDictKeysObject)
3049 - Py_MEMBER_SIZE(PyDictKeysObject, dk_indices)
3050 + DK_IXSIZE(mp->ma_keys) * size
3051 + sizeof(PyDictKeyEntry) * usable);
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02003052 return res;
Martin v. Loewis4f2f3b62012-04-24 19:13:57 +02003053}
3054
3055Py_ssize_t
3056_PyDict_KeysSize(PyDictKeysObject *keys)
3057{
Victor Stinner98ee9d52016-09-08 09:33:56 -07003058 return (sizeof(PyDictKeysObject)
3059 - Py_MEMBER_SIZE(PyDictKeysObject, dk_indices)
3060 + DK_IXSIZE(keys) * DK_SIZE(keys)
3061 + USABLE_FRACTION(DK_SIZE(keys)) * sizeof(PyDictKeyEntry));
Martin v. Löwis00709aa2008-06-04 14:18:43 +00003062}
3063
doko@ubuntu.com17210f52016-01-14 14:04:59 +01003064static PyObject *
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02003065dict_sizeof(PyDictObject *mp)
3066{
3067 return PyLong_FromSsize_t(_PyDict_SizeOf(mp));
3068}
3069
Raymond Hettinger8f5cdaa2003-12-13 11:26:12 +00003070PyDoc_STRVAR(getitem__doc__, "x.__getitem__(y) <==> x[y]");
3071
Martin v. Löwis00709aa2008-06-04 14:18:43 +00003072PyDoc_STRVAR(sizeof__doc__,
3073"D.__sizeof__() -> size of D in memory, in bytes");
3074
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003075PyDoc_STRVAR(get__doc__,
Guido van Rossumefae8862002-09-04 11:29:45 +00003076"D.get(k[,d]) -> D[k] if k in D, else d. d defaults to None.");
Tim Petersf7f88b12000-12-13 23:18:45 +00003077
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003078PyDoc_STRVAR(setdefault_doc__,
Guido van Rossumefae8862002-09-04 11:29:45 +00003079"D.setdefault(k[,d]) -> D.get(k,d), also set D[k]=d if k not in D");
Tim Petersf7f88b12000-12-13 23:18:45 +00003080
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003081PyDoc_STRVAR(pop__doc__,
Benjamin Petersonf10a79a2008-10-11 00:49:57 +00003082"D.pop(k[,d]) -> v, remove specified key and return the corresponding value.\n\
Raymond Hettingera3e1e4c2003-03-06 23:54:28 +00003083If key is not found, d is returned if given, otherwise KeyError is raised");
Guido van Rossume027d982002-04-12 15:11:59 +00003084
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003085PyDoc_STRVAR(popitem__doc__,
Tim Petersf7f88b12000-12-13 23:18:45 +00003086"D.popitem() -> (k, v), remove and return some (key, value) pair as a\n\
Benjamin Petersonf10a79a2008-10-11 00:49:57 +000030872-tuple; but raise KeyError if D is empty.");
Tim Petersf7f88b12000-12-13 23:18:45 +00003088
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003089PyDoc_STRVAR(update__doc__,
Brett Cannonf2754162013-05-11 14:46:48 -04003090"D.update([E, ]**F) -> None. Update D from dict/iterable E and F.\n\
3091If E is present and has a .keys() method, then does: for k in E: D[k] = E[k]\n\
3092If E is present and lacks a .keys() method, then does: for k, v in E: D[k] = v\n\
3093In either case, this is followed by: for k in F: D[k] = F[k]");
Tim Petersf7f88b12000-12-13 23:18:45 +00003094
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003095PyDoc_STRVAR(clear__doc__,
3096"D.clear() -> None. Remove all items from D.");
Tim Petersf7f88b12000-12-13 23:18:45 +00003097
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003098PyDoc_STRVAR(copy__doc__,
3099"D.copy() -> a shallow copy of D");
Tim Petersf7f88b12000-12-13 23:18:45 +00003100
Guido van Rossumb90c8482007-02-10 01:11:45 +00003101/* Forward */
3102static PyObject *dictkeys_new(PyObject *);
3103static PyObject *dictitems_new(PyObject *);
3104static PyObject *dictvalues_new(PyObject *);
3105
Guido van Rossum45c85d12007-07-27 16:31:40 +00003106PyDoc_STRVAR(keys__doc__,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003107 "D.keys() -> a set-like object providing a view on D's keys");
Guido van Rossum45c85d12007-07-27 16:31:40 +00003108PyDoc_STRVAR(items__doc__,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003109 "D.items() -> a set-like object providing a view on D's items");
Guido van Rossum45c85d12007-07-27 16:31:40 +00003110PyDoc_STRVAR(values__doc__,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003111 "D.values() -> an object providing a view on D's values");
Guido van Rossumb90c8482007-02-10 01:11:45 +00003112
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003113static PyMethodDef mapp_methods[] = {
Larry Hastings31826802013-10-19 00:09:25 -07003114 DICT___CONTAINS___METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003115 {"__getitem__", (PyCFunction)dict_subscript, METH_O | METH_COEXIST,
3116 getitem__doc__},
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02003117 {"__sizeof__", (PyCFunction)dict_sizeof, METH_NOARGS,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003118 sizeof__doc__},
3119 {"get", (PyCFunction)dict_get, METH_VARARGS,
3120 get__doc__},
3121 {"setdefault", (PyCFunction)dict_setdefault, METH_VARARGS,
3122 setdefault_doc__},
3123 {"pop", (PyCFunction)dict_pop, METH_VARARGS,
3124 pop__doc__},
3125 {"popitem", (PyCFunction)dict_popitem, METH_NOARGS,
3126 popitem__doc__},
3127 {"keys", (PyCFunction)dictkeys_new, METH_NOARGS,
3128 keys__doc__},
3129 {"items", (PyCFunction)dictitems_new, METH_NOARGS,
3130 items__doc__},
3131 {"values", (PyCFunction)dictvalues_new, METH_NOARGS,
3132 values__doc__},
3133 {"update", (PyCFunction)dict_update, METH_VARARGS | METH_KEYWORDS,
3134 update__doc__},
Larry Hastings5c661892014-01-24 06:17:25 -08003135 DICT_FROMKEYS_METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003136 {"clear", (PyCFunction)dict_clear, METH_NOARGS,
3137 clear__doc__},
3138 {"copy", (PyCFunction)dict_copy, METH_NOARGS,
3139 copy__doc__},
3140 {NULL, NULL} /* sentinel */
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003141};
3142
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00003143/* Return 1 if `key` is in dict `op`, 0 if not, and -1 on error. */
Raymond Hettingerbc0f2ab2003-11-25 21:12:14 +00003144int
3145PyDict_Contains(PyObject *op, PyObject *key)
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003146{
Benjamin Peterson8f67d082010-10-17 20:54:53 +00003147 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07003148 Py_ssize_t ix;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003149 PyDictObject *mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09003150 PyObject *value;
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003151
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003152 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02003153 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003154 hash = PyObject_Hash(key);
3155 if (hash == -1)
3156 return -1;
3157 }
INADA Naokiba609772016-12-07 20:41:42 +09003158 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07003159 if (ix == DKIX_ERROR)
3160 return -1;
INADA Naokiba609772016-12-07 20:41:42 +09003161 return (ix != DKIX_EMPTY && value != NULL);
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003162}
3163
Thomas Wouterscf297e42007-02-23 15:07:44 +00003164/* Internal version of PyDict_Contains used when the hash value is already known */
3165int
Benjamin Peterson8f67d082010-10-17 20:54:53 +00003166_PyDict_Contains(PyObject *op, PyObject *key, Py_hash_t hash)
Thomas Wouterscf297e42007-02-23 15:07:44 +00003167{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003168 PyDictObject *mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09003169 PyObject *value;
Victor Stinner742da042016-09-07 17:40:12 -07003170 Py_ssize_t ix;
Thomas Wouterscf297e42007-02-23 15:07:44 +00003171
INADA Naokiba609772016-12-07 20:41:42 +09003172 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07003173 if (ix == DKIX_ERROR)
3174 return -1;
INADA Naokiba609772016-12-07 20:41:42 +09003175 return (ix != DKIX_EMPTY && value != NULL);
Thomas Wouterscf297e42007-02-23 15:07:44 +00003176}
3177
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003178/* Hack to implement "key in dict" */
3179static PySequenceMethods dict_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003180 0, /* sq_length */
3181 0, /* sq_concat */
3182 0, /* sq_repeat */
3183 0, /* sq_item */
3184 0, /* sq_slice */
3185 0, /* sq_ass_item */
3186 0, /* sq_ass_slice */
3187 PyDict_Contains, /* sq_contains */
3188 0, /* sq_inplace_concat */
3189 0, /* sq_inplace_repeat */
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003190};
3191
Guido van Rossum09e563a2001-05-01 12:10:21 +00003192static PyObject *
Tim Peters6d6c1a32001-08-02 04:15:00 +00003193dict_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
3194{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003195 PyObject *self;
Victor Stinnera9f61a52013-07-16 22:17:26 +02003196 PyDictObject *d;
Tim Peters6d6c1a32001-08-02 04:15:00 +00003197
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003198 assert(type != NULL && type->tp_alloc != NULL);
3199 self = type->tp_alloc(type, 0);
Victor Stinnera9f61a52013-07-16 22:17:26 +02003200 if (self == NULL)
3201 return NULL;
Victor Stinnera9f61a52013-07-16 22:17:26 +02003202 d = (PyDictObject *)self;
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02003203
Victor Stinnera9f61a52013-07-16 22:17:26 +02003204 /* The object has been implicitly tracked by tp_alloc */
3205 if (type == &PyDict_Type)
3206 _PyObject_GC_UNTRACK(d);
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02003207
3208 d->ma_used = 0;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07003209 d->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner742da042016-09-07 17:40:12 -07003210 d->ma_keys = new_keys_object(PyDict_MINSIZE);
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02003211 if (d->ma_keys == NULL) {
3212 Py_DECREF(self);
3213 return NULL;
3214 }
Victor Stinner611b0fa2016-09-14 15:02:01 +02003215 assert(_PyDict_CheckConsistency(d));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003216 return self;
Tim Peters6d6c1a32001-08-02 04:15:00 +00003217}
3218
Tim Peters25786c02001-09-02 08:22:48 +00003219static int
3220dict_init(PyObject *self, PyObject *args, PyObject *kwds)
3221{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003222 return dict_update_common(self, args, kwds, "dict");
Tim Peters25786c02001-09-02 08:22:48 +00003223}
3224
Tim Peters6d6c1a32001-08-02 04:15:00 +00003225static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00003226dict_iter(PyDictObject *dict)
Guido van Rossum09e563a2001-05-01 12:10:21 +00003227{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003228 return dictiter_new(dict, &PyDictIterKey_Type);
Guido van Rossum09e563a2001-05-01 12:10:21 +00003229}
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003230
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003231PyDoc_STRVAR(dictionary_doc,
Ezio Melotti7f807b72010-03-01 04:08:34 +00003232"dict() -> new empty dictionary\n"
Tim Petersa427a2b2001-10-29 22:25:45 +00003233"dict(mapping) -> new dictionary initialized from a mapping object's\n"
Ezio Melotti7f807b72010-03-01 04:08:34 +00003234" (key, value) pairs\n"
3235"dict(iterable) -> new dictionary initialized as if via:\n"
Tim Peters4d859532001-10-27 18:27:48 +00003236" d = {}\n"
Ezio Melotti7f807b72010-03-01 04:08:34 +00003237" for k, v in iterable:\n"
Just van Rossuma797d812002-11-23 09:45:04 +00003238" d[k] = v\n"
3239"dict(**kwargs) -> new dictionary initialized with the name=value pairs\n"
3240" in the keyword argument list. For example: dict(one=1, two=2)");
Tim Peters25786c02001-09-02 08:22:48 +00003241
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003242PyTypeObject PyDict_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003243 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3244 "dict",
3245 sizeof(PyDictObject),
3246 0,
3247 (destructor)dict_dealloc, /* tp_dealloc */
3248 0, /* tp_print */
3249 0, /* tp_getattr */
3250 0, /* tp_setattr */
3251 0, /* tp_reserved */
3252 (reprfunc)dict_repr, /* tp_repr */
3253 0, /* tp_as_number */
3254 &dict_as_sequence, /* tp_as_sequence */
3255 &dict_as_mapping, /* tp_as_mapping */
Georg Brandl00da4e02010-10-18 07:32:48 +00003256 PyObject_HashNotImplemented, /* tp_hash */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003257 0, /* tp_call */
3258 0, /* tp_str */
3259 PyObject_GenericGetAttr, /* tp_getattro */
3260 0, /* tp_setattro */
3261 0, /* tp_as_buffer */
3262 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
3263 Py_TPFLAGS_BASETYPE | Py_TPFLAGS_DICT_SUBCLASS, /* tp_flags */
3264 dictionary_doc, /* tp_doc */
3265 dict_traverse, /* tp_traverse */
3266 dict_tp_clear, /* tp_clear */
3267 dict_richcompare, /* tp_richcompare */
3268 0, /* tp_weaklistoffset */
3269 (getiterfunc)dict_iter, /* tp_iter */
3270 0, /* tp_iternext */
3271 mapp_methods, /* tp_methods */
3272 0, /* tp_members */
3273 0, /* tp_getset */
3274 0, /* tp_base */
3275 0, /* tp_dict */
3276 0, /* tp_descr_get */
3277 0, /* tp_descr_set */
3278 0, /* tp_dictoffset */
3279 dict_init, /* tp_init */
3280 PyType_GenericAlloc, /* tp_alloc */
3281 dict_new, /* tp_new */
3282 PyObject_GC_Del, /* tp_free */
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003283};
3284
Victor Stinner3c1e4812012-03-26 22:10:51 +02003285PyObject *
3286_PyDict_GetItemId(PyObject *dp, struct _Py_Identifier *key)
3287{
3288 PyObject *kv;
3289 kv = _PyUnicode_FromId(key); /* borrowed */
Victor Stinner5b3b1002013-07-22 23:50:57 +02003290 if (kv == NULL) {
3291 PyErr_Clear();
Victor Stinner3c1e4812012-03-26 22:10:51 +02003292 return NULL;
Victor Stinner5b3b1002013-07-22 23:50:57 +02003293 }
Victor Stinner3c1e4812012-03-26 22:10:51 +02003294 return PyDict_GetItem(dp, kv);
3295}
3296
Guido van Rossum3cca2451997-05-16 14:23:33 +00003297/* For backward compatibility with old dictionary interface */
3298
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003299PyObject *
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +00003300PyDict_GetItemString(PyObject *v, const char *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003301{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003302 PyObject *kv, *rv;
3303 kv = PyUnicode_FromString(key);
Victor Stinnerfdcbab92013-07-16 22:16:05 +02003304 if (kv == NULL) {
3305 PyErr_Clear();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003306 return NULL;
Victor Stinnerfdcbab92013-07-16 22:16:05 +02003307 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003308 rv = PyDict_GetItem(v, kv);
3309 Py_DECREF(kv);
3310 return rv;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003311}
3312
3313int
Victor Stinner3c1e4812012-03-26 22:10:51 +02003314_PyDict_SetItemId(PyObject *v, struct _Py_Identifier *key, PyObject *item)
3315{
3316 PyObject *kv;
3317 kv = _PyUnicode_FromId(key); /* borrowed */
3318 if (kv == NULL)
3319 return -1;
3320 return PyDict_SetItem(v, kv, item);
3321}
3322
3323int
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +00003324PyDict_SetItemString(PyObject *v, const char *key, PyObject *item)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003325{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003326 PyObject *kv;
3327 int err;
3328 kv = PyUnicode_FromString(key);
3329 if (kv == NULL)
3330 return -1;
3331 PyUnicode_InternInPlace(&kv); /* XXX Should we really? */
3332 err = PyDict_SetItem(v, kv, item);
3333 Py_DECREF(kv);
3334 return err;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003335}
3336
3337int
Victor Stinner5fd2e5a2013-11-06 18:58:22 +01003338_PyDict_DelItemId(PyObject *v, _Py_Identifier *key)
3339{
3340 PyObject *kv = _PyUnicode_FromId(key); /* borrowed */
3341 if (kv == NULL)
3342 return -1;
3343 return PyDict_DelItem(v, kv);
3344}
3345
3346int
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +00003347PyDict_DelItemString(PyObject *v, const char *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003348{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003349 PyObject *kv;
3350 int err;
3351 kv = PyUnicode_FromString(key);
3352 if (kv == NULL)
3353 return -1;
3354 err = PyDict_DelItem(v, kv);
3355 Py_DECREF(kv);
3356 return err;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003357}
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003358
Raymond Hettinger019a1482004-03-18 02:41:19 +00003359/* Dictionary iterator types */
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003360
/* State shared by the key, value and item iterators over a dict. */
typedef struct {
    PyObject_HEAD
    PyDictObject *di_dict; /* Set to NULL when iterator is exhausted */
    /* Copy of the dict's ma_used taken at creation; set to -1 once a size
       change has been detected so that the error state is sticky. */
    Py_ssize_t di_used;
    /* Index of the next entry to examine (starts at 0). */
    Py_ssize_t di_pos;
    PyObject* di_result; /* reusable result tuple for iteritems */
    /* Starts at the dict's ma_used and is decremented for every element
       handed out; reported by __length_hint__. */
    Py_ssize_t len;
} dictiterobject;
3369
3370static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00003371dictiter_new(PyDictObject *dict, PyTypeObject *itertype)
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003372{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003373 dictiterobject *di;
3374 di = PyObject_GC_New(dictiterobject, itertype);
3375 if (di == NULL)
3376 return NULL;
3377 Py_INCREF(dict);
3378 di->di_dict = dict;
3379 di->di_used = dict->ma_used;
3380 di->di_pos = 0;
3381 di->len = dict->ma_used;
3382 if (itertype == &PyDictIterItem_Type) {
3383 di->di_result = PyTuple_Pack(2, Py_None, Py_None);
3384 if (di->di_result == NULL) {
3385 Py_DECREF(di);
3386 return NULL;
3387 }
3388 }
3389 else
3390 di->di_result = NULL;
3391 _PyObject_GC_TRACK(di);
3392 return (PyObject *)di;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003393}
3394
3395static void
3396dictiter_dealloc(dictiterobject *di)
3397{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003398 Py_XDECREF(di->di_dict);
3399 Py_XDECREF(di->di_result);
3400 PyObject_GC_Del(di);
Antoine Pitrou7ddda782009-01-01 15:35:33 +00003401}
3402
3403static int
3404dictiter_traverse(dictiterobject *di, visitproc visit, void *arg)
3405{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003406 Py_VISIT(di->di_dict);
3407 Py_VISIT(di->di_result);
3408 return 0;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003409}
3410
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00003411static PyObject *
Raymond Hettinger0ce6dc82004-03-18 08:38:00 +00003412dictiter_len(dictiterobject *di)
3413{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003414 Py_ssize_t len = 0;
3415 if (di->di_dict != NULL && di->di_used == di->di_dict->ma_used)
3416 len = di->len;
3417 return PyLong_FromSize_t(len);
Raymond Hettinger0ce6dc82004-03-18 08:38:00 +00003418}
3419
/* Docstring for the iterators' __length_hint__ method. */
PyDoc_STRVAR(length_hint_doc,
             "Private method returning an estimate of len(list(it)).");

/* Forward declaration: dictiter_reduce() is defined further down in this
   file but is referenced by the method table below. */
static PyObject *
dictiter_reduce(dictiterobject *di);

/* Docstring for the iterators' __reduce__ method. */
PyDoc_STRVAR(reduce_doc, "Return state information for pickling.");

/* Method table shared by the key, value and item iterator types. */
static PyMethodDef dictiter_methods[] = {
    {"__length_hint__", (PyCFunction)dictiter_len, METH_NOARGS,
     length_hint_doc},
     {"__reduce__", (PyCFunction)dictiter_reduce, METH_NOARGS,
     reduce_doc},
    {NULL,              NULL}           /* sentinel */
};
3435
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003436static PyObject*
3437dictiter_iternextkey(dictiterobject *di)
Guido van Rossum213c7a62001-04-23 14:08:49 +00003438{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003439 PyObject *key;
INADA Naokica2d8be2016-11-04 16:59:10 +09003440 Py_ssize_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02003441 PyDictKeysObject *k;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003442 PyDictObject *d = di->di_dict;
Guido van Rossum213c7a62001-04-23 14:08:49 +00003443
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003444 if (d == NULL)
3445 return NULL;
3446 assert (PyDict_Check(d));
Guido van Rossum2147df72002-07-16 20:30:22 +00003447
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003448 if (di->di_used != d->ma_used) {
3449 PyErr_SetString(PyExc_RuntimeError,
3450 "dictionary changed size during iteration");
3451 di->di_used = -1; /* Make this state sticky */
3452 return NULL;
3453 }
Guido van Rossum2147df72002-07-16 20:30:22 +00003454
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003455 i = di->di_pos;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003456 k = d->ma_keys;
INADA Naokica2d8be2016-11-04 16:59:10 +09003457 assert(i >= 0);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003458 if (d->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09003459 if (i >= d->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003460 goto fail;
3461 key = DK_ENTRIES(k)[i].me_key;
INADA Naokica2d8be2016-11-04 16:59:10 +09003462 assert(d->ma_values[i] != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003463 }
3464 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09003465 Py_ssize_t n = k->dk_nentries;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003466 PyDictKeyEntry *entry_ptr = &DK_ENTRIES(k)[i];
3467 while (i < n && entry_ptr->me_value == NULL) {
3468 entry_ptr++;
3469 i++;
3470 }
3471 if (i >= n)
3472 goto fail;
3473 key = entry_ptr->me_key;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003474 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003475 di->di_pos = i+1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003476 di->len--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003477 Py_INCREF(key);
3478 return key;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003479
3480fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003481 di->di_dict = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003482 Py_DECREF(d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003483 return NULL;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003484}
3485
Raymond Hettinger019a1482004-03-18 02:41:19 +00003486PyTypeObject PyDictIterKey_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003487 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3488 "dict_keyiterator", /* tp_name */
3489 sizeof(dictiterobject), /* tp_basicsize */
3490 0, /* tp_itemsize */
3491 /* methods */
3492 (destructor)dictiter_dealloc, /* tp_dealloc */
3493 0, /* tp_print */
3494 0, /* tp_getattr */
3495 0, /* tp_setattr */
3496 0, /* tp_reserved */
3497 0, /* tp_repr */
3498 0, /* tp_as_number */
3499 0, /* tp_as_sequence */
3500 0, /* tp_as_mapping */
3501 0, /* tp_hash */
3502 0, /* tp_call */
3503 0, /* tp_str */
3504 PyObject_GenericGetAttr, /* tp_getattro */
3505 0, /* tp_setattro */
3506 0, /* tp_as_buffer */
3507 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3508 0, /* tp_doc */
3509 (traverseproc)dictiter_traverse, /* tp_traverse */
3510 0, /* tp_clear */
3511 0, /* tp_richcompare */
3512 0, /* tp_weaklistoffset */
3513 PyObject_SelfIter, /* tp_iter */
3514 (iternextfunc)dictiter_iternextkey, /* tp_iternext */
3515 dictiter_methods, /* tp_methods */
3516 0,
Raymond Hettinger019a1482004-03-18 02:41:19 +00003517};
3518
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003519static PyObject *
3520dictiter_iternextvalue(dictiterobject *di)
Raymond Hettinger019a1482004-03-18 02:41:19 +00003521{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003522 PyObject *value;
INADA Naokica2d8be2016-11-04 16:59:10 +09003523 Py_ssize_t i;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003524 PyDictObject *d = di->di_dict;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003525
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003526 if (d == NULL)
3527 return NULL;
3528 assert (PyDict_Check(d));
Raymond Hettinger019a1482004-03-18 02:41:19 +00003529
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003530 if (di->di_used != d->ma_used) {
3531 PyErr_SetString(PyExc_RuntimeError,
3532 "dictionary changed size during iteration");
3533 di->di_used = -1; /* Make this state sticky */
3534 return NULL;
3535 }
Raymond Hettinger019a1482004-03-18 02:41:19 +00003536
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003537 i = di->di_pos;
INADA Naokica2d8be2016-11-04 16:59:10 +09003538 assert(i >= 0);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003539 if (d->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09003540 if (i >= d->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003541 goto fail;
INADA Naokica2d8be2016-11-04 16:59:10 +09003542 value = d->ma_values[i];
3543 assert(value != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003544 }
3545 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09003546 Py_ssize_t n = d->ma_keys->dk_nentries;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003547 PyDictKeyEntry *entry_ptr = &DK_ENTRIES(d->ma_keys)[i];
3548 while (i < n && entry_ptr->me_value == NULL) {
3549 entry_ptr++;
3550 i++;
3551 }
3552 if (i >= n)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003553 goto fail;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003554 value = entry_ptr->me_value;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003555 }
3556 di->di_pos = i+1;
3557 di->len--;
3558 Py_INCREF(value);
3559 return value;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003560
3561fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003562 di->di_dict = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003563 Py_DECREF(d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003564 return NULL;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003565}
3566
3567PyTypeObject PyDictIterValue_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003568 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3569 "dict_valueiterator", /* tp_name */
3570 sizeof(dictiterobject), /* tp_basicsize */
3571 0, /* tp_itemsize */
3572 /* methods */
3573 (destructor)dictiter_dealloc, /* tp_dealloc */
3574 0, /* tp_print */
3575 0, /* tp_getattr */
3576 0, /* tp_setattr */
3577 0, /* tp_reserved */
3578 0, /* tp_repr */
3579 0, /* tp_as_number */
3580 0, /* tp_as_sequence */
3581 0, /* tp_as_mapping */
3582 0, /* tp_hash */
3583 0, /* tp_call */
3584 0, /* tp_str */
3585 PyObject_GenericGetAttr, /* tp_getattro */
3586 0, /* tp_setattro */
3587 0, /* tp_as_buffer */
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003588 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC, /* tp_flags */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003589 0, /* tp_doc */
3590 (traverseproc)dictiter_traverse, /* tp_traverse */
3591 0, /* tp_clear */
3592 0, /* tp_richcompare */
3593 0, /* tp_weaklistoffset */
3594 PyObject_SelfIter, /* tp_iter */
3595 (iternextfunc)dictiter_iternextvalue, /* tp_iternext */
3596 dictiter_methods, /* tp_methods */
3597 0,
Raymond Hettinger019a1482004-03-18 02:41:19 +00003598};
3599
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003600static PyObject *
3601dictiter_iternextitem(dictiterobject *di)
Raymond Hettinger019a1482004-03-18 02:41:19 +00003602{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003603 PyObject *key, *value, *result = di->di_result;
INADA Naokica2d8be2016-11-04 16:59:10 +09003604 Py_ssize_t i;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003605 PyDictObject *d = di->di_dict;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003606
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003607 if (d == NULL)
3608 return NULL;
3609 assert (PyDict_Check(d));
Raymond Hettinger019a1482004-03-18 02:41:19 +00003610
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003611 if (di->di_used != d->ma_used) {
3612 PyErr_SetString(PyExc_RuntimeError,
3613 "dictionary changed size during iteration");
3614 di->di_used = -1; /* Make this state sticky */
3615 return NULL;
3616 }
Raymond Hettinger019a1482004-03-18 02:41:19 +00003617
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003618 i = di->di_pos;
INADA Naokica2d8be2016-11-04 16:59:10 +09003619 assert(i >= 0);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003620 if (d->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09003621 if (i >= d->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003622 goto fail;
3623 key = DK_ENTRIES(d->ma_keys)[i].me_key;
INADA Naokica2d8be2016-11-04 16:59:10 +09003624 value = d->ma_values[i];
3625 assert(value != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003626 }
3627 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09003628 Py_ssize_t n = d->ma_keys->dk_nentries;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003629 PyDictKeyEntry *entry_ptr = &DK_ENTRIES(d->ma_keys)[i];
3630 while (i < n && entry_ptr->me_value == NULL) {
3631 entry_ptr++;
3632 i++;
3633 }
3634 if (i >= n)
3635 goto fail;
3636 key = entry_ptr->me_key;
3637 value = entry_ptr->me_value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003638 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003639 di->di_pos = i+1;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003640 di->len--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003641 if (result->ob_refcnt == 1) {
3642 Py_INCREF(result);
3643 Py_DECREF(PyTuple_GET_ITEM(result, 0));
3644 Py_DECREF(PyTuple_GET_ITEM(result, 1));
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003645 }
3646 else {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003647 result = PyTuple_New(2);
3648 if (result == NULL)
3649 return NULL;
3650 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003651 Py_INCREF(key);
3652 Py_INCREF(value);
Eric Snow96c6af92015-05-29 22:21:39 -06003653 PyTuple_SET_ITEM(result, 0, key); /* steals reference */
3654 PyTuple_SET_ITEM(result, 1, value); /* steals reference */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003655 return result;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003656
3657fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003658 di->di_dict = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003659 Py_DECREF(d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003660 return NULL;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003661}
3662
3663PyTypeObject PyDictIterItem_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003664 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3665 "dict_itemiterator", /* tp_name */
3666 sizeof(dictiterobject), /* tp_basicsize */
3667 0, /* tp_itemsize */
3668 /* methods */
3669 (destructor)dictiter_dealloc, /* tp_dealloc */
3670 0, /* tp_print */
3671 0, /* tp_getattr */
3672 0, /* tp_setattr */
3673 0, /* tp_reserved */
3674 0, /* tp_repr */
3675 0, /* tp_as_number */
3676 0, /* tp_as_sequence */
3677 0, /* tp_as_mapping */
3678 0, /* tp_hash */
3679 0, /* tp_call */
3680 0, /* tp_str */
3681 PyObject_GenericGetAttr, /* tp_getattro */
3682 0, /* tp_setattro */
3683 0, /* tp_as_buffer */
3684 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3685 0, /* tp_doc */
3686 (traverseproc)dictiter_traverse, /* tp_traverse */
3687 0, /* tp_clear */
3688 0, /* tp_richcompare */
3689 0, /* tp_weaklistoffset */
3690 PyObject_SelfIter, /* tp_iter */
3691 (iternextfunc)dictiter_iternextitem, /* tp_iternext */
3692 dictiter_methods, /* tp_methods */
3693 0,
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003694};
Guido van Rossumb90c8482007-02-10 01:11:45 +00003695
3696
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003697static PyObject *
3698dictiter_reduce(dictiterobject *di)
3699{
3700 PyObject *list;
3701 dictiterobject tmp;
3702
3703 list = PyList_New(0);
3704 if (!list)
3705 return NULL;
3706
3707 /* copy the itertor state */
3708 tmp = *di;
3709 Py_XINCREF(tmp.di_dict);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003710
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003711 /* iterate the temporary into a list */
3712 for(;;) {
3713 PyObject *element = 0;
3714 if (Py_TYPE(di) == &PyDictIterItem_Type)
3715 element = dictiter_iternextitem(&tmp);
3716 else if (Py_TYPE(di) == &PyDictIterKey_Type)
3717 element = dictiter_iternextkey(&tmp);
3718 else if (Py_TYPE(di) == &PyDictIterValue_Type)
3719 element = dictiter_iternextvalue(&tmp);
3720 else
3721 assert(0);
3722 if (element) {
3723 if (PyList_Append(list, element)) {
3724 Py_DECREF(element);
3725 Py_DECREF(list);
3726 Py_XDECREF(tmp.di_dict);
3727 return NULL;
3728 }
3729 Py_DECREF(element);
3730 } else
3731 break;
3732 }
3733 Py_XDECREF(tmp.di_dict);
3734 /* check for error */
3735 if (tmp.di_dict != NULL) {
3736 /* we have an error */
3737 Py_DECREF(list);
3738 return NULL;
3739 }
Antoine Pitroua7013882012-04-05 00:04:20 +02003740 return Py_BuildValue("N(N)", _PyObject_GetBuiltin("iter"), list);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003741}
3742
Guido van Rossum3ac67412007-02-10 18:55:06 +00003743/***********************************************/
Guido van Rossumb90c8482007-02-10 01:11:45 +00003744/* View objects for keys(), items(), values(). */
Guido van Rossum3ac67412007-02-10 18:55:06 +00003745/***********************************************/
3746
Guido van Rossumb90c8482007-02-10 01:11:45 +00003747/* The instance lay-out is the same for all three; but the type differs. */
3748
Guido van Rossumb90c8482007-02-10 01:11:45 +00003749static void
Eric Snow96c6af92015-05-29 22:21:39 -06003750dictview_dealloc(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003751{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003752 Py_XDECREF(dv->dv_dict);
3753 PyObject_GC_Del(dv);
Antoine Pitrou7ddda782009-01-01 15:35:33 +00003754}
3755
3756static int
Eric Snow96c6af92015-05-29 22:21:39 -06003757dictview_traverse(_PyDictViewObject *dv, visitproc visit, void *arg)
Antoine Pitrou7ddda782009-01-01 15:35:33 +00003758{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003759 Py_VISIT(dv->dv_dict);
3760 return 0;
Guido van Rossumb90c8482007-02-10 01:11:45 +00003761}
3762
Guido van Rossum83825ac2007-02-10 04:54:19 +00003763static Py_ssize_t
Eric Snow96c6af92015-05-29 22:21:39 -06003764dictview_len(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003765{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003766 Py_ssize_t len = 0;
3767 if (dv->dv_dict != NULL)
3768 len = dv->dv_dict->ma_used;
3769 return len;
Guido van Rossumb90c8482007-02-10 01:11:45 +00003770}
3771
Eric Snow96c6af92015-05-29 22:21:39 -06003772PyObject *
3773_PyDictView_New(PyObject *dict, PyTypeObject *type)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003774{
Eric Snow96c6af92015-05-29 22:21:39 -06003775 _PyDictViewObject *dv;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003776 if (dict == NULL) {
3777 PyErr_BadInternalCall();
3778 return NULL;
3779 }
3780 if (!PyDict_Check(dict)) {
3781 /* XXX Get rid of this restriction later */
3782 PyErr_Format(PyExc_TypeError,
3783 "%s() requires a dict argument, not '%s'",
3784 type->tp_name, dict->ob_type->tp_name);
3785 return NULL;
3786 }
Eric Snow96c6af92015-05-29 22:21:39 -06003787 dv = PyObject_GC_New(_PyDictViewObject, type);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003788 if (dv == NULL)
3789 return NULL;
3790 Py_INCREF(dict);
3791 dv->dv_dict = (PyDictObject *)dict;
3792 _PyObject_GC_TRACK(dv);
3793 return (PyObject *)dv;
Guido van Rossumb90c8482007-02-10 01:11:45 +00003794}
3795
/* TODO(guido): The view objects are not complete:
3797
3798 * support more set operations
3799 * support arbitrary mappings?
3800 - either these should be static or exported in dictobject.h
3801 - if public then they should probably be in builtins
3802*/
3803
Guido van Rossumaac530c2007-08-24 22:33:45 +00003804/* Return 1 if self is a subset of other, iterating over self;
3805 0 if not; -1 if an error occurred. */
Guido van Rossumd9214d12007-02-12 02:23:40 +00003806static int
3807all_contained_in(PyObject *self, PyObject *other)
3808{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003809 PyObject *iter = PyObject_GetIter(self);
3810 int ok = 1;
Guido van Rossumd9214d12007-02-12 02:23:40 +00003811
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003812 if (iter == NULL)
3813 return -1;
3814 for (;;) {
3815 PyObject *next = PyIter_Next(iter);
3816 if (next == NULL) {
3817 if (PyErr_Occurred())
3818 ok = -1;
3819 break;
3820 }
3821 ok = PySequence_Contains(other, next);
3822 Py_DECREF(next);
3823 if (ok <= 0)
3824 break;
3825 }
3826 Py_DECREF(iter);
3827 return ok;
Guido van Rossumd9214d12007-02-12 02:23:40 +00003828}
3829
3830static PyObject *
3831dictview_richcompare(PyObject *self, PyObject *other, int op)
3832{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003833 Py_ssize_t len_self, len_other;
3834 int ok;
3835 PyObject *result;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003836
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003837 assert(self != NULL);
3838 assert(PyDictViewSet_Check(self));
3839 assert(other != NULL);
Guido van Rossumd9214d12007-02-12 02:23:40 +00003840
Brian Curtindfc80e32011-08-10 20:28:54 -05003841 if (!PyAnySet_Check(other) && !PyDictViewSet_Check(other))
3842 Py_RETURN_NOTIMPLEMENTED;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003843
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003844 len_self = PyObject_Size(self);
3845 if (len_self < 0)
3846 return NULL;
3847 len_other = PyObject_Size(other);
3848 if (len_other < 0)
3849 return NULL;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003850
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003851 ok = 0;
3852 switch(op) {
Guido van Rossumaac530c2007-08-24 22:33:45 +00003853
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003854 case Py_NE:
3855 case Py_EQ:
3856 if (len_self == len_other)
3857 ok = all_contained_in(self, other);
3858 if (op == Py_NE && ok >= 0)
3859 ok = !ok;
3860 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003861
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003862 case Py_LT:
3863 if (len_self < len_other)
3864 ok = all_contained_in(self, other);
3865 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003866
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003867 case Py_LE:
3868 if (len_self <= len_other)
3869 ok = all_contained_in(self, other);
3870 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003871
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003872 case Py_GT:
3873 if (len_self > len_other)
3874 ok = all_contained_in(other, self);
3875 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003876
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003877 case Py_GE:
3878 if (len_self >= len_other)
3879 ok = all_contained_in(other, self);
3880 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003881
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003882 }
3883 if (ok < 0)
3884 return NULL;
3885 result = ok ? Py_True : Py_False;
3886 Py_INCREF(result);
3887 return result;
Guido van Rossumd9214d12007-02-12 02:23:40 +00003888}
3889
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003890static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06003891dictview_repr(_PyDictViewObject *dv)
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003892{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003893 PyObject *seq;
3894 PyObject *result;
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003895
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003896 seq = PySequence_List((PyObject *)dv);
3897 if (seq == NULL)
3898 return NULL;
3899
3900 result = PyUnicode_FromFormat("%s(%R)", Py_TYPE(dv)->tp_name, seq);
3901 Py_DECREF(seq);
3902 return result;
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003903}
3904
Guido van Rossum3ac67412007-02-10 18:55:06 +00003905/*** dict_keys ***/
Guido van Rossumb90c8482007-02-10 01:11:45 +00003906
3907static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06003908dictkeys_iter(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003909{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003910 if (dv->dv_dict == NULL) {
3911 Py_RETURN_NONE;
3912 }
3913 return dictiter_new(dv->dv_dict, &PyDictIterKey_Type);
Guido van Rossum3ac67412007-02-10 18:55:06 +00003914}
3915
3916static int
Eric Snow96c6af92015-05-29 22:21:39 -06003917dictkeys_contains(_PyDictViewObject *dv, PyObject *obj)
Guido van Rossum3ac67412007-02-10 18:55:06 +00003918{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003919 if (dv->dv_dict == NULL)
3920 return 0;
3921 return PyDict_Contains((PyObject *)dv->dv_dict, obj);
Guido van Rossumb90c8482007-02-10 01:11:45 +00003922}
3923
Guido van Rossum83825ac2007-02-10 04:54:19 +00003924static PySequenceMethods dictkeys_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003925 (lenfunc)dictview_len, /* sq_length */
3926 0, /* sq_concat */
3927 0, /* sq_repeat */
3928 0, /* sq_item */
3929 0, /* sq_slice */
3930 0, /* sq_ass_item */
3931 0, /* sq_ass_slice */
3932 (objobjproc)dictkeys_contains, /* sq_contains */
Guido van Rossum83825ac2007-02-10 04:54:19 +00003933};
3934
Guido van Rossum523259b2007-08-24 23:41:22 +00003935static PyObject*
3936dictviews_sub(PyObject* self, PyObject *other)
3937{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003938 PyObject *result = PySet_New(self);
3939 PyObject *tmp;
Martin v. Löwisbd928fe2011-10-14 10:20:37 +02003940 _Py_IDENTIFIER(difference_update);
Martin v. Löwisafe55bb2011-10-09 10:38:36 +02003941
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003942 if (result == NULL)
3943 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003944
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003945 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_difference_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003946 if (tmp == NULL) {
3947 Py_DECREF(result);
3948 return NULL;
3949 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003950
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003951 Py_DECREF(tmp);
3952 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003953}
3954
Benjamin Peterson025e9eb2015-05-05 20:16:41 -04003955PyObject*
3956_PyDictView_Intersect(PyObject* self, PyObject *other)
Guido van Rossum523259b2007-08-24 23:41:22 +00003957{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003958 PyObject *result = PySet_New(self);
3959 PyObject *tmp;
Martin v. Löwisbd928fe2011-10-14 10:20:37 +02003960 _Py_IDENTIFIER(intersection_update);
Martin v. Löwisafe55bb2011-10-09 10:38:36 +02003961
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003962 if (result == NULL)
3963 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003964
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003965 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_intersection_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003966 if (tmp == NULL) {
3967 Py_DECREF(result);
3968 return NULL;
3969 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003970
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003971 Py_DECREF(tmp);
3972 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003973}
3974
3975static PyObject*
3976dictviews_or(PyObject* self, PyObject *other)
3977{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003978 PyObject *result = PySet_New(self);
3979 PyObject *tmp;
Martin v. Löwis1c67dd92011-10-14 15:16:45 +02003980 _Py_IDENTIFIER(update);
Victor Stinnerd1a9cc22011-10-13 22:51:17 +02003981
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003982 if (result == NULL)
3983 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003984
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003985 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003986 if (tmp == NULL) {
3987 Py_DECREF(result);
3988 return NULL;
3989 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003990
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003991 Py_DECREF(tmp);
3992 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003993}
3994
3995static PyObject*
3996dictviews_xor(PyObject* self, PyObject *other)
3997{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003998 PyObject *result = PySet_New(self);
3999 PyObject *tmp;
Martin v. Löwisbd928fe2011-10-14 10:20:37 +02004000 _Py_IDENTIFIER(symmetric_difference_update);
Martin v. Löwisafe55bb2011-10-09 10:38:36 +02004001
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004002 if (result == NULL)
4003 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00004004
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08004005 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_symmetric_difference_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004006 if (tmp == NULL) {
4007 Py_DECREF(result);
4008 return NULL;
4009 }
Guido van Rossum523259b2007-08-24 23:41:22 +00004010
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004011 Py_DECREF(tmp);
4012 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00004013}
4014
4015static PyNumberMethods dictviews_as_number = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004016 0, /*nb_add*/
4017 (binaryfunc)dictviews_sub, /*nb_subtract*/
4018 0, /*nb_multiply*/
4019 0, /*nb_remainder*/
4020 0, /*nb_divmod*/
4021 0, /*nb_power*/
4022 0, /*nb_negative*/
4023 0, /*nb_positive*/
4024 0, /*nb_absolute*/
4025 0, /*nb_bool*/
4026 0, /*nb_invert*/
4027 0, /*nb_lshift*/
4028 0, /*nb_rshift*/
Benjamin Peterson025e9eb2015-05-05 20:16:41 -04004029 (binaryfunc)_PyDictView_Intersect, /*nb_and*/
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004030 (binaryfunc)dictviews_xor, /*nb_xor*/
4031 (binaryfunc)dictviews_or, /*nb_or*/
Guido van Rossum523259b2007-08-24 23:41:22 +00004032};
4033
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004034static PyObject*
4035dictviews_isdisjoint(PyObject *self, PyObject *other)
4036{
4037 PyObject *it;
4038 PyObject *item = NULL;
4039
4040 if (self == other) {
Eric Snow96c6af92015-05-29 22:21:39 -06004041 if (dictview_len((_PyDictViewObject *)self) == 0)
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004042 Py_RETURN_TRUE;
4043 else
4044 Py_RETURN_FALSE;
4045 }
4046
4047 /* Iterate over the shorter object (only if other is a set,
4048 * because PySequence_Contains may be expensive otherwise): */
4049 if (PyAnySet_Check(other) || PyDictViewSet_Check(other)) {
Eric Snow96c6af92015-05-29 22:21:39 -06004050 Py_ssize_t len_self = dictview_len((_PyDictViewObject *)self);
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004051 Py_ssize_t len_other = PyObject_Size(other);
4052 if (len_other == -1)
4053 return NULL;
4054
4055 if ((len_other > len_self)) {
4056 PyObject *tmp = other;
4057 other = self;
4058 self = tmp;
4059 }
4060 }
4061
4062 it = PyObject_GetIter(other);
4063 if (it == NULL)
4064 return NULL;
4065
4066 while ((item = PyIter_Next(it)) != NULL) {
4067 int contains = PySequence_Contains(self, item);
4068 Py_DECREF(item);
4069 if (contains == -1) {
4070 Py_DECREF(it);
4071 return NULL;
4072 }
4073
4074 if (contains) {
4075 Py_DECREF(it);
4076 Py_RETURN_FALSE;
4077 }
4078 }
4079 Py_DECREF(it);
4080 if (PyErr_Occurred())
4081 return NULL; /* PyIter_Next raised an exception. */
4082 Py_RETURN_TRUE;
4083}
4084
/* Docstring for the views' isdisjoint() method. */
PyDoc_STRVAR(isdisjoint_doc,
"Return True if the view and the given iterable have a null intersection.");

/* Method table for dict_keys: isdisjoint() takes exactly one argument
   (METH_O). */
static PyMethodDef dictkeys_methods[] = {
    {"isdisjoint",      (PyCFunction)dictviews_isdisjoint,  METH_O,
     isdisjoint_doc},
    {NULL,              NULL}           /* sentinel */
};
4093
4094PyTypeObject PyDictKeys_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004095 PyVarObject_HEAD_INIT(&PyType_Type, 0)
4096 "dict_keys", /* tp_name */
Eric Snow96c6af92015-05-29 22:21:39 -06004097 sizeof(_PyDictViewObject), /* tp_basicsize */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004098 0, /* tp_itemsize */
4099 /* methods */
4100 (destructor)dictview_dealloc, /* tp_dealloc */
4101 0, /* tp_print */
4102 0, /* tp_getattr */
4103 0, /* tp_setattr */
4104 0, /* tp_reserved */
4105 (reprfunc)dictview_repr, /* tp_repr */
4106 &dictviews_as_number, /* tp_as_number */
4107 &dictkeys_as_sequence, /* tp_as_sequence */
4108 0, /* tp_as_mapping */
4109 0, /* tp_hash */
4110 0, /* tp_call */
4111 0, /* tp_str */
4112 PyObject_GenericGetAttr, /* tp_getattro */
4113 0, /* tp_setattro */
4114 0, /* tp_as_buffer */
4115 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4116 0, /* tp_doc */
4117 (traverseproc)dictview_traverse, /* tp_traverse */
4118 0, /* tp_clear */
4119 dictview_richcompare, /* tp_richcompare */
4120 0, /* tp_weaklistoffset */
4121 (getiterfunc)dictkeys_iter, /* tp_iter */
4122 0, /* tp_iternext */
4123 dictkeys_methods, /* tp_methods */
4124 0,
Guido van Rossumb90c8482007-02-10 01:11:45 +00004125};
4126
4127static PyObject *
4128dictkeys_new(PyObject *dict)
4129{
Eric Snow96c6af92015-05-29 22:21:39 -06004130 return _PyDictView_New(dict, &PyDictKeys_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004131}
4132
Guido van Rossum3ac67412007-02-10 18:55:06 +00004133/*** dict_items ***/
Guido van Rossumb90c8482007-02-10 01:11:45 +00004134
4135static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06004136dictitems_iter(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00004137{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004138 if (dv->dv_dict == NULL) {
4139 Py_RETURN_NONE;
4140 }
4141 return dictiter_new(dv->dv_dict, &PyDictIterItem_Type);
Guido van Rossum3ac67412007-02-10 18:55:06 +00004142}
4143
4144static int
Eric Snow96c6af92015-05-29 22:21:39 -06004145dictitems_contains(_PyDictViewObject *dv, PyObject *obj)
Guido van Rossum3ac67412007-02-10 18:55:06 +00004146{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004147 PyObject *key, *value, *found;
4148 if (dv->dv_dict == NULL)
4149 return 0;
4150 if (!PyTuple_Check(obj) || PyTuple_GET_SIZE(obj) != 2)
4151 return 0;
4152 key = PyTuple_GET_ITEM(obj, 0);
4153 value = PyTuple_GET_ITEM(obj, 1);
Raymond Hettinger6692f012016-09-18 21:46:08 -07004154 found = PyDict_GetItemWithError((PyObject *)dv->dv_dict, key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004155 if (found == NULL) {
4156 if (PyErr_Occurred())
4157 return -1;
4158 return 0;
4159 }
4160 return PyObject_RichCompareBool(value, found, Py_EQ);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004161}
4162
Guido van Rossum83825ac2007-02-10 04:54:19 +00004163static PySequenceMethods dictitems_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004164 (lenfunc)dictview_len, /* sq_length */
4165 0, /* sq_concat */
4166 0, /* sq_repeat */
4167 0, /* sq_item */
4168 0, /* sq_slice */
4169 0, /* sq_ass_item */
4170 0, /* sq_ass_slice */
4171 (objobjproc)dictitems_contains, /* sq_contains */
Guido van Rossum83825ac2007-02-10 04:54:19 +00004172};
4173
Guido van Rossumb90c8482007-02-10 01:11:45 +00004174static PyMethodDef dictitems_methods[] = {
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004175 {"isdisjoint", (PyCFunction)dictviews_isdisjoint, METH_O,
4176 isdisjoint_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004177 {NULL, NULL} /* sentinel */
Guido van Rossumb90c8482007-02-10 01:11:45 +00004178};
4179
4180PyTypeObject PyDictItems_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004181 PyVarObject_HEAD_INIT(&PyType_Type, 0)
4182 "dict_items", /* tp_name */
Eric Snow96c6af92015-05-29 22:21:39 -06004183 sizeof(_PyDictViewObject), /* tp_basicsize */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004184 0, /* tp_itemsize */
4185 /* methods */
4186 (destructor)dictview_dealloc, /* tp_dealloc */
4187 0, /* tp_print */
4188 0, /* tp_getattr */
4189 0, /* tp_setattr */
4190 0, /* tp_reserved */
4191 (reprfunc)dictview_repr, /* tp_repr */
4192 &dictviews_as_number, /* tp_as_number */
4193 &dictitems_as_sequence, /* tp_as_sequence */
4194 0, /* tp_as_mapping */
4195 0, /* tp_hash */
4196 0, /* tp_call */
4197 0, /* tp_str */
4198 PyObject_GenericGetAttr, /* tp_getattro */
4199 0, /* tp_setattro */
4200 0, /* tp_as_buffer */
4201 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4202 0, /* tp_doc */
4203 (traverseproc)dictview_traverse, /* tp_traverse */
4204 0, /* tp_clear */
4205 dictview_richcompare, /* tp_richcompare */
4206 0, /* tp_weaklistoffset */
4207 (getiterfunc)dictitems_iter, /* tp_iter */
4208 0, /* tp_iternext */
4209 dictitems_methods, /* tp_methods */
4210 0,
Guido van Rossumb90c8482007-02-10 01:11:45 +00004211};
4212
4213static PyObject *
4214dictitems_new(PyObject *dict)
4215{
Eric Snow96c6af92015-05-29 22:21:39 -06004216 return _PyDictView_New(dict, &PyDictItems_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004217}
4218
Guido van Rossum3ac67412007-02-10 18:55:06 +00004219/*** dict_values ***/
Guido van Rossumb90c8482007-02-10 01:11:45 +00004220
4221static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06004222dictvalues_iter(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00004223{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004224 if (dv->dv_dict == NULL) {
4225 Py_RETURN_NONE;
4226 }
4227 return dictiter_new(dv->dv_dict, &PyDictIterValue_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004228}
4229
Guido van Rossum83825ac2007-02-10 04:54:19 +00004230static PySequenceMethods dictvalues_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004231 (lenfunc)dictview_len, /* sq_length */
4232 0, /* sq_concat */
4233 0, /* sq_repeat */
4234 0, /* sq_item */
4235 0, /* sq_slice */
4236 0, /* sq_ass_item */
4237 0, /* sq_ass_slice */
4238 (objobjproc)0, /* sq_contains */
Guido van Rossum83825ac2007-02-10 04:54:19 +00004239};
4240
Guido van Rossumb90c8482007-02-10 01:11:45 +00004241static PyMethodDef dictvalues_methods[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004242 {NULL, NULL} /* sentinel */
Guido van Rossumb90c8482007-02-10 01:11:45 +00004243};
4244
4245PyTypeObject PyDictValues_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004246 PyVarObject_HEAD_INIT(&PyType_Type, 0)
4247 "dict_values", /* tp_name */
Eric Snow96c6af92015-05-29 22:21:39 -06004248 sizeof(_PyDictViewObject), /* tp_basicsize */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004249 0, /* tp_itemsize */
4250 /* methods */
4251 (destructor)dictview_dealloc, /* tp_dealloc */
4252 0, /* tp_print */
4253 0, /* tp_getattr */
4254 0, /* tp_setattr */
4255 0, /* tp_reserved */
4256 (reprfunc)dictview_repr, /* tp_repr */
4257 0, /* tp_as_number */
4258 &dictvalues_as_sequence, /* tp_as_sequence */
4259 0, /* tp_as_mapping */
4260 0, /* tp_hash */
4261 0, /* tp_call */
4262 0, /* tp_str */
4263 PyObject_GenericGetAttr, /* tp_getattro */
4264 0, /* tp_setattro */
4265 0, /* tp_as_buffer */
4266 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4267 0, /* tp_doc */
4268 (traverseproc)dictview_traverse, /* tp_traverse */
4269 0, /* tp_clear */
4270 0, /* tp_richcompare */
4271 0, /* tp_weaklistoffset */
4272 (getiterfunc)dictvalues_iter, /* tp_iter */
4273 0, /* tp_iternext */
4274 dictvalues_methods, /* tp_methods */
4275 0,
Guido van Rossumb90c8482007-02-10 01:11:45 +00004276};
4277
4278static PyObject *
4279dictvalues_new(PyObject *dict)
4280{
Eric Snow96c6af92015-05-29 22:21:39 -06004281 return _PyDictView_New(dict, &PyDictValues_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004282}
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004283
4284/* Returns NULL if cannot allocate a new PyDictKeysObject,
4285 but does not set an error */
4286PyDictKeysObject *
4287_PyDict_NewKeysForClass(void)
4288{
Victor Stinner742da042016-09-07 17:40:12 -07004289 PyDictKeysObject *keys = new_keys_object(PyDict_MINSIZE);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004290 if (keys == NULL)
4291 PyErr_Clear();
4292 else
4293 keys->dk_lookup = lookdict_split;
4294 return keys;
4295}
4296
/* Access the ht_cached_keys member of `tp`, viewed as a PyHeapTypeObject.
   The expansion is an lvalue, so it can also be assigned to.  The argument
   is parenthesized so that an expression argument is cast as a whole
   rather than only its first operand. */
#define CACHED_KEYS(tp) (((PyHeapTypeObject*)(tp))->ht_cached_keys)
4298
4299PyObject *
4300PyObject_GenericGetDict(PyObject *obj, void *context)
4301{
4302 PyObject *dict, **dictptr = _PyObject_GetDictPtr(obj);
4303 if (dictptr == NULL) {
4304 PyErr_SetString(PyExc_AttributeError,
4305 "This object has no __dict__");
4306 return NULL;
4307 }
4308 dict = *dictptr;
4309 if (dict == NULL) {
4310 PyTypeObject *tp = Py_TYPE(obj);
4311 if ((tp->tp_flags & Py_TPFLAGS_HEAPTYPE) && CACHED_KEYS(tp)) {
4312 DK_INCREF(CACHED_KEYS(tp));
4313 *dictptr = dict = new_dict_with_shared_keys(CACHED_KEYS(tp));
4314 }
4315 else {
4316 *dictptr = dict = PyDict_New();
4317 }
4318 }
4319 Py_XINCREF(dict);
4320 return dict;
4321}
4322
4323int
4324_PyObjectDict_SetItem(PyTypeObject *tp, PyObject **dictptr,
Victor Stinner742da042016-09-07 17:40:12 -07004325 PyObject *key, PyObject *value)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004326{
4327 PyObject *dict;
4328 int res;
4329 PyDictKeysObject *cached;
4330
4331 assert(dictptr != NULL);
4332 if ((tp->tp_flags & Py_TPFLAGS_HEAPTYPE) && (cached = CACHED_KEYS(tp))) {
4333 assert(dictptr != NULL);
4334 dict = *dictptr;
4335 if (dict == NULL) {
4336 DK_INCREF(cached);
4337 dict = new_dict_with_shared_keys(cached);
4338 if (dict == NULL)
4339 return -1;
4340 *dictptr = dict;
4341 }
4342 if (value == NULL) {
4343 res = PyDict_DelItem(dict, key);
4344 if (cached != ((PyDictObject *)dict)->ma_keys) {
4345 CACHED_KEYS(tp) = NULL;
4346 DK_DECREF(cached);
4347 }
Victor Stinner3d3f2642016-12-15 17:21:23 +01004348 }
4349 else {
4350 int was_shared = cached == ((PyDictObject *)dict)->ma_keys;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004351 res = PyDict_SetItem(dict, key, value);
Victor Stinner3d3f2642016-12-15 17:21:23 +01004352 if (was_shared && cached != ((PyDictObject *)dict)->ma_keys) {
4353 /* PyDict_SetItem() may call dictresize and convert split table
4354 * into combined table. In such case, convert it to split
4355 * table again and update type's shared key only when this is
4356 * the only dict sharing key with the type.
4357 *
4358 * This is to allow using shared key in class like this:
4359 *
4360 * class C:
4361 * def __init__(self):
4362 * # one dict resize happens
4363 * self.a, self.b, self.c = 1, 2, 3
4364 * self.d, self.e, self.f = 4, 5, 6
4365 * a = C()
4366 */
Benjamin Peterson15ee8212012-04-24 14:44:18 -04004367 if (cached->dk_refcnt == 1) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004368 CACHED_KEYS(tp) = make_keys_shared(dict);
Victor Stinner742da042016-09-07 17:40:12 -07004369 }
4370 else {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004371 CACHED_KEYS(tp) = NULL;
4372 }
4373 DK_DECREF(cached);
Benjamin Peterson15ee8212012-04-24 14:44:18 -04004374 if (CACHED_KEYS(tp) == NULL && PyErr_Occurred())
4375 return -1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004376 }
4377 }
4378 } else {
4379 dict = *dictptr;
4380 if (dict == NULL) {
4381 dict = PyDict_New();
4382 if (dict == NULL)
4383 return -1;
4384 *dictptr = dict;
4385 }
4386 if (value == NULL) {
4387 res = PyDict_DelItem(dict, key);
4388 } else {
4389 res = PyDict_SetItem(dict, key, value);
4390 }
4391 }
4392 return res;
4393}
4394
4395void
4396_PyDictKeys_DecRef(PyDictKeysObject *keys)
4397{
4398 DK_DECREF(keys);
4399}