blob: baef58942798f231e34245709301a76049cf96a4 [file] [log] [blame]
Guido van Rossum2bc13791999-03-24 19:06:42 +00001/* Dictionary object implementation using a hash table */
Guido van Rossum9bfef441993-03-29 10:43:31 +00002
Raymond Hettinger930427b2003-05-03 06:51:59 +00003/* The distribution includes a separate file, Objects/dictnotes.txt,
Tim Peters60b29962006-01-01 01:19:23 +00004 describing explorations into dictionary design and optimization.
Raymond Hettinger930427b2003-05-03 06:51:59 +00005 It covers typical dictionary use patterns, the parameters for
6 tuning dictionaries, and several ideas for possible optimizations.
7*/
8
Victor Stinner742da042016-09-07 17:40:12 -07009/* PyDictKeysObject
10
11This implements the dictionary's hashtable.
12
Raymond Hettingerb12785d2016-10-22 09:58:14 -070013As of Python 3.6, this is compact and ordered. Basic idea is described here:
14* https://mail.python.org/pipermail/python-dev/2012-December/123028.html
15* https://morepypy.blogspot.com/2015/01/faster-more-memory-efficient-and-more.html
Victor Stinner742da042016-09-07 17:40:12 -070016
17layout:
18
19+---------------+
20| dk_refcnt |
21| dk_size |
22| dk_lookup |
23| dk_usable |
24| dk_nentries |
25+---------------+
26| dk_indices |
27| |
28+---------------+
29| dk_entries |
30| |
31+---------------+
32
dk_indices is the actual hashtable.  Each slot holds an index into entries,
or DKIX_EMPTY(-1) or DKIX_DUMMY(-2).
The size of indices is dk_size.  The type of each index varies with dk_size:
36
37* int8 for dk_size <= 128
38* int16 for 256 <= dk_size <= 2**15
39* int32 for 2**16 <= dk_size <= 2**31
40* int64 for 2**32 <= dk_size
41
dk_entries is an array of PyDictKeyEntry.  Its size is USABLE_FRACTION(dk_size).
43DK_ENTRIES(dk) can be used to get pointer to entries.
44
NOTE: Since negative values are used for DKIX_EMPTY and DKIX_DUMMY, the type
of a dk_indices entry is a signed integer, and int16 is used for a table
whose dk_size == 256.
48*/
49
Benjamin Peterson7d95e402012-04-23 11:24:50 -040050
51/*
Benjamin Peterson7d95e402012-04-23 11:24:50 -040052The DictObject can be in one of two forms.
Victor Stinner742da042016-09-07 17:40:12 -070053
Benjamin Peterson7d95e402012-04-23 11:24:50 -040054Either:
55 A combined table:
56 ma_values == NULL, dk_refcnt == 1.
57 Values are stored in the me_value field of the PyDictKeysObject.
Benjamin Peterson7d95e402012-04-23 11:24:50 -040058Or:
59 A split table:
60 ma_values != NULL, dk_refcnt >= 1
61 Values are stored in the ma_values array.
Victor Stinner742da042016-09-07 17:40:12 -070062 Only string (unicode) keys are allowed.
63 All dicts sharing same key must have same insertion order.
Benjamin Peterson7d95e402012-04-23 11:24:50 -040064
Victor Stinner742da042016-09-07 17:40:12 -070065There are four kinds of slots in the table (slot is index, and
66DK_ENTRIES(keys)[index] if index >= 0):
67
681. Unused. index == DKIX_EMPTY
69 Does not hold an active (key, value) pair now and never did. Unused can
70 transition to Active upon key insertion. This is each slot's initial state.
71
722. Active. index >= 0, me_key != NULL and me_value != NULL
73 Holds an active (key, value) pair. Active can transition to Dummy or
74 Pending upon key deletion (for combined and split tables respectively).
75 This is the only case in which me_value != NULL.
76
773. Dummy. index == DKIX_DUMMY (combined only)
78 Previously held an active (key, value) pair, but that was deleted and an
79 active pair has not yet overwritten the slot. Dummy can transition to
80 Active upon key insertion. Dummy slots cannot be made Unused again
81 else the probe sequence in case of collision would have no way to know
82 they were once active.
83
844. Pending. index >= 0, key != NULL, and value == NULL (split only)
85 Not yet inserted in split-table.
Benjamin Peterson7d95e402012-04-23 11:24:50 -040086*/
87
Victor Stinner742da042016-09-07 17:40:12 -070088/*
89Preserving insertion order
Benjamin Peterson7d95e402012-04-23 11:24:50 -040090
Victor Stinner742da042016-09-07 17:40:12 -070091It's simple for combined table. Since dk_entries is mostly append only, we can
92get insertion order by just iterating dk_entries.
93
One exception is .popitem().  It removes the last item in dk_entries and
decrements dk_nentries to achieve amortized O(1).  Since a DKIX_DUMMY marker
remains in dk_indices, we can't increment dk_usable even though dk_nentries
is decremented.
98
In a split table, inserting into a pending entry is allowed only for
dk_entries[ix] where ix == mp->ma_used.  Inserting at any other index, or
deleting an item, converts the dict to a combined table.
102*/
103
/* PyDict_MINSIZE is the number of hash slots every new dict starts with.
 * With 8 slots a dict can hold no more than 5 active entries; experiments
 * suggested this suffices for the majority of dicts (consisting mostly of
 * usually-small dicts created to pass keyword arguments).
 * Starting at 8 rather than 4 reduces the number of resizes for most
 * dictionaries, without any significant extra memory use.
 */
#define PyDict_MINSIZE 8
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400112
Guido van Rossumc0b618a1997-05-02 03:12:38 +0000113#include "Python.h"
Eric Snow96c6af92015-05-29 22:21:39 -0600114#include "dict-common.h"
Victor Stinner990397e2016-09-09 20:22:59 -0700115#include "stringlib/eq.h" /* to get unicode_eq() */
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000116
Larry Hastings61272b72014-01-07 12:41:53 -0800117/*[clinic input]
Larry Hastingsc2047262014-01-25 20:43:29 -0800118class dict "PyDictObject *" "&PyDict_Type"
Larry Hastings61272b72014-01-07 12:41:53 -0800119[clinic start generated code]*/
Larry Hastings581ee362014-01-28 05:00:08 -0800120/*[clinic end generated code: output=da39a3ee5e6b4b0d input=f157a5a0ce9589d6]*/
Larry Hastings44e2eaa2013-11-23 15:37:55 -0800121
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400122
123/*
124To ensure the lookup algorithm terminates, there must be at least one Unused
125slot (NULL key) in the table.
126To avoid slowing down lookups on a near-full table, we resize the table when
127it's USABLE_FRACTION (currently two-thirds) full.
128*/
Guido van Rossum16e93a81997-01-28 00:00:11 +0000129
/* Number of bits the probe "perturb" value is shifted right on every
 * collision-resolution step. */
#define PERTURB_SHIFT 5
131
Guido van Rossum16e93a81997-01-28 00:00:11 +0000132/*
Tim Peterseb28ef22001-06-02 05:27:19 +0000133Major subtleties ahead: Most hash schemes depend on having a "good" hash
134function, in the sense of simulating randomness. Python doesn't: its most
R David Murray537ad7a2016-07-10 12:33:18 -0400135important hash functions (for ints) are very regular in common
Tim Peterseb28ef22001-06-02 05:27:19 +0000136cases:
Tim Peters15d49292001-05-27 07:39:22 +0000137
R David Murray537ad7a2016-07-10 12:33:18 -0400138 >>>[hash(i) for i in range(4)]
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000139 [0, 1, 2, 3]
Tim Peters15d49292001-05-27 07:39:22 +0000140
Tim Peterseb28ef22001-06-02 05:27:19 +0000141This isn't necessarily bad! To the contrary, in a table of size 2**i, taking
142the low-order i bits as the initial table index is extremely fast, and there
R David Murray537ad7a2016-07-10 12:33:18 -0400143are no collisions at all for dicts indexed by a contiguous range of ints. So
144this gives better-than-random behavior in common cases, and that's very
145desirable.
Tim Peters15d49292001-05-27 07:39:22 +0000146
Tim Peterseb28ef22001-06-02 05:27:19 +0000147OTOH, when collisions occur, the tendency to fill contiguous slices of the
148hash table makes a good collision resolution strategy crucial. Taking only
149the last i bits of the hash code is also vulnerable: for example, consider
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000150the list [i << 16 for i in range(20000)] as a set of keys. Since ints are
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000151their own hash codes, and this fits in a dict of size 2**15, the last 15 bits
152 of every hash code are all 0: they *all* map to the same table index.
Tim Peters15d49292001-05-27 07:39:22 +0000153
Tim Peterseb28ef22001-06-02 05:27:19 +0000154But catering to unusual cases should not slow the usual ones, so we just take
155the last i bits anyway. It's up to collision resolution to do the rest. If
156we *usually* find the key we're looking for on the first try (and, it turns
157out, we usually do -- the table load factor is kept under 2/3, so the odds
158are solidly in our favor), then it makes best sense to keep the initial index
159computation dirt cheap.
Tim Peters15d49292001-05-27 07:39:22 +0000160
Tim Peterseb28ef22001-06-02 05:27:19 +0000161The first half of collision resolution is to visit table indices via this
162recurrence:
Tim Peters15d49292001-05-27 07:39:22 +0000163
Tim Peterseb28ef22001-06-02 05:27:19 +0000164 j = ((5*j) + 1) mod 2**i
Tim Peters15d49292001-05-27 07:39:22 +0000165
Tim Peterseb28ef22001-06-02 05:27:19 +0000166For any initial j in range(2**i), repeating that 2**i times generates each
167int in range(2**i) exactly once (see any text on random-number generation for
168proof). By itself, this doesn't help much: like linear probing (setting
169j += 1, or j -= 1, on each loop trip), it scans the table entries in a fixed
170order. This would be bad, except that's not the only thing we do, and it's
171actually *good* in the common cases where hash keys are consecutive. In an
172example that's really too small to make this entirely clear, for a table of
173size 2**3 the order of indices is:
Tim Peters15d49292001-05-27 07:39:22 +0000174
Tim Peterseb28ef22001-06-02 05:27:19 +0000175 0 -> 1 -> 6 -> 7 -> 4 -> 5 -> 2 -> 3 -> 0 [and here it's repeating]
176
177If two things come in at index 5, the first place we look after is index 2,
178not 6, so if another comes in at index 6 the collision at 5 didn't hurt it.
179Linear probing is deadly in this case because there the fixed probe order
180is the *same* as the order consecutive keys are likely to arrive. But it's
181extremely unlikely hash codes will follow a 5*j+1 recurrence by accident,
182and certain that consecutive hash codes do not.
183
184The other half of the strategy is to get the other bits of the hash code
185into play. This is done by initializing a (unsigned) vrbl "perturb" to the
186full hash code, and changing the recurrence to:
187
Tim Peterseb28ef22001-06-02 05:27:19 +0000188 perturb >>= PERTURB_SHIFT;
INADA Naoki267941c2016-10-06 15:19:07 +0900189 j = (5*j) + 1 + perturb;
Tim Peterseb28ef22001-06-02 05:27:19 +0000190 use j % 2**i as the next table index;
191
192Now the probe sequence depends (eventually) on every bit in the hash code,
193and the pseudo-scrambling property of recurring on 5*j+1 is more valuable,
194because it quickly magnifies small differences in the bits that didn't affect
195the initial index. Note that because perturb is unsigned, if the recurrence
196is executed often enough perturb eventually becomes and remains 0. At that
197point (very rarely reached) the recurrence is on (just) 5*j+1 again, and
198that's certain to find an empty slot eventually (since it generates every int
199in range(2**i), and we make sure there's always at least one empty slot).
200
201Selecting a good value for PERTURB_SHIFT is a balancing act. You want it
202small so that the high bits of the hash code continue to affect the probe
203sequence across iterations; but you want it large so that in really bad cases
204the high-order hash bits have an effect on early iterations. 5 was "the
205best" in minimizing total collisions across experiments Tim Peters ran (on
206both normal and pathological cases), but 4 and 6 weren't significantly worse.
207
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000208Historical: Reimer Behrends contributed the idea of using a polynomial-based
Tim Peterseb28ef22001-06-02 05:27:19 +0000209approach, using repeated multiplication by x in GF(2**n) where an irreducible
210polynomial for each table size was chosen such that x was a primitive root.
211Christian Tismer later extended that to use division by x instead, as an
212efficient way to get the high bits of the hash code into play. This scheme
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000213also gave excellent collision statistics, but was more expensive: two
214if-tests were required inside the loop; computing "the next" index took about
215the same number of operations but without as much potential parallelism
216(e.g., computing 5*j can go on at the same time as computing 1+perturb in the
217above, and then shifting perturb can be done while the table index is being
218masked); and the PyDictObject struct required a member to hold the table's
219polynomial. In Tim's experiments the current scheme ran faster, produced
220equally good collision statistics, needed less code & used less memory.
Thomas Wouters4d70c3d2006-06-08 14:42:34 +0000221
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000222*/
Tim Petersdea48ec2001-05-22 20:40:22 +0000223
Fred Drake1bff34a2000-08-31 19:31:38 +0000224/* forward declarations */
Victor Stinner742da042016-09-07 17:40:12 -0700225static Py_ssize_t lookdict(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900226 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700227 Py_ssize_t *hashpos);
228static Py_ssize_t lookdict_unicode(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900229 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700230 Py_ssize_t *hashpos);
231static Py_ssize_t
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400232lookdict_unicode_nodummy(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900233 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700234 Py_ssize_t *hashpos);
235static Py_ssize_t lookdict_split(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900236 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700237 Py_ssize_t *hashpos);
Fred Drake1bff34a2000-08-31 19:31:38 +0000238
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400239static int dictresize(PyDictObject *mp, Py_ssize_t minused);
Tim Petersdea48ec2001-05-22 20:40:22 +0000240
/* Global counter used to set the ma_version_tag field of a dictionary.
 * It is incremented each time a dictionary is created and each time a
 * dictionary is modified. */
static uint64_t pydict_global_version = 0;

/* Advance the global counter and yield its new value. */
#define DICT_NEXT_VERSION() (pydict_global_version += 1)
247
Victor Stinner742da042016-09-07 17:40:12 -0700248/* Dictionary reuse scheme to save calls to malloc and free */
Christian Heimes2202f872008-02-06 14:31:34 +0000249#ifndef PyDict_MAXFREELIST
250#define PyDict_MAXFREELIST 80
251#endif
252static PyDictObject *free_list[PyDict_MAXFREELIST];
253static int numfree = 0;
Victor Stinner742da042016-09-07 17:40:12 -0700254static PyDictKeysObject *keys_free_list[PyDict_MAXFREELIST];
255static int numfreekeys = 0;
Raymond Hettinger43442782004-03-17 21:55:03 +0000256
Serhiy Storchaka1009bf12015-04-03 23:53:51 +0300257#include "clinic/dictobject.c.h"
258
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100259int
260PyDict_ClearFreeList(void)
Christian Heimes77c02eb2008-02-09 02:18:51 +0000261{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000262 PyDictObject *op;
Victor Stinner742da042016-09-07 17:40:12 -0700263 int ret = numfree + numfreekeys;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000264 while (numfree) {
265 op = free_list[--numfree];
266 assert(PyDict_CheckExact(op));
267 PyObject_GC_Del(op);
268 }
Victor Stinner742da042016-09-07 17:40:12 -0700269 while (numfreekeys) {
270 PyObject_FREE(keys_free_list[--numfreekeys]);
271 }
Antoine Pitrou9a812cb2011-11-15 00:00:12 +0100272 return ret;
273}
274
David Malcolm49526f42012-06-22 14:55:41 -0400275/* Print summary info about the state of the optimized allocator */
276void
277_PyDict_DebugMallocStats(FILE *out)
278{
279 _PyDebugAllocatorStats(out,
280 "free PyDictObject", numfree, sizeof(PyDictObject));
281}
282
283
/* Finalization hook for the dict type: empties both free lists.  The count
 * returned by PyDict_ClearFreeList() is deliberately ignored. */
void
PyDict_Fini(void)
{
    (void)PyDict_ClearFreeList();
}
289
/* Number of slots in the hash index of keys object `dk`. */
#define DK_SIZE(dk) ((dk)->dk_size)

/* Width in bytes of one slot of dk_indices, chosen from DK_SIZE(dk).
 * The 8-byte width only exists on platforms with pointers wider than
 * 4 bytes. */
#if SIZEOF_VOID_P > 4
#define DK_IXSIZE(dk)                       \
    (DK_SIZE(dk) <= 0xff ? 1                \
     : DK_SIZE(dk) <= 0xffff ? 2            \
     : DK_SIZE(dk) <= 0xffffffff ? 4        \
     : sizeof(int64_t))
#else
#define DK_IXSIZE(dk)                       \
    (DK_SIZE(dk) <= 0xff ? 1                \
     : DK_SIZE(dk) <= 0xffff ? 2            \
     : sizeof(int32_t))
#endif

/* Pointer to the entry array, which starts right after the
 * DK_SIZE(dk) * DK_IXSIZE(dk) bytes occupied by the index table. */
#define DK_ENTRIES(dk) \
    ((PyDictKeyEntry *)((dk)->dk_indices.as_1 + DK_SIZE(dk) * DK_IXSIZE(dk)))
Victor Stinner742da042016-09-07 17:40:12 -0700305
/* Prefixes spliced in front of the refcount expressions below.
 * NOTE(review): _Py_INC_REFTOTAL / _Py_DEC_REFTOTAL / _Py_REF_DEBUG_COMMA are
 * defined elsewhere; presumably they add total-refcount bookkeeping in debug
 * builds and expand to nothing otherwise -- confirm against the headers. */
#define DK_DEBUG_INCREF _Py_INC_REFTOTAL _Py_REF_DEBUG_COMMA
#define DK_DEBUG_DECREF _Py_DEC_REFTOTAL _Py_REF_DEBUG_COMMA

/* Take one more reference to keys object `dk`. */
#define DK_INCREF(dk) (DK_DEBUG_INCREF ++(dk)->dk_refcnt)

/* Drop one reference to keys object `dk`, freeing it when the count reaches
 * zero.  Wrapped in do { } while (0) so the macro behaves as one statement
 * (safe inside an unbraced if/else).  `dk` is evaluated more than once, so
 * it must have no side effects. */
#define DK_DECREF(dk) \
    do { \
        if (DK_DEBUG_DECREF (--(dk)->dk_refcnt) == 0) { \
            free_keys_object(dk); \
        } \
    } while (0)

/* Bit mask that reduces a hash to a slot number; valid because dk_size is a
 * power of two. */
#define DK_MASK(dk) (((dk)->dk_size)-1)

/* True when at most one bit of `x` is set (so it is also true for 0).
 * The argument is fully parenthesized so that expressions built from
 * low-precedence operators, e.g. IS_POWER_OF_2(a | b), are tested as a
 * whole. */
#define IS_POWER_OF_2(x) (((x) & ((x)-1)) == 0)
313
Victor Stinner742da042016-09-07 17:40:12 -0700314/* lookup indices. returns DKIX_EMPTY, DKIX_DUMMY, or ix >=0 */
Benjamin Peterson73222252016-09-08 09:58:47 -0700315static inline Py_ssize_t
Victor Stinner742da042016-09-07 17:40:12 -0700316dk_get_index(PyDictKeysObject *keys, Py_ssize_t i)
317{
318 Py_ssize_t s = DK_SIZE(keys);
Victor Stinner71211e32016-09-08 10:52:46 -0700319 Py_ssize_t ix;
320
Victor Stinner742da042016-09-07 17:40:12 -0700321 if (s <= 0xff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700322 int8_t *indices = keys->dk_indices.as_1;
Victor Stinner208857e2016-09-08 11:35:46 -0700323 ix = indices[i];
Victor Stinner742da042016-09-07 17:40:12 -0700324 }
325 else if (s <= 0xffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700326 int16_t *indices = keys->dk_indices.as_2;
Victor Stinner208857e2016-09-08 11:35:46 -0700327 ix = indices[i];
Victor Stinner742da042016-09-07 17:40:12 -0700328 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700329#if SIZEOF_VOID_P > 4
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300330 else if (s > 0xffffffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700331 int64_t *indices = keys->dk_indices.as_8;
Victor Stinner208857e2016-09-08 11:35:46 -0700332 ix = indices[i];
Victor Stinner742da042016-09-07 17:40:12 -0700333 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700334#endif
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300335 else {
336 int32_t *indices = keys->dk_indices.as_4;
337 ix = indices[i];
338 }
Victor Stinner71211e32016-09-08 10:52:46 -0700339 assert(ix >= DKIX_DUMMY);
340 return ix;
Victor Stinner742da042016-09-07 17:40:12 -0700341}
342
343/* write to indices. */
Benjamin Peterson73222252016-09-08 09:58:47 -0700344static inline void
Victor Stinner742da042016-09-07 17:40:12 -0700345dk_set_index(PyDictKeysObject *keys, Py_ssize_t i, Py_ssize_t ix)
346{
347 Py_ssize_t s = DK_SIZE(keys);
Victor Stinner71211e32016-09-08 10:52:46 -0700348
349 assert(ix >= DKIX_DUMMY);
350
Victor Stinner742da042016-09-07 17:40:12 -0700351 if (s <= 0xff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700352 int8_t *indices = keys->dk_indices.as_1;
Victor Stinner71211e32016-09-08 10:52:46 -0700353 assert(ix <= 0x7f);
Victor Stinner208857e2016-09-08 11:35:46 -0700354 indices[i] = (char)ix;
Victor Stinner742da042016-09-07 17:40:12 -0700355 }
356 else if (s <= 0xffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700357 int16_t *indices = keys->dk_indices.as_2;
Victor Stinner71211e32016-09-08 10:52:46 -0700358 assert(ix <= 0x7fff);
Victor Stinner208857e2016-09-08 11:35:46 -0700359 indices[i] = (int16_t)ix;
Victor Stinner742da042016-09-07 17:40:12 -0700360 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700361#if SIZEOF_VOID_P > 4
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300362 else if (s > 0xffffffff) {
Benjamin Peterson186122e2016-09-08 12:20:12 -0700363 int64_t *indices = keys->dk_indices.as_8;
Victor Stinner208857e2016-09-08 11:35:46 -0700364 indices[i] = ix;
Victor Stinner742da042016-09-07 17:40:12 -0700365 }
Benjamin Peterson3c569292016-09-08 13:16:41 -0700366#endif
Serhiy Storchaka473e0e42016-09-10 21:34:43 +0300367 else {
368 int32_t *indices = keys->dk_indices.as_4;
369 assert(ix <= 0x7fffffff);
370 indices[i] = (int32_t)ix;
371 }
Victor Stinner742da042016-09-07 17:40:12 -0700372}
373
374
/* USABLE_FRACTION is the maximum dictionary load: the number of entries a
 * table of n slots may hold.
 * Increasing this ratio makes dictionaries more dense resulting in more
 * collisions.  Decreasing it improves sparseness at the expense of spreading
 * indices over more cache lines and at the cost of total memory consumed.
 *
 * USABLE_FRACTION must obey the following:
 *     (0 < USABLE_FRACTION(n) < n) for all n >= 2
 *
 * USABLE_FRACTION should be quick to calculate.
 * Fractions around 1/2 to 2/3 seem to work well in practice.
 */
#define USABLE_FRACTION(n) (((n) * 2) / 3)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400387
/* ESTIMATE_SIZE is the reverse function of USABLE_FRACTION.
 * It can be used to reserve enough size to insert n entries without
 * resizing.  n is expected to be non-negative.
 */
#define ESTIMATE_SIZE(n) (((n) * 3 + 1) / 2)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400393
Victor Stinner742da042016-09-07 17:40:12 -0700394/* Alternative fraction that is otherwise close enough to 2n/3 to make
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400395 * little difference. 8 * 2/3 == 8 * 5/8 == 5. 16 * 2/3 == 16 * 5/8 == 10.
396 * 32 * 2/3 = 21, 32 * 5/8 = 20.
397 * Its advantage is that it is faster to compute on machines with slow division.
398 * #define USABLE_FRACTION(n) (((n) >> 1) + ((n) >> 2) - ((n) >> 3))
Victor Stinner742da042016-09-07 17:40:12 -0700399 */
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400400
/* GROWTH_RATE.  Growth rate upon hitting maximum load.
 * Currently set to used*2 + capacity/2.
 * This means that dicts double in size when growing without deletions,
 * but have more head room when the number of deletions is on a par with the
 * number of insertions.
 * Raising this to used*4 doubles memory consumption depending on the size of
 * the dictionary, but results in half the number of resizes, less effort to
 * resize.
 * GROWTH_RATE was set to used*4 up to version 3.2.
 * GROWTH_RATE was set to used*2 in version 3.3.0
 */
#define GROWTH_RATE(d) \
    (((d)->ma_keys->dk_size / 2) + ((d)->ma_used * 2))
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400413
/* Switch dict `d` away from lookdict_unicode_nodummy, if that is its current
 * lookup function, to lookdict_unicode.  Any other lookup function is left
 * untouched.
 * Wrapped in do { } while (0) so the macro expands to exactly one statement
 * and can be used safely in an unbraced if/else.  `d` is evaluated more than
 * once, so it must have no side effects.
 */
#define ENSURE_ALLOWS_DELETIONS(d) \
    do { \
        if ((d)->ma_keys->dk_lookup == lookdict_unicode_nodummy) { \
            (d)->ma_keys->dk_lookup = lookdict_unicode; \
        } \
    } while (0)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400418
419/* This immutable, empty PyDictKeysObject is used for PyDict_Clear()
420 * (which cannot fail and thus can do no allocation).
421 */
422static PyDictKeysObject empty_keys_struct = {
Serhiy Storchaka97932e42016-09-26 23:01:23 +0300423 1, /* dk_refcnt */
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400424 1, /* dk_size */
425 lookdict_split, /* dk_lookup */
426 0, /* dk_usable (immutable) */
Victor Stinner742da042016-09-07 17:40:12 -0700427 0, /* dk_nentries */
Benjamin Peterson186122e2016-09-08 12:20:12 -0700428 .dk_indices = { .as_1 = {DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY,
429 DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY, DKIX_EMPTY}},
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400430};
431
432static PyObject *empty_values[1] = { NULL };
433
434#define Py_EMPTY_KEYS &empty_keys_struct
435
Victor Stinner611b0fa2016-09-14 15:02:01 +0200436/* Uncomment to check the dict content in _PyDict_CheckConsistency() */
437/* #define DEBUG_PYDICT */
438
439
#ifdef Py_DEBUG
/* Check the internal invariants of dict `mp` (debug builds only).
 *
 * Meant to be called as assert(_PyDict_CheckConsistency(mp)): a violated
 * invariant trips an assert() inside this function, and 1 is returned when
 * every check passes.  The scans over all hash slots, all entries and the
 * split values array are compiled only when DEBUG_PYDICT is defined.
 */
static int
_PyDict_CheckConsistency(PyDictObject *mp)
{
    PyDictKeysObject *keys = mp->ma_keys;
    int splitted = _PyDict_HasSplitTable(mp);
    Py_ssize_t usable = USABLE_FRACTION(keys->dk_size);
#ifdef DEBUG_PYDICT
    PyDictKeyEntry *entries = DK_ENTRIES(keys);
    Py_ssize_t i;
#endif

    /* Counters must stay within the capacity implied by the table size. */
    assert(0 <= mp->ma_used && mp->ma_used <= usable);
    assert(IS_POWER_OF_2(keys->dk_size));
    assert(0 <= keys->dk_usable
           && keys->dk_usable <= usable);
    assert(0 <= keys->dk_nentries
           && keys->dk_nentries <= usable);
    assert(keys->dk_usable + keys->dk_nentries <= usable);

    if (!splitted) {
        /* combined table */
        assert(keys->dk_refcnt == 1);
    }

#ifdef DEBUG_PYDICT
    for (i=0; i < keys->dk_size; i++) {
        Py_ssize_t ix = dk_get_index(keys, i);
        /* The entry array has `usable` elements, so a stored entry index
           must be strictly below `usable`. */
        assert(DKIX_DUMMY <= ix && ix < usable);
    }

    for (i=0; i < usable; i++) {
        PyDictKeyEntry *entry = &entries[i];
        PyObject *key = entry->me_key;

        if (key != NULL) {
            if (PyUnicode_CheckExact(key)) {
                /* Exact str keys cache their hash; it must match me_hash. */
                Py_hash_t hash = ((PyASCIIObject *)key)->hash;
                assert(hash != -1);
                assert(entry->me_hash == hash);
            }
            else {
                /* test_dict fails if PyObject_Hash() is called again */
                assert(entry->me_hash != -1);
            }
            if (!splitted) {
                assert(entry->me_value != NULL);
            }
        }

        if (splitted) {
            /* Split tables keep their values in ma_values, never in the
               entries. */
            assert(entry->me_value == NULL);
        }
    }

    if (splitted) {
        /* splitted table */
        for (i=0; i < mp->ma_used; i++) {
            assert(mp->ma_values[i] != NULL);
        }
    }
#endif

    return 1;
}
#endif
506
507
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400508static PyDictKeysObject *new_keys_object(Py_ssize_t size)
509{
510 PyDictKeysObject *dk;
Victor Stinner742da042016-09-07 17:40:12 -0700511 Py_ssize_t es, usable;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400512
Victor Stinner742da042016-09-07 17:40:12 -0700513 assert(size >= PyDict_MINSIZE);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400514 assert(IS_POWER_OF_2(size));
Victor Stinner742da042016-09-07 17:40:12 -0700515
516 usable = USABLE_FRACTION(size);
517 if (size <= 0xff) {
518 es = 1;
519 }
520 else if (size <= 0xffff) {
521 es = 2;
522 }
523#if SIZEOF_VOID_P > 4
524 else if (size <= 0xffffffff) {
525 es = 4;
526 }
527#endif
528 else {
529 es = sizeof(Py_ssize_t);
530 }
531
532 if (size == PyDict_MINSIZE && numfreekeys > 0) {
533 dk = keys_free_list[--numfreekeys];
534 }
535 else {
Victor Stinner98ee9d52016-09-08 09:33:56 -0700536 dk = PyObject_MALLOC(sizeof(PyDictKeysObject)
537 - Py_MEMBER_SIZE(PyDictKeysObject, dk_indices)
538 + es * size
539 + sizeof(PyDictKeyEntry) * usable);
Victor Stinner742da042016-09-07 17:40:12 -0700540 if (dk == NULL) {
541 PyErr_NoMemory();
542 return NULL;
543 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400544 }
Antoine Pitrou2d169b22012-05-12 23:43:44 +0200545 DK_DEBUG_INCREF dk->dk_refcnt = 1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400546 dk->dk_size = size;
Victor Stinner742da042016-09-07 17:40:12 -0700547 dk->dk_usable = usable;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400548 dk->dk_lookup = lookdict_unicode_nodummy;
Victor Stinner742da042016-09-07 17:40:12 -0700549 dk->dk_nentries = 0;
Benjamin Peterson186122e2016-09-08 12:20:12 -0700550 memset(&dk->dk_indices.as_1[0], 0xff, es * size);
Victor Stinner742da042016-09-07 17:40:12 -0700551 memset(DK_ENTRIES(dk), 0, sizeof(PyDictKeyEntry) * usable);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400552 return dk;
553}
554
555static void
556free_keys_object(PyDictKeysObject *keys)
557{
Victor Stinner742da042016-09-07 17:40:12 -0700558 PyDictKeyEntry *entries = DK_ENTRIES(keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400559 Py_ssize_t i, n;
Victor Stinner742da042016-09-07 17:40:12 -0700560 for (i = 0, n = keys->dk_nentries; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400561 Py_XDECREF(entries[i].me_key);
562 Py_XDECREF(entries[i].me_value);
563 }
Victor Stinner742da042016-09-07 17:40:12 -0700564 if (keys->dk_size == PyDict_MINSIZE && numfreekeys < PyDict_MAXFREELIST) {
565 keys_free_list[numfreekeys++] = keys;
566 return;
567 }
Raymond Hettingerce5179f2016-01-31 08:56:21 -0800568 PyObject_FREE(keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400569}
570
/* Allocate / release a values array of `size` PyObject pointers. */
#define new_values(size)    PyMem_NEW(PyObject *, size)
#define free_values(values) PyMem_FREE(values)
573
574/* Consumes a reference to the keys object */
575static PyObject *
576new_dict(PyDictKeysObject *keys, PyObject **values)
577{
578 PyDictObject *mp;
Victor Stinnerc9b7f512013-07-08 22:19:20 +0200579 assert(keys != NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000580 if (numfree) {
581 mp = free_list[--numfree];
582 assert (mp != NULL);
583 assert (Py_TYPE(mp) == &PyDict_Type);
584 _Py_NewReference((PyObject *)mp);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000585 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400586 else {
587 mp = PyObject_GC_New(PyDictObject, &PyDict_Type);
588 if (mp == NULL) {
589 DK_DECREF(keys);
590 free_values(values);
591 return NULL;
592 }
593 }
594 mp->ma_keys = keys;
595 mp->ma_values = values;
596 mp->ma_used = 0;
Victor Stinner3b6a6b42016-09-08 12:51:24 -0700597 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner611b0fa2016-09-14 15:02:01 +0200598 assert(_PyDict_CheckConsistency(mp));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000599 return (PyObject *)mp;
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000600}
601
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400602/* Consumes a reference to the keys object */
603static PyObject *
604new_dict_with_shared_keys(PyDictKeysObject *keys)
605{
606 PyObject **values;
607 Py_ssize_t i, size;
608
Victor Stinner742da042016-09-07 17:40:12 -0700609 size = USABLE_FRACTION(DK_SIZE(keys));
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400610 values = new_values(size);
611 if (values == NULL) {
612 DK_DECREF(keys);
613 return PyErr_NoMemory();
614 }
615 for (i = 0; i < size; i++) {
616 values[i] = NULL;
617 }
618 return new_dict(keys, values);
619}
620
621PyObject *
622PyDict_New(void)
623{
Victor Stinner742da042016-09-07 17:40:12 -0700624 PyDictKeysObject *keys = new_keys_object(PyDict_MINSIZE);
Victor Stinnerc9b7f512013-07-08 22:19:20 +0200625 if (keys == NULL)
626 return NULL;
627 return new_dict(keys, NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400628}
629
Victor Stinner742da042016-09-07 17:40:12 -0700630/* Search index of hash table from offset of entry table */
631static Py_ssize_t
632lookdict_index(PyDictKeysObject *k, Py_hash_t hash, Py_ssize_t index)
633{
INADA Naoki267941c2016-10-06 15:19:07 +0900634 size_t i;
Victor Stinner742da042016-09-07 17:40:12 -0700635 size_t mask = DK_MASK(k);
636 Py_ssize_t ix;
637
638 i = (size_t)hash & mask;
639 ix = dk_get_index(k, i);
640 if (ix == index) {
641 return i;
642 }
643 if (ix == DKIX_EMPTY) {
644 return DKIX_EMPTY;
645 }
646
INADA Naoki267941c2016-10-06 15:19:07 +0900647 for (size_t perturb = hash;;) {
648 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700649 i = mask & ((i << 2) + i + perturb + 1);
650 ix = dk_get_index(k, i);
651 if (ix == index) {
652 return i;
653 }
654 if (ix == DKIX_EMPTY) {
655 return DKIX_EMPTY;
656 }
657 }
658 assert(0); /* NOT REACHED */
659 return DKIX_ERROR;
660}
661
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000662/*
663The basic lookup function used by all operations.
Guido van Rossum16e93a81997-01-28 00:00:11 +0000664This is based on Algorithm D from Knuth Vol. 3, Sec. 6.4.
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000665Open addressing is preferred over chaining since the link overhead for
666chaining would be substantial (100% with typical malloc overhead).
667
Tim Peterseb28ef22001-06-02 05:27:19 +0000668The initial probe index is computed as hash mod the table size. Subsequent
669probe indices are computed as explained earlier.
Guido van Rossum2bc13791999-03-24 19:06:42 +0000670
671All arithmetic on hash should ignore overflow.
Guido van Rossum16e93a81997-01-28 00:00:11 +0000672
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000673The details in this version are due to Tim Peters, building on many past
Tim Peterseb28ef22001-06-02 05:27:19 +0000674contributions by Reimer Behrends, Jyrki Alakuijala, Vladimir Marangozov and
Guido van Rossumdc5f6b22006-08-24 21:29:26 +0000675Christian Tismer.
Fred Drake1bff34a2000-08-31 19:31:38 +0000676
Victor Stinner742da042016-09-07 17:40:12 -0700677lookdict() is general-purpose, and may return DKIX_ERROR if (and only if) a
Victor Stinnera4348cc2016-09-08 12:01:25 -0700678comparison raises an exception.
Guido van Rossum89d8c602007-09-18 17:26:56 +0000679lookdict_unicode() below is specialized to string keys, comparison of which can
Victor Stinner742da042016-09-07 17:40:12 -0700680never raise an exception; that function can never return DKIX_ERROR.
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400681lookdict_unicode_nodummy is further specialized for string keys that cannot be
682the <dummy> value.
Victor Stinner742da042016-09-07 17:40:12 -0700683For both, when the key isn't found a DKIX_EMPTY is returned. hashpos returns
684where the key index should be inserted.
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000685*/
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100686static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400687lookdict(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900688 Py_hash_t hash, PyObject **value_addr, Py_ssize_t *hashpos)
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000689{
INADA Naoki267941c2016-10-06 15:19:07 +0900690 size_t i, mask;
Victor Stinner742da042016-09-07 17:40:12 -0700691 Py_ssize_t ix, freeslot;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200692 int cmp;
Victor Stinner742da042016-09-07 17:40:12 -0700693 PyDictKeysObject *dk;
694 PyDictKeyEntry *ep0, *ep;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000695 PyObject *startkey;
Tim Peterseb28ef22001-06-02 05:27:19 +0000696
Antoine Pitrou9a234902012-05-13 20:48:01 +0200697top:
Victor Stinner742da042016-09-07 17:40:12 -0700698 dk = mp->ma_keys;
699 mask = DK_MASK(dk);
700 ep0 = DK_ENTRIES(dk);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000701 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700702
703 ix = dk_get_index(dk, i);
704 if (ix == DKIX_EMPTY) {
705 if (hashpos != NULL)
706 *hashpos = i;
707 *value_addr = NULL;
708 return DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400709 }
Victor Stinner742da042016-09-07 17:40:12 -0700710 if (ix == DKIX_DUMMY) {
711 freeslot = i;
712 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000713 else {
Victor Stinner742da042016-09-07 17:40:12 -0700714 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300715 assert(ep->me_key != NULL);
Victor Stinner742da042016-09-07 17:40:12 -0700716 if (ep->me_key == key) {
INADA Naokiba609772016-12-07 20:41:42 +0900717 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700718 if (hashpos != NULL)
719 *hashpos = i;
720 return ix;
721 }
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300722 if (ep->me_hash == hash) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000723 startkey = ep->me_key;
724 Py_INCREF(startkey);
725 cmp = PyObject_RichCompareBool(startkey, key, Py_EQ);
726 Py_DECREF(startkey);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +0200727 if (cmp < 0) {
728 *value_addr = NULL;
Victor Stinner742da042016-09-07 17:40:12 -0700729 return DKIX_ERROR;
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +0200730 }
Victor Stinner742da042016-09-07 17:40:12 -0700731 if (dk == mp->ma_keys && ep->me_key == startkey) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400732 if (cmp > 0) {
INADA Naokiba609772016-12-07 20:41:42 +0900733 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700734 if (hashpos != NULL)
735 *hashpos = i;
736 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400737 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000738 }
739 else {
Antoine Pitrou9a234902012-05-13 20:48:01 +0200740 /* The dict was mutated, restart */
741 goto top;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000742 }
743 }
Victor Stinner742da042016-09-07 17:40:12 -0700744 freeslot = -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000745 }
Tim Peters15d49292001-05-27 07:39:22 +0000746
INADA Naoki267941c2016-10-06 15:19:07 +0900747 for (size_t perturb = hash;;) {
748 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700749 i = ((i << 2) + i + perturb + 1) & mask;
750 ix = dk_get_index(dk, i);
751 if (ix == DKIX_EMPTY) {
752 if (hashpos != NULL) {
753 *hashpos = (freeslot == -1) ? (Py_ssize_t)i : freeslot;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400754 }
Victor Stinner742da042016-09-07 17:40:12 -0700755 *value_addr = NULL;
756 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400757 }
Victor Stinner742da042016-09-07 17:40:12 -0700758 if (ix == DKIX_DUMMY) {
759 if (freeslot == -1)
760 freeslot = i;
761 continue;
762 }
763 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300764 assert(ep->me_key != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400765 if (ep->me_key == key) {
Victor Stinner742da042016-09-07 17:40:12 -0700766 if (hashpos != NULL) {
767 *hashpos = i;
768 }
INADA Naokiba609772016-12-07 20:41:42 +0900769 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700770 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400771 }
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300772 if (ep->me_hash == hash) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000773 startkey = ep->me_key;
774 Py_INCREF(startkey);
775 cmp = PyObject_RichCompareBool(startkey, key, Py_EQ);
776 Py_DECREF(startkey);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400777 if (cmp < 0) {
778 *value_addr = NULL;
Victor Stinner742da042016-09-07 17:40:12 -0700779 return DKIX_ERROR;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400780 }
Victor Stinner742da042016-09-07 17:40:12 -0700781 if (dk == mp->ma_keys && ep->me_key == startkey) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400782 if (cmp > 0) {
Victor Stinner742da042016-09-07 17:40:12 -0700783 if (hashpos != NULL) {
784 *hashpos = i;
785 }
INADA Naokiba609772016-12-07 20:41:42 +0900786 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700787 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400788 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000789 }
790 else {
Antoine Pitrou9a234902012-05-13 20:48:01 +0200791 /* The dict was mutated, restart */
792 goto top;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000793 }
794 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000795 }
796 assert(0); /* NOT REACHED */
797 return 0;
Guido van Rossum4b1302b1993-03-27 18:11:32 +0000798}
799
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400800/* Specialized version for string-only keys */
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100801static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400802lookdict_unicode(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900803 Py_hash_t hash, PyObject **value_addr, Py_ssize_t *hashpos)
Fred Drake1bff34a2000-08-31 19:31:38 +0000804{
INADA Naoki267941c2016-10-06 15:19:07 +0900805 size_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200806 size_t mask = DK_MASK(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -0700807 Py_ssize_t ix, freeslot;
808 PyDictKeyEntry *ep, *ep0 = DK_ENTRIES(mp->ma_keys);
Fred Drake1bff34a2000-08-31 19:31:38 +0000809
Victor Stinner742da042016-09-07 17:40:12 -0700810 assert(mp->ma_values == NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000811 /* Make sure this function doesn't have to handle non-unicode keys,
812 including subclasses of str; e.g., one reason to subclass
813 unicodes is to override __eq__, and for speed we don't cater to
814 that here. */
815 if (!PyUnicode_CheckExact(key)) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400816 mp->ma_keys->dk_lookup = lookdict;
Victor Stinner742da042016-09-07 17:40:12 -0700817 return lookdict(mp, key, hash, value_addr, hashpos);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000818 }
Mark Dickinson57e683e2011-09-24 18:18:40 +0100819 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700820 ix = dk_get_index(mp->ma_keys, i);
821 if (ix == DKIX_EMPTY) {
822 if (hashpos != NULL)
823 *hashpos = i;
824 *value_addr = NULL;
825 return DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400826 }
Victor Stinner742da042016-09-07 17:40:12 -0700827 if (ix == DKIX_DUMMY) {
828 freeslot = i;
829 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000830 else {
Victor Stinner742da042016-09-07 17:40:12 -0700831 ep = &ep0[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700832 assert(ep->me_key != NULL);
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300833 if (ep->me_key == key
834 || (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700835 if (hashpos != NULL)
836 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900837 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700838 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400839 }
Victor Stinner742da042016-09-07 17:40:12 -0700840 freeslot = -1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000841 }
Tim Peters15d49292001-05-27 07:39:22 +0000842
INADA Naoki267941c2016-10-06 15:19:07 +0900843 for (size_t perturb = hash;;) {
844 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700845 i = mask & ((i << 2) + i + perturb + 1);
846 ix = dk_get_index(mp->ma_keys, i);
847 if (ix == DKIX_EMPTY) {
848 if (hashpos != NULL) {
849 *hashpos = (freeslot == -1) ? (Py_ssize_t)i : freeslot;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400850 }
Victor Stinner742da042016-09-07 17:40:12 -0700851 *value_addr = NULL;
852 return DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400853 }
Victor Stinner742da042016-09-07 17:40:12 -0700854 if (ix == DKIX_DUMMY) {
855 if (freeslot == -1)
856 freeslot = i;
857 continue;
858 }
859 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300860 assert(ep->me_key != NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000861 if (ep->me_key == key
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300862 || (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
INADA Naokiba609772016-12-07 20:41:42 +0900863 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700864 if (hashpos != NULL) {
865 *hashpos = i;
866 }
867 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400868 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +0000869 }
870 assert(0); /* NOT REACHED */
871 return 0;
Fred Drake1bff34a2000-08-31 19:31:38 +0000872}
873
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400874/* Faster version of lookdict_unicode when it is known that no <dummy> keys
875 * will be present. */
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100876static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400877lookdict_unicode_nodummy(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900878 Py_hash_t hash, PyObject **value_addr,
Victor Stinner742da042016-09-07 17:40:12 -0700879 Py_ssize_t *hashpos)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400880{
INADA Naoki267941c2016-10-06 15:19:07 +0900881 size_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200882 size_t mask = DK_MASK(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -0700883 Py_ssize_t ix;
884 PyDictKeyEntry *ep, *ep0 = DK_ENTRIES(mp->ma_keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400885
Victor Stinner742da042016-09-07 17:40:12 -0700886 assert(mp->ma_values == NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400887 /* Make sure this function doesn't have to handle non-unicode keys,
888 including subclasses of str; e.g., one reason to subclass
889 unicodes is to override __eq__, and for speed we don't cater to
890 that here. */
891 if (!PyUnicode_CheckExact(key)) {
892 mp->ma_keys->dk_lookup = lookdict;
Victor Stinner742da042016-09-07 17:40:12 -0700893 return lookdict(mp, key, hash, value_addr, hashpos);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400894 }
895 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700896 ix = dk_get_index(mp->ma_keys, i);
897 assert (ix != DKIX_DUMMY);
898 if (ix == DKIX_EMPTY) {
899 if (hashpos != NULL)
900 *hashpos = i;
901 *value_addr = NULL;
902 return DKIX_EMPTY;
903 }
904 ep = &ep0[ix];
Victor Stinnerdee6e252016-09-08 11:16:07 -0700905 assert(ep->me_key != NULL);
906 assert(PyUnicode_CheckExact(ep->me_key));
Victor Stinner742da042016-09-07 17:40:12 -0700907 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400908 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700909 if (hashpos != NULL)
910 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900911 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700912 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400913 }
INADA Naoki267941c2016-10-06 15:19:07 +0900914 for (size_t perturb = hash;;) {
915 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700916 i = mask & ((i << 2) + i + perturb + 1);
917 ix = dk_get_index(mp->ma_keys, i);
918 assert (ix != DKIX_DUMMY);
919 if (ix == DKIX_EMPTY) {
920 if (hashpos != NULL)
921 *hashpos = i;
922 *value_addr = NULL;
923 return DKIX_EMPTY;
924 }
925 ep = &ep0[ix];
926 assert(ep->me_key != NULL && PyUnicode_CheckExact(ep->me_key));
927 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400928 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700929 if (hashpos != NULL)
930 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900931 *value_addr = ep->me_value;
Victor Stinner742da042016-09-07 17:40:12 -0700932 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400933 }
934 }
935 assert(0); /* NOT REACHED */
936 return 0;
937}
938
939/* Version of lookdict for split tables.
940 * All split tables and only split tables use this lookup function.
941 * Split tables only contain unicode keys and no dummy keys,
942 * so algorithm is the same as lookdict_unicode_nodummy.
943 */
Victor Stinnerc7a8f672016-11-15 15:13:40 +0100944static Py_ssize_t _Py_HOT_FUNCTION
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400945lookdict_split(PyDictObject *mp, PyObject *key,
INADA Naokiba609772016-12-07 20:41:42 +0900946 Py_hash_t hash, PyObject **value_addr, Py_ssize_t *hashpos)
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400947{
INADA Naoki267941c2016-10-06 15:19:07 +0900948 size_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +0200949 size_t mask = DK_MASK(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -0700950 Py_ssize_t ix;
951 PyDictKeyEntry *ep, *ep0 = DK_ENTRIES(mp->ma_keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400952
Victor Stinner742da042016-09-07 17:40:12 -0700953 /* mp must split table */
954 assert(mp->ma_values != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400955 if (!PyUnicode_CheckExact(key)) {
Victor Stinner742da042016-09-07 17:40:12 -0700956 ix = lookdict(mp, key, hash, value_addr, hashpos);
957 if (ix >= 0) {
INADA Naokiba609772016-12-07 20:41:42 +0900958 *value_addr = mp->ma_values[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700959 }
960 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400961 }
Victor Stinner742da042016-09-07 17:40:12 -0700962
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400963 i = (size_t)hash & mask;
Victor Stinner742da042016-09-07 17:40:12 -0700964 ix = dk_get_index(mp->ma_keys, i);
965 if (ix == DKIX_EMPTY) {
966 if (hashpos != NULL)
967 *hashpos = i;
968 *value_addr = NULL;
969 return DKIX_EMPTY;
970 }
971 assert(ix >= 0);
972 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300973 assert(ep->me_key != NULL && PyUnicode_CheckExact(ep->me_key));
Victor Stinner742da042016-09-07 17:40:12 -0700974 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400975 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700976 if (hashpos != NULL)
977 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900978 *value_addr = mp->ma_values[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700979 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400980 }
INADA Naoki267941c2016-10-06 15:19:07 +0900981 for (size_t perturb = hash;;) {
982 perturb >>= PERTURB_SHIFT;
Victor Stinner742da042016-09-07 17:40:12 -0700983 i = mask & ((i << 2) + i + perturb + 1);
984 ix = dk_get_index(mp->ma_keys, i);
985 if (ix == DKIX_EMPTY) {
986 if (hashpos != NULL)
987 *hashpos = i;
988 *value_addr = NULL;
989 return DKIX_EMPTY;
990 }
991 assert(ix >= 0);
992 ep = &ep0[ix];
Serhiy Storchaka46825d22016-09-26 21:29:34 +0300993 assert(ep->me_key != NULL && PyUnicode_CheckExact(ep->me_key));
Victor Stinner742da042016-09-07 17:40:12 -0700994 if (ep->me_key == key ||
Benjamin Peterson7d95e402012-04-23 11:24:50 -0400995 (ep->me_hash == hash && unicode_eq(ep->me_key, key))) {
Victor Stinner742da042016-09-07 17:40:12 -0700996 if (hashpos != NULL)
997 *hashpos = i;
INADA Naokiba609772016-12-07 20:41:42 +0900998 *value_addr = mp->ma_values[ix];
Victor Stinner742da042016-09-07 17:40:12 -0700999 return ix;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001000 }
1001 }
1002 assert(0); /* NOT REACHED */
1003 return 0;
1004}
1005
Benjamin Petersonfb886362010-04-24 18:21:17 +00001006int
1007_PyDict_HasOnlyStringKeys(PyObject *dict)
1008{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001009 Py_ssize_t pos = 0;
1010 PyObject *key, *value;
Benjamin Petersonf6096542010-11-17 22:33:12 +00001011 assert(PyDict_Check(dict));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001012 /* Shortcut */
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001013 if (((PyDictObject *)dict)->ma_keys->dk_lookup != lookdict)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001014 return 1;
1015 while (PyDict_Next(dict, &pos, &key, &value))
1016 if (!PyUnicode_Check(key))
1017 return 0;
1018 return 1;
Benjamin Petersonfb886362010-04-24 18:21:17 +00001019}
1020
/* Start GC-tracking `mp` if it is not tracked yet and the key or the value
 * about to be stored may itself be tracked. */
#define MAINTAIN_TRACKING(mp, key, value) \
    do { \
        if (!_PyObject_GC_IS_TRACKED(mp) && \
            (_PyObject_GC_MAY_BE_TRACKED(key) || \
             _PyObject_GC_MAY_BE_TRACKED(value))) { \
            _PyObject_GC_TRACK(mp); \
        } \
    } while(0)
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001030
1031void
1032_PyDict_MaybeUntrack(PyObject *op)
1033{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001034 PyDictObject *mp;
1035 PyObject *value;
Victor Stinner742da042016-09-07 17:40:12 -07001036 Py_ssize_t i, numentries;
1037 PyDictKeyEntry *ep0;
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001038
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001039 if (!PyDict_CheckExact(op) || !_PyObject_GC_IS_TRACKED(op))
1040 return;
1041
1042 mp = (PyDictObject *) op;
Victor Stinner742da042016-09-07 17:40:12 -07001043 ep0 = DK_ENTRIES(mp->ma_keys);
1044 numentries = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001045 if (_PyDict_HasSplitTable(mp)) {
Victor Stinner742da042016-09-07 17:40:12 -07001046 for (i = 0; i < numentries; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001047 if ((value = mp->ma_values[i]) == NULL)
1048 continue;
1049 if (_PyObject_GC_MAY_BE_TRACKED(value)) {
Victor Stinner742da042016-09-07 17:40:12 -07001050 assert(!_PyObject_GC_MAY_BE_TRACKED(ep0[i].me_key));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001051 return;
1052 }
1053 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001054 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001055 else {
Victor Stinner742da042016-09-07 17:40:12 -07001056 for (i = 0; i < numentries; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001057 if ((value = ep0[i].me_value) == NULL)
1058 continue;
1059 if (_PyObject_GC_MAY_BE_TRACKED(value) ||
1060 _PyObject_GC_MAY_BE_TRACKED(ep0[i].me_key))
1061 return;
1062 }
1063 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001064 _PyObject_GC_UNTRACK(op);
Antoine Pitrou3a652b12009-03-23 18:52:06 +00001065}
1066
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001067/* Internal function to find slot for an item from its hash
Victor Stinner3c336c52016-09-12 14:17:40 +02001068 when it is known that the key is not present in the dict.
1069
1070 The dict must be combined. */
INADA Naokiba609772016-12-07 20:41:42 +09001071static Py_ssize_t
1072find_empty_slot(PyDictKeysObject *keys, PyObject *key, Py_hash_t hash)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001073{
INADA Naoki267941c2016-10-06 15:19:07 +09001074 size_t i;
INADA Naokiba609772016-12-07 20:41:42 +09001075 size_t mask = DK_MASK(keys);
Victor Stinner742da042016-09-07 17:40:12 -07001076 Py_ssize_t ix;
Tim Peters6d6c1a32001-08-02 04:15:00 +00001077
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001078 assert(key != NULL);
Victor Stinner3c336c52016-09-12 14:17:40 +02001079
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001080 i = hash & mask;
INADA Naokiba609772016-12-07 20:41:42 +09001081 ix = dk_get_index(keys, i);
INADA Naoki267941c2016-10-06 15:19:07 +09001082 for (size_t perturb = hash; ix != DKIX_EMPTY;) {
1083 perturb >>= PERTURB_SHIFT;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001084 i = (i << 2) + i + perturb + 1;
INADA Naokiba609772016-12-07 20:41:42 +09001085 ix = dk_get_index(keys, i & mask);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001086 }
INADA Naokiba609772016-12-07 20:41:42 +09001087 assert(DK_ENTRIES(keys)[keys->dk_nentries].me_value == NULL);
1088 return i & mask;
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001089}
1090
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001091static int
1092insertion_resize(PyDictObject *mp)
1093{
Raymond Hettinger36f74aa2013-05-17 03:01:13 -07001094 return dictresize(mp, GROWTH_RATE(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001095}
Antoine Pitroue965d972012-02-27 00:45:12 +01001096
1097/*
1098Internal routine to insert a new item into the table.
1099Used both by the internal resize routine and by the public insert routine.
Antoine Pitroue965d972012-02-27 00:45:12 +01001100Returns -1 if an error occurred, or 0 on success.
1101*/
1102static int
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001103insertdict(PyDictObject *mp, PyObject *key, Py_hash_t hash, PyObject *value)
Antoine Pitroue965d972012-02-27 00:45:12 +01001104{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001105 PyObject *old_value;
INADA Naokiba609772016-12-07 20:41:42 +09001106 PyDictKeyEntry *ep;
Victor Stinner742da042016-09-07 17:40:12 -07001107 Py_ssize_t hashpos, ix;
Antoine Pitroue965d972012-02-27 00:45:12 +01001108
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001109 if (mp->ma_values != NULL && !PyUnicode_CheckExact(key)) {
1110 if (insertion_resize(mp) < 0)
1111 return -1;
1112 }
1113
INADA Naokiba609772016-12-07 20:41:42 +09001114 ix = mp->ma_keys->dk_lookup(mp, key, hash, &old_value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07001115 if (ix == DKIX_ERROR) {
Antoine Pitroue965d972012-02-27 00:45:12 +01001116 return -1;
1117 }
Victor Stinner742da042016-09-07 17:40:12 -07001118
Antoine Pitroud6967322014-10-18 00:35:00 +02001119 assert(PyUnicode_CheckExact(key) || mp->ma_keys->dk_lookup == lookdict);
Benjamin Petersona6f195e2012-04-30 10:23:40 -04001120 Py_INCREF(value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001121 MAINTAIN_TRACKING(mp, key, value);
Victor Stinner742da042016-09-07 17:40:12 -07001122
1123 /* When insertion order is different from shared key, we can't share
1124 * the key anymore. Convert this instance to combine table.
1125 */
1126 if (_PyDict_HasSplitTable(mp) &&
INADA Naokiba609772016-12-07 20:41:42 +09001127 ((ix >= 0 && old_value == NULL && mp->ma_used != ix) ||
Victor Stinner742da042016-09-07 17:40:12 -07001128 (ix == DKIX_EMPTY && mp->ma_used != mp->ma_keys->dk_nentries))) {
1129 if (insertion_resize(mp) < 0) {
1130 Py_DECREF(value);
1131 return -1;
1132 }
INADA Naokiba609772016-12-07 20:41:42 +09001133 hashpos = find_empty_slot(mp->ma_keys, key, hash);
Victor Stinner742da042016-09-07 17:40:12 -07001134 ix = DKIX_EMPTY;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001135 }
Victor Stinner742da042016-09-07 17:40:12 -07001136
1137 if (ix == DKIX_EMPTY) {
1138 /* Insert into new slot. */
INADA Naokiba609772016-12-07 20:41:42 +09001139 assert(old_value == NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001140 if (mp->ma_keys->dk_usable <= 0) {
1141 /* Need to resize. */
1142 if (insertion_resize(mp) < 0) {
1143 Py_DECREF(value);
1144 return -1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001145 }
INADA Naokiba609772016-12-07 20:41:42 +09001146 hashpos = find_empty_slot(mp->ma_keys, key, hash);
Victor Stinner742da042016-09-07 17:40:12 -07001147 }
INADA Naokiba609772016-12-07 20:41:42 +09001148 ep = &DK_ENTRIES(mp->ma_keys)[mp->ma_keys->dk_nentries];
Victor Stinner742da042016-09-07 17:40:12 -07001149 dk_set_index(mp->ma_keys, hashpos, mp->ma_keys->dk_nentries);
1150 Py_INCREF(key);
1151 ep->me_key = key;
1152 ep->me_hash = hash;
1153 if (mp->ma_values) {
1154 assert (mp->ma_values[mp->ma_keys->dk_nentries] == NULL);
1155 mp->ma_values[mp->ma_keys->dk_nentries] = value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001156 }
1157 else {
Victor Stinner742da042016-09-07 17:40:12 -07001158 ep->me_value = value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001159 }
1160 mp->ma_used++;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001161 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner742da042016-09-07 17:40:12 -07001162 mp->ma_keys->dk_usable--;
1163 mp->ma_keys->dk_nentries++;
1164 assert(mp->ma_keys->dk_usable >= 0);
Victor Stinner611b0fa2016-09-14 15:02:01 +02001165 assert(_PyDict_CheckConsistency(mp));
Victor Stinner742da042016-09-07 17:40:12 -07001166 return 0;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001167 }
Victor Stinner742da042016-09-07 17:40:12 -07001168
INADA Naokiba609772016-12-07 20:41:42 +09001169 if (_PyDict_HasSplitTable(mp)) {
1170 mp->ma_values[ix] = value;
1171 if (old_value == NULL) {
1172 /* pending state */
1173 assert(ix == mp->ma_used);
1174 mp->ma_used++;
1175 }
1176 }
1177 else {
1178 assert(old_value != NULL);
1179 DK_ENTRIES(mp->ma_keys)[ix].me_value = value;
Victor Stinner742da042016-09-07 17:40:12 -07001180 }
1181
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001182 mp->ma_version_tag = DICT_NEXT_VERSION();
INADA Naokiba609772016-12-07 20:41:42 +09001183 Py_XDECREF(old_value); /* which **CAN** re-enter (see issue #22653) */
Victor Stinner611b0fa2016-09-14 15:02:01 +02001184 assert(_PyDict_CheckConsistency(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001185 return 0;
Antoine Pitroue965d972012-02-27 00:45:12 +01001186}
1187
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001188/*
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001189Internal routine used by dictresize() to buid a hashtable of entries.
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001190*/
1191static void
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001192build_indices(PyDictKeysObject *keys, PyDictKeyEntry *ep, Py_ssize_t n)
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001193{
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001194 size_t mask = (size_t)DK_SIZE(keys) - 1;
1195 for (Py_ssize_t ix = 0; ix != n; ix++, ep++) {
1196 Py_hash_t hash = ep->me_hash;
1197 size_t i = hash & mask;
1198 for (size_t perturb = hash; dk_get_index(keys, i) != DKIX_EMPTY;) {
1199 perturb >>= PERTURB_SHIFT;
1200 i = mask & ((i << 2) + i + perturb + 1);
1201 }
1202 dk_set_index(keys, i, ix);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001203 }
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001204}
1205
1206/*
1207Restructure the table by allocating a new table and reinserting all
1208items again. When entries have been deleted, the new table may
1209actually be smaller than the old one.
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001210If a table is split (its keys and hashes are shared, its values are not),
1211then the values are temporarily copied into the table, it is resized as
1212a combined table, then the me_value slots in the old table are NULLed out.
1213After resizing a table is always combined,
1214but can be resplit by make_keys_shared().
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001215*/
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001216static int
Victor Stinner3d3f2642016-12-15 17:21:23 +01001217dictresize(PyDictObject *mp, Py_ssize_t minsize)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001218{
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001219 Py_ssize_t newsize, numentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001220 PyDictKeysObject *oldkeys;
1221 PyObject **oldvalues;
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001222 PyDictKeyEntry *oldentries, *newentries;
Tim Peters91a364d2001-05-19 07:04:38 +00001223
Victor Stinner742da042016-09-07 17:40:12 -07001224 /* Find the smallest table size > minused. */
1225 for (newsize = PyDict_MINSIZE;
Victor Stinner3d3f2642016-12-15 17:21:23 +01001226 newsize < minsize && newsize > 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001227 newsize <<= 1)
1228 ;
1229 if (newsize <= 0) {
1230 PyErr_NoMemory();
1231 return -1;
1232 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001233
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001234 oldkeys = mp->ma_keys;
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001235
1236 /* NOTE: Current odict checks mp->ma_keys to detect resize happen.
1237 * So we can't reuse oldkeys even if oldkeys->dk_size == newsize.
1238 * TODO: Try reusing oldkeys when reimplement odict.
1239 */
1240
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001241 /* Allocate a new table. */
1242 mp->ma_keys = new_keys_object(newsize);
1243 if (mp->ma_keys == NULL) {
1244 mp->ma_keys = oldkeys;
1245 return -1;
1246 }
Victor Stinner3d3f2642016-12-15 17:21:23 +01001247 // New table must be large enough.
1248 assert(mp->ma_keys->dk_usable >= mp->ma_used);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001249 if (oldkeys->dk_lookup == lookdict)
1250 mp->ma_keys->dk_lookup = lookdict;
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001251
1252 numentries = mp->ma_used;
1253 oldentries = DK_ENTRIES(oldkeys);
1254 newentries = DK_ENTRIES(mp->ma_keys);
1255 oldvalues = mp->ma_values;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001256 if (oldvalues != NULL) {
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001257 /* Convert split table into new combined table.
1258 * We must incref keys; we can transfer values.
1259 * Note that values of split table is always dense.
1260 */
1261 for (Py_ssize_t i = 0; i < numentries; i++) {
1262 assert(oldvalues[i] != NULL);
1263 PyDictKeyEntry *ep = &oldentries[i];
1264 PyObject *key = ep->me_key;
1265 Py_INCREF(key);
1266 newentries[i].me_key = key;
1267 newentries[i].me_hash = ep->me_hash;
1268 newentries[i].me_value = oldvalues[i];
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001269 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001270
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001271 DK_DECREF(oldkeys);
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001272 mp->ma_values = NULL;
Victor Stinner742da042016-09-07 17:40:12 -07001273 if (oldvalues != empty_values) {
1274 free_values(oldvalues);
1275 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001276 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001277 else { // combined table.
1278 if (oldkeys->dk_nentries == numentries) {
1279 memcpy(newentries, oldentries, numentries * sizeof(PyDictKeyEntry));
1280 }
1281 else {
1282 PyDictKeyEntry *ep = oldentries;
1283 for (Py_ssize_t i = 0; i < numentries; i++) {
1284 while (ep->me_value == NULL)
1285 ep++;
1286 newentries[i] = *ep++;
1287 }
1288 }
1289
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001290 assert(oldkeys->dk_lookup != lookdict_split);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001291 assert(oldkeys->dk_refcnt == 1);
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001292 if (oldkeys->dk_size == PyDict_MINSIZE &&
1293 numfreekeys < PyDict_MAXFREELIST) {
1294 DK_DEBUG_DECREF keys_free_list[numfreekeys++] = oldkeys;
1295 }
1296 else {
1297 DK_DEBUG_DECREF PyObject_FREE(oldkeys);
1298 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001299 }
Serhiy Storchakae26e20d2016-10-29 10:50:00 +03001300
1301 build_indices(mp->ma_keys, newentries, numentries);
1302 mp->ma_keys->dk_usable -= numentries;
1303 mp->ma_keys->dk_nentries = numentries;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001304 return 0;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001305}
1306
Benjamin Peterson15ee8212012-04-24 14:44:18 -04001307/* Returns NULL if unable to split table.
1308 * A NULL return does not necessarily indicate an error */
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001309static PyDictKeysObject *
1310make_keys_shared(PyObject *op)
1311{
1312 Py_ssize_t i;
1313 Py_ssize_t size;
1314 PyDictObject *mp = (PyDictObject *)op;
1315
Benjamin Peterson15ee8212012-04-24 14:44:18 -04001316 if (!PyDict_CheckExact(op))
1317 return NULL;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001318 if (!_PyDict_HasSplitTable(mp)) {
1319 PyDictKeyEntry *ep0;
1320 PyObject **values;
1321 assert(mp->ma_keys->dk_refcnt == 1);
1322 if (mp->ma_keys->dk_lookup == lookdict) {
1323 return NULL;
1324 }
1325 else if (mp->ma_keys->dk_lookup == lookdict_unicode) {
1326 /* Remove dummy keys */
1327 if (dictresize(mp, DK_SIZE(mp->ma_keys)))
1328 return NULL;
1329 }
1330 assert(mp->ma_keys->dk_lookup == lookdict_unicode_nodummy);
1331 /* Copy values into a new array */
Victor Stinner742da042016-09-07 17:40:12 -07001332 ep0 = DK_ENTRIES(mp->ma_keys);
1333 size = USABLE_FRACTION(DK_SIZE(mp->ma_keys));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001334 values = new_values(size);
1335 if (values == NULL) {
1336 PyErr_SetString(PyExc_MemoryError,
1337 "Not enough memory to allocate new values array");
1338 return NULL;
1339 }
1340 for (i = 0; i < size; i++) {
1341 values[i] = ep0[i].me_value;
1342 ep0[i].me_value = NULL;
1343 }
1344 mp->ma_keys->dk_lookup = lookdict_split;
1345 mp->ma_values = values;
1346 }
1347 DK_INCREF(mp->ma_keys);
1348 return mp->ma_keys;
1349}
Christian Heimes99170a52007-12-19 02:07:34 +00001350
1351PyObject *
1352_PyDict_NewPresized(Py_ssize_t minused)
1353{
INADA Naoki92c50ee2016-11-22 00:57:02 +09001354 const Py_ssize_t max_presize = 128 * 1024;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001355 Py_ssize_t newsize;
1356 PyDictKeysObject *new_keys;
INADA Naoki92c50ee2016-11-22 00:57:02 +09001357
1358 /* There are no strict guarantee that returned dict can contain minused
1359 * items without resize. So we create medium size dict instead of very
1360 * large dict or MemoryError.
1361 */
1362 if (minused > USABLE_FRACTION(max_presize)) {
1363 newsize = max_presize;
1364 }
1365 else {
1366 Py_ssize_t minsize = ESTIMATE_SIZE(minused);
1367 newsize = PyDict_MINSIZE;
1368 while (newsize < minsize) {
1369 newsize <<= 1;
1370 }
1371 }
1372 assert(IS_POWER_OF_2(newsize));
1373
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001374 new_keys = new_keys_object(newsize);
1375 if (new_keys == NULL)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001376 return NULL;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001377 return new_dict(new_keys, NULL);
Christian Heimes99170a52007-12-19 02:07:34 +00001378}
1379
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001380/* Note that, for historical reasons, PyDict_GetItem() suppresses all errors
1381 * that may occur (originally dicts supported only string keys, and exceptions
1382 * weren't possible). So, while the original intent was that a NULL return
Thomas Wouters0e3f5912006-08-11 14:57:12 +00001383 * meant the key wasn't present, in reality it can mean that, or that an error
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001384 * (suppressed) occurred while computing the key's hash, or that some error
1385 * (suppressed) occurred when comparing keys in the dict's internal probe
1386 * sequence. A nasty example of the latter is when a Python-coded comparison
1387 * function hits a stack-depth error, which can cause this to return NULL
1388 * even if the key is present.
1389 */
Guido van Rossumc0b618a1997-05-02 03:12:38 +00001390PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00001391PyDict_GetItem(PyObject *op, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001392{
Benjamin Peterson8f67d082010-10-17 20:54:53 +00001393 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07001394 Py_ssize_t ix;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001395 PyDictObject *mp = (PyDictObject *)op;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001396 PyThreadState *tstate;
INADA Naokiba609772016-12-07 20:41:42 +09001397 PyObject *value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001398
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001399 if (!PyDict_Check(op))
1400 return NULL;
1401 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02001402 (hash = ((PyASCIIObject *) key)->hash) == -1)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001403 {
1404 hash = PyObject_Hash(key);
1405 if (hash == -1) {
1406 PyErr_Clear();
1407 return NULL;
1408 }
1409 }
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001410
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001411 /* We can arrive here with a NULL tstate during initialization: try
1412 running "python -Wi" for an example related to string interning.
1413 Let's just hope that no exception occurs then... This must be
1414 _PyThreadState_Current and not PyThreadState_GET() because in debug
1415 mode, the latter complains if tstate is NULL. */
Victor Stinner0cae6092016-11-11 01:43:56 +01001416 tstate = PyThreadState_GET();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001417 if (tstate != NULL && tstate->curexc_type != NULL) {
1418 /* preserve the existing exception */
1419 PyObject *err_type, *err_value, *err_tb;
1420 PyErr_Fetch(&err_type, &err_value, &err_tb);
INADA Naokiba609772016-12-07 20:41:42 +09001421 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001422 /* ignore errors */
1423 PyErr_Restore(err_type, err_value, err_tb);
Victor Stinner742da042016-09-07 17:40:12 -07001424 if (ix < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001425 return NULL;
1426 }
1427 else {
INADA Naokiba609772016-12-07 20:41:42 +09001428 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001429 if (ix < 0) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001430 PyErr_Clear();
1431 return NULL;
1432 }
1433 }
INADA Naokiba609772016-12-07 20:41:42 +09001434 return value;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001435}
1436
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001437/* Same as PyDict_GetItemWithError() but with hash supplied by caller.
1438 This returns NULL *with* an exception set if an exception occurred.
1439 It returns NULL *without* an exception set if the key wasn't present.
1440*/
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001441PyObject *
1442_PyDict_GetItem_KnownHash(PyObject *op, PyObject *key, Py_hash_t hash)
1443{
Victor Stinner742da042016-09-07 17:40:12 -07001444 Py_ssize_t ix;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001445 PyDictObject *mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09001446 PyObject *value;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001447
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001448 if (!PyDict_Check(op)) {
1449 PyErr_BadInternalCall();
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001450 return NULL;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001451 }
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001452
INADA Naokiba609772016-12-07 20:41:42 +09001453 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02001454 if (ix < 0) {
1455 return NULL;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001456 }
INADA Naokiba609772016-12-07 20:41:42 +09001457 return value;
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001458}
1459
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001460/* Variant of PyDict_GetItem() that doesn't suppress exceptions.
1461 This returns NULL *with* an exception set if an exception occurred.
1462 It returns NULL *without* an exception set if the key wasn't present.
1463*/
1464PyObject *
1465PyDict_GetItemWithError(PyObject *op, PyObject *key)
1466{
Victor Stinner742da042016-09-07 17:40:12 -07001467 Py_ssize_t ix;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00001468 Py_hash_t hash;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001469 PyDictObject*mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09001470 PyObject *value;
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001471
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001472 if (!PyDict_Check(op)) {
1473 PyErr_BadInternalCall();
1474 return NULL;
1475 }
1476 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02001477 (hash = ((PyASCIIObject *) key)->hash) == -1)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001478 {
1479 hash = PyObject_Hash(key);
1480 if (hash == -1) {
1481 return NULL;
1482 }
1483 }
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001484
INADA Naokiba609772016-12-07 20:41:42 +09001485 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001486 if (ix < 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001487 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001488 return value;
Guido van Rossum47b9ff62006-08-24 00:41:19 +00001489}
1490
Brett Cannonfd074152012-04-14 14:10:13 -04001491PyObject *
1492_PyDict_GetItemIdWithError(PyObject *dp, struct _Py_Identifier *key)
1493{
1494 PyObject *kv;
1495 kv = _PyUnicode_FromId(key); /* borrowed */
1496 if (kv == NULL)
1497 return NULL;
1498 return PyDict_GetItemWithError(dp, kv);
1499}
1500
Victor Stinnerb4efc962015-11-20 09:24:02 +01001501/* Fast version of global value lookup (LOAD_GLOBAL).
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001502 * Lookup in globals, then builtins.
Victor Stinnerb4efc962015-11-20 09:24:02 +01001503 *
1504 * Raise an exception and return NULL if an error occurred (ex: computing the
1505 * key hash failed, key comparison failed, ...). Return NULL if the key doesn't
1506 * exist. Return the value if the key exists.
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001507 */
1508PyObject *
1509_PyDict_LoadGlobal(PyDictObject *globals, PyDictObject *builtins, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001510{
Victor Stinner742da042016-09-07 17:40:12 -07001511 Py_ssize_t ix;
Victor Stinnerb4efc962015-11-20 09:24:02 +01001512 Py_hash_t hash;
INADA Naokiba609772016-12-07 20:41:42 +09001513 PyObject *value;
Victor Stinnerb4efc962015-11-20 09:24:02 +01001514
1515 if (!PyUnicode_CheckExact(key) ||
1516 (hash = ((PyASCIIObject *) key)->hash) == -1)
1517 {
1518 hash = PyObject_Hash(key);
1519 if (hash == -1)
1520 return NULL;
Antoine Pitroue965d972012-02-27 00:45:12 +01001521 }
Victor Stinnerb4efc962015-11-20 09:24:02 +01001522
1523 /* namespace 1: globals */
INADA Naokiba609772016-12-07 20:41:42 +09001524 ix = globals->ma_keys->dk_lookup(globals, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001525 if (ix == DKIX_ERROR)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001526 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001527 if (ix != DKIX_EMPTY && value != NULL)
1528 return value;
Victor Stinnerb4efc962015-11-20 09:24:02 +01001529
1530 /* namespace 2: builtins */
INADA Naokiba609772016-12-07 20:41:42 +09001531 ix = builtins->ma_keys->dk_lookup(builtins, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07001532 if (ix < 0)
Victor Stinnerb4efc962015-11-20 09:24:02 +01001533 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001534 return value;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001535}
1536
Antoine Pitroue965d972012-02-27 00:45:12 +01001537/* CAUTION: PyDict_SetItem() must guarantee that it won't resize the
1538 * dictionary if it's merely replacing the value for an existing key.
1539 * This means that it's safe to loop over a dictionary with PyDict_Next()
1540 * and occasionally replace a value -- but you can't insert new keys or
1541 * remove them.
1542 */
1543int
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001544PyDict_SetItem(PyObject *op, PyObject *key, PyObject *value)
Antoine Pitroue965d972012-02-27 00:45:12 +01001545{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001546 PyDictObject *mp;
1547 Py_hash_t hash;
Antoine Pitroue965d972012-02-27 00:45:12 +01001548 if (!PyDict_Check(op)) {
1549 PyErr_BadInternalCall();
1550 return -1;
1551 }
1552 assert(key);
1553 assert(value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001554 mp = (PyDictObject *)op;
1555 if (!PyUnicode_CheckExact(key) ||
1556 (hash = ((PyASCIIObject *) key)->hash) == -1)
1557 {
Antoine Pitroue965d972012-02-27 00:45:12 +01001558 hash = PyObject_Hash(key);
1559 if (hash == -1)
1560 return -1;
1561 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001562
1563 /* insertdict() handles any resizing that might be necessary */
1564 return insertdict(mp, key, hash, value);
Antoine Pitroue965d972012-02-27 00:45:12 +01001565}
1566
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001567int
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001568_PyDict_SetItem_KnownHash(PyObject *op, PyObject *key, PyObject *value,
1569 Py_hash_t hash)
1570{
1571 PyDictObject *mp;
1572
1573 if (!PyDict_Check(op)) {
1574 PyErr_BadInternalCall();
1575 return -1;
1576 }
1577 assert(key);
1578 assert(value);
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001579 assert(hash != -1);
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001580 mp = (PyDictObject *)op;
1581
1582 /* insertdict() handles any resizing that might be necessary */
1583 return insertdict(mp, key, hash, value);
1584}
1585
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001586static int
Antoine Pitroud741ed42016-12-27 14:23:43 +01001587delitem_common(PyDictObject *mp, Py_ssize_t hashpos, Py_ssize_t ix,
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001588 PyObject *old_value)
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001589{
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001590 PyObject *old_key;
Antoine Pitroud741ed42016-12-27 14:23:43 +01001591 PyDictKeyEntry *ep;
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001592
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001593 mp->ma_used--;
Antoine Pitroud741ed42016-12-27 14:23:43 +01001594 mp->ma_version_tag = DICT_NEXT_VERSION();
1595 ep = &DK_ENTRIES(mp->ma_keys)[ix];
1596 dk_set_index(mp->ma_keys, hashpos, DKIX_DUMMY);
1597 ENSURE_ALLOWS_DELETIONS(mp);
1598 old_key = ep->me_key;
1599 ep->me_key = NULL;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001600 ep->me_value = NULL;
Antoine Pitroud741ed42016-12-27 14:23:43 +01001601 Py_DECREF(old_key);
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001602 Py_DECREF(old_value);
Antoine Pitroud741ed42016-12-27 14:23:43 +01001603
1604 assert(_PyDict_CheckConsistency(mp));
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001605 return 0;
1606}
1607
Raymond Hettinger4b74fba2014-05-03 16:32:11 -07001608int
Tim Peters1f5871e2000-07-04 17:44:48 +00001609PyDict_DelItem(PyObject *op, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001610{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001611 Py_hash_t hash;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001612 assert(key);
1613 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02001614 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001615 hash = PyObject_Hash(key);
1616 if (hash == -1)
1617 return -1;
1618 }
Victor Stinner742da042016-09-07 17:40:12 -07001619
1620 return _PyDict_DelItem_KnownHash(op, key, hash);
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001621}
1622
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001623int
1624_PyDict_DelItem_KnownHash(PyObject *op, PyObject *key, Py_hash_t hash)
1625{
Victor Stinner742da042016-09-07 17:40:12 -07001626 Py_ssize_t hashpos, ix;
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001627 PyDictObject *mp;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001628 PyObject *old_value;
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001629
1630 if (!PyDict_Check(op)) {
1631 PyErr_BadInternalCall();
1632 return -1;
1633 }
1634 assert(key);
1635 assert(hash != -1);
1636 mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09001637 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07001638 if (ix == DKIX_ERROR)
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001639 return -1;
INADA Naokiba609772016-12-07 20:41:42 +09001640 if (ix == DKIX_EMPTY || old_value == NULL) {
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001641 _PyErr_SetKeyError(key);
1642 return -1;
1643 }
Victor Stinner742da042016-09-07 17:40:12 -07001644 assert(dk_get_index(mp->ma_keys, hashpos) == ix);
Victor Stinner78601a32016-09-09 19:28:36 -07001645
1646 // Split table doesn't allow deletion. Combine it.
1647 if (_PyDict_HasSplitTable(mp)) {
1648 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
1649 return -1;
1650 }
INADA Naokiba609772016-12-07 20:41:42 +09001651 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner78601a32016-09-09 19:28:36 -07001652 assert(ix >= 0);
1653 }
1654
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001655 return delitem_common(mp, hashpos, ix, old_value);
Serhiy Storchakab9d98d52015-10-02 12:47:11 +03001656}
1657
Antoine Pitroud741ed42016-12-27 14:23:43 +01001658/* This function promises that the predicate -> deletion sequence is atomic
1659 * (i.e. protected by the GIL), assuming the predicate itself doesn't
1660 * release the GIL.
1661 */
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001662int
1663_PyDict_DelItemIf(PyObject *op, PyObject *key,
1664 int (*predicate)(PyObject *value))
1665{
Antoine Pitroud741ed42016-12-27 14:23:43 +01001666 Py_ssize_t hashpos, ix;
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001667 PyDictObject *mp;
1668 Py_hash_t hash;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001669 PyObject *old_value;
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001670 int res;
1671
1672 if (!PyDict_Check(op)) {
1673 PyErr_BadInternalCall();
1674 return -1;
1675 }
1676 assert(key);
1677 hash = PyObject_Hash(key);
1678 if (hash == -1)
1679 return -1;
1680 mp = (PyDictObject *)op;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001681 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Antoine Pitroud741ed42016-12-27 14:23:43 +01001682 if (ix == DKIX_ERROR)
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001683 return -1;
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001684 if (ix == DKIX_EMPTY || old_value == NULL) {
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001685 _PyErr_SetKeyError(key);
1686 return -1;
1687 }
Antoine Pitroud741ed42016-12-27 14:23:43 +01001688 assert(dk_get_index(mp->ma_keys, hashpos) == ix);
1689
1690 // Split table doesn't allow deletion. Combine it.
1691 if (_PyDict_HasSplitTable(mp)) {
1692 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
1693 return -1;
1694 }
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001695 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Antoine Pitroud741ed42016-12-27 14:23:43 +01001696 assert(ix >= 0);
1697 }
1698
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001699 res = predicate(old_value);
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001700 if (res == -1)
1701 return -1;
1702 if (res > 0)
Antoine Pitrouc06ae202016-12-27 14:34:54 +01001703 return delitem_common(mp, hashpos, ix, old_value);
Antoine Pitroue10ca3a2016-12-27 14:19:20 +01001704 else
1705 return 0;
1706}
1707
1708
Guido van Rossum25831651993-05-19 14:50:45 +00001709void
Tim Peters1f5871e2000-07-04 17:44:48 +00001710PyDict_Clear(PyObject *op)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001711{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001712 PyDictObject *mp;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001713 PyDictKeysObject *oldkeys;
1714 PyObject **oldvalues;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001715 Py_ssize_t i, n;
Tim Petersdea48ec2001-05-22 20:40:22 +00001716
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001717 if (!PyDict_Check(op))
1718 return;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001719 mp = ((PyDictObject *)op);
1720 oldkeys = mp->ma_keys;
1721 oldvalues = mp->ma_values;
1722 if (oldvalues == empty_values)
1723 return;
1724 /* Empty the dict... */
1725 DK_INCREF(Py_EMPTY_KEYS);
1726 mp->ma_keys = Py_EMPTY_KEYS;
1727 mp->ma_values = empty_values;
1728 mp->ma_used = 0;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001729 mp->ma_version_tag = DICT_NEXT_VERSION();
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001730 /* ...then clear the keys and values */
1731 if (oldvalues != NULL) {
Victor Stinner742da042016-09-07 17:40:12 -07001732 n = oldkeys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001733 for (i = 0; i < n; i++)
1734 Py_CLEAR(oldvalues[i]);
1735 free_values(oldvalues);
1736 DK_DECREF(oldkeys);
1737 }
1738 else {
1739 assert(oldkeys->dk_refcnt == 1);
Antoine Pitrou2d169b22012-05-12 23:43:44 +02001740 DK_DECREF(oldkeys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001741 }
Victor Stinner611b0fa2016-09-14 15:02:01 +02001742 assert(_PyDict_CheckConsistency(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001743}
1744
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001745/* Internal version of PyDict_Next that returns a hash value in addition
1746 * to the key and value.
1747 * Return 1 on success, return 0 when the reached the end of the dictionary
1748 * (or if op is not a dictionary)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001749 */
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001750int
1751_PyDict_Next(PyObject *op, Py_ssize_t *ppos, PyObject **pkey,
1752 PyObject **pvalue, Py_hash_t *phash)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001753{
INADA Naokica2d8be2016-11-04 16:59:10 +09001754 Py_ssize_t i;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001755 PyDictObject *mp;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001756 PyDictKeyEntry *entry_ptr;
1757 PyObject *value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001758
1759 if (!PyDict_Check(op))
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001760 return 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001761 mp = (PyDictObject *)op;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001762 i = *ppos;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001763 if (mp->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09001764 if (i < 0 || i >= mp->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001765 return 0;
INADA Naokica2d8be2016-11-04 16:59:10 +09001766 /* values of split table is always dense */
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001767 entry_ptr = &DK_ENTRIES(mp->ma_keys)[i];
INADA Naokica2d8be2016-11-04 16:59:10 +09001768 value = mp->ma_values[i];
1769 assert(value != NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001770 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001771 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09001772 Py_ssize_t n = mp->ma_keys->dk_nentries;
1773 if (i < 0 || i >= n)
1774 return 0;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001775 entry_ptr = &DK_ENTRIES(mp->ma_keys)[i];
1776 while (i < n && entry_ptr->me_value == NULL) {
1777 entry_ptr++;
1778 i++;
Victor Stinner742da042016-09-07 17:40:12 -07001779 }
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001780 if (i >= n)
1781 return 0;
1782 value = entry_ptr->me_value;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001783 }
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001784 *ppos = i+1;
1785 if (pkey)
1786 *pkey = entry_ptr->me_key;
1787 if (phash)
1788 *phash = entry_ptr->me_hash;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001789 if (pvalue)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001790 *pvalue = value;
1791 return 1;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001792}
1793
Tim Peters080c88b2003-02-15 03:01:11 +00001794/*
1795 * Iterate over a dict. Use like so:
1796 *
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001797 * Py_ssize_t i;
Tim Peters080c88b2003-02-15 03:01:11 +00001798 * PyObject *key, *value;
1799 * i = 0; # important! i should not otherwise be changed by you
Neal Norwitz07323012003-02-15 14:45:12 +00001800 * while (PyDict_Next(yourdict, &i, &key, &value)) {
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001801 * Refer to borrowed references in key and value.
Tim Peters080c88b2003-02-15 03:01:11 +00001802 * }
1803 *
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001804 * Return 1 on success, return 0 when the reached the end of the dictionary
1805 * (or if op is not a dictionary)
1806 *
Tim Peters080c88b2003-02-15 03:01:11 +00001807 * CAUTION: In general, it isn't safe to use PyDict_Next in a loop that
Tim Peters67830702001-03-21 19:23:56 +00001808 * mutates the dict. One exception: it is safe if the loop merely changes
1809 * the values associated with the keys (but doesn't insert new keys or
1810 * delete keys), via PyDict_SetItem().
1811 */
Guido van Rossum25831651993-05-19 14:50:45 +00001812int
Martin v. Löwis18e16552006-02-15 17:27:45 +00001813PyDict_Next(PyObject *op, Py_ssize_t *ppos, PyObject **pkey, PyObject **pvalue)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001814{
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03001815 return _PyDict_Next(op, ppos, pkey, pvalue, NULL);
Thomas Wouterscf297e42007-02-23 15:07:44 +00001816}
1817
Eric Snow96c6af92015-05-29 22:21:39 -06001818/* Internal version of dict.pop(). */
1819PyObject *
Yury Selivanov684ef2c2016-10-28 19:01:21 -04001820_PyDict_Pop(PyObject *dict, PyObject *key, PyObject *deflt)
Eric Snow96c6af92015-05-29 22:21:39 -06001821{
1822 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07001823 Py_ssize_t ix, hashpos;
Eric Snow96c6af92015-05-29 22:21:39 -06001824 PyObject *old_value, *old_key;
1825 PyDictKeyEntry *ep;
Yury Selivanov684ef2c2016-10-28 19:01:21 -04001826 PyDictObject *mp;
1827
1828 assert(PyDict_Check(dict));
1829 mp = (PyDictObject *)dict;
Eric Snow96c6af92015-05-29 22:21:39 -06001830
1831 if (mp->ma_used == 0) {
1832 if (deflt) {
1833 Py_INCREF(deflt);
1834 return deflt;
1835 }
1836 _PyErr_SetKeyError(key);
1837 return NULL;
1838 }
1839 if (!PyUnicode_CheckExact(key) ||
1840 (hash = ((PyASCIIObject *) key)->hash) == -1) {
1841 hash = PyObject_Hash(key);
1842 if (hash == -1)
1843 return NULL;
1844 }
INADA Naokiba609772016-12-07 20:41:42 +09001845 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07001846 if (ix == DKIX_ERROR)
Eric Snow96c6af92015-05-29 22:21:39 -06001847 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001848 if (ix == DKIX_EMPTY || old_value == NULL) {
Eric Snow96c6af92015-05-29 22:21:39 -06001849 if (deflt) {
1850 Py_INCREF(deflt);
1851 return deflt;
1852 }
1853 _PyErr_SetKeyError(key);
1854 return NULL;
1855 }
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001856
Victor Stinner78601a32016-09-09 19:28:36 -07001857 // Split table doesn't allow deletion. Combine it.
1858 if (_PyDict_HasSplitTable(mp)) {
1859 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
1860 return NULL;
1861 }
INADA Naokiba609772016-12-07 20:41:42 +09001862 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &old_value, &hashpos);
Victor Stinner78601a32016-09-09 19:28:36 -07001863 assert(ix >= 0);
1864 }
1865
Victor Stinner78601a32016-09-09 19:28:36 -07001866 assert(old_value != NULL);
Eric Snow96c6af92015-05-29 22:21:39 -06001867 mp->ma_used--;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07001868 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner78601a32016-09-09 19:28:36 -07001869 dk_set_index(mp->ma_keys, hashpos, DKIX_DUMMY);
1870 ep = &DK_ENTRIES(mp->ma_keys)[ix];
1871 ENSURE_ALLOWS_DELETIONS(mp);
1872 old_key = ep->me_key;
1873 ep->me_key = NULL;
INADA Naokiba609772016-12-07 20:41:42 +09001874 ep->me_value = NULL;
Victor Stinner78601a32016-09-09 19:28:36 -07001875 Py_DECREF(old_key);
Victor Stinner611b0fa2016-09-14 15:02:01 +02001876
1877 assert(_PyDict_CheckConsistency(mp));
Eric Snow96c6af92015-05-29 22:21:39 -06001878 return old_value;
1879}
1880
1881/* Internal version of dict.from_keys(). It is subclass-friendly. */
1882PyObject *
1883_PyDict_FromKeys(PyObject *cls, PyObject *iterable, PyObject *value)
1884{
1885 PyObject *it; /* iter(iterable) */
1886 PyObject *key;
1887 PyObject *d;
1888 int status;
1889
Victor Stinnera5ed5f02016-12-06 18:45:50 +01001890 d = _PyObject_CallNoArg(cls);
Eric Snow96c6af92015-05-29 22:21:39 -06001891 if (d == NULL)
1892 return NULL;
1893
1894 if (PyDict_CheckExact(d) && ((PyDictObject *)d)->ma_used == 0) {
1895 if (PyDict_CheckExact(iterable)) {
1896 PyDictObject *mp = (PyDictObject *)d;
1897 PyObject *oldvalue;
1898 Py_ssize_t pos = 0;
1899 PyObject *key;
1900 Py_hash_t hash;
1901
Victor Stinner742da042016-09-07 17:40:12 -07001902 if (dictresize(mp, ESTIMATE_SIZE(Py_SIZE(iterable)))) {
Eric Snow96c6af92015-05-29 22:21:39 -06001903 Py_DECREF(d);
1904 return NULL;
1905 }
1906
1907 while (_PyDict_Next(iterable, &pos, &key, &oldvalue, &hash)) {
1908 if (insertdict(mp, key, hash, value)) {
1909 Py_DECREF(d);
1910 return NULL;
1911 }
1912 }
1913 return d;
1914 }
1915 if (PyAnySet_CheckExact(iterable)) {
1916 PyDictObject *mp = (PyDictObject *)d;
1917 Py_ssize_t pos = 0;
1918 PyObject *key;
1919 Py_hash_t hash;
1920
Victor Stinner742da042016-09-07 17:40:12 -07001921 if (dictresize(mp, ESTIMATE_SIZE(PySet_GET_SIZE(iterable)))) {
Eric Snow96c6af92015-05-29 22:21:39 -06001922 Py_DECREF(d);
1923 return NULL;
1924 }
1925
1926 while (_PySet_NextEntry(iterable, &pos, &key, &hash)) {
1927 if (insertdict(mp, key, hash, value)) {
1928 Py_DECREF(d);
1929 return NULL;
1930 }
1931 }
1932 return d;
1933 }
1934 }
1935
1936 it = PyObject_GetIter(iterable);
1937 if (it == NULL){
1938 Py_DECREF(d);
1939 return NULL;
1940 }
1941
1942 if (PyDict_CheckExact(d)) {
1943 while ((key = PyIter_Next(it)) != NULL) {
1944 status = PyDict_SetItem(d, key, value);
1945 Py_DECREF(key);
1946 if (status < 0)
1947 goto Fail;
1948 }
1949 } else {
1950 while ((key = PyIter_Next(it)) != NULL) {
1951 status = PyObject_SetItem(d, key, value);
1952 Py_DECREF(key);
1953 if (status < 0)
1954 goto Fail;
1955 }
1956 }
1957
1958 if (PyErr_Occurred())
1959 goto Fail;
1960 Py_DECREF(it);
1961 return d;
1962
1963Fail:
1964 Py_DECREF(it);
1965 Py_DECREF(d);
1966 return NULL;
1967}
1968
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001969/* Methods */
1970
1971static void
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001972dict_dealloc(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001973{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001974 PyObject **values = mp->ma_values;
1975 PyDictKeysObject *keys = mp->ma_keys;
1976 Py_ssize_t i, n;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001977 PyObject_GC_UnTrack(mp);
1978 Py_TRASHCAN_SAFE_BEGIN(mp)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001979 if (values != NULL) {
1980 if (values != empty_values) {
Victor Stinner742da042016-09-07 17:40:12 -07001981 for (i = 0, n = mp->ma_keys->dk_nentries; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001982 Py_XDECREF(values[i]);
1983 }
1984 free_values(values);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001985 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001986 DK_DECREF(keys);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001987 }
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02001988 else if (keys != NULL) {
Antoine Pitrou2d169b22012-05-12 23:43:44 +02001989 assert(keys->dk_refcnt == 1);
1990 DK_DECREF(keys);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001991 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00001992 if (numfree < PyDict_MAXFREELIST && Py_TYPE(mp) == &PyDict_Type)
1993 free_list[numfree++] = mp;
1994 else
1995 Py_TYPE(mp)->tp_free((PyObject *)mp);
1996 Py_TRASHCAN_SAFE_END(mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00001997}
1998
Benjamin Peterson7d95e402012-04-23 11:24:50 -04001999
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002000static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002001dict_repr(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002002{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002003 Py_ssize_t i;
Victor Stinnerf91929b2013-11-19 13:07:38 +01002004 PyObject *key = NULL, *value = NULL;
2005 _PyUnicodeWriter writer;
2006 int first;
Guido van Rossum255443b1998-04-10 22:47:14 +00002007
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002008 i = Py_ReprEnter((PyObject *)mp);
2009 if (i != 0) {
2010 return i > 0 ? PyUnicode_FromString("{...}") : NULL;
2011 }
Guido van Rossum255443b1998-04-10 22:47:14 +00002012
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002013 if (mp->ma_used == 0) {
Victor Stinnerf91929b2013-11-19 13:07:38 +01002014 Py_ReprLeave((PyObject *)mp);
2015 return PyUnicode_FromString("{}");
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002016 }
Tim Petersa7259592001-06-16 05:11:17 +00002017
Victor Stinnerf91929b2013-11-19 13:07:38 +01002018 _PyUnicodeWriter_Init(&writer);
2019 writer.overallocate = 1;
2020 /* "{" + "1: 2" + ", 3: 4" * (len - 1) + "}" */
2021 writer.min_length = 1 + 4 + (2 + 4) * (mp->ma_used - 1) + 1;
Tim Petersa7259592001-06-16 05:11:17 +00002022
Victor Stinnerf91929b2013-11-19 13:07:38 +01002023 if (_PyUnicodeWriter_WriteChar(&writer, '{') < 0)
2024 goto error;
Tim Petersa7259592001-06-16 05:11:17 +00002025
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002026 /* Do repr() on each key+value pair, and insert ": " between them.
2027 Note that repr may mutate the dict. */
2028 i = 0;
Victor Stinnerf91929b2013-11-19 13:07:38 +01002029 first = 1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002030 while (PyDict_Next((PyObject *)mp, &i, &key, &value)) {
Victor Stinnerf91929b2013-11-19 13:07:38 +01002031 PyObject *s;
2032 int res;
2033
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002034 /* Prevent repr from deleting key or value during key format. */
2035 Py_INCREF(key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002036 Py_INCREF(value);
Victor Stinnerf97dfd72013-07-18 01:00:45 +02002037
Victor Stinnerf91929b2013-11-19 13:07:38 +01002038 if (!first) {
2039 if (_PyUnicodeWriter_WriteASCIIString(&writer, ", ", 2) < 0)
2040 goto error;
2041 }
2042 first = 0;
2043
2044 s = PyObject_Repr(key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002045 if (s == NULL)
Victor Stinnerf91929b2013-11-19 13:07:38 +01002046 goto error;
2047 res = _PyUnicodeWriter_WriteStr(&writer, s);
2048 Py_DECREF(s);
2049 if (res < 0)
2050 goto error;
2051
2052 if (_PyUnicodeWriter_WriteASCIIString(&writer, ": ", 2) < 0)
2053 goto error;
2054
2055 s = PyObject_Repr(value);
2056 if (s == NULL)
2057 goto error;
2058 res = _PyUnicodeWriter_WriteStr(&writer, s);
2059 Py_DECREF(s);
2060 if (res < 0)
2061 goto error;
2062
2063 Py_CLEAR(key);
2064 Py_CLEAR(value);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002065 }
Tim Petersa7259592001-06-16 05:11:17 +00002066
Victor Stinnerf91929b2013-11-19 13:07:38 +01002067 writer.overallocate = 0;
2068 if (_PyUnicodeWriter_WriteChar(&writer, '}') < 0)
2069 goto error;
Tim Petersa7259592001-06-16 05:11:17 +00002070
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002071 Py_ReprLeave((PyObject *)mp);
Victor Stinnerf91929b2013-11-19 13:07:38 +01002072
2073 return _PyUnicodeWriter_Finish(&writer);
2074
2075error:
2076 Py_ReprLeave((PyObject *)mp);
2077 _PyUnicodeWriter_Dealloc(&writer);
2078 Py_XDECREF(key);
2079 Py_XDECREF(value);
2080 return NULL;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002081}
2082
Martin v. Löwis18e16552006-02-15 17:27:45 +00002083static Py_ssize_t
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002084dict_length(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002085{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002086 return mp->ma_used;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002087}
2088
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002089static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002090dict_subscript(PyDictObject *mp, PyObject *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002091{
Victor Stinner742da042016-09-07 17:40:12 -07002092 Py_ssize_t ix;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002093 Py_hash_t hash;
INADA Naokiba609772016-12-07 20:41:42 +09002094 PyObject *value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002095
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002096 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002097 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002098 hash = PyObject_Hash(key);
2099 if (hash == -1)
2100 return NULL;
2101 }
INADA Naokiba609772016-12-07 20:41:42 +09002102 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07002103 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002104 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09002105 if (ix == DKIX_EMPTY || value == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002106 if (!PyDict_CheckExact(mp)) {
2107 /* Look up __missing__ method if we're a subclass. */
2108 PyObject *missing, *res;
Benjamin Petersonce798522012-01-22 11:24:29 -05002109 _Py_IDENTIFIER(__missing__);
2110 missing = _PyObject_LookupSpecial((PyObject *)mp, &PyId___missing__);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002111 if (missing != NULL) {
Victor Stinnerde4ae3d2016-12-04 22:59:09 +01002112 res = PyObject_CallFunctionObjArgs(missing,
2113 key, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002114 Py_DECREF(missing);
2115 return res;
2116 }
2117 else if (PyErr_Occurred())
2118 return NULL;
2119 }
Raymond Hettinger69492da2013-09-02 15:59:26 -07002120 _PyErr_SetKeyError(key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002121 return NULL;
2122 }
INADA Naokiba609772016-12-07 20:41:42 +09002123 Py_INCREF(value);
2124 return value;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002125}
2126
2127static int
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002128dict_ass_sub(PyDictObject *mp, PyObject *v, PyObject *w)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002129{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002130 if (w == NULL)
2131 return PyDict_DelItem((PyObject *)mp, v);
2132 else
2133 return PyDict_SetItem((PyObject *)mp, v, w);
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002134}
2135
Guido van Rossuma9e7a811997-05-13 21:02:11 +00002136static PyMappingMethods dict_as_mapping = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002137 (lenfunc)dict_length, /*mp_length*/
2138 (binaryfunc)dict_subscript, /*mp_subscript*/
2139 (objobjargproc)dict_ass_sub, /*mp_ass_subscript*/
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002140};
2141
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002142static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002143dict_keys(PyDictObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002144{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002145 PyObject *v;
2146 Py_ssize_t i, j;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002147 PyDictKeyEntry *ep;
2148 Py_ssize_t size, n, offset;
2149 PyObject **value_ptr;
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002150
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002151 again:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002152 n = mp->ma_used;
2153 v = PyList_New(n);
2154 if (v == NULL)
2155 return NULL;
2156 if (n != mp->ma_used) {
2157 /* Durnit. The allocations caused the dict to resize.
2158 * Just start over, this shouldn't normally happen.
2159 */
2160 Py_DECREF(v);
2161 goto again;
2162 }
Victor Stinner742da042016-09-07 17:40:12 -07002163 ep = DK_ENTRIES(mp->ma_keys);
2164 size = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002165 if (mp->ma_values) {
2166 value_ptr = mp->ma_values;
2167 offset = sizeof(PyObject *);
2168 }
2169 else {
2170 value_ptr = &ep[0].me_value;
2171 offset = sizeof(PyDictKeyEntry);
2172 }
2173 for (i = 0, j = 0; i < size; i++) {
2174 if (*value_ptr != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002175 PyObject *key = ep[i].me_key;
2176 Py_INCREF(key);
2177 PyList_SET_ITEM(v, j, key);
2178 j++;
2179 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002180 value_ptr = (PyObject **)(((char *)value_ptr) + offset);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002181 }
2182 assert(j == n);
2183 return v;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002184}
2185
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002186static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002187dict_values(PyDictObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002188{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002189 PyObject *v;
2190 Py_ssize_t i, j;
Benjamin Petersonf0acae22016-09-08 09:50:08 -07002191 PyDictKeyEntry *ep;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002192 Py_ssize_t size, n, offset;
2193 PyObject **value_ptr;
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002194
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002195 again:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002196 n = mp->ma_used;
2197 v = PyList_New(n);
2198 if (v == NULL)
2199 return NULL;
2200 if (n != mp->ma_used) {
2201 /* Durnit. The allocations caused the dict to resize.
2202 * Just start over, this shouldn't normally happen.
2203 */
2204 Py_DECREF(v);
2205 goto again;
2206 }
Benjamin Petersonf0acae22016-09-08 09:50:08 -07002207 ep = DK_ENTRIES(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -07002208 size = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002209 if (mp->ma_values) {
2210 value_ptr = mp->ma_values;
2211 offset = sizeof(PyObject *);
2212 }
2213 else {
Benjamin Petersonf0acae22016-09-08 09:50:08 -07002214 value_ptr = &ep[0].me_value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002215 offset = sizeof(PyDictKeyEntry);
2216 }
2217 for (i = 0, j = 0; i < size; i++) {
2218 PyObject *value = *value_ptr;
2219 value_ptr = (PyObject **)(((char *)value_ptr) + offset);
2220 if (value != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002221 Py_INCREF(value);
2222 PyList_SET_ITEM(v, j, value);
2223 j++;
2224 }
2225 }
2226 assert(j == n);
2227 return v;
Guido van Rossum25831651993-05-19 14:50:45 +00002228}
2229
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002230static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002231dict_items(PyDictObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002232{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002233 PyObject *v;
2234 Py_ssize_t i, j, n;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002235 Py_ssize_t size, offset;
2236 PyObject *item, *key;
2237 PyDictKeyEntry *ep;
2238 PyObject **value_ptr;
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002239
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002240 /* Preallocate the list of tuples, to avoid allocations during
2241 * the loop over the items, which could trigger GC, which
2242 * could resize the dict. :-(
2243 */
Guido van Rossuma4dd0112001-04-15 22:16:26 +00002244 again:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002245 n = mp->ma_used;
2246 v = PyList_New(n);
2247 if (v == NULL)
2248 return NULL;
2249 for (i = 0; i < n; i++) {
2250 item = PyTuple_New(2);
2251 if (item == NULL) {
2252 Py_DECREF(v);
2253 return NULL;
2254 }
2255 PyList_SET_ITEM(v, i, item);
2256 }
2257 if (n != mp->ma_used) {
2258 /* Durnit. The allocations caused the dict to resize.
2259 * Just start over, this shouldn't normally happen.
2260 */
2261 Py_DECREF(v);
2262 goto again;
2263 }
2264 /* Nothing we do below makes any function calls. */
Victor Stinner742da042016-09-07 17:40:12 -07002265 ep = DK_ENTRIES(mp->ma_keys);
2266 size = mp->ma_keys->dk_nentries;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002267 if (mp->ma_values) {
2268 value_ptr = mp->ma_values;
2269 offset = sizeof(PyObject *);
2270 }
2271 else {
2272 value_ptr = &ep[0].me_value;
2273 offset = sizeof(PyDictKeyEntry);
2274 }
2275 for (i = 0, j = 0; i < size; i++) {
2276 PyObject *value = *value_ptr;
2277 value_ptr = (PyObject **)(((char *)value_ptr) + offset);
2278 if (value != NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002279 key = ep[i].me_key;
2280 item = PyList_GET_ITEM(v, j);
2281 Py_INCREF(key);
2282 PyTuple_SET_ITEM(item, 0, key);
2283 Py_INCREF(value);
2284 PyTuple_SET_ITEM(item, 1, value);
2285 j++;
2286 }
2287 }
2288 assert(j == n);
2289 return v;
Guido van Rossum25831651993-05-19 14:50:45 +00002290}
2291
Larry Hastings5c661892014-01-24 06:17:25 -08002292/*[clinic input]
2293@classmethod
2294dict.fromkeys
Larry Hastings5c661892014-01-24 06:17:25 -08002295 iterable: object
2296 value: object=None
2297 /
2298
2299Returns a new dict with keys from iterable and values equal to value.
2300[clinic start generated code]*/
2301
Larry Hastings5c661892014-01-24 06:17:25 -08002302static PyObject *
2303dict_fromkeys_impl(PyTypeObject *type, PyObject *iterable, PyObject *value)
Serhiy Storchaka1009bf12015-04-03 23:53:51 +03002304/*[clinic end generated code: output=8fb98e4b10384999 input=b85a667f9bf4669d]*/
Larry Hastings5c661892014-01-24 06:17:25 -08002305{
Eric Snow96c6af92015-05-29 22:21:39 -06002306 return _PyDict_FromKeys((PyObject *)type, iterable, value);
Raymond Hettingere33d3df2002-11-27 07:29:33 +00002307}
2308
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002309static int
Victor Stinner742da042016-09-07 17:40:12 -07002310dict_update_common(PyObject *self, PyObject *args, PyObject *kwds,
2311 const char *methname)
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002312{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002313 PyObject *arg = NULL;
2314 int result = 0;
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002315
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002316 if (!PyArg_UnpackTuple(args, methname, 0, 1, &arg))
2317 result = -1;
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002318
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002319 else if (arg != NULL) {
Martin v. Löwis1c67dd92011-10-14 15:16:45 +02002320 _Py_IDENTIFIER(keys);
2321 if (_PyObject_HasAttrId(arg, &PyId_keys))
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002322 result = PyDict_Merge(self, arg, 1);
2323 else
2324 result = PyDict_MergeFromSeq2(self, arg, 1);
2325 }
2326 if (result == 0 && kwds != NULL) {
2327 if (PyArg_ValidateKeywordArguments(kwds))
2328 result = PyDict_Merge(self, kwds, 1);
2329 else
2330 result = -1;
2331 }
2332 return result;
Raymond Hettinger31017ae2004-03-04 08:25:44 +00002333}
2334
2335static PyObject *
2336dict_update(PyObject *self, PyObject *args, PyObject *kwds)
2337{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002338 if (dict_update_common(self, args, kwds, "update") != -1)
2339 Py_RETURN_NONE;
2340 return NULL;
Tim Peters6d6c1a32001-08-02 04:15:00 +00002341}
2342
Guido van Rossum05ac6de2001-08-10 20:28:28 +00002343/* Update unconditionally replaces existing items.
2344 Merge has a 3rd argument 'override'; if set, it acts like Update,
Tim Peters1fc240e2001-10-26 05:06:50 +00002345 otherwise it leaves existing items unchanged.
2346
2347 PyDict_{Update,Merge} update/merge from a mapping object.
2348
Tim Petersf582b822001-12-11 18:51:08 +00002349 PyDict_MergeFromSeq2 updates/merges from any iterable object
Tim Peters1fc240e2001-10-26 05:06:50 +00002350 producing iterable objects of length 2.
2351*/
2352
Tim Petersf582b822001-12-11 18:51:08 +00002353int
Tim Peters1fc240e2001-10-26 05:06:50 +00002354PyDict_MergeFromSeq2(PyObject *d, PyObject *seq2, int override)
2355{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002356 PyObject *it; /* iter(seq2) */
2357 Py_ssize_t i; /* index into seq2 of current element */
2358 PyObject *item; /* seq2[i] */
2359 PyObject *fast; /* item as a 2-tuple or 2-list */
Tim Peters1fc240e2001-10-26 05:06:50 +00002360
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002361 assert(d != NULL);
2362 assert(PyDict_Check(d));
2363 assert(seq2 != NULL);
Tim Peters1fc240e2001-10-26 05:06:50 +00002364
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002365 it = PyObject_GetIter(seq2);
2366 if (it == NULL)
2367 return -1;
Tim Peters1fc240e2001-10-26 05:06:50 +00002368
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002369 for (i = 0; ; ++i) {
2370 PyObject *key, *value;
2371 Py_ssize_t n;
Tim Peters1fc240e2001-10-26 05:06:50 +00002372
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002373 fast = NULL;
2374 item = PyIter_Next(it);
2375 if (item == NULL) {
2376 if (PyErr_Occurred())
2377 goto Fail;
2378 break;
2379 }
Tim Peters1fc240e2001-10-26 05:06:50 +00002380
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002381 /* Convert item to sequence, and verify length 2. */
2382 fast = PySequence_Fast(item, "");
2383 if (fast == NULL) {
2384 if (PyErr_ExceptionMatches(PyExc_TypeError))
2385 PyErr_Format(PyExc_TypeError,
2386 "cannot convert dictionary update "
2387 "sequence element #%zd to a sequence",
2388 i);
2389 goto Fail;
2390 }
2391 n = PySequence_Fast_GET_SIZE(fast);
2392 if (n != 2) {
2393 PyErr_Format(PyExc_ValueError,
2394 "dictionary update sequence element #%zd "
2395 "has length %zd; 2 is required",
2396 i, n);
2397 goto Fail;
2398 }
Tim Peters1fc240e2001-10-26 05:06:50 +00002399
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002400 /* Update/merge with this (key, value) pair. */
2401 key = PySequence_Fast_GET_ITEM(fast, 0);
2402 value = PySequence_Fast_GET_ITEM(fast, 1);
2403 if (override || PyDict_GetItem(d, key) == NULL) {
2404 int status = PyDict_SetItem(d, key, value);
2405 if (status < 0)
2406 goto Fail;
2407 }
2408 Py_DECREF(fast);
2409 Py_DECREF(item);
2410 }
Tim Peters1fc240e2001-10-26 05:06:50 +00002411
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002412 i = 0;
Victor Stinner611b0fa2016-09-14 15:02:01 +02002413 assert(_PyDict_CheckConsistency((PyDictObject *)d));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002414 goto Return;
Tim Peters1fc240e2001-10-26 05:06:50 +00002415Fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002416 Py_XDECREF(item);
2417 Py_XDECREF(fast);
2418 i = -1;
Tim Peters1fc240e2001-10-26 05:06:50 +00002419Return:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002420 Py_DECREF(it);
2421 return Py_SAFE_DOWNCAST(i, Py_ssize_t, int);
Tim Peters1fc240e2001-10-26 05:06:50 +00002422}
2423
doko@ubuntu.comc96df682016-10-11 08:04:02 +02002424static int
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002425dict_merge(PyObject *a, PyObject *b, int override)
Guido van Rossum05ac6de2001-08-10 20:28:28 +00002426{
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002427 PyDictObject *mp, *other;
2428 Py_ssize_t i, n;
Victor Stinner742da042016-09-07 17:40:12 -07002429 PyDictKeyEntry *entry, *ep0;
Tim Peters6d6c1a32001-08-02 04:15:00 +00002430
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002431 assert(0 <= override && override <= 2);
2432
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002433 /* We accept for the argument either a concrete dictionary object,
2434 * or an abstract "mapping" object. For the former, we can do
2435 * things quite efficiently. For the latter, we only require that
2436 * PyMapping_Keys() and PyObject_GetItem() be supported.
2437 */
2438 if (a == NULL || !PyDict_Check(a) || b == NULL) {
2439 PyErr_BadInternalCall();
2440 return -1;
2441 }
2442 mp = (PyDictObject*)a;
2443 if (PyDict_Check(b)) {
2444 other = (PyDictObject*)b;
2445 if (other == mp || other->ma_used == 0)
2446 /* a.update(a) or a.update({}); nothing to do */
2447 return 0;
2448 if (mp->ma_used == 0)
2449 /* Since the target dict is empty, PyDict_GetItem()
2450 * always returns NULL. Setting override to 1
2451 * skips the unnecessary test.
2452 */
2453 override = 1;
2454 /* Do one big resize at the start, rather than
2455 * incrementally resizing as we insert new items. Expect
2456 * that there will be no (or few) overlapping keys.
2457 */
INADA Naokib1152be2016-10-27 19:26:50 +09002458 if (USABLE_FRACTION(mp->ma_keys->dk_size) < other->ma_used) {
2459 if (dictresize(mp, ESTIMATE_SIZE(mp->ma_used + other->ma_used))) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002460 return -1;
INADA Naokib1152be2016-10-27 19:26:50 +09002461 }
2462 }
Victor Stinner742da042016-09-07 17:40:12 -07002463 ep0 = DK_ENTRIES(other->ma_keys);
2464 for (i = 0, n = other->ma_keys->dk_nentries; i < n; i++) {
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002465 PyObject *key, *value;
2466 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002467 entry = &ep0[i];
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002468 key = entry->me_key;
2469 hash = entry->me_hash;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002470 if (other->ma_values)
2471 value = other->ma_values[i];
2472 else
2473 value = entry->me_value;
2474
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002475 if (value != NULL) {
2476 int err = 0;
2477 Py_INCREF(key);
2478 Py_INCREF(value);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02002479 if (override == 1)
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002480 err = insertdict(mp, key, hash, value);
Serhiy Storchakaf0b311b2016-11-06 13:18:24 +02002481 else if (_PyDict_GetItem_KnownHash(a, key, hash) == NULL) {
2482 if (PyErr_Occurred()) {
2483 Py_DECREF(value);
2484 Py_DECREF(key);
2485 return -1;
2486 }
2487 err = insertdict(mp, key, hash, value);
2488 }
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002489 else if (override != 0) {
2490 _PyErr_SetKeyError(key);
2491 Py_DECREF(value);
2492 Py_DECREF(key);
2493 return -1;
2494 }
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002495 Py_DECREF(value);
2496 Py_DECREF(key);
2497 if (err != 0)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002498 return -1;
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002499
Victor Stinner742da042016-09-07 17:40:12 -07002500 if (n != other->ma_keys->dk_nentries) {
Benjamin Petersona82f77f2015-07-04 19:55:16 -05002501 PyErr_SetString(PyExc_RuntimeError,
2502 "dict mutated during update");
2503 return -1;
2504 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002505 }
2506 }
2507 }
2508 else {
2509 /* Do it the generic, slower way */
2510 PyObject *keys = PyMapping_Keys(b);
2511 PyObject *iter;
2512 PyObject *key, *value;
2513 int status;
Barry Warsaw66a0d1d2001-06-26 20:08:32 +00002514
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002515 if (keys == NULL)
2516 /* Docstring says this is equivalent to E.keys() so
2517 * if E doesn't have a .keys() method we want
2518 * AttributeError to percolate up. Might as well
2519 * do the same for any other error.
2520 */
2521 return -1;
Barry Warsaw66a0d1d2001-06-26 20:08:32 +00002522
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002523 iter = PyObject_GetIter(keys);
2524 Py_DECREF(keys);
2525 if (iter == NULL)
2526 return -1;
Barry Warsaw66a0d1d2001-06-26 20:08:32 +00002527
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002528 for (key = PyIter_Next(iter); key; key = PyIter_Next(iter)) {
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002529 if (override != 1 && PyDict_GetItem(a, key) != NULL) {
2530 if (override != 0) {
2531 _PyErr_SetKeyError(key);
2532 Py_DECREF(key);
2533 Py_DECREF(iter);
2534 return -1;
2535 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002536 Py_DECREF(key);
2537 continue;
2538 }
2539 value = PyObject_GetItem(b, key);
2540 if (value == NULL) {
2541 Py_DECREF(iter);
2542 Py_DECREF(key);
2543 return -1;
2544 }
2545 status = PyDict_SetItem(a, key, value);
2546 Py_DECREF(key);
2547 Py_DECREF(value);
2548 if (status < 0) {
2549 Py_DECREF(iter);
2550 return -1;
2551 }
2552 }
2553 Py_DECREF(iter);
2554 if (PyErr_Occurred())
2555 /* Iterator completed, via error */
2556 return -1;
2557 }
Victor Stinner611b0fa2016-09-14 15:02:01 +02002558 assert(_PyDict_CheckConsistency((PyDictObject *)a));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002559 return 0;
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002560}
2561
Serhiy Storchakae036ef82016-10-02 11:06:43 +03002562int
2563PyDict_Update(PyObject *a, PyObject *b)
2564{
2565 return dict_merge(a, b, 1);
2566}
2567
2568int
2569PyDict_Merge(PyObject *a, PyObject *b, int override)
2570{
2571 /* XXX Deprecate override not in (0, 1). */
2572 return dict_merge(a, b, override != 0);
2573}
2574
2575int
2576_PyDict_MergeEx(PyObject *a, PyObject *b, int override)
2577{
2578 return dict_merge(a, b, override);
2579}
2580
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002581static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002582dict_copy(PyDictObject *mp)
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002583{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002584 return PyDict_Copy((PyObject*)mp);
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00002585}
2586
2587PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002588PyDict_Copy(PyObject *o)
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00002589{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002590 PyObject *copy;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002591 PyDictObject *mp;
2592 Py_ssize_t i, n;
Jeremy Hyltona12c7a72000-03-30 22:27:31 +00002593
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002594 if (o == NULL || !PyDict_Check(o)) {
2595 PyErr_BadInternalCall();
2596 return NULL;
2597 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002598 mp = (PyDictObject *)o;
2599 if (_PyDict_HasSplitTable(mp)) {
2600 PyDictObject *split_copy;
Victor Stinner742da042016-09-07 17:40:12 -07002601 Py_ssize_t size = USABLE_FRACTION(DK_SIZE(mp->ma_keys));
2602 PyObject **newvalues;
2603 newvalues = new_values(size);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002604 if (newvalues == NULL)
2605 return PyErr_NoMemory();
2606 split_copy = PyObject_GC_New(PyDictObject, &PyDict_Type);
2607 if (split_copy == NULL) {
2608 free_values(newvalues);
2609 return NULL;
2610 }
2611 split_copy->ma_values = newvalues;
2612 split_copy->ma_keys = mp->ma_keys;
2613 split_copy->ma_used = mp->ma_used;
2614 DK_INCREF(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -07002615 for (i = 0, n = size; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002616 PyObject *value = mp->ma_values[i];
2617 Py_XINCREF(value);
2618 split_copy->ma_values[i] = value;
2619 }
Benjamin Peterson7ce67e42012-04-24 10:32:57 -04002620 if (_PyObject_GC_IS_TRACKED(mp))
2621 _PyObject_GC_TRACK(split_copy);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002622 return (PyObject *)split_copy;
2623 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002624 copy = PyDict_New();
2625 if (copy == NULL)
2626 return NULL;
2627 if (PyDict_Merge(copy, o, 1) == 0)
2628 return copy;
2629 Py_DECREF(copy);
2630 return NULL;
Guido van Rossume3f5b9c1997-05-28 19:15:28 +00002631}
2632
Martin v. Löwis18e16552006-02-15 17:27:45 +00002633Py_ssize_t
Tim Peters1f5871e2000-07-04 17:44:48 +00002634PyDict_Size(PyObject *mp)
Guido van Rossum4199fac1993-11-05 10:18:44 +00002635{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002636 if (mp == NULL || !PyDict_Check(mp)) {
2637 PyErr_BadInternalCall();
2638 return -1;
2639 }
2640 return ((PyDictObject *)mp)->ma_used;
Guido van Rossum4199fac1993-11-05 10:18:44 +00002641}
2642
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002643PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002644PyDict_Keys(PyObject *mp)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002645{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002646 if (mp == NULL || !PyDict_Check(mp)) {
2647 PyErr_BadInternalCall();
2648 return NULL;
2649 }
2650 return dict_keys((PyDictObject *)mp);
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002651}
2652
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002653PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002654PyDict_Values(PyObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002655{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002656 if (mp == NULL || !PyDict_Check(mp)) {
2657 PyErr_BadInternalCall();
2658 return NULL;
2659 }
2660 return dict_values((PyDictObject *)mp);
Guido van Rossum25831651993-05-19 14:50:45 +00002661}
2662
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002663PyObject *
Tim Peters1f5871e2000-07-04 17:44:48 +00002664PyDict_Items(PyObject *mp)
Guido van Rossum25831651993-05-19 14:50:45 +00002665{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002666 if (mp == NULL || !PyDict_Check(mp)) {
2667 PyErr_BadInternalCall();
2668 return NULL;
2669 }
2670 return dict_items((PyDictObject *)mp);
Guido van Rossum25831651993-05-19 14:50:45 +00002671}
2672
Tim Peterse63415e2001-05-08 04:38:29 +00002673/* Return 1 if dicts equal, 0 if not, -1 if error.
2674 * Gets out as soon as any difference is detected.
2675 * Uses only Py_EQ comparison.
2676 */
2677static int
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002678dict_equal(PyDictObject *a, PyDictObject *b)
Tim Peterse63415e2001-05-08 04:38:29 +00002679{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002680 Py_ssize_t i;
Tim Peterse63415e2001-05-08 04:38:29 +00002681
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002682 if (a->ma_used != b->ma_used)
2683 /* can't be equal if # of entries differ */
2684 return 0;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002685 /* Same # of entries -- check all of 'em. Exit early on any diff. */
Victor Stinner742da042016-09-07 17:40:12 -07002686 for (i = 0; i < a->ma_keys->dk_nentries; i++) {
2687 PyDictKeyEntry *ep = &DK_ENTRIES(a->ma_keys)[i];
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002688 PyObject *aval;
2689 if (a->ma_values)
2690 aval = a->ma_values[i];
2691 else
2692 aval = ep->me_value;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002693 if (aval != NULL) {
2694 int cmp;
2695 PyObject *bval;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002696 PyObject *key = ep->me_key;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002697 /* temporarily bump aval's refcount to ensure it stays
2698 alive until we're done with it */
2699 Py_INCREF(aval);
2700 /* ditto for key */
2701 Py_INCREF(key);
Antoine Pitrou0e9958b2012-12-02 19:10:07 +01002702 /* reuse the known hash value */
INADA Naokiba609772016-12-07 20:41:42 +09002703 b->ma_keys->dk_lookup(b, key, ep->me_hash, &bval, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002704 Py_DECREF(key);
2705 if (bval == NULL) {
2706 Py_DECREF(aval);
2707 if (PyErr_Occurred())
2708 return -1;
2709 return 0;
2710 }
2711 cmp = PyObject_RichCompareBool(aval, bval, Py_EQ);
2712 Py_DECREF(aval);
2713 if (cmp <= 0) /* error or not equal */
2714 return cmp;
2715 }
2716 }
2717 return 1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002718}
Tim Peterse63415e2001-05-08 04:38:29 +00002719
2720static PyObject *
2721dict_richcompare(PyObject *v, PyObject *w, int op)
2722{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002723 int cmp;
2724 PyObject *res;
Tim Peterse63415e2001-05-08 04:38:29 +00002725
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002726 if (!PyDict_Check(v) || !PyDict_Check(w)) {
2727 res = Py_NotImplemented;
2728 }
2729 else if (op == Py_EQ || op == Py_NE) {
2730 cmp = dict_equal((PyDictObject *)v, (PyDictObject *)w);
2731 if (cmp < 0)
2732 return NULL;
2733 res = (cmp == (op == Py_EQ)) ? Py_True : Py_False;
2734 }
2735 else
2736 res = Py_NotImplemented;
2737 Py_INCREF(res);
2738 return res;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002739}
Tim Peterse63415e2001-05-08 04:38:29 +00002740
Larry Hastings61272b72014-01-07 12:41:53 -08002741/*[clinic input]
Larry Hastings31826802013-10-19 00:09:25 -07002742
2743@coexist
2744dict.__contains__
2745
2746 key: object
2747 /
2748
Meador Ingee02de8c2014-01-14 16:48:31 -06002749True if D has a key k, else False.
Larry Hastings61272b72014-01-07 12:41:53 -08002750[clinic start generated code]*/
Larry Hastings31826802013-10-19 00:09:25 -07002751
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002752static PyObject *
Larry Hastingsc2047262014-01-25 20:43:29 -08002753dict___contains__(PyDictObject *self, PyObject *key)
Serhiy Storchaka1009bf12015-04-03 23:53:51 +03002754/*[clinic end generated code: output=a3d03db709ed6e6b input=b852b2a19b51ab24]*/
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002755{
Larry Hastingsc2047262014-01-25 20:43:29 -08002756 register PyDictObject *mp = self;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002757 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002758 Py_ssize_t ix;
INADA Naokiba609772016-12-07 20:41:42 +09002759 PyObject *value;
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00002760
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002761 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002762 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002763 hash = PyObject_Hash(key);
2764 if (hash == -1)
2765 return NULL;
2766 }
INADA Naokiba609772016-12-07 20:41:42 +09002767 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07002768 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002769 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09002770 if (ix == DKIX_EMPTY || value == NULL)
Victor Stinner742da042016-09-07 17:40:12 -07002771 Py_RETURN_FALSE;
2772 Py_RETURN_TRUE;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00002773}
2774
Guido van Rossumc0b618a1997-05-02 03:12:38 +00002775static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002776dict_get(PyDictObject *mp, PyObject *args)
Barry Warsawc38c5da1997-10-06 17:49:20 +00002777{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002778 PyObject *key;
2779 PyObject *failobj = Py_None;
2780 PyObject *val = NULL;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002781 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002782 Py_ssize_t ix;
Barry Warsawc38c5da1997-10-06 17:49:20 +00002783
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002784 if (!PyArg_UnpackTuple(args, "get", 1, 2, &key, &failobj))
2785 return NULL;
Barry Warsawc38c5da1997-10-06 17:49:20 +00002786
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002787 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002788 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002789 hash = PyObject_Hash(key);
2790 if (hash == -1)
2791 return NULL;
2792 }
INADA Naokiba609772016-12-07 20:41:42 +09002793 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &val, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07002794 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002795 return NULL;
INADA Naokiba609772016-12-07 20:41:42 +09002796 if (ix == DKIX_EMPTY || val == NULL) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002797 val = failobj;
INADA Naokiba609772016-12-07 20:41:42 +09002798 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002799 Py_INCREF(val);
2800 return val;
Barry Warsawc38c5da1997-10-06 17:49:20 +00002801}
2802
Benjamin Peterson00e98862013-03-07 22:16:29 -05002803PyObject *
2804PyDict_SetDefault(PyObject *d, PyObject *key, PyObject *defaultobj)
Guido van Rossum164452c2000-08-08 16:12:54 +00002805{
Benjamin Peterson00e98862013-03-07 22:16:29 -05002806 PyDictObject *mp = (PyDictObject *)d;
INADA Naoki93f26f72016-11-02 18:45:16 +09002807 PyObject *value;
Benjamin Peterson8f67d082010-10-17 20:54:53 +00002808 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07002809 Py_ssize_t hashpos, ix;
Guido van Rossum164452c2000-08-08 16:12:54 +00002810
Benjamin Peterson00e98862013-03-07 22:16:29 -05002811 if (!PyDict_Check(d)) {
2812 PyErr_BadInternalCall();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002813 return NULL;
Benjamin Peterson00e98862013-03-07 22:16:29 -05002814 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002815
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002816 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02002817 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002818 hash = PyObject_Hash(key);
2819 if (hash == -1)
2820 return NULL;
2821 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002822
2823 if (mp->ma_values != NULL && !PyUnicode_CheckExact(key)) {
2824 if (insertion_resize(mp) < 0)
2825 return NULL;
2826 }
2827
INADA Naokiba609772016-12-07 20:41:42 +09002828 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, &hashpos);
Victor Stinner742da042016-09-07 17:40:12 -07002829 if (ix == DKIX_ERROR)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002830 return NULL;
INADA Naoki93f26f72016-11-02 18:45:16 +09002831
2832 if (_PyDict_HasSplitTable(mp) &&
INADA Naokiba609772016-12-07 20:41:42 +09002833 ((ix >= 0 && value == NULL && mp->ma_used != ix) ||
INADA Naoki93f26f72016-11-02 18:45:16 +09002834 (ix == DKIX_EMPTY && mp->ma_used != mp->ma_keys->dk_nentries))) {
2835 if (insertion_resize(mp) < 0) {
2836 return NULL;
2837 }
INADA Naokiba609772016-12-07 20:41:42 +09002838 hashpos = find_empty_slot(mp->ma_keys, key, hash);
INADA Naoki93f26f72016-11-02 18:45:16 +09002839 ix = DKIX_EMPTY;
2840 }
2841
2842 if (ix == DKIX_EMPTY) {
2843 PyDictKeyEntry *ep, *ep0;
2844 value = defaultobj;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002845 if (mp->ma_keys->dk_usable <= 0) {
Victor Stinner3c336c52016-09-12 14:17:40 +02002846 if (insertion_resize(mp) < 0) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002847 return NULL;
Victor Stinner3c336c52016-09-12 14:17:40 +02002848 }
INADA Naokiba609772016-12-07 20:41:42 +09002849 hashpos = find_empty_slot(mp->ma_keys, key, hash);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002850 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002851 ep0 = DK_ENTRIES(mp->ma_keys);
2852 ep = &ep0[mp->ma_keys->dk_nentries];
2853 dk_set_index(mp->ma_keys, hashpos, mp->ma_keys->dk_nentries);
Benjamin Petersonb1efa532013-03-04 09:47:50 -05002854 Py_INCREF(key);
INADA Naoki93f26f72016-11-02 18:45:16 +09002855 Py_INCREF(value);
2856 MAINTAIN_TRACKING(mp, key, value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002857 ep->me_key = key;
2858 ep->me_hash = hash;
INADA Naokiba609772016-12-07 20:41:42 +09002859 if (_PyDict_HasSplitTable(mp)) {
INADA Naoki93f26f72016-11-02 18:45:16 +09002860 assert(mp->ma_values[mp->ma_keys->dk_nentries] == NULL);
2861 mp->ma_values[mp->ma_keys->dk_nentries] = value;
Victor Stinner742da042016-09-07 17:40:12 -07002862 }
2863 else {
INADA Naoki93f26f72016-11-02 18:45:16 +09002864 ep->me_value = value;
Victor Stinner742da042016-09-07 17:40:12 -07002865 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002866 mp->ma_used++;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07002867 mp->ma_version_tag = DICT_NEXT_VERSION();
INADA Naoki93f26f72016-11-02 18:45:16 +09002868 mp->ma_keys->dk_usable--;
2869 mp->ma_keys->dk_nentries++;
2870 assert(mp->ma_keys->dk_usable >= 0);
2871 }
INADA Naokiba609772016-12-07 20:41:42 +09002872 else if (value == NULL) {
INADA Naoki93f26f72016-11-02 18:45:16 +09002873 value = defaultobj;
2874 assert(_PyDict_HasSplitTable(mp));
2875 assert(ix == mp->ma_used);
2876 Py_INCREF(value);
2877 MAINTAIN_TRACKING(mp, key, value);
INADA Naokiba609772016-12-07 20:41:42 +09002878 mp->ma_values[ix] = value;
INADA Naoki93f26f72016-11-02 18:45:16 +09002879 mp->ma_used++;
2880 mp->ma_version_tag = DICT_NEXT_VERSION();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002881 }
INADA Naoki93f26f72016-11-02 18:45:16 +09002882
2883 assert(_PyDict_CheckConsistency(mp));
2884 return value;
Guido van Rossum164452c2000-08-08 16:12:54 +00002885}
2886
Benjamin Peterson00e98862013-03-07 22:16:29 -05002887static PyObject *
2888dict_setdefault(PyDictObject *mp, PyObject *args)
2889{
2890 PyObject *key, *val;
2891 PyObject *defaultobj = Py_None;
2892
2893 if (!PyArg_UnpackTuple(args, "setdefault", 1, 2, &key, &defaultobj))
2894 return NULL;
2895
Benjamin Peterson55898502013-03-08 08:36:49 -05002896 val = PyDict_SetDefault((PyObject *)mp, key, defaultobj);
Benjamin Peterson00e98862013-03-07 22:16:29 -05002897 Py_XINCREF(val);
2898 return val;
2899}
Guido van Rossum164452c2000-08-08 16:12:54 +00002900
2901static PyObject *
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02002902dict_clear(PyDictObject *mp)
Guido van Rossumfb8f1ca1997-03-21 21:55:12 +00002903{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002904 PyDict_Clear((PyObject *)mp);
2905 Py_RETURN_NONE;
Guido van Rossumfb8f1ca1997-03-21 21:55:12 +00002906}
2907
Guido van Rossumba6ab842000-12-12 22:02:18 +00002908static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002909dict_pop(PyDictObject *mp, PyObject *args)
Guido van Rossume027d982002-04-12 15:11:59 +00002910{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002911 PyObject *key, *deflt = NULL;
Guido van Rossume027d982002-04-12 15:11:59 +00002912
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002913 if(!PyArg_UnpackTuple(args, "pop", 1, 2, &key, &deflt))
2914 return NULL;
Eric Snow96c6af92015-05-29 22:21:39 -06002915
Yury Selivanov684ef2c2016-10-28 19:01:21 -04002916 return _PyDict_Pop((PyObject*)mp, key, deflt);
Guido van Rossume027d982002-04-12 15:11:59 +00002917}
2918
2919static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00002920dict_popitem(PyDictObject *mp)
Guido van Rossumba6ab842000-12-12 22:02:18 +00002921{
Victor Stinner742da042016-09-07 17:40:12 -07002922 Py_ssize_t i, j;
2923 PyDictKeyEntry *ep0, *ep;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002924 PyObject *res;
Guido van Rossumba6ab842000-12-12 22:02:18 +00002925
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002926 /* Allocate the result tuple before checking the size. Believe it
2927 * or not, this allocation could trigger a garbage collection which
2928 * could empty the dict, so if we checked the size first and that
2929 * happened, the result would be an infinite loop (searching for an
2930 * entry that no longer exists). Note that the usual popitem()
2931 * idiom is "while d: k, v = d.popitem()". so needing to throw the
2932 * tuple away if the dict *is* empty isn't a significant
2933 * inefficiency -- possible, but unlikely in practice.
2934 */
2935 res = PyTuple_New(2);
2936 if (res == NULL)
2937 return NULL;
2938 if (mp->ma_used == 0) {
2939 Py_DECREF(res);
2940 PyErr_SetString(PyExc_KeyError,
2941 "popitem(): dictionary is empty");
2942 return NULL;
2943 }
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002944 /* Convert split table to combined table */
2945 if (mp->ma_keys->dk_lookup == lookdict_split) {
2946 if (dictresize(mp, DK_SIZE(mp->ma_keys))) {
2947 Py_DECREF(res);
2948 return NULL;
2949 }
2950 }
2951 ENSURE_ALLOWS_DELETIONS(mp);
Victor Stinner742da042016-09-07 17:40:12 -07002952
2953 /* Pop last item */
2954 ep0 = DK_ENTRIES(mp->ma_keys);
2955 i = mp->ma_keys->dk_nentries - 1;
2956 while (i >= 0 && ep0[i].me_value == NULL) {
2957 i--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002958 }
Victor Stinner742da042016-09-07 17:40:12 -07002959 assert(i >= 0);
2960
2961 ep = &ep0[i];
2962 j = lookdict_index(mp->ma_keys, ep->me_hash, i);
2963 assert(j >= 0);
2964 assert(dk_get_index(mp->ma_keys, j) == i);
2965 dk_set_index(mp->ma_keys, j, DKIX_DUMMY);
2966
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002967 PyTuple_SET_ITEM(res, 0, ep->me_key);
2968 PyTuple_SET_ITEM(res, 1, ep->me_value);
Victor Stinner742da042016-09-07 17:40:12 -07002969 ep->me_key = NULL;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002970 ep->me_value = NULL;
Victor Stinner742da042016-09-07 17:40:12 -07002971 /* We can't dk_usable++ since there is DKIX_DUMMY in indices */
2972 mp->ma_keys->dk_nentries = i;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002973 mp->ma_used--;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07002974 mp->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner611b0fa2016-09-14 15:02:01 +02002975 assert(_PyDict_CheckConsistency(mp));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00002976 return res;
Guido van Rossumba6ab842000-12-12 22:02:18 +00002977}
2978
Jeremy Hylton8caad492000-06-23 14:18:11 +00002979static int
2980dict_traverse(PyObject *op, visitproc visit, void *arg)
2981{
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002982 PyDictObject *mp = (PyDictObject *)op;
Benjamin Peterson55f44522016-09-05 12:12:59 -07002983 PyDictKeysObject *keys = mp->ma_keys;
Serhiy Storchaka46825d22016-09-26 21:29:34 +03002984 PyDictKeyEntry *entries = DK_ENTRIES(keys);
Victor Stinner742da042016-09-07 17:40:12 -07002985 Py_ssize_t i, n = keys->dk_nentries;
2986
Benjamin Peterson55f44522016-09-05 12:12:59 -07002987 if (keys->dk_lookup == lookdict) {
2988 for (i = 0; i < n; i++) {
2989 if (entries[i].me_value != NULL) {
2990 Py_VISIT(entries[i].me_value);
2991 Py_VISIT(entries[i].me_key);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002992 }
2993 }
Victor Stinner742da042016-09-07 17:40:12 -07002994 }
2995 else {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002996 if (mp->ma_values != NULL) {
Benjamin Peterson55f44522016-09-05 12:12:59 -07002997 for (i = 0; i < n; i++) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04002998 Py_VISIT(mp->ma_values[i]);
2999 }
3000 }
3001 else {
Benjamin Peterson55f44522016-09-05 12:12:59 -07003002 for (i = 0; i < n; i++) {
3003 Py_VISIT(entries[i].me_value);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003004 }
3005 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003006 }
3007 return 0;
Jeremy Hylton8caad492000-06-23 14:18:11 +00003008}
3009
3010static int
3011dict_tp_clear(PyObject *op)
3012{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003013 PyDict_Clear(op);
3014 return 0;
Jeremy Hylton8caad492000-06-23 14:18:11 +00003015}
3016
Guido van Rossum8ce8a782007-11-01 19:42:39 +00003017static PyObject *dictiter_new(PyDictObject *, PyTypeObject *);
Guido van Rossum09e563a2001-05-01 12:10:21 +00003018
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02003019Py_ssize_t
Eric Snow96c6af92015-05-29 22:21:39 -06003020_PyDict_SizeOf(PyDictObject *mp)
Martin v. Löwis00709aa2008-06-04 14:18:43 +00003021{
Victor Stinner742da042016-09-07 17:40:12 -07003022 Py_ssize_t size, usable, res;
Martin v. Löwis00709aa2008-06-04 14:18:43 +00003023
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003024 size = DK_SIZE(mp->ma_keys);
Victor Stinner742da042016-09-07 17:40:12 -07003025 usable = USABLE_FRACTION(size);
3026
Serhiy Storchaka5c4064e2015-12-19 20:05:25 +02003027 res = _PyObject_SIZE(Py_TYPE(mp));
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003028 if (mp->ma_values)
Victor Stinner742da042016-09-07 17:40:12 -07003029 res += usable * sizeof(PyObject*);
Martin v. Loewis4f2f3b62012-04-24 19:13:57 +02003030 /* If the dictionary is split, the keys portion is accounted-for
3031 in the type object. */
3032 if (mp->ma_keys->dk_refcnt == 1)
Victor Stinner98ee9d52016-09-08 09:33:56 -07003033 res += (sizeof(PyDictKeysObject)
3034 - Py_MEMBER_SIZE(PyDictKeysObject, dk_indices)
3035 + DK_IXSIZE(mp->ma_keys) * size
3036 + sizeof(PyDictKeyEntry) * usable);
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02003037 return res;
Martin v. Loewis4f2f3b62012-04-24 19:13:57 +02003038}
3039
3040Py_ssize_t
3041_PyDict_KeysSize(PyDictKeysObject *keys)
3042{
Victor Stinner98ee9d52016-09-08 09:33:56 -07003043 return (sizeof(PyDictKeysObject)
3044 - Py_MEMBER_SIZE(PyDictKeysObject, dk_indices)
3045 + DK_IXSIZE(keys) * DK_SIZE(keys)
3046 + USABLE_FRACTION(DK_SIZE(keys)) * sizeof(PyDictKeyEntry));
Martin v. Löwis00709aa2008-06-04 14:18:43 +00003047}
3048
doko@ubuntu.com17210f52016-01-14 14:04:59 +01003049static PyObject *
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02003050dict_sizeof(PyDictObject *mp)
3051{
3052 return PyLong_FromSsize_t(_PyDict_SizeOf(mp));
3053}
3054
Raymond Hettinger8f5cdaa2003-12-13 11:26:12 +00003055PyDoc_STRVAR(getitem__doc__, "x.__getitem__(y) <==> x[y]");
3056
Martin v. Löwis00709aa2008-06-04 14:18:43 +00003057PyDoc_STRVAR(sizeof__doc__,
3058"D.__sizeof__() -> size of D in memory, in bytes");
3059
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003060PyDoc_STRVAR(get__doc__,
Guido van Rossumefae8862002-09-04 11:29:45 +00003061"D.get(k[,d]) -> D[k] if k in D, else d. d defaults to None.");
Tim Petersf7f88b12000-12-13 23:18:45 +00003062
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003063PyDoc_STRVAR(setdefault_doc__,
Guido van Rossumefae8862002-09-04 11:29:45 +00003064"D.setdefault(k[,d]) -> D.get(k,d), also set D[k]=d if k not in D");
Tim Petersf7f88b12000-12-13 23:18:45 +00003065
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003066PyDoc_STRVAR(pop__doc__,
Benjamin Petersonf10a79a2008-10-11 00:49:57 +00003067"D.pop(k[,d]) -> v, remove specified key and return the corresponding value.\n\
Raymond Hettingera3e1e4c2003-03-06 23:54:28 +00003068If key is not found, d is returned if given, otherwise KeyError is raised");
Guido van Rossume027d982002-04-12 15:11:59 +00003069
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003070PyDoc_STRVAR(popitem__doc__,
Tim Petersf7f88b12000-12-13 23:18:45 +00003071"D.popitem() -> (k, v), remove and return some (key, value) pair as a\n\
Benjamin Petersonf10a79a2008-10-11 00:49:57 +000030722-tuple; but raise KeyError if D is empty.");
Tim Petersf7f88b12000-12-13 23:18:45 +00003073
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003074PyDoc_STRVAR(update__doc__,
Brett Cannonf2754162013-05-11 14:46:48 -04003075"D.update([E, ]**F) -> None. Update D from dict/iterable E and F.\n\
3076If E is present and has a .keys() method, then does: for k in E: D[k] = E[k]\n\
3077If E is present and lacks a .keys() method, then does: for k, v in E: D[k] = v\n\
3078In either case, this is followed by: for k in F: D[k] = F[k]");
Tim Petersf7f88b12000-12-13 23:18:45 +00003079
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003080PyDoc_STRVAR(clear__doc__,
3081"D.clear() -> None. Remove all items from D.");
Tim Petersf7f88b12000-12-13 23:18:45 +00003082
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003083PyDoc_STRVAR(copy__doc__,
3084"D.copy() -> a shallow copy of D");
Tim Petersf7f88b12000-12-13 23:18:45 +00003085
Guido van Rossumb90c8482007-02-10 01:11:45 +00003086/* Forward */
3087static PyObject *dictkeys_new(PyObject *);
3088static PyObject *dictitems_new(PyObject *);
3089static PyObject *dictvalues_new(PyObject *);
3090
Guido van Rossum45c85d12007-07-27 16:31:40 +00003091PyDoc_STRVAR(keys__doc__,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003092 "D.keys() -> a set-like object providing a view on D's keys");
Guido van Rossum45c85d12007-07-27 16:31:40 +00003093PyDoc_STRVAR(items__doc__,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003094 "D.items() -> a set-like object providing a view on D's items");
Guido van Rossum45c85d12007-07-27 16:31:40 +00003095PyDoc_STRVAR(values__doc__,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003096 "D.values() -> an object providing a view on D's values");
Guido van Rossumb90c8482007-02-10 01:11:45 +00003097
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003098static PyMethodDef mapp_methods[] = {
Larry Hastings31826802013-10-19 00:09:25 -07003099 DICT___CONTAINS___METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003100 {"__getitem__", (PyCFunction)dict_subscript, METH_O | METH_COEXIST,
3101 getitem__doc__},
Serhiy Storchaka0ce7a3a2015-12-22 08:16:18 +02003102 {"__sizeof__", (PyCFunction)dict_sizeof, METH_NOARGS,
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003103 sizeof__doc__},
3104 {"get", (PyCFunction)dict_get, METH_VARARGS,
3105 get__doc__},
3106 {"setdefault", (PyCFunction)dict_setdefault, METH_VARARGS,
3107 setdefault_doc__},
3108 {"pop", (PyCFunction)dict_pop, METH_VARARGS,
3109 pop__doc__},
3110 {"popitem", (PyCFunction)dict_popitem, METH_NOARGS,
3111 popitem__doc__},
3112 {"keys", (PyCFunction)dictkeys_new, METH_NOARGS,
3113 keys__doc__},
3114 {"items", (PyCFunction)dictitems_new, METH_NOARGS,
3115 items__doc__},
3116 {"values", (PyCFunction)dictvalues_new, METH_NOARGS,
3117 values__doc__},
3118 {"update", (PyCFunction)dict_update, METH_VARARGS | METH_KEYWORDS,
3119 update__doc__},
Larry Hastings5c661892014-01-24 06:17:25 -08003120 DICT_FROMKEYS_METHODDEF
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003121 {"clear", (PyCFunction)dict_clear, METH_NOARGS,
3122 clear__doc__},
3123 {"copy", (PyCFunction)dict_copy, METH_NOARGS,
3124 copy__doc__},
3125 {NULL, NULL} /* sentinel */
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003126};
3127
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00003128/* Return 1 if `key` is in dict `op`, 0 if not, and -1 on error. */
Raymond Hettingerbc0f2ab2003-11-25 21:12:14 +00003129int
3130PyDict_Contains(PyObject *op, PyObject *key)
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003131{
Benjamin Peterson8f67d082010-10-17 20:54:53 +00003132 Py_hash_t hash;
Victor Stinner742da042016-09-07 17:40:12 -07003133 Py_ssize_t ix;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003134 PyDictObject *mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09003135 PyObject *value;
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003136
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003137 if (!PyUnicode_CheckExact(key) ||
Martin v. Löwisd63a3b82011-09-28 07:41:54 +02003138 (hash = ((PyASCIIObject *) key)->hash) == -1) {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003139 hash = PyObject_Hash(key);
3140 if (hash == -1)
3141 return -1;
3142 }
INADA Naokiba609772016-12-07 20:41:42 +09003143 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07003144 if (ix == DKIX_ERROR)
3145 return -1;
INADA Naokiba609772016-12-07 20:41:42 +09003146 return (ix != DKIX_EMPTY && value != NULL);
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003147}
3148
Thomas Wouterscf297e42007-02-23 15:07:44 +00003149/* Internal version of PyDict_Contains used when the hash value is already known */
3150int
Benjamin Peterson8f67d082010-10-17 20:54:53 +00003151_PyDict_Contains(PyObject *op, PyObject *key, Py_hash_t hash)
Thomas Wouterscf297e42007-02-23 15:07:44 +00003152{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003153 PyDictObject *mp = (PyDictObject *)op;
INADA Naokiba609772016-12-07 20:41:42 +09003154 PyObject *value;
Victor Stinner742da042016-09-07 17:40:12 -07003155 Py_ssize_t ix;
Thomas Wouterscf297e42007-02-23 15:07:44 +00003156
INADA Naokiba609772016-12-07 20:41:42 +09003157 ix = (mp->ma_keys->dk_lookup)(mp, key, hash, &value, NULL);
Victor Stinner742da042016-09-07 17:40:12 -07003158 if (ix == DKIX_ERROR)
3159 return -1;
INADA Naokiba609772016-12-07 20:41:42 +09003160 return (ix != DKIX_EMPTY && value != NULL);
Thomas Wouterscf297e42007-02-23 15:07:44 +00003161}
3162
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003163/* Hack to implement "key in dict" */
3164static PySequenceMethods dict_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003165 0, /* sq_length */
3166 0, /* sq_concat */
3167 0, /* sq_repeat */
3168 0, /* sq_item */
3169 0, /* sq_slice */
3170 0, /* sq_ass_item */
3171 0, /* sq_ass_slice */
3172 PyDict_Contains, /* sq_contains */
3173 0, /* sq_inplace_concat */
3174 0, /* sq_inplace_repeat */
Guido van Rossum0dbb4fb2001-04-20 16:50:40 +00003175};
3176
Guido van Rossum09e563a2001-05-01 12:10:21 +00003177static PyObject *
Tim Peters6d6c1a32001-08-02 04:15:00 +00003178dict_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
3179{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003180 PyObject *self;
Victor Stinnera9f61a52013-07-16 22:17:26 +02003181 PyDictObject *d;
Tim Peters6d6c1a32001-08-02 04:15:00 +00003182
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003183 assert(type != NULL && type->tp_alloc != NULL);
3184 self = type->tp_alloc(type, 0);
Victor Stinnera9f61a52013-07-16 22:17:26 +02003185 if (self == NULL)
3186 return NULL;
Victor Stinnera9f61a52013-07-16 22:17:26 +02003187 d = (PyDictObject *)self;
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02003188
Victor Stinnera9f61a52013-07-16 22:17:26 +02003189 /* The object has been implicitly tracked by tp_alloc */
3190 if (type == &PyDict_Type)
3191 _PyObject_GC_UNTRACK(d);
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02003192
3193 d->ma_used = 0;
Victor Stinner3b6a6b42016-09-08 12:51:24 -07003194 d->ma_version_tag = DICT_NEXT_VERSION();
Victor Stinner742da042016-09-07 17:40:12 -07003195 d->ma_keys = new_keys_object(PyDict_MINSIZE);
Victor Stinnerac2a4fe2013-07-16 22:19:00 +02003196 if (d->ma_keys == NULL) {
3197 Py_DECREF(self);
3198 return NULL;
3199 }
Victor Stinner611b0fa2016-09-14 15:02:01 +02003200 assert(_PyDict_CheckConsistency(d));
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003201 return self;
Tim Peters6d6c1a32001-08-02 04:15:00 +00003202}
3203
Tim Peters25786c02001-09-02 08:22:48 +00003204static int
3205dict_init(PyObject *self, PyObject *args, PyObject *kwds)
3206{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003207 return dict_update_common(self, args, kwds, "dict");
Tim Peters25786c02001-09-02 08:22:48 +00003208}
3209
Tim Peters6d6c1a32001-08-02 04:15:00 +00003210static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00003211dict_iter(PyDictObject *dict)
Guido van Rossum09e563a2001-05-01 12:10:21 +00003212{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003213 return dictiter_new(dict, &PyDictIterKey_Type);
Guido van Rossum09e563a2001-05-01 12:10:21 +00003214}
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003215
Martin v. Löwis14f8b4c2002-06-13 20:33:02 +00003216PyDoc_STRVAR(dictionary_doc,
Ezio Melotti7f807b72010-03-01 04:08:34 +00003217"dict() -> new empty dictionary\n"
Tim Petersa427a2b2001-10-29 22:25:45 +00003218"dict(mapping) -> new dictionary initialized from a mapping object's\n"
Ezio Melotti7f807b72010-03-01 04:08:34 +00003219" (key, value) pairs\n"
3220"dict(iterable) -> new dictionary initialized as if via:\n"
Tim Peters4d859532001-10-27 18:27:48 +00003221" d = {}\n"
Ezio Melotti7f807b72010-03-01 04:08:34 +00003222" for k, v in iterable:\n"
Just van Rossuma797d812002-11-23 09:45:04 +00003223" d[k] = v\n"
3224"dict(**kwargs) -> new dictionary initialized with the name=value pairs\n"
3225" in the keyword argument list. For example: dict(one=1, two=2)");
Tim Peters25786c02001-09-02 08:22:48 +00003226
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003227PyTypeObject PyDict_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003228 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3229 "dict",
3230 sizeof(PyDictObject),
3231 0,
3232 (destructor)dict_dealloc, /* tp_dealloc */
3233 0, /* tp_print */
3234 0, /* tp_getattr */
3235 0, /* tp_setattr */
3236 0, /* tp_reserved */
3237 (reprfunc)dict_repr, /* tp_repr */
3238 0, /* tp_as_number */
3239 &dict_as_sequence, /* tp_as_sequence */
3240 &dict_as_mapping, /* tp_as_mapping */
Georg Brandl00da4e02010-10-18 07:32:48 +00003241 PyObject_HashNotImplemented, /* tp_hash */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003242 0, /* tp_call */
3243 0, /* tp_str */
3244 PyObject_GenericGetAttr, /* tp_getattro */
3245 0, /* tp_setattro */
3246 0, /* tp_as_buffer */
3247 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
3248 Py_TPFLAGS_BASETYPE | Py_TPFLAGS_DICT_SUBCLASS, /* tp_flags */
3249 dictionary_doc, /* tp_doc */
3250 dict_traverse, /* tp_traverse */
3251 dict_tp_clear, /* tp_clear */
3252 dict_richcompare, /* tp_richcompare */
3253 0, /* tp_weaklistoffset */
3254 (getiterfunc)dict_iter, /* tp_iter */
3255 0, /* tp_iternext */
3256 mapp_methods, /* tp_methods */
3257 0, /* tp_members */
3258 0, /* tp_getset */
3259 0, /* tp_base */
3260 0, /* tp_dict */
3261 0, /* tp_descr_get */
3262 0, /* tp_descr_set */
3263 0, /* tp_dictoffset */
3264 dict_init, /* tp_init */
3265 PyType_GenericAlloc, /* tp_alloc */
3266 dict_new, /* tp_new */
3267 PyObject_GC_Del, /* tp_free */
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003268};
3269
Victor Stinner3c1e4812012-03-26 22:10:51 +02003270PyObject *
3271_PyDict_GetItemId(PyObject *dp, struct _Py_Identifier *key)
3272{
3273 PyObject *kv;
3274 kv = _PyUnicode_FromId(key); /* borrowed */
Victor Stinner5b3b1002013-07-22 23:50:57 +02003275 if (kv == NULL) {
3276 PyErr_Clear();
Victor Stinner3c1e4812012-03-26 22:10:51 +02003277 return NULL;
Victor Stinner5b3b1002013-07-22 23:50:57 +02003278 }
Victor Stinner3c1e4812012-03-26 22:10:51 +02003279 return PyDict_GetItem(dp, kv);
3280}
3281
Guido van Rossum3cca2451997-05-16 14:23:33 +00003282/* For backward compatibility with old dictionary interface */
3283
Guido van Rossumc0b618a1997-05-02 03:12:38 +00003284PyObject *
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +00003285PyDict_GetItemString(PyObject *v, const char *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003286{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003287 PyObject *kv, *rv;
3288 kv = PyUnicode_FromString(key);
Victor Stinnerfdcbab92013-07-16 22:16:05 +02003289 if (kv == NULL) {
3290 PyErr_Clear();
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003291 return NULL;
Victor Stinnerfdcbab92013-07-16 22:16:05 +02003292 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003293 rv = PyDict_GetItem(v, kv);
3294 Py_DECREF(kv);
3295 return rv;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003296}
3297
3298int
Victor Stinner3c1e4812012-03-26 22:10:51 +02003299_PyDict_SetItemId(PyObject *v, struct _Py_Identifier *key, PyObject *item)
3300{
3301 PyObject *kv;
3302 kv = _PyUnicode_FromId(key); /* borrowed */
3303 if (kv == NULL)
3304 return -1;
3305 return PyDict_SetItem(v, kv, item);
3306}
3307
3308int
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +00003309PyDict_SetItemString(PyObject *v, const char *key, PyObject *item)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003310{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003311 PyObject *kv;
3312 int err;
3313 kv = PyUnicode_FromString(key);
3314 if (kv == NULL)
3315 return -1;
3316 PyUnicode_InternInPlace(&kv); /* XXX Should we really? */
3317 err = PyDict_SetItem(v, kv, item);
3318 Py_DECREF(kv);
3319 return err;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003320}
3321
3322int
Victor Stinner5fd2e5a2013-11-06 18:58:22 +01003323_PyDict_DelItemId(PyObject *v, _Py_Identifier *key)
3324{
3325 PyObject *kv = _PyUnicode_FromId(key); /* borrowed */
3326 if (kv == NULL)
3327 return -1;
3328 return PyDict_DelItem(v, kv);
3329}
3330
3331int
Martin v. Löwis32b4a1b2002-12-11 13:21:12 +00003332PyDict_DelItemString(PyObject *v, const char *key)
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003333{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003334 PyObject *kv;
3335 int err;
3336 kv = PyUnicode_FromString(key);
3337 if (kv == NULL)
3338 return -1;
3339 err = PyDict_DelItem(v, kv);
3340 Py_DECREF(kv);
3341 return err;
Guido van Rossum4b1302b1993-03-27 18:11:32 +00003342}
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003343
Raymond Hettinger019a1482004-03-18 02:41:19 +00003344/* Dictionary iterator types */
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003345
3346typedef struct {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003347 PyObject_HEAD
3348 PyDictObject *di_dict; /* Set to NULL when iterator is exhausted */
3349 Py_ssize_t di_used;
3350 Py_ssize_t di_pos;
3351 PyObject* di_result; /* reusable result tuple for iteritems */
3352 Py_ssize_t len;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003353} dictiterobject;
3354
3355static PyObject *
Guido van Rossum8ce8a782007-11-01 19:42:39 +00003356dictiter_new(PyDictObject *dict, PyTypeObject *itertype)
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003357{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003358 dictiterobject *di;
3359 di = PyObject_GC_New(dictiterobject, itertype);
3360 if (di == NULL)
3361 return NULL;
3362 Py_INCREF(dict);
3363 di->di_dict = dict;
3364 di->di_used = dict->ma_used;
3365 di->di_pos = 0;
3366 di->len = dict->ma_used;
3367 if (itertype == &PyDictIterItem_Type) {
3368 di->di_result = PyTuple_Pack(2, Py_None, Py_None);
3369 if (di->di_result == NULL) {
3370 Py_DECREF(di);
3371 return NULL;
3372 }
3373 }
3374 else
3375 di->di_result = NULL;
3376 _PyObject_GC_TRACK(di);
3377 return (PyObject *)di;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003378}
3379
3380static void
3381dictiter_dealloc(dictiterobject *di)
3382{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003383 Py_XDECREF(di->di_dict);
3384 Py_XDECREF(di->di_result);
3385 PyObject_GC_Del(di);
Antoine Pitrou7ddda782009-01-01 15:35:33 +00003386}
3387
3388static int
3389dictiter_traverse(dictiterobject *di, visitproc visit, void *arg)
3390{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003391 Py_VISIT(di->di_dict);
3392 Py_VISIT(di->di_result);
3393 return 0;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003394}
3395
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00003396static PyObject *
Raymond Hettinger0ce6dc82004-03-18 08:38:00 +00003397dictiter_len(dictiterobject *di)
3398{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003399 Py_ssize_t len = 0;
3400 if (di->di_dict != NULL && di->di_used == di->di_dict->ma_used)
3401 len = di->len;
3402 return PyLong_FromSize_t(len);
Raymond Hettinger0ce6dc82004-03-18 08:38:00 +00003403}
3404
Guido van Rossumb90c8482007-02-10 01:11:45 +00003405PyDoc_STRVAR(length_hint_doc,
3406 "Private method returning an estimate of len(list(it)).");
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00003407
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003408static PyObject *
3409dictiter_reduce(dictiterobject *di);
3410
3411PyDoc_STRVAR(reduce_doc, "Return state information for pickling.");
3412
Raymond Hettinger6b27cda2005-09-24 21:23:05 +00003413static PyMethodDef dictiter_methods[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003414 {"__length_hint__", (PyCFunction)dictiter_len, METH_NOARGS,
3415 length_hint_doc},
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003416 {"__reduce__", (PyCFunction)dictiter_reduce, METH_NOARGS,
3417 reduce_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003418 {NULL, NULL} /* sentinel */
Raymond Hettinger0ce6dc82004-03-18 08:38:00 +00003419};
3420
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003421static PyObject*
3422dictiter_iternextkey(dictiterobject *di)
Guido van Rossum213c7a62001-04-23 14:08:49 +00003423{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003424 PyObject *key;
INADA Naokica2d8be2016-11-04 16:59:10 +09003425 Py_ssize_t i;
Antoine Pitrou9ed5f272013-08-13 20:18:52 +02003426 PyDictKeysObject *k;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003427 PyDictObject *d = di->di_dict;
Guido van Rossum213c7a62001-04-23 14:08:49 +00003428
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003429 if (d == NULL)
3430 return NULL;
3431 assert (PyDict_Check(d));
Guido van Rossum2147df72002-07-16 20:30:22 +00003432
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003433 if (di->di_used != d->ma_used) {
3434 PyErr_SetString(PyExc_RuntimeError,
3435 "dictionary changed size during iteration");
3436 di->di_used = -1; /* Make this state sticky */
3437 return NULL;
3438 }
Guido van Rossum2147df72002-07-16 20:30:22 +00003439
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003440 i = di->di_pos;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003441 k = d->ma_keys;
INADA Naokica2d8be2016-11-04 16:59:10 +09003442 assert(i >= 0);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003443 if (d->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09003444 if (i >= d->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003445 goto fail;
3446 key = DK_ENTRIES(k)[i].me_key;
INADA Naokica2d8be2016-11-04 16:59:10 +09003447 assert(d->ma_values[i] != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003448 }
3449 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09003450 Py_ssize_t n = k->dk_nentries;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003451 PyDictKeyEntry *entry_ptr = &DK_ENTRIES(k)[i];
3452 while (i < n && entry_ptr->me_value == NULL) {
3453 entry_ptr++;
3454 i++;
3455 }
3456 if (i >= n)
3457 goto fail;
3458 key = entry_ptr->me_key;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003459 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003460 di->di_pos = i+1;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003461 di->len--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003462 Py_INCREF(key);
3463 return key;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003464
3465fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003466 di->di_dict = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003467 Py_DECREF(d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003468 return NULL;
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003469}
3470
Raymond Hettinger019a1482004-03-18 02:41:19 +00003471PyTypeObject PyDictIterKey_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003472 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3473 "dict_keyiterator", /* tp_name */
3474 sizeof(dictiterobject), /* tp_basicsize */
3475 0, /* tp_itemsize */
3476 /* methods */
3477 (destructor)dictiter_dealloc, /* tp_dealloc */
3478 0, /* tp_print */
3479 0, /* tp_getattr */
3480 0, /* tp_setattr */
3481 0, /* tp_reserved */
3482 0, /* tp_repr */
3483 0, /* tp_as_number */
3484 0, /* tp_as_sequence */
3485 0, /* tp_as_mapping */
3486 0, /* tp_hash */
3487 0, /* tp_call */
3488 0, /* tp_str */
3489 PyObject_GenericGetAttr, /* tp_getattro */
3490 0, /* tp_setattro */
3491 0, /* tp_as_buffer */
3492 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3493 0, /* tp_doc */
3494 (traverseproc)dictiter_traverse, /* tp_traverse */
3495 0, /* tp_clear */
3496 0, /* tp_richcompare */
3497 0, /* tp_weaklistoffset */
3498 PyObject_SelfIter, /* tp_iter */
3499 (iternextfunc)dictiter_iternextkey, /* tp_iternext */
3500 dictiter_methods, /* tp_methods */
3501 0,
Raymond Hettinger019a1482004-03-18 02:41:19 +00003502};
3503
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003504static PyObject *
3505dictiter_iternextvalue(dictiterobject *di)
Raymond Hettinger019a1482004-03-18 02:41:19 +00003506{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003507 PyObject *value;
INADA Naokica2d8be2016-11-04 16:59:10 +09003508 Py_ssize_t i;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003509 PyDictObject *d = di->di_dict;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003510
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003511 if (d == NULL)
3512 return NULL;
3513 assert (PyDict_Check(d));
Raymond Hettinger019a1482004-03-18 02:41:19 +00003514
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003515 if (di->di_used != d->ma_used) {
3516 PyErr_SetString(PyExc_RuntimeError,
3517 "dictionary changed size during iteration");
3518 di->di_used = -1; /* Make this state sticky */
3519 return NULL;
3520 }
Raymond Hettinger019a1482004-03-18 02:41:19 +00003521
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003522 i = di->di_pos;
INADA Naokica2d8be2016-11-04 16:59:10 +09003523 assert(i >= 0);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003524 if (d->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09003525 if (i >= d->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003526 goto fail;
INADA Naokica2d8be2016-11-04 16:59:10 +09003527 value = d->ma_values[i];
3528 assert(value != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003529 }
3530 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09003531 Py_ssize_t n = d->ma_keys->dk_nentries;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003532 PyDictKeyEntry *entry_ptr = &DK_ENTRIES(d->ma_keys)[i];
3533 while (i < n && entry_ptr->me_value == NULL) {
3534 entry_ptr++;
3535 i++;
3536 }
3537 if (i >= n)
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003538 goto fail;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003539 value = entry_ptr->me_value;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003540 }
3541 di->di_pos = i+1;
3542 di->len--;
3543 Py_INCREF(value);
3544 return value;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003545
3546fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003547 di->di_dict = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003548 Py_DECREF(d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003549 return NULL;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003550}
3551
3552PyTypeObject PyDictIterValue_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003553 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3554 "dict_valueiterator", /* tp_name */
3555 sizeof(dictiterobject), /* tp_basicsize */
3556 0, /* tp_itemsize */
3557 /* methods */
3558 (destructor)dictiter_dealloc, /* tp_dealloc */
3559 0, /* tp_print */
3560 0, /* tp_getattr */
3561 0, /* tp_setattr */
3562 0, /* tp_reserved */
3563 0, /* tp_repr */
3564 0, /* tp_as_number */
3565 0, /* tp_as_sequence */
3566 0, /* tp_as_mapping */
3567 0, /* tp_hash */
3568 0, /* tp_call */
3569 0, /* tp_str */
3570 PyObject_GenericGetAttr, /* tp_getattro */
3571 0, /* tp_setattro */
3572 0, /* tp_as_buffer */
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003573 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC, /* tp_flags */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003574 0, /* tp_doc */
3575 (traverseproc)dictiter_traverse, /* tp_traverse */
3576 0, /* tp_clear */
3577 0, /* tp_richcompare */
3578 0, /* tp_weaklistoffset */
3579 PyObject_SelfIter, /* tp_iter */
3580 (iternextfunc)dictiter_iternextvalue, /* tp_iternext */
3581 dictiter_methods, /* tp_methods */
3582 0,
Raymond Hettinger019a1482004-03-18 02:41:19 +00003583};
3584
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003585static PyObject *
3586dictiter_iternextitem(dictiterobject *di)
Raymond Hettinger019a1482004-03-18 02:41:19 +00003587{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003588 PyObject *key, *value, *result = di->di_result;
INADA Naokica2d8be2016-11-04 16:59:10 +09003589 Py_ssize_t i;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003590 PyDictObject *d = di->di_dict;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003591
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003592 if (d == NULL)
3593 return NULL;
3594 assert (PyDict_Check(d));
Raymond Hettinger019a1482004-03-18 02:41:19 +00003595
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003596 if (di->di_used != d->ma_used) {
3597 PyErr_SetString(PyExc_RuntimeError,
3598 "dictionary changed size during iteration");
3599 di->di_used = -1; /* Make this state sticky */
3600 return NULL;
3601 }
Raymond Hettinger019a1482004-03-18 02:41:19 +00003602
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003603 i = di->di_pos;
INADA Naokica2d8be2016-11-04 16:59:10 +09003604 assert(i >= 0);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003605 if (d->ma_values) {
INADA Naokica2d8be2016-11-04 16:59:10 +09003606 if (i >= d->ma_used)
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003607 goto fail;
3608 key = DK_ENTRIES(d->ma_keys)[i].me_key;
INADA Naokica2d8be2016-11-04 16:59:10 +09003609 value = d->ma_values[i];
3610 assert(value != NULL);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003611 }
3612 else {
INADA Naokica2d8be2016-11-04 16:59:10 +09003613 Py_ssize_t n = d->ma_keys->dk_nentries;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003614 PyDictKeyEntry *entry_ptr = &DK_ENTRIES(d->ma_keys)[i];
3615 while (i < n && entry_ptr->me_value == NULL) {
3616 entry_ptr++;
3617 i++;
3618 }
3619 if (i >= n)
3620 goto fail;
3621 key = entry_ptr->me_key;
3622 value = entry_ptr->me_value;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003623 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003624 di->di_pos = i+1;
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003625 di->len--;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003626 if (result->ob_refcnt == 1) {
3627 Py_INCREF(result);
3628 Py_DECREF(PyTuple_GET_ITEM(result, 0));
3629 Py_DECREF(PyTuple_GET_ITEM(result, 1));
Serhiy Storchaka49f5cdd2016-10-09 23:08:05 +03003630 }
3631 else {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003632 result = PyTuple_New(2);
3633 if (result == NULL)
3634 return NULL;
3635 }
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003636 Py_INCREF(key);
3637 Py_INCREF(value);
Eric Snow96c6af92015-05-29 22:21:39 -06003638 PyTuple_SET_ITEM(result, 0, key); /* steals reference */
3639 PyTuple_SET_ITEM(result, 1, value); /* steals reference */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003640 return result;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003641
3642fail:
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003643 di->di_dict = NULL;
Serhiy Storchakafbb1c5e2016-03-30 20:40:02 +03003644 Py_DECREF(d);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003645 return NULL;
Raymond Hettinger019a1482004-03-18 02:41:19 +00003646}
3647
3648PyTypeObject PyDictIterItem_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003649 PyVarObject_HEAD_INIT(&PyType_Type, 0)
3650 "dict_itemiterator", /* tp_name */
3651 sizeof(dictiterobject), /* tp_basicsize */
3652 0, /* tp_itemsize */
3653 /* methods */
3654 (destructor)dictiter_dealloc, /* tp_dealloc */
3655 0, /* tp_print */
3656 0, /* tp_getattr */
3657 0, /* tp_setattr */
3658 0, /* tp_reserved */
3659 0, /* tp_repr */
3660 0, /* tp_as_number */
3661 0, /* tp_as_sequence */
3662 0, /* tp_as_mapping */
3663 0, /* tp_hash */
3664 0, /* tp_call */
3665 0, /* tp_str */
3666 PyObject_GenericGetAttr, /* tp_getattro */
3667 0, /* tp_setattro */
3668 0, /* tp_as_buffer */
3669 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
3670 0, /* tp_doc */
3671 (traverseproc)dictiter_traverse, /* tp_traverse */
3672 0, /* tp_clear */
3673 0, /* tp_richcompare */
3674 0, /* tp_weaklistoffset */
3675 PyObject_SelfIter, /* tp_iter */
3676 (iternextfunc)dictiter_iternextitem, /* tp_iternext */
3677 dictiter_methods, /* tp_methods */
3678 0,
Guido van Rossum59d1d2b2001-04-20 19:13:02 +00003679};
Guido van Rossumb90c8482007-02-10 01:11:45 +00003680
3681
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003682static PyObject *
3683dictiter_reduce(dictiterobject *di)
3684{
3685 PyObject *list;
3686 dictiterobject tmp;
3687
3688 list = PyList_New(0);
3689 if (!list)
3690 return NULL;
3691
3692 /* copy the itertor state */
3693 tmp = *di;
3694 Py_XINCREF(tmp.di_dict);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04003695
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003696 /* iterate the temporary into a list */
3697 for(;;) {
3698 PyObject *element = 0;
3699 if (Py_TYPE(di) == &PyDictIterItem_Type)
3700 element = dictiter_iternextitem(&tmp);
3701 else if (Py_TYPE(di) == &PyDictIterKey_Type)
3702 element = dictiter_iternextkey(&tmp);
3703 else if (Py_TYPE(di) == &PyDictIterValue_Type)
3704 element = dictiter_iternextvalue(&tmp);
3705 else
3706 assert(0);
3707 if (element) {
3708 if (PyList_Append(list, element)) {
3709 Py_DECREF(element);
3710 Py_DECREF(list);
3711 Py_XDECREF(tmp.di_dict);
3712 return NULL;
3713 }
3714 Py_DECREF(element);
3715 } else
3716 break;
3717 }
3718 Py_XDECREF(tmp.di_dict);
3719 /* check for error */
3720 if (tmp.di_dict != NULL) {
3721 /* we have an error */
3722 Py_DECREF(list);
3723 return NULL;
3724 }
Antoine Pitroua7013882012-04-05 00:04:20 +02003725 return Py_BuildValue("N(N)", _PyObject_GetBuiltin("iter"), list);
Kristján Valur Jónsson31668b82012-04-03 10:49:41 +00003726}
3727
Guido van Rossum3ac67412007-02-10 18:55:06 +00003728/***********************************************/
Guido van Rossumb90c8482007-02-10 01:11:45 +00003729/* View objects for keys(), items(), values(). */
Guido van Rossum3ac67412007-02-10 18:55:06 +00003730/***********************************************/
3731
Guido van Rossumb90c8482007-02-10 01:11:45 +00003732/* The instance lay-out is the same for all three; but the type differs. */
3733
Guido van Rossumb90c8482007-02-10 01:11:45 +00003734static void
Eric Snow96c6af92015-05-29 22:21:39 -06003735dictview_dealloc(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003736{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003737 Py_XDECREF(dv->dv_dict);
3738 PyObject_GC_Del(dv);
Antoine Pitrou7ddda782009-01-01 15:35:33 +00003739}
3740
3741static int
Eric Snow96c6af92015-05-29 22:21:39 -06003742dictview_traverse(_PyDictViewObject *dv, visitproc visit, void *arg)
Antoine Pitrou7ddda782009-01-01 15:35:33 +00003743{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003744 Py_VISIT(dv->dv_dict);
3745 return 0;
Guido van Rossumb90c8482007-02-10 01:11:45 +00003746}
3747
Guido van Rossum83825ac2007-02-10 04:54:19 +00003748static Py_ssize_t
Eric Snow96c6af92015-05-29 22:21:39 -06003749dictview_len(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003750{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003751 Py_ssize_t len = 0;
3752 if (dv->dv_dict != NULL)
3753 len = dv->dv_dict->ma_used;
3754 return len;
Guido van Rossumb90c8482007-02-10 01:11:45 +00003755}
3756
Eric Snow96c6af92015-05-29 22:21:39 -06003757PyObject *
3758_PyDictView_New(PyObject *dict, PyTypeObject *type)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003759{
Eric Snow96c6af92015-05-29 22:21:39 -06003760 _PyDictViewObject *dv;
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003761 if (dict == NULL) {
3762 PyErr_BadInternalCall();
3763 return NULL;
3764 }
3765 if (!PyDict_Check(dict)) {
3766 /* XXX Get rid of this restriction later */
3767 PyErr_Format(PyExc_TypeError,
3768 "%s() requires a dict argument, not '%s'",
3769 type->tp_name, dict->ob_type->tp_name);
3770 return NULL;
3771 }
Eric Snow96c6af92015-05-29 22:21:39 -06003772 dv = PyObject_GC_New(_PyDictViewObject, type);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003773 if (dv == NULL)
3774 return NULL;
3775 Py_INCREF(dict);
3776 dv->dv_dict = (PyDictObject *)dict;
3777 _PyObject_GC_TRACK(dv);
3778 return (PyObject *)dv;
Guido van Rossumb90c8482007-02-10 01:11:45 +00003779}
3780
Neal Norwitze36f2ba2007-02-26 23:12:28 +00003781/* TODO(guido): The views objects are not complete:
3782
3783 * support more set operations
3784 * support arbitrary mappings?
3785 - either these should be static or exported in dictobject.h
3786 - if public then they should probably be in builtins
3787*/
3788
Guido van Rossumaac530c2007-08-24 22:33:45 +00003789/* Return 1 if self is a subset of other, iterating over self;
3790 0 if not; -1 if an error occurred. */
Guido van Rossumd9214d12007-02-12 02:23:40 +00003791static int
3792all_contained_in(PyObject *self, PyObject *other)
3793{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003794 PyObject *iter = PyObject_GetIter(self);
3795 int ok = 1;
Guido van Rossumd9214d12007-02-12 02:23:40 +00003796
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003797 if (iter == NULL)
3798 return -1;
3799 for (;;) {
3800 PyObject *next = PyIter_Next(iter);
3801 if (next == NULL) {
3802 if (PyErr_Occurred())
3803 ok = -1;
3804 break;
3805 }
3806 ok = PySequence_Contains(other, next);
3807 Py_DECREF(next);
3808 if (ok <= 0)
3809 break;
3810 }
3811 Py_DECREF(iter);
3812 return ok;
Guido van Rossumd9214d12007-02-12 02:23:40 +00003813}
3814
3815static PyObject *
3816dictview_richcompare(PyObject *self, PyObject *other, int op)
3817{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003818 Py_ssize_t len_self, len_other;
3819 int ok;
3820 PyObject *result;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003821
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003822 assert(self != NULL);
3823 assert(PyDictViewSet_Check(self));
3824 assert(other != NULL);
Guido van Rossumd9214d12007-02-12 02:23:40 +00003825
Brian Curtindfc80e32011-08-10 20:28:54 -05003826 if (!PyAnySet_Check(other) && !PyDictViewSet_Check(other))
3827 Py_RETURN_NOTIMPLEMENTED;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003828
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003829 len_self = PyObject_Size(self);
3830 if (len_self < 0)
3831 return NULL;
3832 len_other = PyObject_Size(other);
3833 if (len_other < 0)
3834 return NULL;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003835
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003836 ok = 0;
3837 switch(op) {
Guido van Rossumaac530c2007-08-24 22:33:45 +00003838
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003839 case Py_NE:
3840 case Py_EQ:
3841 if (len_self == len_other)
3842 ok = all_contained_in(self, other);
3843 if (op == Py_NE && ok >= 0)
3844 ok = !ok;
3845 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003846
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003847 case Py_LT:
3848 if (len_self < len_other)
3849 ok = all_contained_in(self, other);
3850 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003851
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003852 case Py_LE:
3853 if (len_self <= len_other)
3854 ok = all_contained_in(self, other);
3855 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003856
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003857 case Py_GT:
3858 if (len_self > len_other)
3859 ok = all_contained_in(other, self);
3860 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003861
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003862 case Py_GE:
3863 if (len_self >= len_other)
3864 ok = all_contained_in(other, self);
3865 break;
Guido van Rossumaac530c2007-08-24 22:33:45 +00003866
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003867 }
3868 if (ok < 0)
3869 return NULL;
3870 result = ok ? Py_True : Py_False;
3871 Py_INCREF(result);
3872 return result;
Guido van Rossumd9214d12007-02-12 02:23:40 +00003873}
3874
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003875static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06003876dictview_repr(_PyDictViewObject *dv)
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003877{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003878 PyObject *seq;
3879 PyObject *result;
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003880
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003881 seq = PySequence_List((PyObject *)dv);
3882 if (seq == NULL)
3883 return NULL;
3884
3885 result = PyUnicode_FromFormat("%s(%R)", Py_TYPE(dv)->tp_name, seq);
3886 Py_DECREF(seq);
3887 return result;
Raymond Hettingerb0d56af2009-03-03 10:52:49 +00003888}
3889
Guido van Rossum3ac67412007-02-10 18:55:06 +00003890/*** dict_keys ***/
Guido van Rossumb90c8482007-02-10 01:11:45 +00003891
3892static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06003893dictkeys_iter(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00003894{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003895 if (dv->dv_dict == NULL) {
3896 Py_RETURN_NONE;
3897 }
3898 return dictiter_new(dv->dv_dict, &PyDictIterKey_Type);
Guido van Rossum3ac67412007-02-10 18:55:06 +00003899}
3900
3901static int
Eric Snow96c6af92015-05-29 22:21:39 -06003902dictkeys_contains(_PyDictViewObject *dv, PyObject *obj)
Guido van Rossum3ac67412007-02-10 18:55:06 +00003903{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003904 if (dv->dv_dict == NULL)
3905 return 0;
3906 return PyDict_Contains((PyObject *)dv->dv_dict, obj);
Guido van Rossumb90c8482007-02-10 01:11:45 +00003907}
3908
Guido van Rossum83825ac2007-02-10 04:54:19 +00003909static PySequenceMethods dictkeys_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003910 (lenfunc)dictview_len, /* sq_length */
3911 0, /* sq_concat */
3912 0, /* sq_repeat */
3913 0, /* sq_item */
3914 0, /* sq_slice */
3915 0, /* sq_ass_item */
3916 0, /* sq_ass_slice */
3917 (objobjproc)dictkeys_contains, /* sq_contains */
Guido van Rossum83825ac2007-02-10 04:54:19 +00003918};
3919
Guido van Rossum523259b2007-08-24 23:41:22 +00003920static PyObject*
3921dictviews_sub(PyObject* self, PyObject *other)
3922{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003923 PyObject *result = PySet_New(self);
3924 PyObject *tmp;
Martin v. Löwisbd928fe2011-10-14 10:20:37 +02003925 _Py_IDENTIFIER(difference_update);
Martin v. Löwisafe55bb2011-10-09 10:38:36 +02003926
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003927 if (result == NULL)
3928 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003929
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003930 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_difference_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003931 if (tmp == NULL) {
3932 Py_DECREF(result);
3933 return NULL;
3934 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003935
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003936 Py_DECREF(tmp);
3937 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003938}
3939
Benjamin Peterson025e9eb2015-05-05 20:16:41 -04003940PyObject*
3941_PyDictView_Intersect(PyObject* self, PyObject *other)
Guido van Rossum523259b2007-08-24 23:41:22 +00003942{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003943 PyObject *result = PySet_New(self);
3944 PyObject *tmp;
Martin v. Löwisbd928fe2011-10-14 10:20:37 +02003945 _Py_IDENTIFIER(intersection_update);
Martin v. Löwisafe55bb2011-10-09 10:38:36 +02003946
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003947 if (result == NULL)
3948 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003949
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003950 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_intersection_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003951 if (tmp == NULL) {
3952 Py_DECREF(result);
3953 return NULL;
3954 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003955
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003956 Py_DECREF(tmp);
3957 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003958}
3959
3960static PyObject*
3961dictviews_or(PyObject* self, PyObject *other)
3962{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003963 PyObject *result = PySet_New(self);
3964 PyObject *tmp;
Martin v. Löwis1c67dd92011-10-14 15:16:45 +02003965 _Py_IDENTIFIER(update);
Victor Stinnerd1a9cc22011-10-13 22:51:17 +02003966
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003967 if (result == NULL)
3968 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003969
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003970 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003971 if (tmp == NULL) {
3972 Py_DECREF(result);
3973 return NULL;
3974 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003975
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003976 Py_DECREF(tmp);
3977 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003978}
3979
3980static PyObject*
3981dictviews_xor(PyObject* self, PyObject *other)
3982{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003983 PyObject *result = PySet_New(self);
3984 PyObject *tmp;
Martin v. Löwisbd928fe2011-10-14 10:20:37 +02003985 _Py_IDENTIFIER(symmetric_difference_update);
Martin v. Löwisafe55bb2011-10-09 10:38:36 +02003986
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003987 if (result == NULL)
3988 return NULL;
Guido van Rossum523259b2007-08-24 23:41:22 +00003989
Benjamin Petersonf11b25b2016-03-03 22:05:36 -08003990 tmp = _PyObject_CallMethodIdObjArgs(result, &PyId_symmetric_difference_update, other, NULL);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003991 if (tmp == NULL) {
3992 Py_DECREF(result);
3993 return NULL;
3994 }
Guido van Rossum523259b2007-08-24 23:41:22 +00003995
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00003996 Py_DECREF(tmp);
3997 return result;
Guido van Rossum523259b2007-08-24 23:41:22 +00003998}
3999
4000static PyNumberMethods dictviews_as_number = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004001 0, /*nb_add*/
4002 (binaryfunc)dictviews_sub, /*nb_subtract*/
4003 0, /*nb_multiply*/
4004 0, /*nb_remainder*/
4005 0, /*nb_divmod*/
4006 0, /*nb_power*/
4007 0, /*nb_negative*/
4008 0, /*nb_positive*/
4009 0, /*nb_absolute*/
4010 0, /*nb_bool*/
4011 0, /*nb_invert*/
4012 0, /*nb_lshift*/
4013 0, /*nb_rshift*/
Benjamin Peterson025e9eb2015-05-05 20:16:41 -04004014 (binaryfunc)_PyDictView_Intersect, /*nb_and*/
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004015 (binaryfunc)dictviews_xor, /*nb_xor*/
4016 (binaryfunc)dictviews_or, /*nb_or*/
Guido van Rossum523259b2007-08-24 23:41:22 +00004017};
4018
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004019static PyObject*
4020dictviews_isdisjoint(PyObject *self, PyObject *other)
4021{
4022 PyObject *it;
4023 PyObject *item = NULL;
4024
4025 if (self == other) {
Eric Snow96c6af92015-05-29 22:21:39 -06004026 if (dictview_len((_PyDictViewObject *)self) == 0)
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004027 Py_RETURN_TRUE;
4028 else
4029 Py_RETURN_FALSE;
4030 }
4031
4032 /* Iterate over the shorter object (only if other is a set,
4033 * because PySequence_Contains may be expensive otherwise): */
4034 if (PyAnySet_Check(other) || PyDictViewSet_Check(other)) {
Eric Snow96c6af92015-05-29 22:21:39 -06004035 Py_ssize_t len_self = dictview_len((_PyDictViewObject *)self);
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004036 Py_ssize_t len_other = PyObject_Size(other);
4037 if (len_other == -1)
4038 return NULL;
4039
4040 if ((len_other > len_self)) {
4041 PyObject *tmp = other;
4042 other = self;
4043 self = tmp;
4044 }
4045 }
4046
4047 it = PyObject_GetIter(other);
4048 if (it == NULL)
4049 return NULL;
4050
4051 while ((item = PyIter_Next(it)) != NULL) {
4052 int contains = PySequence_Contains(self, item);
4053 Py_DECREF(item);
4054 if (contains == -1) {
4055 Py_DECREF(it);
4056 return NULL;
4057 }
4058
4059 if (contains) {
4060 Py_DECREF(it);
4061 Py_RETURN_FALSE;
4062 }
4063 }
4064 Py_DECREF(it);
4065 if (PyErr_Occurred())
4066 return NULL; /* PyIter_Next raised an exception. */
4067 Py_RETURN_TRUE;
4068}
4069
4070PyDoc_STRVAR(isdisjoint_doc,
4071"Return True if the view and the given iterable have a null intersection.");
4072
Guido van Rossumb90c8482007-02-10 01:11:45 +00004073static PyMethodDef dictkeys_methods[] = {
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004074 {"isdisjoint", (PyCFunction)dictviews_isdisjoint, METH_O,
4075 isdisjoint_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004076 {NULL, NULL} /* sentinel */
Guido van Rossumb90c8482007-02-10 01:11:45 +00004077};
4078
4079PyTypeObject PyDictKeys_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004080 PyVarObject_HEAD_INIT(&PyType_Type, 0)
4081 "dict_keys", /* tp_name */
Eric Snow96c6af92015-05-29 22:21:39 -06004082 sizeof(_PyDictViewObject), /* tp_basicsize */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004083 0, /* tp_itemsize */
4084 /* methods */
4085 (destructor)dictview_dealloc, /* tp_dealloc */
4086 0, /* tp_print */
4087 0, /* tp_getattr */
4088 0, /* tp_setattr */
4089 0, /* tp_reserved */
4090 (reprfunc)dictview_repr, /* tp_repr */
4091 &dictviews_as_number, /* tp_as_number */
4092 &dictkeys_as_sequence, /* tp_as_sequence */
4093 0, /* tp_as_mapping */
4094 0, /* tp_hash */
4095 0, /* tp_call */
4096 0, /* tp_str */
4097 PyObject_GenericGetAttr, /* tp_getattro */
4098 0, /* tp_setattro */
4099 0, /* tp_as_buffer */
4100 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4101 0, /* tp_doc */
4102 (traverseproc)dictview_traverse, /* tp_traverse */
4103 0, /* tp_clear */
4104 dictview_richcompare, /* tp_richcompare */
4105 0, /* tp_weaklistoffset */
4106 (getiterfunc)dictkeys_iter, /* tp_iter */
4107 0, /* tp_iternext */
4108 dictkeys_methods, /* tp_methods */
4109 0,
Guido van Rossumb90c8482007-02-10 01:11:45 +00004110};
4111
4112static PyObject *
4113dictkeys_new(PyObject *dict)
4114{
Eric Snow96c6af92015-05-29 22:21:39 -06004115 return _PyDictView_New(dict, &PyDictKeys_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004116}
4117
Guido van Rossum3ac67412007-02-10 18:55:06 +00004118/*** dict_items ***/
Guido van Rossumb90c8482007-02-10 01:11:45 +00004119
4120static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06004121dictitems_iter(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00004122{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004123 if (dv->dv_dict == NULL) {
4124 Py_RETURN_NONE;
4125 }
4126 return dictiter_new(dv->dv_dict, &PyDictIterItem_Type);
Guido van Rossum3ac67412007-02-10 18:55:06 +00004127}
4128
4129static int
Eric Snow96c6af92015-05-29 22:21:39 -06004130dictitems_contains(_PyDictViewObject *dv, PyObject *obj)
Guido van Rossum3ac67412007-02-10 18:55:06 +00004131{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004132 PyObject *key, *value, *found;
4133 if (dv->dv_dict == NULL)
4134 return 0;
4135 if (!PyTuple_Check(obj) || PyTuple_GET_SIZE(obj) != 2)
4136 return 0;
4137 key = PyTuple_GET_ITEM(obj, 0);
4138 value = PyTuple_GET_ITEM(obj, 1);
Raymond Hettinger6692f012016-09-18 21:46:08 -07004139 found = PyDict_GetItemWithError((PyObject *)dv->dv_dict, key);
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004140 if (found == NULL) {
4141 if (PyErr_Occurred())
4142 return -1;
4143 return 0;
4144 }
4145 return PyObject_RichCompareBool(value, found, Py_EQ);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004146}
4147
Guido van Rossum83825ac2007-02-10 04:54:19 +00004148static PySequenceMethods dictitems_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004149 (lenfunc)dictview_len, /* sq_length */
4150 0, /* sq_concat */
4151 0, /* sq_repeat */
4152 0, /* sq_item */
4153 0, /* sq_slice */
4154 0, /* sq_ass_item */
4155 0, /* sq_ass_slice */
4156 (objobjproc)dictitems_contains, /* sq_contains */
Guido van Rossum83825ac2007-02-10 04:54:19 +00004157};
4158
Guido van Rossumb90c8482007-02-10 01:11:45 +00004159static PyMethodDef dictitems_methods[] = {
Daniel Stutzbach045b3ba2010-09-02 15:06:06 +00004160 {"isdisjoint", (PyCFunction)dictviews_isdisjoint, METH_O,
4161 isdisjoint_doc},
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004162 {NULL, NULL} /* sentinel */
Guido van Rossumb90c8482007-02-10 01:11:45 +00004163};
4164
4165PyTypeObject PyDictItems_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004166 PyVarObject_HEAD_INIT(&PyType_Type, 0)
4167 "dict_items", /* tp_name */
Eric Snow96c6af92015-05-29 22:21:39 -06004168 sizeof(_PyDictViewObject), /* tp_basicsize */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004169 0, /* tp_itemsize */
4170 /* methods */
4171 (destructor)dictview_dealloc, /* tp_dealloc */
4172 0, /* tp_print */
4173 0, /* tp_getattr */
4174 0, /* tp_setattr */
4175 0, /* tp_reserved */
4176 (reprfunc)dictview_repr, /* tp_repr */
4177 &dictviews_as_number, /* tp_as_number */
4178 &dictitems_as_sequence, /* tp_as_sequence */
4179 0, /* tp_as_mapping */
4180 0, /* tp_hash */
4181 0, /* tp_call */
4182 0, /* tp_str */
4183 PyObject_GenericGetAttr, /* tp_getattro */
4184 0, /* tp_setattro */
4185 0, /* tp_as_buffer */
4186 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4187 0, /* tp_doc */
4188 (traverseproc)dictview_traverse, /* tp_traverse */
4189 0, /* tp_clear */
4190 dictview_richcompare, /* tp_richcompare */
4191 0, /* tp_weaklistoffset */
4192 (getiterfunc)dictitems_iter, /* tp_iter */
4193 0, /* tp_iternext */
4194 dictitems_methods, /* tp_methods */
4195 0,
Guido van Rossumb90c8482007-02-10 01:11:45 +00004196};
4197
4198static PyObject *
4199dictitems_new(PyObject *dict)
4200{
Eric Snow96c6af92015-05-29 22:21:39 -06004201 return _PyDictView_New(dict, &PyDictItems_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004202}
4203
Guido van Rossum3ac67412007-02-10 18:55:06 +00004204/*** dict_values ***/
Guido van Rossumb90c8482007-02-10 01:11:45 +00004205
4206static PyObject *
Eric Snow96c6af92015-05-29 22:21:39 -06004207dictvalues_iter(_PyDictViewObject *dv)
Guido van Rossumb90c8482007-02-10 01:11:45 +00004208{
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004209 if (dv->dv_dict == NULL) {
4210 Py_RETURN_NONE;
4211 }
4212 return dictiter_new(dv->dv_dict, &PyDictIterValue_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004213}
4214
Guido van Rossum83825ac2007-02-10 04:54:19 +00004215static PySequenceMethods dictvalues_as_sequence = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004216 (lenfunc)dictview_len, /* sq_length */
4217 0, /* sq_concat */
4218 0, /* sq_repeat */
4219 0, /* sq_item */
4220 0, /* sq_slice */
4221 0, /* sq_ass_item */
4222 0, /* sq_ass_slice */
4223 (objobjproc)0, /* sq_contains */
Guido van Rossum83825ac2007-02-10 04:54:19 +00004224};
4225
Guido van Rossumb90c8482007-02-10 01:11:45 +00004226static PyMethodDef dictvalues_methods[] = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004227 {NULL, NULL} /* sentinel */
Guido van Rossumb90c8482007-02-10 01:11:45 +00004228};
4229
4230PyTypeObject PyDictValues_Type = {
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004231 PyVarObject_HEAD_INIT(&PyType_Type, 0)
4232 "dict_values", /* tp_name */
Eric Snow96c6af92015-05-29 22:21:39 -06004233 sizeof(_PyDictViewObject), /* tp_basicsize */
Antoine Pitrouf95a1b32010-05-09 15:52:27 +00004234 0, /* tp_itemsize */
4235 /* methods */
4236 (destructor)dictview_dealloc, /* tp_dealloc */
4237 0, /* tp_print */
4238 0, /* tp_getattr */
4239 0, /* tp_setattr */
4240 0, /* tp_reserved */
4241 (reprfunc)dictview_repr, /* tp_repr */
4242 0, /* tp_as_number */
4243 &dictvalues_as_sequence, /* tp_as_sequence */
4244 0, /* tp_as_mapping */
4245 0, /* tp_hash */
4246 0, /* tp_call */
4247 0, /* tp_str */
4248 PyObject_GenericGetAttr, /* tp_getattro */
4249 0, /* tp_setattro */
4250 0, /* tp_as_buffer */
4251 Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
4252 0, /* tp_doc */
4253 (traverseproc)dictview_traverse, /* tp_traverse */
4254 0, /* tp_clear */
4255 0, /* tp_richcompare */
4256 0, /* tp_weaklistoffset */
4257 (getiterfunc)dictvalues_iter, /* tp_iter */
4258 0, /* tp_iternext */
4259 dictvalues_methods, /* tp_methods */
4260 0,
Guido van Rossumb90c8482007-02-10 01:11:45 +00004261};
4262
4263static PyObject *
4264dictvalues_new(PyObject *dict)
4265{
Eric Snow96c6af92015-05-29 22:21:39 -06004266 return _PyDictView_New(dict, &PyDictValues_Type);
Guido van Rossumb90c8482007-02-10 01:11:45 +00004267}
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004268
4269/* Returns NULL if cannot allocate a new PyDictKeysObject,
4270 but does not set an error */
4271PyDictKeysObject *
4272_PyDict_NewKeysForClass(void)
4273{
Victor Stinner742da042016-09-07 17:40:12 -07004274 PyDictKeysObject *keys = new_keys_object(PyDict_MINSIZE);
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004275 if (keys == NULL)
4276 PyErr_Clear();
4277 else
4278 keys->dk_lookup = lookdict_split;
4279 return keys;
4280}
4281
/* Access the ht_cached_keys slot of a heap type.  The argument is
   parenthesized so the cast applies to the whole expression passed in,
   not just its first operand. */
#define CACHED_KEYS(tp) (((PyHeapTypeObject*)(tp))->ht_cached_keys)
4283
4284PyObject *
4285PyObject_GenericGetDict(PyObject *obj, void *context)
4286{
4287 PyObject *dict, **dictptr = _PyObject_GetDictPtr(obj);
4288 if (dictptr == NULL) {
4289 PyErr_SetString(PyExc_AttributeError,
4290 "This object has no __dict__");
4291 return NULL;
4292 }
4293 dict = *dictptr;
4294 if (dict == NULL) {
4295 PyTypeObject *tp = Py_TYPE(obj);
4296 if ((tp->tp_flags & Py_TPFLAGS_HEAPTYPE) && CACHED_KEYS(tp)) {
4297 DK_INCREF(CACHED_KEYS(tp));
4298 *dictptr = dict = new_dict_with_shared_keys(CACHED_KEYS(tp));
4299 }
4300 else {
4301 *dictptr = dict = PyDict_New();
4302 }
4303 }
4304 Py_XINCREF(dict);
4305 return dict;
4306}
4307
4308int
4309_PyObjectDict_SetItem(PyTypeObject *tp, PyObject **dictptr,
Victor Stinner742da042016-09-07 17:40:12 -07004310 PyObject *key, PyObject *value)
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004311{
4312 PyObject *dict;
4313 int res;
4314 PyDictKeysObject *cached;
4315
4316 assert(dictptr != NULL);
4317 if ((tp->tp_flags & Py_TPFLAGS_HEAPTYPE) && (cached = CACHED_KEYS(tp))) {
4318 assert(dictptr != NULL);
4319 dict = *dictptr;
4320 if (dict == NULL) {
4321 DK_INCREF(cached);
4322 dict = new_dict_with_shared_keys(cached);
4323 if (dict == NULL)
4324 return -1;
4325 *dictptr = dict;
4326 }
4327 if (value == NULL) {
4328 res = PyDict_DelItem(dict, key);
4329 if (cached != ((PyDictObject *)dict)->ma_keys) {
4330 CACHED_KEYS(tp) = NULL;
4331 DK_DECREF(cached);
4332 }
Victor Stinner3d3f2642016-12-15 17:21:23 +01004333 }
4334 else {
4335 int was_shared = cached == ((PyDictObject *)dict)->ma_keys;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004336 res = PyDict_SetItem(dict, key, value);
Victor Stinner3d3f2642016-12-15 17:21:23 +01004337 if (was_shared && cached != ((PyDictObject *)dict)->ma_keys) {
4338 /* PyDict_SetItem() may call dictresize and convert split table
4339 * into combined table. In such case, convert it to split
4340 * table again and update type's shared key only when this is
4341 * the only dict sharing key with the type.
4342 *
4343 * This is to allow using shared key in class like this:
4344 *
4345 * class C:
4346 * def __init__(self):
4347 * # one dict resize happens
4348 * self.a, self.b, self.c = 1, 2, 3
4349 * self.d, self.e, self.f = 4, 5, 6
4350 * a = C()
4351 */
Benjamin Peterson15ee8212012-04-24 14:44:18 -04004352 if (cached->dk_refcnt == 1) {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004353 CACHED_KEYS(tp) = make_keys_shared(dict);
Victor Stinner742da042016-09-07 17:40:12 -07004354 }
4355 else {
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004356 CACHED_KEYS(tp) = NULL;
4357 }
4358 DK_DECREF(cached);
Benjamin Peterson15ee8212012-04-24 14:44:18 -04004359 if (CACHED_KEYS(tp) == NULL && PyErr_Occurred())
4360 return -1;
Benjamin Peterson7d95e402012-04-23 11:24:50 -04004361 }
4362 }
4363 } else {
4364 dict = *dictptr;
4365 if (dict == NULL) {
4366 dict = PyDict_New();
4367 if (dict == NULL)
4368 return -1;
4369 *dictptr = dict;
4370 }
4371 if (value == NULL) {
4372 res = PyDict_DelItem(dict, key);
4373 } else {
4374 res = PyDict_SetItem(dict, key, value);
4375 }
4376 }
4377 return res;
4378}
4379
4380void
4381_PyDictKeys_DecRef(PyDictKeysObject *keys)
4382{
4383 DK_DECREF(keys);
4384}