Objects/dictobject.c

   1
   2 /* Dictionary object implementation using a hash table */
   3
   4 /* The distribution includes a separate file, Objects/dictnotes.txt,
   5    describing explorations into dictionary design and optimization.
   6    It covers typical dictionary use patterns, the parameters for
   7    tuning dictionaries, and several ideas for possible optimizations.
   8 */
   9
  10 #include "Python.h"
  11
  12
  13 /* Set a key error with the specified argument, wrapping it in a
  14  * tuple automatically so that tuple keys are not unpacked as the
  15  * exception arguments. */
  16 static void
  17 set_key_error(PyObject *arg)
  18 {
  19         PyObject *tup;
  20         tup = PyTuple_Pack(1, arg);
  21         if (!tup)
  22                 return; /* caller will expect error to be set anyway */
  23         PyErr_SetObject(PyExc_KeyError, tup);
  24         Py_DECREF(tup);
  25 }
  26
/* Conversion statistics are compiled out by default.  Define
   SHOW_CONVERSION_COUNTS (instead of undefining it here) to have
   show_counts() registered with Py_AtExit() so that the number of string
   dicts created and converted is written to stderr on exit. */
#undef SHOW_CONVERSION_COUNTS

/* Number of bits `perturb` is shifted right on every probe step.
   See large comment block below.  This must be >= 1. */
#define PERTURB_SHIFT 5
  32
  33 /*
  34 Major subtleties ahead:  Most hash schemes depend on having a "good" hash
  35 function, in the sense of simulating randomness.  Python doesn't:  its most
  36 important hash functions (for strings and ints) are very regular in common
  37 cases:
  38
  39 >>> map(hash, (0, 1, 2, 3))
  40 [0, 1, 2, 3]
  41 >>> map(hash, ("namea", "nameb", "namec", "named"))
  42 [-1658398457, -1658398460, -1658398459, -1658398462]
  43 >>>
  44
  45 This isn't necessarily bad!  To the contrary, in a table of size 2**i, taking
  46 the low-order i bits as the initial table index is extremely fast, and there
  47 are no collisions at all for dicts indexed by a contiguous range of ints.
  48 The same is approximately true when keys are "consecutive" strings.  So this
  49 gives better-than-random behavior in common cases, and that's very desirable.
  50
  51 OTOH, when collisions occur, the tendency to fill contiguous slices of the
  52 hash table makes a good collision resolution strategy crucial.  Taking only
  53 the last i bits of the hash code is also vulnerable:  for example, consider
  54 [i << 16 for i in range(20000)] as a set of keys.  Since ints are their own
  55 hash codes, and this fits in a dict of size 2**15, the last 15 bits of every
  56 hash code are all 0:  they *all* map to the same table index.
  57
  58 But catering to unusual cases should not slow the usual ones, so we just take
  59 the last i bits anyway.  It's up to collision resolution to do the rest.  If
  60 we *usually* find the key we're looking for on the first try (and, it turns
  61 out, we usually do -- the table load factor is kept under 2/3, so the odds
  62 are solidly in our favor), then it makes best sense to keep the initial index
  63 computation dirt cheap.
  64
  65 The first half of collision resolution is to visit table indices via this
  66 recurrence:
  67
  68     j = ((5*j) + 1) mod 2**i
  69
  70 For any initial j in range(2**i), repeating that 2**i times generates each
  71 int in range(2**i) exactly once (see any text on random-number generation for
  72 proof).  By itself, this doesn't help much:  like linear probing (setting
  73 j += 1, or j -= 1, on each loop trip), it scans the table entries in a fixed
  74 order.  This would be bad, except that's not the only thing we do, and it's
  75 actually *good* in the common cases where hash keys are consecutive.  In an
  76 example that's really too small to make this entirely clear, for a table of
  77 size 2**3 the order of indices is:
  78
  79     0 -> 1 -> 6 -> 7 -> 4 -> 5 -> 2 -> 3 -> 0 [and here it's repeating]
  80
  81 If two things come in at index 5, the first place we look after is index 2,
  82 not 6, so if another comes in at index 6 the collision at 5 didn't hurt it.
  83 Linear probing is deadly in this case because there the fixed probe order
  84 is the *same* as the order consecutive keys are likely to arrive.  But it's
  85 extremely unlikely hash codes will follow a 5*j+1 recurrence by accident,
  86 and certain that consecutive hash codes do not.
  87
  88 The other half of the strategy is to get the other bits of the hash code
   89 into play.  This is done by initializing an unsigned variable "perturb" to the
  90 full hash code, and changing the recurrence to:
  91
  92     j = (5*j) + 1 + perturb;
  93     perturb >>= PERTURB_SHIFT;
  94     use j % 2**i as the next table index;
  95
  96 Now the probe sequence depends (eventually) on every bit in the hash code,
  97 and the pseudo-scrambling property of recurring on 5*j+1 is more valuable,
  98 because it quickly magnifies small differences in the bits that didn't affect
  99 the initial index.  Note that because perturb is unsigned, if the recurrence
 100 is executed often enough perturb eventually becomes and remains 0.  At that
 101 point (very rarely reached) the recurrence is on (just) 5*j+1 again, and
 102 that's certain to find an empty slot eventually (since it generates every int
 103 in range(2**i), and we make sure there's always at least one empty slot).
 104
 105 Selecting a good value for PERTURB_SHIFT is a balancing act.  You want it
 106 small so that the high bits of the hash code continue to affect the probe
 107 sequence across iterations; but you want it large so that in really bad cases
 108 the high-order hash bits have an effect on early iterations.  5 was "the
 109 best" in minimizing total collisions across experiments Tim Peters ran (on
 110 both normal and pathological cases), but 4 and 6 weren't significantly worse.
 111
 112 Historical:  Reimer Behrends contributed the idea of using a polynomial-based
 113 approach, using repeated multiplication by x in GF(2**n) where an irreducible
 114 polynomial for each table size was chosen such that x was a primitive root.
 115 Christian Tismer later extended that to use division by x instead, as an
 116 efficient way to get the high bits of the hash code into play.  This scheme
 117 also gave excellent collision statistics, but was more expensive:  two
 118 if-tests were required inside the loop; computing "the next" index took about
 119 the same number of operations but without as much potential parallelism
 120 (e.g., computing 5*j can go on at the same time as computing 1+perturb in the
 121 above, and then shifting perturb can be done while the table index is being
 122 masked); and the PyDictObject struct required a member to hold the table's
 123 polynomial.  In Tim's experiments the current scheme ran faster, produced
 124 equally good collision statistics, needed less code & used less memory.
 125
 126 Theoretical Python 2.5 headache:  hash codes are only C "long", but
 127 sizeof(Py_ssize_t) > sizeof(long) may be possible.  In that case, and if a
 128 dict is genuinely huge, then only the slots directly reachable via indexing
 129 by a C long can be the first slot in a probe sequence.  The probe sequence
 130 will still eventually reach every slot in the table, but the collision rate
 131 on initial probes may be much higher than this scheme was designed for.
 132 Getting a hash code as fat as Py_ssize_t is the only real cure.  But in
 133 practice, this probably won't make a lick of difference for many years (at
 134 which point everyone will have terabytes of RAM on 64-bit boxes).
 135 */
 136
/* Object used as dummy key to fill deleted entries */
static PyObject *dummy = NULL; /* Initialized by first call to PyDict_New() */

#ifdef Py_REF_DEBUG
/* Expose the file-private dummy key to Py_REF_DEBUG builds.  Returns the
   current value of `dummy` (NULL until PyDict_New() has initialized it);
   no reference count is changed. */
PyObject *
_PyDict_Dummy(void)
{
        return dummy;
}
#endif

/* forward declarations */
/* lookdict_string() is installed as ma_lookup by PyDict_New(), which is
   defined before it in this file. */
static PyDictEntry *
lookdict_string(PyDictObject *mp, PyObject *key, long hash);
 151
 152 #ifdef SHOW_CONVERSION_COUNTS
 153 static long created = 0L;
 154 static long converted = 0L;
 155
 156 static void
 157 show_counts(void)
 158 {
 159         fprintf(stderr, "created %ld string dicts\n", created);
 160         fprintf(stderr, "converted %ld to normal dicts\n", converted);
 161         fprintf(stderr, "%.2f%% conversion rate\n", (100.0*converted)/created);
 162 }
 163 #endif
 164
 165 /* Debug statistic to compare allocations with reuse through the free list */
 166 #undef SHOW_ALLOC_COUNT
 167 #ifdef SHOW_ALLOC_COUNT
 168 static size_t count_alloc = 0;
 169 static size_t count_reuse = 0;
 170
 171 static void
 172 show_alloc(void)
 173 {
 174         fprintf(stderr, "Dict allocations: %" PY_FORMAT_SIZE_T "d\n",
 175                 count_alloc);
 176         fprintf(stderr, "Dict reuse through freelist: %" PY_FORMAT_SIZE_T
 177                 "d\n", count_reuse);
 178         fprintf(stderr, "%.2f%% reuse rate\n\n",
 179                 (100.0*count_reuse/(count_alloc+count_reuse)));
 180 }
 181 #endif
 182
 183 /* Debug statistic to count GC tracking of dicts */
 184 #ifdef SHOW_TRACK_COUNT
 185 static Py_ssize_t count_untracked = 0;
 186 static Py_ssize_t count_tracked = 0;
 187
 188 static void
 189 show_track(void)
 190 {
 191         fprintf(stderr, "Dicts created: %" PY_FORMAT_SIZE_T "d\n",
 192                 count_tracked + count_untracked);
 193         fprintf(stderr, "Dicts tracked by the GC: %" PY_FORMAT_SIZE_T
 194                 "d\n", count_tracked);
 195         fprintf(stderr, "%.2f%% dict tracking rate\n\n",
 196                 (100.0*count_tracked/(count_untracked+count_tracked)));
 197 }
 198 #endif
 199
 200
/* Initialization macros.
   There are two ways to create a dict:  PyDict_New() is the main C API
   function, and the tp_new slot maps to dict_new().  In the latter case we
   can save a little time over what PyDict_New does because it's guaranteed
   that the PyDictObject struct is already zeroed out.
   Everyone except dict_new() should use EMPTY_TO_MINSIZE (unless they have
   an excellent reason not to).
*/

/* Point ma_table at the embedded small table and set ma_mask to match its
   size.  ma_used, ma_fill and the small table's contents are not touched,
   so this alone is only enough when those are already zero. */
#define INIT_NONZERO_DICT_SLOTS(mp) do {                                \
        (mp)->ma_table = (mp)->ma_smalltable;                           \
        (mp)->ma_mask = PyDict_MINSIZE - 1;                             \
    } while(0)

/* Reset mp to an empty, minimum-size dict: zero the small table, zero
   ma_used and ma_fill, then apply INIT_NONZERO_DICT_SLOTS.  mp is expanded
   several times, so pass an expression without side effects. */
#define EMPTY_TO_MINSIZE(mp) do {                                       \
        memset((mp)->ma_smalltable, 0, sizeof((mp)->ma_smalltable));    \
        (mp)->ma_used = (mp)->ma_fill = 0;                              \
        INIT_NONZERO_DICT_SLOTS(mp);                                    \
    } while(0)
 220
/* Dictionary reuse scheme to save calls to malloc, free, and memset */
/* Capacity of the free list; may be overridden by defining
   PyDict_MAXFREELIST before this point. */
#ifndef PyDict_MAXFREELIST
#define PyDict_MAXFREELIST 80
#endif
/* Dict objects parked for reuse.  Used as a stack: PyDict_New() and
   PyDict_Fini() both pop with free_list[--numfree]. */
static PyDictObject *free_list[PyDict_MAXFREELIST];
/* Number of valid entries currently held in free_list. */
static int numfree = 0;
 227
 228 void
 229 PyDict_Fini(void)
 230 {
 231         PyDictObject *op;
 232
 233         while (numfree) {
 234                 op = free_list[--numfree];
 235                 assert(PyDict_CheckExact(op));
 236                 PyObject_GC_Del(op);
 237         }
 238 }
 239
 240 PyObject *
 241 PyDict_New(void)
 242 {
 243         register PyDictObject *mp;
 244         if (dummy == NULL) { /* Auto-initialize dummy */
 245                 dummy = PyString_FromString("<dummy key>");
 246                 if (dummy == NULL)
 247                         return NULL;
 248 #ifdef SHOW_CONVERSION_COUNTS
 249                 Py_AtExit(show_counts);
 250 #endif
 251 #ifdef SHOW_ALLOC_COUNT
 252                 Py_AtExit(show_alloc);
 253 #endif
 254 #ifdef SHOW_TRACK_COUNT
 255                 Py_AtExit(show_track);
 256 #endif
 257         }
 258         if (numfree) {
 259                 mp = free_list[--numfree];
 260                 assert (mp != NULL);
 261                 assert (Py_TYPE(mp) == &PyDict_Type);
 262                 _Py_NewReference((PyObject *)mp);
 263                 if (mp->ma_fill) {
 264                         EMPTY_TO_MINSIZE(mp);
 265                 } else {
 266                         /* At least set ma_table and ma_mask; these are wrong
 267                            if an empty but presized dict is added to freelist */
 268                         INIT_NONZERO_DICT_SLOTS(mp);
 269                 }
 270                 assert (mp->ma_used == 0);
 271                 assert (mp->ma_table == mp->ma_smalltable);
 272                 assert (mp->ma_mask == PyDict_MINSIZE - 1);
 273 #ifdef SHOW_ALLOC_COUNT
 274                 count_reuse++;
 275 #endif
 276         } else {
 277                 mp = PyObject_GC_New(PyDictObject, &PyDict_Type);
 278                 if (mp == NULL)
 279                         return NULL;
 280                 EMPTY_TO_MINSIZE(mp);
 281 #ifdef SHOW_ALLOC_COUNT
 282                 count_alloc++;
 283 #endif
 284         }
 285         mp->ma_lookup = lookdict_string;
 286 #ifdef SHOW_TRACK_COUNT
 287         count_untracked++;
 288 #endif
 289 #ifdef SHOW_CONVERSION_COUNTS
 290         ++created;
 291 #endif
 292         return (PyObject *)mp;
 293 }
 294
/*
The basic lookup function used by all operations.
This is based on Algorithm D from Knuth Vol. 3, Sec. 6.4.
Open addressing is preferred over chaining since the link overhead for
chaining would be substantial (100% with typical malloc overhead).

The initial probe index is computed as hash mod the table size. Subsequent
probe indices are computed as explained earlier.

All arithmetic on hash should ignore overflow.

(The details in this version are due to Tim Peters, building on many past
contributions by Reimer Behrends, Jyrki Alakuijala, Vladimir Marangozov and
Christian Tismer).

lookdict() is general-purpose, and may return NULL if (and only if) a
comparison raises an exception (this was new in Python 2.5).
lookdict_string() below is specialized to string keys, comparison of which can
never raise an exception; that function can never return NULL.  For both, when
the key isn't found a PyDictEntry* is returned for which the me_value field is
NULL; this is the slot in the dict at which the key would have been found, and
the caller can (if it wishes) add the <key, value> pair to the returned
PyDictEntry*.

Parameters:
  mp   - dict to search; its ma_table and ma_mask are read on entry.
  key  - key to look for; matched by identity first, then by equality.
  hash - hash of key as computed by the caller.
*/
static PyDictEntry *
lookdict(PyDictObject *mp, PyObject *key, register long hash)
{
        register size_t i;
        register size_t perturb;
        /* First dummy (deleted) slot met on the probe path, if any; it is
           returned instead of the terminating empty slot when the key is
           absent. */
        register PyDictEntry *freeslot;
        register size_t mask = (size_t)mp->ma_mask;
        /* Table base captured on entry; compared against mp->ma_table after
           each comparison to detect that the table was replaced. */
        PyDictEntry *ep0 = mp->ma_table;
        register PyDictEntry *ep;
        register int cmp;
        PyObject *startkey;

        /* First probe: low bits of the hash. */
        i = (size_t)hash & mask;
        ep = &ep0[i];
        if (ep->me_key == NULL || ep->me_key == key)
                return ep;

        if (ep->me_key == dummy)
                freeslot = ep;
        else {
                if (ep->me_hash == hash) {
                        /* Hold a reference to the stored key across the
                           comparison, which may do arbitrary things to
                           the dict. */
                        startkey = ep->me_key;
                        Py_INCREF(startkey);
                        cmp = PyObject_RichCompareBool(startkey, key, Py_EQ);
                        Py_DECREF(startkey);
                        if (cmp < 0)
                                return NULL;
                        /* Only trust the result if neither the table nor
                           this slot's key changed during the comparison. */
                        if (ep0 == mp->ma_table && ep->me_key == startkey) {
                                if (cmp > 0)
                                        return ep;
                        }
                        else {
                                /* The compare did major nasty stuff to the
                                 * dict:  start over.
                                 * XXX A clever adversary could prevent this
                                 * XXX from terminating.
                                 */
                                return lookdict(mp, key, hash);
                        }
                }
                freeslot = NULL;
        }

        /* In the loop, me_key == dummy is by far (factor of 100s) the
           least likely outcome, so test for that last. */
        for (perturb = hash; ; perturb >>= PERTURB_SHIFT) {
                /* i = 5*i + perturb + 1; only the low bits selected by
                   mask are used as the table index. */
                i = (i << 2) + i + perturb + 1;
                ep = &ep0[i & mask];
                if (ep->me_key == NULL)
                        return freeslot == NULL ? ep : freeslot;
                if (ep->me_key == key)
                        return ep;
                if (ep->me_hash == hash && ep->me_key != dummy) {
                        /* Same protocol as for the first probe above. */
                        startkey = ep->me_key;
                        Py_INCREF(startkey);
                        cmp = PyObject_RichCompareBool(startkey, key, Py_EQ);
                        Py_DECREF(startkey);
                        if (cmp < 0)
                                return NULL;
                        if (ep0 == mp->ma_table && ep->me_key == startkey) {
                                if (cmp > 0)
                                        return ep;
                        }
                        else {
                                /* The compare did major nasty stuff to the
                                 * dict:  start over.
                                 * XXX A clever adversary could prevent this
                                 * XXX from terminating.
                                 */
                                return lookdict(mp, key, hash);
                        }
                }
                else if (ep->me_key == dummy && freeslot == NULL)
                        freeslot = ep;
        }
        assert(0);      /* NOT REACHED */
        return 0;
}
 397
 398 /*
 399  * Hacked up version of lookdict which can assume keys are always strings;
 400  * this assumption allows testing for errors during PyObject_RichCompareBool()
 401  * to be dropped; string-string comparisons never raise exceptions.  This also
 402  * means we don't need to go through PyObject_RichCompareBool(); we can always
 403  * use _PyString_Eq() directly.
 404  *
 405  * This is valuable because dicts with only string keys are very common.
 406  */
 407 static PyDictEntry *
 408 lookdict_string(PyDictObject *mp, PyObject *key, register long hash)
 409 {
 410         register size_t i;
 411         register size_t perturb;
 412         register PyDictEntry *freeslot;
 413         register size_t mask = (size_t)mp->ma_mask;
 414         PyDictEntry *ep0 = mp->ma_table;
 415         register PyDictEntry *ep;
 416
 417         /* Make sure this function doesn't have to handle non-string keys,
 418            including subclasses of str; e.g., one reason to subclass
 419            strings is to override __eq__, and for speed we don't cater to
 420            that here. */
 421         if (!PyString_CheckExact(key)) {
 422 #ifdef SHOW_CONVERSION_COUNTS
 423                 ++converted;
 424 #endif
 425                 mp->ma_lookup = lookdict;
 426                 return lookdict(mp, key, hash);
 427         }
 428         i = hash & mask;
 429         ep = &ep0[i];
 430         if (ep->me_key == NULL || ep->me_key == key)
 431                 return ep;
 432         if (ep->me_key == dummy)
 433                 freeslot = ep;
 434         else {
 435                 if (ep->me_hash == hash && _PyString_Eq(ep->me_key, key))
 436                         return ep;
 437                 freeslot = NULL;
 438         }
 439
 440         /* In the loop, me_key == dummy is by far (factor of 100s) the
 441            least likely outcome, so test for that last. */
 442         for (perturb = hash; ; perturb >>= PERTURB_SHIFT) {
 443                 i = (i << 2) + i + perturb + 1;
 444                 ep = &ep0[i & mask];
 445                 if (ep->me_key == NULL)
 446                         return freeslot == NULL ? ep : freeslot;
 447                 if (ep->me_key == key
 448                     || (ep->me_hash == hash
 449                         && ep->me_key != dummy
 450                         && _PyString_Eq(ep->me_key, key)))
 451                         return ep;
 452                 if (ep->me_key == dummy && freeslot == NULL)
 453                         freeslot = ep;
 454         }
 455         assert(0);      /* NOT REACHED */
 456         return 0;
 457 }
 458
#ifdef SHOW_TRACK_COUNT
/* Statistics bookkeeping: move one dict from the untracked counter to the
   tracked one, or back.  Each expansion already ends in a semicolon; the
   macros are written without one where they are used. */
#define INCREASE_TRACK_COUNT \
        (count_tracked++, count_untracked--);
#define DECREASE_TRACK_COUNT \
        (count_tracked--, count_untracked++);
#else
/* Statistics disabled: both macros expand to nothing. */
#define INCREASE_TRACK_COUNT
#define DECREASE_TRACK_COUNT
#endif

/* Start GC-tracking dict mp if it is not tracked yet and either key or
   value may itself be tracked by the GC.  A dict that is already tracked
   is left alone.  mp is expanded more than once, so pass an expression
   without side effects. */
#define MAINTAIN_TRACKING(mp, key, value) \
        do { \
                if (!_PyObject_GC_IS_TRACKED(mp)) { \
                        if (_PyObject_GC_MAY_BE_TRACKED(key) || \
                                _PyObject_GC_MAY_BE_TRACKED(value)) { \
                                _PyObject_GC_TRACK(mp); \
                                INCREASE_TRACK_COUNT \
                        } \
                } \
        } while(0)
 479
 480 void
 481 _PyDict_MaybeUntrack(PyObject *op)
 482 {
 483         PyDictObject *mp;
 484         PyObject *value;
 485         Py_ssize_t mask, i;
 486         PyDictEntry *ep;
 487
 488         if (!PyDict_CheckExact(op) || !_PyObject_GC_IS_TRACKED(op))
 489                 return;
 490
 491         mp = (PyDictObject *) op;
 492         ep = mp->ma_table;
 493         mask = mp->ma_mask;
 494         for (i = 0; i <= mask; i++) {
 495                 if ((value = ep[i].me_value) == NULL)
 496                         continue;
 497                 if (_PyObject_GC_MAY_BE_TRACKED(value) ||
 498                         _PyObject_GC_MAY_BE_TRACKED(ep[i].me_key))
 499                         return;
 500         }
 501         DECREASE_TRACK_COUNT
 502         _PyObject_GC_UNTRACK(op);
 503 }
 504
 505
 506 /*
 507 Internal routine to insert a new item into the table.
 508 Used both by the internal resize routine and by the public insert routine.
 509 Eats a reference to key and one to value.
 510 Returns -1 if an error occurred, or 0 on success.
 511 */
 512 static int
 513 insertdict(register PyDictObject *mp, PyObject *key, long hash, PyObject *value)
 514 {
 515         PyObject *old_value;
 516         register PyDictEntry *ep;
 517         typedef PyDictEntry *(*lookupfunc)(PyDictObject *, PyObject *, long);
 518
 519         assert(mp->ma_lookup != NULL);
 520         ep = mp->ma_lookup(mp, key, hash);
 521         if (ep == NULL) {
 522                 Py_DECREF(key);
 523                 Py_DECREF(value);
 524                 return -1;
 525         }
 526         MAINTAIN_TRACKING(mp, key, value);
 527         if (ep->me_value != NULL) {
 528                 old_value = ep->me_value;
 529                 ep->me_value = value;
 530                 Py_DECREF(old_value); /* which **CAN** re-enter */
 531                 Py_DECREF(key);
 532         }
 533         else {
 534                 if (ep->me_key == NULL)
 535                         mp->ma_fill++;
 536                 else {
 537                         assert(ep->me_key == dummy);
 538                         Py_DECREF(dummy);
 539                 }
 540                 ep->me_key = key;
 541                 ep->me_hash = (Py_ssize_t)hash;
 542                 ep->me_value = value;
 543                 mp->ma_used++;
 544         }
 545         return 0;
 546 }
 547
 548 /*
 549 Internal routine used by dictresize() to insert an item which is
 550 known to be absent from the dict.  This routine also assumes that
 551 the dict contains no deleted entries.  Besides the performance benefit,
 552 using insertdict() in dictresize() is dangerous (SF bug #1456209).
 553 Note that no refcounts are changed by this routine; if needed, the caller
 554 is responsible for incref'ing `key` and `value`.
 555 */
 556 static void
 557 insertdict_clean(register PyDictObject *mp, PyObject *key, long hash,
 558                  PyObject *value)
 559 {
 560         register size_t i;
 561         register size_t perturb;
 562         register size_t mask = (size_t)mp->ma_mask;
 563         PyDictEntry *ep0 = mp->ma_table;
 564         register PyDictEntry *ep;
 565
 566         MAINTAIN_TRACKING(mp, key, value);
 567         i = hash & mask;
 568         ep = &ep0[i];
 569         for (perturb = hash; ep->me_key != NULL; perturb >>= PERTURB_SHIFT) {
 570                 i = (i << 2) + i + perturb + 1;
 571                 ep = &ep0[i & mask];
 572         }
 573         assert(ep->me_value == NULL);
 574         mp->ma_fill++;
 575         ep->me_key = key;
 576         ep->me_hash = (Py_ssize_t)hash;
 577         ep->me_value = value;
 578         mp->ma_used++;
 579 }
 580
 581 /*
 582 Restructure the table by allocating a new table and reinserting all
 583 items again.  When entries have been deleted, the new table may
 584 actually be smaller than the old one.
 585 */
 586 static int
 587 dictresize(PyDictObject *mp, Py_ssize_t minused)
 588 {
 589         Py_ssize_t newsize;
 590         PyDictEntry *oldtable, *newtable, *ep;
 591         Py_ssize_t i;
 592         int is_oldtable_malloced;
 593         PyDictEntry small_copy[PyDict_MINSIZE];
 594
 595         assert(minused >= 0);
 596
 597         /* Find the smallest table size > minused. */
 598         for (newsize = PyDict_MINSIZE;
 599              newsize <= minused && newsize > 0;
 600              newsize <<= 1)
 601                 ;
 602         if (newsize <= 0) {
 603                 PyErr_NoMemory();
 604                 return -1;
 605         }
 606
 607         /* Get space for a new table. */
 608         oldtable = mp->ma_table;
 609         assert(oldtable != NULL);
 610         is_oldtable_malloced = oldtable != mp->ma_smalltable;
 611
 612         if (newsize == PyDict_MINSIZE) {
 613                 /* A large table is shrinking, or we can't get any smaller. */
 614                 newtable = mp->ma_smalltable;
 615                 if (newtable == oldtable) {
 616                         if (mp->ma_fill == mp->ma_used) {
 617                                 /* No dummies, so no point doing anything. */
 618                                 return 0;
 619                         }
 620                         /* We're not going to resize it, but rebuild the
 621                            table anyway to purge old dummy entries.
 622                            Subtle:  This is *necessary* if fill==size,
 623                            as lookdict needs at least one virgin slot to
 624                            terminate failing searches.  If fill < size, it's
 625                            merely desirable, as dummies slow searches. */
 626                         assert(mp->ma_fill > mp->ma_used);
 627                         memcpy(small_copy, oldtable, sizeof(small_copy));
 628                         oldtable = small_copy;
 629                 }
 630         }
 631         else {
 632                 newtable = PyMem_NEW(PyDictEntry, newsize);
 633                 if (newtable == NULL) {
 634                         PyErr_NoMemory();
 635                         return -1;
 636                 }
 637         }
 638
 639         /* Make the dict empty, using the new table. */
 640         assert(newtable != oldtable);
 641         mp->ma_table = newtable;
 642         mp->ma_mask = newsize - 1;
 643         memset(newtable, 0, sizeof(PyDictEntry) * newsize);
 644         mp->ma_used = 0;
 645         i = mp->ma_fill;
 646         mp->ma_fill = 0;
 647
 648         /* Copy the data over; this is refcount-neutral for active entries;
 649            dummy entries aren't copied over, of course */
 650         for (ep = oldtable; i > 0; ep++) {
 651                 if (ep->me_value != NULL) {     /* active entry */
 652                         --i;
 653                         insertdict_clean(mp, ep->me_key, (long)ep->me_hash,
 654                                          ep->me_value);
 655                 }
 656                 else if (ep->me_key != NULL) {  /* dummy entry */
 657                         --i;
 658                         assert(ep->me_key == dummy);
 659                         Py_DECREF(ep->me_key);
 660                 }
 661                 /* else key == value == NULL:  nothing to do */
 662         }
 663
 664         if (is_oldtable_malloced)
 665                 PyMem_DEL(oldtable);
 666         return 0;
 667 }
 668
 669 /* Create a new dictionary pre-sized to hold an estimated number of elements.
 670    Underestimates are okay because the dictionary will resize as necessary.
 671    Overestimates just mean the dictionary will be more sparse than usual.
 672 */
 673
 674 PyObject *
 675 _PyDict_NewPresized(Py_ssize_t minused)
 676 {
 677         PyObject *op = PyDict_New();
 678
 679         if (minused>5 && op != NULL && dictresize((PyDictObject *)op, minused) == -1) {
 680                 Py_DECREF(op);
 681                 return NULL;
 682         }
 683         return op;
 684 }
 685
 686 /* Note that, for historical reasons, PyDict_GetItem() suppresses all errors
 687  * that may occur (originally dicts supported only string keys, and exceptions
 688  * weren't possible).  So, while the original intent was that a NULL return
 689  * meant the key wasn't present, in reality it can mean that, or that an error
 690  * (suppressed) occurred while computing the key's hash, or that some error
 691  * (suppressed) occurred when comparing keys in the dict's internal probe
 692  * sequence.  A nasty example of the latter is when a Python-coded comparison
 693  * function hits a stack-depth error, which can cause this to return NULL
 694  * even if the key is present.
 695  */
 696 PyObject *
 697 PyDict_GetItem(PyObject *op, PyObject *key)
 698 {
 699         long hash;
 700         PyDictObject *mp = (PyDictObject *)op;
 701         PyDictEntry *ep;
 702         PyThreadState *tstate;
 703         if (!PyDict_Check(op))
 704                 return NULL;
 705         if (!PyString_CheckExact(key) ||
 706             (hash = ((PyStringObject *) key)->ob_shash) == -1)
 707         {
 708                 hash = PyObject_Hash(key);
 709                 if (hash == -1) {
 710                         PyErr_Clear();
 711                         return NULL;
 712                 }
 713         }
 714
 715         /* We can arrive here with a NULL tstate during initialization:
 716            try running "python -Wi" for an example related to string
 717            interning.  Let's just hope that no exception occurs then... */
 718         tstate = _PyThreadState_Current;
 719         if (tstate != NULL && tstate->curexc_type != NULL) {
 720                 /* preserve the existing exception */
 721                 PyObject *err_type, *err_value, *err_tb;
 722                 PyErr_Fetch(&err_type, &err_value, &err_tb);
 723                 ep = (mp->ma_lookup)(mp, key, hash);
 724                 /* ignore errors */
 725                 PyErr_Restore(err_type, err_value, err_tb);
 726                 if (ep == NULL)
 727                         return NULL;
 728         }
 729         else {
 730                 ep = (mp->ma_lookup)(mp, key, hash);
 731                 if (ep == NULL) {
 732                         PyErr_Clear();
 733                         return NULL;
 734                 }
 735         }
 736         return ep->me_value;
 737 }
 738
 739 /* CAUTION: PyDict_SetItem() must guarantee that it won't resize the
 740  * dictionary if it's merely replacing the value for an existing key.
 741  * This means that it's safe to loop over a dictionary with PyDict_Next()
 742  * and occasionally replace a value -- but you can't insert new keys or
 743  * remove them.
 744  */
 745 int
 746 PyDict_SetItem(register PyObject *op, PyObject *key, PyObject *value)
 747 {
 748         register PyDictObject *mp;
 749         register long hash;
 750         register Py_ssize_t n_used;
 751
 752         if (!PyDict_Check(op)) {
 753                 PyErr_BadInternalCall();
 754                 return -1;
 755         }
 756         assert(key);
 757         assert(value);
 758         mp = (PyDictObject *)op;
 759         if (PyString_CheckExact(key)) {
 760                 hash = ((PyStringObject *)key)->ob_shash;
 761                 if (hash == -1)
 762                         hash = PyObject_Hash(key);
 763         }
 764         else {
 765                 hash = PyObject_Hash(key);
 766                 if (hash == -1)
 767                         return -1;
 768         }
 769         assert(mp->ma_fill <= mp->ma_mask);  /* at least one empty slot */
 770         n_used = mp->ma_used;
 771         Py_INCREF(value);
 772         Py_INCREF(key);
 773         if (insertdict(mp, key, hash, value) != 0)
 774                 return -1;
 775         /* If we added a key, we can safely resize.  Otherwise just return!
 776          * If fill >= 2/3 size, adjust size.  Normally, this doubles or
 777          * quaduples the size, but it's also possible for the dict to shrink
 778          * (if ma_fill is much larger than ma_used, meaning a lot of dict
 779          * keys have been * deleted).
 780          *
 781          * Quadrupling the size improves average dictionary sparseness
 782          * (reducing collisions) at the cost of some memory and iteration
 783          * speed (which loops over every possible entry).  It also halves
 784          * the number of expensive resize operations in a growing dictionary.
 785          *
 786          * Very large dictionaries (over 50K items) use doubling instead.
 787          * This may help applications with severe memory constraints.
 788          */
 789         if (!(mp->ma_used > n_used && mp->ma_fill*3 >= (mp->ma_mask+1)*2))
 790                 return 0;
 791         return dictresize(mp, (mp->ma_used > 50000 ? 2 : 4) * mp->ma_used);
 792 }
 793
 794 int
 795 PyDict_DelItem(PyObject *op, PyObject *key)
 796 {
 797         register PyDictObject *mp;
 798         register long hash;
 799         register PyDictEntry *ep;
 800         PyObject *old_value, *old_key;
 801
 802         if (!PyDict_Check(op)) {
 803                 PyErr_BadInternalCall();
 804                 return -1;
 805         }
 806         assert(key);
 807         if (!PyString_CheckExact(key) ||
 808             (hash = ((PyStringObject *) key)->ob_shash) == -1) {
 809                 hash = PyObject_Hash(key);
 810                 if (hash == -1)
 811                         return -1;
 812         }
 813         mp = (PyDictObject *)op;
 814         ep = (mp->ma_lookup)(mp, key, hash);
 815         if (ep == NULL)
 816                 return -1;
 817         if (ep->me_value == NULL) {
 818                 set_key_error(key);
 819                 return -1;
 820         }
 821         old_key = ep->me_key;
 822         Py_INCREF(dummy);
 823         ep->me_key = dummy;
 824         old_value = ep->me_value;
 825         ep->me_value = NULL;
 826         mp->ma_used--;
 827         Py_DECREF(old_value);
 828         Py_DECREF(old_key);
 829         return 0;
 830 }
 831
 832 void
 833 PyDict_Clear(PyObject *op)
 834 {
 835         PyDictObject *mp;
 836         PyDictEntry *ep, *table;
 837         int table_is_malloced;
 838         Py_ssize_t fill;
 839         PyDictEntry small_copy[PyDict_MINSIZE];
 840 #ifdef Py_DEBUG
 841         Py_ssize_t i, n;
 842 #endif
 843
 844         if (!PyDict_Check(op))
 845                 return;
 846         mp = (PyDictObject *)op;
 847 #ifdef Py_DEBUG
 848         n = mp->ma_mask + 1;
 849         i = 0;
 850 #endif
 851
 852         table = mp->ma_table;
 853         assert(table != NULL);
 854         table_is_malloced = table != mp->ma_smalltable;
 855
 856         /* This is delicate.  During the process of clearing the dict,
 857          * decrefs can cause the dict to mutate.  To avoid fatal confusion
 858          * (voice of experience), we have to make the dict empty before
 859          * clearing the slots, and never refer to anything via mp->xxx while
 860          * clearing.
 861          */
 862         fill = mp->ma_fill;
 863         if (table_is_malloced)
 864                 EMPTY_TO_MINSIZE(mp);
 865
 866         else if (fill > 0) {
 867                 /* It's a small table with something that needs to be cleared.
 868                  * Afraid the only safe way is to copy the dict entries into
 869                  * another small table first.
 870                  */
 871                 memcpy(small_copy, table, sizeof(small_copy));
 872                 table = small_copy;
 873                 EMPTY_TO_MINSIZE(mp);
 874         }
 875         /* else it's a small table that's already empty */
 876
 877         /* Now we can finally clear things.  If C had refcounts, we could
 878          * assert that the refcount on table is 1 now, i.e. that this function
 879          * has unique access to it, so decref side-effects can't alter it.
 880          */
 881         for (ep = table; fill > 0; ++ep) {
 882 #ifdef Py_DEBUG
 883                 assert(i < n);
 884                 ++i;
 885 #endif
 886                 if (ep->me_key) {
 887                         --fill;
 888                         Py_DECREF(ep->me_key);
 889                         Py_XDECREF(ep->me_value);
 890                 }
 891 #ifdef Py_DEBUG
 892                 else
 893                         assert(ep->me_value == NULL);
 894 #endif
 895         }
 896
 897         if (table_is_malloced)
 898                 PyMem_DEL(table);
 899 }
 900
 901 /*
 902  * Iterate over a dict.  Use like so:
 903  *
 904  *     Py_ssize_t i;
 905  *     PyObject *key, *value;
 906  *     i = 0;   # important!  i should not otherwise be changed by you
 907  *     while (PyDict_Next(yourdict, &i, &key, &value)) {
 908  *              Refer to borrowed references in key and value.
 909  *     }
 910  *
 911  * CAUTION:  In general, it isn't safe to use PyDict_Next in a loop that
 912  * mutates the dict.  One exception:  it is safe if the loop merely changes
 913  * the values associated with the keys (but doesn't insert new keys or
 914  * delete keys), via PyDict_SetItem().
 915  */
 916 int
 917 PyDict_Next(PyObject *op, Py_ssize_t *ppos, PyObject **pkey, PyObject **pvalue)
 918 {
 919         register Py_ssize_t i;
 920         register Py_ssize_t mask;
 921         register PyDictEntry *ep;
 922
 923         if (!PyDict_Check(op))
 924                 return 0;
 925         i = *ppos;
 926         if (i < 0)
 927                 return 0;
 928         ep = ((PyDictObject *)op)->ma_table;
 929         mask = ((PyDictObject *)op)->ma_mask;
 930         while (i <= mask && ep[i].me_value == NULL)
 931                 i++;
 932         *ppos = i+1;
 933         if (i > mask)
 934                 return 0;
 935         if (pkey)
 936                 *pkey = ep[i].me_key;
 937         if (pvalue)
 938                 *pvalue = ep[i].me_value;
 939         return 1;
 940 }
 941
 942 /* Internal version of PyDict_Next that returns a hash value in addition to the key and value.*/
 943 int
 944 _PyDict_Next(PyObject *op, Py_ssize_t *ppos, PyObject **pkey, PyObject **pvalue, long *phash)
 945 {
 946         register Py_ssize_t i;
 947         register Py_ssize_t mask;
 948         register PyDictEntry *ep;
 949
 950         if (!PyDict_Check(op))
 951                 return 0;
 952         i = *ppos;
 953         if (i < 0)
 954                 return 0;
 955         ep = ((PyDictObject *)op)->ma_table;
 956         mask = ((PyDictObject *)op)->ma_mask;
 957         while (i <= mask && ep[i].me_value == NULL)
 958                 i++;
 959         *ppos = i+1;
 960         if (i > mask)
 961                 return 0;
 962         *phash = (long)(ep[i].me_hash);
 963         if (pkey)
 964                 *pkey = ep[i].me_key;
 965         if (pvalue)
 966                 *pvalue = ep[i].me_value;
 967         return 1;
 968 }
 969
 970 /* Methods */
 971
 972 static void
 973 dict_dealloc(register PyDictObject *mp)
 974 {
 975         register PyDictEntry *ep;
 976         Py_ssize_t fill = mp->ma_fill;
 977         PyObject_GC_UnTrack(mp);
 978         Py_TRASHCAN_SAFE_BEGIN(mp)
 979         for (ep = mp->ma_table; fill > 0; ep++) {
 980                 if (ep->me_key) {
 981                         --fill;
 982                         Py_DECREF(ep->me_key);
 983                         Py_XDECREF(ep->me_value);
 984                 }
 985         }
 986         if (mp->ma_table != mp->ma_smalltable)
 987                 PyMem_DEL(mp->ma_table);
 988         if (numfree < PyDict_MAXFREELIST && Py_TYPE(mp) == &PyDict_Type)
 989                 free_list[numfree++] = mp;
 990         else
 991                 Py_TYPE(mp)->tp_free((PyObject *)mp);
 992         Py_TRASHCAN_SAFE_END(mp)
 993 }
 994
 995 static int
 996 dict_print(register PyDictObject *mp, register FILE *fp, register int flags)
 997 {
 998         register Py_ssize_t i;
 999         register Py_ssize_t any;
1000         int status;
1001
1002         status = Py_ReprEnter((PyObject*)mp);
1003         if (status != 0) {
1004                 if (status < 0)
1005                         return status;
1006                 Py_BEGIN_ALLOW_THREADS
1007                 fprintf(fp, "{...}");
1008                 Py_END_ALLOW_THREADS
1009                 return 0;
1010         }
1011
1012         Py_BEGIN_ALLOW_THREADS
1013         fprintf(fp, "{");
1014         Py_END_ALLOW_THREADS
1015         any = 0;
1016         for (i = 0; i <= mp->ma_mask; i++) {
1017                 PyDictEntry *ep = mp->ma_table + i;
1018                 PyObject *pvalue = ep->me_value;
1019                 if (pvalue != NULL) {
1020                         /* Prevent PyObject_Repr from deleting value during
1021                            key format */
1022                         Py_INCREF(pvalue);
1023                         if (any++ > 0) {
1024                                 Py_BEGIN_ALLOW_THREADS
1025                                 fprintf(fp, ", ");
1026                                 Py_END_ALLOW_THREADS
1027                         }
1028                         if (PyObject_Print((PyObject *)ep->me_key, fp, 0)!=0) {
1029                                 Py_DECREF(pvalue);
1030                                 Py_ReprLeave((PyObject*)mp);
1031                                 return -1;
1032                         }
1033                         Py_BEGIN_ALLOW_THREADS
1034                         fprintf(fp, ": ");
1035                         Py_END_ALLOW_THREADS
1036                         if (PyObject_Print(pvalue, fp, 0) != 0) {
1037                                 Py_DECREF(pvalue);
1038                                 Py_ReprLeave((PyObject*)mp);
1039                                 return -1;
1040                         }
1041                         Py_DECREF(pvalue);
1042                 }
1043         }
1044         Py_BEGIN_ALLOW_THREADS
1045         fprintf(fp, "}");
1046         Py_END_ALLOW_THREADS
1047         Py_ReprLeave((PyObject*)mp);
1048         return 0;
1049 }
1050
1051 static PyObject *
1052 dict_repr(PyDictObject *mp)
1053 {
1054         Py_ssize_t i;
1055         PyObject *s, *temp, *colon = NULL;
1056         PyObject *pieces = NULL, *result = NULL;
1057         PyObject *key, *value;
1058
1059         i = Py_ReprEnter((PyObject *)mp);
1060         if (i != 0) {
1061                 return i > 0 ? PyString_FromString("{...}") : NULL;
1062         }
1063
1064         if (mp->ma_used == 0) {
1065                 result = PyString_FromString("{}");
1066                 goto Done;
1067         }
1068
1069         pieces = PyList_New(0);
1070         if (pieces == NULL)
1071                 goto Done;
1072
1073         colon = PyString_FromString(": ");
1074         if (colon == NULL)
1075                 goto Done;
1076
1077         /* Do repr() on each key+value pair, and insert ": " between them.
1078            Note that repr may mutate the dict. */
1079         i = 0;
1080         while (PyDict_Next((PyObject *)mp, &i, &key, &value)) {
1081                 int status;
1082                 /* Prevent repr from deleting value during key format. */
1083                 Py_INCREF(value);
1084                 s = PyObject_Repr(key);
1085                 PyString_Concat(&s, colon);
1086                 PyString_ConcatAndDel(&s, PyObject_Repr(value));
1087                 Py_DECREF(value);
1088                 if (s == NULL)
1089                         goto Done;
1090                 status = PyList_Append(pieces, s);
1091                 Py_DECREF(s);  /* append created a new ref */
1092                 if (status < 0)
1093                         goto Done;
1094         }
1095
1096         /* Add "{}" decorations to the first and last items. */
1097         assert(PyList_GET_SIZE(pieces) > 0);
1098         s = PyString_FromString("{");
1099         if (s == NULL)
1100                 goto Done;
1101         temp = PyList_GET_ITEM(pieces, 0);
1102         PyString_ConcatAndDel(&s, temp);
1103         PyList_SET_ITEM(pieces, 0, s);
1104         if (s == NULL)
1105                 goto Done;
1106
1107         s = PyString_FromString("}");
1108         if (s == NULL)
1109                 goto Done;
1110         temp = PyList_GET_ITEM(pieces, PyList_GET_SIZE(pieces) - 1);
1111         PyString_ConcatAndDel(&temp, s);
1112         PyList_SET_ITEM(pieces, PyList_GET_SIZE(pieces) - 1, temp);
1113         if (temp == NULL)
1114                 goto Done;
1115
1116         /* Paste them all together with ", " between. */
1117         s = PyString_FromString(", ");
1118         if (s == NULL)
1119                 goto Done;
1120         result = _PyString_Join(s, pieces);
1121         Py_DECREF(s);
1122
1123 Done:
1124         Py_XDECREF(pieces);
1125         Py_XDECREF(colon);
1126         Py_ReprLeave((PyObject *)mp);
1127         return result;
1128 }
1129
1130 static Py_ssize_t
1131 dict_length(PyDictObject *mp)
1132 {
1133         return mp->ma_used;
1134 }
1135
1136 static PyObject *
1137 dict_subscript(PyDictObject *mp, register PyObject *key)
1138 {
1139         PyObject *v;
1140         long hash;
1141         PyDictEntry *ep;
1142         assert(mp->ma_table != NULL);
1143         if (!PyString_CheckExact(key) ||
1144             (hash = ((PyStringObject *) key)->ob_shash) == -1) {
1145                 hash = PyObject_Hash(key);
1146                 if (hash == -1)
1147                         return NULL;
1148         }
1149         ep = (mp->ma_lookup)(mp, key, hash);
1150         if (ep == NULL)
1151                 return NULL;
1152         v = ep->me_value;
1153         if (v == NULL) {
1154                 if (!PyDict_CheckExact(mp)) {
1155                         /* Look up __missing__ method if we're a subclass. */
1156                         PyObject *missing;
1157                         static PyObject *missing_str = NULL;
1158                         if (missing_str == NULL)
1159                                 missing_str =
1160                                   PyString_InternFromString("__missing__");
1161                         missing = _PyType_Lookup(Py_TYPE(mp), missing_str);
1162                         if (missing != NULL)
1163                                 return PyObject_CallFunctionObjArgs(missing,
1164                                         (PyObject *)mp, key, NULL);
1165                 }
1166                 set_key_error(key);
1167                 return NULL;
1168         }
1169         else
1170                 Py_INCREF(v);
1171         return v;
1172 }
1173
1174 static int
1175 dict_ass_sub(PyDictObject *mp, PyObject *v, PyObject *w)
1176 {
1177         if (w == NULL)
1178                 return PyDict_DelItem((PyObject *)mp, v);
1179         else
1180                 return PyDict_SetItem((PyObject *)mp, v, w);
1181 }
1182
/* Mapping-protocol slot table for dict, wiring the three handlers
 * defined above into a PyMappingMethods structure. */
static PyMappingMethods dict_as_mapping = {
        (lenfunc)dict_length, /* mp_length: returns ma_used */
        (binaryfunc)dict_subscript, /* mp_subscript: lookup by key */
        (objobjargproc)dict_ass_sub, /* mp_ass_subscript: set, or delete when value is NULL */
};
1188
1189 static PyObject *
1190 dict_keys(register PyDictObject *mp)
1191 {
1192         register PyObject *v;
1193         register Py_ssize_t i, j;
1194         PyDictEntry *ep;
1195         Py_ssize_t mask, n;
1196
1197   again:
1198         n = mp->ma_used;
1199         v = PyList_New(n);
1200         if (v == NULL)
1201                 return NULL;
1202         if (n != mp->ma_used) {
1203                 /* Durnit.  The allocations caused the dict to resize.
1204                  * Just start over, this shouldn't normally happen.
1205                  */
1206                 Py_DECREF(v);
1207                 goto again;
1208         }
1209         ep = mp->ma_table;
1210         mask = mp->ma_mask;
1211         for (i = 0, j = 0; i <= mask; i++) {
1212                 if (ep[i].me_value != NULL) {
1213                         PyObject *key = ep[i].me_key;
1214                         Py_INCREF(key);
1215                         PyList_SET_ITEM(v, j, key);
1216                         j++;
1217                 }
1218         }
1219         assert(j == n);
1220         return v;
1221 }
1222
1223 static PyObject *
1224 dict_values(register PyDictObject *mp)
1225 {
1226         register PyObject *v;
1227         register Py_ssize_t i, j;
1228         PyDictEntry *ep;
1229         Py_ssize_t mask, n;
1230
1231   again:
1232         n = mp->ma_used;
1233         v = PyList_New(n);
1234         if (v == NULL)
1235                 return NULL;
1236         if (n != mp->ma_used) {
1237                 /* Durnit.  The allocations caused the dict to resize.
1238                  * Just start over, this shouldn't normally happen.
1239                  */
1240                 Py_DECREF(v);
1241                 goto again;
1242         }
1243         ep = mp->ma_table;
1244         mask = mp->ma_mask;
1245         for (i = 0, j = 0; i <= mask; i++) {
1246                 if (ep[i].me_value != NULL) {
1247                         PyObject *value = ep[i].me_value;
1248                         Py_INCREF(value);
1249                         PyList_SET_ITEM(v, j, value);
1250                         j++;
1251                 }
1252         }
1253         assert(j == n);
1254         return v;
1255 }
1256
1257 static PyObject *
1258 dict_items(register PyDictObject *mp)
1259 {
1260         register PyObject *v;
1261         register Py_ssize_t i, j, n;
1262         Py_ssize_t mask;
1263         PyObject *item, *key, *value;
1264         PyDictEntry *ep;
1265
1266         /* Preallocate the list of tuples, to avoid allocations during
1267          * the loop over the items, which could trigger GC, which
1268          * could resize the dict. :-(
1269          */
1270   again:
1271         n = mp->ma_used;
1272         v = PyList_New(n);
1273         if (v == NULL)
1274                 return NULL;
1275         for (i = 0; i < n; i++) {
1276                 item = PyTuple_New(2);
1277                 if (item == NULL) {
1278                         Py_DECREF(v);
1279                         return NULL;
1280                 }
1281                 PyList_SET_ITEM(v, i, item);
1282         }
1283         if (n != mp->ma_used) {
1284                 /* Durnit.  The allocations caused the dict to resize.
1285                  * Just start over, this shouldn't normally happen.
1286                  */
1287                 Py_DECREF(v);
1288                 goto again;
1289         }
1290         /* Nothing we do below makes any function calls. */
1291         ep = mp->ma_table;
1292         mask = mp->ma_mask;
1293         for (i = 0, j = 0; i <= mask; i++) {
1294                 if ((value=ep[i].me_value) != NULL) {
1295                         key = ep[i].me_key;
1296                         item = PyList_GET_ITEM(v, j);
1297                         Py_INCREF(key);
1298                         PyTuple_SET_ITEM(item, 0, key);
1299                         Py_INCREF(value);
1300                         PyTuple_SET_ITEM(item, 1, value);
1301                         j++;
1302                 }
1303         }
1304         assert(j == n);
1305         return v;
1306 }
1307
1308 static PyObject *
1309 dict_fromkeys(PyObject *cls, PyObject *args)
1310 {
1311         PyObject *seq;
1312         PyObject *value = Py_None;
1313         PyObject *it;   /* iter(seq) */
1314         PyObject *key;
1315         PyObject *d;
1316         int status;
1317
1318         if (!PyArg_UnpackTuple(args, "fromkeys", 1, 2, &seq, &value))
1319                 return NULL;
1320
1321         d = PyObject_CallObject(cls, NULL);
1322         if (d == NULL)
1323                 return NULL;
1324
1325         if (PyDict_CheckExact(d) && PyDict_CheckExact(seq)) {
1326                 PyDictObject *mp = (PyDictObject *)d;
1327                 PyObject *oldvalue;
1328                 Py_ssize_t pos = 0;
1329                 PyObject *key;
1330                 long hash;
1331
1332                 if (dictresize(mp, Py_SIZE(seq)))
1333                         return NULL;
1334
1335                 while (_PyDict_Next(seq, &pos, &key, &oldvalue, &hash)) {
1336                         Py_INCREF(key);
1337                         Py_INCREF(value);
1338                         if (insertdict(mp, key, hash, value))
1339                                 return NULL;
1340                 }
1341                 return d;
1342         }
1343
1344         if (PyDict_CheckExact(d) && PyAnySet_CheckExact(seq)) {
1345                 PyDictObject *mp = (PyDictObject *)d;
1346                 Py_ssize_t pos = 0;
1347                 PyObject *key;
1348                 long hash;
1349
1350                 if (dictresize(mp, PySet_GET_SIZE(seq)))
1351                         return NULL;
1352
1353                 while (_PySet_NextEntry(seq, &pos, &key, &hash)) {
1354                         Py_INCREF(key);
1355                         Py_INCREF(value);
1356                         if (insertdict(mp, key, hash, value))
1357                                 return NULL;
1358                 }
1359                 return d;
1360         }
1361
1362         it = PyObject_GetIter(seq);
1363         if (it == NULL){
1364                 Py_DECREF(d);
1365                 return NULL;
1366         }
1367
1368         if (PyDict_CheckExact(d)) {
1369                 while ((key = PyIter_Next(it)) != NULL) {
1370                         status = PyDict_SetItem(d, key, value);
1371                         Py_DECREF(key);
1372                         if (status < 0)
1373                                 goto Fail;
1374                 }
1375         } else {
1376                 while ((key = PyIter_Next(it)) != NULL) {
1377                         status = PyObject_SetItem(d, key, value);
1378                         Py_DECREF(key);
1379                         if (status < 0)
1380                                 goto Fail;
1381                 }
1382         }
1383
1384         if (PyErr_Occurred())
1385                 goto Fail;
1386         Py_DECREF(it);
1387         return d;
1388
1389 Fail:
1390         Py_DECREF(it);
1391         Py_DECREF(d);
1392         return NULL;
1393 }
1394
1395 static int
1396 dict_update_common(PyObject *self, PyObject *args, PyObject *kwds, char *methname)
1397 {
1398         PyObject *arg = NULL;
1399         int result = 0;
1400
1401         if (!PyArg_UnpackTuple(args, methname, 0, 1, &arg))
1402                 result = -1;
1403
1404         else if (arg != NULL) {
1405                 if (PyObject_HasAttrString(arg, "keys"))
1406                         result = PyDict_Merge(self, arg, 1);
1407                 else
1408                         result = PyDict_MergeFromSeq2(self, arg, 1);
1409         }
1410         if (result == 0 && kwds != NULL)
1411                 result = PyDict_Merge(self, kwds, 1);
1412         return result;
1413 }
1414
1415 static PyObject *
1416 dict_update(PyObject *self, PyObject *args, PyObject *kwds)
1417 {
1418         if (dict_update_common(self, args, kwds, "update") != -1)
1419                 Py_RETURN_NONE;
1420         return NULL;
1421 }
1422
1423 /* Update unconditionally replaces existing items.
1424    Merge has a 3rd argument 'override'; if set, it acts like Update,
1425    otherwise it leaves existing items unchanged.
1426
1427    PyDict_{Update,Merge} update/merge from a mapping object.
1428
1429    PyDict_MergeFromSeq2 updates/merges from any iterable object
1430    producing iterable objects of length 2.
1431 */
1432
1433 int
1434 PyDict_MergeFromSeq2(PyObject *d, PyObject *seq2, int override)
1435 {
1436         PyObject *it;   /* iter(seq2) */
1437         Py_ssize_t i;   /* index into seq2 of current element */
1438         PyObject *item; /* seq2[i] */
1439         PyObject *fast; /* item as a 2-tuple or 2-list */
1440
1441         assert(d != NULL);
1442         assert(PyDict_Check(d));
1443         assert(seq2 != NULL);
1444
1445         it = PyObject_GetIter(seq2);
1446         if (it == NULL)
1447                 return -1;
1448
1449         for (i = 0; ; ++i) {
1450                 PyObject *key, *value;
1451                 Py_ssize_t n;
1452
1453                 fast = NULL;
1454                 item = PyIter_Next(it);
1455                 if (item == NULL) {
1456                         if (PyErr_Occurred())
1457                                 goto Fail;
1458                         break;
1459                 }
1460
1461                 /* Convert item to sequence, and verify length 2. */
1462                 fast = PySequence_Fast(item, "");
1463                 if (fast == NULL) {
1464                         if (PyErr_ExceptionMatches(PyExc_TypeError))
1465                                 PyErr_Format(PyExc_TypeError,
1466                                         "cannot convert dictionary update "
1467                                         "sequence element #%zd to a sequence",
1468                                         i);
1469                         goto Fail;
1470                 }
1471                 n = PySequence_Fast_GET_SIZE(fast);
1472                 if (n != 2) {
1473                         PyErr_Format(PyExc_ValueError,
1474                                      "dictionary update sequence element #%zd "
1475                                      "has length %zd; 2 is required",
1476                                      i, n);
1477                         goto Fail;
1478                 }
1479
1480                 /* Update/merge with this (key, value) pair. */
1481                 key = PySequence_Fast_GET_ITEM(fast, 0);
1482                 value = PySequence_Fast_GET_ITEM(fast, 1);
1483                 if (override || PyDict_GetItem(d, key) == NULL) {
1484                         int status = PyDict_SetItem(d, key, value);
1485                         if (status < 0)
1486                                 goto Fail;
1487                 }
1488                 Py_DECREF(fast);
1489                 Py_DECREF(item);
1490         }
1491
1492         i = 0;
1493         goto Return;
1494 Fail:
1495         Py_XDECREF(item);
1496         Py_XDECREF(fast);
1497         i = -1;
1498 Return:
1499         Py_DECREF(it);
1500         return Py_SAFE_DOWNCAST(i, Py_ssize_t, int);
1501 }
1502
1503 int
1504 PyDict_Update(PyObject *a, PyObject *b)
1505 {
1506         return PyDict_Merge(a, b, 1);
1507 }
1508
1509 int
1510 PyDict_Merge(PyObject *a, PyObject *b, int override)
1511 {
1512         register PyDictObject *mp, *other;
1513         register Py_ssize_t i;
1514         PyDictEntry *entry;
1515
1516         /* We accept for the argument either a concrete dictionary object,
1517          * or an abstract "mapping" object.  For the former, we can do
1518          * things quite efficiently.  For the latter, we only require that
1519          * PyMapping_Keys() and PyObject_GetItem() be supported.
1520          */
1521         if (a == NULL || !PyDict_Check(a) || b == NULL) {
1522                 PyErr_BadInternalCall();
1523                 return -1;
1524         }
1525         mp = (PyDictObject*)a;
1526         if (PyDict_Check(b)) {
1527                 other = (PyDictObject*)b;
1528                 if (other == mp || other->ma_used == 0)
1529                         /* a.update(a) or a.update({}); nothing to do */
1530                         return 0;
1531                 if (mp->ma_used == 0)
1532                         /* Since the target dict is empty, PyDict_GetItem()
1533                          * always returns NULL.  Setting override to 1
1534                          * skips the unnecessary test.
1535                          */
1536                         override = 1;
1537                 /* Do one big resize at the start, rather than
1538                  * incrementally resizing as we insert new items.  Expect
1539                  * that there will be no (or few) overlapping keys.
1540                  */
1541                 if ((mp->ma_fill + other->ma_used)*3 >= (mp->ma_mask+1)*2) {
1542                    if (dictresize(mp, (mp->ma_used + other->ma_used)*2) != 0)
1543                            return -1;
1544                 }
1545                 for (i = 0; i <= other->ma_mask; i++) {
1546                         entry = &other->ma_table[i];
1547                         if (entry->me_value != NULL &&
1548                             (override ||
1549                              PyDict_GetItem(a, entry->me_key) == NULL)) {
1550                                 Py_INCREF(entry->me_key);
1551                                 Py_INCREF(entry->me_value);
1552                                 if (insertdict(mp, entry->me_key,
1553                                                (long)entry->me_hash,
1554                                                entry->me_value) != 0)
1555                                         return -1;
1556                         }
1557                 }
1558         }
1559         else {
1560                 /* Do it the generic, slower way */
1561                 PyObject *keys = PyMapping_Keys(b);
1562                 PyObject *iter;
1563                 PyObject *key, *value;
1564                 int status;
1565
1566                 if (keys == NULL)
1567                         /* Docstring says this is equivalent to E.keys() so
1568                          * if E doesn't have a .keys() method we want
1569                          * AttributeError to percolate up.  Might as well
1570                          * do the same for any other error.
1571                          */
1572                         return -1;
1573
1574                 iter = PyObject_GetIter(keys);
1575                 Py_DECREF(keys);
1576                 if (iter == NULL)
1577                         return -1;
1578
1579                 for (key = PyIter_Next(iter); key; key = PyIter_Next(iter)) {
1580                         if (!override && PyDict_GetItem(a, key) != NULL) {
1581                                 Py_DECREF(key);
1582                                 continue;
1583                         }
1584                         value = PyObject_GetItem(b, key);
1585                         if (value == NULL) {
1586                                 Py_DECREF(iter);
1587                                 Py_DECREF(key);
1588                                 return -1;
1589                         }
1590                         status = PyDict_SetItem(a, key, value);
1591                         Py_DECREF(key);
1592                         Py_DECREF(value);
1593                         if (status < 0) {
1594                                 Py_DECREF(iter);
1595                                 return -1;
1596                         }
1597                 }
1598                 Py_DECREF(iter);
1599                 if (PyErr_Occurred())
1600                         /* Iterator completed, via error */
1601                         return -1;
1602         }
1603         return 0;
1604 }
1605
1606 static PyObject *
1607 dict_copy(register PyDictObject *mp)
1608 {
1609         return PyDict_Copy((PyObject*)mp);
1610 }
1611
1612 PyObject *
1613 PyDict_Copy(PyObject *o)
1614 {
1615         PyObject *copy;
1616
1617         if (o == NULL || !PyDict_Check(o)) {
1618                 PyErr_BadInternalCall();
1619                 return NULL;
1620         }
1621         copy = PyDict_New();
1622         if (copy == NULL)
1623                 return NULL;
1624         if (PyDict_Merge(copy, o, 1) == 0)
1625                 return copy;
1626         Py_DECREF(copy);
1627         return NULL;
1628 }
1629
1630 Py_ssize_t
1631 PyDict_Size(PyObject *mp)
1632 {
1633         if (mp == NULL || !PyDict_Check(mp)) {
1634                 PyErr_BadInternalCall();
1635                 return -1;
1636         }
1637         return ((PyDictObject *)mp)->ma_used;
1638 }
1639
1640 PyObject *
1641 PyDict_Keys(PyObject *mp)
1642 {
1643         if (mp == NULL || !PyDict_Check(mp)) {
1644                 PyErr_BadInternalCall();
1645                 return NULL;
1646         }
1647         return dict_keys((PyDictObject *)mp);
1648 }
1649
1650 PyObject *
1651 PyDict_Values(PyObject *mp)
1652 {
1653         if (mp == NULL || !PyDict_Check(mp)) {
1654                 PyErr_BadInternalCall();
1655                 return NULL;
1656         }
1657         return dict_values((PyDictObject *)mp);
1658 }
1659
1660 PyObject *
1661 PyDict_Items(PyObject *mp)
1662 {
1663         if (mp == NULL || !PyDict_Check(mp)) {
1664                 PyErr_BadInternalCall();
1665                 return NULL;
1666         }
1667         return dict_items((PyDictObject *)mp);
1668 }
1669
1670 /* Subroutine which returns the smallest key in a for which b's value
1671    is different or absent.  The value is returned too, through the
1672    pval argument.  Both are NULL if no key in a is found for which b's status
1673    differs.  The refcounts on (and only on) non-NULL *pval and function return
1674    values must be decremented by the caller (characterize() increments them
1675    to ensure that mutating comparison and PyDict_GetItem calls can't delete
1676    them before the caller is done looking at them). */
1677
1678 static PyObject *
1679 characterize(PyDictObject *a, PyDictObject *b, PyObject **pval)
1680 {
1681         PyObject *akey = NULL; /* smallest key in a s.t. a[akey] != b[akey] */
1682         PyObject *aval = NULL; /* a[akey] */
1683         Py_ssize_t i;
1684         int cmp;
1685
1686         for (i = 0; i <= a->ma_mask; i++) {
1687                 PyObject *thiskey, *thisaval, *thisbval;
1688                 if (a->ma_table[i].me_value == NULL)
1689                         continue;
1690                 thiskey = a->ma_table[i].me_key;
1691                 Py_INCREF(thiskey);  /* keep alive across compares */
1692                 if (akey != NULL) {
1693                         cmp = PyObject_RichCompareBool(akey, thiskey, Py_LT);
1694                         if (cmp < 0) {
1695                                 Py_DECREF(thiskey);
1696                                 goto Fail;
1697                         }
1698                         if (cmp > 0 ||
1699                             i > a->ma_mask ||
1700                             a->ma_table[i].me_value == NULL)
1701                         {
1702                                 /* Not the *smallest* a key; or maybe it is
1703                                  * but the compare shrunk the dict so we can't
1704                                  * find its associated value anymore; or
1705                                  * maybe it is but the compare deleted the
1706                                  * a[thiskey] entry.
1707                                  */
1708                                 Py_DECREF(thiskey);
1709                                 continue;
1710                         }
1711                 }
1712
1713                 /* Compare a[thiskey] to b[thiskey]; cmp <- true iff equal. */
1714                 thisaval = a->ma_table[i].me_value;
1715                 assert(thisaval);
1716                 Py_INCREF(thisaval);   /* keep alive */
1717                 thisbval = PyDict_GetItem((PyObject *)b, thiskey);
1718                 if (thisbval == NULL)
1719                         cmp = 0;
1720                 else {
1721                         /* both dicts have thiskey:  same values? */
1722                         cmp = PyObject_RichCompareBool(
1723                                                 thisaval, thisbval, Py_EQ);
1724                         if (cmp < 0) {
1725                                 Py_DECREF(thiskey);
1726                                 Py_DECREF(thisaval);
1727                                 goto Fail;
1728                         }
1729                 }
1730                 if (cmp == 0) {
1731                         /* New winner. */
1732                         Py_XDECREF(akey);
1733                         Py_XDECREF(aval);
1734                         akey = thiskey;
1735                         aval = thisaval;
1736                 }
1737                 else {
1738                         Py_DECREF(thiskey);
1739                         Py_DECREF(thisaval);
1740                 }
1741         }
1742         *pval = aval;
1743         return akey;
1744
1745 Fail:
1746         Py_XDECREF(akey);
1747         Py_XDECREF(aval);
1748         *pval = NULL;
1749         return NULL;
1750 }
1751
1752 static int
1753 dict_compare(PyDictObject *a, PyDictObject *b)
1754 {
1755         PyObject *adiff, *bdiff, *aval, *bval;
1756         int res;
1757
1758         /* Compare lengths first */
1759         if (a->ma_used < b->ma_used)
1760                 return -1;      /* a is shorter */
1761         else if (a->ma_used > b->ma_used)
1762                 return 1;       /* b is shorter */
1763
1764         /* Same length -- check all keys */
1765         bdiff = bval = NULL;
1766         adiff = characterize(a, b, &aval);
1767         if (adiff == NULL) {
1768                 assert(!aval);
1769                 /* Either an error, or a is a subset with the same length so
1770                  * must be equal.
1771                  */
1772                 res = PyErr_Occurred() ? -1 : 0;
1773                 goto Finished;
1774         }
1775         bdiff = characterize(b, a, &bval);
1776         if (bdiff == NULL && PyErr_Occurred()) {
1777                 assert(!bval);
1778                 res = -1;
1779                 goto Finished;
1780         }
1781         res = 0;
1782         if (bdiff) {
1783                 /* bdiff == NULL "should be" impossible now, but perhaps
1784                  * the last comparison done by the characterize() on a had
1785                  * the side effect of making the dicts equal!
1786                  */
1787                 res = PyObject_Compare(adiff, bdiff);
1788         }
1789         if (res == 0 && bval != NULL)
1790                 res = PyObject_Compare(aval, bval);
1791
1792 Finished:
1793         Py_XDECREF(adiff);
1794         Py_XDECREF(bdiff);
1795         Py_XDECREF(aval);
1796         Py_XDECREF(bval);
1797         return res;
1798 }
1799
1800 /* Return 1 if dicts equal, 0 if not, -1 if error.
1801  * Gets out as soon as any difference is detected.
1802  * Uses only Py_EQ comparison.
1803  */
1804 static int
1805 dict_equal(PyDictObject *a, PyDictObject *b)
1806 {
1807         Py_ssize_t i;
1808
1809         if (a->ma_used != b->ma_used)
1810                 /* can't be equal if # of entries differ */
1811                 return 0;
1812
1813         /* Same # of entries -- check all of 'em.  Exit early on any diff. */
1814         for (i = 0; i <= a->ma_mask; i++) {
1815                 PyObject *aval = a->ma_table[i].me_value;
1816                 if (aval != NULL) {
1817                         int cmp;
1818                         PyObject *bval;
1819                         PyObject *key = a->ma_table[i].me_key;
1820                         /* temporarily bump aval's refcount to ensure it stays
1821                            alive until we're done with it */
1822                         Py_INCREF(aval);
1823                         /* ditto for key */
1824                         Py_INCREF(key);
1825                         bval = PyDict_GetItem((PyObject *)b, key);
1826                         Py_DECREF(key);
1827                         if (bval == NULL) {
1828                                 Py_DECREF(aval);
1829                                 return 0;
1830                         }
1831                         cmp = PyObject_RichCompareBool(aval, bval, Py_EQ);
1832                         Py_DECREF(aval);
1833                         if (cmp <= 0)  /* error or not equal */
1834                                 return cmp;
1835                 }
1836         }
1837         return 1;
1838  }
1839
1840 static PyObject *
1841 dict_richcompare(PyObject *v, PyObject *w, int op)
1842 {
1843         int cmp;
1844         PyObject *res;
1845
1846         if (!PyDict_Check(v) || !PyDict_Check(w)) {
1847                 res = Py_NotImplemented;
1848         }
1849         else if (op == Py_EQ || op == Py_NE) {
1850                 cmp = dict_equal((PyDictObject *)v, (PyDictObject *)w);
1851                 if (cmp < 0)
1852                         return NULL;
1853                 res = (cmp == (op == Py_EQ)) ? Py_True : Py_False;
1854         }
1855         else {
1856                 /* Py3K warning if comparison isn't == or !=  */
1857                 if (PyErr_WarnPy3k("dict inequality comparisons not supported "
1858                                    "in 3.x", 1) < 0) {
1859                         return NULL;
1860                 }
1861                 res = Py_NotImplemented;
1862         }
1863         Py_INCREF(res);
1864         return res;
1865  }
1866
1867 static PyObject *
1868 dict_contains(register PyDictObject *mp, PyObject *key)
1869 {
1870         long hash;
1871         PyDictEntry *ep;
1872
1873         if (!PyString_CheckExact(key) ||
1874             (hash = ((PyStringObject *) key)->ob_shash) == -1) {
1875                 hash = PyObject_Hash(key);
1876                 if (hash == -1)
1877                         return NULL;
1878         }
1879         ep = (mp->ma_lookup)(mp, key, hash);
1880         if (ep == NULL)
1881                 return NULL;
1882         return PyBool_FromLong(ep->me_value != NULL);
1883 }
1884
1885 static PyObject *
1886 dict_has_key(register PyDictObject *mp, PyObject *key)
1887 {
1888         if (PyErr_WarnPy3k("dict.has_key() not supported in 3.x; "
1889                            "use the in operator", 1) < 0)
1890                 return NULL;
1891         return dict_contains(mp, key);
1892 }
1893
1894 static PyObject *
1895 dict_get(register PyDictObject *mp, PyObject *args)
1896 {
1897         PyObject *key;
1898         PyObject *failobj = Py_None;
1899         PyObject *val = NULL;
1900         long hash;
1901         PyDictEntry *ep;
1902
1903         if (!PyArg_UnpackTuple(args, "get", 1, 2, &key, &failobj))
1904                 return NULL;
1905
1906         if (!PyString_CheckExact(key) ||
1907             (hash = ((PyStringObject *) key)->ob_shash) == -1) {
1908                 hash = PyObject_Hash(key);
1909                 if (hash == -1)
1910                         return NULL;
1911         }
1912         ep = (mp->ma_lookup)(mp, key, hash);
1913         if (ep == NULL)
1914                 return NULL;
1915         val = ep->me_value;
1916         if (val == NULL)
1917                 val = failobj;
1918         Py_INCREF(val);
1919         return val;
1920 }
1921
1922
1923 static PyObject *
1924 dict_setdefault(register PyDictObject *mp, PyObject *args)
1925 {
1926         PyObject *key;
1927         PyObject *failobj = Py_None;
1928         PyObject *val = NULL;
1929         long hash;
1930         PyDictEntry *ep;
1931
1932         if (!PyArg_UnpackTuple(args, "setdefault", 1, 2, &key, &failobj))
1933                 return NULL;
1934
1935         if (!PyString_CheckExact(key) ||
1936             (hash = ((PyStringObject *) key)->ob_shash) == -1) {
1937                 hash = PyObject_Hash(key);
1938                 if (hash == -1)
1939                         return NULL;
1940         }
1941         ep = (mp->ma_lookup)(mp, key, hash);
1942         if (ep == NULL)
1943                 return NULL;
1944         val = ep->me_value;
1945         if (val == NULL) {
1946                 val = failobj;
1947                 if (PyDict_SetItem((PyObject*)mp, key, failobj))
1948                         val = NULL;
1949         }
1950         Py_XINCREF(val);
1951         return val;
1952 }
1953
1954
1955 static PyObject *
1956 dict_clear(register PyDictObject *mp)
1957 {
1958         PyDict_Clear((PyObject *)mp);
1959         Py_RETURN_NONE;
1960 }
1961
1962 static PyObject *
1963 dict_pop(PyDictObject *mp, PyObject *args)
1964 {
1965         long hash;
1966         PyDictEntry *ep;
1967         PyObject *old_value, *old_key;
1968         PyObject *key, *deflt = NULL;
1969
1970         if(!PyArg_UnpackTuple(args, "pop", 1, 2, &key, &deflt))
1971                 return NULL;
1972         if (mp->ma_used == 0) {
1973                 if (deflt) {
1974                         Py_INCREF(deflt);
1975                         return deflt;
1976                 }
1977                 PyErr_SetString(PyExc_KeyError,
1978                                 "pop(): dictionary is empty");
1979                 return NULL;
1980         }
1981         if (!PyString_CheckExact(key) ||
1982             (hash = ((PyStringObject *) key)->ob_shash) == -1) {
1983                 hash = PyObject_Hash(key);
1984                 if (hash == -1)
1985                         return NULL;
1986         }
1987         ep = (mp->ma_lookup)(mp, key, hash);
1988         if (ep == NULL)
1989                 return NULL;
1990         if (ep->me_value == NULL) {
1991                 if (deflt) {
1992                         Py_INCREF(deflt);
1993                         return deflt;
1994                 }
1995                 set_key_error(key);
1996                 return NULL;
1997         }
1998         old_key = ep->me_key;
1999         Py_INCREF(dummy);
2000         ep->me_key = dummy;
2001         old_value = ep->me_value;
2002         ep->me_value = NULL;
2003         mp->ma_used--;
2004         Py_DECREF(old_key);
2005         return old_value;
2006 }
2007
/* dict.popitem(): remove some (key, value) pair from the dict and return
 * it as a new 2-tuple.  Raises KeyError if the dict is empty; returns NULL
 * in that case or if the result tuple cannot be allocated.
 */
static PyObject *
dict_popitem(PyDictObject *mp)
{
        Py_ssize_t i = 0;
        PyDictEntry *ep;
        PyObject *res;

        /* Allocate the result tuple before checking the size.  Believe it
         * or not, this allocation could trigger a garbage collection which
         * could empty the dict, so if we checked the size first and that
         * happened, the result would be an infinite loop (searching for an
         * entry that no longer exists).  Note that the usual popitem()
         * idiom is "while d: k, v = d.popitem()". so needing to throw the
         * tuple away if the dict *is* empty isn't a significant
         * inefficiency -- possible, but unlikely in practice.
         */
        res = PyTuple_New(2);
        if (res == NULL)
                return NULL;
        if (mp->ma_used == 0) {
                Py_DECREF(res);
                PyErr_SetString(PyExc_KeyError,
                                "popitem(): dictionary is empty");
                return NULL;
        }
        /* Set ep to "the first" dict entry with a value.  We abuse the hash
         * field of slot 0 to hold a search finger:
         * If slot 0 has a value, use slot 0.
         * Else slot 0 is being used to hold a search finger,
         * and we use its hash value as the first index to look.
         */
        ep = &mp->ma_table[0];
        if (ep->me_value == NULL) {
                i = ep->me_hash;
                /* The hash field may be a real hash value, or it may be a
                 * legit search finger, or it may be a once-legit search
                 * finger that's out of bounds now because it wrapped around
                 * or the table shrunk -- simply make sure it's in bounds now.
                 */
                if (i > mp->ma_mask || i < 1)
                        i = 1;  /* skip slot 0 */
                /* ma_used != 0 was checked above, so some slot has a value
                 * and this scan terminates.
                 */
                while ((ep = &mp->ma_table[i])->me_value == NULL) {
                        i++;
                        if (i > mp->ma_mask)
                                i = 1;
                }
        }
        /* No INCREF here: the key and value pointers are moved from the
         * slot into the tuple, and the slot is overwritten right below.
         */
        PyTuple_SET_ITEM(res, 0, ep->me_key);
        PyTuple_SET_ITEM(res, 1, ep->me_value);
        Py_INCREF(dummy);
        ep->me_key = dummy;
        ep->me_value = NULL;
        mp->ma_used--;
        assert(mp->ma_table[0].me_value == NULL);
        mp->ma_table[0].me_hash = i + 1;  /* next place to start */
        return res;
}
2065
2066 static int
2067 dict_traverse(PyObject *op, visitproc visit, void *arg)
2068 {
2069         Py_ssize_t i = 0;
2070         PyObject *pk;
2071         PyObject *pv;
2072
2073         while (PyDict_Next(op, &i, &pk, &pv)) {
2074                 Py_VISIT(pk);
2075                 Py_VISIT(pv);
2076         }
2077         return 0;
2078 }
2079
2080 static int
2081 dict_tp_clear(PyObject *op)
2082 {
2083         PyDict_Clear(op);
2084         return 0;
2085 }
2086
2087
/* Forward declarations: the iterator type objects and dictiter_new() are
 * defined further down in this file, but the dict_iter*() methods below
 * need to refer to them already.
 */
extern PyTypeObject PyDictIterKey_Type; /* Forward */
extern PyTypeObject PyDictIterValue_Type; /* Forward */
extern PyTypeObject PyDictIterItem_Type; /* Forward */
static PyObject *dictiter_new(PyDictObject *, PyTypeObject *);
2092
2093 static PyObject *
2094 dict_iterkeys(PyDictObject *dict)
2095 {
2096         return dictiter_new(dict, &PyDictIterKey_Type);
2097 }
2098
2099 static PyObject *
2100 dict_itervalues(PyDictObject *dict)
2101 {
2102         return dictiter_new(dict, &PyDictIterValue_Type);
2103 }
2104
2105 static PyObject *
2106 dict_iteritems(PyDictObject *dict)
2107 {
2108         return dictiter_new(dict, &PyDictIterItem_Type);
2109 }
2110
2111 static PyObject *
2112 dict_sizeof(PyDictObject *mp)
2113 {
2114         Py_ssize_t res;
2115
2116         res = sizeof(PyDictObject);
2117         if (mp->ma_table != mp->ma_smalltable)
2118                 res = res + (mp->ma_mask + 1) * sizeof(PyDictEntry);
2119         return PyInt_FromSsize_t(res);
2120 }
2121
/* Docstrings for the dict methods; each one is referenced by the matching
 * entry of the mapp_methods table below.
 */
PyDoc_STRVAR(has_key__doc__,
"D.has_key(k) -> True if D has a key k, else False");

PyDoc_STRVAR(contains__doc__,
"D.__contains__(k) -> True if D has a key k, else False");

PyDoc_STRVAR(getitem__doc__, "x.__getitem__(y) <==> x[y]");

PyDoc_STRVAR(sizeof__doc__,
"D.__sizeof__() -> size of D in memory, in bytes");

PyDoc_STRVAR(get__doc__,
"D.get(k[,d]) -> D[k] if k in D, else d.  d defaults to None.");

PyDoc_STRVAR(setdefault_doc__,
"D.setdefault(k[,d]) -> D.get(k,d), also set D[k]=d if k not in D");

PyDoc_STRVAR(pop__doc__,
"D.pop(k[,d]) -> v, remove specified key and return the corresponding value.\n\
If key is not found, d is returned if given, otherwise KeyError is raised");

PyDoc_STRVAR(popitem__doc__,
"D.popitem() -> (k, v), remove and return some (key, value) pair as a\n\
2-tuple; but raise KeyError if D is empty.");

PyDoc_STRVAR(keys__doc__,
"D.keys() -> list of D's keys");

PyDoc_STRVAR(items__doc__,
"D.items() -> list of D's (key, value) pairs, as 2-tuples");

PyDoc_STRVAR(values__doc__,
"D.values() -> list of D's values");

PyDoc_STRVAR(update__doc__,
"D.update(E, **F) -> None.  Update D from dict/iterable E and F.\n"
"If E has a .keys() method, does:     for k in E: D[k] = E[k]\n\
If E lacks .keys() method, does:     for (k, v) in E: D[k] = v\n\
In either case, this is followed by: for k in F: D[k] = F[k]");

PyDoc_STRVAR(fromkeys__doc__,
"dict.fromkeys(S[,v]) -> New dict with keys from S and values equal to v.\n\
v defaults to None.");

PyDoc_STRVAR(clear__doc__,
"D.clear() -> None.  Remove all items from D.");

PyDoc_STRVAR(copy__doc__,
"D.copy() -> a shallow copy of D");

PyDoc_STRVAR(iterkeys__doc__,
"D.iterkeys() -> an iterator over the keys of D");

PyDoc_STRVAR(itervalues__doc__,
"D.itervalues() -> an iterator over the values of D");

PyDoc_STRVAR(iteritems__doc__,
"D.iteritems() -> an iterator over the (key, value) items of D");
2180
/* Method table for dict, installed as tp_methods of PyDict_Type.  Each
 * entry gives the Python-level name, the C implementation, the calling
 * convention flags and the docstring.  The table ends with a NULL sentinel.
 */
static PyMethodDef mapp_methods[] = {
        {"__contains__",(PyCFunction)dict_contains,     METH_O | METH_COEXIST,
         contains__doc__},
        {"__getitem__", (PyCFunction)dict_subscript,    METH_O | METH_COEXIST,
         getitem__doc__},
        {"__sizeof__",  (PyCFunction)dict_sizeof,       METH_NOARGS,
         sizeof__doc__},
        {"has_key",     (PyCFunction)dict_has_key,      METH_O,
         has_key__doc__},
        {"get",         (PyCFunction)dict_get,          METH_VARARGS,
         get__doc__},
        {"setdefault",  (PyCFunction)dict_setdefault,   METH_VARARGS,
         setdefault_doc__},
        {"pop",         (PyCFunction)dict_pop,          METH_VARARGS,
         pop__doc__},
        {"popitem",     (PyCFunction)dict_popitem,      METH_NOARGS,
         popitem__doc__},
        {"keys",        (PyCFunction)dict_keys,         METH_NOARGS,
        keys__doc__},
        {"items",       (PyCFunction)dict_items,        METH_NOARGS,
         items__doc__},
        {"values",      (PyCFunction)dict_values,       METH_NOARGS,
         values__doc__},
        {"update",      (PyCFunction)dict_update,       METH_VARARGS | METH_KEYWORDS,
         update__doc__},
        {"fromkeys",    (PyCFunction)dict_fromkeys,     METH_VARARGS | METH_CLASS,
         fromkeys__doc__},
        {"clear",       (PyCFunction)dict_clear,        METH_NOARGS,
         clear__doc__},
        {"copy",        (PyCFunction)dict_copy,         METH_NOARGS,
         copy__doc__},
        {"iterkeys",    (PyCFunction)dict_iterkeys,     METH_NOARGS,
         iterkeys__doc__},
        {"itervalues",  (PyCFunction)dict_itervalues,   METH_NOARGS,
         itervalues__doc__},
        {"iteritems",   (PyCFunction)dict_iteritems,    METH_NOARGS,
         iteritems__doc__},
        {NULL,          NULL}   /* sentinel */
};
2220
2221 /* Return 1 if `key` is in dict `op`, 0 if not, and -1 on error. */
2222 int
2223 PyDict_Contains(PyObject *op, PyObject *key)
2224 {
2225         long hash;
2226         PyDictObject *mp = (PyDictObject *)op;
2227         PyDictEntry *ep;
2228
2229         if (!PyString_CheckExact(key) ||
2230             (hash = ((PyStringObject *) key)->ob_shash) == -1) {
2231                 hash = PyObject_Hash(key);
2232                 if (hash == -1)
2233                         return -1;
2234         }
2235         ep = (mp->ma_lookup)(mp, key, hash);
2236         return ep == NULL ? -1 : (ep->me_value != NULL);
2237 }
2238
2239 /* Internal version of PyDict_Contains used when the hash value is already known */
2240 int
2241 _PyDict_Contains(PyObject *op, PyObject *key, long hash)
2242 {
2243         PyDictObject *mp = (PyDictObject *)op;
2244         PyDictEntry *ep;
2245
2246         ep = (mp->ma_lookup)(mp, key, hash);
2247         return ep == NULL ? -1 : (ep->me_value != NULL);
2248 }
2249
/* Hack to implement "key in dict": dict is not a sequence, so every slot
 * of this table is left empty except sq_contains, which is set to
 * PyDict_Contains.
 */
static PySequenceMethods dict_as_sequence = {
        0,                      /* sq_length */
        0,                      /* sq_concat */
        0,                      /* sq_repeat */
        0,                      /* sq_item */
        0,                      /* sq_slice */
        0,                      /* sq_ass_item */
        0,                      /* sq_ass_slice */
        PyDict_Contains,        /* sq_contains */
        0,                      /* sq_inplace_concat */
        0,                      /* sq_inplace_repeat */
};
2263
2264 static PyObject *
2265 dict_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
2266 {
2267         PyObject *self;
2268
2269         assert(type != NULL && type->tp_alloc != NULL);
2270         self = type->tp_alloc(type, 0);
2271         if (self != NULL) {
2272                 PyDictObject *d = (PyDictObject *)self;
2273                 /* It's guaranteed that tp->alloc zeroed out the struct. */
2274                 assert(d->ma_table == NULL && d->ma_fill == 0 && d->ma_used == 0);
2275                 INIT_NONZERO_DICT_SLOTS(d);
2276                 d->ma_lookup = lookdict_string;
2277                 /* The object has been implicitely tracked by tp_alloc */
2278                 if (type == &PyDict_Type)
2279                         _PyObject_GC_UNTRACK(d);
2280 #ifdef SHOW_CONVERSION_COUNTS
2281                 ++created;
2282 #endif
2283 #ifdef SHOW_TRACK_COUNT
2284                 if (_PyObject_GC_IS_TRACKED(d))
2285                         count_tracked++;
2286                 else
2287                         count_untracked++;
2288 #endif
2289         }
2290         return self;
2291 }
2292
2293 static int
2294 dict_init(PyObject *self, PyObject *args, PyObject *kwds)
2295 {
2296         return dict_update_common(self, args, kwds, "dict");
2297 }
2298
2299 static PyObject *
2300 dict_iter(PyDictObject *dict)
2301 {
2302         return dictiter_new(dict, &PyDictIterKey_Type);
2303 }
2304
/* Docstring of the dict type itself; installed as tp_doc of PyDict_Type. */
PyDoc_STRVAR(dictionary_doc,
"dict() -> new empty dictionary.\n"
"dict(mapping) -> new dictionary initialized from a mapping object's\n"
"    (key, value) pairs.\n"
"dict(seq) -> new dictionary initialized as if via:\n"
"    d = {}\n"
"    for k, v in seq:\n"
"        d[k] = v\n"
"dict(**kwargs) -> new dictionary initialized with the name=value pairs\n"
"    in the keyword argument list.  For example:  dict(one=1, two=2)");
2315
/* The dict type object.  The initializer is positional: every entry must
 * stay in the slot order named by the trailing comments, and a 0 leaves
 * that slot empty.
 */
PyTypeObject PyDict_Type = {
        PyVarObject_HEAD_INIT(&PyType_Type, 0)
        "dict",
        sizeof(PyDictObject),
        0,
        (destructor)dict_dealloc,               /* tp_dealloc */
        (printfunc)dict_print,                  /* tp_print */
        0,                                      /* tp_getattr */
        0,                                      /* tp_setattr */
        (cmpfunc)dict_compare,                  /* tp_compare */
        (reprfunc)dict_repr,                    /* tp_repr */
        0,                                      /* tp_as_number */
        &dict_as_sequence,                      /* tp_as_sequence */
        &dict_as_mapping,                       /* tp_as_mapping */
        (hashfunc)PyObject_HashNotImplemented,  /* tp_hash */
        0,                                      /* tp_call */
        0,                                      /* tp_str */
        PyObject_GenericGetAttr,                /* tp_getattro */
        0,                                      /* tp_setattro */
        0,                                      /* tp_as_buffer */
        Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC |
                Py_TPFLAGS_BASETYPE | Py_TPFLAGS_DICT_SUBCLASS, /* tp_flags */
        dictionary_doc,                         /* tp_doc */
        dict_traverse,                          /* tp_traverse */
        dict_tp_clear,                          /* tp_clear */
        dict_richcompare,                       /* tp_richcompare */
        0,                                      /* tp_weaklistoffset */
        (getiterfunc)dict_iter,                 /* tp_iter */
        0,                                      /* tp_iternext */
        mapp_methods,                           /* tp_methods */
        0,                                      /* tp_members */
        0,                                      /* tp_getset */
        0,                                      /* tp_base */
        0,                                      /* tp_dict */
        0,                                      /* tp_descr_get */
        0,                                      /* tp_descr_set */
        0,                                      /* tp_dictoffset */
        dict_init,                              /* tp_init */
        PyType_GenericAlloc,                    /* tp_alloc */
        dict_new,                               /* tp_new */
        PyObject_GC_Del,                        /* tp_free */
};
2358
2359 /* For backward compatibility with old dictionary interface */
2360
2361 PyObject *
2362 PyDict_GetItemString(PyObject *v, const char *key)
2363 {
2364         PyObject *kv, *rv;
2365         kv = PyString_FromString(key);
2366         if (kv == NULL)
2367                 return NULL;
2368         rv = PyDict_GetItem(v, kv);
2369         Py_DECREF(kv);
2370         return rv;
2371 }
2372
2373 int
2374 PyDict_SetItemString(PyObject *v, const char *key, PyObject *item)
2375 {
2376         PyObject *kv;
2377         int err;
2378         kv = PyString_FromString(key);
2379         if (kv == NULL)
2380                 return -1;
2381         PyString_InternInPlace(&kv); /* XXX Should we really? */
2382         err = PyDict_SetItem(v, kv, item);
2383         Py_DECREF(kv);
2384         return err;
2385 }
2386
2387 int
2388 PyDict_DelItemString(PyObject *v, const char *key)
2389 {
2390         PyObject *kv;
2391         int err;
2392         kv = PyString_FromString(key);
2393         if (kv == NULL)
2394                 return -1;
2395         err = PyDict_DelItem(v, kv);
2396         Py_DECREF(kv);
2397         return err;
2398 }
2399
2400 /* Dictionary iterator types */
2401
/* Iterator state shared by the key, value and item iterator types. */
typedef struct {
        PyObject_HEAD
        PyDictObject *di_dict; /* Set to NULL when iterator is exhausted */
        Py_ssize_t di_used; /* dict's ma_used at creation; a mismatch means
                               the dict changed size (-1 makes it sticky) */
        Py_ssize_t di_pos; /* next table index to examine */
        PyObject* di_result; /* reusable result tuple for iteritems */
        Py_ssize_t len; /* items left to yield; reported by __length_hint__ */
} dictiterobject;
2410
2411 static PyObject *
2412 dictiter_new(PyDictObject *dict, PyTypeObject *itertype)
2413 {
2414         dictiterobject *di;
2415         di = PyObject_GC_New(dictiterobject, itertype);
2416         if (di == NULL)
2417                 return NULL;
2418         Py_INCREF(dict);
2419         di->di_dict = dict;
2420         di->di_used = dict->ma_used;
2421         di->di_pos = 0;
2422         di->len = dict->ma_used;
2423         if (itertype == &PyDictIterItem_Type) {
2424                 di->di_result = PyTuple_Pack(2, Py_None, Py_None);
2425                 if (di->di_result == NULL) {
2426                         Py_DECREF(di);
2427                         return NULL;
2428                 }
2429         }
2430         else
2431                 di->di_result = NULL;
2432         _PyObject_GC_TRACK(di);
2433         return (PyObject *)di;
2434 }
2435
2436 static void
2437 dictiter_dealloc(dictiterobject *di)
2438 {
2439         Py_XDECREF(di->di_dict);
2440         Py_XDECREF(di->di_result);
2441         PyObject_GC_Del(di);
2442 }
2443
2444 static int
2445 dictiter_traverse(dictiterobject *di, visitproc visit, void *arg)
2446 {
2447         Py_VISIT(di->di_dict);
2448         Py_VISIT(di->di_result);
2449         return 0;
2450 }
2451
2452 static PyObject *
2453 dictiter_len(dictiterobject *di)
2454 {
2455         Py_ssize_t len = 0;
2456         if (di->di_dict != NULL && di->di_used == di->di_dict->ma_used)
2457                 len = di->len;
2458         return PyInt_FromSize_t(len);
2459 }
2460
/* Docstring attached to the __length_hint__ entry below. */
PyDoc_STRVAR(length_hint_doc, "Private method returning an estimate of len(list(it)).");

/* Method table referenced by the key, value and item iterator types;
 * it exposes dictiter_len() as the no-argument method __length_hint__. */
static PyMethodDef dictiter_methods[] = {
        {"__length_hint__", (PyCFunction)dictiter_len, METH_NOARGS, length_hint_doc},
        {NULL,          NULL}           /* sentinel */
};
2467
2468 static PyObject *dictiter_iternextkey(dictiterobject *di)
2469 {
2470         PyObject *key;
2471         register Py_ssize_t i, mask;
2472         register PyDictEntry *ep;
2473         PyDictObject *d = di->di_dict;
2474
2475         if (d == NULL)
2476                 return NULL;
2477         assert (PyDict_Check(d));
2478
2479         if (di->di_used != d->ma_used) {
2480                 PyErr_SetString(PyExc_RuntimeError,
2481                                 "dictionary changed size during iteration");
2482                 di->di_used = -1; /* Make this state sticky */
2483                 return NULL;
2484         }
2485
2486         i = di->di_pos;
2487         if (i < 0)
2488                 goto fail;
2489         ep = d->ma_table;
2490         mask = d->ma_mask;
2491         while (i <= mask && ep[i].me_value == NULL)
2492                 i++;
2493         di->di_pos = i+1;
2494         if (i > mask)
2495                 goto fail;
2496         di->len--;
2497         key = ep[i].me_key;
2498         Py_INCREF(key);
2499         return key;
2500
2501 fail:
2502         Py_DECREF(d);
2503         di->di_dict = NULL;
2504         return NULL;
2505 }
2506
/* Type object for dict key iterators: GC-enabled, self-iterating, with
 * dictiter_iternextkey as its tp_iternext and the shared dealloc,
 * traverse and method table. */
PyTypeObject PyDictIterKey_Type = {
        PyVarObject_HEAD_INIT(&PyType_Type, 0)
        "dictionary-keyiterator",               /* tp_name */
        sizeof(dictiterobject),                 /* tp_basicsize */
        0,                                      /* tp_itemsize */
        /* methods */
        (destructor)dictiter_dealloc,           /* tp_dealloc */
        0,                                      /* tp_print */
        0,                                      /* tp_getattr */
        0,                                      /* tp_setattr */
        0,                                      /* tp_compare */
        0,                                      /* tp_repr */
        0,                                      /* tp_as_number */
        0,                                      /* tp_as_sequence */
        0,                                      /* tp_as_mapping */
        0,                                      /* tp_hash */
        0,                                      /* tp_call */
        0,                                      /* tp_str */
        PyObject_GenericGetAttr,                /* tp_getattro */
        0,                                      /* tp_setattro */
        0,                                      /* tp_as_buffer */
        Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
        0,                                      /* tp_doc */
        (traverseproc)dictiter_traverse,        /* tp_traverse */
        0,                                      /* tp_clear */
        0,                                      /* tp_richcompare */
        0,                                      /* tp_weaklistoffset */
        PyObject_SelfIter,                      /* tp_iter */
        (iternextfunc)dictiter_iternextkey,     /* tp_iternext */
        dictiter_methods,                       /* tp_methods */
        0,                                      /* slot following tp_methods (tp_members per the documented PyTypeObject layout) */
};
2539
2540 static PyObject *dictiter_iternextvalue(dictiterobject *di)
2541 {
2542         PyObject *value;
2543         register Py_ssize_t i, mask;
2544         register PyDictEntry *ep;
2545         PyDictObject *d = di->di_dict;
2546
2547         if (d == NULL)
2548                 return NULL;
2549         assert (PyDict_Check(d));
2550
2551         if (di->di_used != d->ma_used) {
2552                 PyErr_SetString(PyExc_RuntimeError,
2553                                 "dictionary changed size during iteration");
2554                 di->di_used = -1; /* Make this state sticky */
2555                 return NULL;
2556         }
2557
2558         i = di->di_pos;
2559         mask = d->ma_mask;
2560         if (i < 0 || i > mask)
2561                 goto fail;
2562         ep = d->ma_table;
2563         while ((value=ep[i].me_value) == NULL) {
2564                 i++;
2565                 if (i > mask)
2566                         goto fail;
2567         }
2568         di->di_pos = i+1;
2569         di->len--;
2570         Py_INCREF(value);
2571         return value;
2572
2573 fail:
2574         Py_DECREF(d);
2575         di->di_dict = NULL;
2576         return NULL;
2577 }
2578
/* Type object for dict value iterators: GC-enabled, self-iterating, with
 * dictiter_iternextvalue as its tp_iternext and the shared dealloc,
 * traverse and method table. */
PyTypeObject PyDictIterValue_Type = {
        PyVarObject_HEAD_INIT(&PyType_Type, 0)
        "dictionary-valueiterator",             /* tp_name */
        sizeof(dictiterobject),                 /* tp_basicsize */
        0,                                      /* tp_itemsize */
        /* methods */
        (destructor)dictiter_dealloc,           /* tp_dealloc */
        0,                                      /* tp_print */
        0,                                      /* tp_getattr */
        0,                                      /* tp_setattr */
        0,                                      /* tp_compare */
        0,                                      /* tp_repr */
        0,                                      /* tp_as_number */
        0,                                      /* tp_as_sequence */
        0,                                      /* tp_as_mapping */
        0,                                      /* tp_hash */
        0,                                      /* tp_call */
        0,                                      /* tp_str */
        PyObject_GenericGetAttr,                /* tp_getattro */
        0,                                      /* tp_setattro */
        0,                                      /* tp_as_buffer */
        Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
        0,                                      /* tp_doc */
        (traverseproc)dictiter_traverse,        /* tp_traverse */
        0,                                      /* tp_clear */
        0,                                      /* tp_richcompare */
        0,                                      /* tp_weaklistoffset */
        PyObject_SelfIter,                      /* tp_iter */
        (iternextfunc)dictiter_iternextvalue,   /* tp_iternext */
        dictiter_methods,                       /* tp_methods */
        0,                                      /* slot following tp_methods (tp_members per the documented PyTypeObject layout) */
};
2611
2612 static PyObject *dictiter_iternextitem(dictiterobject *di)
2613 {
2614         PyObject *key, *value, *result = di->di_result;
2615         register Py_ssize_t i, mask;
2616         register PyDictEntry *ep;
2617         PyDictObject *d = di->di_dict;
2618
2619         if (d == NULL)
2620                 return NULL;
2621         assert (PyDict_Check(d));
2622
2623         if (di->di_used != d->ma_used) {
2624                 PyErr_SetString(PyExc_RuntimeError,
2625                                 "dictionary changed size during iteration");
2626                 di->di_used = -1; /* Make this state sticky */
2627                 return NULL;
2628         }
2629
2630         i = di->di_pos;
2631         if (i < 0)
2632                 goto fail;
2633         ep = d->ma_table;
2634         mask = d->ma_mask;
2635         while (i <= mask && ep[i].me_value == NULL)
2636                 i++;
2637         di->di_pos = i+1;
2638         if (i > mask)
2639                 goto fail;
2640
2641         if (result->ob_refcnt == 1) {
2642                 Py_INCREF(result);
2643                 Py_DECREF(PyTuple_GET_ITEM(result, 0));
2644                 Py_DECREF(PyTuple_GET_ITEM(result, 1));
2645         } else {
2646                 result = PyTuple_New(2);
2647                 if (result == NULL)
2648                         return NULL;
2649         }
2650         di->len--;
2651         key = ep[i].me_key;
2652         value = ep[i].me_value;
2653         Py_INCREF(key);
2654         Py_INCREF(value);
2655         PyTuple_SET_ITEM(result, 0, key);
2656         PyTuple_SET_ITEM(result, 1, value);
2657         return result;
2658
2659 fail:
2660         Py_DECREF(d);
2661         di->di_dict = NULL;
2662         return NULL;
2663 }
2664
/* Type object for dict item iterators: GC-enabled, self-iterating, with
 * dictiter_iternextitem as its tp_iternext and the shared dealloc,
 * traverse and method table.  dictiter_new() compares against this
 * type's address to decide whether to preallocate a result tuple. */
PyTypeObject PyDictIterItem_Type = {
        PyVarObject_HEAD_INIT(&PyType_Type, 0)
        "dictionary-itemiterator",              /* tp_name */
        sizeof(dictiterobject),                 /* tp_basicsize */
        0,                                      /* tp_itemsize */
        /* methods */
        (destructor)dictiter_dealloc,           /* tp_dealloc */
        0,                                      /* tp_print */
        0,                                      /* tp_getattr */
        0,                                      /* tp_setattr */
        0,                                      /* tp_compare */
        0,                                      /* tp_repr */
        0,                                      /* tp_as_number */
        0,                                      /* tp_as_sequence */
        0,                                      /* tp_as_mapping */
        0,                                      /* tp_hash */
        0,                                      /* tp_call */
        0,                                      /* tp_str */
        PyObject_GenericGetAttr,                /* tp_getattro */
        0,                                      /* tp_setattro */
        0,                                      /* tp_as_buffer */
        Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,/* tp_flags */
        0,                                      /* tp_doc */
        (traverseproc)dictiter_traverse,        /* tp_traverse */
        0,                                      /* tp_clear */
        0,                                      /* tp_richcompare */
        0,                                      /* tp_weaklistoffset */
        PyObject_SelfIter,                      /* tp_iter */
        (iternextfunc)dictiter_iternextitem,    /* tp_iternext */
        dictiter_methods,                       /* tp_methods */
        0,                                      /* slot following tp_methods (tp_members per the documented PyTypeObject layout) */
};