@@ -564,10 +564,25 @@ def __hash__(self):
564
564
try :
565
565
dinv = pow (self ._denominator , - 1 , _PyHASH_MODULUS )
566
566
except ValueError :
567
- # ValueError means there is no modular inverse
567
+ # ValueError means there is no modular inverse.
568
568
hash_ = _PyHASH_INF
569
569
else :
570
- hash_ = hash (abs (self ._numerator )) * dinv % _PyHASH_MODULUS
570
+ # The general algorithm now specifies that the absolute value of
571
+ # the hash is
572
+ # (|N| * dinv) % P
573
+ # where N is self._numerator and P is _PyHASH_MODULUS. That's
574
+ # optimized here in two ways: first, for a non-negative int i,
575
+ # hash(i) == i % P, but the int hash implementation doesn't need
576
+ # to divide, and is faster than doing % P explicitly. So we do
577
+ # hash(|N| * dinv)
578
+ # instead. Second, N is unbounded, so its product with dinv may
579
+ # be arbitrarily expensive to compute. The final answer is the
580
+ # same if we use the bounded |N| % P instead, which can again
581
+ # be done with an int hash() call. If 0 <= i < P, hash(i) == i,
582
+ # so this nested hash() call wastes a bit of time making a
583
+ # redundant copy when |N| < P, but can save an arbitrarily large
584
+ # amount of computation for large |N|.
585
+ hash_ = hash (hash (abs (self ._numerator )) * dinv )
571
586
result = hash_ if self ._numerator >= 0 else - hash_
572
587
return - 2 if result == - 1 else result
573
588
0 commit comments