| Guido van Rossum | e7b146f | 2000-02-04 15:28:42 +0000 | [diff] [blame] | 1 | """Random variable generators. | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 2 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 3 |     integers | 
 | 4 |     -------- | 
 | 5 |            uniform within range | 
 | 6 |  | 
 | 7 |     sequences | 
 | 8 |     --------- | 
 | 9 |            pick random element | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 10 |            pick random sample | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 11 |            generate random permutation | 
 | 12 |  | 
| Guido van Rossum | e7b146f | 2000-02-04 15:28:42 +0000 | [diff] [blame] | 13 |     distributions on the real line: | 
 | 14 |     ------------------------------ | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 15 |            uniform | 
| Christian Heimes | fe337bf | 2008-03-23 21:54:12 +0000 | [diff] [blame] | 16 |            triangular | 
| Guido van Rossum | e7b146f | 2000-02-04 15:28:42 +0000 | [diff] [blame] | 17 |            normal (Gaussian) | 
 | 18 |            lognormal | 
 | 19 |            negative exponential | 
 | 20 |            gamma | 
 | 21 |            beta | 
| Raymond Hettinger | 40f6217 | 2002-12-29 23:03:38 +0000 | [diff] [blame] | 22 |            pareto | 
 | 23 |            Weibull | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 24 |  | 
| Guido van Rossum | e7b146f | 2000-02-04 15:28:42 +0000 | [diff] [blame] | 25 |     distributions on the circle (angles 0 to 2pi) | 
 | 26 |     --------------------------------------------- | 
 | 27 |            circular uniform | 
 | 28 |            von Mises | 
 | 29 |  | 
| Raymond Hettinger | 40f6217 | 2002-12-29 23:03:38 +0000 | [diff] [blame] | 30 | General notes on the underlying Mersenne Twister core generator: | 
| Guido van Rossum | e7b146f | 2000-02-04 15:28:42 +0000 | [diff] [blame] | 31 |  | 
| Raymond Hettinger | 40f6217 | 2002-12-29 23:03:38 +0000 | [diff] [blame] | 32 | * The period is 2**19937-1. | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 33 | * It is one of the most extensively tested generators in existence. | 
| Thomas Wouters | 0e3f591 | 2006-08-11 14:57:12 +0000 | [diff] [blame] | 34 | * The random() method is implemented in C, executes in a single Python step, | 
 | 35 |   and is, therefore, threadsafe. | 
| Tim Peters | e360d95 | 2001-01-26 10:00:39 +0000 | [diff] [blame] | 36 |  | 
| Guido van Rossum | e7b146f | 2000-02-04 15:28:42 +0000 | [diff] [blame] | 37 | """ | 
| Guido van Rossum | d03e119 | 1998-05-29 17:51:31 +0000 | [diff] [blame] | 38 |  | 
| Christian Heimes | fe337bf | 2008-03-23 21:54:12 +0000 | [diff] [blame] | 39 | from __future__ import division | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 40 | from warnings import warn as _warn | 
 | 41 | from types import MethodType as _MethodType, BuiltinMethodType as _BuiltinMethodType | 
| Raymond Hettinger | 91e27c2 | 2005-08-19 01:36:35 +0000 | [diff] [blame] | 42 | from math import log as _log, exp as _exp, pi as _pi, e as _e, ceil as _ceil | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 43 | from math import sqrt as _sqrt, acos as _acos, cos as _cos, sin as _sin | 
| Raymond Hettinger | c1c43ca | 2004-09-05 00:00:42 +0000 | [diff] [blame] | 44 | from os import urandom as _urandom | 
 | 45 | from binascii import hexlify as _hexlify | 
| Raymond Hettinger | 886687d | 2009-02-24 11:27:15 +0000 | [diff] [blame] | 46 | import collections as _collections | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 47 |  | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 48 | __all__ = ["Random","seed","random","uniform","randint","choice","sample", | 
| Skip Montanaro | 0de6580 | 2001-02-15 22:15:14 +0000 | [diff] [blame] | 49 |            "randrange","shuffle","normalvariate","lognormvariate", | 
| Christian Heimes | fe337bf | 2008-03-23 21:54:12 +0000 | [diff] [blame] | 50 |            "expovariate","vonmisesvariate","gammavariate","triangular", | 
| Raymond Hettinger | f8a52d3 | 2003-08-05 12:23:19 +0000 | [diff] [blame] | 51 |            "gauss","betavariate","paretovariate","weibullvariate", | 
| Raymond Hettinger | 28de64f | 2008-01-13 23:40:30 +0000 | [diff] [blame] | 52 |            "getstate","setstate", "getrandbits", | 
| Raymond Hettinger | 23f1241 | 2004-09-13 22:23:21 +0000 | [diff] [blame] | 53 |            "SystemRandom"] | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 54 |  | 
 | 55 | NV_MAGICCONST = 4 * _exp(-0.5)/_sqrt(2.0) | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 56 | TWOPI = 2.0*_pi | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 57 | LOG4 = _log(4.0) | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 58 | SG_MAGICCONST = 1.0 + _log(4.5) | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 59 | BPF = 53        # Number of bits in a float | 
| Tim Peters | 7c2a85b | 2004-08-31 02:19:55 +0000 | [diff] [blame] | 60 | RECIP_BPF = 2**-BPF | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 61 |  | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 62 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 63 | # Translated by Guido van Rossum from C source provided by | 
| Raymond Hettinger | 40f6217 | 2002-12-29 23:03:38 +0000 | [diff] [blame] | 64 | # Adrian Baddeley.  Adapted by Raymond Hettinger for use with | 
| Raymond Hettinger | 3fa19d7 | 2004-08-31 01:05:15 +0000 | [diff] [blame] | 65 | # the Mersenne Twister  and os.urandom() core generators. | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 66 |  | 
| Raymond Hettinger | 145a4a0 | 2003-01-07 10:25:55 +0000 | [diff] [blame] | 67 | import _random | 
| Raymond Hettinger | 40f6217 | 2002-12-29 23:03:38 +0000 | [diff] [blame] | 68 |  | 
| Raymond Hettinger | 145a4a0 | 2003-01-07 10:25:55 +0000 | [diff] [blame] | 69 | class Random(_random.Random): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 70 |     """Random number generator base class used by bound module functions. | 
 | 71 |  | 
 | 72 |     Used to instantiate instances of Random to get generators that don't | 
| Raymond Hettinger | 28de64f | 2008-01-13 23:40:30 +0000 | [diff] [blame] | 73 |     share state. | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 74 |  | 
 | 75 |     Class Random can also be subclassed if you want to use a different basic | 
 | 76 |     generator of your own devising: in that case, override the following | 
| Raymond Hettinger | 28de64f | 2008-01-13 23:40:30 +0000 | [diff] [blame] | 77 |     methods:  random(), seed(), getstate(), and setstate(). | 
| Benjamin Peterson | d18de0e | 2008-07-31 20:21:46 +0000 | [diff] [blame] | 78 |     Optionally, implement a getrandbits() method so that randrange() | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 79 |     can cover arbitrarily large ranges. | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 80 |  | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 81 |     """ | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 82 |  | 
| Christian Heimes | cbf3b5c | 2007-12-03 21:02:03 +0000 | [diff] [blame] | 83 |     VERSION = 3     # used by getstate/setstate | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 84 |  | 
 | 85 |     def __init__(self, x=None): | 
 | 86 |         """Initialize an instance. | 
 | 87 |  | 
 | 88 |         Optional argument x controls seeding, as for Random.seed(). | 
 | 89 |         """ | 
 | 90 |  | 
 | 91 |         self.seed(x) | 
| Raymond Hettinger | 40f6217 | 2002-12-29 23:03:38 +0000 | [diff] [blame] | 92 |         self.gauss_next = None | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 93 |  | 
| Tim Peters | 0de88fc | 2001-02-01 04:59:18 +0000 | [diff] [blame] | 94 |     def seed(self, a=None): | 
 | 95 |         """Initialize internal state from hashable object. | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 96 |  | 
| Raymond Hettinger | 23f1241 | 2004-09-13 22:23:21 +0000 | [diff] [blame] | 97 |         None or no argument seeds from current time or from an operating | 
 | 98 |         system specific randomness source if available. | 
| Tim Peters | 0de88fc | 2001-02-01 04:59:18 +0000 | [diff] [blame] | 99 |  | 
| Mark Dickinson | 5c2db37 | 2009-12-05 20:28:34 +0000 | [diff] [blame] | 100 |         If a is not None or an int, hash(a) is used instead. | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 101 |         """ | 
 | 102 |  | 
| Raymond Hettinger | 3081d59 | 2003-08-09 18:30:57 +0000 | [diff] [blame] | 103 |         if a is None: | 
| Raymond Hettinger | c1c43ca | 2004-09-05 00:00:42 +0000 | [diff] [blame] | 104 |             try: | 
| Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 105 |                 a = int(_hexlify(_urandom(16)), 16) | 
| Raymond Hettinger | c1c43ca | 2004-09-05 00:00:42 +0000 | [diff] [blame] | 106 |             except NotImplementedError: | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 107 |                 import time | 
| Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 108 |                 a = int(time.time() * 256) # use fractional seconds | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 109 |  | 
| Guido van Rossum | cd16bf6 | 2007-06-13 18:07:49 +0000 | [diff] [blame] | 110 |         super().seed(a) | 
| Tim Peters | 46c04e1 | 2002-05-05 20:40:00 +0000 | [diff] [blame] | 111 |         self.gauss_next = None | 
 | 112 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 113 |     def getstate(self): | 
 | 114 |         """Return internal state; can be passed to setstate() later.""" | 
| Guido van Rossum | cd16bf6 | 2007-06-13 18:07:49 +0000 | [diff] [blame] | 115 |         return self.VERSION, super().getstate(), self.gauss_next | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 116 |  | 
 | 117 |     def setstate(self, state): | 
 | 118 |         """Restore internal state from object returned by getstate().""" | 
 | 119 |         version = state[0] | 
| Christian Heimes | cbf3b5c | 2007-12-03 21:02:03 +0000 | [diff] [blame] | 120 |         if version == 3: | 
| Raymond Hettinger | 40f6217 | 2002-12-29 23:03:38 +0000 | [diff] [blame] | 121 |             version, internalstate, self.gauss_next = state | 
| Guido van Rossum | cd16bf6 | 2007-06-13 18:07:49 +0000 | [diff] [blame] | 122 |             super().setstate(internalstate) | 
| Christian Heimes | cbf3b5c | 2007-12-03 21:02:03 +0000 | [diff] [blame] | 123 |         elif version == 2: | 
 | 124 |             version, internalstate, self.gauss_next = state | 
 | 125 |             # In version 2, the state was saved as signed ints, which causes | 
 | 126 |             #   inconsistencies between 32/64-bit systems. The state is | 
 | 127 |             #   really unsigned 32-bit ints, so we convert negative ints from | 
 | 128 |             #   version 2 to positive longs for version 3. | 
 | 129 |             try: | 
 | 130 |                 internalstate = tuple( x % (2**32) for x in internalstate ) | 
 | 131 |             except ValueError as e: | 
 | 132 |                 raise TypeError from e | 
 | 133 |             super(Random, self).setstate(internalstate) | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 134 |         else: | 
 | 135 |             raise ValueError("state with version %s passed to " | 
 | 136 |                              "Random.setstate() of version %s" % | 
 | 137 |                              (version, self.VERSION)) | 
 | 138 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 139 | ## ---- Methods below this point do not need to be overridden when | 
 | 140 | ## ---- subclassing for the purpose of using a different core generator. | 
 | 141 |  | 
 | 142 | ## -------------------- pickle support  ------------------- | 
 | 143 |  | 
 | 144 |     def __getstate__(self): # for pickle | 
 | 145 |         return self.getstate() | 
 | 146 |  | 
 | 147 |     def __setstate__(self, state):  # for pickle | 
 | 148 |         self.setstate(state) | 
 | 149 |  | 
| Raymond Hettinger | 5f078ff | 2003-06-24 20:29:04 +0000 | [diff] [blame] | 150 |     def __reduce__(self): | 
 | 151 |         return self.__class__, (), self.getstate() | 
 | 152 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 153 | ## -------------------- integer methods  ------------------- | 
 | 154 |  | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 155 |     def randrange(self, start, stop=None, step=1, int=int, default=None, | 
| Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 156 |                   maxwidth=1<<BPF): | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 157 |         """Choose a random item from range(start, stop[, step]). | 
 | 158 |  | 
 | 159 |         This fixes the problem with randint() which includes the | 
 | 160 |         endpoint; in Python this is usually not what you want. | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 161 |         Do not supply the 'int', 'default', and 'maxwidth' arguments. | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 162 |         """ | 
 | 163 |  | 
 | 164 |         # This code is a bit messy to make it fast for the | 
| Tim Peters | 9146f27 | 2002-08-16 03:41:39 +0000 | [diff] [blame] | 165 |         # common case while still doing adequate error checking. | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 166 |         istart = int(start) | 
 | 167 |         if istart != start: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 168 |             raise ValueError("non-integer arg 1 for randrange()") | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 169 |         if stop is default: | 
 | 170 |             if istart > 0: | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 171 |                 if istart >= maxwidth: | 
 | 172 |                     return self._randbelow(istart) | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 173 |                 return int(self.random() * istart) | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 174 |             raise ValueError("empty range for randrange()") | 
| Tim Peters | 9146f27 | 2002-08-16 03:41:39 +0000 | [diff] [blame] | 175 |  | 
 | 176 |         # stop argument supplied. | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 177 |         istop = int(stop) | 
 | 178 |         if istop != stop: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 179 |             raise ValueError("non-integer stop for randrange()") | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 180 |         width = istop - istart | 
 | 181 |         if step == 1 and width > 0: | 
| Tim Peters | 76ca1d4 | 2003-06-19 03:46:46 +0000 | [diff] [blame] | 182 |             # Note that | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 183 |             #     int(istart + self.random()*width) | 
| Tim Peters | 76ca1d4 | 2003-06-19 03:46:46 +0000 | [diff] [blame] | 184 |             # instead would be incorrect.  For example, consider istart | 
 | 185 |             # = -2 and istop = 0.  Then the guts would be in | 
 | 186 |             # -2.0 to 0.0 exclusive on both ends (ignoring that random() | 
 | 187 |             # might return 0.0), and because int() truncates toward 0, the | 
 | 188 |             # final result would be -1 or 0 (instead of -2 or -1). | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 189 |             #     istart + int(self.random()*width) | 
| Tim Peters | 76ca1d4 | 2003-06-19 03:46:46 +0000 | [diff] [blame] | 190 |             # would also be incorrect, for a subtler reason:  the RHS | 
 | 191 |             # can return a long, and then randrange() would also return | 
 | 192 |             # a long, but we're supposed to return an int (for backward | 
 | 193 |             # compatibility). | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 194 |  | 
 | 195 |             if width >= maxwidth: | 
| Tim Peters | 58eb11c | 2004-01-18 20:29:55 +0000 | [diff] [blame] | 196 |                 return int(istart + self._randbelow(width)) | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 197 |             return int(istart + int(self.random()*width)) | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 198 |         if step == 1: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 199 |             raise ValueError("empty range for randrange() (%d,%d, %d)" % (istart, istop, width)) | 
| Tim Peters | 9146f27 | 2002-08-16 03:41:39 +0000 | [diff] [blame] | 200 |  | 
 | 201 |         # Non-unit step argument supplied. | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 202 |         istep = int(step) | 
 | 203 |         if istep != step: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 204 |             raise ValueError("non-integer step for randrange()") | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 205 |         if istep > 0: | 
| Raymond Hettinger | ffdb8bb | 2004-09-27 15:29:05 +0000 | [diff] [blame] | 206 |             n = (width + istep - 1) // istep | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 207 |         elif istep < 0: | 
| Raymond Hettinger | ffdb8bb | 2004-09-27 15:29:05 +0000 | [diff] [blame] | 208 |             n = (width + istep + 1) // istep | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 209 |         else: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 210 |             raise ValueError("zero step for randrange()") | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 211 |  | 
 | 212 |         if n <= 0: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 213 |             raise ValueError("empty range for randrange()") | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 214 |  | 
 | 215 |         if n >= maxwidth: | 
| Thomas Wouters | 902d6eb | 2007-01-09 23:18:33 +0000 | [diff] [blame] | 216 |             return istart + istep*self._randbelow(n) | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 217 |         return istart + istep*int(self.random() * n) | 
 | 218 |  | 
 | 219 |     def randint(self, a, b): | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 220 |         """Return random integer in range [a, b], including both end points. | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 221 |         """ | 
 | 222 |  | 
 | 223 |         return self.randrange(a, b+1) | 
 | 224 |  | 
| Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 225 |     def _randbelow(self, n, _log=_log, int=int, _maxwidth=1<<BPF, | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 226 |                    _Method=_MethodType, _BuiltinMethod=_BuiltinMethodType): | 
 | 227 |         """Return a random int in the range [0,n) | 
 | 228 |  | 
 | 229 |         Handles the case where n has more bits than returned | 
 | 230 |         by a single call to the underlying generator. | 
 | 231 |         """ | 
 | 232 |  | 
 | 233 |         try: | 
 | 234 |             getrandbits = self.getrandbits | 
 | 235 |         except AttributeError: | 
 | 236 |             pass | 
 | 237 |         else: | 
 | 238 |             # Only call self.getrandbits if the original random() builtin method | 
 | 239 |             # has not been overridden or if a new getrandbits() was supplied. | 
 | 240 |             # This assures that the two methods correspond. | 
 | 241 |             if type(self.random) is _BuiltinMethod or type(getrandbits) is _Method: | 
 | 242 |                 k = int(1.00001 + _log(n-1, 2.0))   # 2**k > n-1 > 2**(k-2) | 
 | 243 |                 r = getrandbits(k) | 
 | 244 |                 while r >= n: | 
 | 245 |                     r = getrandbits(k) | 
 | 246 |                 return r | 
 | 247 |         if n >= _maxwidth: | 
 | 248 |             _warn("Underlying random() generator does not supply \n" | 
 | 249 |                 "enough bits to choose from a population range this large") | 
 | 250 |         return int(self.random() * n) | 
 | 251 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 252 | ## -------------------- sequence methods  ------------------- | 
 | 253 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 254 |     def choice(self, seq): | 
 | 255 |         """Choose a random element from a non-empty sequence.""" | 
| Raymond Hettinger | 5dae505 | 2004-06-07 02:07:15 +0000 | [diff] [blame] | 256 |         return seq[int(self.random() * len(seq))]  # raises IndexError if seq is empty | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 257 |  | 
 | 258 |     def shuffle(self, x, random=None, int=int): | 
 | 259 |         """x, random=random.random -> shuffle list x in place; return None. | 
 | 260 |  | 
 | 261 |         Optional arg random is a 0-argument function returning a random | 
 | 262 |         float in [0.0, 1.0); by default, the standard random.random. | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 263 |         """ | 
 | 264 |  | 
 | 265 |         if random is None: | 
 | 266 |             random = self.random | 
| Guido van Rossum | 805365e | 2007-05-07 22:24:25 +0000 | [diff] [blame] | 267 |         for i in reversed(range(1, len(x))): | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 268 |             # pick an element in x[:i+1] with which to exchange x[i] | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 269 |             j = int(random() * (i+1)) | 
 | 270 |             x[i], x[j] = x[j], x[i] | 
 | 271 |  | 
| Raymond Hettinger | fdbe522 | 2003-06-13 07:01:51 +0000 | [diff] [blame] | 272 |     def sample(self, population, k): | 
| Raymond Hettinger | 1acde19 | 2008-01-14 01:00:53 +0000 | [diff] [blame] | 273 |         """Chooses k unique random elements from a population sequence or set. | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 274 |  | 
| Raymond Hettinger | c0b4034 | 2002-11-13 15:26:37 +0000 | [diff] [blame] | 275 |         Returns a new list containing elements from the population while | 
 | 276 |         leaving the original population unchanged.  The resulting list is | 
 | 277 |         in selection order so that all sub-slices will also be valid random | 
 | 278 |         samples.  This allows raffle winners (the sample) to be partitioned | 
 | 279 |         into grand prize and second place winners (the subslices). | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 280 |  | 
| Raymond Hettinger | c0b4034 | 2002-11-13 15:26:37 +0000 | [diff] [blame] | 281 |         Members of the population need not be hashable or unique.  If the | 
 | 282 |         population contains repeats, then each occurrence is a possible | 
 | 283 |         selection in the sample. | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 284 |  | 
| Guido van Rossum | 805365e | 2007-05-07 22:24:25 +0000 | [diff] [blame] | 285 |         To choose a sample in a range of integers, use range as an argument. | 
| Raymond Hettinger | c0b4034 | 2002-11-13 15:26:37 +0000 | [diff] [blame] | 286 |         This is especially fast and space efficient for sampling from a | 
| Guido van Rossum | 805365e | 2007-05-07 22:24:25 +0000 | [diff] [blame] | 287 |         large population:   sample(range(10000000), 60) | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 288 |         """ | 
 | 289 |  | 
| Raymond Hettinger | c0b4034 | 2002-11-13 15:26:37 +0000 | [diff] [blame] | 290 |         # Sampling without replacement entails tracking either potential | 
| Raymond Hettinger | 91e27c2 | 2005-08-19 01:36:35 +0000 | [diff] [blame] | 291 |         # selections (the pool) in a list or previous selections in a set. | 
| Raymond Hettinger | c0b4034 | 2002-11-13 15:26:37 +0000 | [diff] [blame] | 292 |  | 
| Jeremy Hylton | 2b55d35 | 2004-02-23 17:27:57 +0000 | [diff] [blame] | 293 |         # When the number of selections is small compared to the | 
 | 294 |         # population, then tracking selections is efficient, requiring | 
| Raymond Hettinger | 91e27c2 | 2005-08-19 01:36:35 +0000 | [diff] [blame] | 295 |         # only a small set and an occasional reselection.  For | 
| Jeremy Hylton | 2b55d35 | 2004-02-23 17:27:57 +0000 | [diff] [blame] | 296 |         # a larger number of selections, the pool tracking method is | 
 | 297 |         # preferred since the list takes less space than the | 
| Raymond Hettinger | 91e27c2 | 2005-08-19 01:36:35 +0000 | [diff] [blame] | 298 |         # set and it doesn't suffer from frequent reselections. | 
| Raymond Hettinger | c0b4034 | 2002-11-13 15:26:37 +0000 | [diff] [blame] | 299 |  | 
| Raymond Hettinger | 886687d | 2009-02-24 11:27:15 +0000 | [diff] [blame] | 300 |         if isinstance(population, _collections.Set): | 
| Raymond Hettinger | 1acde19 | 2008-01-14 01:00:53 +0000 | [diff] [blame] | 301 |             population = tuple(population) | 
| Raymond Hettinger | 886687d | 2009-02-24 11:27:15 +0000 | [diff] [blame] | 302 |         if not isinstance(population, _collections.Sequence): | 
 | 303 |             raise TypeError("Population must be a sequence or Set.  For dicts, use list(d).") | 
| Raymond Hettinger | 1acde19 | 2008-01-14 01:00:53 +0000 | [diff] [blame] | 304 |         random = self.random | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 305 |         n = len(population) | 
 | 306 |         if not 0 <= k <= n: | 
| Raymond Hettinger | 1acde19 | 2008-01-14 01:00:53 +0000 | [diff] [blame] | 307 |             raise ValueError("Sample larger than population") | 
| Raymond Hettinger | fdbe522 | 2003-06-13 07:01:51 +0000 | [diff] [blame] | 308 |         _int = int | 
| Raymond Hettinger | c0b4034 | 2002-11-13 15:26:37 +0000 | [diff] [blame] | 309 |         result = [None] * k | 
| Raymond Hettinger | 91e27c2 | 2005-08-19 01:36:35 +0000 | [diff] [blame] | 310 |         setsize = 21        # size of a small set minus size of an empty list | 
 | 311 |         if k > 5: | 
| Tim Peters | 9e34c04 | 2005-08-26 15:20:46 +0000 | [diff] [blame] | 312 |             setsize += 4 ** _ceil(_log(k * 3, 4)) # table size for big sets | 
| Raymond Hettinger | 1acde19 | 2008-01-14 01:00:53 +0000 | [diff] [blame] | 313 |         if n <= setsize: | 
 | 314 |             # An n-length list is smaller than a k-length set | 
| Raymond Hettinger | 311f419 | 2002-11-18 09:01:24 +0000 | [diff] [blame] | 315 |             pool = list(population) | 
| Guido van Rossum | 805365e | 2007-05-07 22:24:25 +0000 | [diff] [blame] | 316 |             for i in range(k):         # invariant:  non-selected at [0,n-i) | 
| Raymond Hettinger | fdbe522 | 2003-06-13 07:01:51 +0000 | [diff] [blame] | 317 |                 j = _int(random() * (n-i)) | 
| Raymond Hettinger | 311f419 | 2002-11-18 09:01:24 +0000 | [diff] [blame] | 318 |                 result[i] = pool[j] | 
| Raymond Hettinger | 8b9aa8d | 2003-01-04 05:20:33 +0000 | [diff] [blame] | 319 |                 pool[j] = pool[n-i-1]   # move non-selected item into vacancy | 
| Raymond Hettinger | c0b4034 | 2002-11-13 15:26:37 +0000 | [diff] [blame] | 320 |         else: | 
| Raymond Hettinger | 1acde19 | 2008-01-14 01:00:53 +0000 | [diff] [blame] | 321 |             selected = set() | 
 | 322 |             selected_add = selected.add | 
 | 323 |             for i in range(k): | 
 | 324 |                 j = _int(random() * n) | 
 | 325 |                 while j in selected: | 
| Raymond Hettinger | fdbe522 | 2003-06-13 07:01:51 +0000 | [diff] [blame] | 326 |                     j = _int(random() * n) | 
| Raymond Hettinger | 1acde19 | 2008-01-14 01:00:53 +0000 | [diff] [blame] | 327 |                 selected_add(j) | 
 | 328 |                 result[i] = population[j] | 
| Raymond Hettinger | 311f419 | 2002-11-18 09:01:24 +0000 | [diff] [blame] | 329 |         return result | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 330 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 331 | ## -------------------- real-valued distributions  ------------------- | 
 | 332 |  | 
 | 333 | ## -------------------- uniform distribution ------------------- | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 334 |  | 
 | 335 |     def uniform(self, a, b): | 
| Raymond Hettinger | be40db0 | 2009-06-11 23:12:14 +0000 | [diff] [blame] | 336 |         "Get a random number in the range [a, b) or [a, b] depending on rounding." | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 337 |         return a + (b-a) * self.random() | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 338 |  | 
| Christian Heimes | fe337bf | 2008-03-23 21:54:12 +0000 | [diff] [blame] | 339 | ## -------------------- triangular -------------------- | 
 | 340 |  | 
 | 341 |     def triangular(self, low=0.0, high=1.0, mode=None): | 
 | 342 |         """Triangular distribution. | 
 | 343 |  | 
 | 344 |         Continuous distribution bounded by given lower and upper limits, | 
 | 345 |         and having a given mode value in-between. | 
 | 346 |  | 
 | 347 |         http://en.wikipedia.org/wiki/Triangular_distribution | 
 | 348 |  | 
 | 349 |         """ | 
 | 350 |         u = self.random() | 
 | 351 |         c = 0.5 if mode is None else (mode - low) / (high - low) | 
 | 352 |         if u > c: | 
 | 353 |             u = 1.0 - u | 
 | 354 |             c = 1.0 - c | 
 | 355 |             low, high = high, low | 
 | 356 |         return low + (high - low) * (u * c) ** 0.5 | 
 | 357 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 358 | ## -------------------- normal distribution -------------------- | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 359 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 360 |     def normalvariate(self, mu, sigma): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 361 |         """Normal distribution. | 
 | 362 |  | 
 | 363 |         mu is the mean, and sigma is the standard deviation. | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 364 |  | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 365 |         """ | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 366 |         # mu = mean, sigma = standard deviation | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 367 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 368 |         # Uses Kinderman and Monahan method. Reference: Kinderman, | 
 | 369 |         # A.J. and Monahan, J.F., "Computer generation of random | 
 | 370 |         # variables using the ratio of uniform deviates", ACM Trans | 
 | 371 |         # Math Software, 3, (1977), pp257-260. | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 372 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 373 |         random = self.random | 
| Raymond Hettinger | 42406e6 | 2005-04-30 09:02:51 +0000 | [diff] [blame] | 374 |         while 1: | 
| Tim Peters | 0c9886d | 2001-01-15 01:18:21 +0000 | [diff] [blame] | 375 |             u1 = random() | 
| Raymond Hettinger | 73ced7e | 2003-01-04 09:26:32 +0000 | [diff] [blame] | 376 |             u2 = 1.0 - random() | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 377 |             z = NV_MAGICCONST*(u1-0.5)/u2 | 
 | 378 |             zz = z*z/4.0 | 
 | 379 |             if zz <= -_log(u2): | 
 | 380 |                 break | 
 | 381 |         return mu + z*sigma | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 382 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 383 | ## -------------------- lognormal distribution -------------------- | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 384 |  | 
 | 385 |     def lognormvariate(self, mu, sigma): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 386 |         """Log normal distribution. | 
 | 387 |  | 
 | 388 |         If you take the natural logarithm of this distribution, you'll get a | 
 | 389 |         normal distribution with mean mu and standard deviation sigma. | 
 | 390 |         mu can have any value, and sigma must be greater than zero. | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 391 |  | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 392 |         """ | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 393 |         return _exp(self.normalvariate(mu, sigma)) | 
 | 394 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 395 | ## -------------------- exponential distribution -------------------- | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 396 |  | 
 | 397 |     def expovariate(self, lambd): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 398 |         """Exponential distribution. | 
 | 399 |  | 
| Mark Dickinson | 2f94736 | 2009-01-07 17:54:07 +0000 | [diff] [blame] | 400 |         lambd is 1.0 divided by the desired mean.  It should be | 
 | 401 |         nonzero.  (The parameter would be called "lambda", but that is | 
 | 402 |         a reserved word in Python.)  Returned values range from 0 to | 
 | 403 |         positive infinity if lambd is positive, and from negative | 
 | 404 |         infinity to 0 if lambd is negative. | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 405 |  | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 406 |         """ | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 407 |         # lambd: rate lambd = 1/mean | 
 | 408 |         # ('lambda' is a Python reserved word) | 
 | 409 |  | 
 | 410 |         random = self.random | 
| Tim Peters | 0c9886d | 2001-01-15 01:18:21 +0000 | [diff] [blame] | 411 |         u = random() | 
 | 412 |         while u <= 1e-7: | 
 | 413 |             u = random() | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 414 |         return -_log(u)/lambd | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 415 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 416 | ## -------------------- von Mises distribution -------------------- | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 417 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 418 |     def vonmisesvariate(self, mu, kappa): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 419 |         """Circular data distribution. | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 420 |  | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 421 |         mu is the mean angle, expressed in radians between 0 and 2*pi, and | 
 | 422 |         kappa is the concentration parameter, which must be greater than or | 
 | 423 |         equal to zero.  If kappa is equal to zero, this distribution reduces | 
 | 424 |         to a uniform random angle over the range 0 to 2*pi. | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 425 |  | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 426 |         """ | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 427 |         # mu:    mean angle (in radians between 0 and 2*pi) | 
 | 428 |         # kappa: concentration parameter kappa (>= 0) | 
 | 429 |         # if kappa = 0 generate uniform random angle | 
 | 430 |  | 
 | 431 |         # Based upon an algorithm published in: Fisher, N.I., | 
 | 432 |         # "Statistical Analysis of Circular Data", Cambridge | 
 | 433 |         # University Press, 1993. | 
 | 434 |  | 
 | 435 |         # Thanks to Magnus Kessler for a correction to the | 
 | 436 |         # implementation of step 4. | 
 | 437 |  | 
 | 438 |         random = self.random | 
 | 439 |         if kappa <= 1e-6: | 
 | 440 |             return TWOPI * random() | 
 | 441 |  | 
 | 442 |         a = 1.0 + _sqrt(1.0 + 4.0 * kappa * kappa) | 
 | 443 |         b = (a - _sqrt(2.0 * a))/(2.0 * kappa) | 
 | 444 |         r = (1.0 + b * b)/(2.0 * b) | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 445 |  | 
| Raymond Hettinger | 42406e6 | 2005-04-30 09:02:51 +0000 | [diff] [blame] | 446 |         while 1: | 
| Tim Peters | 0c9886d | 2001-01-15 01:18:21 +0000 | [diff] [blame] | 447 |             u1 = random() | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 448 |  | 
 | 449 |             z = _cos(_pi * u1) | 
 | 450 |             f = (1.0 + r * z)/(r + z) | 
 | 451 |             c = kappa * (r - f) | 
 | 452 |  | 
 | 453 |             u2 = random() | 
 | 454 |  | 
| Raymond Hettinger | 42406e6 | 2005-04-30 09:02:51 +0000 | [diff] [blame] | 455 |             if u2 < c * (2.0 - c) or u2 <= c * _exp(1.0 - c): | 
| Tim Peters | 0c9886d | 2001-01-15 01:18:21 +0000 | [diff] [blame] | 456 |                 break | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 457 |  | 
 | 458 |         u3 = random() | 
 | 459 |         if u3 > 0.5: | 
 | 460 |             theta = (mu % TWOPI) + _acos(f) | 
 | 461 |         else: | 
 | 462 |             theta = (mu % TWOPI) - _acos(f) | 
 | 463 |  | 
 | 464 |         return theta | 
 | 465 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 466 | ## -------------------- gamma distribution -------------------- | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 467 |  | 
 | 468 |     def gammavariate(self, alpha, beta): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 469 |         """Gamma distribution.  Not the gamma function! | 
 | 470 |  | 
 | 471 |         Conditions on the parameters are alpha > 0 and beta > 0. | 
 | 472 |  | 
 | 473 |         """ | 
| Tim Peters | 8ac1495 | 2002-05-23 15:15:30 +0000 | [diff] [blame] | 474 |  | 
| Raymond Hettinger | b760efb | 2002-05-14 06:40:34 +0000 | [diff] [blame] | 475 |         # alpha > 0, beta > 0, mean is alpha*beta, variance is alpha*beta**2 | 
| Tim Peters | 8ac1495 | 2002-05-23 15:15:30 +0000 | [diff] [blame] | 476 |  | 
| Guido van Rossum | 570764d | 2002-05-14 14:08:12 +0000 | [diff] [blame] | 477 |         # Warning: a few older sources define the gamma distribution in terms | 
 | 478 |         # of alpha > -1.0 | 
 | 479 |         if alpha <= 0.0 or beta <= 0.0: | 
| Collin Winter | ce36ad8 | 2007-08-30 01:19:48 +0000 | [diff] [blame] | 480 |             raise ValueError('gammavariate: alpha and beta must be > 0.0') | 
| Tim Peters | 8ac1495 | 2002-05-23 15:15:30 +0000 | [diff] [blame] | 481 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 482 |         random = self.random | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 483 |         if alpha > 1.0: | 
 | 484 |  | 
 | 485 |             # Uses R.C.H. Cheng, "The generation of Gamma | 
 | 486 |             # variables with non-integral shape parameters", | 
 | 487 |             # Applied Statistics, (1977), 26, No. 1, p71-74 | 
 | 488 |  | 
| Raymond Hettinger | ca6cdc2 | 2002-05-13 23:40:14 +0000 | [diff] [blame] | 489 |             ainv = _sqrt(2.0 * alpha - 1.0) | 
 | 490 |             bbb = alpha - LOG4 | 
 | 491 |             ccc = alpha + ainv | 
| Tim Peters | 8ac1495 | 2002-05-23 15:15:30 +0000 | [diff] [blame] | 492 |  | 
| Raymond Hettinger | 42406e6 | 2005-04-30 09:02:51 +0000 | [diff] [blame] | 493 |             while 1: | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 494 |                 u1 = random() | 
| Raymond Hettinger | 73ced7e | 2003-01-04 09:26:32 +0000 | [diff] [blame] | 495 |                 if not 1e-7 < u1 < .9999999: | 
 | 496 |                     continue | 
 | 497 |                 u2 = 1.0 - random() | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 498 |                 v = _log(u1/(1.0-u1))/ainv | 
 | 499 |                 x = alpha*_exp(v) | 
 | 500 |                 z = u1*u1*u2 | 
 | 501 |                 r = bbb+ccc*v-x | 
 | 502 |                 if r + SG_MAGICCONST - 4.5*z >= 0.0 or r >= _log(z): | 
| Raymond Hettinger | b760efb | 2002-05-14 06:40:34 +0000 | [diff] [blame] | 503 |                     return x * beta | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 504 |  | 
 | 505 |         elif alpha == 1.0: | 
 | 506 |             # expovariate(1) | 
 | 507 |             u = random() | 
 | 508 |             while u <= 1e-7: | 
 | 509 |                 u = random() | 
| Raymond Hettinger | b760efb | 2002-05-14 06:40:34 +0000 | [diff] [blame] | 510 |             return -_log(u) * beta | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 511 |  | 
 | 512 |         else:   # alpha is between 0 and 1 (exclusive) | 
 | 513 |  | 
 | 514 |             # Uses ALGORITHM GS of Statistical Computing - Kennedy & Gentle | 
 | 515 |  | 
| Raymond Hettinger | 42406e6 | 2005-04-30 09:02:51 +0000 | [diff] [blame] | 516 |             while 1: | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 517 |                 u = random() | 
 | 518 |                 b = (_e + alpha)/_e | 
 | 519 |                 p = b*u | 
 | 520 |                 if p <= 1.0: | 
| Raymond Hettinger | 42406e6 | 2005-04-30 09:02:51 +0000 | [diff] [blame] | 521 |                     x = p ** (1.0/alpha) | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 522 |                 else: | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 523 |                     x = -_log((b-p)/alpha) | 
 | 524 |                 u1 = random() | 
| Raymond Hettinger | 42406e6 | 2005-04-30 09:02:51 +0000 | [diff] [blame] | 525 |                 if p > 1.0: | 
 | 526 |                     if u1 <= x ** (alpha - 1.0): | 
 | 527 |                         break | 
 | 528 |                 elif u1 <= _exp(-x): | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 529 |                     break | 
| Raymond Hettinger | b760efb | 2002-05-14 06:40:34 +0000 | [diff] [blame] | 530 |             return x * beta | 
 | 531 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 532 | ## -------------------- Gauss (faster alternative) -------------------- | 
| Guido van Rossum | 95bfcda | 1994-03-09 14:21:05 +0000 | [diff] [blame] | 533 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 534 |     def gauss(self, mu, sigma): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 535 |         """Gaussian distribution. | 
 | 536 |  | 
 | 537 |         mu is the mean, and sigma is the standard deviation.  This is | 
 | 538 |         slightly faster than the normalvariate() function. | 
 | 539 |  | 
 | 540 |         Not thread-safe without a lock around calls. | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 541 |  | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 542 |         """ | 
| Guido van Rossum | cc32ac9 | 1994-03-15 16:10:24 +0000 | [diff] [blame] | 543 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 544 |         # When x and y are two variables from [0, 1), uniformly | 
 | 545 |         # distributed, then | 
 | 546 |         # | 
 | 547 |         #    cos(2*pi*x)*sqrt(-2*log(1-y)) | 
 | 548 |         #    sin(2*pi*x)*sqrt(-2*log(1-y)) | 
 | 549 |         # | 
 | 550 |         # are two *independent* variables with normal distribution | 
 | 551 |         # (mu = 0, sigma = 1). | 
 | 552 |         # (Lambert Meertens) | 
 | 553 |         # (corrected version; bug discovered by Mike Miller, fixed by LM) | 
| Guido van Rossum | cc32ac9 | 1994-03-15 16:10:24 +0000 | [diff] [blame] | 554 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 555 |         # Multithreading note: When two threads call this function | 
 | 556 |         # simultaneously, it is possible that they will receive the | 
 | 557 |         # same return value.  The window is very small though.  To | 
 | 558 |         # avoid this, you have to use a lock around all calls.  (I | 
 | 559 |         # didn't want to slow this down in the serial case by using a | 
 | 560 |         # lock here.) | 
| Guido van Rossum | d03e119 | 1998-05-29 17:51:31 +0000 | [diff] [blame] | 561 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 562 |         random = self.random | 
 | 563 |         z = self.gauss_next | 
 | 564 |         self.gauss_next = None | 
 | 565 |         if z is None: | 
 | 566 |             x2pi = random() * TWOPI | 
 | 567 |             g2rad = _sqrt(-2.0 * _log(1.0 - random())) | 
 | 568 |             z = _cos(x2pi) * g2rad | 
 | 569 |             self.gauss_next = _sin(x2pi) * g2rad | 
| Guido van Rossum | cc32ac9 | 1994-03-15 16:10:24 +0000 | [diff] [blame] | 570 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 571 |         return mu + z*sigma | 
| Guido van Rossum | 95bfcda | 1994-03-09 14:21:05 +0000 | [diff] [blame] | 572 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 573 | ## -------------------- beta -------------------- | 
| Tim Peters | 85e2e47 | 2001-01-26 06:49:56 +0000 | [diff] [blame] | 574 | ## See | 
 | 575 | ## http://sourceforge.net/bugs/?func=detailbug&bug_id=130030&group_id=5470 | 
 | 576 | ## for Ivan Frohne's insightful analysis of why the original implementation: | 
 | 577 | ## | 
 | 578 | ##    def betavariate(self, alpha, beta): | 
 | 579 | ##        # Discrete Event Simulation in C, pp 87-88. | 
 | 580 | ## | 
 | 581 | ##        y = self.expovariate(alpha) | 
 | 582 | ##        z = self.expovariate(1.0/beta) | 
 | 583 | ##        return z/(y+z) | 
 | 584 | ## | 
 | 585 | ## was dead wrong, and how it probably got that way. | 
| Guido van Rossum | 95bfcda | 1994-03-09 14:21:05 +0000 | [diff] [blame] | 586 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 587 |     def betavariate(self, alpha, beta): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 588 |         """Beta distribution. | 
 | 589 |  | 
| Thomas Wouters | b213704 | 2007-02-01 18:02:27 +0000 | [diff] [blame] | 590 |         Conditions on the parameters are alpha > 0 and beta > 0. | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 591 |         Returned values range between 0 and 1. | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 592 |  | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 593 |         """ | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 594 |  | 
| Tim Peters | 85e2e47 | 2001-01-26 06:49:56 +0000 | [diff] [blame] | 595 |         # This version due to Janne Sinkkonen, and matches all the std | 
 | 596 |         # texts (e.g., Knuth Vol 2 Ed 3 pg 134 "the beta distribution"). | 
 | 597 |         y = self.gammavariate(alpha, 1.) | 
 | 598 |         if y == 0: | 
 | 599 |             return 0.0 | 
 | 600 |         else: | 
 | 601 |             return y / (y + self.gammavariate(beta, 1.)) | 
| Guido van Rossum | 95bfcda | 1994-03-09 14:21:05 +0000 | [diff] [blame] | 602 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 603 | ## -------------------- Pareto -------------------- | 
| Guido van Rossum | cf4559a | 1997-12-02 02:47:39 +0000 | [diff] [blame] | 604 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 605 |     def paretovariate(self, alpha): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 606 |         """Pareto distribution.  alpha is the shape parameter.""" | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 607 |         # Jain, pg. 495 | 
| Guido van Rossum | cf4559a | 1997-12-02 02:47:39 +0000 | [diff] [blame] | 608 |  | 
| Raymond Hettinger | 73ced7e | 2003-01-04 09:26:32 +0000 | [diff] [blame] | 609 |         u = 1.0 - self.random() | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 610 |         return 1.0 / pow(u, 1.0/alpha) | 
| Guido van Rossum | cf4559a | 1997-12-02 02:47:39 +0000 | [diff] [blame] | 611 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 612 | ## -------------------- Weibull -------------------- | 
| Guido van Rossum | cf4559a | 1997-12-02 02:47:39 +0000 | [diff] [blame] | 613 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 614 |     def weibullvariate(self, alpha, beta): | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 615 |         """Weibull distribution. | 
 | 616 |  | 
 | 617 |         alpha is the scale parameter and beta is the shape parameter. | 
| Raymond Hettinger | ef4d4bd | 2002-05-23 23:58:17 +0000 | [diff] [blame] | 618 |  | 
| Raymond Hettinger | c32f033 | 2002-05-23 19:44:49 +0000 | [diff] [blame] | 619 |         """ | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 620 |         # Jain, pg. 499; bug fix courtesy Bill Arms | 
| Guido van Rossum | cf4559a | 1997-12-02 02:47:39 +0000 | [diff] [blame] | 621 |  | 
| Raymond Hettinger | 73ced7e | 2003-01-04 09:26:32 +0000 | [diff] [blame] | 622 |         u = 1.0 - self.random() | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 623 |         return alpha * pow(-_log(u), 1.0/beta) | 
| Guido van Rossum | 6c395ba | 1999-08-18 13:53:28 +0000 | [diff] [blame] | 624 |  | 
| Raymond Hettinger | 23f1241 | 2004-09-13 22:23:21 +0000 | [diff] [blame] | 625 | ## --------------- Operating System Random Source  ------------------ | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 626 |  | 
| Raymond Hettinger | 23f1241 | 2004-09-13 22:23:21 +0000 | [diff] [blame] | 627 | class SystemRandom(Random): | 
 | 628 |     """Alternate random number generator using sources provided | 
 | 629 |     by the operating system (such as /dev/urandom on Unix or | 
 | 630 |     CryptGenRandom on Windows). | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 631 |  | 
 | 632 |      Not available on all systems (see os.urandom() for details). | 
 | 633 |     """ | 
 | 634 |  | 
 | 635 |     def random(self): | 
 | 636 |         """Get the next random number in the range [0.0, 1.0).""" | 
| Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 637 |         return (int(_hexlify(_urandom(7)), 16) >> 3) * RECIP_BPF | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 638 |  | 
 | 639 |     def getrandbits(self, k): | 
 | 640 |         """getrandbits(k) -> x.  Generates a long int with k random bits.""" | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 641 |         if k <= 0: | 
 | 642 |             raise ValueError('number of bits must be greater than zero') | 
 | 643 |         if k != int(k): | 
 | 644 |             raise TypeError('number of bits should be an integer') | 
 | 645 |         bytes = (k + 7) // 8                    # bits / 8 and rounded up | 
| Guido van Rossum | e2a383d | 2007-01-15 16:59:06 +0000 | [diff] [blame] | 646 |         x = int(_hexlify(_urandom(bytes)), 16) | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 647 |         return x >> (bytes * 8 - k)             # trim excess bits | 
 | 648 |  | 
| Raymond Hettinger | 28de64f | 2008-01-13 23:40:30 +0000 | [diff] [blame] | 649 |     def seed(self, *args, **kwds): | 
| Raymond Hettinger | 23f1241 | 2004-09-13 22:23:21 +0000 | [diff] [blame] | 650 |         "Stub method.  Not used for a system random number generator." | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 651 |         return None | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 652 |  | 
 | 653 |     def _notimplemented(self, *args, **kwds): | 
| Raymond Hettinger | 23f1241 | 2004-09-13 22:23:21 +0000 | [diff] [blame] | 654 |         "Method should not be called for a system random number generator." | 
 | 655 |         raise NotImplementedError('System entropy source does not have state.') | 
| Raymond Hettinger | 356a459 | 2004-08-30 06:14:31 +0000 | [diff] [blame] | 656 |     getstate = setstate = _notimplemented | 
 | 657 |  | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 658 | ## -------------------- test program -------------------- | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 659 |  | 
| Raymond Hettinger | 6229713 | 2003-08-30 01:24:19 +0000 | [diff] [blame] | 660 | def _test_generator(n, func, args): | 
| Tim Peters | 0c9886d | 2001-01-15 01:18:21 +0000 | [diff] [blame] | 661 |     import time | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 662 |     print(n, 'times', func.__name__) | 
| Raymond Hettinger | b98154e | 2003-05-24 17:26:02 +0000 | [diff] [blame] | 663 |     total = 0.0 | 
| Tim Peters | 0c9886d | 2001-01-15 01:18:21 +0000 | [diff] [blame] | 664 |     sqsum = 0.0 | 
 | 665 |     smallest = 1e10 | 
 | 666 |     largest = -1e10 | 
 | 667 |     t0 = time.time() | 
 | 668 |     for i in range(n): | 
| Raymond Hettinger | 6229713 | 2003-08-30 01:24:19 +0000 | [diff] [blame] | 669 |         x = func(*args) | 
| Raymond Hettinger | b98154e | 2003-05-24 17:26:02 +0000 | [diff] [blame] | 670 |         total += x | 
| Tim Peters | 0c9886d | 2001-01-15 01:18:21 +0000 | [diff] [blame] | 671 |         sqsum = sqsum + x*x | 
 | 672 |         smallest = min(x, smallest) | 
 | 673 |         largest = max(x, largest) | 
 | 674 |     t1 = time.time() | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 675 |     print(round(t1-t0, 3), 'sec,', end=' ') | 
| Raymond Hettinger | b98154e | 2003-05-24 17:26:02 +0000 | [diff] [blame] | 676 |     avg = total/n | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 677 |     stddev = _sqrt(sqsum/n - avg*avg) | 
| Guido van Rossum | be19ed7 | 2007-02-09 05:37:30 +0000 | [diff] [blame] | 678 |     print('avg %g, stddev %g, min %g, max %g' % \ | 
 | 679 |               (avg, stddev, smallest, largest)) | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 680 |  | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 681 |  | 
 | 682 | def _test(N=2000): | 
| Raymond Hettinger | 6229713 | 2003-08-30 01:24:19 +0000 | [diff] [blame] | 683 |     _test_generator(N, random, ()) | 
 | 684 |     _test_generator(N, normalvariate, (0.0, 1.0)) | 
 | 685 |     _test_generator(N, lognormvariate, (0.0, 1.0)) | 
 | 686 |     _test_generator(N, vonmisesvariate, (0.0, 1.0)) | 
 | 687 |     _test_generator(N, gammavariate, (0.01, 1.0)) | 
 | 688 |     _test_generator(N, gammavariate, (0.1, 1.0)) | 
 | 689 |     _test_generator(N, gammavariate, (0.1, 2.0)) | 
 | 690 |     _test_generator(N, gammavariate, (0.5, 1.0)) | 
 | 691 |     _test_generator(N, gammavariate, (0.9, 1.0)) | 
 | 692 |     _test_generator(N, gammavariate, (1.0, 1.0)) | 
 | 693 |     _test_generator(N, gammavariate, (2.0, 1.0)) | 
 | 694 |     _test_generator(N, gammavariate, (20.0, 1.0)) | 
 | 695 |     _test_generator(N, gammavariate, (200.0, 1.0)) | 
 | 696 |     _test_generator(N, gauss, (0.0, 1.0)) | 
 | 697 |     _test_generator(N, betavariate, (3.0, 3.0)) | 
| Christian Heimes | fe337bf | 2008-03-23 21:54:12 +0000 | [diff] [blame] | 698 |     _test_generator(N, triangular, (0.0, 1.0, 1.0/3.0)) | 
| Tim Peters | cd80410 | 2001-01-25 20:25:57 +0000 | [diff] [blame] | 699 |  | 
| Tim Peters | 715c4c4 | 2001-01-26 22:56:56 +0000 | [diff] [blame] | 700 | # Create one instance, seeded from current time, and export its methods | 
| Raymond Hettinger | 40f6217 | 2002-12-29 23:03:38 +0000 | [diff] [blame] | 701 | # as module-level functions.  The functions share state across all uses | 
 | 702 | #(both in the user's code and in the Python libraries), but that's fine | 
 | 703 | # for most programs and is easier for the casual user than making them | 
 | 704 | # instantiate their own Random() instance. | 
 | 705 |  | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 706 | _inst = Random() | 
 | 707 | seed = _inst.seed | 
 | 708 | random = _inst.random | 
 | 709 | uniform = _inst.uniform | 
| Christian Heimes | fe337bf | 2008-03-23 21:54:12 +0000 | [diff] [blame] | 710 | triangular = _inst.triangular | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 711 | randint = _inst.randint | 
 | 712 | choice = _inst.choice | 
 | 713 | randrange = _inst.randrange | 
| Raymond Hettinger | f24eb35 | 2002-11-12 17:41:57 +0000 | [diff] [blame] | 714 | sample = _inst.sample | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 715 | shuffle = _inst.shuffle | 
 | 716 | normalvariate = _inst.normalvariate | 
 | 717 | lognormvariate = _inst.lognormvariate | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 718 | expovariate = _inst.expovariate | 
 | 719 | vonmisesvariate = _inst.vonmisesvariate | 
 | 720 | gammavariate = _inst.gammavariate | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 721 | gauss = _inst.gauss | 
 | 722 | betavariate = _inst.betavariate | 
 | 723 | paretovariate = _inst.paretovariate | 
 | 724 | weibullvariate = _inst.weibullvariate | 
 | 725 | getstate = _inst.getstate | 
 | 726 | setstate = _inst.setstate | 
| Raymond Hettinger | 2f726e9 | 2003-10-05 09:09:15 +0000 | [diff] [blame] | 727 | getrandbits = _inst.getrandbits | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 728 |  | 
| Guido van Rossum | ff03b1a | 1994-03-09 12:55:02 +0000 | [diff] [blame] | 729 | if __name__ == '__main__': | 
| Tim Peters | d7b5e88 | 2001-01-25 03:36:26 +0000 | [diff] [blame] | 730 |     _test() |