blob: 72b422f480dfcea72338420b699f99af0e655c5d [file] [log] [blame]
Guido van Rossume7b146f2000-02-04 15:28:42 +00001"""Random variable generators.
Guido van Rossumff03b1a1994-03-09 12:55:02 +00002
Tim Petersd7b5e882001-01-25 03:36:26 +00003 integers
4 --------
5 uniform within range
6
7 sequences
8 ---------
9 pick random element
Raymond Hettingerf24eb352002-11-12 17:41:57 +000010 pick random sample
Tim Petersd7b5e882001-01-25 03:36:26 +000011 generate random permutation
12
Guido van Rossume7b146f2000-02-04 15:28:42 +000013 distributions on the real line:
14 ------------------------------
Tim Petersd7b5e882001-01-25 03:36:26 +000015 uniform
Guido van Rossume7b146f2000-02-04 15:28:42 +000016 normal (Gaussian)
17 lognormal
18 negative exponential
19 gamma
20 beta
Raymond Hettinger40f62172002-12-29 23:03:38 +000021 pareto
22 Weibull
Guido van Rossumff03b1a1994-03-09 12:55:02 +000023
Guido van Rossume7b146f2000-02-04 15:28:42 +000024 distributions on the circle (angles 0 to 2pi)
25 ---------------------------------------------
26 circular uniform
27 von Mises
28
Raymond Hettinger40f62172002-12-29 23:03:38 +000029General notes on the underlying Mersenne Twister core generator:
Guido van Rossume7b146f2000-02-04 15:28:42 +000030
Raymond Hettinger40f62172002-12-29 23:03:38 +000031* The period is 2**19937-1.
Thomas Wouters0e3f5912006-08-11 14:57:12 +000032* It is one of the most extensively tested generators in existence.
Thomas Wouters0e3f5912006-08-11 14:57:12 +000033* The random() method is implemented in C, executes in a single Python step,
34 and is, therefore, threadsafe.
Tim Peterse360d952001-01-26 10:00:39 +000035
Guido van Rossume7b146f2000-02-04 15:28:42 +000036"""
Guido van Rossumd03e1191998-05-29 17:51:31 +000037
Raymond Hettinger2f726e92003-10-05 09:09:15 +000038from warnings import warn as _warn
39from types import MethodType as _MethodType, BuiltinMethodType as _BuiltinMethodType
Raymond Hettinger91e27c22005-08-19 01:36:35 +000040from math import log as _log, exp as _exp, pi as _pi, e as _e, ceil as _ceil
Tim Petersd7b5e882001-01-25 03:36:26 +000041from math import sqrt as _sqrt, acos as _acos, cos as _cos, sin as _sin
Raymond Hettingerc1c43ca2004-09-05 00:00:42 +000042from os import urandom as _urandom
43from binascii import hexlify as _hexlify
Guido van Rossumff03b1a1994-03-09 12:55:02 +000044
Raymond Hettingerf24eb352002-11-12 17:41:57 +000045__all__ = ["Random","seed","random","uniform","randint","choice","sample",
Skip Montanaro0de65802001-02-15 22:15:14 +000046 "randrange","shuffle","normalvariate","lognormvariate",
Raymond Hettingerf8a52d32003-08-05 12:23:19 +000047 "expovariate","vonmisesvariate","gammavariate",
48 "gauss","betavariate","paretovariate","weibullvariate",
Raymond Hettinger28de64f2008-01-13 23:40:30 +000049 "getstate","setstate", "getrandbits",
Raymond Hettinger23f12412004-09-13 22:23:21 +000050 "SystemRandom"]
Tim Petersd7b5e882001-01-25 03:36:26 +000051
52NV_MAGICCONST = 4 * _exp(-0.5)/_sqrt(2.0)
Tim Petersd7b5e882001-01-25 03:36:26 +000053TWOPI = 2.0*_pi
Tim Petersd7b5e882001-01-25 03:36:26 +000054LOG4 = _log(4.0)
Tim Petersd7b5e882001-01-25 03:36:26 +000055SG_MAGICCONST = 1.0 + _log(4.5)
Raymond Hettinger2f726e92003-10-05 09:09:15 +000056BPF = 53 # Number of bits in a float
Tim Peters7c2a85b2004-08-31 02:19:55 +000057RECIP_BPF = 2**-BPF
Tim Petersd7b5e882001-01-25 03:36:26 +000058
Raymond Hettinger356a4592004-08-30 06:14:31 +000059
Tim Petersd7b5e882001-01-25 03:36:26 +000060# Translated by Guido van Rossum from C source provided by
Raymond Hettinger40f62172002-12-29 23:03:38 +000061# Adrian Baddeley. Adapted by Raymond Hettinger for use with
Raymond Hettinger3fa19d72004-08-31 01:05:15 +000062# the Mersenne Twister and os.urandom() core generators.
Tim Petersd7b5e882001-01-25 03:36:26 +000063
Raymond Hettinger145a4a02003-01-07 10:25:55 +000064import _random
Raymond Hettinger40f62172002-12-29 23:03:38 +000065
Raymond Hettinger145a4a02003-01-07 10:25:55 +000066class Random(_random.Random):
Raymond Hettingerc32f0332002-05-23 19:44:49 +000067 """Random number generator base class used by bound module functions.
68
69 Used to instantiate instances of Random to get generators that don't
Raymond Hettinger28de64f2008-01-13 23:40:30 +000070 share state.
Raymond Hettingerc32f0332002-05-23 19:44:49 +000071
72 Class Random can also be subclassed if you want to use a different basic
73 generator of your own devising: in that case, override the following
Raymond Hettinger28de64f2008-01-13 23:40:30 +000074 methods: random(), seed(), getstate(), and setstate().
Raymond Hettinger2f726e92003-10-05 09:09:15 +000075 Optionally, implement a getrandombits() method so that randrange()
76 can cover arbitrarily large ranges.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +000077
Raymond Hettingerc32f0332002-05-23 19:44:49 +000078 """
Tim Petersd7b5e882001-01-25 03:36:26 +000079
Christian Heimescbf3b5c2007-12-03 21:02:03 +000080 VERSION = 3 # used by getstate/setstate
Tim Petersd7b5e882001-01-25 03:36:26 +000081
82 def __init__(self, x=None):
83 """Initialize an instance.
84
85 Optional argument x controls seeding, as for Random.seed().
86 """
87
88 self.seed(x)
Raymond Hettinger40f62172002-12-29 23:03:38 +000089 self.gauss_next = None
Tim Petersd7b5e882001-01-25 03:36:26 +000090
Tim Peters0de88fc2001-02-01 04:59:18 +000091 def seed(self, a=None):
92 """Initialize internal state from hashable object.
Tim Petersd7b5e882001-01-25 03:36:26 +000093
Raymond Hettinger23f12412004-09-13 22:23:21 +000094 None or no argument seeds from current time or from an operating
95 system specific randomness source if available.
Tim Peters0de88fc2001-02-01 04:59:18 +000096
Tim Petersbcd725f2001-02-01 10:06:53 +000097 If a is not None or an int or long, hash(a) is used instead.
Tim Petersd7b5e882001-01-25 03:36:26 +000098 """
99
Raymond Hettinger3081d592003-08-09 18:30:57 +0000100 if a is None:
Raymond Hettingerc1c43ca2004-09-05 00:00:42 +0000101 try:
Guido van Rossume2a383d2007-01-15 16:59:06 +0000102 a = int(_hexlify(_urandom(16)), 16)
Raymond Hettingerc1c43ca2004-09-05 00:00:42 +0000103 except NotImplementedError:
Raymond Hettinger356a4592004-08-30 06:14:31 +0000104 import time
Guido van Rossume2a383d2007-01-15 16:59:06 +0000105 a = int(time.time() * 256) # use fractional seconds
Raymond Hettinger356a4592004-08-30 06:14:31 +0000106
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000107 super().seed(a)
Tim Peters46c04e12002-05-05 20:40:00 +0000108 self.gauss_next = None
109
Tim Peterscd804102001-01-25 20:25:57 +0000110 def getstate(self):
111 """Return internal state; can be passed to setstate() later."""
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000112 return self.VERSION, super().getstate(), self.gauss_next
Tim Peterscd804102001-01-25 20:25:57 +0000113
114 def setstate(self, state):
115 """Restore internal state from object returned by getstate()."""
116 version = state[0]
Christian Heimescbf3b5c2007-12-03 21:02:03 +0000117 if version == 3:
Raymond Hettinger40f62172002-12-29 23:03:38 +0000118 version, internalstate, self.gauss_next = state
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000119 super().setstate(internalstate)
Christian Heimescbf3b5c2007-12-03 21:02:03 +0000120 elif version == 2:
121 version, internalstate, self.gauss_next = state
122 # In version 2, the state was saved as signed ints, which causes
123 # inconsistencies between 32/64-bit systems. The state is
124 # really unsigned 32-bit ints, so we convert negative ints from
125 # version 2 to positive longs for version 3.
126 try:
127 internalstate = tuple( x % (2**32) for x in internalstate )
128 except ValueError as e:
129 raise TypeError from e
130 super(Random, self).setstate(internalstate)
Tim Peterscd804102001-01-25 20:25:57 +0000131 else:
132 raise ValueError("state with version %s passed to "
133 "Random.setstate() of version %s" %
134 (version, self.VERSION))
135
Tim Peterscd804102001-01-25 20:25:57 +0000136## ---- Methods below this point do not need to be overridden when
137## ---- subclassing for the purpose of using a different core generator.
138
139## -------------------- pickle support -------------------
140
141 def __getstate__(self): # for pickle
142 return self.getstate()
143
144 def __setstate__(self, state): # for pickle
145 self.setstate(state)
146
Raymond Hettinger5f078ff2003-06-24 20:29:04 +0000147 def __reduce__(self):
148 return self.__class__, (), self.getstate()
149
Tim Peterscd804102001-01-25 20:25:57 +0000150## -------------------- integer methods -------------------
151
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000152 def randrange(self, start, stop=None, step=1, int=int, default=None,
Guido van Rossume2a383d2007-01-15 16:59:06 +0000153 maxwidth=1<<BPF):
Tim Petersd7b5e882001-01-25 03:36:26 +0000154 """Choose a random item from range(start, stop[, step]).
155
156 This fixes the problem with randint() which includes the
157 endpoint; in Python this is usually not what you want.
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000158 Do not supply the 'int', 'default', and 'maxwidth' arguments.
Tim Petersd7b5e882001-01-25 03:36:26 +0000159 """
160
161 # This code is a bit messy to make it fast for the
Tim Peters9146f272002-08-16 03:41:39 +0000162 # common case while still doing adequate error checking.
Tim Petersd7b5e882001-01-25 03:36:26 +0000163 istart = int(start)
164 if istart != start:
Collin Winterce36ad82007-08-30 01:19:48 +0000165 raise ValueError("non-integer arg 1 for randrange()")
Tim Petersd7b5e882001-01-25 03:36:26 +0000166 if stop is default:
167 if istart > 0:
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000168 if istart >= maxwidth:
169 return self._randbelow(istart)
Tim Petersd7b5e882001-01-25 03:36:26 +0000170 return int(self.random() * istart)
Collin Winterce36ad82007-08-30 01:19:48 +0000171 raise ValueError("empty range for randrange()")
Tim Peters9146f272002-08-16 03:41:39 +0000172
173 # stop argument supplied.
Tim Petersd7b5e882001-01-25 03:36:26 +0000174 istop = int(stop)
175 if istop != stop:
Collin Winterce36ad82007-08-30 01:19:48 +0000176 raise ValueError("non-integer stop for randrange()")
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000177 width = istop - istart
178 if step == 1 and width > 0:
Tim Peters76ca1d42003-06-19 03:46:46 +0000179 # Note that
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000180 # int(istart + self.random()*width)
Tim Peters76ca1d42003-06-19 03:46:46 +0000181 # instead would be incorrect. For example, consider istart
182 # = -2 and istop = 0. Then the guts would be in
183 # -2.0 to 0.0 exclusive on both ends (ignoring that random()
184 # might return 0.0), and because int() truncates toward 0, the
185 # final result would be -1 or 0 (instead of -2 or -1).
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000186 # istart + int(self.random()*width)
Tim Peters76ca1d42003-06-19 03:46:46 +0000187 # would also be incorrect, for a subtler reason: the RHS
188 # can return a long, and then randrange() would also return
189 # a long, but we're supposed to return an int (for backward
190 # compatibility).
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000191
192 if width >= maxwidth:
Tim Peters58eb11c2004-01-18 20:29:55 +0000193 return int(istart + self._randbelow(width))
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000194 return int(istart + int(self.random()*width))
Tim Petersd7b5e882001-01-25 03:36:26 +0000195 if step == 1:
Collin Winterce36ad82007-08-30 01:19:48 +0000196 raise ValueError("empty range for randrange() (%d,%d, %d)" % (istart, istop, width))
Tim Peters9146f272002-08-16 03:41:39 +0000197
198 # Non-unit step argument supplied.
Tim Petersd7b5e882001-01-25 03:36:26 +0000199 istep = int(step)
200 if istep != step:
Collin Winterce36ad82007-08-30 01:19:48 +0000201 raise ValueError("non-integer step for randrange()")
Tim Petersd7b5e882001-01-25 03:36:26 +0000202 if istep > 0:
Raymond Hettingerffdb8bb2004-09-27 15:29:05 +0000203 n = (width + istep - 1) // istep
Tim Petersd7b5e882001-01-25 03:36:26 +0000204 elif istep < 0:
Raymond Hettingerffdb8bb2004-09-27 15:29:05 +0000205 n = (width + istep + 1) // istep
Tim Petersd7b5e882001-01-25 03:36:26 +0000206 else:
Collin Winterce36ad82007-08-30 01:19:48 +0000207 raise ValueError("zero step for randrange()")
Tim Petersd7b5e882001-01-25 03:36:26 +0000208
209 if n <= 0:
Collin Winterce36ad82007-08-30 01:19:48 +0000210 raise ValueError("empty range for randrange()")
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000211
212 if n >= maxwidth:
Thomas Wouters902d6eb2007-01-09 23:18:33 +0000213 return istart + istep*self._randbelow(n)
Tim Petersd7b5e882001-01-25 03:36:26 +0000214 return istart + istep*int(self.random() * n)
215
216 def randint(self, a, b):
Tim Peterscd804102001-01-25 20:25:57 +0000217 """Return random integer in range [a, b], including both end points.
Tim Petersd7b5e882001-01-25 03:36:26 +0000218 """
219
220 return self.randrange(a, b+1)
221
Guido van Rossume2a383d2007-01-15 16:59:06 +0000222 def _randbelow(self, n, _log=_log, int=int, _maxwidth=1<<BPF,
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000223 _Method=_MethodType, _BuiltinMethod=_BuiltinMethodType):
224 """Return a random int in the range [0,n)
225
226 Handles the case where n has more bits than returned
227 by a single call to the underlying generator.
228 """
229
230 try:
231 getrandbits = self.getrandbits
232 except AttributeError:
233 pass
234 else:
235 # Only call self.getrandbits if the original random() builtin method
236 # has not been overridden or if a new getrandbits() was supplied.
237 # This assures that the two methods correspond.
238 if type(self.random) is _BuiltinMethod or type(getrandbits) is _Method:
239 k = int(1.00001 + _log(n-1, 2.0)) # 2**k > n-1 > 2**(k-2)
240 r = getrandbits(k)
241 while r >= n:
242 r = getrandbits(k)
243 return r
244 if n >= _maxwidth:
245 _warn("Underlying random() generator does not supply \n"
246 "enough bits to choose from a population range this large")
247 return int(self.random() * n)
248
Tim Peterscd804102001-01-25 20:25:57 +0000249## -------------------- sequence methods -------------------
250
Tim Petersd7b5e882001-01-25 03:36:26 +0000251 def choice(self, seq):
252 """Choose a random element from a non-empty sequence."""
Raymond Hettinger5dae5052004-06-07 02:07:15 +0000253 return seq[int(self.random() * len(seq))] # raises IndexError if seq is empty
Tim Petersd7b5e882001-01-25 03:36:26 +0000254
255 def shuffle(self, x, random=None, int=int):
256 """x, random=random.random -> shuffle list x in place; return None.
257
258 Optional arg random is a 0-argument function returning a random
259 float in [0.0, 1.0); by default, the standard random.random.
Tim Petersd7b5e882001-01-25 03:36:26 +0000260 """
261
262 if random is None:
263 random = self.random
Guido van Rossum805365e2007-05-07 22:24:25 +0000264 for i in reversed(range(1, len(x))):
Tim Peterscd804102001-01-25 20:25:57 +0000265 # pick an element in x[:i+1] with which to exchange x[i]
Tim Petersd7b5e882001-01-25 03:36:26 +0000266 j = int(random() * (i+1))
267 x[i], x[j] = x[j], x[i]
268
Raymond Hettingerfdbe5222003-06-13 07:01:51 +0000269 def sample(self, population, k):
Raymond Hettinger1acde192008-01-14 01:00:53 +0000270 """Chooses k unique random elements from a population sequence or set.
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000271
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000272 Returns a new list containing elements from the population while
273 leaving the original population unchanged. The resulting list is
274 in selection order so that all sub-slices will also be valid random
275 samples. This allows raffle winners (the sample) to be partitioned
276 into grand prize and second place winners (the subslices).
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000277
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000278 Members of the population need not be hashable or unique. If the
279 population contains repeats, then each occurrence is a possible
280 selection in the sample.
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000281
Guido van Rossum805365e2007-05-07 22:24:25 +0000282 To choose a sample in a range of integers, use range as an argument.
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000283 This is especially fast and space efficient for sampling from a
Guido van Rossum805365e2007-05-07 22:24:25 +0000284 large population: sample(range(10000000), 60)
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000285 """
286
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000287 # Sampling without replacement entails tracking either potential
Raymond Hettinger91e27c22005-08-19 01:36:35 +0000288 # selections (the pool) in a list or previous selections in a set.
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000289
Jeremy Hylton2b55d352004-02-23 17:27:57 +0000290 # When the number of selections is small compared to the
291 # population, then tracking selections is efficient, requiring
Raymond Hettinger91e27c22005-08-19 01:36:35 +0000292 # only a small set and an occasional reselection. For
Jeremy Hylton2b55d352004-02-23 17:27:57 +0000293 # a larger number of selections, the pool tracking method is
294 # preferred since the list takes less space than the
Raymond Hettinger91e27c22005-08-19 01:36:35 +0000295 # set and it doesn't suffer from frequent reselections.
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000296
Raymond Hettinger1acde192008-01-14 01:00:53 +0000297 if isinstance(population, (set, frozenset)):
298 population = tuple(population)
299 if not hasattr(population, '__getitem__') or hasattr(population, 'keys'):
300 raise TypeError("Population must be a sequence or set. For dicts, use dict.keys().")
301 random = self.random
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000302 n = len(population)
303 if not 0 <= k <= n:
Raymond Hettinger1acde192008-01-14 01:00:53 +0000304 raise ValueError("Sample larger than population")
Raymond Hettingerfdbe5222003-06-13 07:01:51 +0000305 _int = int
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000306 result = [None] * k
Raymond Hettinger91e27c22005-08-19 01:36:35 +0000307 setsize = 21 # size of a small set minus size of an empty list
308 if k > 5:
Tim Peters9e34c042005-08-26 15:20:46 +0000309 setsize += 4 ** _ceil(_log(k * 3, 4)) # table size for big sets
Raymond Hettinger1acde192008-01-14 01:00:53 +0000310 if n <= setsize:
311 # An n-length list is smaller than a k-length set
Raymond Hettinger311f4192002-11-18 09:01:24 +0000312 pool = list(population)
Guido van Rossum805365e2007-05-07 22:24:25 +0000313 for i in range(k): # invariant: non-selected at [0,n-i)
Raymond Hettingerfdbe5222003-06-13 07:01:51 +0000314 j = _int(random() * (n-i))
Raymond Hettinger311f4192002-11-18 09:01:24 +0000315 result[i] = pool[j]
Raymond Hettinger8b9aa8d2003-01-04 05:20:33 +0000316 pool[j] = pool[n-i-1] # move non-selected item into vacancy
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000317 else:
Raymond Hettinger1acde192008-01-14 01:00:53 +0000318 selected = set()
319 selected_add = selected.add
320 for i in range(k):
321 j = _int(random() * n)
322 while j in selected:
Raymond Hettingerfdbe5222003-06-13 07:01:51 +0000323 j = _int(random() * n)
Raymond Hettinger1acde192008-01-14 01:00:53 +0000324 selected_add(j)
325 result[i] = population[j]
Raymond Hettinger311f4192002-11-18 09:01:24 +0000326 return result
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000327
Tim Peterscd804102001-01-25 20:25:57 +0000328## -------------------- real-valued distributions -------------------
329
330## -------------------- uniform distribution -------------------
Tim Petersd7b5e882001-01-25 03:36:26 +0000331
332 def uniform(self, a, b):
333 """Get a random number in the range [a, b)."""
334 return a + (b-a) * self.random()
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000335
Tim Peterscd804102001-01-25 20:25:57 +0000336## -------------------- normal distribution --------------------
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000337
Tim Petersd7b5e882001-01-25 03:36:26 +0000338 def normalvariate(self, mu, sigma):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000339 """Normal distribution.
340
341 mu is the mean, and sigma is the standard deviation.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000342
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000343 """
Tim Petersd7b5e882001-01-25 03:36:26 +0000344 # mu = mean, sigma = standard deviation
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000345
Tim Petersd7b5e882001-01-25 03:36:26 +0000346 # Uses Kinderman and Monahan method. Reference: Kinderman,
347 # A.J. and Monahan, J.F., "Computer generation of random
348 # variables using the ratio of uniform deviates", ACM Trans
349 # Math Software, 3, (1977), pp257-260.
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000350
Tim Petersd7b5e882001-01-25 03:36:26 +0000351 random = self.random
Raymond Hettinger42406e62005-04-30 09:02:51 +0000352 while 1:
Tim Peters0c9886d2001-01-15 01:18:21 +0000353 u1 = random()
Raymond Hettinger73ced7e2003-01-04 09:26:32 +0000354 u2 = 1.0 - random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000355 z = NV_MAGICCONST*(u1-0.5)/u2
356 zz = z*z/4.0
357 if zz <= -_log(u2):
358 break
359 return mu + z*sigma
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000360
Tim Peterscd804102001-01-25 20:25:57 +0000361## -------------------- lognormal distribution --------------------
Tim Petersd7b5e882001-01-25 03:36:26 +0000362
363 def lognormvariate(self, mu, sigma):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000364 """Log normal distribution.
365
366 If you take the natural logarithm of this distribution, you'll get a
367 normal distribution with mean mu and standard deviation sigma.
368 mu can have any value, and sigma must be greater than zero.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000369
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000370 """
Tim Petersd7b5e882001-01-25 03:36:26 +0000371 return _exp(self.normalvariate(mu, sigma))
372
Tim Peterscd804102001-01-25 20:25:57 +0000373## -------------------- exponential distribution --------------------
Tim Petersd7b5e882001-01-25 03:36:26 +0000374
375 def expovariate(self, lambd):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000376 """Exponential distribution.
377
378 lambd is 1.0 divided by the desired mean. (The parameter would be
379 called "lambda", but that is a reserved word in Python.) Returned
380 values range from 0 to positive infinity.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000381
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000382 """
Tim Petersd7b5e882001-01-25 03:36:26 +0000383 # lambd: rate lambd = 1/mean
384 # ('lambda' is a Python reserved word)
385
386 random = self.random
Tim Peters0c9886d2001-01-15 01:18:21 +0000387 u = random()
388 while u <= 1e-7:
389 u = random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000390 return -_log(u)/lambd
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000391
Tim Peterscd804102001-01-25 20:25:57 +0000392## -------------------- von Mises distribution --------------------
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000393
Tim Petersd7b5e882001-01-25 03:36:26 +0000394 def vonmisesvariate(self, mu, kappa):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000395 """Circular data distribution.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000396
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000397 mu is the mean angle, expressed in radians between 0 and 2*pi, and
398 kappa is the concentration parameter, which must be greater than or
399 equal to zero. If kappa is equal to zero, this distribution reduces
400 to a uniform random angle over the range 0 to 2*pi.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000401
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000402 """
Tim Petersd7b5e882001-01-25 03:36:26 +0000403 # mu: mean angle (in radians between 0 and 2*pi)
404 # kappa: concentration parameter kappa (>= 0)
405 # if kappa = 0 generate uniform random angle
406
407 # Based upon an algorithm published in: Fisher, N.I.,
408 # "Statistical Analysis of Circular Data", Cambridge
409 # University Press, 1993.
410
411 # Thanks to Magnus Kessler for a correction to the
412 # implementation of step 4.
413
414 random = self.random
415 if kappa <= 1e-6:
416 return TWOPI * random()
417
418 a = 1.0 + _sqrt(1.0 + 4.0 * kappa * kappa)
419 b = (a - _sqrt(2.0 * a))/(2.0 * kappa)
420 r = (1.0 + b * b)/(2.0 * b)
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000421
Raymond Hettinger42406e62005-04-30 09:02:51 +0000422 while 1:
Tim Peters0c9886d2001-01-15 01:18:21 +0000423 u1 = random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000424
425 z = _cos(_pi * u1)
426 f = (1.0 + r * z)/(r + z)
427 c = kappa * (r - f)
428
429 u2 = random()
430
Raymond Hettinger42406e62005-04-30 09:02:51 +0000431 if u2 < c * (2.0 - c) or u2 <= c * _exp(1.0 - c):
Tim Peters0c9886d2001-01-15 01:18:21 +0000432 break
Tim Petersd7b5e882001-01-25 03:36:26 +0000433
434 u3 = random()
435 if u3 > 0.5:
436 theta = (mu % TWOPI) + _acos(f)
437 else:
438 theta = (mu % TWOPI) - _acos(f)
439
440 return theta
441
Tim Peterscd804102001-01-25 20:25:57 +0000442## -------------------- gamma distribution --------------------
Tim Petersd7b5e882001-01-25 03:36:26 +0000443
444 def gammavariate(self, alpha, beta):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000445 """Gamma distribution. Not the gamma function!
446
447 Conditions on the parameters are alpha > 0 and beta > 0.
448
449 """
Tim Peters8ac14952002-05-23 15:15:30 +0000450
Raymond Hettingerb760efb2002-05-14 06:40:34 +0000451 # alpha > 0, beta > 0, mean is alpha*beta, variance is alpha*beta**2
Tim Peters8ac14952002-05-23 15:15:30 +0000452
Guido van Rossum570764d2002-05-14 14:08:12 +0000453 # Warning: a few older sources define the gamma distribution in terms
454 # of alpha > -1.0
455 if alpha <= 0.0 or beta <= 0.0:
Collin Winterce36ad82007-08-30 01:19:48 +0000456 raise ValueError('gammavariate: alpha and beta must be > 0.0')
Tim Peters8ac14952002-05-23 15:15:30 +0000457
Tim Petersd7b5e882001-01-25 03:36:26 +0000458 random = self.random
Tim Petersd7b5e882001-01-25 03:36:26 +0000459 if alpha > 1.0:
460
461 # Uses R.C.H. Cheng, "The generation of Gamma
462 # variables with non-integral shape parameters",
463 # Applied Statistics, (1977), 26, No. 1, p71-74
464
Raymond Hettingerca6cdc22002-05-13 23:40:14 +0000465 ainv = _sqrt(2.0 * alpha - 1.0)
466 bbb = alpha - LOG4
467 ccc = alpha + ainv
Tim Peters8ac14952002-05-23 15:15:30 +0000468
Raymond Hettinger42406e62005-04-30 09:02:51 +0000469 while 1:
Tim Petersd7b5e882001-01-25 03:36:26 +0000470 u1 = random()
Raymond Hettinger73ced7e2003-01-04 09:26:32 +0000471 if not 1e-7 < u1 < .9999999:
472 continue
473 u2 = 1.0 - random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000474 v = _log(u1/(1.0-u1))/ainv
475 x = alpha*_exp(v)
476 z = u1*u1*u2
477 r = bbb+ccc*v-x
478 if r + SG_MAGICCONST - 4.5*z >= 0.0 or r >= _log(z):
Raymond Hettingerb760efb2002-05-14 06:40:34 +0000479 return x * beta
Tim Petersd7b5e882001-01-25 03:36:26 +0000480
481 elif alpha == 1.0:
482 # expovariate(1)
483 u = random()
484 while u <= 1e-7:
485 u = random()
Raymond Hettingerb760efb2002-05-14 06:40:34 +0000486 return -_log(u) * beta
Tim Petersd7b5e882001-01-25 03:36:26 +0000487
488 else: # alpha is between 0 and 1 (exclusive)
489
490 # Uses ALGORITHM GS of Statistical Computing - Kennedy & Gentle
491
Raymond Hettinger42406e62005-04-30 09:02:51 +0000492 while 1:
Tim Petersd7b5e882001-01-25 03:36:26 +0000493 u = random()
494 b = (_e + alpha)/_e
495 p = b*u
496 if p <= 1.0:
Raymond Hettinger42406e62005-04-30 09:02:51 +0000497 x = p ** (1.0/alpha)
Tim Petersd7b5e882001-01-25 03:36:26 +0000498 else:
Tim Petersd7b5e882001-01-25 03:36:26 +0000499 x = -_log((b-p)/alpha)
500 u1 = random()
Raymond Hettinger42406e62005-04-30 09:02:51 +0000501 if p > 1.0:
502 if u1 <= x ** (alpha - 1.0):
503 break
504 elif u1 <= _exp(-x):
Tim Petersd7b5e882001-01-25 03:36:26 +0000505 break
Raymond Hettingerb760efb2002-05-14 06:40:34 +0000506 return x * beta
507
Tim Peterscd804102001-01-25 20:25:57 +0000508## -------------------- Gauss (faster alternative) --------------------
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000509
Tim Petersd7b5e882001-01-25 03:36:26 +0000510 def gauss(self, mu, sigma):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000511 """Gaussian distribution.
512
513 mu is the mean, and sigma is the standard deviation. This is
514 slightly faster than the normalvariate() function.
515
516 Not thread-safe without a lock around calls.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000517
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000518 """
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000519
Tim Petersd7b5e882001-01-25 03:36:26 +0000520 # When x and y are two variables from [0, 1), uniformly
521 # distributed, then
522 #
523 # cos(2*pi*x)*sqrt(-2*log(1-y))
524 # sin(2*pi*x)*sqrt(-2*log(1-y))
525 #
526 # are two *independent* variables with normal distribution
527 # (mu = 0, sigma = 1).
528 # (Lambert Meertens)
529 # (corrected version; bug discovered by Mike Miller, fixed by LM)
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000530
Tim Petersd7b5e882001-01-25 03:36:26 +0000531 # Multithreading note: When two threads call this function
532 # simultaneously, it is possible that they will receive the
533 # same return value. The window is very small though. To
534 # avoid this, you have to use a lock around all calls. (I
535 # didn't want to slow this down in the serial case by using a
536 # lock here.)
Guido van Rossumd03e1191998-05-29 17:51:31 +0000537
Tim Petersd7b5e882001-01-25 03:36:26 +0000538 random = self.random
539 z = self.gauss_next
540 self.gauss_next = None
541 if z is None:
542 x2pi = random() * TWOPI
543 g2rad = _sqrt(-2.0 * _log(1.0 - random()))
544 z = _cos(x2pi) * g2rad
545 self.gauss_next = _sin(x2pi) * g2rad
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000546
Tim Petersd7b5e882001-01-25 03:36:26 +0000547 return mu + z*sigma
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000548
Tim Peterscd804102001-01-25 20:25:57 +0000549## -------------------- beta --------------------
Tim Peters85e2e472001-01-26 06:49:56 +0000550## See
551## http://sourceforge.net/bugs/?func=detailbug&bug_id=130030&group_id=5470
552## for Ivan Frohne's insightful analysis of why the original implementation:
553##
554## def betavariate(self, alpha, beta):
555## # Discrete Event Simulation in C, pp 87-88.
556##
557## y = self.expovariate(alpha)
558## z = self.expovariate(1.0/beta)
559## return z/(y+z)
560##
561## was dead wrong, and how it probably got that way.
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000562
Tim Petersd7b5e882001-01-25 03:36:26 +0000563 def betavariate(self, alpha, beta):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000564 """Beta distribution.
565
Thomas Woutersb2137042007-02-01 18:02:27 +0000566 Conditions on the parameters are alpha > 0 and beta > 0.
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000567 Returned values range between 0 and 1.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000568
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000569 """
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000570
Tim Peters85e2e472001-01-26 06:49:56 +0000571 # This version due to Janne Sinkkonen, and matches all the std
572 # texts (e.g., Knuth Vol 2 Ed 3 pg 134 "the beta distribution").
573 y = self.gammavariate(alpha, 1.)
574 if y == 0:
575 return 0.0
576 else:
577 return y / (y + self.gammavariate(beta, 1.))
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000578
Tim Peterscd804102001-01-25 20:25:57 +0000579## -------------------- Pareto --------------------
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000580
Tim Petersd7b5e882001-01-25 03:36:26 +0000581 def paretovariate(self, alpha):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000582 """Pareto distribution. alpha is the shape parameter."""
Tim Petersd7b5e882001-01-25 03:36:26 +0000583 # Jain, pg. 495
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000584
Raymond Hettinger73ced7e2003-01-04 09:26:32 +0000585 u = 1.0 - self.random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000586 return 1.0 / pow(u, 1.0/alpha)
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000587
Tim Peterscd804102001-01-25 20:25:57 +0000588## -------------------- Weibull --------------------
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000589
Tim Petersd7b5e882001-01-25 03:36:26 +0000590 def weibullvariate(self, alpha, beta):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000591 """Weibull distribution.
592
593 alpha is the scale parameter and beta is the shape parameter.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000594
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000595 """
Tim Petersd7b5e882001-01-25 03:36:26 +0000596 # Jain, pg. 499; bug fix courtesy Bill Arms
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000597
Raymond Hettinger73ced7e2003-01-04 09:26:32 +0000598 u = 1.0 - self.random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000599 return alpha * pow(-_log(u), 1.0/beta)
Guido van Rossum6c395ba1999-08-18 13:53:28 +0000600
Raymond Hettinger23f12412004-09-13 22:23:21 +0000601## --------------- Operating System Random Source ------------------
Raymond Hettinger356a4592004-08-30 06:14:31 +0000602
Raymond Hettinger23f12412004-09-13 22:23:21 +0000603class SystemRandom(Random):
604 """Alternate random number generator using sources provided
605 by the operating system (such as /dev/urandom on Unix or
606 CryptGenRandom on Windows).
Raymond Hettinger356a4592004-08-30 06:14:31 +0000607
608 Not available on all systems (see os.urandom() for details).
609 """
610
611 def random(self):
612 """Get the next random number in the range [0.0, 1.0)."""
Guido van Rossume2a383d2007-01-15 16:59:06 +0000613 return (int(_hexlify(_urandom(7)), 16) >> 3) * RECIP_BPF
Raymond Hettinger356a4592004-08-30 06:14:31 +0000614
615 def getrandbits(self, k):
616 """getrandbits(k) -> x. Generates a long int with k random bits."""
Raymond Hettinger356a4592004-08-30 06:14:31 +0000617 if k <= 0:
618 raise ValueError('number of bits must be greater than zero')
619 if k != int(k):
620 raise TypeError('number of bits should be an integer')
621 bytes = (k + 7) // 8 # bits / 8 and rounded up
Guido van Rossume2a383d2007-01-15 16:59:06 +0000622 x = int(_hexlify(_urandom(bytes)), 16)
Raymond Hettinger356a4592004-08-30 06:14:31 +0000623 return x >> (bytes * 8 - k) # trim excess bits
624
Raymond Hettinger28de64f2008-01-13 23:40:30 +0000625 def seed(self, *args, **kwds):
Raymond Hettinger23f12412004-09-13 22:23:21 +0000626 "Stub method. Not used for a system random number generator."
Raymond Hettinger356a4592004-08-30 06:14:31 +0000627 return None
Raymond Hettinger356a4592004-08-30 06:14:31 +0000628
629 def _notimplemented(self, *args, **kwds):
Raymond Hettinger23f12412004-09-13 22:23:21 +0000630 "Method should not be called for a system random number generator."
631 raise NotImplementedError('System entropy source does not have state.')
Raymond Hettinger356a4592004-08-30 06:14:31 +0000632 getstate = setstate = _notimplemented
633
Tim Peterscd804102001-01-25 20:25:57 +0000634## -------------------- test program --------------------
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000635
Raymond Hettinger62297132003-08-30 01:24:19 +0000636def _test_generator(n, func, args):
Tim Peters0c9886d2001-01-15 01:18:21 +0000637 import time
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000638 print(n, 'times', func.__name__)
Raymond Hettingerb98154e2003-05-24 17:26:02 +0000639 total = 0.0
Tim Peters0c9886d2001-01-15 01:18:21 +0000640 sqsum = 0.0
641 smallest = 1e10
642 largest = -1e10
643 t0 = time.time()
644 for i in range(n):
Raymond Hettinger62297132003-08-30 01:24:19 +0000645 x = func(*args)
Raymond Hettingerb98154e2003-05-24 17:26:02 +0000646 total += x
Tim Peters0c9886d2001-01-15 01:18:21 +0000647 sqsum = sqsum + x*x
648 smallest = min(x, smallest)
649 largest = max(x, largest)
650 t1 = time.time()
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000651 print(round(t1-t0, 3), 'sec,', end=' ')
Raymond Hettingerb98154e2003-05-24 17:26:02 +0000652 avg = total/n
Tim Petersd7b5e882001-01-25 03:36:26 +0000653 stddev = _sqrt(sqsum/n - avg*avg)
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000654 print('avg %g, stddev %g, min %g, max %g' % \
655 (avg, stddev, smallest, largest))
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000656
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000657
658def _test(N=2000):
Raymond Hettinger62297132003-08-30 01:24:19 +0000659 _test_generator(N, random, ())
660 _test_generator(N, normalvariate, (0.0, 1.0))
661 _test_generator(N, lognormvariate, (0.0, 1.0))
662 _test_generator(N, vonmisesvariate, (0.0, 1.0))
663 _test_generator(N, gammavariate, (0.01, 1.0))
664 _test_generator(N, gammavariate, (0.1, 1.0))
665 _test_generator(N, gammavariate, (0.1, 2.0))
666 _test_generator(N, gammavariate, (0.5, 1.0))
667 _test_generator(N, gammavariate, (0.9, 1.0))
668 _test_generator(N, gammavariate, (1.0, 1.0))
669 _test_generator(N, gammavariate, (2.0, 1.0))
670 _test_generator(N, gammavariate, (20.0, 1.0))
671 _test_generator(N, gammavariate, (200.0, 1.0))
672 _test_generator(N, gauss, (0.0, 1.0))
673 _test_generator(N, betavariate, (3.0, 3.0))
Tim Peterscd804102001-01-25 20:25:57 +0000674
Tim Peters715c4c42001-01-26 22:56:56 +0000675# Create one instance, seeded from current time, and export its methods
Raymond Hettinger40f62172002-12-29 23:03:38 +0000676# as module-level functions. The functions share state across all uses
677#(both in the user's code and in the Python libraries), but that's fine
678# for most programs and is easier for the casual user than making them
679# instantiate their own Random() instance.
680
Tim Petersd7b5e882001-01-25 03:36:26 +0000681_inst = Random()
682seed = _inst.seed
683random = _inst.random
684uniform = _inst.uniform
685randint = _inst.randint
686choice = _inst.choice
687randrange = _inst.randrange
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000688sample = _inst.sample
Tim Petersd7b5e882001-01-25 03:36:26 +0000689shuffle = _inst.shuffle
690normalvariate = _inst.normalvariate
691lognormvariate = _inst.lognormvariate
Tim Petersd7b5e882001-01-25 03:36:26 +0000692expovariate = _inst.expovariate
693vonmisesvariate = _inst.vonmisesvariate
694gammavariate = _inst.gammavariate
Tim Petersd7b5e882001-01-25 03:36:26 +0000695gauss = _inst.gauss
696betavariate = _inst.betavariate
697paretovariate = _inst.paretovariate
698weibullvariate = _inst.weibullvariate
699getstate = _inst.getstate
700setstate = _inst.setstate
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000701getrandbits = _inst.getrandbits
Tim Petersd7b5e882001-01-25 03:36:26 +0000702
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000703if __name__ == '__main__':
Tim Petersd7b5e882001-01-25 03:36:26 +0000704 _test()