blob: 5e5720388a35e70b84abba2527c69762db592703 [file] [log] [blame]
"""Random variable generators.

    integers
    --------
           uniform within range

    sequences
    ---------
           pick random element
           pick random sample
           generate random permutation

    distributions on the real line:
    ------------------------------
           uniform
           normal (Gaussian)
           lognormal
           negative exponential
           gamma
           beta
           pareto
           Weibull

    distributions on the circle (angles 0 to 2pi)
    ---------------------------------------------
           circular uniform
           von Mises

General notes on the underlying Mersenne Twister core generator:

* The period is 2**19937-1.
* It is one of the most extensively tested generators in existence.
* The random() method is implemented in C, executes in a single Python step,
  and is, therefore, threadsafe.

"""
Guido van Rossumd03e1191998-05-29 17:51:31 +000037
Raymond Hettinger2f726e92003-10-05 09:09:15 +000038from warnings import warn as _warn
39from types import MethodType as _MethodType, BuiltinMethodType as _BuiltinMethodType
Raymond Hettinger91e27c22005-08-19 01:36:35 +000040from math import log as _log, exp as _exp, pi as _pi, e as _e, ceil as _ceil
Tim Petersd7b5e882001-01-25 03:36:26 +000041from math import sqrt as _sqrt, acos as _acos, cos as _cos, sin as _sin
Raymond Hettingerc1c43ca2004-09-05 00:00:42 +000042from os import urandom as _urandom
43from binascii import hexlify as _hexlify
Guido van Rossumff03b1a1994-03-09 12:55:02 +000044
# Public names exported by ``from random import *``.
__all__ = [
    "Random",
    "seed",
    "random",
    "uniform",
    "randint",
    "choice",
    "sample",
    "randrange",
    "shuffle",
    "normalvariate",
    "lognormvariate",
    "expovariate",
    "vonmisesvariate",
    "gammavariate",
    "gauss",
    "betavariate",
    "paretovariate",
    "weibullvariate",
    "getstate",
    "setstate",
    "getrandbits",
    "SystemRandom",
]
Tim Petersd7b5e882001-01-25 03:36:26 +000051
# Precomputed constants shared by the distribution methods below.
NV_MAGICCONST = 4 * _exp(-0.5) / _sqrt(2.0)    # used by normalvariate()
TWOPI = 2.0 * _pi                              # full circle, in radians
LOG4 = _log(4.0)                               # used by gammavariate()
SG_MAGICCONST = 1.0 + _log(4.5)                # used by gammavariate()
BPF = 53        # Number of bits in a float
RECIP_BPF = 2 ** -BPF                          # scales a BPF-bit int into [0.0, 1.0)
Tim Petersd7b5e882001-01-25 03:36:26 +000058
Raymond Hettinger356a4592004-08-30 06:14:31 +000059
# Translated by Guido van Rossum from C source provided by
# Adrian Baddeley.  Adapted by Raymond Hettinger for use with
# the Mersenne Twister and os.urandom() core generators.
Tim Petersd7b5e882001-01-25 03:36:26 +000063
Raymond Hettinger145a4a02003-01-07 10:25:55 +000064import _random
Raymond Hettinger40f62172002-12-29 23:03:38 +000065
Raymond Hettinger145a4a02003-01-07 10:25:55 +000066class Random(_random.Random):
Raymond Hettingerc32f0332002-05-23 19:44:49 +000067 """Random number generator base class used by bound module functions.
68
69 Used to instantiate instances of Random to get generators that don't
Raymond Hettinger28de64f2008-01-13 23:40:30 +000070 share state.
Raymond Hettingerc32f0332002-05-23 19:44:49 +000071
72 Class Random can also be subclassed if you want to use a different basic
73 generator of your own devising: in that case, override the following
Raymond Hettinger28de64f2008-01-13 23:40:30 +000074 methods: random(), seed(), getstate(), and setstate().
Raymond Hettinger2f726e92003-10-05 09:09:15 +000075 Optionally, implement a getrandombits() method so that randrange()
76 can cover arbitrarily large ranges.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +000077
Raymond Hettingerc32f0332002-05-23 19:44:49 +000078 """
Tim Petersd7b5e882001-01-25 03:36:26 +000079
Christian Heimescbf3b5c2007-12-03 21:02:03 +000080 VERSION = 3 # used by getstate/setstate
Tim Petersd7b5e882001-01-25 03:36:26 +000081
82 def __init__(self, x=None):
83 """Initialize an instance.
84
85 Optional argument x controls seeding, as for Random.seed().
86 """
87
88 self.seed(x)
Raymond Hettinger40f62172002-12-29 23:03:38 +000089 self.gauss_next = None
Tim Petersd7b5e882001-01-25 03:36:26 +000090
Tim Peters0de88fc2001-02-01 04:59:18 +000091 def seed(self, a=None):
92 """Initialize internal state from hashable object.
Tim Petersd7b5e882001-01-25 03:36:26 +000093
Raymond Hettinger23f12412004-09-13 22:23:21 +000094 None or no argument seeds from current time or from an operating
95 system specific randomness source if available.
Tim Peters0de88fc2001-02-01 04:59:18 +000096
Tim Petersbcd725f2001-02-01 10:06:53 +000097 If a is not None or an int or long, hash(a) is used instead.
Tim Petersd7b5e882001-01-25 03:36:26 +000098 """
99
Raymond Hettinger3081d592003-08-09 18:30:57 +0000100 if a is None:
Raymond Hettingerc1c43ca2004-09-05 00:00:42 +0000101 try:
Guido van Rossume2a383d2007-01-15 16:59:06 +0000102 a = int(_hexlify(_urandom(16)), 16)
Raymond Hettingerc1c43ca2004-09-05 00:00:42 +0000103 except NotImplementedError:
Raymond Hettinger356a4592004-08-30 06:14:31 +0000104 import time
Guido van Rossume2a383d2007-01-15 16:59:06 +0000105 a = int(time.time() * 256) # use fractional seconds
Raymond Hettinger356a4592004-08-30 06:14:31 +0000106
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000107 super().seed(a)
Tim Peters46c04e12002-05-05 20:40:00 +0000108 self.gauss_next = None
109
Tim Peterscd804102001-01-25 20:25:57 +0000110 def getstate(self):
111 """Return internal state; can be passed to setstate() later."""
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000112 return self.VERSION, super().getstate(), self.gauss_next
Tim Peterscd804102001-01-25 20:25:57 +0000113
114 def setstate(self, state):
115 """Restore internal state from object returned by getstate()."""
116 version = state[0]
Christian Heimescbf3b5c2007-12-03 21:02:03 +0000117 if version == 3:
Raymond Hettinger40f62172002-12-29 23:03:38 +0000118 version, internalstate, self.gauss_next = state
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000119 super().setstate(internalstate)
Christian Heimescbf3b5c2007-12-03 21:02:03 +0000120 elif version == 2:
121 version, internalstate, self.gauss_next = state
122 # In version 2, the state was saved as signed ints, which causes
123 # inconsistencies between 32/64-bit systems. The state is
124 # really unsigned 32-bit ints, so we convert negative ints from
125 # version 2 to positive longs for version 3.
126 try:
127 internalstate = tuple( x % (2**32) for x in internalstate )
128 except ValueError as e:
129 raise TypeError from e
130 super(Random, self).setstate(internalstate)
Tim Peterscd804102001-01-25 20:25:57 +0000131 else:
132 raise ValueError("state with version %s passed to "
133 "Random.setstate() of version %s" %
134 (version, self.VERSION))
135
Tim Peterscd804102001-01-25 20:25:57 +0000136## ---- Methods below this point do not need to be overridden when
137## ---- subclassing for the purpose of using a different core generator.
138
139## -------------------- pickle support -------------------
140
141 def __getstate__(self): # for pickle
142 return self.getstate()
143
144 def __setstate__(self, state): # for pickle
145 self.setstate(state)
146
Raymond Hettinger5f078ff2003-06-24 20:29:04 +0000147 def __reduce__(self):
148 return self.__class__, (), self.getstate()
149
Tim Peterscd804102001-01-25 20:25:57 +0000150## -------------------- integer methods -------------------
151
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000152 def randrange(self, start, stop=None, step=1, int=int, default=None,
Guido van Rossume2a383d2007-01-15 16:59:06 +0000153 maxwidth=1<<BPF):
Tim Petersd7b5e882001-01-25 03:36:26 +0000154 """Choose a random item from range(start, stop[, step]).
155
156 This fixes the problem with randint() which includes the
157 endpoint; in Python this is usually not what you want.
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000158 Do not supply the 'int', 'default', and 'maxwidth' arguments.
Tim Petersd7b5e882001-01-25 03:36:26 +0000159 """
160
161 # This code is a bit messy to make it fast for the
Tim Peters9146f272002-08-16 03:41:39 +0000162 # common case while still doing adequate error checking.
Tim Petersd7b5e882001-01-25 03:36:26 +0000163 istart = int(start)
164 if istart != start:
Collin Winterce36ad82007-08-30 01:19:48 +0000165 raise ValueError("non-integer arg 1 for randrange()")
Tim Petersd7b5e882001-01-25 03:36:26 +0000166 if stop is default:
167 if istart > 0:
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000168 if istart >= maxwidth:
169 return self._randbelow(istart)
Tim Petersd7b5e882001-01-25 03:36:26 +0000170 return int(self.random() * istart)
Collin Winterce36ad82007-08-30 01:19:48 +0000171 raise ValueError("empty range for randrange()")
Tim Peters9146f272002-08-16 03:41:39 +0000172
173 # stop argument supplied.
Tim Petersd7b5e882001-01-25 03:36:26 +0000174 istop = int(stop)
175 if istop != stop:
Collin Winterce36ad82007-08-30 01:19:48 +0000176 raise ValueError("non-integer stop for randrange()")
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000177 width = istop - istart
178 if step == 1 and width > 0:
Tim Peters76ca1d42003-06-19 03:46:46 +0000179 # Note that
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000180 # int(istart + self.random()*width)
Tim Peters76ca1d42003-06-19 03:46:46 +0000181 # instead would be incorrect. For example, consider istart
182 # = -2 and istop = 0. Then the guts would be in
183 # -2.0 to 0.0 exclusive on both ends (ignoring that random()
184 # might return 0.0), and because int() truncates toward 0, the
185 # final result would be -1 or 0 (instead of -2 or -1).
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000186 # istart + int(self.random()*width)
Tim Peters76ca1d42003-06-19 03:46:46 +0000187 # would also be incorrect, for a subtler reason: the RHS
188 # can return a long, and then randrange() would also return
189 # a long, but we're supposed to return an int (for backward
190 # compatibility).
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000191
192 if width >= maxwidth:
Tim Peters58eb11c2004-01-18 20:29:55 +0000193 return int(istart + self._randbelow(width))
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000194 return int(istart + int(self.random()*width))
Tim Petersd7b5e882001-01-25 03:36:26 +0000195 if step == 1:
Collin Winterce36ad82007-08-30 01:19:48 +0000196 raise ValueError("empty range for randrange() (%d,%d, %d)" % (istart, istop, width))
Tim Peters9146f272002-08-16 03:41:39 +0000197
198 # Non-unit step argument supplied.
Tim Petersd7b5e882001-01-25 03:36:26 +0000199 istep = int(step)
200 if istep != step:
Collin Winterce36ad82007-08-30 01:19:48 +0000201 raise ValueError("non-integer step for randrange()")
Tim Petersd7b5e882001-01-25 03:36:26 +0000202 if istep > 0:
Raymond Hettingerffdb8bb2004-09-27 15:29:05 +0000203 n = (width + istep - 1) // istep
Tim Petersd7b5e882001-01-25 03:36:26 +0000204 elif istep < 0:
Raymond Hettingerffdb8bb2004-09-27 15:29:05 +0000205 n = (width + istep + 1) // istep
Tim Petersd7b5e882001-01-25 03:36:26 +0000206 else:
Collin Winterce36ad82007-08-30 01:19:48 +0000207 raise ValueError("zero step for randrange()")
Tim Petersd7b5e882001-01-25 03:36:26 +0000208
209 if n <= 0:
Collin Winterce36ad82007-08-30 01:19:48 +0000210 raise ValueError("empty range for randrange()")
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000211
212 if n >= maxwidth:
Thomas Wouters902d6eb2007-01-09 23:18:33 +0000213 return istart + istep*self._randbelow(n)
Tim Petersd7b5e882001-01-25 03:36:26 +0000214 return istart + istep*int(self.random() * n)
215
216 def randint(self, a, b):
Tim Peterscd804102001-01-25 20:25:57 +0000217 """Return random integer in range [a, b], including both end points.
Tim Petersd7b5e882001-01-25 03:36:26 +0000218 """
219
220 return self.randrange(a, b+1)
221
Guido van Rossume2a383d2007-01-15 16:59:06 +0000222 def _randbelow(self, n, _log=_log, int=int, _maxwidth=1<<BPF,
Raymond Hettinger2f726e92003-10-05 09:09:15 +0000223 _Method=_MethodType, _BuiltinMethod=_BuiltinMethodType):
224 """Return a random int in the range [0,n)
225
226 Handles the case where n has more bits than returned
227 by a single call to the underlying generator.
228 """
229
230 try:
231 getrandbits = self.getrandbits
232 except AttributeError:
233 pass
234 else:
235 # Only call self.getrandbits if the original random() builtin method
236 # has not been overridden or if a new getrandbits() was supplied.
237 # This assures that the two methods correspond.
238 if type(self.random) is _BuiltinMethod or type(getrandbits) is _Method:
239 k = int(1.00001 + _log(n-1, 2.0)) # 2**k > n-1 > 2**(k-2)
240 r = getrandbits(k)
241 while r >= n:
242 r = getrandbits(k)
243 return r
244 if n >= _maxwidth:
245 _warn("Underlying random() generator does not supply \n"
246 "enough bits to choose from a population range this large")
247 return int(self.random() * n)
248
Tim Peterscd804102001-01-25 20:25:57 +0000249## -------------------- sequence methods -------------------
250
Tim Petersd7b5e882001-01-25 03:36:26 +0000251 def choice(self, seq):
252 """Choose a random element from a non-empty sequence."""
Raymond Hettinger5dae5052004-06-07 02:07:15 +0000253 return seq[int(self.random() * len(seq))] # raises IndexError if seq is empty
Tim Petersd7b5e882001-01-25 03:36:26 +0000254
255 def shuffle(self, x, random=None, int=int):
256 """x, random=random.random -> shuffle list x in place; return None.
257
258 Optional arg random is a 0-argument function returning a random
259 float in [0.0, 1.0); by default, the standard random.random.
Tim Petersd7b5e882001-01-25 03:36:26 +0000260 """
261
262 if random is None:
263 random = self.random
Guido van Rossum805365e2007-05-07 22:24:25 +0000264 for i in reversed(range(1, len(x))):
Tim Peterscd804102001-01-25 20:25:57 +0000265 # pick an element in x[:i+1] with which to exchange x[i]
Tim Petersd7b5e882001-01-25 03:36:26 +0000266 j = int(random() * (i+1))
267 x[i], x[j] = x[j], x[i]
268
Raymond Hettingerfdbe5222003-06-13 07:01:51 +0000269 def sample(self, population, k):
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000270 """Chooses k unique random elements from a population sequence.
271
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000272 Returns a new list containing elements from the population while
273 leaving the original population unchanged. The resulting list is
274 in selection order so that all sub-slices will also be valid random
275 samples. This allows raffle winners (the sample) to be partitioned
276 into grand prize and second place winners (the subslices).
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000277
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000278 Members of the population need not be hashable or unique. If the
279 population contains repeats, then each occurrence is a possible
280 selection in the sample.
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000281
Guido van Rossum805365e2007-05-07 22:24:25 +0000282 To choose a sample in a range of integers, use range as an argument.
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000283 This is especially fast and space efficient for sampling from a
Guido van Rossum805365e2007-05-07 22:24:25 +0000284 large population: sample(range(10000000), 60)
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000285 """
286
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000287 # XXX Although the documentation says `population` is "a sequence",
288 # XXX attempts are made to cater to any iterable with a __len__
289 # XXX method. This has had mixed success. Examples from both
290 # XXX sides: sets work fine, and should become officially supported;
291 # XXX dicts are much harder, and have failed in various subtle
292 # XXX ways across attempts. Support for mapping types should probably
293 # XXX be dropped (and users should pass mapping.keys() or .values()
294 # XXX explicitly).
295
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000296 # Sampling without replacement entails tracking either potential
Raymond Hettinger91e27c22005-08-19 01:36:35 +0000297 # selections (the pool) in a list or previous selections in a set.
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000298
Jeremy Hylton2b55d352004-02-23 17:27:57 +0000299 # When the number of selections is small compared to the
300 # population, then tracking selections is efficient, requiring
Raymond Hettinger91e27c22005-08-19 01:36:35 +0000301 # only a small set and an occasional reselection. For
Jeremy Hylton2b55d352004-02-23 17:27:57 +0000302 # a larger number of selections, the pool tracking method is
303 # preferred since the list takes less space than the
Raymond Hettinger91e27c22005-08-19 01:36:35 +0000304 # set and it doesn't suffer from frequent reselections.
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000305
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000306 n = len(population)
307 if not 0 <= k <= n:
Collin Winterce36ad82007-08-30 01:19:48 +0000308 raise ValueError("sample larger than population")
Raymond Hettinger8b9aa8d2003-01-04 05:20:33 +0000309 random = self.random
Raymond Hettingerfdbe5222003-06-13 07:01:51 +0000310 _int = int
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000311 result = [None] * k
Raymond Hettinger91e27c22005-08-19 01:36:35 +0000312 setsize = 21 # size of a small set minus size of an empty list
313 if k > 5:
Tim Peters9e34c042005-08-26 15:20:46 +0000314 setsize += 4 ** _ceil(_log(k * 3, 4)) # table size for big sets
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000315 if n <= setsize or hasattr(population, "keys"):
316 # An n-length list is smaller than a k-length set, or this is a
317 # mapping type so the other algorithm wouldn't work.
Raymond Hettinger311f4192002-11-18 09:01:24 +0000318 pool = list(population)
Guido van Rossum805365e2007-05-07 22:24:25 +0000319 for i in range(k): # invariant: non-selected at [0,n-i)
Raymond Hettingerfdbe5222003-06-13 07:01:51 +0000320 j = _int(random() * (n-i))
Raymond Hettinger311f4192002-11-18 09:01:24 +0000321 result[i] = pool[j]
Raymond Hettinger8b9aa8d2003-01-04 05:20:33 +0000322 pool[j] = pool[n-i-1] # move non-selected item into vacancy
Raymond Hettingerc0b40342002-11-13 15:26:37 +0000323 else:
Raymond Hettinger66d09f12003-09-06 04:25:54 +0000324 try:
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000325 selected = set()
326 selected_add = selected.add
Guido van Rossum805365e2007-05-07 22:24:25 +0000327 for i in range(k):
Raymond Hettingerfdbe5222003-06-13 07:01:51 +0000328 j = _int(random() * n)
Thomas Wouters49fd7fa2006-04-21 10:40:58 +0000329 while j in selected:
330 j = _int(random() * n)
331 selected_add(j)
332 result[i] = population[j]
333 except (TypeError, KeyError): # handle (at least) sets
334 if isinstance(population, list):
335 raise
336 return self.sample(tuple(population), k)
Raymond Hettinger311f4192002-11-18 09:01:24 +0000337 return result
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000338
Tim Peterscd804102001-01-25 20:25:57 +0000339## -------------------- real-valued distributions -------------------
340
341## -------------------- uniform distribution -------------------
Tim Petersd7b5e882001-01-25 03:36:26 +0000342
343 def uniform(self, a, b):
344 """Get a random number in the range [a, b)."""
345 return a + (b-a) * self.random()
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000346
Tim Peterscd804102001-01-25 20:25:57 +0000347## -------------------- normal distribution --------------------
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000348
Tim Petersd7b5e882001-01-25 03:36:26 +0000349 def normalvariate(self, mu, sigma):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000350 """Normal distribution.
351
352 mu is the mean, and sigma is the standard deviation.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000353
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000354 """
Tim Petersd7b5e882001-01-25 03:36:26 +0000355 # mu = mean, sigma = standard deviation
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000356
Tim Petersd7b5e882001-01-25 03:36:26 +0000357 # Uses Kinderman and Monahan method. Reference: Kinderman,
358 # A.J. and Monahan, J.F., "Computer generation of random
359 # variables using the ratio of uniform deviates", ACM Trans
360 # Math Software, 3, (1977), pp257-260.
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000361
Tim Petersd7b5e882001-01-25 03:36:26 +0000362 random = self.random
Raymond Hettinger42406e62005-04-30 09:02:51 +0000363 while 1:
Tim Peters0c9886d2001-01-15 01:18:21 +0000364 u1 = random()
Raymond Hettinger73ced7e2003-01-04 09:26:32 +0000365 u2 = 1.0 - random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000366 z = NV_MAGICCONST*(u1-0.5)/u2
367 zz = z*z/4.0
368 if zz <= -_log(u2):
369 break
370 return mu + z*sigma
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000371
Tim Peterscd804102001-01-25 20:25:57 +0000372## -------------------- lognormal distribution --------------------
Tim Petersd7b5e882001-01-25 03:36:26 +0000373
374 def lognormvariate(self, mu, sigma):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000375 """Log normal distribution.
376
377 If you take the natural logarithm of this distribution, you'll get a
378 normal distribution with mean mu and standard deviation sigma.
379 mu can have any value, and sigma must be greater than zero.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000380
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000381 """
Tim Petersd7b5e882001-01-25 03:36:26 +0000382 return _exp(self.normalvariate(mu, sigma))
383
Tim Peterscd804102001-01-25 20:25:57 +0000384## -------------------- exponential distribution --------------------
Tim Petersd7b5e882001-01-25 03:36:26 +0000385
386 def expovariate(self, lambd):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000387 """Exponential distribution.
388
389 lambd is 1.0 divided by the desired mean. (The parameter would be
390 called "lambda", but that is a reserved word in Python.) Returned
391 values range from 0 to positive infinity.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000392
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000393 """
Tim Petersd7b5e882001-01-25 03:36:26 +0000394 # lambd: rate lambd = 1/mean
395 # ('lambda' is a Python reserved word)
396
397 random = self.random
Tim Peters0c9886d2001-01-15 01:18:21 +0000398 u = random()
399 while u <= 1e-7:
400 u = random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000401 return -_log(u)/lambd
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000402
Tim Peterscd804102001-01-25 20:25:57 +0000403## -------------------- von Mises distribution --------------------
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000404
Tim Petersd7b5e882001-01-25 03:36:26 +0000405 def vonmisesvariate(self, mu, kappa):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000406 """Circular data distribution.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000407
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000408 mu is the mean angle, expressed in radians between 0 and 2*pi, and
409 kappa is the concentration parameter, which must be greater than or
410 equal to zero. If kappa is equal to zero, this distribution reduces
411 to a uniform random angle over the range 0 to 2*pi.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000412
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000413 """
Tim Petersd7b5e882001-01-25 03:36:26 +0000414 # mu: mean angle (in radians between 0 and 2*pi)
415 # kappa: concentration parameter kappa (>= 0)
416 # if kappa = 0 generate uniform random angle
417
418 # Based upon an algorithm published in: Fisher, N.I.,
419 # "Statistical Analysis of Circular Data", Cambridge
420 # University Press, 1993.
421
422 # Thanks to Magnus Kessler for a correction to the
423 # implementation of step 4.
424
425 random = self.random
426 if kappa <= 1e-6:
427 return TWOPI * random()
428
429 a = 1.0 + _sqrt(1.0 + 4.0 * kappa * kappa)
430 b = (a - _sqrt(2.0 * a))/(2.0 * kappa)
431 r = (1.0 + b * b)/(2.0 * b)
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000432
Raymond Hettinger42406e62005-04-30 09:02:51 +0000433 while 1:
Tim Peters0c9886d2001-01-15 01:18:21 +0000434 u1 = random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000435
436 z = _cos(_pi * u1)
437 f = (1.0 + r * z)/(r + z)
438 c = kappa * (r - f)
439
440 u2 = random()
441
Raymond Hettinger42406e62005-04-30 09:02:51 +0000442 if u2 < c * (2.0 - c) or u2 <= c * _exp(1.0 - c):
Tim Peters0c9886d2001-01-15 01:18:21 +0000443 break
Tim Petersd7b5e882001-01-25 03:36:26 +0000444
445 u3 = random()
446 if u3 > 0.5:
447 theta = (mu % TWOPI) + _acos(f)
448 else:
449 theta = (mu % TWOPI) - _acos(f)
450
451 return theta
452
Tim Peterscd804102001-01-25 20:25:57 +0000453## -------------------- gamma distribution --------------------
Tim Petersd7b5e882001-01-25 03:36:26 +0000454
455 def gammavariate(self, alpha, beta):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000456 """Gamma distribution. Not the gamma function!
457
458 Conditions on the parameters are alpha > 0 and beta > 0.
459
460 """
Tim Peters8ac14952002-05-23 15:15:30 +0000461
Raymond Hettingerb760efb2002-05-14 06:40:34 +0000462 # alpha > 0, beta > 0, mean is alpha*beta, variance is alpha*beta**2
Tim Peters8ac14952002-05-23 15:15:30 +0000463
Guido van Rossum570764d2002-05-14 14:08:12 +0000464 # Warning: a few older sources define the gamma distribution in terms
465 # of alpha > -1.0
466 if alpha <= 0.0 or beta <= 0.0:
Collin Winterce36ad82007-08-30 01:19:48 +0000467 raise ValueError('gammavariate: alpha and beta must be > 0.0')
Tim Peters8ac14952002-05-23 15:15:30 +0000468
Tim Petersd7b5e882001-01-25 03:36:26 +0000469 random = self.random
Tim Petersd7b5e882001-01-25 03:36:26 +0000470 if alpha > 1.0:
471
472 # Uses R.C.H. Cheng, "The generation of Gamma
473 # variables with non-integral shape parameters",
474 # Applied Statistics, (1977), 26, No. 1, p71-74
475
Raymond Hettingerca6cdc22002-05-13 23:40:14 +0000476 ainv = _sqrt(2.0 * alpha - 1.0)
477 bbb = alpha - LOG4
478 ccc = alpha + ainv
Tim Peters8ac14952002-05-23 15:15:30 +0000479
Raymond Hettinger42406e62005-04-30 09:02:51 +0000480 while 1:
Tim Petersd7b5e882001-01-25 03:36:26 +0000481 u1 = random()
Raymond Hettinger73ced7e2003-01-04 09:26:32 +0000482 if not 1e-7 < u1 < .9999999:
483 continue
484 u2 = 1.0 - random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000485 v = _log(u1/(1.0-u1))/ainv
486 x = alpha*_exp(v)
487 z = u1*u1*u2
488 r = bbb+ccc*v-x
489 if r + SG_MAGICCONST - 4.5*z >= 0.0 or r >= _log(z):
Raymond Hettingerb760efb2002-05-14 06:40:34 +0000490 return x * beta
Tim Petersd7b5e882001-01-25 03:36:26 +0000491
492 elif alpha == 1.0:
493 # expovariate(1)
494 u = random()
495 while u <= 1e-7:
496 u = random()
Raymond Hettingerb760efb2002-05-14 06:40:34 +0000497 return -_log(u) * beta
Tim Petersd7b5e882001-01-25 03:36:26 +0000498
499 else: # alpha is between 0 and 1 (exclusive)
500
501 # Uses ALGORITHM GS of Statistical Computing - Kennedy & Gentle
502
Raymond Hettinger42406e62005-04-30 09:02:51 +0000503 while 1:
Tim Petersd7b5e882001-01-25 03:36:26 +0000504 u = random()
505 b = (_e + alpha)/_e
506 p = b*u
507 if p <= 1.0:
Raymond Hettinger42406e62005-04-30 09:02:51 +0000508 x = p ** (1.0/alpha)
Tim Petersd7b5e882001-01-25 03:36:26 +0000509 else:
Tim Petersd7b5e882001-01-25 03:36:26 +0000510 x = -_log((b-p)/alpha)
511 u1 = random()
Raymond Hettinger42406e62005-04-30 09:02:51 +0000512 if p > 1.0:
513 if u1 <= x ** (alpha - 1.0):
514 break
515 elif u1 <= _exp(-x):
Tim Petersd7b5e882001-01-25 03:36:26 +0000516 break
Raymond Hettingerb760efb2002-05-14 06:40:34 +0000517 return x * beta
518
Tim Peterscd804102001-01-25 20:25:57 +0000519## -------------------- Gauss (faster alternative) --------------------
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000520
Tim Petersd7b5e882001-01-25 03:36:26 +0000521 def gauss(self, mu, sigma):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000522 """Gaussian distribution.
523
524 mu is the mean, and sigma is the standard deviation. This is
525 slightly faster than the normalvariate() function.
526
527 Not thread-safe without a lock around calls.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000528
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000529 """
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000530
Tim Petersd7b5e882001-01-25 03:36:26 +0000531 # When x and y are two variables from [0, 1), uniformly
532 # distributed, then
533 #
534 # cos(2*pi*x)*sqrt(-2*log(1-y))
535 # sin(2*pi*x)*sqrt(-2*log(1-y))
536 #
537 # are two *independent* variables with normal distribution
538 # (mu = 0, sigma = 1).
539 # (Lambert Meertens)
540 # (corrected version; bug discovered by Mike Miller, fixed by LM)
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000541
Tim Petersd7b5e882001-01-25 03:36:26 +0000542 # Multithreading note: When two threads call this function
543 # simultaneously, it is possible that they will receive the
544 # same return value. The window is very small though. To
545 # avoid this, you have to use a lock around all calls. (I
546 # didn't want to slow this down in the serial case by using a
547 # lock here.)
Guido van Rossumd03e1191998-05-29 17:51:31 +0000548
Tim Petersd7b5e882001-01-25 03:36:26 +0000549 random = self.random
550 z = self.gauss_next
551 self.gauss_next = None
552 if z is None:
553 x2pi = random() * TWOPI
554 g2rad = _sqrt(-2.0 * _log(1.0 - random()))
555 z = _cos(x2pi) * g2rad
556 self.gauss_next = _sin(x2pi) * g2rad
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000557
Tim Petersd7b5e882001-01-25 03:36:26 +0000558 return mu + z*sigma
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000559
Tim Peterscd804102001-01-25 20:25:57 +0000560## -------------------- beta --------------------
Tim Peters85e2e472001-01-26 06:49:56 +0000561## See
562## http://sourceforge.net/bugs/?func=detailbug&bug_id=130030&group_id=5470
563## for Ivan Frohne's insightful analysis of why the original implementation:
564##
565## def betavariate(self, alpha, beta):
566## # Discrete Event Simulation in C, pp 87-88.
567##
568## y = self.expovariate(alpha)
569## z = self.expovariate(1.0/beta)
570## return z/(y+z)
571##
572## was dead wrong, and how it probably got that way.
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000573
Tim Petersd7b5e882001-01-25 03:36:26 +0000574 def betavariate(self, alpha, beta):
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000575 """Beta distribution.
576
Thomas Woutersb2137042007-02-01 18:02:27 +0000577 Conditions on the parameters are alpha > 0 and beta > 0.
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000578 Returned values range between 0 and 1.
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000579
Raymond Hettingerc32f0332002-05-23 19:44:49 +0000580 """
Raymond Hettingeref4d4bd2002-05-23 23:58:17 +0000581
Tim Peters85e2e472001-01-26 06:49:56 +0000582 # This version due to Janne Sinkkonen, and matches all the std
583 # texts (e.g., Knuth Vol 2 Ed 3 pg 134 "the beta distribution").
584 y = self.gammavariate(alpha, 1.)
585 if y == 0:
586 return 0.0
587 else:
588 return y / (y + self.gammavariate(beta, 1.))
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000589
Tim Peterscd804102001-01-25 20:25:57 +0000590## -------------------- Pareto --------------------
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000591
def paretovariate(self, alpha):
    """Return a Pareto-distributed variate; alpha is the shape parameter."""
    # Formula from Jain, pg. 495.
    # Using 1 - random() as the base keeps it away from zero, assuming
    # random() yields values in [0.0, 1.0).
    base = 1.0 - self.random()
    exponent = 1.0 / alpha
    return 1.0 / (base ** exponent)
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000598
Tim Peterscd804102001-01-25 20:25:57 +0000599## -------------------- Weibull --------------------
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000600
def weibullvariate(self, alpha, beta):
    """Return a sample from the Weibull distribution.

    alpha is the scale parameter and beta is the shape parameter.

    """
    # Formula from Jain, pg. 499; bug fix courtesy Bill Arms.
    # 1 - random() is used so the argument of the logarithm stays
    # non-zero, assuming random() yields values in [0.0, 1.0).
    complement = 1.0 - self.random()
    return alpha * (-_log(complement)) ** (1.0 / beta)
Guido van Rossum6c395ba1999-08-18 13:53:28 +0000611
Raymond Hettinger23f12412004-09-13 22:23:21 +0000612## --------------- Operating System Random Source ------------------
Raymond Hettinger356a4592004-08-30 06:14:31 +0000613
class SystemRandom(Random):
    """Random number generator fed by the operating system.

    Randomness comes from OS-provided sources (such as /dev/urandom on
    Unix or CryptGenRandom on Windows) instead of a seeded algorithm, so
    the generator keeps no reproducible state.

    Not available on all systems (see os.urandom() for details).
    """

    def random(self):
        """Get the next random number in the range [0.0, 1.0)."""
        # Seven bytes give 56 random bits; the low 3 are discarded before
        # scaling by RECIP_BPF (defined elsewhere in this module;
        # presumably 2**-53 -- confirm).
        raw = int(_hexlify(_urandom(7)), 16)
        return (raw >> 3) * RECIP_BPF

    def getrandbits(self, k):
        """getrandbits(k) -> x.  Generates an int with k random bits."""
        if k <= 0:
            raise ValueError('number of bits must be greater than zero')
        if k != int(k):
            raise TypeError('number of bits should be an integer')
        # Fetch whole bytes (bits / 8, rounded up), then shift away the
        # bits that were not asked for.
        nbytes = (k + 7) // 8
        raw = int(_hexlify(_urandom(nbytes)), 16)
        surplus = nbytes * 8 - k
        return raw >> surplus

    def seed(self, *args, **kwds):
        "Stub method.  Not used for a system random number generator."
        return None

    def _notimplemented(self, *args, **kwds):
        "Method should not be called for a system random number generator."
        raise NotImplementedError('System entropy source does not have state.')

    # Both state accessors share the same refusing implementation.
    getstate = _notimplemented
    setstate = _notimplemented
644
Tim Peterscd804102001-01-25 20:25:57 +0000645## -------------------- test program --------------------
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000646
Raymond Hettinger62297132003-08-30 01:24:19 +0000647def _test_generator(n, func, args):
Tim Peters0c9886d2001-01-15 01:18:21 +0000648 import time
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000649 print(n, 'times', func.__name__)
Raymond Hettingerb98154e2003-05-24 17:26:02 +0000650 total = 0.0
Tim Peters0c9886d2001-01-15 01:18:21 +0000651 sqsum = 0.0
652 smallest = 1e10
653 largest = -1e10
654 t0 = time.time()
655 for i in range(n):
Raymond Hettinger62297132003-08-30 01:24:19 +0000656 x = func(*args)
Raymond Hettingerb98154e2003-05-24 17:26:02 +0000657 total += x
Tim Peters0c9886d2001-01-15 01:18:21 +0000658 sqsum = sqsum + x*x
659 smallest = min(x, smallest)
660 largest = max(x, largest)
661 t1 = time.time()
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000662 print(round(t1-t0, 3), 'sec,', end=' ')
Raymond Hettingerb98154e2003-05-24 17:26:02 +0000663 avg = total/n
Tim Petersd7b5e882001-01-25 03:36:26 +0000664 stddev = _sqrt(sqsum/n - avg*avg)
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000665 print('avg %g, stddev %g, min %g, max %g' % \
666 (avg, stddev, smallest, largest))
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000667
Raymond Hettingerf24eb352002-11-12 17:41:57 +0000668
def _test(N=2000):
    """Run _test_generator with N samples for each distribution below.

    Cases run in the listed order; each entry pairs a module-level
    sampling function with the positional arguments passed to it.
    """
    cases = (
        (random, ()),
        (normalvariate, (0.0, 1.0)),
        (lognormvariate, (0.0, 1.0)),
        (vonmisesvariate, (0.0, 1.0)),
        (gammavariate, (0.01, 1.0)),
        (gammavariate, (0.1, 1.0)),
        (gammavariate, (0.1, 2.0)),
        (gammavariate, (0.5, 1.0)),
        (gammavariate, (0.9, 1.0)),
        (gammavariate, (1.0, 1.0)),
        (gammavariate, (2.0, 1.0)),
        (gammavariate, (20.0, 1.0)),
        (gammavariate, (200.0, 1.0)),
        (gauss, (0.0, 1.0)),
        (betavariate, (3.0, 3.0)),
    )
    for sampler, params in cases:
        _test_generator(N, sampler, params)
Tim Peterscd804102001-01-25 20:25:57 +0000685
# Create one shared instance (seeded however Random() seeds itself when
# called without arguments) and export its bound methods as module-level
# functions.  The functions share state across all uses (both in the
# user's code and in the Python libraries), but that's fine for most
# programs and is easier for the casual user than making them
# instantiate their own Random() instance.

_inst = Random()
seed = _inst.seed
random = _inst.random
uniform = _inst.uniform
randint = _inst.randint
choice = _inst.choice
randrange = _inst.randrange
sample = _inst.sample
shuffle = _inst.shuffle
normalvariate = _inst.normalvariate
lognormvariate = _inst.lognormvariate
expovariate = _inst.expovariate
vonmisesvariate = _inst.vonmisesvariate
gammavariate = _inst.gammavariate
gauss = _inst.gauss
betavariate = _inst.betavariate
paretovariate = _inst.paretovariate
weibullvariate = _inst.weibullvariate
getstate = _inst.getstate
setstate = _inst.setstate
getrandbits = _inst.getrandbits

# When the module is executed as a script, run the self-test via _test().
if __name__ == '__main__':
    _test()