blob: a818f732af22acf590950e9b05f6a393ec93fa23 [file] [log] [blame]
Guido van Rossume7b146f2000-02-04 15:28:42 +00001"""Random variable generators.
Guido van Rossumff03b1a1994-03-09 12:55:02 +00002
Tim Petersd7b5e882001-01-25 03:36:26 +00003 integers
4 --------
5 uniform within range
6
7 sequences
8 ---------
9 pick random element
10 generate random permutation
11
Guido van Rossume7b146f2000-02-04 15:28:42 +000012 distributions on the real line:
13 ------------------------------
Tim Petersd7b5e882001-01-25 03:36:26 +000014 uniform
Guido van Rossume7b146f2000-02-04 15:28:42 +000015 normal (Gaussian)
16 lognormal
17 negative exponential
18 gamma
19 beta
Guido van Rossumff03b1a1994-03-09 12:55:02 +000020
Guido van Rossume7b146f2000-02-04 15:28:42 +000021 distributions on the circle (angles 0 to 2pi)
22 ---------------------------------------------
23 circular uniform
24 von Mises
25
26Translated from anonymously contributed C/C++ source.
27
28Multi-threading note: the random number generator used here is not
29thread-safe; it is possible that two calls return the same random
Tim Petersd7b5e882001-01-25 03:36:26 +000030value.
Guido van Rossume7b146f2000-02-04 15:28:42 +000031"""
Tim Petersd7b5e882001-01-25 03:36:26 +000032# XXX The docstring sucks.
Guido van Rossumd03e1191998-05-29 17:51:31 +000033
Tim Petersd7b5e882001-01-25 03:36:26 +000034from math import log as _log, exp as _exp, pi as _pi, e as _e
35from math import sqrt as _sqrt, acos as _acos, cos as _cos, sin as _sin
Guido van Rossumff03b1a1994-03-09 12:55:02 +000036
Tim Petersd7b5e882001-01-25 03:36:26 +000037def _verify(name, expected):
Tim Peters0c9886d2001-01-15 01:18:21 +000038 computed = eval(name)
39 if abs(computed - expected) > 1e-7:
Tim Petersd7b5e882001-01-25 03:36:26 +000040 raise ValueError(
41 "computed value for %s deviates too much "
42 "(computed %g, expected %g)" % (name, computed, expected))
43
44NV_MAGICCONST = 4 * _exp(-0.5)/_sqrt(2.0)
45_verify('NV_MAGICCONST', 1.71552776992141)
46
47TWOPI = 2.0*_pi
48_verify('TWOPI', 6.28318530718)
49
50LOG4 = _log(4.0)
51_verify('LOG4', 1.38629436111989)
52
53SG_MAGICCONST = 1.0 + _log(4.5)
54_verify('SG_MAGICCONST', 2.50407739677627)
55
56del _verify
57
58# Translated by Guido van Rossum from C source provided by
59# Adrian Baddeley.
60
61class Random:
62
63 VERSION = 1 # used by getstate/setstate
64
65 def __init__(self, x=None):
66 """Initialize an instance.
67
68 Optional argument x controls seeding, as for Random.seed().
69 """
70
71 self.seed(x)
72 self.gauss_next = None
73
74 # Specific to Wichmann-Hill generator. Subclasses wishing to use a
75 # different core generator should override seed(), random(), getstate()
76 # and setstate().
77
78 def __whseed(self, x=0, y=0, z=0):
79 """Set the Wichmann-Hill seed from (x, y, z).
80
81 These must be integers in the range [0, 256).
82 """
83
84 if not type(x) == type(y) == type(z) == type(0):
85 raise TypeError('seeds must be integers')
86 if not (0 <= x < 256 and 0 <= y < 256 and 0 <= z < 256):
87 raise ValueError('seeds must be in range(0, 256)')
88 if 0 == x == y == z:
89 # Initialize from current time
90 import time
91 t = long(time.time()) * 256
92 t = int((t&0xffffff) ^ (t>>24))
93 t, x = divmod(t, 256)
94 t, y = divmod(t, 256)
95 t, z = divmod(t, 256)
96 # Zero is a poor seed, so substitute 1
97 self._seed = (x or 1, y or 1, z or 1)
98
99 def seed(self, a=None):
100 """Seed from hashable value
101
102 None or no argument seeds from current time.
103 """
104
105 if a is None:
106 self.__whseed()
107 a = hash(a)
108 a, x = divmod(a, 256)
109 a, y = divmod(a, 256)
110 a, z = divmod(a, 256)
111 x = (x + a) % 256 or 1
112 y = (y + a) % 256 or 1
113 z = (z + a) % 256 or 1
114 self.__whseed(x, y, z)
115
116 def getstate(self):
117 """Return internal state; can be passed to setstate() later."""
118
119 return self.VERSION, self._seed, self.gauss_next
120
121 def __getstate__(self): # for pickle
122 self.getstate()
123
124 def setstate(self, state):
125 """Restore internal state from object returned by getstate()."""
126 version = state[0]
127 if version == 1:
128 version, self._seed, self.gauss_next = state
129 else:
130 raise ValueError("state with version %s passed to "
131 "Random.setstate() of version %s" %
132 (version, self.VERSION))
133
134 def __setstate__(self, state): # for pickle
135 self.setstate(state)
136
137 def random(self):
138 """Get the next random number in the range [0.0, 1.0)."""
139
140 # Wichman-Hill random number generator.
141 #
142 # Wichmann, B. A. & Hill, I. D. (1982)
143 # Algorithm AS 183:
144 # An efficient and portable pseudo-random number generator
145 # Applied Statistics 31 (1982) 188-190
146 #
147 # see also:
148 # Correction to Algorithm AS 183
149 # Applied Statistics 33 (1984) 123
150 #
151 # McLeod, A. I. (1985)
152 # A remark on Algorithm AS 183
153 # Applied Statistics 34 (1985),198-200
154
155 # This part is thread-unsafe:
156 # BEGIN CRITICAL SECTION
157 x, y, z = self._seed
158 x = (171 * x) % 30269
159 y = (172 * y) % 30307
160 z = (170 * z) % 30323
161 self._seed = x, y, z
162 # END CRITICAL SECTION
163
164 # Note: on a platform using IEEE-754 double arithmetic, this can
165 # never return 0.0 (asserted by Tim; proof too long for a comment).
166 return (x/30269.0 + y/30307.0 + z/30323.0) % 1.0
167
168 def randrange(self, start, stop=None, step=1, int=int, default=None):
169 """Choose a random item from range(start, stop[, step]).
170
171 This fixes the problem with randint() which includes the
172 endpoint; in Python this is usually not what you want.
173 Do not supply the 'int' and 'default' arguments.
174 """
175
176 # This code is a bit messy to make it fast for the
177 # common case while still doing adequate error checking
178 istart = int(start)
179 if istart != start:
180 raise ValueError, "non-integer arg 1 for randrange()"
181 if stop is default:
182 if istart > 0:
183 return int(self.random() * istart)
184 raise ValueError, "empty range for randrange()"
185 istop = int(stop)
186 if istop != stop:
187 raise ValueError, "non-integer stop for randrange()"
188 if step == 1:
189 if istart < istop:
190 return istart + int(self.random() *
191 (istop - istart))
192 raise ValueError, "empty range for randrange()"
193 istep = int(step)
194 if istep != step:
195 raise ValueError, "non-integer step for randrange()"
196 if istep > 0:
197 n = (istop - istart + istep - 1) / istep
198 elif istep < 0:
199 n = (istop - istart + istep + 1) / istep
200 else:
201 raise ValueError, "zero step for randrange()"
202
203 if n <= 0:
204 raise ValueError, "empty range for randrange()"
205 return istart + istep*int(self.random() * n)
206
207 def randint(self, a, b):
208 """Get a random integer in the range [a, b] including
209 both end points.
210
211 (Deprecated; use randrange below.)
212 """
213
214 return self.randrange(a, b+1)
215
216 def choice(self, seq):
217 """Choose a random element from a non-empty sequence."""
218 return seq[int(self.random() * len(seq))]
219
220 def shuffle(self, x, random=None, int=int):
221 """x, random=random.random -> shuffle list x in place; return None.
222
223 Optional arg random is a 0-argument function returning a random
224 float in [0.0, 1.0); by default, the standard random.random.
225
226 Note that for even rather small len(x), the total number of
227 permutations of x is larger than the period of most random number
228 generators; this implies that "most" permutations of a long
229 sequence can never be generated.
230 """
231
232 if random is None:
233 random = self.random
234 for i in xrange(len(x)-1, 0, -1):
235 # pick an element in x[:i+1] with which to exchange x[i]
236 j = int(random() * (i+1))
237 x[i], x[j] = x[j], x[i]
238
239# -------------------- uniform distribution -------------------
240
241 def uniform(self, a, b):
242 """Get a random number in the range [a, b)."""
243 return a + (b-a) * self.random()
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000244
245# -------------------- normal distribution --------------------
246
Tim Petersd7b5e882001-01-25 03:36:26 +0000247 def normalvariate(self, mu, sigma):
248 # mu = mean, sigma = standard deviation
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000249
Tim Petersd7b5e882001-01-25 03:36:26 +0000250 # Uses Kinderman and Monahan method. Reference: Kinderman,
251 # A.J. and Monahan, J.F., "Computer generation of random
252 # variables using the ratio of uniform deviates", ACM Trans
253 # Math Software, 3, (1977), pp257-260.
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000254
Tim Petersd7b5e882001-01-25 03:36:26 +0000255 random = self.random
Tim Peters0c9886d2001-01-15 01:18:21 +0000256 while 1:
257 u1 = random()
258 u2 = random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000259 z = NV_MAGICCONST*(u1-0.5)/u2
260 zz = z*z/4.0
261 if zz <= -_log(u2):
262 break
263 return mu + z*sigma
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000264
Tim Petersd7b5e882001-01-25 03:36:26 +0000265# -------------------- lognormal distribution --------------------
266
267 def lognormvariate(self, mu, sigma):
268 return _exp(self.normalvariate(mu, sigma))
269
270# -------------------- circular uniform --------------------
271
272 def cunifvariate(self, mean, arc):
273 # mean: mean angle (in radians between 0 and pi)
274 # arc: range of distribution (in radians between 0 and pi)
275
276 return (mean + arc * (self.random() - 0.5)) % _pi
277
278# -------------------- exponential distribution --------------------
279
280 def expovariate(self, lambd):
281 # lambd: rate lambd = 1/mean
282 # ('lambda' is a Python reserved word)
283
284 random = self.random
Tim Peters0c9886d2001-01-15 01:18:21 +0000285 u = random()
286 while u <= 1e-7:
287 u = random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000288 return -_log(u)/lambd
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000289
Tim Petersd7b5e882001-01-25 03:36:26 +0000290# -------------------- von Mises distribution --------------------
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000291
Tim Petersd7b5e882001-01-25 03:36:26 +0000292 def vonmisesvariate(self, mu, kappa):
293 # mu: mean angle (in radians between 0 and 2*pi)
294 # kappa: concentration parameter kappa (>= 0)
295 # if kappa = 0 generate uniform random angle
296
297 # Based upon an algorithm published in: Fisher, N.I.,
298 # "Statistical Analysis of Circular Data", Cambridge
299 # University Press, 1993.
300
301 # Thanks to Magnus Kessler for a correction to the
302 # implementation of step 4.
303
304 random = self.random
305 if kappa <= 1e-6:
306 return TWOPI * random()
307
308 a = 1.0 + _sqrt(1.0 + 4.0 * kappa * kappa)
309 b = (a - _sqrt(2.0 * a))/(2.0 * kappa)
310 r = (1.0 + b * b)/(2.0 * b)
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000311
Tim Peters0c9886d2001-01-15 01:18:21 +0000312 while 1:
Tim Peters0c9886d2001-01-15 01:18:21 +0000313 u1 = random()
Tim Petersd7b5e882001-01-25 03:36:26 +0000314
315 z = _cos(_pi * u1)
316 f = (1.0 + r * z)/(r + z)
317 c = kappa * (r - f)
318
319 u2 = random()
320
321 if not (u2 >= c * (2.0 - c) and u2 > c * _exp(1.0 - c)):
Tim Peters0c9886d2001-01-15 01:18:21 +0000322 break
Tim Petersd7b5e882001-01-25 03:36:26 +0000323
324 u3 = random()
325 if u3 > 0.5:
326 theta = (mu % TWOPI) + _acos(f)
327 else:
328 theta = (mu % TWOPI) - _acos(f)
329
330 return theta
331
332# -------------------- gamma distribution --------------------
333
334 def gammavariate(self, alpha, beta):
335 # beta times standard gamma
336 ainv = _sqrt(2.0 * alpha - 1.0)
337 return beta * self.stdgamma(alpha, ainv, alpha - LOG4, alpha + ainv)
338
339 def stdgamma(self, alpha, ainv, bbb, ccc):
340 # ainv = sqrt(2 * alpha - 1)
341 # bbb = alpha - log(4)
342 # ccc = alpha + ainv
343
344 random = self.random
345 if alpha <= 0.0:
346 raise ValueError, 'stdgamma: alpha must be > 0.0'
347
348 if alpha > 1.0:
349
350 # Uses R.C.H. Cheng, "The generation of Gamma
351 # variables with non-integral shape parameters",
352 # Applied Statistics, (1977), 26, No. 1, p71-74
353
354 while 1:
355 u1 = random()
356 u2 = random()
357 v = _log(u1/(1.0-u1))/ainv
358 x = alpha*_exp(v)
359 z = u1*u1*u2
360 r = bbb+ccc*v-x
361 if r + SG_MAGICCONST - 4.5*z >= 0.0 or r >= _log(z):
362 return x
363
364 elif alpha == 1.0:
365 # expovariate(1)
366 u = random()
367 while u <= 1e-7:
368 u = random()
369 return -_log(u)
370
371 else: # alpha is between 0 and 1 (exclusive)
372
373 # Uses ALGORITHM GS of Statistical Computing - Kennedy & Gentle
374
375 while 1:
376 u = random()
377 b = (_e + alpha)/_e
378 p = b*u
379 if p <= 1.0:
380 x = pow(p, 1.0/alpha)
381 else:
382 # p > 1
383 x = -_log((b-p)/alpha)
384 u1 = random()
385 if not (((p <= 1.0) and (u1 > _exp(-x))) or
386 ((p > 1) and (u1 > pow(x, alpha - 1.0)))):
387 break
388 return x
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000389
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000390
391# -------------------- Gauss (faster alternative) --------------------
392
Tim Petersd7b5e882001-01-25 03:36:26 +0000393 def gauss(self, mu, sigma):
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000394
Tim Petersd7b5e882001-01-25 03:36:26 +0000395 # When x and y are two variables from [0, 1), uniformly
396 # distributed, then
397 #
398 # cos(2*pi*x)*sqrt(-2*log(1-y))
399 # sin(2*pi*x)*sqrt(-2*log(1-y))
400 #
401 # are two *independent* variables with normal distribution
402 # (mu = 0, sigma = 1).
403 # (Lambert Meertens)
404 # (corrected version; bug discovered by Mike Miller, fixed by LM)
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000405
Tim Petersd7b5e882001-01-25 03:36:26 +0000406 # Multithreading note: When two threads call this function
407 # simultaneously, it is possible that they will receive the
408 # same return value. The window is very small though. To
409 # avoid this, you have to use a lock around all calls. (I
410 # didn't want to slow this down in the serial case by using a
411 # lock here.)
Guido van Rossumd03e1191998-05-29 17:51:31 +0000412
Tim Petersd7b5e882001-01-25 03:36:26 +0000413 random = self.random
414 z = self.gauss_next
415 self.gauss_next = None
416 if z is None:
417 x2pi = random() * TWOPI
418 g2rad = _sqrt(-2.0 * _log(1.0 - random()))
419 z = _cos(x2pi) * g2rad
420 self.gauss_next = _sin(x2pi) * g2rad
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000421
Tim Petersd7b5e882001-01-25 03:36:26 +0000422 return mu + z*sigma
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000423
424# -------------------- beta --------------------
425
Tim Petersd7b5e882001-01-25 03:36:26 +0000426 def betavariate(self, alpha, beta):
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000427
Tim Petersd7b5e882001-01-25 03:36:26 +0000428 # Discrete Event Simulation in C, pp 87-88.
Guido van Rossumcc32ac91994-03-15 16:10:24 +0000429
Tim Petersd7b5e882001-01-25 03:36:26 +0000430 y = self.expovariate(alpha)
431 z = self.expovariate(1.0/beta)
432 return z/(y+z)
Guido van Rossum95bfcda1994-03-09 14:21:05 +0000433
Guido van Rossum5bdea891997-12-09 19:43:18 +0000434# -------------------- Pareto --------------------
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000435
Tim Petersd7b5e882001-01-25 03:36:26 +0000436 def paretovariate(self, alpha):
437 # Jain, pg. 495
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000438
Tim Petersd7b5e882001-01-25 03:36:26 +0000439 u = self.random()
440 return 1.0 / pow(u, 1.0/alpha)
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000441
Guido van Rossum5bdea891997-12-09 19:43:18 +0000442# -------------------- Weibull --------------------
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000443
Tim Petersd7b5e882001-01-25 03:36:26 +0000444 def weibullvariate(self, alpha, beta):
445 # Jain, pg. 499; bug fix courtesy Bill Arms
Guido van Rossumcf4559a1997-12-02 02:47:39 +0000446
Tim Petersd7b5e882001-01-25 03:36:26 +0000447 u = self.random()
448 return alpha * pow(-_log(u), 1.0/beta)
Guido van Rossum6c395ba1999-08-18 13:53:28 +0000449
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000450# -------------------- test program --------------------
451
Tim Petersd7b5e882001-01-25 03:36:26 +0000452def _test_generator(n, funccall):
Tim Peters0c9886d2001-01-15 01:18:21 +0000453 import time
454 print n, 'times', funccall
455 code = compile(funccall, funccall, 'eval')
456 sum = 0.0
457 sqsum = 0.0
458 smallest = 1e10
459 largest = -1e10
460 t0 = time.time()
461 for i in range(n):
462 x = eval(code)
463 sum = sum + x
464 sqsum = sqsum + x*x
465 smallest = min(x, smallest)
466 largest = max(x, largest)
467 t1 = time.time()
468 print round(t1-t0, 3), 'sec,',
469 avg = sum/n
Tim Petersd7b5e882001-01-25 03:36:26 +0000470 stddev = _sqrt(sqsum/n - avg*avg)
Tim Peters0c9886d2001-01-15 01:18:21 +0000471 print 'avg %g, stddev %g, min %g, max %g' % \
472 (avg, stddev, smallest, largest)
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000473
Tim Petersd7b5e882001-01-25 03:36:26 +0000474def _test(N=200):
475 print 'TWOPI =', TWOPI
476 print 'LOG4 =', LOG4
477 print 'NV_MAGICCONST =', NV_MAGICCONST
478 print 'SG_MAGICCONST =', SG_MAGICCONST
479 _test_generator(N, 'random()')
480 _test_generator(N, 'normalvariate(0.0, 1.0)')
481 _test_generator(N, 'lognormvariate(0.0, 1.0)')
482 _test_generator(N, 'cunifvariate(0.0, 1.0)')
483 _test_generator(N, 'expovariate(1.0)')
484 _test_generator(N, 'vonmisesvariate(0.0, 1.0)')
485 _test_generator(N, 'gammavariate(0.5, 1.0)')
486 _test_generator(N, 'gammavariate(0.9, 1.0)')
487 _test_generator(N, 'gammavariate(1.0, 1.0)')
488 _test_generator(N, 'gammavariate(2.0, 1.0)')
489 _test_generator(N, 'gammavariate(20.0, 1.0)')
490 _test_generator(N, 'gammavariate(200.0, 1.0)')
491 _test_generator(N, 'gauss(0.0, 1.0)')
492 _test_generator(N, 'betavariate(3.0, 3.0)')
493 _test_generator(N, 'paretovariate(1.0)')
494 _test_generator(N, 'weibullvariate(1.0, 1.0)')
495
496# Initialize from current time.
497_inst = Random()
498seed = _inst.seed
499random = _inst.random
500uniform = _inst.uniform
501randint = _inst.randint
502choice = _inst.choice
503randrange = _inst.randrange
504shuffle = _inst.shuffle
505normalvariate = _inst.normalvariate
506lognormvariate = _inst.lognormvariate
507cunifvariate = _inst.cunifvariate
508expovariate = _inst.expovariate
509vonmisesvariate = _inst.vonmisesvariate
510gammavariate = _inst.gammavariate
511stdgamma = _inst.stdgamma
512gauss = _inst.gauss
513betavariate = _inst.betavariate
514paretovariate = _inst.paretovariate
515weibullvariate = _inst.weibullvariate
516getstate = _inst.getstate
517setstate = _inst.setstate
518
Guido van Rossumff03b1a1994-03-09 12:55:02 +0000519if __name__ == '__main__':
Tim Petersd7b5e882001-01-25 03:36:26 +0000520 _test()