-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdistribution.py
executable file
·89 lines (72 loc) · 2.79 KB
/
distribution.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
#! /usr/bin/env python
# -*- coding: utf-8 -*-
import scipy.integrate as inte
import numpy as np
import matplotlib.pyplot as plt
import scipy.interpolate as interpol
class Distribution( object ):
"""distribution(func, a, b)
A distribution object represents a probability distribution, the provided function is taken as the
probability density function and an cumulative density function and its inverse are calculated. `a` and
`b` are taken as the lower and the upper bound respectively.
`func` need not to be normalized
Parameters
----------
func function:
specifies the probability density function of the distribution
a float:
specifies the lower bound of the distribution
b float:
specifies the upper bound of the distribution
Members
----------
pdf():
returns the probability density function, takes a float as an argument
cdf():
returns the cumulative probability density function, takes a float as an argument
ppf():
returns the inverse cumulative probability funciton, takes a float as an argument
norm():
returns the normalisation factor (integral over pdf)
sample(int n):
returns an array of n sampled values
mean():
returns the mean value of the distribution
_lowerbound:
lowerbound of the distribution
_upperbound:
upperbound of the distribution
"""
def __init__(self, func = lambda x: 1, a = 0., b = 1000.):
self._pdf = func
self._lowerbound = a
self._upperbound = b
self.cdf_init(self._lowerbound, self._upperbound)
self._norm = self.cdf()(self._upperbound)
t, step = np.linspace(self._lowerbound, self._upperbound, 10000, endpoint=True, retstep=True)
y = [step*( self.cdf()(t[i]) + self.cdf()(t[i+1]) )/2. for i in (range(t.size - 1))]
self._mean = self._upperbound - sum(y)/self._norm
def pdf(self):
return self._pdf
def cdf_init(self, a, b):
t, step = np.linspace(a, b, 10000, endpoint=True, retstep=True)
y = np.array(t)
y[0], i = 0, 0
for i in (range(t.size - 1)):
y[i+1] = y[i] + step*( self.pdf()(t[i]) + self.pdf()(t[i+1]) )/2
self._x, self._y = t, y
def cdf(self):
return interpol.interp1d(self._x, self._y)
def ppf(self): # inverse cdf
return interpol.interp1d(self._y, self._x)
def norm(self):
return self._norm
def sample(self, n=1):
if n==1:
t = np.random.uniform(0,self.norm())
return self.ppf()(t)
else:
t = np.random.uniform(0,self.norm(),n)
return self.ppf()(t)
def mean(self):
return self._mean