-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathscde.py
181 lines (142 loc) · 5.55 KB
/
scde.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
"""
Module scde provides methods to compute self-consistent density estimations.
(see
https://yketa.github.io/UBC_2018_Wiki/#Self-consistent%20density%20estimation)
(Taken from https://github.com/yketa/active_particles/blob/master/scde.py)
"""
import numpy as np
from scipy.interpolate import griddata
from fastkde import fastKDE
from multiprocessing import Pool
from itertools import product
from functools import partial
from operator import itemgetter
class PDF:
"""
Compute and manipulate probability density functions computed via
self-consistent density estimation.
"""
def __init__(self, *vars, renormalise=True, **fastKDE_kwargs):
"""
Compute probability density function.
(see fastkde.fastKDE.pdf)
NOTE: Coordinates in self.axes are in the same order as the input
variables while it is in reversed order in self.pdf (see
fastkde.fastKDE.pdf).
See active_particles.scde.PDF.evaluate for probability density
function evaluation.
Positional arguments
--------------------
vars : array-like
Input variables.
Parameters
----------
renormalise : bool
Rescale probability density function values by the integral over
the computed volume.
DEFAULT: True
Optional keyword arguments
--------------------------
(see fastkde.fastKDE.pdf)
"""
self.vars = vars
self.n = len(self.vars)
self.fastKDE_kwargs = fastKDE_kwargs
self.pdf, self.axes = fastKDE.pdf(*self.vars, **self.fastKDE_kwargs)
if self.n == 1: self.axes = [np.array(self.axes)]
self._extended_axes()
if renormalise: self.renormalise()
def evaluate(self, *coordinates, method='linear', fill_value=0,
processes=None):
"""
Evaluate interpolated probability density function from evaluated
points.
NOTE: As a matter of efficiency, probability density function at
coordinates is evaluated with a pool of worker processes. (see
multiprocessing.Pool and multiprocessing.Pool.starmap)
Parameters
----------
method : string
Method of interpolation. (see scipy.interpolate.griddata)
DEFAULT: linear
fill_value : float
Value used to fill in for requested points outside of the convex
hull of the input points. (see scipy.interpolate.griddata)
DEFAULT: 0
processes : int
Number of worker processes to use. (see multiprocessing.Pool)
NOTE: If processes == None then processes = os.cpu_count().
DEFAULT: None
Positional arguments
--------------------
coordinates : (self.n,) array-like
Coordinates at which to evaluate the interpolated probability
density function.
Returns
-------
pdfs : (len(coordinates),) array-like
Interpolated probability density function at coordinates.
"""
pdf_flat, extended_axes_flat = self._flat()
with Pool(processes=processes) as pool: # pool of worker processes
pdfs = pool.starmap(
partial(griddata, method=method, fill_value=fill_value),
product([extended_axes_flat], [pdf_flat],
np.array(coordinates)[:, ::-1]))
return np.array(pdfs).flatten()
def integrate(self, apply_func=None):
"""
Integrate apply_func(pdf) over the whole computed volume.
Parameters
----------
apply_func : function
Function to apply to the probability density function.
NOTE: If apply_func == None, then apply_func = lambda x: x.
DEFAULT: None
Returns
-------
integral : float
Integrated probability density function.
"""
if apply_func == None: apply_func = lambda x: x
integral = apply_func(self.pdf)
for ax in range(self.n):
integral = np.trapz(integral, self.axes[-ax-1], axis=0)
return integral
def entropy(self):
"""
Returns the Shannon entropy of the distribution.
Returns
-------
entropy : float
Shannon entropy of the distribution.
"""
return self.integrate(apply_func=
lambda x: - x * np.ma.log(x).filled(0))
def renormalise(self):
"""
Rescale probability density function values self.pdf by the integral
over the the computed volume.
"""
self.pdf /= self.integrate(apply_func=lambda x: x)
def _extended_axes(self):
"""
Sets self.extended_axes as self.axes coordinates in extended form.
"""
self.extended_axes = np.empty(self.pdf.shape + (self.n,)) # extended points coordinates at which the probability density function is evaluated
for ind in np.ndindex(self.pdf.shape):
self.extended_axes[ind] = [self.axes[-i-1][ind[i]]
for i in range(self.n)]
def _flat(self):
"""
Returns flat self.pdf and self.extended_axes.
Returns
-------
pdf_flat : (np.prod(self.pdf.shape),) Numpy array
Flat self.pdf.
extended_axes_flat : (np.prod(self.pdf.shape), self.n) Numpy array
Flat self.extended_axes.
"""
pdf_flat = self.pdf.flatten()
extended_axes_flat = self.extended_axes.reshape((-1, len(self.axes)))
return pdf_flat, extended_axes_flat