-
Notifications
You must be signed in to change notification settings - Fork 3
/
cf.py
267 lines (212 loc) · 8.01 KB
/
cf.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
'''
A simple 2PCF, using a particle grid and N^2
Layout
------
- `_do_cell_pair()` contains the core computation;
- `_2pcf()` contains the loop over cell pairs;
- `numba_2pcf()` is the main entry point.
'''
import numpy as np
import numba as nb
import astropy.table
from astropy.table import Table
from . import particle_grid
__all__ = ['numba_2pcf', 'jackknife']
_fastmath = True
_parallel = True
@nb.njit(fastmath=_fastmath)
def _do_cell_pair(pos1, pos2, Rmax, nbin, Xoff, npairs):
'''Compute a statistic on a pair of cells, applying
offset `Xoff` to account for the periodic wrap.
'''
dtype = pos1.dtype
inv_bw = dtype.type(nbin/Rmax)
Rmax2 = Rmax*Rmax
N1,N2 = len(pos1), len(pos2)
for i in range(N1):
p1 = pos1[i]
for j in range(N2):
p2 = pos2[j]
# Early exit conditions
# TODO: could exploit cell sorting better
zdiff = np.abs(p1[2] - p2[2] + Xoff[2])
if zdiff > Rmax:
continue
ydiff = np.abs(p1[1] - p2[1] + Xoff[1])
if ydiff > Rmax:
continue
xdiff = np.abs(p1[0] - p2[0] + Xoff[0])
if xdiff > Rmax:
continue
r2 = xdiff**2 + ydiff**2 + zdiff**2
if r2 > Rmax2:
continue
r = np.sqrt(r2)
b = int(r*inv_bw)
npairs[b] += 1
@nb.njit(parallel=_parallel,fastmath=_fastmath)
def _2pcf(psort, offsets, ngrid, box, Rmax, nbin):
'''Loop over all pairs of neighboring cells in parallel,
accumulating a pair-wise statistic like the 2PCF.
'''
dtype = psort.dtype
ncell = np.prod(ngrid)
s = offsets # length ngrid^3 + 1
nw = np.array([3,3,3]) # neighbor width
nneigh = np.prod(nw)
pad = 8 # pad each thread's workspace for performance
nthread = nb.get_num_threads()
thread_npairs = np.zeros((nthread,nbin+pad), dtype=np.int64)
# loop over cell pairs
for cpair in nb.prange(ncell*nneigh):
t = nb.np.ufunc.parallel._get_thread_id()
c = cpair // nneigh # 1d primary cell index
off1d = cpair % nneigh # 0..26
nprimary = s[c+1] - s[c]
if nprimary == 0: # optimize the case of sparse cells
continue
# global neighbor index
c3d = _1d_to_3d(c,ngrid)
off3d = _1d_to_3d(off1d,nw)
d3d = c3d + off3d - 1
# periodic neighbor index wrap
Xoff = np.zeros(3, dtype=dtype)
for j in range(3):
if d3d[j] >= ngrid[j]:
d3d[j] -= ngrid[j]
Xoff[j] -= box
if d3d[j] < 0:
d3d[j] += ngrid[j]
Xoff[j] += box
# 1d neighbor index
d = d3d[0]*ngrid[1]*ngrid[2] + d3d[1]*ngrid[2] + d3d[2]
nsecondary = s[d+1] - s[d]
if nsecondary == 0:
continue
_do_cell_pair(psort[s[c]:s[c+1]],
psort[s[d]:s[d+1]],
Rmax, nbin, Xoff,
thread_npairs[t],
)
# sum over threads, removing the padding
npairs = thread_npairs[:,:nbin].sum(axis=0)
# no self-counts
npairs[0] -= len(psort)
return npairs
@nb.njit(fastmath=_fastmath)
def _1d_to_3d(i,ngrid):
'''i is flat index, n1d is grid size'''
X = np.empty(3,dtype=np.int64)
X[0] = i // (ngrid[1]*ngrid[2])
X[1] = i // ngrid[2] - X[0]*ngrid[2]
X[2] = i % ngrid[2]
return X
def numba_2pcf(pos, box, Rmax, nbin, nthread=-1, n1djack=None, pg_kwargs=None,
corrfunc=False):
'''
Compute the 2PCF, and optionally jackknife.
Assumes a periodic box and autocorrelation.
Parameters
----------
pos: ndarray, shape (N,3)
The particle positions, in domain [0,box)
box: float
The box size
Rmax: float
The maximum radius of the 2PCF measurement
nbin: int
The number of linear radial 2PCF bins
nthread: int, optional
Number of threads to use (parallelized over cell pairs).
Default of -1 means to use the numba default.
n1djack: int, optional
Number of jackknife patches per dimension. Patches
are sub-cubes. Default of None means to not do jackknife.
Results are returned as columns in the `res` table whose
names are prefixed with `jack_`.
pg_kwargs: dict, optional
Any keyword arguments to pass directly to the `particle_grid`
function. Default: None.
corrfunc: bool, optional
Use Corrfunc instead. Useful for debugging.
Default: False.
Returns
-------
res: astropy.Table
An Astropy Table with the 2PCF measurement, of length `nbin`.
Contains at least the columns `rmin`, `rmax`, `rmid`, `npairs`,
and `xi`. The `res.meta` dict holds metadata.
'''
if pg_kwargs is None:
pg_kwargs = {}
pg_kwargs = pg_kwargs.copy()
if 'nthread' not in pg_kwargs:
pg_kwargs['nthread'] = nthread
if 'sort_in_cell' not in pg_kwargs:
pg_kwargs['sort_in_cell'] = True
if nthread == -1:
nthread = nb.get_num_threads()
# coerce inputs to match pos type
box = pos.dtype.type(box)
Rmax = pos.dtype.type(Rmax)
edges = np.linspace(0,Rmax,nbin+1)
if not corrfunc:
ngrid = int(np.floor(box/Rmax))
ngrid = max(ngrid,3) # so that neighbors are always unique
ngrid = (ngrid,)*3
ngrid = np.atleast_1d(ngrid)
psort, offsets = particle_grid.particle_grid(pos, ngrid, box, **pg_kwargs)
nb.set_num_threads(nthread)
counts = _2pcf(psort, offsets, ngrid, box, Rmax, nbin)
else:
import Corrfunc.theory.DD
res = Corrfunc.theory.DD(1, nthread, edges, *pos.T, boxsize=box, periodic=True)
counts = res['npairs']
counts[0] -= len(pos)
# compute xi from pairs
N = len(pos)
RR = np.diff(edges**3) * 4/3*np.pi * N*(N-1)/box**3
xi = counts/RR - 1
meta = dict(corrfunc=corrfunc, box=box, nthread=nthread, n1djack=n1djack)
t = Table(dict(rmin=edges[:-1],
rmax=edges[1:],
rmid=(edges[1:] + edges[:-1])/2,
xi=xi,
npairs=counts,
),
meta=meta,
)
if n1djack:
jack = jackknife(n1djack, pos, box, Rmax, nbin, nthread=nthread, pg_kwargs=pg_kwargs,
corrfunc=corrfunc)
for col in jack.colnames:
if col in t.colnames:
del jack[col]
t = astropy.table.hstack((t,jack))
return t
def jackknife(n1djack, pos, box, Rmax, nbin, nthread=-1, corrfunc=False, pg_kwargs=None):
'''Run a drop-1 jackknife covariance estimator, using `n1djack`^3 cubic subvolumes.
Usually this would be called from `numba_2pcf(..., n1djack=n1d)`.
'''
# use the chaining mesh to generate patches
psort, offsets = particle_grid.particle_grid(pos, n1djack, box, nthread=nthread)
del pos # careful!
occ = np.diff(offsets)
all_res = []
njack = n1djack**3
for i in range(njack):
pos_drop1 = np.empty((len(psort) - occ[i],3), dtype=psort.dtype)
# copy all before the dropped patch, then all after
pos_drop1[:offsets[i]] = psort[:offsets[i]]
pos_drop1[offsets[i]:] = psort[offsets[i+1]:]
res = numba_2pcf(pos_drop1, box, Rmax, nbin, nthread=nthread, pg_kwargs=pg_kwargs,
corrfunc=corrfunc)
all_res += [res]
jackres = all_res[0]['rmin','rmax','rmid'].copy()
jackres['jack_xi'] = np.vstack([t['xi'] for t in all_res]).T
jackres['jack_mean'] = jackres['jack_xi'].mean(axis=1)
diff = jackres['jack_xi'] - jackres['jack_mean'].reshape(-1,1)
jackres['jack_cov'] = (diff @ diff.T) * (njack - 1) / njack
jackres['jack_cor'] = jackres['jack_cov'] / jackres['jack_cov'].diagonal()**0.5
jackres['jack_cor'] /= (jackres['jack_cov'].diagonal()**0.5).reshape(-1,1)
return jackres