1 | /****************************************************************************/ |
---|
2 | /* TREELOAD.C: routines to create tree. Public routines: maketree(). */ |
---|
3 | /* Copyright (c) 1999 by Joshua E. Barnes, Tokyo, JAPAN. */ |
---|
4 | /****************************************************************************/ |
---|
5 | |
---|
6 | #include "stdinc.h" |
---|
7 | #include "mathfns.h" |
---|
8 | #include "vectmath.h" |
---|
9 | #include "treedefs.h" |
---|
10 | |
---|
11 | /* |
---|
12 | * Local routines and variables to perform tree construction. |
---|
13 | */ |
---|
14 | |
---|
15 | local void newtree(void); /* flush existing tree */ |
---|
16 | local cellptr makecell(void); /* create an empty cell */ |
---|
17 | local void expandbox(bodyptr, int); /* set size of root cell */ |
---|
18 | local void loadbody(bodyptr); /* load body into tree */ |
---|
19 | local int subindex(bodyptr, cellptr); /* compute subcell index */ |
---|
20 | local void hackcofm(cellptr, real, int); /* find centers of mass */ |
---|
21 | local void setrcrit(cellptr, vector, real); /* set cell's crit. radius */ |
---|
22 | local void threadtree(nodeptr, nodeptr); /* set next and more links */ |
---|
23 | local void hackquad(cellptr); /* compute quad moments */ |
---|
24 | |
---|
25 | local bool bh86, sw94; /* use alternate criteria */ |
---|
26 | local nodeptr freecell = NULL; /* list of free cells */ |
---|
27 | |
---|
28 | #define MAXLEVEL 32 /* max height of tree */ |
---|
29 | |
---|
30 | local int cellhist[MAXLEVEL]; /* count cells by level */ |
---|
31 | local int subnhist[MAXLEVEL]; /* count subnodes by level */ |
---|
32 | |
---|
33 | /* |
---|
34 | * MAKETREE: initialize tree structure for hierarchical force calculation. |
---|
35 | */ |
---|
36 | |
---|
37 | void maketree(bodyptr btab, int nbody) |
---|
38 | { |
---|
39 | double cpustart; |
---|
40 | bodyptr p; |
---|
41 | int i; |
---|
42 | |
---|
43 | cpustart = cputime(); /* record time at start */ |
---|
44 | newtree(); /* flush existing tree, etc */ |
---|
45 | root = makecell(); /* allocate the root cell */ |
---|
46 | CLRV(Pos(root)); /* initialize the midpoint */ |
---|
47 | expandbox(btab, nbody); /* and expand cell to fit */ |
---|
48 | for (p = btab; p < btab+nbody; p++) /* loop over all bodies */ |
---|
49 | loadbody(p); /* insert each into tree */ |
---|
50 | bh86 = scanopt(options, "bh86"); /* set flags for alternate */ |
---|
51 | sw94 = scanopt(options, "sw94"); /* ...cell opening criteria */ |
---|
52 | if (bh86 && sw94) /* can't have both at once */ |
---|
53 | error("maketree: incompatible options bh86 and sw94\n"); |
---|
54 | tdepth = 0; /* init count of levels */ |
---|
55 | for (i = 0; i < MAXLEVEL; i++) /* and init tree histograms */ |
---|
56 | cellhist[i] = subnhist[i] = 0; |
---|
57 | hackcofm(root, rsize, 0); /* find c-of-m coords, etc */ |
---|
58 | threadtree((nodeptr) root, NULL); /* add next and more links */ |
---|
59 | if (usequad) /* if including quad terms */ |
---|
60 | hackquad(root); /* find quadrupole moments */ |
---|
61 | cputree = cputime() - cpustart; /* store elapsed CPU time */ |
---|
62 | } |
---|
63 | |
---|
64 | /* |
---|
65 | * NEWTREE: reclaim cells in tree, prepare to build new one. |
---|
66 | */ |
---|
67 | |
---|
68 | local void newtree(void) |
---|
69 | { |
---|
70 | static bool firstcall = TRUE; |
---|
71 | nodeptr p; |
---|
72 | |
---|
73 | if (! firstcall) { /* if cells to reclaim */ |
---|
74 | p = (nodeptr) root; /* start with the root */ |
---|
75 | while (p != NULL) /* loop scanning tree */ |
---|
76 | if (Type(p) == CELL) { /* if we found a cell to */ |
---|
77 | Next(p) = freecell; /* then save existing list */ |
---|
78 | freecell = p; /* and add it to the front */ |
---|
79 | p = More(p); /* then scan down tree */ |
---|
80 | } else /* else, skip over bodies */ |
---|
81 | p = Next(p); /* by going on to the next */ |
---|
82 | } else /* else nothing to reclaim */ |
---|
83 | firstcall = FALSE; /* so just note it */ |
---|
84 | root = NULL; /* flush existing tree */ |
---|
85 | ncell = 0; /* reset cell count */ |
---|
86 | } |
---|
87 | |
---|
88 | /* |
---|
89 | * MAKECELL: return pointer to free cell. |
---|
90 | */ |
---|
91 | |
---|
92 | local cellptr makecell(void) |
---|
93 | { |
---|
94 | cellptr c; |
---|
95 | int i; |
---|
96 | |
---|
97 | if (freecell == NULL) /* if no free cells left */ |
---|
98 | c = (cellptr) allocate(sizeof(cell)); /* then allocate a new one */ |
---|
99 | else { /* else use existing cell */ |
---|
100 | c = (cellptr) freecell; /* take the one in front */ |
---|
101 | freecell = Next(c); /* and go on to next one */ |
---|
102 | } |
---|
103 | Type(c) = CELL; /* initialize node type */ |
---|
104 | Update(c) = FALSE; /* and force update flag */ |
---|
105 | for (i = 0; i < NSUB; i++) /* loop over subcells */ |
---|
106 | Subp(c)[i] = NULL; /* and empty each one */ |
---|
107 | ncell++; /* count one more cell */ |
---|
108 | return (c); /* return pointer to cell */ |
---|
109 | } |
---|
110 | |
---|
111 | /* |
---|
112 | * EXPANDBOX: find range of coordinate values (with respect to root) |
---|
113 | * and expand root cell to fit. The size is doubled at each step to |
---|
114 | * take advantage of exact representation of powers of two. |
---|
115 | */ |
---|
116 | |
---|
117 | local void expandbox(bodyptr btab, int nbody) |
---|
118 | { |
---|
119 | real dmax, d; |
---|
120 | bodyptr p; |
---|
121 | int k; |
---|
122 | |
---|
123 | dmax = 0.0; /* keep track of max value */ |
---|
124 | for (p = btab; p < btab+nbody; p++) /* loop over all bodies */ |
---|
125 | for (k = 0; k < NDIM; k++) { /* and over all dimensions */ |
---|
126 | d = rabs(Pos(p)[k] - Pos(root)[k]); /* find distance to midpnt */ |
---|
127 | if (d > dmax) /* if bigger than old one */ |
---|
128 | dmax = d; /* store new max value */ |
---|
129 | } |
---|
130 | while (rsize < 2 * dmax) /* loop until value fits */ |
---|
131 | rsize = 2 * rsize; /* doubling box each time */ |
---|
132 | } |
---|
133 | |
---|
134 | /* |
---|
135 | * LOADBODY: descend tree and insert body p in appropriate place. |
---|
136 | */ |
---|
137 | |
---|
138 | local void loadbody(bodyptr p) |
---|
139 | { |
---|
140 | cellptr q, c; |
---|
141 | int qind, k; |
---|
142 | real qsize, dist2; |
---|
143 | vector distv; |
---|
144 | |
---|
145 | q = root; /* start with tree root */ |
---|
146 | qind = subindex(p, q); /* get index of subcell */ |
---|
147 | qsize = rsize; /* keep track of cell size */ |
---|
148 | while (Subp(q)[qind] != NULL) { /* loop descending tree */ |
---|
149 | if (Type(Subp(q)[qind]) == BODY) { /* if another body reached */ |
---|
150 | DOTPSUBV(dist2, distv, Pos(p), Pos(Subp(q)[qind])); |
---|
151 | if (dist2 == 0.0) /* check positions differ */ |
---|
152 | error("loadbody: two bodies have same position\n"); |
---|
153 | c = makecell(); /* then allocate new cell */ |
---|
154 | for (k = 0; k < NDIM; k++) /* and initialize midpoint */ |
---|
155 | Pos(c)[k] = Pos(q)[k] + /* offset from parent */ |
---|
156 | (Pos(p)[k] < Pos(q)[k] ? - qsize : qsize) / 4; |
---|
157 | Subp(c)[subindex((bodyptr) Subp(q)[qind], c)] = Subp(q)[qind]; |
---|
158 | /* put body in cell */ |
---|
159 | Subp(q)[qind] = (nodeptr) c; /* link cell in tree */ |
---|
160 | } |
---|
161 | q = (cellptr) Subp(q)[qind]; /* advance to next level */ |
---|
162 | qind = subindex(p, q); /* get index to examine */ |
---|
163 | qsize = qsize / 2; /* shrink current cell */ |
---|
164 | } |
---|
165 | Subp(q)[qind] = (nodeptr) p; /* found place, store p */ |
---|
166 | } |
---|
167 | |
---|
168 | /* |
---|
169 | * SUBINDEX: compute subcell index for body p in cell q. |
---|
170 | */ |
---|
171 | |
---|
172 | local int subindex(bodyptr p, cellptr q) |
---|
173 | { |
---|
174 | int ind, k; |
---|
175 | |
---|
176 | ind = 0; /* accumulate subcell index */ |
---|
177 | for (k = 0; k < NDIM; k++) /* loop over dimensions */ |
---|
178 | if (Pos(q)[k] <= Pos(p)[k]) /* if beyond midpoint */ |
---|
179 | ind += NSUB >> (k + 1); /* then skip over subcells */ |
---|
180 | return (ind); |
---|
181 | } |
---|
182 | |
---|
183 | /* |
---|
184 | * HACKCOFM: descend tree finding center-of-mass coordinates; |
---|
185 | * also sets critical cell radii, if appropriate. |
---|
186 | */ |
---|
187 | |
---|
188 | local void hackcofm(cellptr p, real psize, int lev) |
---|
189 | { |
---|
190 | vector cmpos, tmpv; |
---|
191 | int i, k; |
---|
192 | nodeptr q; |
---|
193 | real dpq; |
---|
194 | |
---|
195 | tdepth = MAX(tdepth, lev); /* remember maximum level */ |
---|
196 | cellhist[lev]++; /* count cells by level */ |
---|
197 | Mass(p) = 0.0; /* init cell's total mass */ |
---|
198 | CLRV(cmpos); /* and center of mass pos */ |
---|
199 | for (i = 0; i < NSUB; i++) /* loop over the subnodes */ |
---|
200 | if ((q = Subp(p)[i]) != NULL) { /* skipping the NULLs */ |
---|
201 | subnhist[lev]++; /* count existing subnodes */ |
---|
202 | if (Type(q) == CELL) /* and if node is a cell */ |
---|
203 | hackcofm((cellptr) q, psize/2, lev+1); |
---|
204 | /* then do the same for it */ |
---|
205 | Update(p) |= Update(q); /* propagate update request */ |
---|
206 | Mass(p) += Mass(q); /* accumulate total mass */ |
---|
207 | MULVS(tmpv, Pos(q), Mass(q)); /* weight position by mass */ |
---|
208 | ADDV(cmpos, cmpos, tmpv); /* and sum c-of-m position */ |
---|
209 | } |
---|
210 | if (Mass(p) > 0.0) { /* usually, cell has mass */ |
---|
211 | DIVVS(cmpos, cmpos, Mass(p)); /* so find c-of-m position */ |
---|
212 | } else { /* but if no mass inside */ |
---|
213 | SETV(cmpos, Pos(p)); /* use geo. center for now */ |
---|
214 | } |
---|
215 | for (k = 0; k < NDIM; k++) /* check c-of-m of cell */ |
---|
216 | if (cmpos[k] < Pos(p)[k] - psize/2 || /* if actually outside cell */ |
---|
217 | Pos(p)[k] + psize/2 <= cmpos[k]) |
---|
218 | error("hackcofm: tree structure error\n"); |
---|
219 | #if !defined(QUICKSCAN) |
---|
220 | setrcrit(p, cmpos, psize); /* set critical radius */ |
---|
221 | #endif |
---|
222 | SETV(Pos(p), cmpos); /* and center-of-mass pos */ |
---|
223 | } |
---|
224 | |
---|
225 | #if !defined(QUICKSCAN) |
---|
226 | |
---|
227 | /* |
---|
228 | * SETRCRIT: assign critical radius for cell p, using center-of-mass |
---|
229 | * position cmpos and cell size psize. |
---|
230 | */ |
---|
231 | |
---|
232 | local void setrcrit(cellptr p, vector cmpos, real psize) |
---|
233 | { |
---|
234 | real bmax2, d; |
---|
235 | int k; |
---|
236 | |
---|
237 | if (theta == 0.0) /* if exact calculation */ |
---|
238 | Rcrit2(p) = rsqr(2 * rsize); /* then always open cells */ |
---|
239 | else if (sw94) { /* if using S&W's criterion */ |
---|
240 | bmax2 = 0.0; /* compute max distance^2 */ |
---|
241 | for (k = 0; k < NDIM; k++) { /* loop over dimensions */ |
---|
242 | d = cmpos[k] - Pos(p)[k] + psize/2; /* get dist from corner */ |
---|
243 | bmax2 += rsqr(MAX(d, psize - d)); /* and sum max distance^2 */ |
---|
244 | } |
---|
245 | Rcrit2(p) = bmax2 / rsqr(theta); /* use max dist from cm */ |
---|
246 | } else if (bh86) /* if using old criterion */ |
---|
247 | Rcrit2(p) = rsqr(psize / theta); /* then use size of cell */ |
---|
248 | else { /* else use new criterion */ |
---|
249 | DISTV(d, cmpos, Pos(p)); /* find offset from center */ |
---|
250 | Rcrit2(p) = rsqr(psize / theta + d); /* use size plus offset */ |
---|
251 | } |
---|
252 | } |
---|
253 | |
---|
254 | #endif |
---|
255 | |
---|
256 | /* |
---|
257 | * THREADTREE: do a recursive treewalk starting from node p, |
---|
258 | * with next stop n, installing Next and More links. |
---|
259 | */ |
---|
260 | |
---|
261 | local void threadtree(nodeptr p, nodeptr n) |
---|
262 | { |
---|
263 | int ndesc, i; |
---|
264 | nodeptr desc[NSUB+1]; |
---|
265 | |
---|
266 | Next(p) = n; /* set link to next node */ |
---|
267 | if (Type(p) == CELL) { /* if descendents to thread */ |
---|
268 | ndesc = 0; /* start counting them */ |
---|
269 | for (i = 0; i < NSUB; i++) /* loop over all subcells */ |
---|
270 | if (Subp(p)[i] != NULL) /* if this one is occupied */ |
---|
271 | desc[ndesc++] = Subp(p)[i]; /* then store it in table */ |
---|
272 | More(p) = desc[0]; /* set link to 1st one */ |
---|
273 | desc[ndesc] = n; /* thread last one to next */ |
---|
274 | for (i = 0; i < ndesc; i++) /* loop over descendents */ |
---|
275 | threadtree(desc[i], desc[i+1]); /* and thread them together */ |
---|
276 | } |
---|
277 | } |
---|
278 | |
---|
279 | /* |
---|
280 | * HACKQUAD: descend tree, evaluating quadrupole moments. Note that this |
---|
281 | * routine is coded so that the Subp() and Quad() components of a cell can |
---|
282 | * share the same memory locations. |
---|
283 | */ |
---|
284 | |
---|
285 | local void hackquad(cellptr p) |
---|
286 | { |
---|
287 | int ndesc, i; |
---|
288 | nodeptr desc[NSUB], q; |
---|
289 | vector dr; |
---|
290 | real drsq; |
---|
291 | matrix drdr, Idrsq, tmpm; |
---|
292 | |
---|
293 | ndesc = 0; /* count occupied subnodes */ |
---|
294 | for (i = 0; i < NSUB; i++) /* loop over all subnodes */ |
---|
295 | if (Subp(p)[i] != NULL) /* if this one's occupied */ |
---|
296 | desc[ndesc++] = Subp(p)[i]; /* copy it to safety */ |
---|
297 | CLRM(Quad(p)); /* init quadrupole moment */ |
---|
298 | for (i = 0; i < ndesc; i++) { /* loop over real subnodes */ |
---|
299 | q = desc[i]; /* access ech one in turn */ |
---|
300 | if (Type(q) == CELL) /* if it's also a cell */ |
---|
301 | hackquad((cellptr) q); /* then process it first */ |
---|
302 | SUBV(dr, Pos(q), Pos(p)); /* find displacement vect. */ |
---|
303 | OUTVP(drdr, dr, dr); /* form outer prod. of dr */ |
---|
304 | DOTVP(drsq, dr, dr); /* and dot prod. dr * dr */ |
---|
305 | SETMI(Idrsq); /* init unit matrix */ |
---|
306 | MULMS(Idrsq, Idrsq, drsq); /* and scale by dr * dr */ |
---|
307 | MULMS(tmpm, drdr, 3.0); /* scale drdr by 3 */ |
---|
308 | SUBM(tmpm, tmpm, Idrsq); /* now form quad. moment */ |
---|
309 | MULMS(tmpm, tmpm, Mass(q)); /* from cm of subnode */ |
---|
310 | if (Type(q) == CELL) /* if subnode is cell */ |
---|
311 | ADDM(tmpm, tmpm, Quad(q)); /* then include its moment */ |
---|
312 | ADDM(Quad(p), Quad(p), tmpm); /* increment moment of cell */ |
---|
313 | } |
---|
314 | } |
---|