forked from scottransom/psrfits_utils
-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathmpimerge_psrfits.c
379 lines (340 loc) · 14.2 KB
/
mpimerge_psrfits.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <getopt.h>
#include "psrfits.h"
#include "mpi.h"
#define HDRLEN 14400
#define FLAG 9e9
void reorder_data(unsigned char* outbuf, unsigned char *inbuf,
int nband, int nspec, int npol, int nchan)
{
int band, spec, pol, inoff = 0, outoff = 0;
int spband = nspec * npol * nchan;
int spspec = npol * nchan;
for (spec = 0 ; spec < nspec ; spec++) {
for (pol = 0 ; pol < npol ; pol++) {
for (band = 0 ; band < nband ; band++) {
inoff = band * spband + pol * nchan + spec * spspec;
memcpy(outbuf + outoff, inbuf + inoff, nchan);
outoff += nchan;
}
}
}
}
void usage() {
printf("usage: mpimerge_psrfits [optios] basefilename\n"
"Options:\n"
" -o name, --output=name Output base filename (auto-generate)\n"
" -i nn, --initial=nn Starting input file number (1)\n"
" -f nn, --final=nn Ending input file number (auto)\n"
"\n");
}
int main(int argc, char *argv[])
{
int ii, nc = 0, ncnp = 0, gpubps = 0, status = 0, statsum = 0;
int fnum_start = 1, fnum_end = 0;
int numprocs, numbands, myid, baddata = 0, droppedrow = 0;
int *counts, *offsets;
unsigned char *tmpbuf = NULL;
struct psrfits pf;
struct {
double value;
int index;
} offs_in, offs_out;
char hostname[100];
char output_base[256] = "\0";
MPI_Status mpistat;
/* Cmd line */
static struct option long_opts[] = {
{"output", 1, NULL, 'o'},
{"initial", 1, NULL, 'i'},
{"final", 1, NULL, 'f'},
{0,0,0,0}
};
int opt, opti;
MPI_Init(&argc, &argv);
MPI_Comm_size(MPI_COMM_WORLD, &numprocs);
MPI_Comm_rank(MPI_COMM_WORLD, &myid);
numbands = numprocs - 1;
// Process the command line
while ((opt=getopt_long(argc,argv,"o:i:f:",long_opts,&opti))!=-1) {
switch (opt) {
case 'o':
strncpy(output_base, optarg, 255);
output_base[255]='\0';
break;
case 'i':
fnum_start = atoi(optarg);
break;
case 'f':
fnum_end = atoi(optarg);
break;
default:
if (myid==0) usage();
MPI_Finalize();
exit(0);
break;
}
}
if (optind==argc) {
if (myid==0) usage();
MPI_Finalize();
exit(1);
}
if (myid == 0) { // Master proc only
printf("\n\n");
printf(" MPI Search-mode PSRFITs Combiner\n");
printf(" by Scott M. Ransom\n\n");
}
// Determine the hostnames of the processes
{
FILE *hostfile;
hostfile = fopen("/etc/hostname", "r");
fscanf(hostfile, "%s\n", hostname);
fclose(hostfile);
if (hostname != NULL) {
MPI_Barrier(MPI_COMM_WORLD);
if (myid == 0) printf("\n");
fflush(NULL);
for (ii = 0 ; ii < numprocs ; ii++) {
MPI_Barrier(MPI_COMM_WORLD);
if (myid == ii)
printf("Process %3d is on machine %s\n", myid, hostname);
fflush(NULL);
MPI_Barrier(MPI_COMM_WORLD);
}
MPI_Barrier(MPI_COMM_WORLD);
fflush(NULL);
}
}
// Basefilenames for the GPU nodes
if (myid > 0) {
sprintf(pf.basefilename, "/data/gpu/partial/%s/%s",
hostname, argv[optind]);
}
// Initialize some key parts of the PSRFITS structure
pf.tot_rows = pf.N = pf.T = pf.status = 0;
pf.filenum = fnum_start;
pf.filename[0] = '\0';
if (myid == 1) {
FILE *psrfitsfile;
char hdr[HDRLEN], filenm[200];
// Read the header info
sprintf(filenm, "%s_0001.fits", pf.basefilename);
psrfitsfile = fopen(filenm, "r");
fread(&hdr, 1, HDRLEN, psrfitsfile);
fclose(psrfitsfile);
// Send the header to the master proc
MPI_Send(hdr, HDRLEN, MPI_CHAR, 0, 0, MPI_COMM_WORLD);
} else if (myid == 0) {
FILE *psrfitsfile;
char hdr[HDRLEN], tmpfilenm[80];
// Receive the header info from proc 1
MPI_Recv(hdr, HDRLEN, MPI_CHAR, 1, 0, MPI_COMM_WORLD, &mpistat);
// Now write that header to a temp file
strcpy(tmpfilenm, "mpi_merge_psrfits.XXXXXX");
mkstemp(tmpfilenm);
psrfitsfile = fopen(tmpfilenm, "w");
fwrite(&hdr, 1, HDRLEN, psrfitsfile);
fclose(psrfitsfile);
sprintf(pf.filename, "%s", tmpfilenm);
// And read the key information into a PSRFITS struct
status = psrfits_open(&pf);
status = psrfits_close(&pf);
remove(tmpfilenm);
// Now create the output PSTFITS file
if (output_base[0]=='\0') {
/* Set up default output filename */
strcpy(output_base, argv[optind]);
}
strcpy(pf.basefilename, output_base);
pf.filenum = 0;
pf.multifile = 1;
pf.filename[0] = '\0';
nc = pf.hdr.nchan;
ncnp = pf.hdr.nchan * pf.hdr.npol;
gpubps = pf.sub.bytes_per_subint;
pf.hdr.orig_nchan *= numbands;
pf.hdr.nchan *= numbands;
pf.hdr.fctr = pf.hdr.fctr - 0.5 * pf.hdr.BW + numbands/2.0 * pf.hdr.BW;
pf.hdr.BW *= numbands;
pf.sub.bytes_per_subint *= numbands;
long long filelen = 40 * (1L<<30); // In GB
pf.rows_per_file = filelen / pf.sub.bytes_per_subint;
status = psrfits_create(&pf);
// For in-memory transpose of data
tmpbuf = (unsigned char *)malloc(pf.sub.bytes_per_subint);
}
// Open the input PSRFITs files for real
if (myid > 0) {
status = psrfits_open(&pf);
nc = pf.hdr.nchan;
ncnp = pf.hdr.nchan * pf.hdr.npol;
gpubps = pf.sub.bytes_per_subint;
}
// Alloc data buffers for the PSRFITS files
pf.sub.dat_freqs = (float *)malloc(sizeof(float) * pf.hdr.nchan);
pf.sub.dat_weights = (float *)malloc(sizeof(float) * pf.hdr.nchan);
pf.sub.dat_offsets = (float *)malloc(sizeof(float) *
pf.hdr.nchan * pf.hdr.npol);
pf.sub.dat_scales = (float *)malloc(sizeof(float) *
pf.hdr.nchan * pf.hdr.npol);
pf.sub.data = (unsigned char *)malloc(pf.sub.bytes_per_subint);
// Counts and offsets for MPI_Gatherv
counts = (int *)malloc(sizeof(int) * numprocs);
offsets = (int *)malloc(sizeof(int) * numprocs);
counts[0] = offsets[0] = 0; // master sends nothing
// Now loop over the rows (i.e. subints)...
do {
MPI_Barrier(MPI_COMM_WORLD);
// Read the current subint from each of the "slave" nodes
if ((myid > 0) && (!baddata)) {
status = psrfits_read_subint(&pf);
if (status) {
pf.sub.offs = FLAG; // High value so it won't be min
if (pf.rownum > pf.rows_per_file) {
// Shouldn't be here unless opening of new file failed...
printf("Proc %d: Can't open next file. Setting status=114.\n", myid);
status = 114;
}
}
} else { // Root process
pf.sub.offs = FLAG; // High value so it won't be min
}
// Find the minimum value of OFFS_SUB to see if we dropped a row
offs_in.value = pf.sub.offs;
offs_in.index = myid;
MPI_Allreduce(&offs_in, &offs_out, 1, MPI_DOUBLE_INT,
MPI_MINLOC, MPI_COMM_WORLD);
// If all procs are returning the FLAG value, break.
if (offs_out.value==FLAG) break;
// Identify dropped rows
if ((myid > 0) && (!status) && (!baddata) &&
(pf.sub.offs > (offs_out.value + 0.1 * pf.sub.tsubint))) {
printf("Proc %d, row %d: Dropped a row. Filling with zeros.\n",
myid, pf.rownum);
droppedrow = 1;
}
if (myid > 0) {
// Ignore errors for moving past EOF (107), read errors (108)
// and missing files (114)
if (droppedrow ||
status==108 ||
((myid > 0) && (status==114 || status==107) && (!baddata))) {
if (status) printf("Proc %d, row %d: Ignoring CFITSIO error %d. Filling with zeros.\n", myid, pf.rownum, status);
// Set the data and the weights to all zeros
for (ii = 0 ; ii < pf.hdr.nchan ; ii++)
pf.sub.dat_weights[ii] = 0.0;
for (ii = 0 ; ii < pf.sub.bytes_per_subint ; ii++)
pf.sub.data[ii] = 0;
// And the scales and offsets to nominal values
for (ii = 0 ; ii < pf.hdr.nchan * pf.hdr.npol ; ii++) {
pf.sub.dat_offsets[ii] = 0.0;
pf.sub.dat_scales[ii] = 1.0;
}
// reset the status to 0 and allow going to next row
if (status==114 || status==107) {
baddata = 1;
}
if (status==108) { // Try reading the next row...
pf.rownum++;
pf.tot_rows++;
pf.N += pf.hdr.nsblk;
pf.T = pf.N * pf.hdr.dt;
}
if (droppedrow) { // We want to read the current row again...
pf.rownum--;
pf.tot_rows--;
pf.N -= pf.hdr.nsblk;
pf.T = pf.N * pf.hdr.dt;
droppedrow = 0; // reset
}
status = 0;
}
}
// If we've passed final file, exit
if (fnum_end && pf.filenum > fnum_end) break;
// Combine statuses of all nodes by summing....
MPI_Allreduce(&status, &statsum, 1,
MPI_INT, MPI_SUM, MPI_COMM_WORLD);
if (statsum) break;
if (myid == offs_out.index) { // Send all of the non-band-specific parts to master
MPI_Send(&pf.sub.tsubint, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.offs, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.lst, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.ra, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.dec, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.glon, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.glat, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.feed_ang, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.pos_ang, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.par_ang, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.tel_az, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
MPI_Send(&pf.sub.tel_zen, 1, MPI_DOUBLE, 0, 0, MPI_COMM_WORLD);
} else if (myid == 0) { // Receive all of the non-data parts
MPI_Recv(&pf.sub.tsubint, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.offs, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.lst, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.ra, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.dec, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.glon, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.glat, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.feed_ang, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.pos_ang, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.par_ang, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.tel_az, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
MPI_Recv(&pf.sub.tel_zen, 1, MPI_DOUBLE, offs_out.index, 0, MPI_COMM_WORLD, &mpistat);
}
// Now gather the vector quantities...
// Vectors of length nchan
for (ii = 1 ; ii < numprocs ; ii++) {
counts[ii] = nc;
offsets[ii] = (ii - 1) * nc;
}
status = MPI_Gatherv(pf.sub.dat_freqs, nc, MPI_FLOAT,
pf.sub.dat_freqs, counts, offsets, MPI_FLOAT,
0, MPI_COMM_WORLD);
status = MPI_Gatherv(pf.sub.dat_weights, nc, MPI_FLOAT,
pf.sub.dat_weights, counts, offsets, MPI_FLOAT,
0, MPI_COMM_WORLD);
// Vectors of length nchan * npol
for (ii = 1 ; ii < numprocs ; ii++) {
counts[ii] = ncnp;
offsets[ii] = (ii - 1) * ncnp;
}
status = MPI_Gatherv(pf.sub.dat_offsets, ncnp, MPI_FLOAT,
pf.sub.dat_offsets, counts, offsets, MPI_FLOAT,
0, MPI_COMM_WORLD);
status = MPI_Gatherv(pf.sub.dat_scales, ncnp, MPI_FLOAT,
pf.sub.dat_scales, counts, offsets, MPI_FLOAT,
0, MPI_COMM_WORLD);
// Vectors of length pf.sub.bytes_per_subint for the raw data
for (ii = 1 ; ii < numprocs ; ii++) {
counts[ii] = gpubps;
offsets[ii] = (ii - 1) * gpubps;
}
status = MPI_Gatherv(pf.sub.data, gpubps, MPI_UNSIGNED_CHAR,
tmpbuf, counts, offsets, MPI_UNSIGNED_CHAR,
0, MPI_COMM_WORLD);
// Reorder and write the new row to the output file
if (myid == 0) {
reorder_data(pf.sub.data, tmpbuf, numbands,
pf.hdr.nsblk, pf.hdr.npol, nc);
status = psrfits_write_subint(&pf);
}
} while (statsum == 0);
// Free the arrays
free(pf.sub.dat_freqs);
free(pf.sub.dat_weights);
free(pf.sub.dat_offsets);
free(pf.sub.dat_scales);
free(pf.sub.data);
if (myid == 0) free(tmpbuf);
free(counts);
free(offsets);
// Close the files and finalize things
status = psrfits_close(&pf);
MPI_Finalize();
exit(0);
}