/*
 * indexamajig.c
 *
 * Index patterns, output hkl+intensity etc.
 *
 * Copyright © 2012 Thomas White <taw@physics.org>
 *
 * This file is part of CrystFEL.
 *
 * CrystFEL is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * CrystFEL is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with CrystFEL.  If not, see <http://www.gnu.org/licenses/>.
 *
 */


#ifdef HAVE_CONFIG_H
#include <config.h>
#endif

#include <stdarg.h>
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <getopt.h>
Thomas White's avatar
Thomas White committed
36
#include <hdf5.h>
Thomas White's avatar
Thomas White committed
37
#include <gsl/gsl_errno.h>
38
#include <pthread.h>
39
40

#ifdef HAVE_CLOCK_GETTIME
41
#include <time.h>
42
43
44
#else
#include <sys/time.h>
#endif
Thomas White's avatar
Thomas White committed
45
46
47

#include "utils.h"
#include "hdf5-file.h"
Thomas White's avatar
Thomas White committed
48
#include "index.h"
49
#include "peaks.h"
50
#include "detector.h"
Thomas White's avatar
Thomas White committed
51
#include "filters.h"
52
#include "thread-pool.h"
53
#include "beam-parameters.h"
54
#include "geometry.h"
Thomas White's avatar
Thomas White committed
55
#include "stream.h"
Thomas White's avatar
Thomas White committed
56
#include "reflist-utils.h"
57

58

Thomas White's avatar
Thomas White committed
59
/* Write statistics at APPROXIMATELY this interval.  The value is a number of
 * whole seconds: finalise_image() prints a progress message once the
 * timestamp from get_monotonic_seconds() has advanced by at least this much
 * since the previous message. */
#define STATS_EVERY_N_SECONDS (5)


63
64
65
66
67
68
/* Peak detection methods, stored in static_index_args.peaks and selected on
 * the command line with --peaks=<method>. */
enum {
	PEAK_ZAEF = 0,  /* "zaef": process_image() calls search_peaks() */
	PEAK_HDF5 = 1   /* "hdf5": process_image() calls get_peaks() */
};


69
70
/* Information about the indexing process which is common to all patterns */
struct static_index_args
71
72
73
74
75
{
	UnitCell *cell;
	int config_cmfilter;
	int config_noisefilter;
	int config_verbose;
Thomas White's avatar
Thomas White committed
76
	int stream_flags;         /* What goes into the output? */
77
	int config_satcorr;
78
	int config_closer;
79
	int config_insane;
80
	int config_bgsub;
81
	float threshold;
82
	float min_gradient;
83
	float min_snr;
84
	double min_int_snr;
Thomas White's avatar
Thomas White committed
85
	struct detector *det;
Thomas White's avatar
Thomas White committed
86
87
	IndexingMethod *indm;
	IndexingPrivate **ipriv;
Thomas White's avatar
Thomas White committed
88
	int peaks;                /* Peak detection method */
89
	int cellr;
90
	float tols[4];
91
	struct beam_params *beam;
Thomas White's avatar
Thomas White committed
92
	const char *element;
93
	const char *hdf5_peak_path;
94
95
96
	double ir_inn;
	double ir_mid;
	double ir_out;
97

98
99
100
	/* Output stream */
	pthread_mutex_t *output_mutex;  /* Protects the output stream */
	FILE *ofh;
101
	const struct copy_hdf5_field *copyme;
102
103
104
};


105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
/* Per-pattern task record.  get_image() allocates and fills one of these,
 * process_image() works on it, and finalise_image() reads the result and
 * frees both the record and its filename. */
struct index_args
{
	/* Set by get_image() before the task runs */
	char *filename;                        /* Prefix + name from input */
	struct static_index_args static_args;  /* By-value copy of the
	                                        * common settings */

	/* Set by process_image() */
	int indexable;                         /* 1 if indexing gave a cell,
	                                        * otherwise 0 */
};


/* Information needed to choose the next task and dispatch it */
struct queue_args
{
	FILE *fh;
	char *prefix;
122
	int config_basename;
123
124
	struct static_index_args static_args;

125
	char *use_this_one_instead;
126
127
128
129
130
131

	int n_indexable;
	int n_processed;
	int n_indexable_last_stats;
	int n_processed_last_stats;
	int t_last_stats;
132
133
134
};


Thomas White's avatar
Thomas White committed
135
136
137
138
139
140
/* Print the usage message to stdout.
 *
 * s: the program name to show in the syntax line (main() passes argv[0]).
 *
 * The text is kept in step with the option handling in main(): the output
 * stream defaults to stdout when -o is not given. */
static void show_help(const char *s)
{
	printf("Syntax: %s [options]\n\n", s);
	printf(
"Process and index FEL diffraction images.\n"
"\n"
" -h, --help               Display this help message.\n"
"\n"
" -i, --input=<filename>   Specify file containing list of images to process.\n"
"                           '-' means stdin, which is the default.\n"
" -o, --output=<filename>  Write output stream to this file. '-' for stdout.\n"
"                           Default: stdout.\n"
"\n"
"     --indexing=<methods> Use 'methods' for indexing.  Provide one or more\n"
"                           methods separated by commas.  Choose from:\n"
"                            none     : no indexing (default)\n"
"                            dirax    : invoke DirAx\n"
"                            mosflm   : invoke MOSFLM (DPS)\n"
"                            reax     : DPS algorithm with known unit cell\n"
" -g, --geometry=<file>    Get detector geometry from file.\n"
" -b, --beam=<file>        Get beam parameters from file (provides nominal\n"
"                           wavelength value if no per-shot value is found in\n"
"                           the HDF5 files).\n"
" -p, --pdb=<file>         PDB file from which to get the unit cell to match.\n"
"                           Default: 'molecule.pdb'.\n"
"     --basename           Remove the directory parts of the filenames.\n"
" -x, --prefix=<p>         Prefix filenames from input file with <p>.\n"
"     --peaks=<method>     Use 'method' for finding peaks.  Choose from:\n"
"                           zaef  : Use Zaefferer (2000) gradient detection.\n"
"                                    This is the default method.\n"
"                           hdf5  : Get from a table in HDF5 file.\n"
"     --hdf5-peaks=<p>     Find peaks table in HDF5 file here.\n"
"                           Default: /processing/hitfinder/peakinfo\n"
"\n\n"
"You can control what information is included in the output stream using\n"
"' --record=<flag1>,<flag2>,<flag3>' and so on.  Possible flags are:\n\n"
" integrated        Include a list of reflection intensities, produced by\n"
"                    integrating around predicted peak locations.\n"
"\n"
" peaks             Include peak locations and intensities from the peak\n"
"                    search.\n"
"\n"
" peaksifindexed    As 'peaks', but only if the pattern could be indexed.\n"
"\n"
" peaksifnotindexed As 'peaks', but only if the pattern could NOT be indexed.\n"
"\n\n"
"The default is '--record=integrated'.\n"
"\n\n"
"For more control over the process, you might need:\n\n"
"  --cell-reduction=<m>  Use <m> as the cell reduction method. Choose from:\n"
"                         none    : no matching, just use the raw cell.\n"
"                         reduce  : full cell reduction.\n"
"                         compare : match by at most changing the order of\n"
"                                   the indices.\n"
"                         compare_ab : compare 'a' and 'b' lengths only.\n"
"    --tolerance=<tol>   Set the tolerances for cell reduction.\n"
"                          Default: 5,5,5,1.5.\n"
"    --filter-cm         Perform common-mode noise subtraction on images\n"
"                         before proceeding.  Intensities will be extracted\n"
"                         from the image as it is after this processing.\n"
"    --filter-noise      Apply an aggressive noise filter which sets all\n"
"                         pixels in each 3x3 region to zero if any of them\n"
"                         have negative values.  Intensity measurement will\n"
"                         be performed on the image as it was before this.\n"
"    --no-sat-corr       Don't correct values of saturated peaks using a\n"
"                         table included in the HDF5 file.\n"
"    --threshold=<n>     Only accept peaks above <n> ADU.  Default: 800.\n"
"    --min-gradient=<n>  Minimum gradient for Zaefferer peak search.\n"
"                         Default: 100,000.\n"
"    --min-snr=<n>       Minimum signal-to-noise ratio for peaks.\n"
"                         Default: 5.\n"
"    --min-integration-snr=<n> Minimum signal-to-noise ratio for peaks\n"
"                         during integration. Default: -infinity.\n"
"    --int-radius=<r>    Set the integration radii.  Default: 4,5,7.\n"
"-e, --image=<element>   Use this image from the HDF5 file.\n"
"                          Example: /data/data0.\n"
"                          Default: The first one found.\n"
"\n"
"\nFor time-resolved stuff, you might want to use:\n\n"
"     --copy-hdf5-field <f>  Copy the value of field <f> into the stream. You\n"
"                             can use this option as many times as you need.\n"
"\n"
"\nOptions for greater performance or verbosity:\n\n"
"     --verbose            Be verbose about indexing.\n"
" -j <n>                   Run <n> analyses in parallel.  Default 1.\n"
"\n"
"\nOptions you probably won't need:\n\n"
"     --no-check-prefix    Don't attempt to correct the --prefix.\n"
"     --no-closer-peak     Don't integrate from the location of a nearby peak\n"
"                           instead of the position closest to the reciprocal\n"
"                           lattice point.\n"
"     --insane             Don't check that the reduced cell accounts for at\n"
"                           least 10%% of the located peaks.\n"
"     --no-bg-sub          Don't subtract local background estimates from\n"
"                           integrated intensities.\n"
"\n"
"\nYou can tune the CPU affinities for enhanced performance on NUMA machines:\n"
"\n"
"     --cpus=<n>           Specify number of CPUs.  This is NOT the same as\n"
"                           giving the number of analyses to run in parallel.\n"
"     --cpugroup=<n>       Batch threads in groups of this size.\n"
"     --cpuoffset=<n>      Start using CPUs at this group number.\n"
);
}


241
static void process_image(void *pp, int cookie)
242
{
243
	struct index_args *pargs = pp;
244
245
246
247
	struct hdfile *hdfile;
	struct image image;
	float *data_for_measurement;
	size_t data_size;
248
	char *filename = pargs->filename;
249
250
251
252
	UnitCell *cell = pargs->static_args.cell;
	int config_cmfilter = pargs->static_args.config_cmfilter;
	int config_noisefilter = pargs->static_args.config_noisefilter;
	int config_verbose = pargs->static_args.config_verbose;
Thomas White's avatar
Thomas White committed
253
	IndexingMethod *indm = pargs->static_args.indm;
254
	struct beam_params *beam = pargs->static_args.beam;
255
256
257

	image.features = NULL;
	image.data = NULL;
Thomas White's avatar
Thomas White committed
258
	image.flags = NULL;
259
	image.indexed_cell = NULL;
260
	image.id = cookie;
261
	image.filename = filename;
262
	image.det = copy_geom(pargs->static_args.det);
263
	image.copyme = pargs->static_args.copyme;
264
265
266
267
268
269
270
	image.beam = beam;

	if ( beam == NULL ) {
		ERROR("Warning: no beam parameters file.\n");
		ERROR("I'm going to assume 1 ADU per photon, which is almost");
		ERROR(" certainly wrong.  Peak sigmas will be incorrect.\n");
	}
271

Thomas White's avatar
Thomas White committed
272
	pargs->indexable = 0;
273

274
	hdfile = hdfile_open(filename);
Thomas White's avatar
Thomas White committed
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
	if ( hdfile == NULL ) return;

	if ( pargs->static_args.element != NULL ) {

		int r;
		r = hdfile_set_image(hdfile, pargs->static_args.element);
		if ( r ) {
			ERROR("Couldn't select path '%s'\n",
			      pargs->static_args.element);
			hdfile_close(hdfile);
			return;
		}

	} else {

		int r;
		r = hdfile_set_first_image(hdfile, "/");
		if ( r ) {
			ERROR("Couldn't select first path\n");
			hdfile_close(hdfile);
			return;
		}

298
299
	}

300
	hdf5_read(hdfile, &image, pargs->static_args.config_satcorr);
301
302
303
304
305
306
307
308
309
310
311
312
313
314

	if ( (image.width != image.det->max_fs+1)
	  || (image.height != image.det->max_ss+1) )
	{
		ERROR("Image size doesn't match geometry size"
		      " - rejecting image.\n");
		ERROR("Image size: %i,%i.  Geometry size: %i,%i\n",
		      image.width, image.height,
		      image.det->max_fs+1, image.det->max_ss+1);
		hdfile_close(hdfile);
		free_detector_geometry(image.det);
		return;
	}

315
316
	if ( image.lambda < 0.0 ) {
		if ( beam != NULL ) {
Thomas White's avatar
Thomas White committed
317
			ERROR("Using nominal photon energy of %.2f eV\n",
318
                              beam->photon_energy);
Thomas White's avatar
Thomas White committed
319
320
			image.lambda = ph_en_to_lambda(
			                          eV_to_J(beam->photon_energy));
321
322
323
324
		} else {
			ERROR("No wavelength in file, so you need to give "
			      "a beam parameters file with -b.\n");
			hdfile_close(hdfile);
Thomas White's avatar
Thomas White committed
325
			free_detector_geometry(image.det);
326
327
328
			return;
		}
	}
329
	fill_in_values(image.det, hdfile);
330
331
332
333
334
335
336
337
338
339
340
341
342

	if ( config_cmfilter ) {
		filter_cm(&image);
	}

	/* Take snapshot of image after CM subtraction but before
	 * the aggressive noise filter. */
	data_size = image.width*image.height*sizeof(float);
	data_for_measurement = malloc(data_size);

	if ( config_noisefilter ) {
		filter_noise(&image, data_for_measurement);
	} else {
343
		memcpy(data_for_measurement, image.data, data_size);
344
345
	}

346
	switch ( pargs->static_args.peaks )
347
348
349
	{
	case PEAK_HDF5 :
		/* Get peaks from HDF5 */
350
351
352
		if ( get_peaks(&image, hdfile,
		               pargs->static_args.hdf5_peak_path) )
		{
353
354
355
356
			ERROR("Failed to get peaks from HDF5 file.\n");
		}
		break;
	case PEAK_ZAEF :
357
		search_peaks(&image, pargs->static_args.threshold,
358
		             pargs->static_args.min_gradient,
359
360
361
362
		             pargs->static_args.min_snr,
		             pargs->static_args.ir_inn,
		             pargs->static_args.ir_mid,
		             pargs->static_args.ir_out);
363
364
		break;
	}
Thomas White's avatar
Thomas White committed
365
366
367
368
369
370

	/* Get rid of noise-filtered version at this point
	 * - it was strictly for the purposes of peak detection. */
	free(image.data);
	image.data = data_for_measurement;

371
	/* Calculate orientation matrix (by magic) */
372
373
374
	image.div = beam->divergence;
	image.bw = beam->bandwidth;
	image.profile_radius = 0.0001e9;
375
	index_pattern(&image, cell, indm, pargs->static_args.cellr,
376
		      config_verbose, pargs->static_args.ipriv,
377
		      pargs->static_args.config_insane, pargs->static_args.tols);
378

379
	if ( image.indexed_cell != NULL ) {
Thomas White's avatar
Thomas White committed
380

381
		pargs->indexable = 1;
382

383
384
		image.reflections = find_intersections(&image,
		                                       image.indexed_cell);
385

386
		if ( image.reflections != NULL ) {
387

388
			integrate_reflections(&image,
389
					      pargs->static_args.config_closer,
390
					      pargs->static_args.config_bgsub,
391
392
393
394
					      pargs->static_args.min_int_snr,
					      pargs->static_args.ir_inn,
					      pargs->static_args.ir_mid,
					      pargs->static_args.ir_out);
395

396
		}
397

398
399
400
401
402
	} else {

		image.reflections = NULL;

	}
Thomas White's avatar
Thomas White committed
403
404

	pthread_mutex_lock(pargs->static_args.output_mutex);
405
	write_chunk(pargs->static_args.ofh, &image, hdfile,
Thomas White's avatar
Thomas White committed
406
407
	            pargs->static_args.stream_flags);
	pthread_mutex_unlock(pargs->static_args.output_mutex);
408
409

	/* Only free cell if found */
410
	cell_free(image.indexed_cell);
411

Thomas White's avatar
Thomas White committed
412
	reflist_free(image.reflections);
413
	free(image.data);
Thomas White's avatar
Thomas White committed
414
	if ( image.flags != NULL ) free(image.flags);
415
416
	image_feature_list_free(image.features);
	hdfile_close(hdfile);
Thomas White's avatar
Thomas White committed
417
	free_detector_geometry(image.det);
418
419
420
}


421
static void *get_image(void *qp)
422
{
423
	char *line;
424
425
426
	struct index_args *pargs;
	char *rval;
	struct queue_args *qargs = qp;
427

428
	/* Initialise new task arguments */
429
430
431
	pargs = malloc(sizeof(struct index_args));
	memcpy(&pargs->static_args, &qargs->static_args,
	       sizeof(struct static_index_args));
432

433
434
435
	/* Get the next filename */
	if ( qargs->use_this_one_instead != NULL ) {

436
		line = qargs->use_this_one_instead;
437
438
439
440
		qargs->use_this_one_instead = NULL;

	} else {

441
		line = malloc(1024*sizeof(char));
442
		rval = fgets(line, 1023, qargs->fh);
Thomas White's avatar
Thomas White committed
443
444
		if ( rval == NULL ) {
			free(pargs);
Thomas White's avatar
Thomas White committed
445
			free(line);
Thomas White's avatar
Thomas White committed
446
447
			return NULL;
		}
448
449
450
		chomp(line);

	}
451

452
453
454
455
456
457
458
459
460
461
462
463
464
	if ( qargs->config_basename ) {
		char *tmp;
		tmp = safe_basename(line);
		free(line);
		line = tmp;
	}

	pargs->filename = malloc(strlen(qargs->prefix)+strlen(line)+1);

	snprintf(pargs->filename, 1023, "%s%s", qargs->prefix, line);

	free(line);

465
466
	return pargs;
}
467
468


469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
#ifdef HAVE_CLOCK_GETTIME

/* Return the whole-seconds part of CLOCK_MONOTONIC, for measuring intervals.
 * Returns 0 if the clock cannot be read. */
static time_t get_monotonic_seconds(void)
{
	struct timespec tp;

	if ( clock_gettime(CLOCK_MONOTONIC, &tp) != 0 ) return 0;
	return tp.tv_sec;
}

#else

/* Fallback version of the above.  The time according to gettimeofday() is not
 * monotonic, so measuring intervals based on it will screw up if the system
 * clock is stepped (set by hand or adjusted by a time daemon) while the
 * program is running.  Returns 0 if the clock cannot be read. */
static time_t get_monotonic_seconds(void)
{
	struct timeval tp;

	if ( gettimeofday(&tp, NULL) != 0 ) return 0;
	return tp.tv_sec;
}

#endif

492
493
494
495
static void finalise_image(void *qp, void *pp)
{
	struct queue_args *qargs = qp;
	struct index_args *pargs = pp;
496
	time_t monotonic_seconds;
497

498
	qargs->n_indexable += pargs->indexable;
499
500
	qargs->n_processed++;

501
502
	monotonic_seconds = get_monotonic_seconds();
	if ( monotonic_seconds >= qargs->t_last_stats+STATS_EVERY_N_SECONDS ) {
503
504

		STATUS("%i out of %i indexed so far,"
Thomas White's avatar
Thomas White committed
505
		       " %i out of %i since the last message.\n",
506
507
		       qargs->n_indexable, qargs->n_processed,
		       qargs->n_indexable - qargs->n_indexable_last_stats,
Thomas White's avatar
Thomas White committed
508
		       qargs->n_processed - qargs->n_processed_last_stats);
509
510
511

		qargs->n_processed_last_stats = qargs->n_processed;
		qargs->n_indexable_last_stats = qargs->n_indexable;
512
		qargs->t_last_stats = monotonic_seconds;
513
514

	}
515

516
517
	free(pargs->filename);
	free(pargs);
518
519
520
}


521
522
523
static int parse_cell_reduction(const char *scellr, int *err,
                                int *reduction_needs_cell)
{
Thomas White's avatar
Thomas White committed
524
	*err = 0;
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
	if ( strcmp(scellr, "none") == 0 ) {
		*reduction_needs_cell = 0;
		return CELLR_NONE;
	} else if ( strcmp(scellr, "reduce") == 0) {
		*reduction_needs_cell = 1;
		return CELLR_REDUCE;
	} else if ( strcmp(scellr, "compare") == 0) {
		*reduction_needs_cell = 1;
		return CELLR_COMPARE;
	} else if ( strcmp(scellr, "compare_ab") == 0) {
		*reduction_needs_cell = 1;
		return CELLR_COMPARE_AB;
	} else {
		*err = 1;
		*reduction_needs_cell = 0;
		return CELLR_NONE;
	}
}


Thomas White's avatar
Thomas White committed
545
546
547
548
int main(int argc, char *argv[])
{
	int c;
	char *filename = NULL;
549
	char *outfile = NULL;
Thomas White's avatar
Thomas White committed
550
	FILE *fh;
551
	FILE *ofh;
552
	char *rval = NULL;
Thomas White's avatar
Thomas White committed
553
	int n_images;
554
	int config_noindex = 0;
555
556
	int config_cmfilter = 0;
	int config_noisefilter = 0;
557
	int config_verbose = 0;
558
	int config_satcorr = 1;
559
	int config_checkprefix = 1;
560
	int config_closer = 1;
561
	int config_insane = 0;
562
	int config_bgsub = 1;
563
	int config_basename = 0;
564
	float threshold = 800.0;
565
	float min_gradient = 100000.0;
Thomas White's avatar
Thomas White committed
566
	float min_snr = 5.0;
567
	double min_int_snr = -INFINITY;
Thomas White's avatar
Thomas White committed
568
569
	struct detector *det;
	char *geometry = NULL;
Thomas White's avatar
Thomas White committed
570
571
572
573
	IndexingMethod *indm;
	IndexingPrivate **ipriv;
	int indexer_needs_cell;
	int reduction_needs_cell;
Thomas White's avatar
Thomas White committed
574
	char *indm_str = NULL;
575
	UnitCell *cell;
Thomas White's avatar
Thomas White committed
576
	char *pdb = NULL;
577
	char *prefix = NULL;
578
	char *speaks = NULL;
579
	char *scellr = NULL;
580
	char *toler = NULL;
Thomas White's avatar
Thomas White committed
581
	float tols[4] = {5.0, 5.0, 5.0, 1.5}; /* a,b,c,angles (%,%,%,deg) */
582
	int cellr;
583
	int peaks;
584
	int nthreads = 1;
585
	pthread_mutex_t output_mutex = PTHREAD_MUTEX_INITIALIZER;
586
	char *prepare_line;
587
	char prepare_filename[1024];
588
	struct queue_args qargs;
589
	struct beam_params *beam = NULL;
Thomas White's avatar
Thomas White committed
590
	char *element = NULL;
591
	double nominal_photon_energy;
Thomas White's avatar
Thomas White committed
592
	int stream_flags = STREAM_INTEGRATED;
593
594
595
596
	int cpu_num = 0;
	int cpu_groupsize = 1;
	int cpu_offset = 0;
	char *endptr;
597
	char *hdf5_peak_path = NULL;
598
	struct copy_hdf5_field *copyme;
599
600
601
602
	char *intrad = NULL;
	float ir_inn = 4.0;
	float ir_mid = 5.0;
	float ir_out = 7.0;
603
604
605
606
607
608

	copyme = new_copy_hdf5_field_list();
	if ( copyme == NULL ) {
		ERROR("Couldn't allocate HDF5 field list.\n");
		return 1;
	}
Thomas White's avatar
Thomas White committed
609
610
611
612
613

	/* Long options */
	const struct option longopts[] = {
		{"help",               0, NULL,               'h'},
		{"input",              1, NULL,               'i'},
614
		{"output",             1, NULL,               'o'},
615
		{"no-index",           0, &config_noindex,     1},
Thomas White's avatar
Thomas White committed
616
		{"indexing",           1, NULL,               'z'},
Thomas White's avatar
Thomas White committed
617
		{"geometry",           1, NULL,               'g'},
618
		{"beam",               1, NULL,               'b'},
619
620
		{"filter-cm",          0, &config_cmfilter,    1},
		{"filter-noise",       0, &config_noisefilter, 1},
621
		{"verbose",            0, &config_verbose,     1},
Thomas White's avatar
Thomas White committed
622
		{"pdb",                1, NULL,               'p'},
623
		{"prefix",             1, NULL,               'x'},
624
625
		{"no-sat-corr",        0, &config_satcorr,     0},
		{"sat-corr",           0, &config_satcorr,     1}, /* Compat */
626
		{"threshold",          1, NULL,               't'},
627
		{"no-check-prefix",    0, &config_checkprefix, 0},
628
		{"no-closer-peak",     0, &config_closer,      0},
629
		{"insane",             0, &config_insane,      1},
Thomas White's avatar
Thomas White committed
630
		{"image",              1, NULL,               'e'},
631
		{"basename",           0, &config_basename,    1},
Thomas White's avatar
Thomas White committed
632
633
634
635
636
637
		{"bg-sub",             0, &config_bgsub,       1}, /* Compat */
		{"no-bg-sub",          0, &config_bgsub,       0},

		{"peaks",              1, NULL,                2},
		{"cell-reduction",     1, NULL,                3},
		{"min-gradient",       1, NULL,                4},
Thomas White's avatar
Thomas White committed
638
		{"record",             1, NULL,                5},
639
640
		{"cpus",               1, NULL,                6},
		{"cpugroup",           1, NULL,                7},
641
		{"cpuoffset",          1, NULL,                8},
642
		{"hdf5-peaks",         1, NULL,                9},
643
		{"copy-hdf5-field",    1, NULL,               10},
Thomas White's avatar
Thomas White committed
644
645
646
		{"min-snr",            1, NULL,               11},
		{"min-integration-snr",1, NULL,               12},
		{"tolerance",          1, NULL,               13},
647
		{"int-radius",         1, NULL,               14},
Thomas White's avatar
Thomas White committed
648
649
650
651
		{0, 0, NULL, 0}
	};

	/* Short options */
Thomas White's avatar
Thomas White committed
652
	while ((c = getopt_long(argc, argv, "hi:wp:j:x:g:t:o:b:e:",
Thomas White's avatar
Thomas White committed
653
654
	                        longopts, NULL)) != -1)
	{
Thomas White's avatar
Thomas White committed
655
		switch (c) {
Thomas White's avatar
Thomas White committed
656
657

			case 'h' :
Thomas White's avatar
Thomas White committed
658
659
660
			show_help(argv[0]);
			return 0;

Thomas White's avatar
Thomas White committed
661
			case 'i' :
Thomas White's avatar
Thomas White committed
662
663
664
			filename = strdup(optarg);
			break;

Thomas White's avatar
Thomas White committed
665
			case 'o' :
666
667
668
			outfile = strdup(optarg);
			break;

Thomas White's avatar
Thomas White committed
669
			case 'z' :
Thomas White's avatar
Thomas White committed
670
671
672
			indm_str = strdup(optarg);
			break;

Thomas White's avatar
Thomas White committed
673
			case 'p' :
Thomas White's avatar
Thomas White committed
674
675
676
			pdb = strdup(optarg);
			break;

Thomas White's avatar
Thomas White committed
677
			case 'x' :
678
679
680
			prefix = strdup(optarg);
			break;

Thomas White's avatar
Thomas White committed
681
			case 'j' :
682
683
684
			nthreads = atoi(optarg);
			break;

Thomas White's avatar
Thomas White committed
685
			case 'g' :
Thomas White's avatar
Thomas White committed
686
687
688
			geometry = strdup(optarg);
			break;

Thomas White's avatar
Thomas White committed
689
			case 't' :
690
691
692
			threshold = strtof(optarg, NULL);
			break;

Thomas White's avatar
Thomas White committed
693
			case 'b' :
694
695
696
697
698
699
700
701
			beam = get_beam_parameters(optarg);
			if ( beam == NULL ) {
				ERROR("Failed to load beam parameters"
				      " from '%s'\n", optarg);
				return 1;
			}
			break;

Thomas White's avatar
Thomas White committed
702
703
			case 'e' :
			element = strdup(optarg);
704
705
			break;

Thomas White's avatar
Thomas White committed
706
707
			case 2 :
			speaks = strdup(optarg);
708
709
			break;

Thomas White's avatar
Thomas White committed
710
711
			case 3 :
			scellr = strdup(optarg);
712
713
			break;

Thomas White's avatar
Thomas White committed
714
			case 4 :
715
716
717
			min_gradient = strtof(optarg, NULL);
			break;

Thomas White's avatar
Thomas White committed
718
			case 5 :
Thomas White's avatar
Thomas White committed
719
720
721
722
			stream_flags = parse_stream_flags(optarg);
			if ( stream_flags < 0 ) return 1;
			break;

Thomas White's avatar
Thomas White committed
723
			case 6 :
724
725
726
727
728
729
730
731
			cpu_num = strtol(optarg, &endptr, 10);
			if ( !( (optarg[0] != '\0') && (endptr[0] == '\0') ) ) {
				ERROR("Invalid number of CPUs ('%s')\n",
				      optarg);
				return 1;
			}
			break;

Thomas White's avatar
Thomas White committed
732
			case 7 :
733
734
735
736
737
738
739
740
741
742
743
744
745
			cpu_groupsize = strtol(optarg, &endptr, 10);
			if ( !( (optarg[0] != '\0') && (endptr[0] == '\0') ) ) {
				ERROR("Invalid CPU group size ('%s')\n",
				      optarg);
				return 1;
			}
			if ( cpu_groupsize < 1 ) {
				ERROR("CPU group size cannot be"
				      " less than 1.\n");
				return 1;
			}
			break;

Thomas White's avatar
Thomas White committed
746
			case 8 :
747
748
749
750
751
752
753
754
755
756
757
758
			cpu_offset = strtol(optarg, &endptr, 10);
			if ( !( (optarg[0] != '\0') && (endptr[0] == '\0') ) ) {
				ERROR("Invalid CPU offset ('%s')\n",
				      optarg);
				return 1;
			}
			if ( cpu_offset < 0 ) {
				ERROR("CPU offset must be positive.\n");
				return 1;
			}
			break;

Thomas White's avatar
Thomas White committed
759
			case 9 :
760
761
762
			hdf5_peak_path = strdup(optarg);
			break;

Thomas White's avatar
Thomas White committed
763
			case 10 :
764
765
766
			add_copy_hdf5_field(copyme, optarg);
			break;

Thomas White's avatar
Thomas White committed
767
768
769
770
771
772
			case 11 :
			min_snr = strtof(optarg, NULL);
			break;

			case 12 :
			min_int_snr = strtof(optarg, NULL);
Thomas White's avatar
Thomas White committed
773
774
			break;

Thomas White's avatar
Thomas White committed
775
776
777
778
			case 13 :
			toler = strdup(optarg);
			break;

779
780
781
782
			case 14 :
			intrad = strdup(optarg);
			break;

Thomas White's avatar
Thomas White committed
783
784
785
786
			case 0 :
			break;

			default :
Thomas White's avatar
Thomas White committed
787
			return 1;
Thomas White's avatar
Thomas White committed
788

Thomas White's avatar
Thomas White committed
789
790
791
792
		}

	}

793
794
795
796
797
798
	if ( (cpu_num > 0) && (cpu_num % cpu_groupsize != 0) ) {
		ERROR("Number of CPUs must be divisible by"
		      " the CPU group size.\n");
		return 1;
	}

Thomas White's avatar
Thomas White committed
799
800
801
802
803
804
805
806
807
	if ( filename == NULL ) {
		filename = strdup("-");
	}
	if ( strcmp(filename, "-") == 0 ) {
		fh = stdin;
	} else {
		fh = fopen(filename, "r");
	}
	if ( fh == NULL ) {
Thomas White's avatar
Thomas White committed
808
		ERROR("Failed to open input file '%s'\n", filename);
Thomas White's avatar
Thomas White committed
809
810
		return 1;
	}
Thomas White's avatar
Thomas White committed
811
	free(filename);
Thomas White's avatar
Thomas White committed
812

813
814
815
816
817
818
819
820
821
822
823
824
825
826
	if ( outfile == NULL ) {
		outfile = strdup("-");
	}
	if ( strcmp(outfile, "-") == 0 ) {
		ofh = stdout;
	} else {
		ofh = fopen(outfile, "w");
	}
	if ( ofh == NULL ) {
		ERROR("Failed to open output file '%s'\n", outfile);
		return 1;
	}
	free(outfile);

827
828
829
830
	if ( hdf5_peak_path == NULL ) {
		hdf5_peak_path = strdup("/processing/hitfinder/peakinfo");
	}

831
832
833
834
835
836
837
838
839
840
841
842
843
	if ( speaks == NULL ) {
		speaks = strdup("zaef");
		STATUS("You didn't specify a peak detection method.\n");
		STATUS("I'm using 'zaef' for you.\n");
	}
	if ( strcmp(speaks, "zaef") == 0 ) {
		peaks = PEAK_ZAEF;
	} else if ( strcmp(speaks, "hdf5") == 0 ) {
		peaks = PEAK_HDF5;
	} else {
		ERROR("Unrecognised peak detection method '%s'\n", speaks);
		return 1;
	}
Thomas White's avatar
Thomas White committed
844
	free(speaks);
845

Thomas White's avatar
Thomas White committed
846
847
848
849
	if ( pdb == NULL ) {
		pdb = strdup("molecule.pdb");
	}

850
	if ( prefix == NULL ) {
Thomas White's avatar
Thomas White committed
851
		prefix = strdup("");
852
	} else {
853
854
855
		if ( config_checkprefix ) {
			prefix = check_prefix(prefix);
		}
856
857
	}

858
	if ( nthreads == 0 ) {
859
860
861
862
		ERROR("Invalid number of threads.\n");
		return 1;
	}

863
864
	if ( (indm_str == NULL) ||
	     ((indm_str != NULL) && (strcmp(indm_str, "none") == 0)) ) {
865
		STATUS("Not indexing anything.\n");
866
		indexer_needs_cell = 0;
867
868
869
		reduction_needs_cell = 0;
		indm = NULL;
		cellr = CELLR_NONE;
Thomas White's avatar
Thomas White committed
870
	} else {
871
872
873
874
875
876
877
878
		if ( indm_str == NULL ) {
			STATUS("You didn't specify an indexing method, so I "
			       " won't try to index anything.\n"
			       "If that isn't what you wanted, re-run with"
			       " --indexing=<method>.\n");
			indm = NULL;
			indexer_needs_cell = 0;
		} else {
Thomas White's avatar
Thomas White committed
879
880
			indm = build_indexer_list(indm_str,
			                          &indexer_needs_cell);
881
882
883
884
885
			if ( indm == NULL ) {
				ERROR("Invalid indexer list '%s'\n", indm_str);
				return 1;
			}
			free(indm_str);
Thomas White's avatar
Thomas White committed
886
		}
Thomas White's avatar
Thomas White committed
887

888
889
890
891
892
893
894
		reduction_needs_cell = 0;
		if ( scellr == NULL ) {
			STATUS("You didn't specify a cell reduction method, so"
			       " I'm going to use 'reduce'.\n");
			cellr = CELLR_REDUCE;
			reduction_needs_cell = 1;
		} else {
895
896
897
898
899
900
901
902
903
			int err;
			cellr = parse_cell_reduction(scellr, &err,
			                             &reduction_needs_cell);
			if ( err ) {
				ERROR("Unrecognised cell reduction '%s'\n",
			              scellr);
				return 1;
			}
			free(scellr);
904
		}
905
906
	}

907
908
909
	/* Without indexing there is no cell reduction, so it cannot need a cell */
	if ( indm == NULL ) reduction_needs_cell = 0;

910
911
	if ( toler != NULL ) {
		int ttt;
Thomas White's avatar
Thomas White committed
912
913
		ttt = sscanf(toler, "%f,%f,%f,%f",
		             &tols[0], &tols[1], &tols[2], &tols[3] );
914
915
916
917
918
919
		if ( ttt != 4 ) {
			ERROR("Invalid parameters for '--tolerance'\n");
			return 1;
		}
	}

920
921
922
923
924
925
926
927
928
929
930
931
932
	if ( intrad != NULL ) {
		int r;
		r = sscanf(intrad, "%f,%f,%f", &ir_inn, &ir_mid, &ir_out);
		if ( r != 3 ) {
			ERROR("Invalid parameters for '--int-radius'\n");
			return 1;
		}
	} else {
		STATUS("WARNING: You did not specify --int-radius.\n");
		STATUS("WARNING: I will use the default values, which are"
		       " probably not appropriate for your patterns.\n");
	}

Thomas White's avatar
Thomas White committed
933
934
935
936
937
938
939
940
941
942
943
944
	if ( geometry == NULL ) {
		ERROR("You need to specify a geometry file with --geometry\n");
		return 1;
	}

	det = get_detector_geometry(geometry);
	if ( det == NULL ) {
		ERROR("Failed to read detector geometry from '%s'\n", geometry);
		return 1;
	}
	free(geometry);

Thomas White's avatar
Thomas White committed
945
	if ( reduction_needs_cell || indexer_needs_cell ) {
946
947
		cell = load_cell_from_pdb(pdb);
		if ( cell == NULL ) {
948
949
950
			ERROR("Couldn't read unit cell (from %s)\n", pdb);
			return 1;
		}
951
	} else {
Thomas White's avatar
Thomas White committed
952
953
		STATUS("No cell needed for these choices of indexing"
		       " and reduction.\n");
954
		cell = NULL;
955
	}
956
	free(pdb);
957

Thomas White's avatar
Thomas White committed
958
	write_stream_header(ofh, argc, argv);
959

960
961
962
963
964
965
966
967
	if ( beam != NULL ) {
		nominal_photon_energy = beam->photon_energy;
	} else {
		STATUS("No beam parameters file was given, so I'm taking the"
		       " nominal photon energy to be 2 keV.\n");
		nominal_photon_energy = 2000.0;
	}

968
	/* Get first filename and use it to set up the indexing */
969
	prepare_line = malloc(1024*sizeof(char));
970
971
972
973
	rval = fgets(prepare_line, 1023, fh);
	if ( rval == NULL ) {
		ERROR("Failed to get filename to prepare indexing.\n");
		return 1;
974
	}
975
	chomp(prepare_line);
976
977
978
979
980
981
	if ( config_basename ) {
		char *tmp;
		tmp = safe_basename(prepare_line);
		free(prepare_line);
		prepare_line = tmp;
	}
982
983
984
985
	snprintf(prepare_filename, 1023, "%s%s", prefix, prepare_line);
	qargs.use_this_one_instead = prepare_line;

	/* Prepare the indexer */
Thomas White's avatar
Thomas White committed
986
987
988
989
990
991
992
993
994
	if ( indm != NULL ) {
		ipriv = prepare_indexing(indm, cell, prepare_filename, det,
		                         nominal_photon_energy);
		if ( ipriv == NULL ) {
			ERROR("Failed to prepare indexing.\n");
			return 1;
		}
	} else {
		ipriv = NULL;
995
996
	}

Thomas White's avatar
Thomas White committed
997
	gsl_set_error_handler_off();
Thomas White's avatar
Thomas White committed
998

999
1000
	qargs.static_args.cell = cell;
	qargs.static_args.config_cmfilter = config_cmfilter;