83char *option[N_OPTIONS] = {
99 "sddseventhist [<inputfile>] [<outputfile>]\n"
100 " [-pipe=<input>,<output>]\n"
101 " -dataColumn=<columnName>\n"
102 " -eventIdentifier=<columnName>\n"
103 " [-overlapEvent=<eventValue>]\n"
104 " [-bins=<number> | -sizeOfBins=<value>]\n"
105 " [-lowerLimit=<value>]\n"
106 " [-upperLimit=<value>]\n"
108 " [-normalize[={sum|area|peak}]]\n"
109 " [-majorOrder=row|column]\n";
111static char *additional_help =
"\n\
112dataColumn : Name of the column to histogram.\n\
113eventIdentifier : Name of the column used to identify events.\n\
114 A separate histogram is created for each unique value in this column.\n\
115 The column must contain string or integer data;\n\
116 if string data, the values must be valid SDDS column names.\n\
117overlapEvent : If specified, histograms are multiplied bin-by-bin with this event's histogram.\n\
118bins : Number of bins for the histogram.\n\
119sizeOfBins : Size of each bin for the histogram.\n\
120lowerLimit : Lower limit of the histogram range.\n\
121upperLimit : Upper limit of the histogram range.\n\
122normalize : Normalize the histogram by sum, area, or peak.\n\
123sides : Adds sides to the histogram down to the zero level.\n\
124majorOrder : Specifies the major order for the output file (row or column).\n\n\
125Program by Michael Borland. (" __DATE__
" " __TIME__
", SVN revision: " SVN_VERSION
")\n";
/*
 * Normalization modes for -normalize. Each value is the index of the
 * matching keyword in normalize_option[], so the result of match_string()
 * on that table is used directly as the mode. NORMALIZE_NO is the default
 * when -normalize is not given; a bare -normalize selects NORMALIZE_SUM.
 */
#define NORMALIZE_PEAK 0
#define NORMALIZE_AREA 1
#define NORMALIZE_SUM 2
#define NORMALIZE_NO 3
#define N_NORMALIZE_OPTIONS 4

/* Keywords accepted by -normalize, ordered to match the NORMALIZE_* values. */
char *normalize_option[N_NORMALIZE_OPTIONS] = {
  "peak",
  "area",
  "sum",
  "no",
};
142 long histogramIndex, overlapIndex;
152 char *inputfile,
char *dataColumn,
char *eventIDColumn,
char *overlapEventID,
153 EVENT_DATA **eventDataRet, int64_t *eventIDsRet,
double **dataRet,
long bins,
154 double binSize,
long normalizeMode,
short columnMajorOrder);
155long makeEventHistogram(
double *hist,
long bins,
double lowerLimit,
double dx,
EVENT_DATA *eventRefData);
/*
 * Computes the overlap of two histograms: for every i in [0, bins),
 * overlap[i] is set to the smaller of hist[i] and overlapHist[i].
 *
 * overlap     : output array, at least `bins` elements
 * hist        : histogram of the current event
 * overlapHist : histogram of the event selected with -overlapEvent
 * bins        : number of elements to process (main() passes bins + 2 so
 *               the side entries are covered too)
 */
void makeEventOverlap(
  double *overlap,
  double *hist,
  double *overlapHist,
  long bins);
/*
 * qsort() comparator for the (event string, data value) pairs built in
 * setupOutputFile(). Pairs are ordered by their event string using
 * strcmp(); pairs with equal strings are then ordered by comparing their
 * data values.
 *
 * ep1, ep2 : pointers to the two pair elements being compared
 */
int event_cmpasc(
  const void *ep1,
  const void *ep2);
159int main(
int argc,
char **argv) {
161 long binsGiven, lowerLimitGiven, upperLimitGiven;
166 double *overlap, *overlapHist;
167 double lowerLimit, upperLimit;
168 double givenLowerLimit, givenUpperLimit;
169 double range, binSize;
171 char *dataColumn, *eventIDColumn, *overlapEventID;
172 SCANNED_ARG *scanned;
173 char *inputfile, *outputfile;
176 long normalizeMode, doSides, verbose = 0, readCode;
177 unsigned long pipeFlags, majorOrderFlag;
178 long eventIDIndex, eventIDType;
179 int64_t eventRefIDs = 0;
182 int64_t i, points, iEvent;
183 short columnMajorOrder = -1;
187 argc =
scanargs(&scanned, argc, argv);
189 fprintf(stderr,
"Usage: %s\n", USAGE);
190 fputs(additional_help, stderr);
194 hist = overlap = overlapHist = NULL;
195 binsGiven = lowerLimitGiven = upperLimitGiven = 0;
196 binSize = doSides = 0;
197 inputfile = outputfile = NULL;
198 dataColumn = eventIDColumn = overlapEventID = NULL;
199 normalizeMode = NORMALIZE_NO;
202 for (i = 1; i < argc; i++) {
203 if (scanned[i].arg_type == OPTION) {
204 switch (
match_string(scanned[i].list[0], option, N_OPTIONS, 0)) {
205 case SET_MAJOR_ORDER:
207 scanned[i].n_items--;
208 if (scanned[i].n_items > 0 && (!
scanItemList(&majorOrderFlag, scanned[i].list + 1, &scanned[i].n_items, 0,
"row", -1, NULL, 0, SDDS_ROW_MAJOR_ORDER,
"column", -1, NULL, 0, SDDS_COLUMN_MAJOR_ORDER, NULL)))
209 SDDS_Bomb(
"invalid -majorOrder syntax/values");
210 if (majorOrderFlag & SDDS_COLUMN_MAJOR_ORDER)
211 columnMajorOrder = 1;
212 else if (majorOrderFlag & SDDS_ROW_MAJOR_ORDER)
213 columnMajorOrder = 0;
217 SDDS_Bomb(
"-bins specified more than once");
219 if (sscanf(scanned[i].list[1],
"%ld", &bins) != 1 || bins <= 0)
224 SDDS_Bomb(
"-lowerLimit specified more than once");
226 if (sscanf(scanned[i].list[1],
"%lf", &givenLowerLimit) != 1)
227 SDDS_Bomb(
"invalid value for lowerLimit");
231 SDDS_Bomb(
"-upperLimit specified more than once");
233 if (sscanf(scanned[i].list[1],
"%lf", &givenUpperLimit) != 1)
234 SDDS_Bomb(
"invalid value for upperLimit");
238 SDDS_Bomb(
"-dataColumn specified more than once");
239 if (scanned[i].n_items != 2)
240 SDDS_Bomb(
"invalid -dataColumn syntax---supply name");
241 dataColumn = scanned[i].list[1];
243 case SET_EVENTIDENTIFIER:
245 SDDS_Bomb(
"-eventIdentifier specified more than once");
246 if (scanned[i].n_items != 2)
247 SDDS_Bomb(
"invalid -eventIdentifier syntax---supply name");
248 eventIDColumn = scanned[i].list[1];
250 case SET_OVERLAPEVENT:
252 SDDS_Bomb(
"-overlapEvent specified more than once");
253 if (scanned[i].n_items != 2)
254 SDDS_Bomb(
"invalid -overlapEvent syntax---supply value");
255 overlapEventID = scanned[i].list[1];
256 if (!strlen(overlapEventID))
257 SDDS_Bomb(
"invalid -overlapEvent syntax---supply value");
260 if (scanned[i].n_items == 1)
261 normalizeMode = NORMALIZE_SUM;
262 else if (scanned[i].n_items != 2 || (normalizeMode =
match_string(scanned[i].list[1], normalize_option, N_NORMALIZE_OPTIONS, 0)) < 0)
269 if (sscanf(scanned[i].list[1],
"%le", &binSize) != 1 || binSize <= 0)
277 fprintf(stderr,
"Error: option %s not recognized\n", scanned[i].list[0]);
284 inputfile = scanned[i].list[0];
285 else if (!outputfile)
286 outputfile = scanned[i].list[0];
288 SDDS_Bomb(
"Too many filenames provided.");
292 processFilenames(
"sddseventhist", &inputfile, &outputfile, pipeFlags, 0, NULL);
294 if (binSize && binsGiven)
295 SDDS_Bomb(
"Specify either -binSize or -bins, not both.");
299 SDDS_Bomb(
"-dataColumn must be specified.");
301 SDDS_Bomb(
"-eventIdentifier must be specified.");
303 if (!(indep =
SDDS_Malloc(
sizeof(*indep) * (bins + 2))) ||
304 !(hist =
SDDS_Malloc(
sizeof(*hist) * (bins + 2))) ||
305 !(overlap =
SDDS_Malloc(
sizeof(*overlap) * (bins + 2))) ||
306 !(overlapHist =
SDDS_Malloc(
sizeof(*overlapHist) * (bins + 2))))
316 SDDS_Bomb(
"Event ID column must be of string type.");
318 SDDS_Bomb(
"Data column must be of a numeric data type.");
323 SDDS_Bomb(
"This program cannot process multi-page files.");
330 if (!setupOutputFile(&outTable, outputfile, &inTable, inputfile, dataColumn, eventIDColumn, overlapEventID, &eventRefData, &eventRefIDs, &data, bins, binSize, normalizeMode, columnMajorOrder))
333 if (!lowerLimitGiven) {
336 lowerLimit = data[0];
337 for (i = 0; i < points; i++)
338 if (lowerLimit > data[i])
339 lowerLimit = data[i];
341 lowerLimit = givenLowerLimit;
344 if (!upperLimitGiven) {
347 upperLimit = data[0];
348 for (i = 0; i < points; i++)
349 if (upperLimit < data[i])
350 upperLimit = data[i];
352 upperLimit = givenUpperLimit;
357 range = upperLimit - lowerLimit;
358 if (!lowerLimitGiven)
359 lowerLimit -= range * 1e-7;
360 if (!upperLimitGiven)
361 upperLimit += range * 1e-7;
362 if (upperLimit == lowerLimit) {
364 upperLimit += binSize / 2;
365 lowerLimit -= binSize / 2;
366 }
else if (fabs(upperLimit) < sqrt(DBL_MIN)) {
367 upperLimit = sqrt(DBL_MIN);
368 lowerLimit = -sqrt(DBL_MIN);
370 upperLimit += upperLimit * (1 + 2 * DBL_EPSILON);
371 lowerLimit -= upperLimit * (1 - 2 * DBL_EPSILON);
374 dx = (upperLimit - lowerLimit) / bins;
378 range = ((range / binSize) + 1) * binSize;
379 middle = (lowerLimit + upperLimit) / 2;
380 lowerLimit = middle - range / 2;
381 upperLimit = middle + range / 2;
383 bins = range / binSize + 0.5;
384 if (bins < 1 && !doSides)
386 if (!(indep =
SDDS_Realloc(indep,
sizeof(*indep) * (bins + 2))) ||
387 !(hist =
SDDS_Realloc(hist,
sizeof(*hist) * (bins + 2))) ||
388 !(overlap =
SDDS_Realloc(overlap,
sizeof(*overlap) * (bins + 2))) ||
389 !(overlapHist =
SDDS_Realloc(overlapHist,
sizeof(*overlapHist) * (bins + 2))))
393 for (i = -1; i < bins + 1; i++) {
394 indep[i + 1] = (i + 0.5) * dx + lowerLimit;
396 if (!
SDDS_StartPage(&outTable, points ? (doSides ? bins + 2 : bins) : 0) ||
398 (points && (!
SDDS_SetColumnFromDoubles(&outTable, SDDS_SET_BY_NAME, indep + (doSides ? 0 : 1), doSides ? bins + 2 : bins, dataColumn))))
401 if (overlapEventID) {
402 for (iEvent = 0; iEvent < eventRefIDs; iEvent++) {
403 if (strcmp(eventRefData[iEvent].
string, overlapEventID) == 0)
406 if (iEvent == eventRefIDs)
407 SDDS_Bomb(
"Cannot create overlap as the specified overlap event is not present.");
408 makeEventHistogram(overlapHist, bins, lowerLimit, dx, eventRefData + iEvent);
411 for (iEvent = pointsBinned = 0; iEvent < eventRefIDs; iEvent++) {
412 pointsBinned += makeEventHistogram(hist, bins, lowerLimit, dx, eventRefData + iEvent);
413 if (normalizeMode != NORMALIZE_NO) {
415 switch (normalizeMode) {
421 for (i = 0; i < bins; i++)
423 if (normalizeMode == NORMALIZE_AREA)
427 SDDS_Bomb(
"Invalid normalization mode.");
431 for (i = 0; i < bins; i++)
435 if (!
SDDS_SetColumnFromDoubles(&outTable, SDDS_SET_BY_INDEX, hist + (doSides ? 0 : 1), doSides ? bins + 2 : bins, eventRefData[iEvent].histogramIndex))
437 if (overlapEventID) {
438 makeEventOverlap(overlap, hist, overlapHist, bins + 2);
439 if (!
SDDS_SetColumnFromDoubles(&outTable, SDDS_SET_BY_INDEX, overlap + (doSides ? 0 : 1), doSides ? bins + 2 : bins, eventRefData[iEvent].overlapIndex))
442 free(eventRefData[iEvent].data);
446 "sddseventhistBins", bins,
447 "sddseventhistBinSize", dx,
448 "sddseventhistPointsBinned", pointsBinned,
453 fprintf(stderr,
"%ld points of %" PRId64
" from page %ld histogrammed in %ld bins\n", pointsBinned, points, readCode, bins);
477 char *inputfile,
char *dataColumn,
char *eventIDColumn,
char *overlapEventID,
478 EVENT_DATA **eventDataRet, int64_t *eventIDsRet,
double **dataRet,
long bins,
479 double binSize,
long normalizeMode,
short columnMajorOrder) {
480 char **eventValue, buffer[SDDS_MAXLINE];
481 int64_t eventRows, uniqueRows, row;
484 double *eventDataValue;
485 int64_t row0, iEvent, drow;
489 (eventRows = SDDS_RowCount(inTable)) == 0 ||
493 if (columnMajorOrder != -1)
494 outTable->layout.data_mode.column_major = columnMajorOrder;
496 outTable->layout.data_mode.column_major = inTable->layout.data_mode.column_major;
498 if (!(eventPair =
SDDS_Malloc(
sizeof(*eventPair) * eventRows)))
502 for (row = 0; row < eventRows; row++) {
503 eventPair[row].string = eventValue[row];
504 eventPair[row].data = eventDataValue[row];
506 qsort(eventPair, eventRows,
sizeof(*eventPair), event_cmpasc);
510 for (row = 1; row < eventRows; row++) {
511 if (strcmp(eventPair[row - 1].
string, eventPair[row].
string) != 0)
514 *eventIDsRet = uniqueRows;
517 if (!(eventData = *eventDataRet =
SDDS_Malloc(
sizeof(**eventDataRet) * uniqueRows)))
521 for (row = 1; row < eventRows; row++) {
522 if (row == (eventRows - 1) || strcmp(eventPair[row].
string, eventPair[row0].
string) != 0) {
524 eventData[iEvent].events = row - row0;
525 if (!
SDDS_CopyString(&eventData[iEvent].
string, eventPair[row0].
string) ||
526 !(eventData[iEvent].data =
SDDS_Malloc(
sizeof(*eventData[iEvent].data) * eventData[iEvent].events)))
528 for (drow = 0; drow < eventData[iEvent].events; drow++) {
529 eventData[iEvent].data[drow] = eventPair[row0 + drow].data;
532 if (row == (eventRows - 1) && strcmp(eventPair[row].
string, eventPair[row0].
string) != 0) {
544 for (row = 0; row < eventRows; row++)
545 free(eventValue[row]);
547 if (iEvent != uniqueRows)
550 if (overlapEventID && strlen(overlapEventID)) {
551 for (iEvent = 0; iEvent < uniqueRows; iEvent++) {
552 if (strcmp(overlapEventID, eventData[iEvent].
string) == 0)
555 if (iEvent == uniqueRows)
559 for (row = 0; row < uniqueRows; row++) {
560 snprintf(buffer,
sizeof(buffer),
"%sFrequency", eventData[row].
string);
563 eventData[row].overlapIndex = -1;
564 if (overlapEventID) {
565 snprintf(buffer,
sizeof(buffer),
"%s.%sOverlap", eventData[row].
string, overlapEventID);
587long makeEventHistogram(
double *hist,
long bins,
double lowerLimit,
double dx,
EVENT_DATA *eventRefData) {
588 long iBin, pointsBinned;
592 for (iBin = 0; iBin <= bins + 1; iBin++)
594 for (iRow = 0; iRow < eventRefData->events; iRow++) {
595 iBin = (eventRefData->data[iRow] - lowerLimit) / dx;
596 if (iBin >= 0 && iBin < bins)
599 for (iBin = pointsBinned = 0; iBin < bins; iBin++)
600 pointsBinned += hist1[iBin];
604void makeEventOverlap(
double *overlap,
double *hist,
double *overlapHist,
long bins) {
606 for (i = 0; i < bins; i++) {
607 overlap[i] = fmin(hist[i], overlapHist[i]);
611int event_cmpasc(
const void *ep1,
const void *ep2) {
616 if ((comp = strcmp(ev1->string, ev2->string)) != 0)
618 if (ev1->data < ev2->data)
620 else if (ev1->data > ev2->data)
SDDS (Self Describing Data Set) Data Type Definitions and Function Prototypes.
int32_t SDDS_CopyParameters(SDDS_DATASET *SDDS_target, SDDS_DATASET *SDDS_source)
int32_t SDDS_StartPage(SDDS_DATASET *SDDS_dataset, int64_t expected_n_rows)
int32_t SDDS_SetParameters(SDDS_DATASET *SDDS_dataset, int32_t mode,...)
int32_t SDDS_SetColumnFromDoubles(SDDS_DATASET *SDDS_dataset, int32_t mode, double *data, int64_t rows,...)
Sets the values for a single data column using double-precision floating-point numbers.
int32_t SDDS_InitializeOutput(SDDS_DATASET *SDDS_dataset, int32_t data_mode, int32_t lines_per_row, const char *description, const char *contents, const char *filename)
Initializes the SDDS output dataset.
int32_t SDDS_WritePage(SDDS_DATASET *SDDS_dataset)
Writes the current data table to the output file.
int32_t SDDS_DefineColumn(SDDS_DATASET *SDDS_dataset, const char *name, const char *symbol, const char *units, const char *description, const char *format_string, int32_t type, int32_t field_length)
Defines a data column within the SDDS dataset.
int32_t SDDS_WriteLayout(SDDS_DATASET *SDDS_dataset)
Writes the SDDS layout header to the output file.
int32_t SDDS_DefineParameter(SDDS_DATASET *SDDS_dataset, const char *name, const char *symbol, const char *units, const char *description, const char *format_string, int32_t type, char *fixed_value)
Defines a data parameter with a fixed string value.
int32_t SDDS_TransferColumnDefinition(SDDS_DATASET *target, SDDS_DATASET *source, char *name, char *newName)
Transfers a column definition from a source dataset to a target dataset.
int32_t SDDS_TransferAllParameterDefinitions(SDDS_DATASET *SDDS_target, SDDS_DATASET *SDDS_source, uint32_t mode)
Transfers all parameter definitions from a source dataset to a target dataset.
int32_t SDDS_GetNamedColumnType(SDDS_DATASET *SDDS_dataset, char *name)
Retrieves the data type of a column in the SDDS dataset by its name.
int32_t SDDS_GetColumnIndex(SDDS_DATASET *SDDS_dataset, char *name)
Retrieves the index of a named column in the SDDS dataset.
void SDDS_PrintErrors(FILE *fp, int32_t mode)
Prints recorded error messages to a specified file stream.
void * SDDS_Malloc(size_t size)
Allocates memory of a specified size.
void SDDS_RegisterProgramName(const char *name)
Registers the executable program name for use in error messages.
int32_t SDDS_GetColumnType(SDDS_DATASET *SDDS_dataset, int32_t index)
Retrieves the data type of a column in the SDDS dataset by its index.
void SDDS_Bomb(char *message)
Terminates the program after printing an error message and recorded errors.
int32_t SDDS_CopyString(char **target, const char *source)
Copies a source string to a target string with memory allocation.
void * SDDS_Realloc(void *old_ptr, size_t new_size)
Reallocates memory to a new size.
#define SDDS_STRING
Identifier for the string data type.
#define SDDS_LONG
Identifier for the signed 32-bit integer data type.
#define SDDS_DOUBLE
Identifier for the double data type.
#define SDDS_NUMERIC_TYPE(type)
Checks if the given type identifier corresponds to any numeric type.
double max_in_array(double *array, long n)
Finds the maximum value in an array of doubles.
long match_string(char *string, char **option, long n_options, long mode)
Matches a given string against an array of option strings based on specified modes.
int scanargs(SCANNED_ARG **scanned, int argc, char **argv)
long processPipeOption(char **item, long items, unsigned long *flags)
void processFilenames(char *programName, char **input, char **output, unsigned long pipeFlags, long noWarnings, long *tmpOutputUsed)
long scanItemList(unsigned long *flags, char **item, long *items, unsigned long mode,...)
Scans a list of items and assigns values based on provided keywords and types.