63char *option[N_OPTIONS] = {
/*
 * USAGE: help text for the sddsselect command line.
 *
 * The text gives the invocation synopsis
 * (sddsselect [OPTIONS] [<input1>] <input2> [<output>]), one line per
 * option (-pipe, -match, -equate, -invert, -reuse, -majorOrder,
 * -nowarnings), an example invocation, and an author/build line.
 *
 * The message is assembled by adjacent string-literal concatenation:
 * the first literal is continued across source lines with
 * backslash-newline, then __DATE__, __TIME__ and SVN_VERSION are appended.
 * SVN_VERSION must therefore expand to a string literal for this
 * definition to compile.
 *
 * NOTE(review): the leading numbers on the lines below (73, 76, 77, ...)
 * look like listing line numbers fused into the text, and the gaps in
 * that numbering suggest some lines of the message are missing here.
 * Confirm against the original source file before relying on this text.
 */
73char *USAGE =
"Usage: sddsselect [OPTIONS] [<input1>] <input2> [<output>]\n\
76 -pipe[=input][,output] Use pipe for input and/or output.\n\
77 -match=<column1>[=<column2>] Specify columns to match between input1 and input2.\n\
78 -equate=<column1>[=<column2>] Specify columns to equate between input1 and input2.\n\
79 -invert Invert the selection to keep non-matching rows.\n\
80 -reuse[=rows][,page] Allow reusing rows or specify page reuse.\n\
81 -majorOrder=row|column Set the output file to row or column major order.\n\
82 -nowarnings Suppress warning messages.\n\
85 sddsselect -match=colA=colB input1.sdds input2.sdds output.sdds\n\
87Program by Michael Borland. (" __DATE__
" " __TIME__
", SVN revision: " SVN_VERSION
")\n";
89int main(
int argc,
char **argv) {
91 long i, j, i_arg, reuse, reusePage;
92 int64_t rows1, rows2, i1, i2;
95 char **match_column, **equate_column;
96 long match_columns, equate_columns;
97 char *input1, *input2, *output;
98 long tmpfile_used, retval1, retval2;
99 long warnings, invert;
100 unsigned long pipeFlags, majorOrderFlag;
101 KEYED_EQUIVALENT **keyGroup = NULL;
103 short columnMajorOrder = -1;
106 argc =
scanargs(&s_arg, argc, argv);
110 input1 = input2 = output = NULL;
111 match_column = equate_column = NULL;
112 match_columns = equate_columns = reuse = reusePage = 0;
113 tmpfile_used = invert = 0;
117 for (i_arg = 1; i_arg < argc; i_arg++) {
118 if (s_arg[i_arg].arg_type == OPTION) {
120 switch (
match_string(s_arg[i_arg].list[0], option, N_OPTIONS, 0)) {
121 case SET_MAJOR_ORDER:
123 s_arg[i_arg].n_items--;
124 if (s_arg[i_arg].n_items > 0 &&
125 (!
scanItemList(&majorOrderFlag, s_arg[i_arg].list + 1, &s_arg[i_arg].n_items, 0,
126 "row", -1, NULL, 0, SDDS_ROW_MAJOR_ORDER,
127 "column", -1, NULL, 0, SDDS_COLUMN_MAJOR_ORDER, NULL)))
128 SDDS_Bomb(
"invalid -majorOrder syntax/values");
129 if (majorOrderFlag & SDDS_COLUMN_MAJOR_ORDER)
130 columnMajorOrder = 1;
131 else if (majorOrderFlag & SDDS_ROW_MAJOR_ORDER)
132 columnMajorOrder = 0;
134 case SET_MATCH_COLUMN:
135 if (s_arg[i_arg].n_items != 2)
137 if (match_columns != 0)
138 SDDS_Bomb(
"only one -match option may be given");
139 match_column =
tmalloc(
sizeof(*match_column) * 2);
140 if ((ptr = strchr(s_arg[i_arg].list[1],
'=')))
143 ptr = s_arg[i_arg].list[1];
144 match_column[0] = s_arg[i_arg].list[1];
145 match_column[1] = ptr;
148 case SET_EQUATE_COLUMN:
149 if (s_arg[i_arg].n_items != 2)
151 if (equate_columns != 0)
152 SDDS_Bomb(
"only one -equate option may be given");
153 equate_column =
tmalloc(
sizeof(*equate_column) * 2);
154 if ((ptr = strchr(s_arg[i_arg].list[1],
'=')))
157 ptr = s_arg[i_arg].list[1];
158 equate_column[0] = s_arg[i_arg].list[1];
159 equate_column[1] = ptr;
163 if (s_arg[i_arg].n_items == 1)
166 char *reuseOptions[2] = {
"rows",
"page"};
167 for (i = 1; i < s_arg[i_arg].n_items; i++) {
168 switch (
match_string(s_arg[i_arg].list[i], reuseOptions, 2, 0)) {
189 if (!
processPipeOption(s_arg[i_arg].list + 1, s_arg[i_arg].n_items - 1, &pipeFlags))
193 fprintf(stderr,
"error: unknown switch: %s\n", s_arg[i_arg].list[0]);
199 input1 = s_arg[i_arg].list[0];
200 else if (input2 == NULL)
201 input2 = s_arg[i_arg].list[0];
202 else if (output == NULL)
203 output = s_arg[i_arg].list[0];
209 if (pipeFlags & USE_STDIN && input1) {
211 SDDS_Bomb(
"too many filenames (sddsxref)");
216 processFilenames(
"sddsselect", &input1, &output, pipeFlags, !warnings, &tmpfile_used);
218 SDDS_Bomb(
"second input file not specified (sddsxref)");
220 if (equate_columns && match_columns)
221 SDDS_Bomb(
"only one of -equate or -match may be given");
222 if (!equate_columns && !match_columns)
223 SDDS_Bomb(
"one of -equate or -match must be given");
237 sprintf(s,
"error: column %s not found or not string type in file %s", match_column[0], input1 ? input1 :
"stdin");
243 sprintf(s,
"error: column %s not found or not string type in file %s", match_column[1], input2);
248 if (equate_columns) {
251 sprintf(s,
"error: column %s not found or not numeric type in file %s", equate_column[0], input1 ? input1 :
"stdin");
257 sprintf(s,
"error: column %s not found or not numeric type in file %s", equate_column[1], input2);
263 if (output && pipeFlags & USE_STDOUT)
264 SDDS_Bomb(
"too many filenames with -pipe option");
265 if (!output && !(pipeFlags & USE_STDOUT)) {
267 fprintf(stderr,
"warning: existing file %s will be replaced (sddsselect)\n", input1 ? input1 :
"stdin");
275 if (columnMajorOrder != -1)
276 SDDS_output.layout.data_mode.column_major = columnMajorOrder;
278 SDDS_output.layout.data_mode.column_major = SDDS_1.layout.data_mode.column_major;
286 fprintf(stderr,
"warning: <input2> ends before <input1>\n");
311 SDDS_SetError(
"Problem copying parameter or array data from second input file");
316 SDDS_SetError(
"Problem copying parameter or array data from first input file");
321 char **string1, **string2;
325 fprintf(stderr,
"Error: problem getting column %s from file %s\n", match_column[0], input1 ? input1 :
"stdin");
328 if (rows2 && !(string2 =
SDDS_GetColumn(&SDDS_2, match_column[1]))) {
329 fprintf(stderr,
"Error: problem getting column %s from file %s\n", match_column[1], input2);
334 for (i1 = 0; i1 < rows1; i1++) {
336 sprintf(s,
"Problem copying row %" PRId64
" of first data set", i1);
344 if ((!matched && !invert) || (matched && invert)) {
350 for (i = 0; i < rows1; i++)
356 for (i = 0; i < rows2; i++)
361 for (i = 0; i < keyGroups; i++) {
363 if (keyGroup[i]->equivalent)
364 free(keyGroup[i]->equivalent);
374 }
else if (equate_columns) {
375 double *value1, *value2;
379 fprintf(stderr,
"Error: problem getting column %s from file %s\n", equate_column[0], input1 ? input1 :
"stdin");
383 fprintf(stderr,
"Error: problem getting column %s from file %s\n", equate_column[1], input2);
388 for (i1 = 0; i1 < rows1; i1++) {
390 sprintf(s,
"Problem copying row %" PRId64
" of first data set", i1);
399 if ((!equated && !invert) || (equated && invert)) {
410 for (i = 0; i < keyGroups; i++) {
412 if (keyGroup[i]->equivalent)
413 free(keyGroup[i]->equivalent);
SDDS (Self-Describing Data Set) data type definitions and function prototypes.
int32_t SDDS_CopyParameters(SDDS_DATASET *SDDS_target, SDDS_DATASET *SDDS_source)
int32_t SDDS_InitializeCopy(SDDS_DATASET *SDDS_target, SDDS_DATASET *SDDS_source, char *filename, char *filemode)
int32_t SDDS_CopyRowDirect(SDDS_DATASET *SDDS_target, int64_t target_row, SDDS_DATASET *SDDS_source, int64_t source_row)
int32_t SDDS_CopyPage(SDDS_DATASET *SDDS_target, SDDS_DATASET *SDDS_source)
int32_t SDDS_CopyArrays(SDDS_DATASET *SDDS_target, SDDS_DATASET *SDDS_source)
int32_t SDDS_StartPage(SDDS_DATASET *SDDS_dataset, int64_t expected_n_rows)
int32_t SDDS_WritePage(SDDS_DATASET *SDDS_dataset)
Writes the current data table to the output file.
int32_t SDDS_WriteLayout(SDDS_DATASET *SDDS_dataset)
Writes the SDDS layout header to the output file.
void SDDS_SetError(char *error_text)
Records an error message in the SDDS error stack.
int32_t SDDS_GetColumnIndex(SDDS_DATASET *SDDS_dataset, char *name)
Retrieves the index of a named column in the SDDS dataset.
void SDDS_PrintErrors(FILE *fp, int32_t mode)
Prints recorded error messages to a specified file stream.
void SDDS_RegisterProgramName(const char *name)
Registers the executable program name for use in error messages.
int32_t SDDS_GetColumnType(SDDS_DATASET *SDDS_dataset, int32_t index)
Retrieves the data type of a column in the SDDS dataset by its index.
void SDDS_Bomb(char *message)
Terminates the program after printing an error message and recorded errors.
#define SDDS_STRING
Identifier for the string data type.
#define SDDS_DOUBLE
Identifier for the double data type.
#define SDDS_NUMERIC_TYPE(type)
Checks if the given type identifier corresponds to any numeric type.
void * tmalloc(uint64_t size_of_block)
Allocates a memory block of the specified size with zero initialization.
void bomb(char *error, char *usage)
Reports error messages to the terminal and aborts the program.
char * cp_str(char **s, char *t)
Copies a string, allocating memory for storage.
char * delete_chars(char *s, char *t)
Removes all occurrences of characters found in string t from string s.
long match_string(char *string, char **option, long n_options, long mode)
Matches a given string against an array of option strings based on specified modes.
long replaceFileAndBackUp(char *file, char *replacement)
Replaces a file with a replacement file and creates a backup of the original.
int scanargs(SCANNED_ARG **scanned, int argc, char **argv)
long processPipeOption(char **item, long items, unsigned long *flags)
void processFilenames(char *programName, char **input, char **output, unsigned long pipeFlags, long noWarnings, long *tmpOutputUsed)
void free_scanargs(SCANNED_ARG **scanned, int argc)
long scanItemList(unsigned long *flags, char **item, long *items, unsigned long mode,...)
Scans a list of items and assigns values based on provided keywords and types.
KEYED_EQUIVALENT ** MakeSortedKeyGroups(long *keyGroups, long keyType, void *data, long points)
Create sorted key groups from data.
long FindMatchingKeyGroup(KEYED_EQUIVALENT **keyGroup, long keyGroups, long keyType, void *searchKeyData, long reuse)
Find a matching key group for a search key.
char * tmpname(char *s)
Supplies a unique temporary filename.