Update copyright for 2022
[pgsql.git] / src / bin / psql / crosstabview.c
blob5628db2ce6aa9fd501a07884948eba23913629c4
1 /*
2 * psql - the PostgreSQL interactive terminal
4 * Copyright (c) 2000-2022, PostgreSQL Global Development Group
6 * src/bin/psql/crosstabview.c
7 */
8 #include "postgres_fe.h"
10 #include "common.h"
11 #include "common/logging.h"
12 #include "crosstabview.h"
13 #include "pqexpbuffer.h"
14 #include "psqlscanslash.h"
15 #include "settings.h"
18 * Value/position from the resultset that goes into the horizontal or vertical
19 * crosstabview header.
21 typedef struct _pivot_field
24 * Pointer obtained from PQgetvalue() for colV or colH. Each distinct
25 * value becomes an entry in the vertical header (colV), or horizontal
26 * header (colH). A Null value is represented by a NULL pointer.
28 char *name;
31 * When a sort is requested on an alternative column, this holds
32 * PQgetvalue() for the sort column corresponding to <name>. If <name>
33 * appear multiple times, it's the first value in the order of the results
34 * that is kept. A Null value is represented by a NULL pointer.
36 char *sort_value;
39 * Rank of this value, starting at 0. Initially, it's the relative
40 * position of the first appearance of <name> in the resultset. For
41 * example, if successive rows contain B,A,C,A,D then it's B:0,A:1,C:2,D:3
42 * When a sort column is specified, ranks get updated in a final pass to
43 * reflect the desired order.
45 int rank;
46 } pivot_field;
48 /* Node in avl_tree */
49 typedef struct _avl_node
51 /* Node contents */
52 pivot_field field;
55 * Height of this node in the tree (number of nodes on the longest path to
56 * a leaf).
58 int height;
61 * Child nodes. [0] points to left subtree, [1] to right subtree. Never
62 * NULL, points to the empty node avl_tree.end when no left or right
63 * value.
65 struct _avl_node *children[2];
66 } avl_node;
69 * Control structure for the AVL tree (binary search tree kept
70 * balanced with the AVL algorithm)
72 typedef struct _avl_tree
74 int count; /* Total number of nodes */
75 avl_node *root; /* root of the tree */
76 avl_node *end; /* Immutable dereferenceable empty tree */
77 } avl_tree;
80 static bool printCrosstab(const PGresult *results,
81 int num_columns, pivot_field *piv_columns, int field_for_columns,
82 int num_rows, pivot_field *piv_rows, int field_for_rows,
83 int field_for_data);
84 static void avlInit(avl_tree *tree);
85 static void avlMergeValue(avl_tree *tree, char *name, char *sort_value);
86 static int avlCollectFields(avl_tree *tree, avl_node *node,
87 pivot_field *fields, int idx);
88 static void avlFree(avl_tree *tree, avl_node *node);
89 static void rankSort(int num_columns, pivot_field *piv_columns);
90 static int indexOfColumn(char *arg, const PGresult *res);
91 static int pivotFieldCompare(const void *a, const void *b);
92 static int rankCompare(const void *a, const void *b);
96 * Main entry point to this module.
98 * Process the data from *res according to the options in pset (global),
99 * to generate the horizontal and vertical headers contents,
100 * then call printCrosstab() for the actual output.
102 bool
103 PrintResultsInCrosstab(const PGresult *res)
105 bool retval = false;
106 avl_tree piv_columns;
107 avl_tree piv_rows;
108 pivot_field *array_columns = NULL;
109 pivot_field *array_rows = NULL;
110 int num_columns = 0;
111 int num_rows = 0;
112 int field_for_rows;
113 int field_for_columns;
114 int field_for_data;
115 int sort_field_for_columns;
116 int rn;
118 avlInit(&piv_rows);
119 avlInit(&piv_columns);
121 if (PQresultStatus(res) != PGRES_TUPLES_OK)
123 pg_log_error("\\crosstabview: statement did not return a result set");
124 goto error_return;
127 if (PQnfields(res) < 3)
129 pg_log_error("\\crosstabview: query must return at least three columns");
130 goto error_return;
133 /* Process first optional arg (vertical header column) */
134 if (pset.ctv_args[0] == NULL)
135 field_for_rows = 0;
136 else
138 field_for_rows = indexOfColumn(pset.ctv_args[0], res);
139 if (field_for_rows < 0)
140 goto error_return;
143 /* Process second optional arg (horizontal header column) */
144 if (pset.ctv_args[1] == NULL)
145 field_for_columns = 1;
146 else
148 field_for_columns = indexOfColumn(pset.ctv_args[1], res);
149 if (field_for_columns < 0)
150 goto error_return;
153 /* Insist that header columns be distinct */
154 if (field_for_columns == field_for_rows)
156 pg_log_error("\\crosstabview: vertical and horizontal headers must be different columns");
157 goto error_return;
160 /* Process third optional arg (data column) */
161 if (pset.ctv_args[2] == NULL)
163 int i;
166 * If the data column was not specified, we search for the one not
167 * used as either vertical or horizontal headers. Must be exactly
168 * three columns, or this won't be unique.
170 if (PQnfields(res) != 3)
172 pg_log_error("\\crosstabview: data column must be specified when query returns more than three columns");
173 goto error_return;
176 field_for_data = -1;
177 for (i = 0; i < PQnfields(res); i++)
179 if (i != field_for_rows && i != field_for_columns)
181 field_for_data = i;
182 break;
185 Assert(field_for_data >= 0);
187 else
189 field_for_data = indexOfColumn(pset.ctv_args[2], res);
190 if (field_for_data < 0)
191 goto error_return;
194 /* Process fourth optional arg (horizontal header sort column) */
195 if (pset.ctv_args[3] == NULL)
196 sort_field_for_columns = -1; /* no sort column */
197 else
199 sort_field_for_columns = indexOfColumn(pset.ctv_args[3], res);
200 if (sort_field_for_columns < 0)
201 goto error_return;
205 * First part: accumulate the names that go into the vertical and
206 * horizontal headers, each into an AVL binary tree to build the set of
207 * DISTINCT values.
210 for (rn = 0; rn < PQntuples(res); rn++)
212 char *val;
213 char *val1;
215 /* horizontal */
216 val = PQgetisnull(res, rn, field_for_columns) ? NULL :
217 PQgetvalue(res, rn, field_for_columns);
218 val1 = NULL;
220 if (sort_field_for_columns >= 0 &&
221 !PQgetisnull(res, rn, sort_field_for_columns))
222 val1 = PQgetvalue(res, rn, sort_field_for_columns);
224 avlMergeValue(&piv_columns, val, val1);
226 if (piv_columns.count > CROSSTABVIEW_MAX_COLUMNS)
228 pg_log_error("\\crosstabview: maximum number of columns (%d) exceeded",
229 CROSSTABVIEW_MAX_COLUMNS);
230 goto error_return;
233 /* vertical */
234 val = PQgetisnull(res, rn, field_for_rows) ? NULL :
235 PQgetvalue(res, rn, field_for_rows);
237 avlMergeValue(&piv_rows, val, NULL);
241 * Second part: Generate sorted arrays from the AVL trees.
244 num_columns = piv_columns.count;
245 num_rows = piv_rows.count;
247 array_columns = (pivot_field *)
248 pg_malloc(sizeof(pivot_field) * num_columns);
250 array_rows = (pivot_field *)
251 pg_malloc(sizeof(pivot_field) * num_rows);
253 avlCollectFields(&piv_columns, piv_columns.root, array_columns, 0);
254 avlCollectFields(&piv_rows, piv_rows.root, array_rows, 0);
257 * Third part: optionally, process the ranking data for the horizontal
258 * header
260 if (sort_field_for_columns >= 0)
261 rankSort(num_columns, array_columns);
264 * Fourth part: print the crosstab'ed results.
266 retval = printCrosstab(res,
267 num_columns, array_columns, field_for_columns,
268 num_rows, array_rows, field_for_rows,
269 field_for_data);
271 error_return:
272 avlFree(&piv_columns, piv_columns.root);
273 avlFree(&piv_rows, piv_rows.root);
274 pg_free(array_columns);
275 pg_free(array_rows);
277 return retval;
281 * Output the pivoted resultset with the printTable* functions. Return true
282 * if successful, false otherwise.
284 static bool
285 printCrosstab(const PGresult *results,
286 int num_columns, pivot_field *piv_columns, int field_for_columns,
287 int num_rows, pivot_field *piv_rows, int field_for_rows,
288 int field_for_data)
290 printQueryOpt popt = pset.popt;
291 printTableContent cont;
292 int i,
294 char col_align;
295 int *horiz_map;
296 bool retval = false;
298 printTableInit(&cont, &popt.topt, popt.title, num_columns + 1, num_rows);
300 /* Step 1: set target column names (horizontal header) */
302 /* The name of the first column is kept unchanged by the pivoting */
303 printTableAddHeader(&cont,
304 PQfname(results, field_for_rows),
305 false,
306 column_type_alignment(PQftype(results,
307 field_for_rows)));
310 * To iterate over piv_columns[] by piv_columns[].rank, create a reverse
311 * map associating each piv_columns[].rank to its index in piv_columns.
312 * This avoids an O(N^2) loop later.
314 horiz_map = (int *) pg_malloc(sizeof(int) * num_columns);
315 for (i = 0; i < num_columns; i++)
316 horiz_map[piv_columns[i].rank] = i;
319 * The display alignment depends on its PQftype().
321 col_align = column_type_alignment(PQftype(results, field_for_data));
323 for (i = 0; i < num_columns; i++)
325 char *colname;
327 colname = piv_columns[horiz_map[i]].name ?
328 piv_columns[horiz_map[i]].name :
329 (popt.nullPrint ? popt.nullPrint : "");
331 printTableAddHeader(&cont, colname, false, col_align);
333 pg_free(horiz_map);
335 /* Step 2: set row names in the first output column (vertical header) */
336 for (i = 0; i < num_rows; i++)
338 int k = piv_rows[i].rank;
340 cont.cells[k * (num_columns + 1)] = piv_rows[i].name ?
341 piv_rows[i].name :
342 (popt.nullPrint ? popt.nullPrint : "");
344 cont.cellsadded = num_rows * (num_columns + 1);
347 * Step 3: fill in the content cells.
349 for (rn = 0; rn < PQntuples(results); rn++)
351 int row_number;
352 int col_number;
353 pivot_field *rp,
354 *cp;
355 pivot_field elt;
357 /* Find target row */
358 if (!PQgetisnull(results, rn, field_for_rows))
359 elt.name = PQgetvalue(results, rn, field_for_rows);
360 else
361 elt.name = NULL;
362 rp = (pivot_field *) bsearch(&elt,
363 piv_rows,
364 num_rows,
365 sizeof(pivot_field),
366 pivotFieldCompare);
367 Assert(rp != NULL);
368 row_number = rp->rank;
370 /* Find target column */
371 if (!PQgetisnull(results, rn, field_for_columns))
372 elt.name = PQgetvalue(results, rn, field_for_columns);
373 else
374 elt.name = NULL;
376 cp = (pivot_field *) bsearch(&elt,
377 piv_columns,
378 num_columns,
379 sizeof(pivot_field),
380 pivotFieldCompare);
381 Assert(cp != NULL);
382 col_number = cp->rank;
384 /* Place value into cell */
385 if (col_number >= 0 && row_number >= 0)
387 int idx;
389 /* index into the cont.cells array */
390 idx = 1 + col_number + row_number * (num_columns + 1);
393 * If the cell already contains a value, raise an error.
395 if (cont.cells[idx] != NULL)
397 pg_log_error("\\crosstabview: query result contains multiple data values for row \"%s\", column \"%s\"",
398 rp->name ? rp->name :
399 (popt.nullPrint ? popt.nullPrint : "(null)"),
400 cp->name ? cp->name :
401 (popt.nullPrint ? popt.nullPrint : "(null)"));
402 goto error;
405 cont.cells[idx] = !PQgetisnull(results, rn, field_for_data) ?
406 PQgetvalue(results, rn, field_for_data) :
407 (popt.nullPrint ? popt.nullPrint : "");
412 * The non-initialized cells must be set to an empty string for the print
413 * functions
415 for (i = 0; i < cont.cellsadded; i++)
417 if (cont.cells[i] == NULL)
418 cont.cells[i] = "";
421 printTable(&cont, pset.queryFout, false, pset.logfile);
422 retval = true;
424 error:
425 printTableCleanup(&cont);
427 return retval;
431 * The avl* functions below provide a minimalistic implementation of AVL binary
432 * trees, to efficiently collect the distinct values that will form the horizontal
433 * and vertical headers. It only supports adding new values, no removal or even
434 * search.
436 static void
437 avlInit(avl_tree *tree)
439 tree->end = (avl_node *) pg_malloc0(sizeof(avl_node));
440 tree->end->children[0] = tree->end->children[1] = tree->end;
441 tree->count = 0;
442 tree->root = tree->end;
445 /* Deallocate recursively an AVL tree, starting from node */
446 static void
447 avlFree(avl_tree *tree, avl_node *node)
449 if (node->children[0] != tree->end)
451 avlFree(tree, node->children[0]);
452 pg_free(node->children[0]);
454 if (node->children[1] != tree->end)
456 avlFree(tree, node->children[1]);
457 pg_free(node->children[1]);
459 if (node == tree->root)
461 /* free the root separately as it's not child of anything */
462 if (node != tree->end)
463 pg_free(node);
464 /* free the tree->end struct only once and when all else is freed */
465 pg_free(tree->end);
469 /* Set the height to 1 plus the greatest of left and right heights */
470 static void
471 avlUpdateHeight(avl_node *n)
473 n->height = 1 + (n->children[0]->height > n->children[1]->height ?
474 n->children[0]->height :
475 n->children[1]->height);
478 /* Rotate a subtree left (dir=0) or right (dir=1). Not recursive */
479 static avl_node *
480 avlRotate(avl_node **current, int dir)
482 avl_node *before = *current;
483 avl_node *after = (*current)->children[dir];
485 *current = after;
486 before->children[dir] = after->children[!dir];
487 avlUpdateHeight(before);
488 after->children[!dir] = before;
490 return after;
493 static int
494 avlBalance(avl_node *n)
496 return n->children[0]->height - n->children[1]->height;
500 * After an insertion, possibly rebalance the tree so that the left and right
501 * node heights don't differ by more than 1.
502 * May update *node.
504 static void
505 avlAdjustBalance(avl_tree *tree, avl_node **node)
507 avl_node *current = *node;
508 int b = avlBalance(current) / 2;
510 if (b != 0)
512 int dir = (1 - b) / 2;
514 if (avlBalance(current->children[dir]) == -b)
515 avlRotate(&current->children[dir], !dir);
516 current = avlRotate(node, dir);
518 if (current != tree->end)
519 avlUpdateHeight(current);
523 * Insert a new value/field, starting from *node, reaching the correct position
524 * in the tree by recursion. Possibly rebalance the tree and possibly update
525 * *node. Do nothing if the value is already present in the tree.
527 static void
528 avlInsertNode(avl_tree *tree, avl_node **node, pivot_field field)
530 avl_node *current = *node;
532 if (current == tree->end)
534 avl_node *new_node = (avl_node *)
535 pg_malloc(sizeof(avl_node));
537 new_node->height = 1;
538 new_node->field = field;
539 new_node->children[0] = new_node->children[1] = tree->end;
540 tree->count++;
541 *node = new_node;
543 else
545 int cmp = pivotFieldCompare(&field, &current->field);
547 if (cmp != 0)
549 avlInsertNode(tree,
550 cmp > 0 ? &current->children[1] : &current->children[0],
551 field);
552 avlAdjustBalance(tree, node);
557 /* Insert the value into the AVL tree, if it does not preexist */
558 static void
559 avlMergeValue(avl_tree *tree, char *name, char *sort_value)
561 pivot_field field;
563 field.name = name;
564 field.rank = tree->count;
565 field.sort_value = sort_value;
566 avlInsertNode(tree, &tree->root, field);
570 * Recursively extract node values into the names array, in sorted order with a
571 * left-to-right tree traversal.
572 * Return the next candidate offset to write into the names array.
573 * fields[] must be preallocated to hold tree->count entries
575 static int
576 avlCollectFields(avl_tree *tree, avl_node *node, pivot_field *fields, int idx)
578 if (node == tree->end)
579 return idx;
581 idx = avlCollectFields(tree, node->children[0], fields, idx);
582 fields[idx] = node->field;
583 return avlCollectFields(tree, node->children[1], fields, idx + 1);
586 static void
587 rankSort(int num_columns, pivot_field *piv_columns)
589 int *hmap; /* [[offset in piv_columns, rank], ...for
590 * every header entry] */
591 int i;
593 hmap = (int *) pg_malloc(sizeof(int) * num_columns * 2);
594 for (i = 0; i < num_columns; i++)
596 char *val = piv_columns[i].sort_value;
598 /* ranking information is valid if non null and matches /^-?\d+$/ */
599 if (val &&
600 ((*val == '-' &&
601 strspn(val + 1, "0123456789") == strlen(val + 1)) ||
602 strspn(val, "0123456789") == strlen(val)))
604 hmap[i * 2] = atoi(val);
605 hmap[i * 2 + 1] = i;
607 else
609 /* invalid rank information ignored (equivalent to rank 0) */
610 hmap[i * 2] = 0;
611 hmap[i * 2 + 1] = i;
615 qsort(hmap, num_columns, sizeof(int) * 2, rankCompare);
617 for (i = 0; i < num_columns; i++)
619 piv_columns[hmap[i * 2 + 1]].rank = i;
622 pg_free(hmap);
626 * Look up a column reference, which can be either:
627 * - a number from 1 to PQnfields(res)
628 * - a column name matching one of PQfname(res,...)
630 * Returns zero-based column number, or -1 if not found or ambiguous.
632 * Note: may modify contents of "arg" string.
634 static int
635 indexOfColumn(char *arg, const PGresult *res)
637 int idx;
639 if (arg[0] && strspn(arg, "0123456789") == strlen(arg))
641 /* if arg contains only digits, it's a column number */
642 idx = atoi(arg) - 1;
643 if (idx < 0 || idx >= PQnfields(res))
645 pg_log_error("\\crosstabview: column number %d is out of range 1..%d",
646 idx + 1, PQnfields(res));
647 return -1;
650 else
652 int i;
655 * Dequote and downcase the column name. By checking for all-digits
656 * before doing this, we can ensure that a quoted name is treated as a
657 * name even if it's all digits.
659 dequote_downcase_identifier(arg, true, pset.encoding);
661 /* Now look for match(es) among res' column names */
662 idx = -1;
663 for (i = 0; i < PQnfields(res); i++)
665 if (strcmp(arg, PQfname(res, i)) == 0)
667 if (idx >= 0)
669 /* another idx was already found for the same name */
670 pg_log_error("\\crosstabview: ambiguous column name: \"%s\"", arg);
671 return -1;
673 idx = i;
676 if (idx == -1)
678 pg_log_error("\\crosstabview: column name not found: \"%s\"", arg);
679 return -1;
683 return idx;
687 * Value comparator for vertical and horizontal headers
688 * used for deduplication only.
689 * - null values are considered equal
690 * - non-null < null
691 * - non-null values are compared with strcmp()
693 static int
694 pivotFieldCompare(const void *a, const void *b)
696 const pivot_field *pa = (const pivot_field *) a;
697 const pivot_field *pb = (const pivot_field *) b;
699 /* test null values */
700 if (!pb->name)
701 return pa->name ? -1 : 0;
702 else if (!pa->name)
703 return 1;
705 /* non-null values */
706 return strcmp(pa->name, pb->name);
709 static int
710 rankCompare(const void *a, const void *b)
712 return *((const int *) a) - *((const int *) b);