summaryrefslogtreecommitdiff
path: root/src/backend/commands/statscmds.c
diff options
context:
space:
mode:
authorTomas Vondra <tomas.vondra@postgresql.org>2021-09-01 17:41:54 +0200
committerTomas Vondra <tomas.vondra@postgresql.org>2021-09-01 18:08:43 +0200
commit50ba70a957f9e018495a111fc4b5e5eb2ea62044 (patch)
tree893632c00d63dc397fd13f04c1f0e7785c07f38c /src/backend/commands/statscmds.c
parentd760d942c73c9a161feefb7dc4a0004b9b4e7787 (diff)
Identify simple column references in extended statistics
Until now, when defining extended statistics, everything except a plain column reference was treated as a complex expression. So for example "a" was a column reference, but "(a)" would be an expression. In most cases this does not matter much, but there were a couple of strange consequences. For example CREATE STATISTICS s ON a FROM t; would fail, because extended stats require at least two columns. But CREATE STATISTICS s ON (a) FROM t; would succeed, because that requirement does not apply to expressions. Moreover, that statistics object is useless - the optimizer will always use the regular statistics collected for attribute "a". So do a bit more work to identify those expressions referencing a single column, and translate them to a simple column reference. Backpatch to 14, where support for extended statistics on expressions was introduced. Reported-by: Justin Pryzby Backpatch-through: 14 Discussion: https://postgr.es/m/20210816013255.GS10479%40telsasoft.com
Diffstat (limited to 'src/backend/commands/statscmds.c')
-rw-r--r--src/backend/commands/statscmds.c37
1 files changed, 31 insertions, 6 deletions
diff --git a/src/backend/commands/statscmds.c b/src/backend/commands/statscmds.c
index b244a0fbd7b..651b85ccc91 100644
--- a/src/backend/commands/statscmds.c
+++ b/src/backend/commands/statscmds.c
@@ -33,6 +33,7 @@
#include "optimizer/optimizer.h"
#include "statistics/statistics.h"
#include "utils/builtins.h"
+#include "utils/lsyscache.h"
#include "utils/fmgroids.h"
#include "utils/inval.h"
#include "utils/memutils.h"
@@ -210,13 +211,15 @@ CreateStatistics(CreateStatsStmt *stmt)
/*
* Convert the expression list to a simple array of attnums, but also keep
* a list of more complex expressions. While at it, enforce some
- * constraints.
+ * constraints - we don't allow extended statistics on system attributes,
+ * and we require the data type to have a less-than operator.
*
- * XXX We do only the bare minimum to separate simple attribute and
- * complex expressions - for example "(a)" will be treated as a complex
- * expression. No matter how elaborate the check is, there'll always be a
- * way around it, if the user is determined (consider e.g. "(a+0)"), so
- * it's not worth protecting against it.
+ * There are many ways to "mask" a simple attribute reference as an
+ * expression, for example "(a+0)" etc. We can't possibly detect all of
+ * them, but we handle at least the simple case with attribute in parens.
+ * There'll always be a way around this, if the user is determined (like
+ * the "(a+0)" example), but this makes it somewhat consistent with how
+ * indexes treat attributes/expressions.
*/
foreach(cell, stmt->exprs)
{
@@ -257,6 +260,28 @@ CreateStatistics(CreateStatsStmt *stmt)
nattnums++;
ReleaseSysCache(atttuple);
}
+ else if (IsA(selem->expr, Var)) /* column reference in parens */
+ {
+ Var *var = (Var *) selem->expr;
+ TypeCacheEntry *type;
+
+ /* Disallow use of system attributes in extended stats */
+ if (var->varattno <= 0)
+ ereport(ERROR,
+ (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
+ errmsg("statistics creation on system columns is not supported")));
+
+ /* Disallow data types without a less-than operator */
+ type = lookup_type_cache(var->vartype, TYPECACHE_LT_OPR);
+ if (type->lt_opr == InvalidOid)
+ ereport(ERROR,
+ (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
+ errmsg("column \"%s\" cannot be used in statistics because its type %s has no default btree operator class",
+ get_attname(relid, var->varattno, false), format_type_be(var->vartype))));
+
+ attnums[nattnums] = var->varattno;
+ nattnums++;
+ }
else /* expression */
{
Node *expr = selem->expr;