Commit 751a14e6 authored by Tom Lane's avatar Tom Lane

Repair longstanding violation of SQL92 semantics: GROUP BY would

interpret a column name as an output column alias (targetlist AS name),
ather than a real column name as it ought to.  According to the spec,
only ORDER BY should look at output column names.  I left in GROUP BY's
willingness to use an output column number ('GROUP BY 2'), even though
this is also contrary to the spec --- again, only ORDER BY is supposed
to accept that.  But there is no possible reason to want to GROUP BY
an integer constant, so keeping this old behavior won't break any
SQL-compliant queries.  DISTINCT ON will behave the same as GROUP BY.

Change numerology regress test, which depended on the incorrect
behavior.
parent b48f983e
...@@ -8,7 +8,7 @@ ...@@ -8,7 +8,7 @@
* *
* *
* IDENTIFICATION * IDENTIFICATION
* $Header: /cvsroot/pgsql/src/backend/parser/parse_clause.c,v 1.54 2000/02/15 23:09:08 tgl Exp $ * $Header: /cvsroot/pgsql/src/backend/parser/parse_clause.c,v 1.55 2000/02/19 23:45:05 tgl Exp $
* *
*------------------------------------------------------------------------- *-------------------------------------------------------------------------
*/ */
...@@ -721,7 +721,7 @@ parseFromClause(ParseState *pstate, List *frmList) ...@@ -721,7 +721,7 @@ parseFromClause(ParseState *pstate, List *frmList)
* node the ORDER BY, GROUP BY, or DISTINCT ON expression to be matched * node the ORDER BY, GROUP BY, or DISTINCT ON expression to be matched
* tlist the existing target list (NB: this cannot be NIL, which is a * tlist the existing target list (NB: this cannot be NIL, which is a
* good thing since we'd be unable to append to it...) * good thing since we'd be unable to append to it...)
* clause identifies clause type for error messages. * clause identifies clause type (mainly for error messages).
*/ */
static TargetEntry * static TargetEntry *
findTargetlistEntry(ParseState *pstate, Node *node, List *tlist, int clause) findTargetlistEntry(ParseState *pstate, Node *node, List *tlist, int clause)
...@@ -733,7 +733,7 @@ findTargetlistEntry(ParseState *pstate, Node *node, List *tlist, int clause) ...@@ -733,7 +733,7 @@ findTargetlistEntry(ParseState *pstate, Node *node, List *tlist, int clause)
/*---------- /*----------
* Handle two special cases as mandated by the SQL92 spec: * Handle two special cases as mandated by the SQL92 spec:
* *
* 1. ORDER/GROUP BY ColumnName * 1. ORDER BY ColumnName
* For a bare identifier, we search for a matching column name * For a bare identifier, we search for a matching column name
* in the existing target list. Multiple matches are an error * in the existing target list. Multiple matches are an error
* unless they refer to identical values; for example, * unless they refer to identical values; for example,
...@@ -741,17 +741,26 @@ findTargetlistEntry(ParseState *pstate, Node *node, List *tlist, int clause) ...@@ -741,17 +741,26 @@ findTargetlistEntry(ParseState *pstate, Node *node, List *tlist, int clause)
* but not SELECT a AS b, b FROM table ORDER BY b * but not SELECT a AS b, b FROM table ORDER BY b
* If no match is found, we fall through and treat the identifier * If no match is found, we fall through and treat the identifier
* as an expression. * as an expression.
* We do NOT attempt this match for GROUP BY, since it is clearly
* contrary to the spec to use an output column name in preference
* to an underlying column name in GROUP BY. DISTINCT ON isn't in
* the standard, so we can do what we like there; we choose to make
* it work like GROUP BY.
* *
* 2. ORDER/GROUP BY IntegerConstant * 2. ORDER BY/GROUP BY/DISTINCT ON IntegerConstant
* This means to use the n'th item in the existing target list. * This means to use the n'th item in the existing target list.
* Note that it would make no sense to order/group by an actual * Note that it would make no sense to order/group/distinct by an
* constant, so this does not create a conflict with our extension * actual constant, so this does not create a conflict with our
* to order/group by an expression. * extension to order/group by an expression.
* I believe that GROUP BY column-number is not sanctioned by SQL92,
* but since the standard has no other behavior defined for this
* syntax, we may as well continue to support our past behavior.
* *
* Note that pre-existing resjunk targets must not be used in either case. * Note that pre-existing resjunk targets must not be used in either case.
*---------- *----------
*/ */
if (IsA(node, Ident) && ((Ident *) node)->indirection == NIL) if (clause == ORDER_CLAUSE &&
IsA(node, Ident) && ((Ident *) node)->indirection == NIL)
{ {
char *name = ((Ident *) node)->name; char *name = ((Ident *) node)->name;
foreach(tl, tlist) foreach(tl, tlist)
......
...@@ -88,7 +88,7 @@ SELECT DISTINCT f1 AS two FROM TEMP_GROUP; ...@@ -88,7 +88,7 @@ SELECT DISTINCT f1 AS two FROM TEMP_GROUP;
SELECT f1 AS two, max(f3) AS max_float, min(f3) as min_float SELECT f1 AS two, max(f3) AS max_float, min(f3) as min_float
FROM TEMP_GROUP FROM TEMP_GROUP
GROUP BY two GROUP BY f1
ORDER BY two, max_float, min_float; ORDER BY two, max_float, min_float;
two | max_float | min_float two | max_float | min_float
-----+----------------------+----------------------- -----+----------------------+-----------------------
...@@ -96,19 +96,17 @@ SELECT f1 AS two, max(f3) AS max_float, min(f3) as min_float ...@@ -96,19 +96,17 @@ SELECT f1 AS two, max(f3) AS max_float, min(f3) as min_float
2 | 0 | -1.2345678901234e+200 2 | 0 | -1.2345678901234e+200
(2 rows) (2 rows)
-- Postgres used to accept this, but it is clearly against SQL92 to
-- interpret GROUP BY arguments as result column names; they should
-- be source column names *only*. An error is expected.
SELECT f1 AS two, max(f3) AS max_float, min(f3) AS min_float SELECT f1 AS two, max(f3) AS max_float, min(f3) AS min_float
FROM TEMP_GROUP FROM TEMP_GROUP
GROUP BY two GROUP BY two
ORDER BY two, max_float, min_float; ORDER BY two, max_float, min_float;
two | max_float | min_float ERROR: Attribute 'two' not found
-----+----------------------+-----------------------
1 | 1.2345678901234e+200 | 0
2 | 0 | -1.2345678901234e+200
(2 rows)
SELECT f1 AS two, (max(f3) + 1) AS max_plus_1, (min(f3) - 1) AS min_minus_1 SELECT f1 AS two, (max(f3) + 1) AS max_plus_1, (min(f3) - 1) AS min_minus_1
FROM TEMP_GROUP FROM TEMP_GROUP
GROUP BY two GROUP BY f1
ORDER BY two, min_minus_1; ORDER BY two, min_minus_1;
two | max_plus_1 | min_minus_1 two | max_plus_1 | min_minus_1
-----+----------------------+----------------------- -----+----------------------+-----------------------
...@@ -116,14 +114,16 @@ SELECT f1 AS two, (max(f3) + 1) AS max_plus_1, (min(f3) - 1) AS min_minus_1 ...@@ -116,14 +114,16 @@ SELECT f1 AS two, (max(f3) + 1) AS max_plus_1, (min(f3) - 1) AS min_minus_1
2 | 1 | -1.2345678901234e+200 2 | 1 | -1.2345678901234e+200
(2 rows) (2 rows)
SELECT f1 AS two, (max(f3) + 1) AS max_plus_1, (min(f3) - 1) AS min_minus_1 SELECT f1 AS two,
max(f2) + min(f2) AS max_plus_min,
min(f3) - 1 AS min_minus_1
FROM TEMP_GROUP FROM TEMP_GROUP
GROUP BY two GROUP BY f1
ORDER BY two, min_minus_1; ORDER BY two, min_minus_1;
two | max_plus_1 | min_minus_1 two | max_plus_min | min_minus_1
-----+----------------------+----------------------- -----+--------------+-----------------------
1 | 1.2345678901234e+200 | -1 1 | 0 | -1
2 | 1 | -1.2345678901234e+200 2 | 0 | -1.2345678901234e+200
(2 rows) (2 rows)
DROP TABLE TEMP_INT2; DROP TABLE TEMP_INT2;
......
...@@ -67,9 +67,12 @@ SELECT DISTINCT f1 AS two FROM TEMP_GROUP; ...@@ -67,9 +67,12 @@ SELECT DISTINCT f1 AS two FROM TEMP_GROUP;
SELECT f1 AS two, max(f3) AS max_float, min(f3) as min_float SELECT f1 AS two, max(f3) AS max_float, min(f3) as min_float
FROM TEMP_GROUP FROM TEMP_GROUP
GROUP BY two GROUP BY f1
ORDER BY two, max_float, min_float; ORDER BY two, max_float, min_float;
-- Postgres used to accept this, but it is clearly against SQL92 to
-- interpret GROUP BY arguments as result column names; they should
-- be source column names *only*. An error is expected.
SELECT f1 AS two, max(f3) AS max_float, min(f3) AS min_float SELECT f1 AS two, max(f3) AS max_float, min(f3) AS min_float
FROM TEMP_GROUP FROM TEMP_GROUP
GROUP BY two GROUP BY two
...@@ -77,12 +80,14 @@ SELECT f1 AS two, max(f3) AS max_float, min(f3) AS min_float ...@@ -77,12 +80,14 @@ SELECT f1 AS two, max(f3) AS max_float, min(f3) AS min_float
SELECT f1 AS two, (max(f3) + 1) AS max_plus_1, (min(f3) - 1) AS min_minus_1 SELECT f1 AS two, (max(f3) + 1) AS max_plus_1, (min(f3) - 1) AS min_minus_1
FROM TEMP_GROUP FROM TEMP_GROUP
GROUP BY two GROUP BY f1
ORDER BY two, min_minus_1; ORDER BY two, min_minus_1;
SELECT f1 AS two, (max(f3) + 1) AS max_plus_1, (min(f3) - 1) AS min_minus_1 SELECT f1 AS two,
max(f2) + min(f2) AS max_plus_min,
min(f3) - 1 AS min_minus_1
FROM TEMP_GROUP FROM TEMP_GROUP
GROUP BY two GROUP BY f1
ORDER BY two, min_minus_1; ORDER BY two, min_minus_1;
DROP TABLE TEMP_INT2; DROP TABLE TEMP_INT2;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment