WL#1972 "Evaluate HAVING before SELECT"

- more tests, post-review changes, bug-fixes, simplifications, and improved comments

WL#1972 "Evaluate HAVING before SELECT"
- more tests, post-review changes, bug-fixes, simplifications, and improved comments
660e1236 · timour@mysql.com · 7031a0b0 · 660e1236 · 660e1236 · 660e1236
Commit 660e1236 authored Nov 05, 2004 by timour@mysql.com
Showing with 520 additions and 325 deletions

mysql-test/r/having.result mysql-test/r/having.result +124 -50

mysql-test/t/having.test mysql-test/t/having.test +134 -62

sql/item.cc sql/item.cc +259 -209

sql/sql_base.cc sql/sql_base.cc +3 -4

No files found.
--- a/mysql-test/r/having.result
+++ b/mysql-test/r/having.result
-drop table if exists t1,t2;
+drop table if exists t1,t2,t3;
 create table t1 (a int);
 select count(a) as b from t1 where a=0 having b > 0;
 b
@@ -128,74 +128,76 @@ id	description	c
 1	test	0
 2	test2	0
 drop table t1,t2,t3;
-drop table if exists wl1972;
+create table t1 (col1 int, col2 varchar(5), col_t1 int);
-create table wl1972 (
+create table t2 (col1 int, col2 varchar(5), col_t2 int);
-col1 int, 
+create table t3 (col1 int, col2 varchar(5), col_t3 int);
-col2 varchar(5) character set latin1 collate latin1_bin) 
+insert into t1 values(10,'hello',10);
-engine=innodb;
+insert into t1 values(20,'hello',20);
-insert into wl1972 values(10,'hello');
+insert into t1 values(30,'hello',30);
-insert into wl1972 values(20,'hello');
+insert into t1 values(10,'bye',10);
-insert into wl1972 values(30,'hello');
+insert into t1 values(10,'sam',10);
-insert into wl1972 values(10,'bye');
+insert into t1 values(10,'bob',10);
-insert into wl1972 values(10,'sam');
+insert into t2 select * from t1;
-insert into wl1972 values(10,'bob');
+insert into t3 select * from t1;
-select count(*) from wl1972 group by col1 having col1 = 10;
+select count(*) from t1 group by col1 having col1 = 10;
 count(*)
 4
-select count(*) as count_col1 from wl1972 group by col1 having col1 = 10;
+select count(*) as count_col1 from t1 group by col1 having col1 = 10;
 count_col1
 4
-select count(*) as count_col1 from wl1972 as t1 group by col1 having col1 = 10;
+select count(*) as count_col1 from t1 as tmp1 group by col1 having col1 = 10;
 count_col1
 4
-select count(*) from wl1972 group by col2 having col2 = 'hello';
+select count(*) from t1 group by col2 having col2 = 'hello';
 count(*)
 3
-select count(*) from wl1972 group by col2 having col1 = 10;
+select count(*) from t1 group by col2 having col1 = 10;
 ERROR 42S22: Unknown column 'col1' in 'having clause'
-select col1 as count_col1 from wl1972 as t1 group by col1 having col1 = 10;
+select col1 as count_col1 from t1 as tmp1 group by col1 having col1 = 10;
 count_col1
 10
-select col1 as count_col1 from wl1972 as t1 group by col1 having count_col1 = 10;
+select col1 as count_col1 from t1 as tmp1 group by col1 having count_col1 = 10;
 count_col1
 10
-select col1 as count_col1 from wl1972 as t1 group by count_col1 having col1 = 10;
+select col1 as count_col1 from t1 as tmp1 group by count_col1 having col1 = 10;
 count_col1
 10
-select col1 as count_col1 from wl1972 as t1 group by count_col1 having count_col1 = 10;
+select col1 as count_col1 from t1 as tmp1 group by count_col1 having count_col1 = 10;
 count_col1
 10
-select col1 as count_col1,col2 from wl1972 as t1 group by col1,col2 having col1 = 10;
+select col1 as count_col1,col2 from t1 as tmp1 group by col1,col2 having col1 = 10;
 count_col1	col2
 10	bob
 10	bye
 10	hello
 10	sam
-select col1 as count_col1,col2 from wl1972 as t1 group by col1,col2 having count_col1 = 10;
+select col1 as count_col1,col2 from t1 as tmp1 group by col1,col2 having count_col1 = 10;
 count_col1	col2
 10	bob
 10	bye
 10	hello
 10	sam
-select col1 as count_col1,col2 from wl1972 as t1 group by col1,col2 having col2 = 'hello';
+select col1 as count_col1,col2 from t1 as tmp1 group by col1,col2 having col2 = 'hello';
 count_col1	col2
 10	hello
 20	hello
 30	hello
-select col1 as count_col1,col2 as group_col2 from wl1972 as t1 
+select col1 as count_col1,col2 as group_col2 from t1 as tmp1 group by col1,col2 having group_col2 = 'hello';
-group by col1,col2 having group_col2 = 'hello';
 count_col1	group_col2
 10	hello
 20	hello
 30	hello
-select sum(col1) as co12 from wl1972 group by col2 having col2 10;
+select sum(col1) as co12 from t1 group by col2 having col2 10;
 ERROR 42000: You have an error in your SQL syntax; check the manual that corresponds to your MySQL server version for the right syntax to use near '10' at line 1
-select sum(col1) as co2, count(col2) as cc from wl1972 group by col1 having col1 =10;
+select sum(col1) as co2, count(col2) as cc from t1 group by col1 having col1 =10;
 co2	cc
 40	4
-select t1.col1 from wl1972 as t1 where t1.col2 in 
+select t2.col2 from t2 group by t2.col1, t2.col2 having t1.col1 <= 10;
-(select t2.col2 from wl1972 as t2 
+ERROR 42S22: Unknown column 't1.col1' in 'having clause'
-group by t2.col1,t2.col2 having t2.col1<=10);
+select t1.col1 from t1
+where t1.col2 in 
+(select t2.col2 from t2 
+group by t2.col1, t2.col2 having t2.col1 <= 10);
 col1
 10
 20
@@ -203,10 +205,12 @@ col1
 10
 10
 10
-select t1.col1 from wl1972 as t1 where t1.col2 in 
+select t1.col1 from t1
-(select t2.col2 from wl1972 as t2 
+where t1.col2 in 
-group by t2.col1,t2.col2 having t2.col1<=
+(select t2.col2 from t2
-(select min(t3.col1) from wl1972 as t3));
+group by t2.col1, t2.col2
+having t2.col1 <=
+(select min(t3.col1) from t3));
 col1
 10
 20
@@ -214,36 +218,106 @@ col1
 10
 10
 10
-drop table wl1972;
+select t1.col1 from t1
-create table wl1972 (s1 int);
+where t1.col2 in
-insert into wl1972 values (1),(2),(3);
+(select t2.col2 from t2 
-select count(*) from wl1972 group by s1 having s1 is null;
+group by t2.col1, t2.col2 having t1.col1 <= 10);
+col1
+10
+10
+10
+10
+select t1.col1 as tmp_col from t1
+where t1.col2 in 
+(select t2.col2 from t2 
+group by t2.col1, t2.col2 having tmp_col <= 10);
+tmp_col
+10
+10
+10
+10
+select t1.col1 from t1
+where t1.col2 in 
+(select t2.col2 from t2 
+group by t2.col1, t2.col2 having col_t1 <= 10);
+col1
+10
+10
+10
+10
+select t1.col1 from t1
+where t1.col2 in 
+(select t2.col2 from t2 
+group by t2.col1, t2.col2 having col_t1 <= 10)
+having col_t1 <= 20;
+ERROR 42S22: Unknown column 'col_t1' in 'having clause'
+select t1.col1 from t1
+where t1.col2 in 
+(select t2.col2 from t2 
+group by t2.col1, t2.col2 having col_t1 <= 10)
+group by col_t1
+having col_t1 <= 20;
+col1
+10
+select col_t1, sum(col1) from t1
+group by col_t1
+having col_t1 > 10 and
+exists (select sum(t2.col1) from t2
+group by t2.col2 having t2.col2 > 'b');
+col_t1	sum(col1)
+20	20
+30	30
+select sum(col1) from t1
+group by col_t1
+having col_t1 in (select sum(t2.col1) from t2
+group by t2.col2, t2.col1 having t2.col1 = t1.col1);
+ERROR 42S22: Unknown column 't1.col1' in 'having clause'
+select sum(col1) from t1
+group by col_t1
+having col_t1 in (select sum(t2.col1) from t2
+group by t2.col2, t2.col1 having t2.col1 = col_t1);
+sum(col1)
+40
+20
+30
+select t1.col1, t2.col1 from t1, t2 where t1.col1 = t2.col1
+group by t1.col1, t2.col1 having col1 = 2;
+ERROR 23000: Column 'col1' in having clause is ambiguous
+select t1.col1*10+t2.col1 from t1,t2 where t1.col1=t2.col1
+group by t1.col1, t2.col1 having col1 = 2;
+ERROR 23000: Column 'col1' in having clause is ambiguous
+drop table t1, t2, t3;
+create table t1 (s1 int);
+insert into t1 values (1),(2),(3);
+select count(*) from t1 group by s1 having s1 is null;
 count(*)
-select s1*0 as s1 from wl1972 group by s1 having s1 <> 0;
+select s1*0 as s1 from t1 group by s1 having s1 <> 0;
 s1
 0
 0
 0
-select s1*0 from wl1972 group by s1 having s1 = 0;
+Warnings:
+Warning	1052	Column 's1' in having clause is ambiguous
+select s1*0 from t1 group by s1 having s1 = 0;
 s1*0
-select s1 from wl1972 group by 1 having 1 = 0;
+select s1 from t1 group by 1 having 1 = 0;
 s1
-select count(s1) from wl1972 group by s1 having count(1+1)=2;
+select count(s1) from t1 group by s1 having count(1+1)=2;
 count(s1)
-select count(s1) from wl1972 group by s1 having s1*0=0;
+select count(s1) from t1 group by s1 having s1*0=0;
 count(s1)
 1
 1
 1
-select * from wl1972 a, wl1972 b group by a.s1 having s1 is null;
+select * from t1 a, t1 b group by a.s1 having s1 is null;
 ERROR 23000: Column 's1' in having clause is ambiguous
-drop table wl1972;
+drop table t1;
-create table wl1972 (s1 char character set latin1 collate latin1_german1_ci);
+create table t1 (s1 char character set latin1 collate latin1_german1_ci);
-insert into wl1972 values ('ü'),('y');
+insert into t1 values ('ü'),('y');
 Warnings:
 Warning	1265	Data truncated for column 's1' at row 1
-select s1,count(s1) from wl1972
+select s1,count(s1) from t1
 group by s1 collate latin1_swedish_ci having s1 = 'y';
 s1	count(s1)
 y	1
-drop table wl1972;
+drop table t1;
--- a/mysql-test/t/having.test
+++ b/mysql-test/t/having.test
@@ -2,7 +2,7 @@
 #
 --disable_warnings
-drop table if exists t1,t2;
+drop table if exists t1,t2,t3;
 --enable_warnings
 create table t1 (a int);
@@ -134,108 +134,180 @@ drop table t1,t2,t3;
 # set global sql_mode='ansi';
 # set session sql_mode='ansi';
--disable_warnings
+create table t1 (col1 int, col2 varchar(5), col_t1 int);
-drop table if exists wl1972;
+create table t2 (col1 int, col2 varchar(5), col_t2 int);
--enable_warnings
+create table t3 (col1 int, col2 varchar(5), col_t3 int);
-create table wl1972 (
-   col1 int, 
-   col2 varchar(5) character set latin1 collate latin1_bin) 
-engine=innodb;
-insert into wl1972 values(10,'hello');
-insert into wl1972 values(20,'hello');
-insert into wl1972 values(30,'hello');
-insert into wl1972 values(10,'bye');
-insert into wl1972 values(10,'sam');
-insert into wl1972 values(10,'bob');
-select count(*) from wl1972 group by col1 having col1 = 10;
+insert into t1 values(10,'hello',10);
+insert into t1 values(20,'hello',20);
+insert into t1 values(30,'hello',30);
+insert into t1 values(10,'bye',10);
+insert into t1 values(10,'sam',10);
+insert into t1 values(10,'bob',10);
-select count(*) as count_col1 from wl1972 group by col1 having col1 = 10;
+insert into t2 select * from t1;
+insert into t3 select * from t1;
-select count(*) as count_col1 from wl1972 as t1 group by col1 having col1 = 10;
-select count(*) from wl1972 group by col2 having col2 = 'hello';
+select count(*) from t1 group by col1 having col1 = 10;
+select count(*) as count_col1 from t1 group by col1 having col1 = 10;
+select count(*) as count_col1 from t1 as tmp1 group by col1 having col1 = 10;
+select count(*) from t1 group by col2 having col2 = 'hello';
 --error 1054
-select count(*) from wl1972 group by col2 having col1 = 10;
+select count(*) from t1 group by col2 having col1 = 10;
+select col1 as count_col1 from t1 as tmp1 group by col1 having col1 = 10;
-select col1 as count_col1 from wl1972 as t1 group by col1 having col1 = 10;
+select col1 as count_col1 from t1 as tmp1 group by col1 having count_col1 = 10;
+select col1 as count_col1 from t1 as tmp1 group by count_col1 having col1 = 10;
-select col1 as count_col1 from wl1972 as t1 group by col1 having count_col1 = 10;
-select col1 as count_col1 from wl1972 as t1 group by count_col1 having col1 = 10;
 # ANSI: should return SQLSTATE 42000 Syntax error or access violation 
 # MySQL: returns 10 - because of GROUP BY name resolution
+select col1 as count_col1 from t1 as tmp1 group by count_col1 having count_col1 = 10;
-select col1 as count_col1 from wl1972 as t1 group by count_col1 having count_col1 = 10;
 # ANSI: should return SQLSTATE 42000 Syntax error or access violation 
 # MySQL: returns 10 - because of GROUP BY name resolution
+select col1 as count_col1,col2 from t1 as tmp1 group by col1,col2 having col1 = 10;
+select col1 as count_col1,col2 from t1 as tmp1 group by col1,col2 having count_col1 = 10;
+select col1 as count_col1,col2 from t1 as tmp1 group by col1,col2 having col2 = 'hello';
+select col1 as count_col1,col2 as group_col2 from t1 as tmp1 group by col1,col2 having group_col2 = 'hello';
+--error 1064
+select sum(col1) as co12 from t1 group by col2 having col2 10; 
+select sum(col1) as co2, count(col2) as cc from t1 group by col1 having col1 =10; 
+--error 1054
+select t2.col2 from t2 group by t2.col1, t2.col2 having t1.col1 <= 10;
-select col1 as count_col1,col2 from wl1972 as t1 group by col1,col2 having col1 = 10;
-select col1 as count_col1,col2 from wl1972 as t1 group by col1,col2 having count_col1 = 10;
+#
+# queries with nested sub-queries
+#
-select col1 as count_col1,col2 from wl1972 as t1 group by col1,col2 having col2 = 'hello';
+# the having column is resolved in the same query
+select t1.col1 from t1
+where t1.col2 in 
+      (select t2.col2 from t2 
+       group by t2.col1, t2.col2 having t2.col1 <= 10);
+select t1.col1 from t1
+where t1.col2 in 
+      (select t2.col2 from t2
+       group by t2.col1, t2.col2
+       having t2.col1 <=
+              (select min(t3.col1) from t3));
+# the having column is resolved in the SELECT clause of the outer query -
+# works in ANSI
+select t1.col1 from t1
+where t1.col2 in
+      (select t2.col2 from t2 
+       group by t2.col1, t2.col2 having t1.col1 <= 10);
+# the having column is resolved in the SELECT clause of the outer query -
+# error in ANSI, works with MySQL extension
+select t1.col1 as tmp_col from t1
+where t1.col2 in 
+      (select t2.col2 from t2 
+       group by t2.col1, t2.col2 having tmp_col <= 10);
+# the having column is resolved in the FROM clause of the outer query -
+# works in ANSI
+select t1.col1 from t1
+where t1.col2 in 
+      (select t2.col2 from t2 
+       group by t2.col1, t2.col2 having col_t1 <= 10);
+# nested queries with HAVING, inner having column resolved in outer FROM clause
+# the outer having column is not referenced in GROUP BY which results in an error
+--error 1054
+select t1.col1 from t1
+where t1.col2 in 
+      (select t2.col2 from t2 
+       group by t2.col1, t2.col2 having col_t1 <= 10)
+having col_t1 <= 20;
-select col1 as count_col1,col2 as group_col2 from wl1972 as t1 
+# both having columns are resolved in the GROUP clause of the outer query
-group by col1,col2 having group_col2 = 'hello';
+select t1.col1 from t1
+where t1.col2 in 
+      (select t2.col2 from t2 
+       group by t2.col1, t2.col2 having col_t1 <= 10)
+group by col_t1
+having col_t1 <= 20;
--error 1064
-select sum(col1) as co12 from wl1972 group by col2 having col2 10; 
-select sum(col1) as co2, count(col2) as cc from wl1972 group by col1 having col1 =10; 
+#
+# nested HAVING clauses
+#
-select t1.col1 from wl1972 as t1 where t1.col2 in 
+# non-correlated subqueries
-   (select t2.col2 from wl1972 as t2 
+select col_t1, sum(col1) from t1
-     group by t2.col1,t2.col2 having t2.col1<=10);
+group by col_t1
+having col_t1 > 10 and
+       exists (select sum(t2.col1) from t2
+               group by t2.col2 having t2.col2 > 'b');
-select t1.col1 from wl1972 as t1 where t1.col2 in 
+# correlated subqueries - inner having column 't1.col2' resolves to
-   (select t2.col2 from wl1972 as t2 
+# the outer FROM clause, which cannot be used because the outer query
-     group by t2.col1,t2.col2 having t2.col1<=
+# is grouped
-        (select min(t3.col1) from wl1972 as t3));
+--error 1054
+select sum(col1) from t1
+group by col_t1
+having col_t1 in (select sum(t2.col1) from t2
+                  group by t2.col2, t2.col1 having t2.col1 = t1.col1);
+# correlated subqueries - inner having column 'col_t1' resolves to
+# the outer GROUP clause
+select sum(col1) from t1
+group by col_t1
+having col_t1 in (select sum(t2.col1) from t2
+                  group by t2.col2, t2.col1 having t2.col1 = col_t1);
-drop table wl1972;
+#
+# queries with joins and ambiguous column names
+#
+--error 1052
+select t1.col1, t2.col1 from t1, t2 where t1.col1 = t2.col1
+group by t1.col1, t2.col1 having col1 = 2;
+--error 1052
+select t1.col1*10+t2.col1 from t1,t2 where t1.col1=t2.col1
+group by t1.col1, t2.col1 having col1 = 2;
+drop table t1, t2, t3;
 # More queries to test ANSI compatibility
-create table wl1972 (s1 int);
+create table t1 (s1 int);
-insert into wl1972 values (1),(2),(3);
+insert into t1 values (1),(2),(3);
-select count(*) from wl1972 group by s1 having s1 is null;
+select count(*) from t1 group by s1 having s1 is null;
-select s1*0 as s1 from wl1972 group by s1 having s1 <> 0;
+select s1*0 as s1 from t1 group by s1 having s1 <> 0;
 # ANSI requires: 3 rows
 # MySQL returns: 0 rows - because of GROUP BY name resolution
-select s1*0 from wl1972 group by s1 having s1 = 0;
+select s1*0 from t1 group by s1 having s1 = 0;
-select s1 from wl1972 group by 1 having 1 = 0;
+select s1 from t1 group by 1 having 1 = 0;
-select count(s1) from wl1972 group by s1 having count(1+1)=2;
+select count(s1) from t1 group by s1 having count(1+1)=2;
 # ANSI requires: 3 rows
 # MySQL returns: 0 rows - because of GROUP BY name resolution
-select count(s1) from wl1972 group by s1 having s1*0=0;
+select count(s1) from t1 group by s1 having s1*0=0;
 -- error 1052
-select * from wl1972 a, wl1972 b group by a.s1 having s1 is null;
+select * from t1 a, t1 b group by a.s1 having s1 is null;
 # ANSI requires: 0 rows
 # MySQL returns:
 # "ERROR 1052 (23000): Column 's1' in having clause is ambiguous"
 # I think the column is ambiguous in ANSI too.
 # It is the same as:
-#   select a.s1, b.s1 from wl1972 a, wl1972 b group by a.s1 having s1 is null;
+#   select a.s1, b.s1 from t1 a, t1 b group by a.s1 having s1 is null;
 # currently we first check SELECT, thus s1 is ambiguous.
-drop table wl1972;
+drop table t1;
-create table wl1972 (s1 char character set latin1 collate latin1_german1_ci);
+create table t1 (s1 char character set latin1 collate latin1_german1_ci);
-insert into wl1972 values ('ü'),('y');
+insert into t1 values ('ü'),('y');
-select s1,count(s1) from wl1972
+select s1,count(s1) from t1
 group by s1 collate latin1_swedish_ci having s1 = 'y';
 # ANSI requires: 1 row, with count(s1) = 2
 # MySQL returns: 1 row, with count(s1) = 1
-drop table wl1972;
+drop table t1;
--- a/sql/item.cc
+++ b/sql/item.cc
@@ -2320,23 +2320,44 @@ static Item** find_field_in_group_list(Item *find_item, ORDER *group_list)
      else
        continue;
-      if (cur_field->table_name && table_name &&
+      if (cur_field->table_name && table_name)
-          !strcmp(cur_field->table_name, table_name))
+      {
-      { /* If field_name is qualified by a table name. */
+        /* If field_name is qualified by a table name. */
+        if (strcmp(cur_field->table_name, table_name))
+          /* Same field names, different tables. */
+          return NULL;
        ++cur_match_degree;
-        if (cur_field->db_name && db_name &&
+        if (cur_field->db_name && db_name)
-            !strcmp(cur_field->db_name, db_name))
+        {
          /* If field_name is also qualified by a database name. */
+          if (strcmp(cur_field->db_name, db_name))
+            /* Same field names, different databases. */
+            return NULL;
          ++cur_match_degree;
        }
+      }
      if (cur_match_degree > found_match_degree)
      {
        found_match_degree= cur_match_degree;
        found_group= cur_group;
      }
+      else if (found_group && (cur_match_degree == found_match_degree) &&
+               ! (*(found_group->item))->eq(cur_field, 0))
+      {
+        /*
+          If the current resolve candidate matches equally well as the current
+          best match, they must reference the same column, otherwise the field
+          is ambiguous.
+        */
+        my_printf_error(ER_NON_UNIQ_ERROR, ER(ER_NON_UNIQ_ERROR),
+                        MYF(0), find_item->full_name(), current_thd->where);
+        return NULL;
+      }
    }
  }
  if (found_group)
    return found_group->item;
  else
@@ -2344,6 +2365,97 @@ static Item** find_field_in_group_list(Item *find_item, ORDER *group_list)
 }
+/*
+  Resolve a column reference in a sub-select.
+  SYNOPSIS
+    resolve_ref_in_select_and_group()
+    thd     current thread
+    ref     column reference being resolved
+    select  the sub-select that ref is resolved against
+  DESCRIPTION
+    Resolve a column reference (usually inside a HAVING clause) against the
+    SELECT and GROUP BY clauses of the query described by 'select'. The name
+    resolution algorithm searches both the SELECT and GROUP BY clauses, and in
+    case of a name conflict prefers GROUP BY column names over SELECT names. If
+    both clauses contain different fields with the same names, a warning is
+    issued that name of 'ref' is ambiguous. We extend ANSI SQL in that when no
+    GROUP BY column is found, then a HAVING name is resolved as a possibly
+    derived SELECT column.
+  NOTES
+    The resolution procedure is:
+    - Search for a column or derived column named col_ref_i [in table T_j]
+      in the SELECT clause of Q.
+    - Search for a column named col_ref_i [in table T_j]
+      in the GROUP BY clause of Q.
+    - If found different columns with the same name in GROUP BY and SELECT
+      - issue a warning and return the GROUP BY column,
+      - otherwise return the found SELECT column.
+  RETURN
+    NULL - there was an error, and the error was already reported
+    not_found_item - the item was not resolved, no error was reported
+    resolved item - if the item was resolved
+*/
+static Item**
+resolve_ref_in_select_and_group(THD *thd, Item_ref *ref, SELECT_LEX *select)
+{
+  Item **group_by_ref= NULL;
+  Item **select_ref= NULL;
+  ORDER *group_list= (ORDER*) select->group_list.first;
+  bool ambiguous_fields= FALSE;
+  uint counter;
+  /*
+    Search for a column or derived column named as 'ref' in the SELECT
+    clause of the current select.
+  */
+  if (!(select_ref= find_item_in_list(ref, *(select->get_item_list()), &counter,
+                                      REPORT_EXCEPT_NOT_FOUND)))
+    return NULL; /* Some error occurred. */
+  /* If this is a non-aggregated field inside HAVING, search in GROUP BY. */
+  if (select->having_fix_field && !ref->with_sum_func && group_list)
+  {
+    group_by_ref= find_field_in_group_list(ref, group_list);
+    /* Check if the fields found in SELECT and GROUP BY are the same field. */
+    if (group_by_ref && (select_ref != not_found_item) &&
+        !((*group_by_ref)->eq(*select_ref, 0)))
+    {
+      ambiguous_fields= TRUE;
+      push_warning_printf(thd, MYSQL_ERROR::WARN_LEVEL_WARN, ER_NON_UNIQ_ERROR,
+                          ER(ER_NON_UNIQ_ERROR), ref->full_name(),
+                          current_thd->where);
+    }
+  }
+  if (select_ref != not_found_item || group_by_ref)
+  {
+    if (select_ref != not_found_item && !ambiguous_fields)
+    {
+      if (*select_ref && !(*select_ref)->fixed)
+      {
+        my_error(ER_ILLEGAL_REFERENCE, MYF(0), ref->name,
+                 "forward reference in item list");
+        return NULL;
+      }
+      return (select->ref_pointer_array + counter);
+    }
+    else if (group_by_ref)
+      return group_by_ref;
+    else
+      DBUG_ASSERT(FALSE);
+  }
+  else
+    return (Item**) not_found_item;
+}
 /*
  Resolve the name of a column reference.
@@ -2356,38 +2468,30 @@ static Item** find_field_in_group_list(Item *find_item, ORDER *group_list)
  DESCRIPTION
    The method resolves the column reference represented by 'this' as a column
    present in one of: GROUP BY clause, SELECT clause, outer queries. It is
-    used for columns in the HAVING clause which are not under aggregate
+    used typically for columns in the HAVING clause which are not under
-    functions.
+    aggregate functions.
  NOTES
-    The general idea behind the name resolution algorithm is that it searches
-    both the SELECT and GROUP BY clauses, and in case of a name conflict
-    prefers GROUP BY column names over SELECT names. We extend ANSI SQL in that
-    when no GROUP BY column is found, then a HAVING name is resolved as a
-    possibly derived SELECT column.
    The name resolution algorithm used is:
      resolve_extended([T_j].col_ref_i)
      {
        Search for a column or derived column named col_ref_i [in table T_j]
-        in the SELECT list of Q.
+        in the SELECT and GROUP clauses of Q.
-        Search for a column named col_ref_i [in table T_j]
-        in the GROUP BY clause of Q.
-        If found different columns with the same name in GROUP BY and SELECT
-        issue a warning and return the GROUP BY column,
-        otherwise return the found SELECT column.
        if such a column is NOT found AND    // Lookup in outer queries.
           there are outer queries
        {
          for each outer query Q_k beginning from the inner-most one
         {
-            search for a column or derived column named col_ref_i
+            Search for a column or derived column named col_ref_i
-            [in table T_j] in the SELECT list of Q_k;
+            [in table T_j] in the SELECT and GROUP clauses of Q_k.
-            if such a column is not found
+            if such a column is not found AND
+               - Q_k is not a group query AND
+               - Q_k is not inside an aggregate function
+               OR
+               - Q_(k-1) is not in a HAVING or SELECT clause of Q_k
            {
              search for a column or derived column named col_ref_i
              [in table T_j] in the FROM clause of Q_k;
@@ -2407,66 +2511,36 @@ static Item** find_field_in_group_list(Item *find_item, ORDER *group_list)
 bool Item_ref::fix_fields(THD *thd, TABLE_LIST *tables, Item **reference)
 {
  DBUG_ASSERT(fixed == 0);
-  uint counter;
  SELECT_LEX *current_sel= thd->lex->current_select;
-  List<Item> *select_fields= current_sel->get_item_list();
-  bool is_having_field= current_sel->having_fix_field;
-  Item **group_by_ref= NULL;
-  bool ambiguous_fields= FALSE;
  if (!ref)
  {
-    TABLE_LIST *table_list;
-    bool upward_lookup= 0;
    SELECT_LEX_UNIT *prev_unit= current_sel->master_unit();
    SELECT_LEX *outer_sel= prev_unit->outer_select();
+    ORDER *group_list= (ORDER*) current_sel->group_list.first;
+    bool ambiguous_fields= FALSE;
+    Item **group_by_ref= NULL;
-    /*
+    if (!(ref= resolve_ref_in_select_and_group(thd, this, current_sel)))
-      Search for a column or derived column named as 'this' in the SELECT
+      return TRUE;             /* Some error occured (e.g. ambigous names). */
-      clause of current_select.
-    */
-    if (!(ref= find_item_in_list(this, *select_fields, &counter,
-                                 REPORT_EXCEPT_NOT_FOUND)))
-      return TRUE; /* Some error occurred. */
-    /* If this is a non-aggregated field inside HAVING, search in GROUP BY. */
+    if (ref == not_found_item) /* This reference was not resolved. */
-    if (is_having_field && !this->with_sum_func)
    {
-      group_by_ref= find_field_in_group_list(this, (ORDER*)
-                                             current_sel->group_list.first);
-      /* Check if the fields found in SELECT and GROUP BY are the same field. */
-      if (group_by_ref && ref != (Item **) not_found_item &&
-          !((*group_by_ref)->eq(*ref, 0)))
-      {
-        ambiguous_fields= TRUE;
-        push_warning_printf(thd, MYSQL_ERROR::WARN_LEVEL_WARN,
-                            ER_NON_UNIQ_ERROR, ER(ER_NON_UNIQ_ERROR),
-                            this->full_name(), current_thd->where);
-      }
-    }
      /*
-      If we didn't find such a column in the current query, and if there is an
+        If there is an outer select, and it is not a derived table (which do
-      outer select, and it is not a derived table (which do not support the
+        not support the use of outer fields for now), try to resolve this
-      use of outer fields for now), search the outer select(s) for a column
+        reference in the outer select(s).
-      named as 'this'.
+        We treat each subselect as a separate namespace, so that different
+        subselects may contain columns with the same names. The subselects are
+        searched starting from the innermost.
      */
-    if (!group_by_ref && (ref == (Item **) not_found_item) && outer_sel && 
+      if (outer_sel && (current_sel->master_unit()->first_select()->linkage !=
-        (current_sel->master_unit()->first_select()->linkage !=
                        DERIVED_TABLE_TYPE))
      {
-      /*
+        TABLE_LIST *table_list;
-	We can't join the columns of the outer & current selects, because of
-	scope of view rules. For example if both tables (outer & current) have
-	field 'field' it is not a mistake to refer to this field without
-	qualifying it with a table name, but if we join tables in one list it
-	will cause error ER_NON_UNIQ_ERROR in find_item_in_list.
-      */
-      upward_lookup= 1;
        Field *tmp= (Field*) not_found_field;
-      SELECT_LEX *last=0;
+        SELECT_LEX *last= 0;
        for ( ; outer_sel ;
              outer_sel= (prev_unit= outer_sel->master_unit())->outer_select())
@@ -2474,22 +2548,25 @@ bool Item_ref::fix_fields(THD *thd, TABLE_LIST *tables, Item **reference)
          last= outer_sel;
          Item_subselect *prev_subselect_item= prev_unit->item;
-        /* Search in the SELECT list of the current outer sub-select. */
+          /* Search in the SELECT and GROUP lists of the outer select. */
-	if (outer_sel->resolve_mode == SELECT_LEX::SELECT_MODE &&
+          if (outer_sel->resolve_mode == SELECT_LEX::SELECT_MODE)
-	    (ref= find_item_in_list(this, outer_sel->item_list,
-				    &counter,
-				    REPORT_EXCEPT_NOT_FOUND)) !=
-	   (Item **)not_found_item)
          {
-	  if (*ref && (*ref)->fixed) // Avoid crash in case of error
+            if (!(ref= resolve_ref_in_select_and_group(thd, this, outer_sel)))
+              return TRUE; /* Some error occured (e.g. ambigous names). */
+            if (ref != not_found_item)
            {
+              DBUG_ASSERT(*ref && (*ref)->fixed);
+              /*
+                Avoid crash in case of error.
+                TODO: what does this comment mean?
+              */
              prev_subselect_item->used_tables_cache|= (*ref)->used_tables();
              prev_subselect_item->const_item_cache&= (*ref)->const_item();
-	  }
              break;
            }
+          }
-        /* Search in the tables in the FROM clause of the outer select. */
+          /* Search in the tables of the FROM clause of the outer select. */
          table_list= outer_sel->get_table_list();
          if (outer_sel->resolve_mode == SELECT_LEX::INSERT_MODE && table_list)
          {
@@ -2500,18 +2577,20 @@ bool Item_ref::fix_fields(THD *thd, TABLE_LIST *tables, Item **reference)
          /*
            Check table fields only if the subquery is used somewhere out of
            HAVING or SELECT list, or outer SELECT does not use grouping
-          (i.e. tables are accessible)
+            (i.e. tables are accessible).
+            TODO: 
+            Here we could first find the field anyway, and then test this
+            condition, so that we can give a better error message -
+            ER_WRONG_FIELD_WITH_GROUP, instead of the less informative
+            ER_BAD_FIELD_ERROR which we produce now.
          */
-        if (((place != IN_HAVING &&
+          if (((place != IN_HAVING && place != SELECT_LIST) ||
-              place != SELECT_LIST) ||
+               (!outer_sel->with_sum_func &&
-             (outer_sel->with_sum_func == 0 &&
+                outer_sel->group_list.elements == 0)))
-              outer_sel->group_list.elements == 0)) &&
+          {
-            (tmp= find_field_in_tables(thd, this,
+            if ((tmp= find_field_in_tables(thd, this, table_list, reference,
-				       table_list, reference,
                                           IGNORE_EXCEPT_NON_UNIQUE, TRUE)) !=
                not_found_field)
-	{
-          if (tmp)
            {
              if (tmp != view_ref_found)
              {
@@ -2525,11 +2604,11 @@ bool Item_ref::fix_fields(THD *thd, TABLE_LIST *tables, Item **reference)
                prev_subselect_item->const_item_cache&=
                  (*reference)->const_item();
              }
-          }
              break;
            }
+          }
-	// Reference is not found => depend from outer (or just error)
+          /* Reference is not found => depend on outer (or just error). */
          prev_subselect_item->used_tables_cache|= OUTER_REF_TABLE_BIT;
          prev_subselect_item->const_item_cache= 0;
@@ -2538,24 +2617,13 @@ bool Item_ref::fix_fields(THD *thd, TABLE_LIST *tables, Item **reference)
            break; /* Do not consider derived tables. */
        }
-      if (!ref)
+        DBUG_ASSERT(ref);
-	return TRUE;
+        if (!tmp)
-      else if (!tmp)
          return TRUE;
-      else if (ref == (Item **)not_found_item && tmp == not_found_field)
+        else if (ref == not_found_item && tmp == not_found_field)
-      {
-	if (upward_lookup)
        {
-	  /* We can't say exactly what was absent (a table or a field). */
          my_printf_error(ER_BAD_FIELD_ERROR, ER(ER_BAD_FIELD_ERROR), MYF(0),
-			  full_name(), thd->where);
+                          this->full_name(), current_thd->where);
-	}
-	else
-	{
-	  // Call to report error
-	  find_item_in_list(this, *select_fields, &counter,
-			    REPORT_ALL_ERRORS);
-	}
          ref= 0;
          return TRUE;
        }
@@ -2564,8 +2632,8 @@ bool Item_ref::fix_fields(THD *thd, TABLE_LIST *tables, Item **reference)
          ref= 0; // To prevent "delete *ref;" on ~Item_ref() of this item
          if (tmp != view_ref_found)
          {
-	  Item_field* fld;
+            Item_field* fld= new Item_field(tmp);
-	  if (!((*reference)= fld= new Item_field(tmp)))
+            if (!((*reference)= fld))
              return TRUE;
            mark_as_dependent(thd, last, current_sel, fld);
            register_item_tree_changing(reference);
@@ -2573,49 +2641,28 @@ bool Item_ref::fix_fields(THD *thd, TABLE_LIST *tables, Item **reference)
          }
          /*
            We can leave expression substituted from view for next PS/SP
-	  re-execution (i.e. do not register this substitution for reverting on
+            re-execution (i.e. do not register this substitution for reverting
-	  cleanup() (register_item_tree_changing())), because this subtree will
+            on cleanup() (register_item_tree_changing())), because this subtree
-	  be fix_field'ed during setup_tables()->setup_ancestor() (i.e. before
+            will be fix_field'ed during setup_tables()->setup_ancestor()
-	  all other expressions of query, and references on tables which do not
+            (i.e. before all other expressions of query, and references on
-	  present in query will not make problems.
+            tables which do not present in query will not make problems.
            Also we suppose that view can't be changed during PS/SP life.
          */
        }
        else
        {
-	if (!(*ref)->fixed)
+          DBUG_ASSERT(*ref && (*ref)->fixed);
-	{
+          mark_as_dependent(thd, last, current_sel, this);
-	  my_error(ER_ILLEGAL_REFERENCE, MYF(0), name,
-		   "forward reference in item list");
-	  return TRUE;
        }
-	mark_as_dependent(thd, last, current_sel,
-			  this);
-	ref= last->ref_pointer_array + counter;
      }
-    }
+      else
-    else if (!group_by_ref && ref == (Item **) not_found_item)
      {
+        /* The current reference cannot be resolved in this query. */
        my_printf_error(ER_BAD_FIELD_ERROR, ER(ER_BAD_FIELD_ERROR), MYF(0),
                        this->full_name(), current_thd->where);
        return TRUE;
      }
-    else
-    {
-      if (ref != (Item **) not_found_item && !ambiguous_fields)
-        ref= current_sel->ref_pointer_array + counter;
-      else if (group_by_ref)
-        ref= group_by_ref;
-      else
-        DBUG_ASSERT(FALSE);
-      if (!(*ref)->fixed)
-      {
-	my_error(ER_ILLEGAL_REFERENCE, MYF(0), name,
-		 "forward reference in item list");
-	return TRUE;
-      }
    }
  }
@@ -2625,15 +2672,18 @@ bool Item_ref::fix_fields(THD *thd, TABLE_LIST *tables, Item **reference)
    with sub-select's / derived tables, while it prevents this 
    check when Item_ref is created in an expression involving 
    summing function, which is to be placed in the user variable.
+    TODO: this comment is impossible to understand.
  */
  if (((*ref)->with_sum_func && name &&
       (depended_from ||
-	!(current_sel->linkage != GLOBAL_OPTIONS_TYPE && is_having_field))) ||
+	!(current_sel->linkage != GLOBAL_OPTIONS_TYPE &&
+          current_sel->having_fix_field))) ||
      !(*ref)->fixed)
  {
    my_error(ER_ILLEGAL_REFERENCE, MYF(0), name, 
 	     ((*ref)->with_sum_func?
-	      "reference on group function":
+	      "reference to group function":
 	      "forward reference in item list"));
    return TRUE;
  }

--- a/sql/sql_base.cc
+++ b/sql/sql_base.cc
@@ -2186,10 +2186,9 @@ Field *find_field_in_real_table(THD *thd, TABLE *table,
    check_privileges    need to check privileges
  RETURN VALUES
-    0			No field was found, or the found field is not unique, or
+    0			If error: the found field is not unique, or there are
-                        there are no sufficient access priviliges for the
+                        no sufficient access priviliges for the found field,
-                        found field, or the field is qualified with non-existing
+                        or the field is qualified with non-existing table.
-                        table.
    not_found_field	The function was called with report_error ==
                        (IGNORE_ERRORS || IGNORE_EXCEPT_NON_UNIQUE) and a
 			field was not found.