postgrespro
diff --git a/src/backend/parser/gram.y b/src/backend/parser/gram.y
Lines changed: 25 additions & 10 deletions
diff --git a/src/backend/parser/parser.c b/src/backend/parser/parser.c
Lines changed: 58 additions & 47 deletions
diff --git a/src/include/parser/gramparse.h b/src/include/parser/gramparse.h
Lines changed: 2 additions & 0 deletions
diff --git a/src/interfaces/ecpg/preproc/parse.pl b/src/interfaces/ecpg/preproc/parse.pl
Lines changed: 2 additions & 4 deletions
@@ -633,9 +633,9 @@ static Node *makeRecursiveViewSelect(char *relname, List *aliases, Node *query);
 /*
  * The grammar thinks these are keywords, but they are not in the kwlist.h
  * list and so can never be entered directly.  The filter in parser.c
- * creates these tokens when required.
+ * creates these tokens when required (based on looking one token ahead).
  */
-%token			NULLS_FIRST NULLS_LAST WITH_ORDINALITY WITH_TIME
+%token			NULLS_LA WITH_LA
 
 
 /* Precedence: lowest to highest */
@@ -873,6 +873,7 @@ CreateRoleStmt:
 
 
 opt_with:	WITH									{}
+			| WITH_LA								{}
 			| /*EMPTY*/								{}
 		;
 
@@ -6673,8 +6674,8 @@ opt_asc_desc: ASC							{ $$ = SORTBY_ASC; }
 			| /*EMPTY*/						{ $$ = SORTBY_DEFAULT; }
 		;
 
-opt_nulls_order: NULLS_FIRST				{ $$ = SORTBY_NULLS_FIRST; }
-			| NULLS_LAST					{ $$ = SORTBY_NULLS_LAST; }
+opt_nulls_order: NULLS_LA FIRST_P			{ $$ = SORTBY_NULLS_FIRST; }
+			| NULLS_LA LAST_P				{ $$ = SORTBY_NULLS_LAST; }
 			| /*EMPTY*/						{ $$ = SORTBY_NULLS_DEFAULT; }
 		;
 
@@ -8923,7 +8924,7 @@ AlterTSDictionaryStmt:
 		;
 
 AlterTSConfigurationStmt:
-			ALTER TEXT_P SEARCH CONFIGURATION any_name ADD_P MAPPING FOR name_list WITH any_name_list
+			ALTER TEXT_P SEARCH CONFIGURATION any_name ADD_P MAPPING FOR name_list any_with any_name_list
 				{
 					AlterTSConfigurationStmt *n = makeNode(AlterTSConfigurationStmt);
 					n->cfgname = $5;
@@ -8933,7 +8934,7 @@ AlterTSConfigurationStmt:
 					n->replace = false;
 					$$ = (Node*)n;
 				}
-			| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING FOR name_list WITH any_name_list
+			| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING FOR name_list any_with any_name_list
 				{
 					AlterTSConfigurationStmt *n = makeNode(AlterTSConfigurationStmt);
 					n->cfgname = $5;
@@ -8943,7 +8944,7 @@ AlterTSConfigurationStmt:
 					n->replace = false;
 					$$ = (Node*)n;
 				}
-			| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING REPLACE any_name WITH any_name
+			| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING REPLACE any_name any_with any_name
 				{
 					AlterTSConfigurationStmt *n = makeNode(AlterTSConfigurationStmt);
 					n->cfgname = $5;
@@ -8953,7 +8954,7 @@ AlterTSConfigurationStmt:
 					n->replace = true;
 					$$ = (Node*)n;
 				}
-			| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING FOR name_list REPLACE any_name WITH any_name
+			| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING FOR name_list REPLACE any_name any_with any_name
 				{
 					AlterTSConfigurationStmt *n = makeNode(AlterTSConfigurationStmt);
 					n->cfgname = $5;
@@ -8981,6 +8982,11 @@ AlterTSConfigurationStmt:
 				}
 		;
 
+/* Use this if TIME or ORDINALITY after WITH should be taken as an identifier */
+any_with:	WITH									{}
+			| WITH_LA								{}
+		;
+
 
 /*****************************************************************************
  *
@@ -9891,6 +9897,8 @@ simple_select:
  *		AS (query) [ SEARCH or CYCLE clause ]
  *
  * We don't currently support the SEARCH or CYCLE clause.
+ *
+ * Recognizing WITH_LA here allows a CTE to be named TIME or ORDINALITY.
  */
 with_clause:
 		WITH cte_list
@@ -9900,6 +9908,13 @@ with_clause:
 				$$->recursive = false;
 				$$->location = @1;
 			}
+		| WITH_LA cte_list
+			{
+				$$ = makeNode(WithClause);
+				$$->ctes = $2;
+				$$->recursive = false;
+				$$->location = @1;
+			}
 		| WITH RECURSIVE cte_list
 			{
 				$$ = makeNode(WithClause);
@@ -10601,7 +10616,7 @@ opt_col_def_list: AS '(' TableFuncElementList ')'	{ $$ = $3; }
 			| /*EMPTY*/								{ $$ = NIL; }
 		;
 
-opt_ordinality: WITH_ORDINALITY						{ $$ = true; }
+opt_ordinality: WITH_LA ORDINALITY					{ $$ = true; }
 			| /*EMPTY*/								{ $$ = false; }
 		;
 
@@ -11057,7 +11072,7 @@ ConstInterval:
 		;
 
 opt_timezone:
-			WITH_TIME ZONE							{ $$ = TRUE; }
+			WITH_LA TIME ZONE						{ $$ = TRUE; }
 			| WITHOUT TIME ZONE						{ $$ = FALSE; }
 			| /*EMPTY*/								{ $$ = FALSE; }
 		;
 
@@ -64,13 +64,13 @@ raw_parser(const char *str)
 /*
  * Intermediate filter between parser and core lexer (core_yylex in scan.l).
  *
- * The filter is needed because in some cases the standard SQL grammar
+ * This filter is needed because in some cases the standard SQL grammar
  * requires more than one token lookahead.  We reduce these cases to one-token
- * lookahead by combining tokens here, in order to keep the grammar LALR(1).
+ * lookahead by replacing tokens here, in order to keep the grammar LALR(1).
  *
  * Using a filter is simpler than trying to recognize multiword tokens
  * directly in scan.l, because we'd have to allow for comments between the
- * words.  Furthermore it's not clear how to do it without re-introducing
+ * words.  Furthermore it's not clear how to do that without re-introducing
  * scanner backtrack, which would cost more performance than this filter
  * layer does.
  *
@@ -84,7 +84,7 @@ base_yylex(YYSTYPE *lvalp, YYLTYPE *llocp, core_yyscan_t yyscanner)
 	base_yy_extra_type *yyextra = pg_yyget_extra(yyscanner);
 	int			cur_token;
 	int			next_token;
-	core_YYSTYPE cur_yylval;
+	int			cur_token_length;
 	YYLTYPE		cur_yylloc;
 
 	/* Get next token --- we might already have it */
@@ -93,74 +93,85 @@ base_yylex(YYSTYPE *lvalp, YYLTYPE *llocp, core_yyscan_t yyscanner)
 		cur_token = yyextra->lookahead_token;
 		lvalp->core_yystype = yyextra->lookahead_yylval;
 		*llocp = yyextra->lookahead_yylloc;
+		*(yyextra->lookahead_end) = yyextra->lookahead_hold_char;
 		yyextra->have_lookahead = false;
 	}
 	else
 		cur_token = core_yylex(&(lvalp->core_yystype), llocp, yyscanner);
 
-	/* Do we need to look ahead for a possible multiword token? */
+	/*
+	 * If this token isn't one that requires lookahead, just return it.  If it
+	 * does, determine the token length.  (We could get that via strlen(), but
+	 * since we have such a small set of possibilities, hardwiring seems
+	 * feasible and more efficient.)
+	 */
 	switch (cur_token)
 	{
 		case NULLS_P:
+			cur_token_length = 5;
+			break;
+		case WITH:
+			cur_token_length = 4;
+			break;
+		default:
+			return cur_token;
+	}
 
-			/*
-			 * NULLS FIRST and NULLS LAST must be reduced to one token
-			 */
-			cur_yylval = lvalp->core_yystype;
-			cur_yylloc = *llocp;
-			next_token = core_yylex(&(lvalp->core_yystype), llocp, yyscanner);
+	/*
+	 * Identify end+1 of current token.  core_yylex() has temporarily stored a
+	 * '\0' here, and will undo that when we call it again.  We need to redo
+	 * it to fully revert the lookahead call for error reporting purposes.
+	 */
+	yyextra->lookahead_end = yyextra->core_yy_extra.scanbuf +
+		*llocp + cur_token_length;
+	Assert(*(yyextra->lookahead_end) == '\0');
+
+	/*
+	 * Save and restore *llocp around the call.  It might look like we could
+	 * avoid this by just passing &lookahead_yylloc to core_yylex(), but that
+	 * does not work because flex actually holds onto the last-passed pointer
+	 * internally, and will use that for error reporting.  We need any error
+	 * reports to point to the current token, not the next one.
+	 */
+	cur_yylloc = *llocp;
+
+	/* Get next token, saving outputs into lookahead variables */
+	next_token = core_yylex(&(yyextra->lookahead_yylval), llocp, yyscanner);
+	yyextra->lookahead_token = next_token;
+	yyextra->lookahead_yylloc = *llocp;
+
+	*llocp = cur_yylloc;
+
+	/* Now revert the un-truncation of the current token */
+	yyextra->lookahead_hold_char = *(yyextra->lookahead_end);
+	*(yyextra->lookahead_end) = '\0';
+
+	yyextra->have_lookahead = true;
+
+	/* Replace cur_token if needed, based on lookahead */
+	switch (cur_token)
+	{
+		case NULLS_P:
+			/* Replace NULLS_P by NULLS_LA if it's followed by FIRST or LAST */
 			switch (next_token)
 			{
 				case FIRST_P:
-					cur_token = NULLS_FIRST;
-					break;
 				case LAST_P:
-					cur_token = NULLS_LAST;
-					break;
-				default:
-					/* save the lookahead token for next time */
-					yyextra->lookahead_token = next_token;
-					yyextra->lookahead_yylval = lvalp->core_yystype;
-					yyextra->lookahead_yylloc = *llocp;
-					yyextra->have_lookahead = true;
-					/* and back up the output info to cur_token */
-					lvalp->core_yystype = cur_yylval;
-					*llocp = cur_yylloc;
+					cur_token = NULLS_LA;
 					break;
 			}
 			break;
 
 		case WITH:
-
-			/*
-			 * WITH TIME and WITH ORDINALITY must each be reduced to one token
-			 */
-			cur_yylval = lvalp->core_yystype;
-			cur_yylloc = *llocp;
-			next_token = core_yylex(&(lvalp->core_yystype), llocp, yyscanner);
+			/* Replace WITH by WITH_LA if it's followed by TIME or ORDINALITY */
 			switch (next_token)
 			{
 				case TIME:
-					cur_token = WITH_TIME;
-					break;
 				case ORDINALITY:
-					cur_token = WITH_ORDINALITY;
-					break;
-				default:
-					/* save the lookahead token for next time */
-					yyextra->lookahead_token = next_token;
-					yyextra->lookahead_yylval = lvalp->core_yystype;
-					yyextra->lookahead_yylloc = *llocp;
-					yyextra->have_lookahead = true;
-					/* and back up the output info to cur_token */
-					lvalp->core_yystype = cur_yylval;
-					*llocp = cur_yylloc;
+					cur_token = WITH_LA;
 					break;
 			}
 			break;
-
-		default:
-			break;
 	}
 
 	return cur_token;
 
@@ -46,6 +46,8 @@ typedef struct base_yy_extra_type
 	int			lookahead_token;	/* one-token lookahead */
 	core_YYSTYPE lookahead_yylval;		/* yylval for lookahead token */
 	YYLTYPE		lookahead_yylloc;		/* yylloc for lookahead token */
+	char	   *lookahead_end;	/* end of current token */
+	char		lookahead_hold_char;	/* to be put back at *lookahead_end */
 
 	/*
 	 * State variables that belong to the grammar.
 
@@ -42,10 +42,8 @@
 
 # or in the block
 my %replace_string = (
-	'WITH_TIME'       => 'with time',
-	'WITH_ORDINALITY' => 'with ordinality',
-	'NULLS_FIRST'     => 'nulls first',
-	'NULLS_LAST'      => 'nulls last',
+	'NULLS_LA'        => 'nulls',
+	'WITH_LA'         => 'with',
 	'TYPECAST'        => '::',
 	'DOT_DOT'         => '..',
 	'COLON_EQUALS'    => ':=',);
Original file line number	Diff line number	Diff line change
`@@ -633,9 +633,9 @@ static Node *makeRecursiveViewSelect(char *relname, List *aliases, Node *query);`
`633`	`633`	`/*`
`634`	`634`	`* The grammar thinks these are keywords, but they are not in the kwlist.h`
`635`	`635`	`* list and so can never be entered directly. The filter in parser.c`
`636`		`- * creates these tokens when required.`
	`636`	`+ * creates these tokens when required (based on looking one token ahead).`
`637`	`637`	`*/`
`638`		`-%token NULLS_FIRST NULLS_LAST WITH_ORDINALITY WITH_TIME`
	`638`	`+%token NULLS_LA WITH_LA`
`639`	`639`
`640`	`640`
`641`	`641`	`/* Precedence: lowest to highest */`
`@@ -873,6 +873,7 @@ CreateRoleStmt:`
`873`	`873`
`874`	`874`
`875`	`875`	`opt_with: WITH {}`
	`876`	`+ \| WITH_LA {}`
`876`	`877`	`\| /*EMPTY*/ {}`
`877`	`878`	`;`
`878`	`879`
`@@ -6673,8 +6674,8 @@ opt_asc_desc: ASC { $$ = SORTBY_ASC; }`
`6673`	`6674`	`\| /*EMPTY*/ { $$ = SORTBY_DEFAULT; }`
`6674`	`6675`	`;`
`6675`	`6676`
`6676`		`-opt_nulls_order: NULLS_FIRST { $$ = SORTBY_NULLS_FIRST; }`
`6677`		`- \| NULLS_LAST { $$ = SORTBY_NULLS_LAST; }`
	`6677`	`+opt_nulls_order: NULLS_LA FIRST_P { $$ = SORTBY_NULLS_FIRST; }`
	`6678`	`+ \| NULLS_LA LAST_P { $$ = SORTBY_NULLS_LAST; }`
`6678`	`6679`	`\| /*EMPTY*/ { $$ = SORTBY_NULLS_DEFAULT; }`
`6679`	`6680`	`;`
`6680`	`6681`
`@@ -8923,7 +8924,7 @@ AlterTSDictionaryStmt:`
`8923`	`8924`	`;`
`8924`	`8925`
`8925`	`8926`	`AlterTSConfigurationStmt:`
`8926`		`- ALTER TEXT_P SEARCH CONFIGURATION any_name ADD_P MAPPING FOR name_list WITH any_name_list`
	`8927`	`+ ALTER TEXT_P SEARCH CONFIGURATION any_name ADD_P MAPPING FOR name_list any_with any_name_list`
`8927`	`8928`	`{`
`8928`	`8929`	`AlterTSConfigurationStmt *n = makeNode(AlterTSConfigurationStmt);`
`8929`	`8930`	`n->cfgname = $5;`
`@@ -8933,7 +8934,7 @@ AlterTSConfigurationStmt:`
`8933`	`8934`	`n->replace = false;`
`8934`	`8935`	`$$ = (Node*)n;`
`8935`	`8936`	`}`
`8936`		`- \| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING FOR name_list WITH any_name_list`
	`8937`	`+ \| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING FOR name_list any_with any_name_list`
`8937`	`8938`	`{`
`8938`	`8939`	`AlterTSConfigurationStmt *n = makeNode(AlterTSConfigurationStmt);`
`8939`	`8940`	`n->cfgname = $5;`
`@@ -8943,7 +8944,7 @@ AlterTSConfigurationStmt:`
`8943`	`8944`	`n->replace = false;`
`8944`	`8945`	`$$ = (Node*)n;`
`8945`	`8946`	`}`
`8946`		`- \| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING REPLACE any_name WITH any_name`
	`8947`	`+ \| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING REPLACE any_name any_with any_name`
`8947`	`8948`	`{`
`8948`	`8949`	`AlterTSConfigurationStmt *n = makeNode(AlterTSConfigurationStmt);`
`8949`	`8950`	`n->cfgname = $5;`
`@@ -8953,7 +8954,7 @@ AlterTSConfigurationStmt:`
`8953`	`8954`	`n->replace = true;`
`8954`	`8955`	`$$ = (Node*)n;`
`8955`	`8956`	`}`
`8956`		`- \| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING FOR name_list REPLACE any_name WITH any_name`
	`8957`	`+ \| ALTER TEXT_P SEARCH CONFIGURATION any_name ALTER MAPPING FOR name_list REPLACE any_name any_with any_name`
`8957`	`8958`	`{`
`8958`	`8959`	`AlterTSConfigurationStmt *n = makeNode(AlterTSConfigurationStmt);`
`8959`	`8960`	`n->cfgname = $5;`
`@@ -8981,6 +8982,11 @@ AlterTSConfigurationStmt:`
`8981`	`8982`	`}`
`8982`	`8983`	`;`
`8983`	`8984`
	`8985`	`+/* Use this if TIME or ORDINALITY after WITH should be taken as an identifier */`
	`8986`	`+any_with: WITH {}`
	`8987`	`+ \| WITH_LA {}`
	`8988`	`+ ;`
	`8989`	`+`
`8984`	`8990`
`8985`	`8991`	`/*****************************************************************************`
`8986`	`8992`	`*`
`@@ -9891,6 +9897,8 @@ simple_select:`
`9891`	`9897`	`* AS (query) [ SEARCH or CYCLE clause ]`
`9892`	`9898`	`*`
`9893`	`9899`	`* We don't currently support the SEARCH or CYCLE clause.`
	`9900`	`+ *`
	`9901`	`+ * Recognizing WITH_LA here allows a CTE to be named TIME or ORDINALITY.`
`9894`	`9902`	`*/`
`9895`	`9903`	`with_clause:`
`9896`	`9904`	`WITH cte_list`
`@@ -9900,6 +9908,13 @@ with_clause:`
`9900`	`9908`	`$$->recursive = false;`
`9901`	`9909`	`$$->location = @1;`
`9902`	`9910`	`}`
	`9911`	`+ \| WITH_LA cte_list`
	`9912`	`+ {`
	`9913`	`+ $$ = makeNode(WithClause);`
	`9914`	`+ $$->ctes = $2;`
	`9915`	`+ $$->recursive = false;`
	`9916`	`+ $$->location = @1;`
	`9917`	`+ }`
`9903`	`9918`	`\| WITH RECURSIVE cte_list`
`9904`	`9919`	`{`
`9905`	`9920`	`$$ = makeNode(WithClause);`
`@@ -10601,7 +10616,7 @@ opt_col_def_list: AS '(' TableFuncElementList ')' { $$ = $3; }`
`10601`	`10616`	`\| /*EMPTY*/ { $$ = NIL; }`
`10602`	`10617`	`;`
`10603`	`10618`
`10604`		`-opt_ordinality: WITH_ORDINALITY { $$ = true; }`
	`10619`	`+opt_ordinality: WITH_LA ORDINALITY { $$ = true; }`
`10605`	`10620`	`\| /*EMPTY*/ { $$ = false; }`
`10606`	`10621`	`;`
`10607`	`10622`
`@@ -11057,7 +11072,7 @@ ConstInterval:`
`11057`	`11072`	`;`
`11058`	`11073`
`11059`	`11074`	`opt_timezone:`
`11060`		`- WITH_TIME ZONE { $$ = TRUE; }`
	`11075`	`+ WITH_LA TIME ZONE { $$ = TRUE; }`
`11061`	`11076`	`\| WITHOUT TIME ZONE { $$ = FALSE; }`
`11062`	`11077`	`\| /*EMPTY*/ { $$ = FALSE; }`
`11063`	`11078`	`;`