Commit ec937d08 authored by Tom Lane's avatar Tom Lane

Align ECPG lexer more closely with the core and psql lexers.

Make a bunch of basically-cosmetic changes to reduce the diffs between
the flex rules in scan.l, psqlscan.l, and pgc.l.  Reorder some code,
adjust a lot of whitespace, sync some comments, make use of flex start
condition scopes to do that.

There are a few non-cosmetic changes in the ECPG lexer:

* Bring over the decimalfail rule (and support function
process_integer_literal) so that ECPG will lex "1..10" into
the same tokens as the backend would.  I'm not sure this makes any
visible difference to users, but I'm not sure it doesn't, either.

* <xdc><<EOF>> gets its own rule so as to produce a more on-point
error message.

* Remove duplicate <SQL>{xdstart} rule.

John Naylor, with a few additional changes by me

Discussion: https://postgr.es/m/CAJVSVGWGqY9YBs2EwtRUkbNv=hXkN8yRPOoD1wxE6COgvvrz5g@mail.gmail.com
parent d20dceaf
...@@ -6,7 +6,8 @@ ...@@ -6,7 +6,8 @@
* *
* NOTE NOTE NOTE: * NOTE NOTE NOTE:
* *
* The rules in this file must be kept in sync with src/fe_utils/psqlscan.l! * The rules in this file must be kept in sync with src/fe_utils/psqlscan.l
* and src/interfaces/ecpg/preproc/pgc.l!
* *
* The rules are designed so that the scanner never has to backtrack, * The rules are designed so that the scanner never has to backtrack,
* in the sense that there is always a rule that can match the input * in the sense that there is always a rule that can match the input
...@@ -168,8 +169,8 @@ extern void core_yyset_column(int column_no, yyscan_t yyscanner); ...@@ -168,8 +169,8 @@ extern void core_yyset_column(int column_no, yyscan_t yyscanner);
%x xc %x xc
%x xd %x xd
%x xh %x xh
%x xe
%x xq %x xq
%x xe
%x xdolq %x xdolq
%x xui %x xui
%x xuiend %x xuiend
...@@ -192,7 +193,7 @@ extern void core_yyset_column(int column_no, yyscan_t yyscanner); ...@@ -192,7 +193,7 @@ extern void core_yyset_column(int column_no, yyscan_t yyscanner);
* XXX perhaps \f (formfeed) should be treated as a newline as well? * XXX perhaps \f (formfeed) should be treated as a newline as well?
* *
* XXX if you change the set of whitespace characters, fix scanner_isspace() * XXX if you change the set of whitespace characters, fix scanner_isspace()
* to agree, and see also the plpgsql lexer. * to agree.
*/ */
space [ \t\n\r\f] space [ \t\n\r\f]
...@@ -417,32 +418,36 @@ other . ...@@ -417,32 +418,36 @@ other .
yyless(2); yyless(2);
} }
<xc>{xcstart} { <xc>{
{xcstart} {
(yyextra->xcdepth)++; (yyextra->xcdepth)++;
/* Put back any characters past slash-star; see above */ /* Put back any characters past slash-star; see above */
yyless(2); yyless(2);
} }
<xc>{xcstop} { {xcstop} {
if (yyextra->xcdepth <= 0) if (yyextra->xcdepth <= 0)
BEGIN(INITIAL); BEGIN(INITIAL);
else else
(yyextra->xcdepth)--; (yyextra->xcdepth)--;
} }
<xc>{xcinside} { {xcinside} {
/* ignore */ /* ignore */
} }
<xc>{op_chars} { {op_chars} {
/* ignore */ /* ignore */
} }
<xc>\*+ { \*+ {
/* ignore */ /* ignore */
} }
<xc><<EOF>> { yyerror("unterminated /* comment"); } <<EOF>> {
yyerror("unterminated /* comment");
}
} /* <xc> */
{xbstart} { {xbstart} {
/* Binary bit type. /* Binary bit type.
......
...@@ -23,6 +23,7 @@ ...@@ -23,6 +23,7 @@
* *
* See psqlscan_int.h for additional commentary. * See psqlscan_int.h for additional commentary.
* *
*
* Portions Copyright (c) 1996-2018, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2018, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
...@@ -39,6 +40,9 @@ ...@@ -39,6 +40,9 @@
} }
%{ %{
/* LCOV_EXCL_START */
#include "fe_utils/psqlscan_int.h" #include "fe_utils/psqlscan_int.h"
/* /*
...@@ -71,8 +75,6 @@ typedef int YYSTYPE; ...@@ -71,8 +75,6 @@ typedef int YYSTYPE;
extern int psql_yyget_column(yyscan_t yyscanner); extern int psql_yyget_column(yyscan_t yyscanner);
extern void psql_yyset_column(int column_no, yyscan_t yyscanner); extern void psql_yyset_column(int column_no, yyscan_t yyscanner);
/* LCOV_EXCL_START */
%} %}
%option reentrant %option reentrant
...@@ -128,8 +130,8 @@ extern void psql_yyset_column(int column_no, yyscan_t yyscanner); ...@@ -128,8 +130,8 @@ extern void psql_yyset_column(int column_no, yyscan_t yyscanner);
%x xc %x xc
%x xd %x xd
%x xh %x xh
%x xe
%x xq %x xq
%x xe
%x xdolq %x xdolq
%x xui %x xui
%x xuiend %x xuiend
...@@ -151,7 +153,7 @@ extern void psql_yyset_column(int column_no, yyscan_t yyscanner); ...@@ -151,7 +153,7 @@ extern void psql_yyset_column(int column_no, yyscan_t yyscanner);
* XXX perhaps \f (formfeed) should be treated as a newline as well? * XXX perhaps \f (formfeed) should be treated as a newline as well?
* *
* XXX if you change the set of whitespace characters, fix scanner_isspace() * XXX if you change the set of whitespace characters, fix scanner_isspace()
* to agree, and see also the plpgsql lexer. * to agree.
*/ */
space [ \t\n\r\f] space [ \t\n\r\f]
...@@ -402,14 +404,15 @@ other . ...@@ -402,14 +404,15 @@ other .
ECHO; ECHO;
} }
<xc>{xcstart} { <xc>{
{xcstart} {
cur_state->xcdepth++; cur_state->xcdepth++;
/* Put back any characters past slash-star; see above */ /* Put back any characters past slash-star; see above */
yyless(2); yyless(2);
ECHO; ECHO;
} }
<xc>{xcstop} { {xcstop} {
if (cur_state->xcdepth <= 0) if (cur_state->xcdepth <= 0)
BEGIN(INITIAL); BEGIN(INITIAL);
else else
...@@ -417,17 +420,18 @@ other . ...@@ -417,17 +420,18 @@ other .
ECHO; ECHO;
} }
<xc>{xcinside} { {xcinside} {
ECHO; ECHO;
} }
<xc>{op_chars} { {op_chars} {
ECHO; ECHO;
} }
<xc>\*+ { \*+ {
ECHO; ECHO;
} }
} /* <xc> */
{xbstart} { {xbstart} {
BEGIN(xb); BEGIN(xb);
......
...@@ -10,7 +10,6 @@ ...@@ -10,7 +10,6 @@
* Portions Copyright (c) 1996-2018, PostgreSQL Global Development Group * Portions Copyright (c) 1996-2018, PostgreSQL Global Development Group
* Portions Copyright (c) 1994, Regents of the University of California * Portions Copyright (c) 1994, Regents of the University of California
* *
*
* IDENTIFICATION * IDENTIFICATION
* src/interfaces/ecpg/preproc/pgc.l * src/interfaces/ecpg/preproc/pgc.l
* *
...@@ -28,6 +27,9 @@ ...@@ -28,6 +27,9 @@
} }
%{ %{
/* LCOV_EXCL_START */
extern YYSTYPE base_yylval; extern YYSTYPE base_yylval;
static int xcdepth = 0; /* depth of nesting in slash-star comments */ static int xcdepth = 0; /* depth of nesting in slash-star comments */
...@@ -53,8 +55,9 @@ static bool include_next; ...@@ -53,8 +55,9 @@ static bool include_next;
#define startlit() (literalbuf[0] = '\0', literallen = 0) #define startlit() (literalbuf[0] = '\0', literallen = 0)
static void addlit(char *ytext, int yleng); static void addlit(char *ytext, int yleng);
static void addlitchar (unsigned char); static void addlitchar(unsigned char);
static void parse_include (void); static int process_integer_literal(const char *token, YYSTYPE *lval);
static void parse_include(void);
static bool ecpg_isspace(char ch); static bool ecpg_isspace(char ch);
static bool isdefine(void); static bool isdefine(void);
static bool isinformixdefine(void); static bool isinformixdefine(void);
...@@ -81,8 +84,6 @@ static struct _if_value ...@@ -81,8 +84,6 @@ static struct _if_value
short else_branch; short else_branch;
} stacked_if_value[MAX_NESTED_IF]; } stacked_if_value[MAX_NESTED_IF];
/* LCOV_EXCL_START */
%} %}
%option 8bit %option 8bit
...@@ -91,11 +92,8 @@ static struct _if_value ...@@ -91,11 +92,8 @@ static struct _if_value
%option noinput %option noinput
%option noyywrap %option noyywrap
%option warn %option warn
%option prefix="base_yy"
%option yylineno %option yylineno
%option prefix="base_yy"
%x C SQL incl def def_ident undef
/* /*
* OK, here is a short description of lex/flex rules behavior. * OK, here is a short description of lex/flex rules behavior.
...@@ -108,18 +106,24 @@ static struct _if_value ...@@ -108,18 +106,24 @@ static struct _if_value
* We use exclusive states for quoted strings, extended comments, * We use exclusive states for quoted strings, extended comments,
* and to eliminate parsing troubles for numeric strings. * and to eliminate parsing troubles for numeric strings.
* Exclusive states: * Exclusive states:
* <xb> bit string literal * <xb> bit string literal
* <xcc> extended C-style comments in C * <xcc> extended C-style comments in C
* <xcsql> extended C-style comments in SQL * <xcsql> extended C-style comments in SQL
* <xd> delimited identifiers (double-quoted identifiers) - thomas 1997-10-27 * <xd> delimited identifiers (double-quoted identifiers)
* <xh> hexadecimal numeric string - thomas 1997-11-16 * <xdc> double-quoted strings in C
* <xq> standard quoted strings - thomas 1997-07-30 * <xh> hexadecimal numeric string
* <xqc> standard quoted strings in C - michael * <xn> national character quoted strings
* <xe> extended quoted strings (support backslash escape sequences) * <xq> standard quoted strings
* <xn> national character quoted strings * <xe> extended quoted strings (support backslash escape sequences)
* <xqc> single-quoted strings in C
* <xdolq> $foo$ quoted strings * <xdolq> $foo$ quoted strings
* <xui> quoted identifier with Unicode escapes * <xui> quoted identifier with Unicode escapes
* <xus> quoted string with Unicode escapes * <xus> quoted string with Unicode escapes
* <xcond> condition of an EXEC SQL IFDEF construct
* <xskip> skipping the inactive part of an EXEC SQL IFDEF construct
*
* Remember to add an <<EOF>> case whenever you add a new exclusive state!
* The default one is probably not the right thing.
*/ */
%x xb %x xb
...@@ -128,15 +132,60 @@ static struct _if_value ...@@ -128,15 +132,60 @@ static struct _if_value
%x xd %x xd
%x xdc %x xdc
%x xh %x xh
%x xe
%x xn %x xn
%x xq %x xq
%x xe
%x xqc %x xqc
%x xdolq %x xdolq
%x xcond
%x xskip
%x xui %x xui
%x xus %x xus
%x xcond
%x xskip
/* Additional exclusive states that are specific to ECPG */
%x C SQL incl def def_ident undef
/*
* In order to make the world safe for Windows and Mac clients as well as
* Unix ones, we accept either \n or \r as a newline. A DOS-style \r\n
* sequence will be seen as two successive newlines, but that doesn't cause
* any problems. SQL-style comments, which start with -- and extend to the
* next newline, are treated as equivalent to a single whitespace character.
*
* NOTE a fine point: if there is no newline following --, we will absorb
* everything to the end of the input as a comment. This is correct. Older
* versions of Postgres failed to recognize -- as a comment if the input
* did not end with a newline.
*
* XXX perhaps \f (formfeed) should be treated as a newline as well?
*
* XXX if you change the set of whitespace characters, fix ecpg_isspace()
* to agree.
*/
space [ \t\n\r\f]
horiz_space [ \t\f]
newline [\n\r]
non_newline [^\n\r]
comment ("--"{non_newline}*)
whitespace ({space}+|{comment})
/*
* SQL requires at least one newline in the whitespace separating
* string literals that are to be concatenated. Silly, but who are we
* to argue? Note that {whitespace_with_newline} should not have * after
* it, whereas {whitespace} should generally have a * after it...
*/
horiz_whitespace ({horiz_space}|{comment})
whitespace_with_newline ({horiz_whitespace}*{newline}{whitespace}*)
quote '
quotestop {quote}{whitespace}*
quotecontinue {quote}{whitespace_with_newline}{quote}
quotefail {quote}{whitespace}*"-"
/* Bit string /* Bit string
*/ */
...@@ -158,9 +207,6 @@ xeoctesc [\\][0-7]{1,3} ...@@ -158,9 +207,6 @@ xeoctesc [\\][0-7]{1,3}
xehexesc [\\]x[0-9A-Fa-f]{1,2} xehexesc [\\]x[0-9A-Fa-f]{1,2}
xeunicode [\\](u[0-9A-Fa-f]{4}|U[0-9A-Fa-f]{8}) xeunicode [\\](u[0-9A-Fa-f]{4}|U[0-9A-Fa-f]{8})
/* C version of hex number */
xch 0[xX][0-9A-Fa-f]*
/* Extended quote /* Extended quote
* xqdouble implements embedded quote, '''' * xqdouble implements embedded quote, ''''
*/ */
...@@ -194,7 +240,9 @@ xddouble {dquote}{dquote} ...@@ -194,7 +240,9 @@ xddouble {dquote}{dquote}
xdinside [^"]+ xdinside [^"]+
/* Unicode escapes */ /* Unicode escapes */
/* (The ecpg scanner is not backup-free, so the fail rules in scan.l are not needed here, but could be added if desired.) */ /* (The ecpg scanner is not backup-free, so the fail rules in scan.l are
* not needed here, but could be added if desired.)
*/
uescape [uU][eE][sS][cC][aA][pP][eE]{whitespace}*{quote}[^']{quote} uescape [uU][eE][sS][cC][aA][pP][eE]{whitespace}*{quote}[^']{quote}
/* Quoted identifier with Unicode escapes */ /* Quoted identifier with Unicode escapes */
...@@ -211,22 +259,23 @@ xdcqdq \\\" ...@@ -211,22 +259,23 @@ xdcqdq \\\"
xdcother [^"] xdcother [^"]
xdcinside ({xdcqq}|{xdcqdq}|{xdcother}) xdcinside ({xdcqq}|{xdcqdq}|{xdcother})
/* C-style comments /* C-style comments
* *
* The "extended comment" syntax closely resembles allowable operator syntax. * The "extended comment" syntax closely resembles allowable operator syntax.
* The tricky part here is to get lex to recognize a string starting with * The tricky part here is to get lex to recognize a string starting with
* slash-star as a comment, when interpreting it as an operator would produce * slash-star as a comment, when interpreting it as an operator would produce
* a longer match --- remember lex will prefer a longer match! Also, if we * a longer match --- remember lex will prefer a longer match! Also, if we
* have something like plus-slash-star, lex will think this is a 3-character * have something like plus-slash-star, lex will think this is a 3-character
* operator whereas we want to see it as a + operator and a comment start. * operator whereas we want to see it as a + operator and a comment start.
* The solution is two-fold: * The solution is two-fold:
* 1. append {op_chars}* to xcstart so that it matches as much text as * 1. append {op_chars}* to xcstart so that it matches as much text as
* {operator} would. Then the tie-breaker (first matching rule of same * {operator} would. Then the tie-breaker (first matching rule of same
* length) ensures xcstart wins. We put back the extra stuff with yyless() * length) ensures xcstart wins. We put back the extra stuff with yyless()
* in case it contains a star-slash that should terminate the comment. * in case it contains a star-slash that should terminate the comment.
* 2. In the operator rule, check for slash-star within the operator, and * 2. In the operator rule, check for slash-star within the operator, and
* if found throw it back with yyless(). This handles the plus-slash-star * if found throw it back with yyless(). This handles the plus-slash-star
* problem. * problem.
* Dash-dash comments have similar interactions with the operator rule. * Dash-dash comments have similar interactions with the operator rule.
*/ */
xcstart \/\*{op_chars}* xcstart \/\*{op_chars}*
...@@ -262,7 +311,7 @@ not_equals "!=" ...@@ -262,7 +311,7 @@ not_equals "!="
/* /*
* "self" is the set of chars that should be returned as single-character * "self" is the set of chars that should be returned as single-character
* tokens. "op_chars" is the set of chars that can make up "Op" tokens, * tokens. "op_chars" is the set of chars that can make up "Op" tokens,
* which can be one or more characters long (but if a single-char token * which can be one or more characters long (but if a single-char token
* appears in the "self" set, it is not to be returned as an Op). Note * appears in the "self" set, it is not to be returned as an Op). Note
* that the sets overlap, but each has some chars that are not in the other. * that the sets overlap, but each has some chars that are not in the other.
...@@ -278,68 +327,40 @@ operator {op_chars}+ ...@@ -278,68 +327,40 @@ operator {op_chars}+
* instead we pass it separately to parser. there it gets * instead we pass it separately to parser. there it gets
* coerced via doNegate() -- Leon aug 20 1999 * coerced via doNegate() -- Leon aug 20 1999
* *
* {decimalfail} is used because we would like "1..10" to lex as 1, dot_dot, 10.
*
* {realfail1} and {realfail2} are added to prevent the need for scanner * {realfail1} and {realfail2} are added to prevent the need for scanner
* backup when the {real} rule fails to match completely. * backup when the {real} rule fails to match completely.
*/ */
integer {digit}+ integer {digit}+
decimal (({digit}*\.{digit}+)|({digit}+\.{digit}*)) decimal (({digit}*\.{digit}+)|({digit}+\.{digit}*))
decimalfail {digit}+\.\.
real ({integer}|{decimal})[Ee][-+]?{digit}+ real ({integer}|{decimal})[Ee][-+]?{digit}+
realfail1 ({integer}|{decimal})[Ee] realfail1 ({integer}|{decimal})[Ee]
realfail2 ({integer}|{decimal})[Ee][-+] realfail2 ({integer}|{decimal})[Ee][-+]
param \${integer} param \${integer}
/*
* In order to make the world safe for Windows and Mac clients as well as
* Unix ones, we accept either \n or \r as a newline. A DOS-style \r\n
* sequence will be seen as two successive newlines, but that doesn't cause
* any problems. SQL-style comments, which start with -- and extend to the
* next newline, are treated as equivalent to a single whitespace character.
*
* NOTE a fine point: if there is no newline following --, we will absorb
* everything to the end of the input as a comment. This is correct. Older
* versions of Postgres failed to recognize -- as a comment if the input
* did not end with a newline.
*
* XXX perhaps \f (formfeed) should be treated as a newline as well?
*
* XXX if you change the set of whitespace characters, fix ecpg_isspace()
* to agree.
*/
ccomment "//".*\n
space [ \t\n\r\f]
horiz_space [ \t\f]
newline [\n\r]
non_newline [^\n\r]
comment ("--"{non_newline}*)
whitespace ({space}+|{comment})
/*
* SQL requires at least one newline in the whitespace separating
* string literals that are to be concatenated. Silly, but who are we
* to argue? Note that {whitespace_with_newline} should not have * after
* it, whereas {whitespace} should generally have a * after it...
*/
horiz_whitespace ({horiz_space}|{comment})
whitespace_with_newline ({horiz_whitespace}*{newline}{whitespace}*)
quote '
quotestop {quote}{whitespace}*
quotecontinue {quote}{whitespace_with_newline}{quote}
quotefail {quote}{whitespace}*"-"
/* special characters for other dbms */ /* special characters for other dbms */
/* we have to react differently in compat mode */ /* we have to react differently in compat mode */
informix_special [\$] informix_special [\$]
other . other .
/*
* Dollar quoted strings are totally opaque, and no escaping is done on them.
* Other quoted strings must allow some special characters such as single-quote
* and newline.
* Embedded single-quotes are implemented both in the SQL standard
* style of two adjacent single quotes "''" and in the Postgres/Java style
* of escaped-quote "\'".
* Other embedded escaped characters are matched explicitly and the leading
* backslash is dropped from the string.
* Note that xcstart must appear before operator, as explained above!
* Also whitespace (comment) must appear before operator.
*/
/* some stuff needed for ecpg */ /* some stuff needed for ecpg */
exec [eE][xX][eE][cC] exec [eE][xX][eE][cC]
sql [sS][qQ][lL] sql [sS][qQ][lL]
...@@ -349,6 +370,11 @@ include_next [iI][nN][cC][lL][uU][dD][eE]_[nN][eE][xX][tT] ...@@ -349,6 +370,11 @@ include_next [iI][nN][cC][lL][uU][dD][eE]_[nN][eE][xX][tT]
import [iI][mM][pP][oO][rR][tT] import [iI][mM][pP][oO][rR][tT]
undef [uU][nN][dD][eE][fF] undef [uU][nN][dD][eE][fF]
/* C version of hex number */
xch 0[xX][0-9A-Fa-f]*
ccomment "//".*\n
if [iI][fF] if [iI][fF]
ifdef [iI][fF][dD][eE][fF] ifdef [iI][fF][dD][eE][fF]
ifndef [iI][fF][nN][dD][eE][fF] ifndef [iI][fF][nN][dD][eE][fF]
...@@ -366,24 +392,12 @@ ip {ipdigit}\.{ipdigit}\.{ipdigit}\.{ipdigit} ...@@ -366,24 +392,12 @@ ip {ipdigit}\.{ipdigit}\.{ipdigit}\.{ipdigit}
cppinclude {space}*#{include}{space}* cppinclude {space}*#{include}{space}*
cppinclude_next {space}*#{include_next}{space}* cppinclude_next {space}*#{include_next}{space}*
/* take care of cpp lines, they may also be continuated */ /* take care of cpp lines, they may also be continued */
/* first a general line for all commands not starting with "i" */ /* first a general line for all commands not starting with "i" */
/* and then the other commands starting with "i", we have to add these /* and then the other commands starting with "i", we have to add these
* separately because the cppline production would match on "include" too */ * separately because the cppline production would match on "include" too
cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+\/)|.|\\{space}*{newline})*{newline}
/*
* Dollar quoted strings are totally opaque, and no escaping is done on them.
* Other quoted strings must allow some special characters such as single-quote
* and newline.
* Embedded single-quotes are implemented both in the SQL standard
* style of two adjacent single quotes "''" and in the Postgres/Java style
* of escaped-quote "\'".
* Other embedded escaped characters are matched explicitly and the leading
* backslash is dropped from the string. - thomas 1997-09-24
* Note that xcstart must appear before operator, as explained above!
* Also whitespace (comment) must appear before operator.
*/ */
cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+\/)|.|\\{space}*{newline})*{newline}
%% %%
...@@ -392,22 +406,27 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+ ...@@ -392,22 +406,27 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+
token_start = NULL; token_start = NULL;
%} %}
<SQL>{whitespace} { /* ignore */ } <SQL>{
{whitespace} {
/* ignore */
}
<C>{xcstart} { {xcstart} {
token_start = yytext; token_start = yytext;
state_before = YYSTATE; state_before = YYSTATE;
xcdepth = 0; xcdepth = 0;
BEGIN(xcc); BEGIN(xcsql);
/* Put back any characters past slash-star; see above */ /* Put back any characters past slash-star; see above */
yyless(2); yyless(2);
fputs("/*", yyout); fputs("/*", yyout);
} }
<SQL>{xcstart} { } /* <SQL> */
<C>{xcstart} {
token_start = yytext; token_start = yytext;
state_before = YYSTATE; state_before = YYSTATE;
xcdepth = 0; xcdepth = 0;
BEGIN(xcsql); BEGIN(xcc);
/* Put back any characters past slash-star; see above */ /* Put back any characters past slash-star; see above */
yyless(2); yyless(2);
fputs("/*", yyout); fputs("/*", yyout);
...@@ -437,20 +456,36 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+ ...@@ -437,20 +456,36 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+
BEGIN(state_before); BEGIN(state_before);
token_start = NULL; token_start = NULL;
} }
<xcc,xcsql>{xcinside} { ECHO; }
<xcc,xcsql>{op_chars} { ECHO; }
<xcc,xcsql>\*+ { ECHO; }
<xcc,xcsql><<EOF>> { mmfatal(PARSE_ERROR, "unterminated /* comment"); } <xcc,xcsql>{
{xcinside} {
ECHO;
}
{op_chars} {
ECHO;
}
\*+ {
ECHO;
}
<<EOF>> {
mmfatal(PARSE_ERROR, "unterminated /* comment");
}
} /* <xcc,xcsql> */
<SQL>{xbstart} { <SQL>{
{xbstart} {
token_start = yytext; token_start = yytext;
BEGIN(xb); BEGIN(xb);
startlit(); startlit();
addlitchar('b'); addlitchar('b');
} }
<xb>{quotestop} | } /* <SQL> */
<xb>{quotefail} {
<xb>{quotestop} |
<xb>{quotefail} {
yyless(1); yyless(1);
BEGIN(SQL); BEGIN(SQL);
if (literalbuf[strspn(literalbuf, "01") + 1] != '\0') if (literalbuf[strspn(literalbuf, "01") + 1] != '\0')
...@@ -458,11 +493,14 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+ ...@@ -458,11 +493,14 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+
base_yylval.str = mm_strdup(literalbuf); base_yylval.str = mm_strdup(literalbuf);
return BCONST; return BCONST;
} }
<xh>{xhinside} | <xh>{xhinside} |
<xb>{xbinside} { addlit(yytext, yyleng); } <xb>{xbinside} {
addlit(yytext, yyleng);
}
<xh>{quotecontinue} | <xh>{quotecontinue} |
<xb>{quotecontinue} { /* ignore */ } <xb>{quotecontinue} {
/* ignore */
}
<xb><<EOF>> { mmfatal(PARSE_ERROR, "unterminated bit string literal"); } <xb><<EOF>> { mmfatal(PARSE_ERROR, "unterminated bit string literal"); }
<SQL>{xhstart} { <SQL>{xhstart} {
...@@ -472,186 +510,251 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+ ...@@ -472,186 +510,251 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+
addlitchar('x'); addlitchar('x');
} }
<xh>{quotestop} | <xh>{quotestop} |
<xh>{quotefail} { <xh>{quotefail} {
yyless(1); yyless(1);
BEGIN(SQL); BEGIN(SQL);
base_yylval.str = mm_strdup(literalbuf); base_yylval.str = mm_strdup(literalbuf);
return XCONST; return XCONST;
} }
<xh><<EOF>> { mmfatal(PARSE_ERROR, "unterminated hexadecimal string literal"); } <xh><<EOF>> { mmfatal(PARSE_ERROR, "unterminated hexadecimal string literal"); }
<SQL>{xnstart} {
/* National character.
* Transfer it as-is to the backend.
*/
token_start = yytext;
state_before = YYSTATE;
BEGIN(xn);
startlit();
}
<C>{xqstart} { <C>{xqstart} {
token_start = yytext; token_start = yytext;
state_before = YYSTATE; state_before = YYSTATE;
BEGIN(xqc); BEGIN(xqc);
startlit(); startlit();
} }
<SQL>{xqstart} {
token_start = yytext; <SQL>{
state_before = YYSTATE; {xnstart} {
BEGIN(xq); /* National character.
startlit(); * Transfer it as-is to the backend.
} */
<SQL>{xestart} { token_start = yytext;
token_start = yytext; state_before = YYSTATE;
state_before = YYSTATE; BEGIN(xn);
BEGIN(xe); startlit();
startlit(); }
}
<SQL>{xusstart} { {xqstart} {
token_start = yytext; token_start = yytext;
state_before = YYSTATE; state_before = YYSTATE;
BEGIN(xus); BEGIN(xq);
startlit(); startlit();
addlit(yytext, yyleng); }
} {xestart} {
token_start = yytext;
state_before = YYSTATE;
BEGIN(xe);
startlit();
}
{xusstart} {
token_start = yytext;
state_before = YYSTATE;
BEGIN(xus);
startlit();
addlit(yytext, yyleng);
}
} /* <SQL> */
<xq,xqc>{quotestop} | <xq,xqc>{quotestop} |
<xq,xqc>{quotefail} { <xq,xqc>{quotefail} {
yyless(1); yyless(1);
BEGIN(state_before); BEGIN(state_before);
base_yylval.str = mm_strdup(literalbuf); base_yylval.str = mm_strdup(literalbuf);
return SCONST; return SCONST;
} }
<xe>{quotestop} | <xe>{quotestop} |
<xe>{quotefail} { <xe>{quotefail} {
yyless(1); yyless(1);
BEGIN(state_before); BEGIN(state_before);
base_yylval.str = mm_strdup(literalbuf); base_yylval.str = mm_strdup(literalbuf);
return ECONST; return ECONST;
} }
<xn>{quotestop} | <xn>{quotestop} |
<xn>{quotefail} { <xn>{quotefail} {
yyless(1); yyless(1);
BEGIN(state_before); BEGIN(state_before);
base_yylval.str = mm_strdup(literalbuf); base_yylval.str = mm_strdup(literalbuf);
return NCONST; return NCONST;
} }
<xus>{xusstop} { <xus>{xusstop} {
addlit(yytext, yyleng); addlit(yytext, yyleng);
BEGIN(state_before); BEGIN(state_before);
base_yylval.str = mm_strdup(literalbuf); base_yylval.str = mm_strdup(literalbuf);
return UCONST; return UCONST;
} }
<xq,xe,xn,xus>{xqdouble} { addlitchar('\''); } <xq,xe,xn,xus>{xqdouble} { addlitchar('\''); }
<xqc>{xqcquote} { <xqc>{xqcquote} {
addlitchar('\\'); addlitchar('\\');
addlitchar('\''); addlitchar('\'');
} }
<xq,xqc,xn,xus>{xqinside} { addlit(yytext, yyleng); } <xq,xqc,xn,xus>{xqinside} { addlit(yytext, yyleng); }
<xe>{xeinside} { addlit(yytext, yyleng); } <xe>{xeinside} {
<xe>{xeunicode} { addlit(yytext, yyleng); } addlit(yytext, yyleng);
<xe>{xeescape} { addlit(yytext, yyleng); } }
<xe>{xeoctesc} { addlit(yytext, yyleng); } <xe>{xeunicode} {
<xe>{xehexesc} { addlit(yytext, yyleng); } addlit(yytext, yyleng);
<xq,xqc,xe,xn,xus>{quotecontinue} { /* ignore */ } }
<xe>. { <xe>{xeescape} {
/* This is only needed for \ just before EOF */ addlit(yytext, yyleng);
addlitchar(yytext[0]); }
} <xe>{xeoctesc} {
addlit(yytext, yyleng);
}
<xe>{xehexesc} {
addlit(yytext, yyleng);
}
<xq,xqc,xe,xn,xus>{quotecontinue} {
/* ignore */
}
<xe>. {
/* This is only needed for \ just before EOF */
addlitchar(yytext[0]);
}
<xq,xqc,xe,xn,xus><<EOF>> { mmfatal(PARSE_ERROR, "unterminated quoted string"); } <xq,xqc,xe,xn,xus><<EOF>> { mmfatal(PARSE_ERROR, "unterminated quoted string"); }
<SQL>{dolqfailed} {
/* throw back all but the initial "$" */ <SQL>{
yyless(1); {dolqdelim} {
/* and treat it as {other} */ token_start = yytext;
return yytext[0]; if (dolqstart)
} free(dolqstart);
<SQL>{dolqdelim} { dolqstart = mm_strdup(yytext);
token_start = yytext; BEGIN(xdolq);
if (dolqstart) startlit();
free(dolqstart);
dolqstart = mm_strdup(yytext);
BEGIN(xdolq);
startlit();
addlit(yytext, yyleng);
}
<xdolq>{dolqdelim} {
if (strcmp(yytext, dolqstart) == 0)
{
addlit(yytext, yyleng); addlit(yytext, yyleng);
free(dolqstart);
dolqstart = NULL;
BEGIN(SQL);
base_yylval.str = mm_strdup(literalbuf);
return DOLCONST;
} }
else {dolqfailed} {
{ /* throw back all but the initial "$" */
/* yyless(1);
* When we fail to match $...$ to dolqstart, transfer /* and treat it as {other} */
* the $... part to the output, but put back the final return yytext[0];
* $ for rescanning. Consider $delim$...$junk$delim$
*/
addlit(yytext, yyleng-1);
yyless(yyleng-1);
} }
} } /* <SQL> */
<xdolq>{dolqinside} { addlit(yytext, yyleng); }
<xdolq>{dolqfailed} { addlit(yytext, yyleng); } <xdolq>{dolqdelim} {
<xdolq>{other} { if (strcmp(yytext, dolqstart) == 0)
/* single quote or dollar sign */ {
addlitchar(yytext[0]);
}
<xdolq><<EOF>> { base_yyerror("unterminated dollar-quoted string"); }
<SQL>{xdstart} {
state_before = YYSTATE;
BEGIN(xd);
startlit();
}
<SQL>{xuistart} {
state_before = YYSTATE;
BEGIN(xui);
startlit();
addlit(yytext, yyleng);
}
<xd>{xdstop} {
BEGIN(state_before);
if (literallen == 0)
mmerror(PARSE_ERROR, ET_ERROR, "zero-length delimited identifier");
/* The backend will truncate the identifier here. We do not as it does not change the result. */
base_yylval.str = mm_strdup(literalbuf);
return CSTRING;
}
<xdc>{xdstop} {
BEGIN(state_before);
base_yylval.str = mm_strdup(literalbuf);
return CSTRING;
}
<xui>{xuistop} {
BEGIN(state_before);
if (literallen == 2) /* "U&" */
mmerror(PARSE_ERROR, ET_ERROR, "zero-length delimited identifier");
/* The backend will truncate the identifier here. We do not as it does not change the result. */
addlit(yytext, yyleng); addlit(yytext, yyleng);
free(dolqstart);
dolqstart = NULL;
BEGIN(SQL);
base_yylval.str = mm_strdup(literalbuf); base_yylval.str = mm_strdup(literalbuf);
return UIDENT; return DOLCONST;
} }
<xd,xui>{xddouble} { addlitchar('"'); } else
<xd,xui>{xdinside} { addlit(yytext, yyleng); } {
<xd,xdc,xui><<EOF>> { mmfatal(PARSE_ERROR, "unterminated quoted identifier"); } /*
<C,SQL>{xdstart} { * When we fail to match $...$ to dolqstart, transfer
state_before = YYSTATE; * the $... part to the output, but put back the final
BEGIN(xdc); * $ for rescanning. Consider $delim$...$junk$delim$
startlit(); */
addlit(yytext, yyleng - 1);
yyless(yyleng - 1);
} }
<xdc>{xdcinside} { addlit(yytext, yyleng); } }
<SQL>{typecast} { return TYPECAST; } <xdolq>{dolqinside} {
<SQL>{dot_dot} { return DOT_DOT; } addlit(yytext, yyleng);
<SQL>{colon_equals} { return COLON_EQUALS; } }
<SQL>{equals_greater} { return EQUALS_GREATER; } <xdolq>{dolqfailed} {
<SQL>{less_equals} { return LESS_EQUALS; } addlit(yytext, yyleng);
<SQL>{greater_equals} { return GREATER_EQUALS; } }
<SQL>{less_greater} { return NOT_EQUALS; } <xdolq>. {
<SQL>{not_equals} { return NOT_EQUALS; } /* single quote or dollar sign */
<SQL>{informix_special} { addlitchar(yytext[0]);
}
<xdolq><<EOF>> { mmfatal(PARSE_ERROR, "unterminated dollar-quoted string"); }
<SQL>{
{xdstart} {
state_before = YYSTATE;
BEGIN(xd);
startlit();
}
{xuistart} {
state_before = YYSTATE;
BEGIN(xui);
startlit();
addlit(yytext, yyleng);
}
} /* <SQL> */
<xd>{xdstop} {
BEGIN(state_before);
if (literallen == 0)
mmerror(PARSE_ERROR, ET_ERROR, "zero-length delimited identifier");
/* The backend will truncate the identifier here. We do not as it does not change the result. */
base_yylval.str = mm_strdup(literalbuf);
return CSTRING;
}
<xdc>{xdstop} {
BEGIN(state_before);
base_yylval.str = mm_strdup(literalbuf);
return CSTRING;
}
<xui>{xuistop} {
BEGIN(state_before);
if (literallen == 2) /* "U&" */
mmerror(PARSE_ERROR, ET_ERROR, "zero-length delimited identifier");
/* The backend will truncate the identifier here. We do not as it does not change the result. */
addlit(yytext, yyleng);
base_yylval.str = mm_strdup(literalbuf);
return UIDENT;
}
<xd,xui>{xddouble} {
addlitchar('"');
}
<xd,xui>{xdinside} {
addlit(yytext, yyleng);
}
<xd,xui><<EOF>> { mmfatal(PARSE_ERROR, "unterminated quoted identifier"); }
<C>{xdstart} {
state_before = YYSTATE;
BEGIN(xdc);
startlit();
}
<xdc>{xdcinside} {
addlit(yytext, yyleng);
}
<xdc><<EOF>> { mmfatal(PARSE_ERROR, "unterminated quoted string"); }
<SQL>{
{typecast} {
return TYPECAST;
}
{dot_dot} {
return DOT_DOT;
}
{colon_equals} {
return COLON_EQUALS;
}
{equals_greater} {
return EQUALS_GREATER;
}
{less_equals} {
return LESS_EQUALS;
}
{greater_equals} {
return GREATER_EQUALS;
}
{less_greater} {
/* We accept both "<>" and "!=" as meaning NOT_EQUALS */
return NOT_EQUALS;
}
{not_equals} {
/* We accept both "<>" and "!=" as meaning NOT_EQUALS */
return NOT_EQUALS;
}
{informix_special} {
/* are we simulating Informix? */ /* are we simulating Informix? */
if (INFORMIX_MODE) if (INFORMIX_MODE)
{ {
...@@ -660,184 +763,205 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+ ...@@ -660,184 +763,205 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+
else else
return yytext[0]; return yytext[0];
} }
<SQL>{self} { /*
* We may find a ';' inside a structure
* definition in a TYPE or VAR statement.
* This is not an EOL marker.
*/
if (yytext[0] == ';' && struct_level == 0)
BEGIN(C);
return yytext[0];
}
<SQL>{operator} {
/*
* Check for embedded slash-star or dash-dash; those
* are comment starts, so operator must stop there.
* Note that slash-star or dash-dash at the first
* character will match a prior rule, not this one.
*/
int nchars = yyleng;
char *slashstar = strstr(yytext, "/*");
char *dashdash = strstr(yytext, "--");
if (slashstar && dashdash) {self} {
{ /*
/* if both appear, take the first one */ * We may find a ';' inside a structure
if (slashstar > dashdash) * definition in a TYPE or VAR statement.
slashstar = dashdash; * This is not an EOL marker.
} */
else if (!slashstar) if (yytext[0] == ';' && struct_level == 0)
BEGIN(C);
return yytext[0];
}
{operator} {
/*
* Check for embedded slash-star or dash-dash; those
* are comment starts, so operator must stop there.
* Note that slash-star or dash-dash at the first
* character will match a prior rule, not this one.
*/
int nchars = yyleng;
char *slashstar = strstr(yytext, "/*");
char *dashdash = strstr(yytext, "--");
if (slashstar && dashdash)
{
/* if both appear, take the first one */
if (slashstar > dashdash)
slashstar = dashdash; slashstar = dashdash;
if (slashstar) }
nchars = slashstar - yytext; else if (!slashstar)
slashstar = dashdash;
if (slashstar)
nchars = slashstar - yytext;
/* /*
* For SQL compatibility, '+' and '-' cannot be the * For SQL compatibility, '+' and '-' cannot be the
* last char of a multi-char operator unless the operator * last char of a multi-char operator unless the operator
* contains chars that are not in SQL operators. * contains chars that are not in SQL operators.
* The idea is to lex '=-' as two operators, but not * The idea is to lex '=-' as two operators, but not
* to forbid operator names like '?-' that could not be * to forbid operator names like '?-' that could not be
* sequences of SQL operators. * sequences of SQL operators.
*/ */
if (nchars > 1 && if (nchars > 1 &&
(yytext[nchars - 1] == '+' || (yytext[nchars - 1] == '+' ||
yytext[nchars - 1] == '-')) yytext[nchars - 1] == '-'))
{ {
int ic; int ic;
for (ic = nchars - 2; ic >= 0; ic--) for (ic = nchars - 2; ic >= 0; ic--)
{ {
char c = yytext[ic]; char c = yytext[ic];
if (c == '~' || c == '!' || c == '@' || if (c == '~' || c == '!' || c == '@' ||
c == '#' || c == '^' || c == '&' || c == '#' || c == '^' || c == '&' ||
c == '|' || c == '`' || c == '?' || c == '|' || c == '`' || c == '?' ||
c == '%') c == '%')
break; break;
}
if (ic < 0)
{
/*
* didn't find a qualifying character, so remove
* all trailing [+-]
*/
do {
nchars--;
} while (nchars > 1 &&
(yytext[nchars - 1] == '+' ||
yytext[nchars - 1] == '-'));
}
} }
if (ic < 0)
if (nchars < yyleng)
{ {
/* Strip the unwanted chars from the token */
yyless(nchars);
/*
* If what we have left is only one char, and it's
* one of the characters matching "self", then
* return it as a character token the same way
* that the "self" rule would have.
*/
if (nchars == 1 &&
strchr(",()[].;:+-*/%^<>=", yytext[0]))
return yytext[0];
/* /*
* Likewise, if what we have left is two chars, and * didn't find a qualifying character, so remove
* those match the tokens ">=", "<=", "=>", "<>" or * all trailing [+-]
* "!=", then we must return the appropriate token
* rather than the generic Op.
*/ */
if (nchars == 2) do {
{ nchars--;
if (yytext[0] == '=' && yytext[1] == '>') } while (nchars > 1 &&
return EQUALS_GREATER; (yytext[nchars - 1] == '+' ||
if (yytext[0] == '>' && yytext[1] == '=') yytext[nchars - 1] == '-'));
return GREATER_EQUALS;
if (yytext[0] == '<' && yytext[1] == '=')
return LESS_EQUALS;
if (yytext[0] == '<' && yytext[1] == '>')
return NOT_EQUALS;
if (yytext[0] == '!' && yytext[1] == '=')
return NOT_EQUALS;
}
} }
base_yylval.str = mm_strdup(yytext);
return Op;
}
<SQL>{param} {
base_yylval.ival = atol(yytext+1);
return PARAM;
} }
<C,SQL>{integer} {
int val;
char* endptr;
errno = 0; if (nchars < yyleng)
val = strtoint(yytext, &endptr, 10); {
if (*endptr != '\0' || errno == ERANGE) /* Strip the unwanted chars from the token */
yyless(nchars);
/*
* If what we have left is only one char, and it's
* one of the characters matching "self", then
* return it as a character token the same way
* that the "self" rule would have.
*/
if (nchars == 1 &&
strchr(",()[].;:+-*/%^<>=", yytext[0]))
return yytext[0];
/*
* Likewise, if what we have left is two chars, and
* those match the tokens ">=", "<=", "=>", "<>" or
* "!=", then we must return the appropriate token
* rather than the generic Op.
*/
if (nchars == 2)
{ {
errno = 0; if (yytext[0] == '=' && yytext[1] == '>')
base_yylval.str = mm_strdup(yytext); return EQUALS_GREATER;
return FCONST; if (yytext[0] == '>' && yytext[1] == '=')
return GREATER_EQUALS;
if (yytext[0] == '<' && yytext[1] == '=')
return LESS_EQUALS;
if (yytext[0] == '<' && yytext[1] == '>')
return NOT_EQUALS;
if (yytext[0] == '!' && yytext[1] == '=')
return NOT_EQUALS;
} }
base_yylval.ival = val;
return ICONST;
} }
<SQL>{ip} {
base_yylval.str = mm_strdup(yytext); base_yylval.str = mm_strdup(yytext);
return IP; return Op;
} }
<C,SQL>{decimal} {
base_yylval.str = mm_strdup(yytext); {param} {
return FCONST; base_yylval.ival = atol(yytext+1);
} return PARAM;
<C,SQL>{real} { }
base_yylval.str = mm_strdup(yytext);
return FCONST; {ip} {
} base_yylval.str = mm_strdup(yytext);
<SQL>{realfail1} { return IP;
yyless(yyleng-1); }
base_yylval.str = mm_strdup(yytext); } /* <SQL> */
return FCONST;
} <C,SQL>{
<SQL>{realfail2} { {integer} {
yyless(yyleng-2); return process_integer_literal(yytext, &base_yylval);
}
{decimal} {
base_yylval.str = mm_strdup(yytext);
return FCONST;
}
{decimalfail} {
/* throw back the .., and treat as integer */
yyless(yyleng - 2);
return process_integer_literal(yytext, &base_yylval);
}
{real} {
base_yylval.str = mm_strdup(yytext);
return FCONST;
}
{realfail1} {
/*
* throw back the [Ee], and treat as {decimal}. Note
* that it is possible the input is actually {integer},
* but since this case will almost certainly lead to a
* syntax error anyway, we don't bother to distinguish.
*/
yyless(yyleng - 1);
base_yylval.str = mm_strdup(yytext);
return FCONST;
}
{realfail2} {
/* throw back the [Ee][+-], and proceed as above */
yyless(yyleng - 2);
base_yylval.str = mm_strdup(yytext);
return FCONST;
}
} /* <C,SQL> */
<SQL>{
:{identifier}((("->"|\.){identifier})|(\[{array}\]))* {
base_yylval.str = mm_strdup(yytext+1);
return CVARIABLE;
}
{identifier} {
const ScanKeyword *keyword;
if (!isdefine())
{
/* Is it an SQL/ECPG keyword? */
keyword = ScanECPGKeywordLookup(yytext);
if (keyword != NULL)
return keyword->value;
/* Is it a C keyword? */
keyword = ScanCKeywordLookup(yytext);
if (keyword != NULL)
return keyword->value;
/*
* None of the above. Return it as an identifier.
*
* The backend will attempt to truncate and case-fold
* the identifier, but I see no good reason for ecpg
* to do so; that's just another way that ecpg could get
* out of step with the backend.
*/
base_yylval.str = mm_strdup(yytext); base_yylval.str = mm_strdup(yytext);
return FCONST; return IDENT;
}
<SQL>:{identifier}((("->"|\.){identifier})|(\[{array}\]))* {
base_yylval.str = mm_strdup(yytext+1);
return CVARIABLE;
} }
<SQL>{identifier} { }
const ScanKeyword *keyword;
if (!isdefine()) {other} {
{ return yytext[0];
/* Is it an SQL/ECPG keyword? */ }
keyword = ScanECPGKeywordLookup(yytext); } /* <SQL> */
if (keyword != NULL)
return keyword->value;
/* Is it a C keyword? */ /*
keyword = ScanCKeywordLookup(yytext); * Begin ECPG-specific rules
if (keyword != NULL) */
return keyword->value;
/*
* None of the above. Return it as an identifier.
*
* The backend will attempt to truncate and case-fold
* the identifier, but I see no good reason for ecpg
* to do so; that's just another way that ecpg could get
* out of step with the backend.
*/
base_yylval.str = mm_strdup(yytext);
return IDENT;
}
}
<SQL>{other} { return yytext[0]; }
<C>{exec_sql} { BEGIN(SQL); return SQL_START; } <C>{exec_sql} { BEGIN(SQL); return SQL_START; }
<C>{informix_special} { <C>{informix_special} {
/* are we simulating Informix? */ /* are we simulating Informix? */
...@@ -1288,6 +1412,7 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+ ...@@ -1288,6 +1412,7 @@ cppline {space}*#([^i][A-Za-z]*|{if}|{ifdef}|{ifndef}|{import})((\/\*[^*/]*\*+
} }
} }
<INITIAL>{other}|\n { mmfatal(PARSE_ERROR, "internal error: unreachable state; please report this to <pgsql-bugs@postgresql.org>"); } <INITIAL>{other}|\n { mmfatal(PARSE_ERROR, "internal error: unreachable state; please report this to <pgsql-bugs@postgresql.org>"); }
%% %%
...@@ -1350,6 +1475,24 @@ addlitchar(unsigned char ychar) ...@@ -1350,6 +1475,24 @@ addlitchar(unsigned char ychar)
literalbuf[literallen] = '\0'; literalbuf[literallen] = '\0';
} }
static int
process_integer_literal(const char *token, YYSTYPE *lval)
{
int val;
char *endptr;
errno = 0;
val = strtoint(token, &endptr, 10);
if (*endptr != '\0' || errno == ERANGE)
{
/* integer too large, treat it as a float */
lval->str = mm_strdup(token);
return FCONST;
}
lval->ival = val;
return ICONST;
}
static void static void
parse_include(void) parse_include(void)
{ {
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment