%{ /*------------------------------------------------------------------------- * * pgc.l * lexical scanner for ecpg * * This is a modified version of src/backend/parser/scan.l * * * Portions Copyright (c) 1996-2000, PostgreSQL, Inc * Portions Copyright (c) 1994, Regents of the University of California * * * IDENTIFICATION * $Header: /cvsroot/pgsql/src/interfaces/ecpg/preproc/pgc.l,v 1.49 2000/01/26 05:58:41 momjian Exp $ * *------------------------------------------------------------------------- */ #include #include #include #include #include "postgres.h" #include "miscadmin.h" #include "nodes/parsenodes.h" #include "nodes/pg_list.h" #include "parser/scansup.h" #include "extern.h" #include "preproc.h" #include "utils/builtins.h" /* some versions of lex define this as a macro */ #if defined(yywrap) #undef yywrap #endif /* yywrap */ extern YYSTYPE yylval; /* * literalbuf is used to accumulate literal values when multiple rules * are needed to parse a single literal. Call startlit to reset buffer * to empty, addlit to add text. Note that the buffer is permanently * malloc'd to the largest size needed so far in the current run. */ static char *literalbuf = NULL; /* expandable buffer */ static int literallen; /* actual current length */ static int literalalloc; /* current allocated buffer size */ #define startlit() (literalbuf[0] = '\0', literallen = 0) static void addlit(char *ytext, int yleng); int before_comment; struct _yy_buffer { YY_BUFFER_STATE buffer; long lineno; char * filename; struct _yy_buffer * next; } *yy_buffer = NULL; static char *old; #define MAX_NESTED_IF 128 static short preproc_tos; static short ifcond; static struct _if_value { short condition; short else_branch; } stacked_if_value[MAX_NESTED_IF]; %} %option yylineno %s C SQL incl def def_ident /* OK, here is a short description of lex/flex rules behavior. * The longest pattern which matches an input string is always chosen. * For equal-length patterns, the first occurring in the rules list is chosen. * INITIAL is the starting condition, to which all non-conditional rules apply. * When in an exclusive condition, only those rules defined for that condition apply. * * Exclusive states change parsing rules while the state is active. * There are exclusive states for quoted strings, extended comments, * and to eliminate parsing troubles for numeric strings. * Exclusive states: * binary numeric string - thomas 1997-11-16 * extended C-style comments - tgl 1997-07-12 * delimited identifiers (double-quoted identifiers) - tgl 1997-10-27 * hexadecimal numeric string - thomas 1997-11-16 * quoted strings - tgl 1997-07-30 * * The "extended comment" syntax closely resembles allowable operator syntax. * So, when in condition , only strings which would terminate the * "extended comment" trigger any action other than "ignore". * Be sure to match _any_ candidate comment, including those with appended * operator-like symbols. - thomas 1997-07-14 */ %x xb %x xc %x xd %x xdc %x xh %x xq %x xpre %x xcond %x xskip /* Binary number */ xbstart [bB]{quote} xbstop {quote} xbinside [^']* xbcat {quote}{space}*\n{space}*{quote} /* Hexadecimal number */ xhstart [xX]{quote} xhstop {quote} xhinside [^']* xhcat {quote}{space}*\n{space}*{quote} /* C version of hex number */ xch 0[xX][0-9A-Fa-f]* /* Extended quote * xqdouble implements SQL92 embedded quote * xqcat allows strings to cross input lines */ quote ' xqstart {quote} xqstop {quote} xqdouble {quote}{quote} xqinside [^\\']* xqliteral [\\](.|\n) xqcat {quote}{space}*\n{space}*{quote} /* Delimited quote * Allows embedded spaces and other special characters into identifiers. */ dquote \" xdstart {dquote} xdstop {dquote} xdinside [^"]* /* special stuff for C strings */ xdcqq \\\\ xdcqdq \\\" xdcother [^"] xdcinside ({xdcqq}|{xdcqdq}|{xdcother}) /* Comments * Ignored by the scanner and parser. */ xcline [\/][\*].*[\*][\/]{line_end}+ xcstart [\/][\*]{op_and_self}* xcstop {op_and_self}*[\*][\/]{space_or_nl}* xcinside [^*]* xcstar [^/] digit [0-9] letter [\200-\377_A-Za-z] letter_or_digit [\200-\377_A-Za-z0-9] identifier {letter}{letter_or_digit}* typecast "::" self [,()\[\].;$\:\+\-\*\/\%\^\<\>\=\|] op_and_self [\~\!\@\#\^\&\|\`\?\$\:\+\-\*\/\%\<\>\=] operator {op_and_self}+ /* we no longer allow unary minus in numbers. * instead we pass it separately to parser. there it gets * coerced via doNegate() -- Leon aug 20 1999 */ integer {digit}+ decimal (({digit}*\.{digit}+)|({digit}+\.{digit}*)) real ((({digit}*\.{digit}+)|({digit}+\.{digit}*)|({digit}+))([Ee][-+]?{digit}+)) param \${integer} comment ("--"|"//").* ccomment "//".*\n space [ \t\r\f] space_or_nl [ \t\r\f\n] line_end {space}*\n other . /* some stuff needed for ecpg */ exec [eE][xX][eE][cC] sql [sS][qQ][lL] define [dD][eE][fF][iI][nN][eE] include [iI][nN][cC][lL][uU][dD][eE] ifdef [iI][fF][dD][eE][fF] ifndef [iI][fF][nN][dD][eE][fF] else [eE][lL][sS][eE] elif [eE][lL][iI][fF] endif [eE][nN][dD][iI][fF] exec_sql {exec}{space_or_nl}*{sql}{space_or_nl}* /* Take care of cpp continuation lines */ cppline {space}*#(.*\\{line_end})*.* /* DO NOT PUT ANY COMMENTS IN THE FOLLOWING SECTION. * AT&T lex does not properly handle C-style comments in this second lex block. * So, put comments here. tgl - 1997-09-08 * * Quoted strings must allow some special characters such as single-quote * and newline. * Embedded single-quotes are implemented both in the SQL/92-standard * style of two adjacent single quotes "''" and in the Postgres/Java style * of escaped-quote "\'". * Other embedded escaped characters are matched explicitly and the leading * backslash is dropped from the string. - thomas 1997-09-24 */ %% {comment} { /* ignore */ } {xcline} { ECHO; } {xcstar} { ECHO; } {xcstart} { before_comment = YYSTATE; ECHO; BEGIN(xc); } {xcstop} { ECHO; BEGIN(before_comment); } {xcinside} { ECHO; } {xbstart} { BEGIN(xb); startlit(); } {xbstop} { char* endptr; BEGIN(SQL); errno = 0; yylval.ival = strtol(literalbuf, &endptr, 2); if (*endptr != '\0' || errno == ERANGE) yyerror("ERROR: Bad binary integer input!"); return ICONST; } {xhinside} | {xbinside} { addlit(yytext, yyleng); } {xhcat} | {xbcat} { } {xhstart} { BEGIN(xh); startlit(); } {xhstop} { char* endptr; BEGIN(SQL); errno = 0; yylval.ival = strtol(literalbuf, &endptr, 16); if (*endptr != '\0' || errno == ERANGE) yyerror("ERROR: Bad hexadecimal integer input"); return ICONST; } {xqstart} { BEGIN(xq); startlit(); } {xqstop} { BEGIN(SQL); yylval.str = mm_strdup(literalbuf); return SCONST; } {xqdouble} | {xqinside} | {xqliteral} { addlit(yytext, yyleng); } {xqcat} { } {xdstart} { BEGIN(xd); startlit(); } {xdstop} { BEGIN(SQL); yylval.str = mm_strdup(literalbuf); return CSTRING; } {xdinside} { addlit(yytext, yyleng); } {xdstart} { BEGIN(xdc); startlit(); } {xdstop} { BEGIN(C); yylval.str = mm_strdup(literalbuf); return CSTRING; } {xdcinside} { addlit(yytext, yyleng); } {typecast} { return TYPECAST; } {self} { /* * We may find a ';' inside a structure * definition in a TYPE or VAR statement. * This is not an EOL marker. */ if (yytext[0] == ';' && struct_level == 0) BEGIN C; return yytext[0]; } {operator} { if (strcmp((char*)yytext,"!=") == 0) yylval.str = mm_strdup("<>"); /* compatability */ else yylval.str = mm_strdup((char*)yytext); return Op; } {param} { yylval.ival = atoi((char*)&yytext[1]); return PARAM; } {integer} { char* endptr; errno = 0; yylval.ival = strtol((char *)yytext,&endptr,10); if (*endptr != '\0' || errno == ERANGE) { errno = 0; yylval.str = mm_strdup((char*)yytext); return SCONST; } return ICONST; } {decimal} { char* endptr; if (strlen((char *)yytext) <= 17) { errno = 0; yylval.dval = strtod((char *)yytext,&endptr); if (*endptr != '\0' || errno == ERANGE) yyerror("ERROR: Bad float8 input"); return FCONST; } yylval.str = mm_strdup((char*)yytext); return SCONST; } {real} { char* endptr; errno = 0; yylval.dval = strtod((char *)yytext,&endptr); if (*endptr != '\0' || errno == ERANGE) yyerror("ERROR: Bad float input"); return FCONST; } :{identifier}(("->"|\.){identifier})* { yylval.str = mm_strdup((char*)yytext+1); return(CVARIABLE); } {identifier} { int i; ScanKeyword *keyword; char lower_text[NAMEDATALEN]; /* this should leave the last byte set to '\0' */ strncpy(lower_text, yytext, NAMEDATALEN-1); for(i = 0; lower_text[i]; i++) if (isascii((unsigned char)lower_text[i]) && isupper(lower_text[i])) lower_text[i] = tolower(lower_text[i]); keyword = ScanKeywordLookup((char*)lower_text); if (keyword != NULL) { return keyword->value; } else { keyword = ScanECPGKeywordLookup((char*)lower_text); if (keyword != NULL) { return keyword->value; } else { struct _defines *ptr; for (ptr = defines; ptr; ptr = ptr->next) { if (strcmp(yytext, ptr->old) == 0) { struct _yy_buffer *yb; yb = mm_alloc(sizeof(struct _yy_buffer)); yb->buffer = YY_CURRENT_BUFFER; yb->lineno = yylineno; yb->filename = mm_strdup(input_filename); yb->next = yy_buffer; yy_buffer = yb; yy_scan_string(ptr->new); break; } } if (ptr == NULL) { yylval.str = mm_strdup((char*)yytext); return IDENT; } } } } {space_or_nl} { /* ignore */ } {other} { return yytext[0]; } {exec_sql} { BEGIN SQL; return SQL_START; } {ccomment} { /* ignore */ } {xch} { char* endptr; errno = 0; yylval.ival = strtol((char *)yytext,&endptr,16); if (*endptr != '\0' || errno == ERANGE) { errno = 0; yylval.str = mm_strdup((char*)yytext); return SCONST; } return ICONST; } {cppline} { yylval.str = mm_strdup((char*)yytext); return(CPP_LINE); } {identifier} { ScanKeyword *keyword; keyword = ScanCKeywordLookup((char*)yytext); if (keyword != NULL) { return keyword->value; } else { struct _defines *ptr; for (ptr = defines; ptr; ptr = ptr->next) { if (strcmp(yytext, ptr->old) == 0) { struct _yy_buffer *yb; yb = mm_alloc(sizeof(struct _yy_buffer)); yb->buffer = YY_CURRENT_BUFFER; yb->lineno = yylineno; yb->filename = mm_strdup(input_filename); yb->next = yy_buffer; yy_buffer = yb; yy_scan_string(ptr->new); break; } } if (ptr == NULL) { yylval.str = mm_strdup((char*)yytext); return IDENT; } } } ";" { return(';'); } "," { return(','); } "*" { return('*'); } "%" { return('%'); } "/" { return('/'); } "+" { return('+'); } "-" { return('-'); } "(" { return('('); } ")" { return(')'); } {space_or_nl} { ECHO; } \{ { return('{'); } \} { return('}'); } \[ { return('['); } \] { return(']'); } \= { return('='); } {other} { return S_ANYTHING; } {exec_sql}{define}{space_or_nl}* { BEGIN(def_ident); } {exec_sql}{include}{space_or_nl}* { BEGIN(incl); } {exec_sql}{ifdef}{space_or_nl}* { ifcond = TRUE; BEGIN(xcond); } {exec_sql}{ifndef}{space_or_nl}* { ifcond = FALSE; BEGIN(xcond); } {exec_sql}{elif}{space_or_nl}* { /* pop stack */ if ( preproc_tos == 0 ) { yyerror("ERROR: missing matching 'EXEC SQL IFDEF / EXEC SQL IFNDEF'"); } else if ( stacked_if_value[preproc_tos].else_branch ) { yyerror("ERROR: missing 'EXEC SQL ENDIF;'"); } else { preproc_tos--; } ifcond = TRUE; BEGIN(xcond); } {exec_sql}{else}{space_or_nl}*";" { /* only exec sql endif pops the stack, so take care of duplicated 'else' */ if ( stacked_if_value[preproc_tos].else_branch ) { yyerror("ERROR: duplicated 'EXEC SQL ELSE;'"); } else { stacked_if_value[preproc_tos].else_branch = TRUE; stacked_if_value[preproc_tos].condition = (stacked_if_value[preproc_tos-1].condition && ! stacked_if_value[preproc_tos].condition); if ( stacked_if_value[preproc_tos].condition ) { BEGIN(C); } else { BEGIN(xskip); } } } {exec_sql}{endif}{space_or_nl}*";" { if ( preproc_tos == 0 ) { yyerror("ERROR: unmatched 'EXEC SQL ENDIF;'"); } else { preproc_tos--; } if ( stacked_if_value[preproc_tos].condition ) { BEGIN(C); } else { BEGIN(xskip); } } {other} { /* ignore */ } {identifier}{space_or_nl}*";" { if ( preproc_tos >= MAX_NESTED_IF-1 ) { yyerror("ERROR: too many nested 'EXEC SQL IFDEF' conditions"); } else { struct _defines *defptr; unsigned int i; /* skip the ";" and trailing whitespace. Note that yytext contains at least one non-space character plus the ";" */ for ( i = strlen(yytext)-2; i > 0 && isspace(yytext[i]); i-- ) {} yytext[i+1] = '\0'; for ( defptr = defines; defptr != NULL && ( strcmp((char*)yytext, defptr->old) != 0 ); defptr = defptr->next ); preproc_tos++; stacked_if_value[preproc_tos].else_branch = FALSE; stacked_if_value[preproc_tos].condition = ( (defptr ? ifcond : !ifcond) && stacked_if_value[preproc_tos-1].condition ); } if ( stacked_if_value[preproc_tos].condition ) { BEGIN C; } else { BEGIN(xskip); } } {identifier} { old = mm_strdup(yytext); BEGIN(def); startlit(); } {space_or_nl}*";" { struct _defines *ptr, *this; for (ptr = defines; ptr != NULL; ptr = ptr->next) { if (strcmp(old, ptr->old) == 0) { free(ptr->new); /* ptr->new = mm_strdup(scanstr(literalbuf));*/ ptr->new = mm_strdup(literalbuf); } } if (ptr == NULL) { this = (struct _defines *) mm_alloc(sizeof(struct _defines)); /* initial definition */ this->old = old; /* this->new = mm_strdup(scanstr(literalbuf));*/ this->new = mm_strdup(literalbuf); this->next = defines; defines = this; } BEGIN(C); } [^";"] { addlit(yytext, yyleng); } [^";"]+";" { /* got the include file name */ struct _yy_buffer *yb; struct _include_path *ip; char inc_file[MAXPGPATH]; unsigned int i; yb = mm_alloc(sizeof(struct _yy_buffer)); yb->buffer = YY_CURRENT_BUFFER; yb->lineno = yylineno; yb->filename = input_filename; yb->next = yy_buffer; yy_buffer = yb; /* skip the ";" and trailing whitespace. Note that yytext contains at least one non-space character plus the ";" */ for ( i = strlen(yytext)-2; i > 0 && isspace(yytext[i]); i-- ) {} yytext[i+1] = '\0'; yyin = NULL; for (ip = include_paths; yyin == NULL && ip != NULL; ip = ip->next) { if (strlen(ip->path) + strlen(yytext) + 3 > MAXPGPATH) { fprintf(stderr, "Error: Path %s/%s is too long in line %d, skipping.\n", ip->path, yytext, yylineno); continue; } sprintf (inc_file, "%s/%s", ip->path, yytext); yyin = fopen( inc_file, "r" ); if (!yyin) { if (strcmp(inc_file + strlen(inc_file) - 2, ".h")) { strcat(inc_file, ".h"); yyin = fopen( inc_file, "r" ); } } } if (!yyin) { fprintf(stderr, "Error: Cannot open include file %s in line %d\n", yytext, yylineno); exit(NO_INCLUDE_FILE); } input_filename = mm_strdup(inc_file); yy_switch_to_buffer(yy_create_buffer(yyin,YY_BUF_SIZE )); yylineno = 1; output_line_number(); BEGIN C; } <> { if ( preproc_tos > 0 ) { preproc_tos = 0; yyerror("ERROR: missing 'EXEC SQL ENDIF;'"); } if (yy_buffer == NULL) yyterminate(); else { struct _yy_buffer *yb = yy_buffer; if (yyin != NULL) fclose(yyin); yy_delete_buffer( YY_CURRENT_BUFFER ); yy_switch_to_buffer(yy_buffer->buffer); yylineno = yy_buffer->lineno; free(input_filename); input_filename = yy_buffer->filename; yy_buffer = yy_buffer->next; free(yb); output_line_number(); } } %% void lex_init(void) { braces_open = 0; preproc_tos = 0; ifcond = TRUE; stacked_if_value[preproc_tos].condition = ifcond; stacked_if_value[preproc_tos].else_branch = FALSE; /* initialize literal buffer to a reasonable but expansible size */ if (literalbuf == NULL) { literalalloc = 128; literalbuf = (char *) malloc(literalalloc); } startlit(); BEGIN C; } static void addlit(char *ytext, int yleng) { /* enlarge buffer if needed */ if ((literallen+yleng) >= literalalloc) { do { literalalloc *= 2; } while ((literallen+yleng) >= literalalloc); literalbuf = (char *) realloc(literalbuf, literalalloc); } /* append data --- note we assume ytext is null-terminated */ memcpy(literalbuf+literallen, ytext, yleng+1); literallen += yleng; } int yywrap(void) { return 1; }