/* Copyright (c) 2011, 2015, Oracle and/or its affiliates. All rights reserved. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License, version 2.0, as published by the Free Software Foundation. This program is also distributed with certain software (including but not limited to OpenSSL) that is licensed under separate terms, as designated in a particular file or component or in included license documentation. The authors of MySQL hereby grant you an additional permission to link the program and your derivative works with the separately licensed software that they have included with MySQL. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License, version 2.0, for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, 51 Franklin Street, Suite 500, Boston, MA 02110-1335 USA */ #include #include #include #include /* We only need the tokens here */ #define YYSTYPE_IS_DECLARED #include #include #include /* ORACLE_WELCOME_COPYRIGHT_NOTICE */ /* This is a tool used during build only, so MY_MAX_TOKEN does not need to be exact, only big enough to hold: - 256 character terminal tokens - YYNTOKENS named terminal tokens from bison. See also YYMAXUTOK. */ #define MY_MAX_TOKEN 1000 /** Generated token. */ struct gen_lex_token_string { const char *m_token_string; int m_token_length; bool m_append_space; bool m_start_expr; }; gen_lex_token_string compiled_token_array[MY_MAX_TOKEN]; int max_token_seen= 0; char char_tokens[256]; int tok_generic_value= 0; int tok_generic_value_list= 0; int tok_row_single_value= 0; int tok_row_single_value_list= 0; int tok_row_multiple_value= 0; int tok_row_multiple_value_list= 0; int tok_ident= 0; int tok_unused= 0; void set_token(int tok, const char *str) { if (tok <= 0) { fprintf(stderr, "Bad token found\n"); exit(1); } if (tok > max_token_seen) { max_token_seen= tok; } if (max_token_seen >= MY_MAX_TOKEN) { fprintf(stderr, "Added that many new keywords ? Increase MY_MAX_TOKEN\n"); exit(1); } compiled_token_array[tok].m_token_string= str; compiled_token_array[tok].m_token_length= strlen(str); compiled_token_array[tok].m_append_space= true; compiled_token_array[tok].m_start_expr= false; } void set_start_expr_token(int tok) { compiled_token_array[tok].m_start_expr= true; } void compute_tokens() { int tok; unsigned int i; char *str; /* Default value. */ for (tok= 0; tok < MY_MAX_TOKEN; tok++) { compiled_token_array[tok].m_token_string= "(unknown)"; compiled_token_array[tok].m_token_length= 9; compiled_token_array[tok].m_append_space= true; compiled_token_array[tok].m_start_expr= false; } /* Tokens made of just one terminal character */ for (tok=0; tok < 256; tok++) { str= & char_tokens[tok]; str[0]= (char) tok; compiled_token_array[tok].m_token_string= str; compiled_token_array[tok].m_token_length= 1; compiled_token_array[tok].m_append_space= true; } max_token_seen= 255; /* String terminal tokens, used in sql_yacc.yy */ set_token(NEG, "~"); set_token(TABLE_REF_PRIORITY, "TABLE_REF_PRIORITY"); /* Tokens hard coded in sql_lex.cc */ set_token(WITH_CUBE_SYM, "WITH CUBE"); set_token(WITH_ROLLUP_SYM, "WITH ROLLUP"); set_token(NOT2_SYM, "!"); set_token(OR2_SYM, "|"); set_token(PARAM_MARKER, "?"); set_token(SET_VAR, ":="); set_token(UNDERSCORE_CHARSET, "(_charset)"); set_token(END_OF_INPUT, ""); /* Values. These tokens are all normalized later, so this strings will never be displayed. */ set_token(BIN_NUM, "(bin)"); set_token(DECIMAL_NUM, "(decimal)"); set_token(FLOAT_NUM, "(float)"); set_token(HEX_NUM, "(hex)"); set_token(LEX_HOSTNAME, "(hostname)"); set_token(LONG_NUM, "(long)"); set_token(NUM, "(num)"); set_token(TEXT_STRING, "(text)"); set_token(NCHAR_STRING, "(nchar)"); set_token(ULONGLONG_NUM, "(ulonglong)"); /* Identifiers. */ set_token(IDENT, "(id)"); set_token(IDENT_QUOTED, "(id_quoted)"); /* Unused tokens */ set_token(LOCATOR_SYM, "LOCATOR"); set_token(SERVER_OPTIONS, "SERVER_OPTIONS"); set_token(UDF_RETURNS_SYM, "UDF_RETURNS"); /* See symbols[] in sql/lex.h */ for (i= 0; i< sizeof(symbols)/sizeof(symbols[0]); i++) { set_token(symbols[i].tok, symbols[i].name); } /* See sql_functions[] in sql/lex.h */ for (i= 0; i< sizeof(sql_functions)/sizeof(sql_functions[0]); i++) { set_token(sql_functions[i].tok, sql_functions[i].name); } /* Additional FAKE tokens, used internally to normalize a digest text. */ max_token_seen++; tok_generic_value= max_token_seen; set_token(tok_generic_value, "?"); max_token_seen++; tok_generic_value_list= max_token_seen; set_token(tok_generic_value_list, "?, ..."); max_token_seen++; tok_row_single_value= max_token_seen; set_token(tok_row_single_value, "(?)"); max_token_seen++; tok_row_single_value_list= max_token_seen; set_token(tok_row_single_value_list, "(?) /* , ... */"); max_token_seen++; tok_row_multiple_value= max_token_seen; set_token(tok_row_multiple_value, "(...)"); max_token_seen++; tok_row_multiple_value_list= max_token_seen; set_token(tok_row_multiple_value_list, "(...) /* , ... */"); max_token_seen++; tok_ident= max_token_seen; set_token(tok_ident, "(tok_id)"); max_token_seen++; tok_unused= max_token_seen; set_token(tok_unused, "UNUSED"); /* Fix whitespace for some special tokens. */ /* The lexer parses "@@variable" as '@', '@', 'variable', returning a token for '@' alone. This is incorrect, '@' is not really a token, because the syntax "@ @ variable" (with spaces) is not accepted: The lexer keeps some internal state after the '@' fake token. To work around this, digest text are printed as "@@variable". */ compiled_token_array[(int) '@'].m_append_space= false; /* Define additional properties for tokens. List all the token that are followed by an expression. This is needed to differentiate unary from binary '+' and '-' operators, because we want to: - reduce to , - preserve <...> as is. */ set_start_expr_token('('); set_start_expr_token(','); set_start_expr_token(EVERY_SYM); set_start_expr_token(AT_SYM); set_start_expr_token(STARTS_SYM); set_start_expr_token(ENDS_SYM); set_start_expr_token(DEFAULT); set_start_expr_token(RETURN_SYM); set_start_expr_token(IF); set_start_expr_token(ELSEIF_SYM); set_start_expr_token(CASE_SYM); set_start_expr_token(WHEN_SYM); set_start_expr_token(WHILE_SYM); set_start_expr_token(UNTIL_SYM); set_start_expr_token(SELECT_SYM); set_start_expr_token(OR_SYM); set_start_expr_token(OR2_SYM); set_start_expr_token(XOR); set_start_expr_token(AND_SYM); set_start_expr_token(AND_AND_SYM); set_start_expr_token(NOT_SYM); set_start_expr_token(BETWEEN_SYM); set_start_expr_token(LIKE); set_start_expr_token(REGEXP); set_start_expr_token('|'); set_start_expr_token('&'); set_start_expr_token(SHIFT_LEFT); set_start_expr_token(SHIFT_RIGHT); set_start_expr_token('+'); set_start_expr_token('-'); set_start_expr_token(INTERVAL_SYM); set_start_expr_token('*'); set_start_expr_token('/'); set_start_expr_token('%'); set_start_expr_token(DIV_SYM); set_start_expr_token(MOD_SYM); set_start_expr_token('^'); } void print_tokens() { int tok; printf("#ifdef LEX_TOKEN_WITH_DEFINITION\n"); printf("lex_token_string lex_token_array[]=\n"); printf("{\n"); printf("/* PART 1: character tokens. */\n"); for (tok= 0; tok<256; tok++) { printf("/* %03d */ { \"\\x%02x\", 1, %s, %s},\n", tok, tok, compiled_token_array[tok].m_append_space ? "true" : "false", compiled_token_array[tok].m_start_expr ? "true" : "false"); } printf("/* PART 2: named tokens. */\n"); for (tok= 256; tok<= max_token_seen; tok++) { printf("/* %03d */ { \"%s\", %d, %s, %s},\n", tok, compiled_token_array[tok].m_token_string, compiled_token_array[tok].m_token_length, compiled_token_array[tok].m_append_space ? "true" : "false", compiled_token_array[tok].m_start_expr ? "true" : "false"); } printf("/* DUMMY */ { \"\", 0, false, false}\n"); printf("};\n"); printf("#endif /* LEX_TOKEN_WITH_DEFINITION */\n"); printf("/* DIGEST specific tokens. */\n"); printf("#define TOK_GENERIC_VALUE %d\n", tok_generic_value); printf("#define TOK_GENERIC_VALUE_LIST %d\n", tok_generic_value_list); printf("#define TOK_ROW_SINGLE_VALUE %d\n", tok_row_single_value); printf("#define TOK_ROW_SINGLE_VALUE_LIST %d\n", tok_row_single_value_list); printf("#define TOK_ROW_MULTIPLE_VALUE %d\n", tok_row_multiple_value); printf("#define TOK_ROW_MULTIPLE_VALUE_LIST %d\n", tok_row_multiple_value_list); printf("#define TOK_IDENT %d\n", tok_ident); printf("#define TOK_UNUSED %d\n", tok_unused); } int main(int argc,char **argv) { puts("/*"); puts(ORACLE_WELCOME_COPYRIGHT_NOTICE("2011")); puts("*/"); printf("/*\n"); printf(" This file is generated, do not edit.\n"); printf(" See file sql/gen_lex_token.cc.\n"); printf("*/\n"); printf("struct lex_token_string\n"); printf("{\n"); printf(" const char *m_token_string;\n"); printf(" int m_token_length;\n"); printf(" bool m_append_space;\n"); printf(" bool m_start_expr;\n"); printf("};\n"); printf("typedef struct lex_token_string lex_token_string;\n"); compute_tokens(); print_tokens(); return 0; }