| /* Bison Grammar Parser -*- C -*- |
| |
| Copyright (C) 2002-2015, 2018-2021 Free Software Foundation, Inc. |
| |
| This file is part of Bison, the GNU Compiler Compiler. |
| |
| This program is free software: you can redistribute it and/or modify |
| it under the terms of the GNU General Public License as published by |
| the Free Software Foundation, either version 3 of the License, or |
| (at your option) any later version. |
| |
| This program is distributed in the hope that it will be useful, |
| but WITHOUT ANY WARRANTY; without even the implied warranty of |
| MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| GNU General Public License for more details. |
| |
| You should have received a copy of the GNU General Public License |
| along with this program. If not, see <https://www.gnu.org/licenses/>. */ |
| |
| %code requires |
| { |
| #include "symlist.h" |
| #include "symtab.h" |
| } |
| |
| %code provides |
| { |
| /* Initialize the obstack on which unquote builds its results. |
| To be called before unquote is first used. */ |
| void parser_init (void); |
| /* Deallocate the storage of that obstack, i.e., all the strings |
| built by unquote that are still allocated. */ |
| void parser_free (void); |
| } |
| |
| %code top |
| { |
| /* On column 0 to please syntax-check. */ |
| #include <config.h> |
| } |
| |
| %code |
| { |
| #include "system.h" |
| |
| #include <c-ctype.h> |
| #include <quotearg.h> |
| #include <vasnprintf.h> |
| #include <xmemdup0.h> |
| |
| #include "complain.h" |
| #include "conflicts.h" |
| #include "files.h" |
| #include "getargs.h" |
| #include "gram.h" |
| #include "named-ref.h" |
| #include "reader.h" |
| #include "scan-code.h" |
| #include "scan-gram.h" |
| #include "strversion.h" |
| |
| /* Pretend to be at least that version, to check features published |
| in that version while developing it. Used by handle_require, which |
| compares the required version against the newest of this one and |
| PACKAGE_VERSION. */ |
| static const char* api_version = "3.8"; |
| |
| static int current_prec = 0; /* Incremented by each precedence declaration, which uses the new value. */ |
| static location current_lhs_loc; /* This one and the next two are set by current_lhs. */ |
| static named_ref *current_lhs_named_ref; |
| static symbol *current_lhs_symbol; |
| static symbol_class current_class = unknown_sym; /* Class for the symbols being declared by %nterm, %token or %type; unknown_sym otherwise. */ |
| |
| /** Set the new current left-hand side symbol, possibly common |
| * to several right-hand side parts of rule. |
| * |
| * \param sym the new left-hand side, or NULL once the rules are done. |
| * \param loc the location stored as that of the current lhs. |
| * \param ref the named reference of the lhs, or NULL. The previously |
| * stored named reference is freed. |
| */ |
| static void current_lhs (symbol *sym, location loc, named_ref *ref); |
| |
| #define YYLLOC_DEFAULT(Current, Rhs, N) \ |
| (Current) = lloc_default (Rhs, N) |
| static YYLTYPE lloc_default (YYLTYPE const *, int); /* The implementation of YYLLOC_DEFAULT. */ |
| |
| #define YY_LOCATION_PRINT(File, Loc) \ |
| location_print (Loc, File) |
| |
| /* Strip initial '{' and final '}' (must be first and last characters). |
| CODE is modified in place: its last character is overwritten with a |
| NUL. Return the result, which points into CODE. */ |
| static char *strip_braces (char *code); |
| |
| /* Convert CODE by calling code_props_plain_init if PLAIN, otherwise |
| code_props_symbol_action_init. Calls |
| gram_scanner_last_string_free to release the latest string from |
| the scanner (should be CODE). */ |
| static char const *translate_code (char *code, location loc, bool plain); |
| |
| /* Convert CODE by calling code_props_plain_init after having |
| stripped the first and last characters (expected to be '{', and |
| '}'). Calls gram_scanner_last_string_free to release the latest |
| string from the scanner (should be CODE). */ |
| static char const *translate_code_braceless (char *code, location loc); |
| |
| /* Handle a %header directive. VALUE is its quoted argument, or NULL |
| when there is none. */ |
| static void handle_header (char const *value); |
| |
| /* Handle a %error-verbose directive. DIRECTIVE is its spelling. */ |
| static void handle_error_verbose (location const *loc, char const *directive); |
| |
| /* Handle a %file-prefix directive. LOC is the location of the whole |
| directive, DIR_LOC that of its first symbol, DIRECTIVE its spelling, |
| and VALUE its quoted argument. */ |
| static void handle_file_prefix (location const *loc, |
| location const *dir_loc, |
| char const *directive, char const *value); |
| |
| /* Handle a %language directive. LANG is its quoted argument. */ |
| static void handle_language (location const *loc, char const *lang); |
| |
| /* Handle a %name-prefix directive. DIRECTIVE is its spelling, and |
| VALUE its quoted argument. */ |
| static void handle_name_prefix (location const *loc, |
| char const *directive, char const *value); |
| |
| /* Handle a %pure-parser directive. DIRECTIVE is its spelling. */ |
| static void handle_pure_parser (location const *loc, char const *directive); |
| |
| /* Handle a %require directive. VERSION is its quoted argument, and |
| LOC the location of that argument. */ |
| static void handle_require (location const *loc, char const *version); |
| |
| /* Handle a %skeleton directive. SKEL is its quoted argument, and |
| LOC the location of that argument. */ |
| static void handle_skeleton (location const *loc, char const *skel); |
| |
| /* Handle a %yacc directive. */ |
| static void handle_yacc (location const *loc); |
| |
| /* Implementation of yyerror. */ |
| static void gram_error (location const *, char const *); |
| |
| /* A string that describes a char (e.g., 'a' -> "'a'"). */ |
| static char const *char_name (char); |
| |
| /* Add style to semantic values in traces. */ |
| static void tron (FILE *yyo); |
| static void troff (FILE *yyo); |
| |
| /* Interpret a quoted string (such as `"Hello, \"World\"\n\""`). |
| STR must start with a double quote, and end with one. |
| Manages the memory of the result: it is built on an obstack, see |
| unquote_free and parser_free. */ |
| static char *unquote (const char *str); |
| |
| /* Discard the latest unquoted string. LAST_STRING is expected to be |
| a result of unquote. */ |
| static void unquote_free (char *last_string); |
| } |
| |
| %define api.header.include {"parse-gram.h"} |
| %define api.prefix {gram_} /* Hence gram_error rather than yyerror. */ |
| %define api.pure full |
| %define api.token.raw /* Incompatible with character literals as tokens: see the rule for id. */ |
| %define api.value.type union |
| %define locations |
| %define parse.error custom /* Errors are reported by yyreport_syntax_error, in the epilogue. */ |
| %define parse.lac full |
| %define parse.trace |
| %header |
| %expect 0 /* No shift/reduce conflict is expected. */ |
| %verbose |
| |
| %initial-action |
| { |
| /* Bison's grammar can start with empty symbols (prologue_declarations |
| may be empty), whose locations are computed from the initial |
| location, hence a default location is needed: the first column of |
| the first line of the grammar file. */ |
| boundary_set (&@$.start, grammar_file, 1, 1, 1); |
| boundary_set (&@$.end, grammar_file, 1, 1, 1); |
| } |
| |
| %token /* Each token comes with the string alias used in the rules below; the aliases written _("...") are the translatable ones (see TSTRING in the rule for alias). */ |
| STRING _("string") |
| TSTRING _("translatable string") |
| |
| PERCENT_TOKEN "%token" |
| PERCENT_NTERM "%nterm" |
| |
| PERCENT_TYPE "%type" |
| PERCENT_DESTRUCTOR "%destructor" |
| PERCENT_PRINTER "%printer" |
| |
| PERCENT_LEFT "%left" |
| PERCENT_RIGHT "%right" |
| PERCENT_NONASSOC "%nonassoc" |
| PERCENT_PRECEDENCE "%precedence" |
| |
| PERCENT_PREC "%prec" |
| PERCENT_DPREC "%dprec" |
| PERCENT_MERGE "%merge" |
| |
| PERCENT_CODE "%code" |
| PERCENT_DEFAULT_PREC "%default-prec" |
| PERCENT_DEFINE "%define" |
| PERCENT_ERROR_VERBOSE "%error-verbose" |
| PERCENT_EXPECT "%expect" |
| PERCENT_EXPECT_RR "%expect-rr" |
| PERCENT_FILE_PREFIX "%file-prefix" |
| PERCENT_FLAG "%<flag>" |
| PERCENT_GLR_PARSER "%glr-parser" |
| PERCENT_HEADER "%header" |
| PERCENT_INITIAL_ACTION "%initial-action" |
| PERCENT_LANGUAGE "%language" |
| PERCENT_NAME_PREFIX "%name-prefix" |
| PERCENT_NO_DEFAULT_PREC "%no-default-prec" |
| PERCENT_NO_LINES "%no-lines" |
| PERCENT_NONDETERMINISTIC_PARSER "%nondeterministic-parser" |
| PERCENT_OUTPUT "%output" |
| PERCENT_PURE_PARSER "%pure-parser" |
| PERCENT_REQUIRE "%require" |
| PERCENT_SKELETON "%skeleton" |
| PERCENT_START "%start" |
| PERCENT_TOKEN_TABLE "%token-table" |
| PERCENT_VERBOSE "%verbose" |
| PERCENT_YACC "%yacc" |
| |
| BRACED_CODE "{...}" |
| BRACED_PREDICATE "%?{...}" |
| BRACKETED_ID _("[identifier]") |
| CHAR_LITERAL _("character literal") |
| COLON ":" |
| EPILOGUE _("epilogue") |
| EQUAL "=" |
| ID _("identifier") |
| ID_COLON _("identifier:") |
| PERCENT_PERCENT "%%" |
| PIPE "|" |
| PROLOGUE "%{...%}" |
| SEMICOLON ";" |
| TAG _("<tag>") |
| TAG_ANY "<*>" |
| TAG_NONE "<>" |
| |
| /* Experimental feature, don't rely on it. Calls tron and troff, |
| which style the semantic values in traces; presumably they are run |
| right before and right after each %printer (to be confirmed against |
| the skeleton). */ |
| %code pre-printer {tron (yyo);} |
| %code post-printer {troff (yyo);} |
| |
| %type <unsigned char> CHAR_LITERAL |
| %printer { fputs (char_name ($$), yyo); } <unsigned char> |
| |
| %type <char*> "{...}" "%?{...}" "%{...%}" EPILOGUE STRING TSTRING |
| %printer { fputs ($$, yyo); } <char*> |
| |
| %type <uniqstr> |
| BRACKETED_ID ID ID_COLON |
| PERCENT_ERROR_VERBOSE PERCENT_FILE_PREFIX PERCENT_FLAG PERCENT_NAME_PREFIX |
| PERCENT_PURE_PARSER |
| TAG tag tag.opt variable |
| %printer { fputs ($$, yyo); } <uniqstr> /* Default for uniqstr; refined per symbol below. */ |
| %printer { fprintf (yyo, "[%s]", $$); } BRACKETED_ID |
| %printer { fprintf (yyo, "%s:", $$); } ID_COLON |
| %printer { fprintf (yyo, "%%%s", $$); } PERCENT_FLAG |
| %printer { fprintf (yyo, "<%s>", $$); } TAG tag |
| |
| %token <int> INT_LITERAL _("integer literal") |
| %printer { fprintf (yyo, "%d", $$); } <int> |
| |
| %type <symbol*> id id_colon string_as_id symbol token_decl token_decl_for_prec |
| %printer { fprintf (yyo, "%s", $$ ? $$->tag : "<NULL>"); } <symbol*> /* A symbol* may be NULL: see alias. */ |
| %printer { fprintf (yyo, "%s:", $$->tag); } id_colon |
| |
| %type <assoc> precedence_declarator |
| |
| %destructor { symbol_list_free ($$); } <symbol_list*> |
| %printer { symbol_list_syms_print ($$, yyo); } <symbol_list*> |
| |
| %type <named_ref*> named_ref.opt |
| |
| /*---------. |
| | %param. | |
| `---------*/ |
| %code requires |
| { |
| typedef enum /* A bit set: where to push a formal argument. */ |
| { |
| param_none = 0, |
| param_lex = 1 << 0, |
| param_parse = 1 << 1, |
| param_both = param_lex | param_parse |
| } param_type; |
| }; |
| %code |
| { |
| /** Add a lex-param and/or a parse-param. |
| * |
| * \param type where to push this formal argument. |
| * \param decl the formal argument, with its braces. Destroyed: it is |
| * modified in place, and the latest string of the |
| * scanner is released. |
| * \param loc the location in the source. |
| */ |
| static void add_param (param_type type, char *decl, location loc); |
| static param_type current_param = param_none; /* Set while the arguments of a "%param" are parsed, param_none otherwise. */ |
| }; |
| %token <param_type> PERCENT_PARAM "%param"; |
| %printer |
| { |
| switch ($$) |
| { |
| #define CASE(In, Out) \ |
| case param_ ## In: fputs ("%" #Out, yyo); break |
| CASE (lex, lex-param); |
| CASE (parse, parse-param); |
| CASE (both, param); |
| #undef CASE |
| case param_none: aver (false); break; /* Not expected as the value of a token. */ |
| } |
| } <param_type>; |
| |
| |
| /*==========\ |
| | Grammar. | |
| \==========*/ |
| %% |
| |
| input: /* A whole grammar file: declarations, "%%", rules, and an optional epilogue. */ |
| prologue_declarations "%%" grammar epilogue.opt |
| ; |
| |
| |
| /*------------------------------------. |
| | Declarations: before the first %%. | |
| `------------------------------------*/ |
| |
| prologue_declarations: /* A possibly empty sequence of declarations. */ |
| %empty |
| | prologue_declarations prologue_declaration |
| ; |
| |
| prologue_declaration: /* One declaration of the first section; most directives are delegated to a handle_* function. */ |
| grammar_declaration |
| | "%{...%}" |
| { /* Prologues that follow a %union are kept apart from those that precede it. */ |
| muscle_code_grow (union_seen ? "post_prologue" : "pre_prologue", |
| translate_code ($1, @1, true), @1); |
| code_scanner_last_string_free (); |
| } |
| | "%<flag>" |
| { |
| muscle_percent_define_ensure ($1, @1, true); |
| } |
| | "%define" variable value |
| { |
| muscle_percent_define_insert ($2, @$, $3.kind, $3.chars, |
| MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE); |
| } |
| | "%header" string.opt { handle_header ($2); } |
| | "%error-verbose" { handle_error_verbose (&@$, $1); } |
| | "%expect" INT_LITERAL { expected_sr_conflicts = $2; } |
| | "%expect-rr" INT_LITERAL { expected_rr_conflicts = $2; } |
| | "%file-prefix" STRING { handle_file_prefix (&@$, &@1, $1, $2); } |
| | "%glr-parser" |
| { |
| nondeterministic_parser = true; |
| glr_parser = true; |
| } |
| | "%initial-action" "{...}" |
| { |
| muscle_code_grow ("initial_action", translate_code ($2, @2, false), @2); |
| code_scanner_last_string_free (); |
| } |
| | "%language" STRING { handle_language (&@1, $2); } |
| | "%name-prefix" STRING { handle_name_prefix (&@$, $1, $2); } |
| | "%no-lines" { no_lines_flag = true; } |
| | "%nondeterministic-parser" { nondeterministic_parser = true; } |
| | "%output" STRING { spec_outfile = unquote ($2); gram_scanner_last_string_free (); } |
| | "%param" { current_param = $1; } params { current_param = param_none; } /* current_param tells add_param where to push each argument. */ |
| | "%pure-parser" { handle_pure_parser (&@$, $1); } |
| | "%require" STRING { handle_require (&@2, $2); } |
| | "%skeleton" STRING { handle_skeleton (&@2, $2); } |
| | "%token-table" { token_table_flag = true; } |
| | "%verbose" { report_flag |= report_states; } |
| | "%yacc" { handle_yacc (&@$); } |
| | error ";" { current_class = unknown_sym; yyerrok; } /* Recover at the next ";"; the error may have interrupted a symbol declaration, so reset current_class. */ |
| | /*FIXME: Err? What is this horror doing here? */ ";" |
| ; |
| |
| params: /* One or more braced formal arguments, each registered according to current_param. */ |
| params "{...}" { add_param (current_param, $2, @2); } |
| | "{...}" { add_param (current_param, $1, @1); } |
| ; |
| |
| |
| /*----------------------. |
| | grammar_declaration. | |
| `----------------------*/ |
| |
| grammar_declaration: /* The declarations that are also accepted in the rules section (see rules_or_grammar_declaration). */ |
| symbol_declaration |
| | "%start" symbols.1 |
| { |
| grammar_start_symbols_add ($2); |
| } |
| | code_props_type "{...}" generic_symlist |
| { /* Attach the same %destructor or %printer code to each item of the list. */ |
| code_props code; |
| code_props_symbol_action_init (&code, $2, @2); |
| code_props_translate_code (&code); |
| { |
| for (symbol_list *list = $3; list; list = list->next) |
| symbol_list_code_props_set (list, $1, &code); |
| symbol_list_free ($3); |
| } |
| } |
| | "%default-prec" |
| { |
| default_prec = true; |
| } |
| | "%no-default-prec" |
| { |
| default_prec = false; |
| } |
| | "%code" "{...}" |
| { |
| /* Do not invoke muscle_percent_code_grow here since it invokes |
| muscle_user_name_list_grow. */ |
| muscle_code_grow ("percent_code()", |
| translate_code_braceless ($2, @2), @2); |
| code_scanner_last_string_free (); |
| } |
| | "%code" ID "{...}" |
| { |
| muscle_percent_code_grow ($2, @2, translate_code_braceless ($3, @3), @3); |
| code_scanner_last_string_free (); |
| } |
| ; |
| |
| %type <code_props_type> code_props_type; |
| %printer { fprintf (yyo, "%s", code_props_type_string ($$)); } <code_props_type>; |
| code_props_type: /* Which kind of code is being attached to symbols. */ |
| "%destructor" { $$ = destructor; } |
| | "%printer" { $$ = printer; } |
| ; |
| |
| /*---------. |
| | %union. | |
| `---------*/ |
| |
| %token PERCENT_UNION "%union"; |
| |
| union_name: /* The optional name of the union, recorded as api.value.union.name. */ |
| %empty {} |
| | ID { muscle_percent_define_insert ("api.value.union.name", |
| @1, muscle_keyword, $1, |
| MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE); } |
| ; |
| |
| grammar_declaration: |
| "%union" union_name "{...}" |
| { |
| union_seen = true; /* Changes where the following prologues go: see the rule for "%{...%}". */ |
| muscle_code_grow ("union_members", translate_code_braceless ($3, @3), @3); |
| code_scanner_last_string_free (); |
| } |
| ; |
| |
| |
| %type <symbol_list*> nterm_decls symbol_decls symbols.1 |
| token_decls token_decls_for_prec |
| token_decl.1 token_decl_for_prec.1; |
| symbol_declaration: /* The mid-rule actions set current_class for the declarations that follow; the final actions reset it and free the list. */ |
| "%nterm" { current_class = nterm_sym; } nterm_decls[syms] |
| { |
| current_class = unknown_sym; |
| symbol_list_free ($syms); |
| } |
| | "%token" { current_class = token_sym; } token_decls[syms] |
| { |
| current_class = unknown_sym; |
| symbol_list_free ($syms); |
| } |
| | "%type" { current_class = pct_type_sym; } symbol_decls[syms] |
| { |
| current_class = unknown_sym; |
| symbol_list_free ($syms); |
| } |
| | precedence_declarator token_decls_for_prec[syms] |
| { |
| ++current_prec; /* All the tokens of one declaration share the same, new, level. */ |
| for (symbol_list *list = $syms; list; list = list->next) |
| symbol_precedence_set (list->content.sym, current_prec, $1, @1); |
| symbol_list_free ($syms); |
| } |
| ; |
| |
| precedence_declarator: /* The associativity that the directive stands for. */ |
| "%left" { $$ = left_assoc; } |
| | "%right" { $$ = right_assoc; } |
| | "%nonassoc" { $$ = non_assoc; } |
| | "%precedence" { $$ = precedence_assoc; } |
| ; |
| |
| %type <char*> string.opt; |
| string.opt: /* An optional STRING, NULL when absent. */ |
| %empty { $$ = NULL; } |
| | STRING { $$ = $1; } |
| ; |
| |
| tag.opt: /* An optional TAG, NULL when absent. */ |
| %empty { $$ = NULL; } |
| | TAG { $$ = $1; } |
| ; |
| |
| %type <symbol_list*> generic_symlist generic_symlist_item; |
| generic_symlist: /* A non empty list of symbols and tags (for %destructor and %printer). */ |
| generic_symlist_item |
| | generic_symlist generic_symlist_item { $$ = symbol_list_append ($1, $2); } |
| ; |
| |
| generic_symlist_item: |
| symbol { $$ = symbol_list_sym_new ($1, @1); } |
| | tag { $$ = symbol_list_type_new ($1, @1); } |
| ; |
| |
| tag: /* "<*>" and "<>" are represented by the type names "*" and "". */ |
| TAG |
| | "<*>" { $$ = uniqstr_new ("*"); } |
| | "<>" { $$ = uniqstr_new (""); } |
| ; |
| |
| /*-----------------------. |
| | nterm_decls (%nterm). | |
| `-----------------------*/ |
| |
| // A non empty list of possibly tagged symbols for %nterm. |
| // |
| // Can easily be defined like symbol_decls but restricted to ID, but |
| // using token_decls allows to reduce the number of rules, and also to |
| // make nicer error messages on "%nterm 'a'" or '%nterm FOO "foo"'. |
| nterm_decls: |
| token_decls |
| ; |
| |
| /*-----------------------------------. |
| | token_decls (%token, and %nterm). | |
| `-----------------------------------*/ |
| |
| // A non empty list of possibly tagged symbols for %token or %nterm. |
| token_decls: |
| token_decl.1[syms] |
| { |
| $$ = $syms; |
| } |
| | TAG token_decl.1[syms] |
| { |
| $$ = symbol_list_type_set ($syms, $TAG); |
| } |
| | token_decls TAG token_decl.1[syms] |
| { |
| $$ = symbol_list_append ($1, symbol_list_type_set ($syms, $TAG)); |
| } |
| ; |
| |
| // One or more symbol declarations for %token or %nterm. |
| token_decl.1: |
| token_decl { $$ = symbol_list_sym_new ($1, @1); } |
| | token_decl.1 token_decl { $$ = symbol_list_append ($1, symbol_list_sym_new ($2, @2)); } |
| |
| // One symbol declaration for %token or %nterm: the symbol, optionally its code, optionally its alias. |
| token_decl: |
| id int.opt[num] alias |
| { |
| $$ = $id; |
| symbol_class_set ($id, current_class, @id, true); |
| if (0 <= $num) /* int.opt is -1 when no code is given. */ |
| symbol_code_set ($id, $num, @num); |
| if ($alias) /* alias is NULL when absent. */ |
| symbol_make_alias ($id, $alias, @alias); |
| } |
| ; |
| |
| %type <int> int.opt; |
| int.opt: /* An optional integer, -1 when absent. */ |
| %empty { $$ = -1; } |
| | INT_LITERAL |
| ; |
| |
| %type <symbol*> alias; |
| alias: /* An optional string alias, NULL when absent. */ |
| %empty { $$ = NULL; } |
| | string_as_id { $$ = $1; } |
| | TSTRING |
| { /* Like string_as_id, but the symbol is flagged as translatable. */ |
| $$ = symbol_get ($1, @1); |
| symbol_class_set ($$, token_sym, @1, false); |
| $$->translatable = true; |
| } |
| ; |
| |
| |
| /*-------------------------------------. |
| | token_decls_for_prec (%left, etc.). | |
| `-------------------------------------*/ |
| |
| // A non empty list of possibly tagged tokens for precedence declaration. |
| // |
| // Similar to %token (token_decls), but in '%left FOO 1 "foo"', it treats |
| // FOO and "foo" as two different symbols instead of aliasing them. |
| token_decls_for_prec: |
| token_decl_for_prec.1[syms] |
| { |
| $$ = $syms; |
| } |
| | TAG token_decl_for_prec.1[syms] |
| { |
| $$ = symbol_list_type_set ($syms, $TAG); |
| } |
| | token_decls_for_prec TAG token_decl_for_prec.1[syms] |
| { |
| $$ = symbol_list_append ($1, symbol_list_type_set ($syms, $TAG)); |
| } |
| ; |
| |
| // One or more token declarations for precedence declaration. |
| token_decl_for_prec.1: |
| token_decl_for_prec |
| { $$ = symbol_list_sym_new ($1, @1); } |
| | token_decl_for_prec.1 token_decl_for_prec |
| { $$ = symbol_list_append ($1, symbol_list_sym_new ($2, @2)); } |
| |
| // One token declaration for precedence declaration: a symbol with an optional code, or a string. |
| token_decl_for_prec: |
| id int.opt[num] |
| { |
| $$ = $id; |
| symbol_class_set ($id, token_sym, @id, false); |
| if (0 <= $num) /* int.opt is -1 when no code is given. */ |
| symbol_code_set ($id, $num, @num); |
| } |
| | string_as_id |
| ; |
| |
| |
| /*-----------------------------------. |
| | symbol_decls (argument of %type). | |
| `-----------------------------------*/ |
| |
| // A non empty list of typed symbols (for %type). |
| symbol_decls: |
| symbols.1[syms] |
| { |
| $$ = $syms; |
| } |
| | TAG symbols.1[syms] |
| { |
| $$ = symbol_list_type_set ($syms, $TAG); |
| } |
| | symbol_decls TAG symbols.1[syms] |
| { |
| $$ = symbol_list_append ($1, symbol_list_type_set ($syms, $TAG)); |
| } |
| ; |
| |
| // One or more symbols. Used by %type (via symbol_decls) and by %start. |
| symbols.1: |
| symbol |
| { |
| if (current_class != unknown_sym) /* Within %type, but not within %start, which leaves current_class alone. */ |
| symbol_class_set ($symbol, current_class, @symbol, false); |
| $$ = symbol_list_sym_new ($symbol, @symbol); |
| } |
| | symbols.1 symbol |
| { |
| if (current_class != unknown_sym) |
| symbol_class_set ($symbol, current_class, @symbol, false); |
| $$ = symbol_list_append ($1, symbol_list_sym_new ($symbol, @symbol)); |
| } |
| ; |
| |
| /*------------------------------------------. |
| | The grammar section: between the two %%. | |
| `------------------------------------------*/ |
| |
| grammar: /* A non empty sequence of rules and declarations. */ |
| rules_or_grammar_declaration |
| | grammar rules_or_grammar_declaration |
| ; |
| |
| /* As a Bison extension, one can use the grammar declarations in the |
| body of the grammar. Contrary to the first section, they must then |
| be followed by a semicolon. */ |
| rules_or_grammar_declaration: |
| rules |
| | grammar_declaration ";" |
| | error ";" |
| { |
| yyerrok; |
| } |
| ; |
| |
| rules: /* All the rules that share one left-hand side. */ |
| id_colon named_ref.opt { current_lhs ($1, @1, $2); } ":" rhses.1 |
| { |
| /* Free the current lhs: reset the current symbol, and free its |
| named reference. */ |
| current_lhs (0, @1, 0); |
| } |
| ; |
| |
| rhses.1: /* The alternatives, separated by "|"; semicolons are accepted after any of them. */ |
| rhs { grammar_current_rule_end (@rhs); } |
| | rhses.1 "|" rhs { grammar_current_rule_end (@rhs); } |
| | rhses.1 ";" |
| ; |
| |
| %token PERCENT_EMPTY "%empty"; |
| rhs: /* Built left to right: the empty alternative opens the rule for the current lhs, each other alternative appends one item to it. */ |
| %empty |
| { grammar_current_rule_begin (current_lhs_symbol, current_lhs_loc, |
| current_lhs_named_ref); } |
| | rhs symbol named_ref.opt |
| { grammar_current_rule_symbol_append ($2, @2, $3); } |
| | rhs tag.opt "{...}"[action] named_ref.opt[name] |
| { grammar_current_rule_action_append ($action, @action, $name, $[tag.opt]); } |
| | rhs "%?{...}" |
| { grammar_current_rule_predicate_append ($2, @2); } |
| | rhs "%empty" |
| { grammar_current_rule_empty_set (@2); } |
| | rhs "%prec" symbol |
| { grammar_current_rule_prec_set ($3, @3); } |
| | rhs "%dprec" INT_LITERAL |
| { grammar_current_rule_dprec_set ($3, @3); } |
| | rhs "%merge" TAG |
| { grammar_current_rule_merge_set ($3, @3); } |
| | rhs "%expect" INT_LITERAL |
| { grammar_current_rule_expect_sr ($3, @3); } |
| | rhs "%expect-rr" INT_LITERAL |
| { grammar_current_rule_expect_rr ($3, @3); } |
| ; |
| |
| named_ref.opt: /* An optional "[name]", NULL when absent. */ |
| %empty { $$ = NULL; } |
| | BRACKETED_ID { $$ = named_ref_new ($1, @1); } |
| ; |
| |
| |
| /*---------------------. |
| | variable and value. | |
| `---------------------*/ |
| |
| variable: |
| ID |
| ; |
| |
| /* Some content or empty by default. The value of a %define |
| variable: its text, and whether it was written as a keyword, as a |
| string, or as braced code. */ |
| %code requires { |
| #include "muscle-tab.h" |
| typedef struct |
| { |
| char const *chars; |
| muscle_kind kind; |
| } value_type; |
| }; |
| %type <value_type> value; |
| %printer |
| { |
| switch ($$.kind) |
| { |
| case muscle_code: fprintf (yyo, "{%s}", $$.chars); break; |
| case muscle_keyword: fprintf (yyo, "%s", $$.chars); break; |
| case muscle_string: fprintf (yyo, "\"%s\"", $$.chars); break; |
| } |
| } <value_type>; |
| |
| value: /* Strings are stored unquoted, and code without its braces. */ |
| %empty { $$.kind = muscle_keyword; $$.chars = ""; } |
| | ID { $$.kind = muscle_keyword; $$.chars = $1; } |
| | STRING { $$.kind = muscle_string; $$.chars = unquote ($1); gram_scanner_last_string_free ();} |
| | "{...}" { $$.kind = muscle_code; $$.chars = strip_braces ($1); gram_scanner_last_string_free (); } |
| ; |
| |
| |
| /*--------------. |
| | Identifiers. | |
| `--------------*/ |
| |
| /* Identifiers are returned as uniqstr values by the scanner. |
| Depending on their use, we may need to make them genuine symbols. */ |
| |
| id: |
| ID |
| { $$ = symbol_from_uniqstr ($1, @1); } |
| | CHAR_LITERAL |
| { /* A character literal is a token whose code is the character. It cannot be declared by %nterm (a syntax error is raised), nor be used when api.token.raw is defined (complained about, but parsing goes on). */ |
| const char *var = "api.token.raw"; |
| if (current_class == nterm_sym) |
| { |
| complain (&@1, complaint, |
| _("character literals cannot be nonterminals")); |
| YYERROR; |
| } |
| if (muscle_percent_define_ifdef (var)) |
| { |
| complain (&@1, complaint, |
| _("character literals cannot be used together" |
| " with %s"), var); |
| location loc = muscle_percent_define_get_loc (var); |
| subcomplain (&loc, complaint, _("definition of %s"), var); |
| } |
| $$ = symbol_get (char_name ($1), @1); |
| symbol_class_set ($$, token_sym, @1, false); |
| symbol_code_set ($$, $1, @1); |
| } |
| ; |
| |
| id_colon: |
| ID_COLON { $$ = symbol_from_uniqstr ($1, @1); } |
| ; |
| |
| |
| symbol: |
| id |
| | string_as_id |
| ; |
| |
| /* A string used as an ID. The symbol is named after the string as |
| it is spelled (quotes included, since $1 is not unquoted), and is a |
| token. */ |
| string_as_id: |
| STRING |
| { |
| $$ = symbol_get ($1, @1); |
| symbol_class_set ($$, token_sym, @1, false); |
| } |
| ; |
| |
| epilogue.opt: |
| %empty |
| | "%%" EPILOGUE |
| { |
| muscle_code_grow ("epilogue", translate_code ($2, @2, true), @2); |
| code_scanner_last_string_free (); |
| } |
| ; |
| |
| %% |
| |
| int |
| yyreport_syntax_error (const yypcontext_t *ctx) |
| { |
| int res = 0; |
| /* Arguments of format: reported tokens (one for the "unexpected", |
| one per "expected"). */ |
| enum { ARGS_MAX = 5 }; |
| const char *argv[ARGS_MAX]; |
| int argc = 0; |
| yysymbol_kind_t unexpected = yypcontext_token (ctx); |
| if (unexpected != YYSYMBOL_YYEMPTY) |
| { |
| argv[argc++] = yysymbol_name (unexpected); |
| yysymbol_kind_t expected[ARGS_MAX - 1]; |
| int nexpected = yypcontext_expected_tokens (ctx, expected, ARGS_MAX - 1); |
| if (nexpected < 0) |
| res = nexpected; |
| else |
| for (int i = 0; i < nexpected; ++i) |
| argv[argc++] = yysymbol_name (expected[i]); |
| } |
| syntax_error (*yypcontext_location (ctx), argc, argv); |
| return res; |
| } |
| |
| |
| /* Compute the location of a left-hand side from the locations |
|    RHS[1] ... RHS[N] of its right-hand side (RHS[0] is what comes |
|    before it).  The result ends where RHS[N] ends, and starts where |
|    the first non empty RHS[i] (1 <= i <= N) starts.  When there is no |
|    such RHS[i], in particular when N is 0, the result is the empty |
|    location at the end boundary of RHS[N].  */ |
| |
| static YYLTYPE |
| lloc_default (YYLTYPE const *rhs, int n) |
| { |
|   YYLTYPE res; |
| |
|   /* Keep two plain assignments: SGI MIPSpro 7.4.1m miscompiles the |
|      chained form "res.start = res.end = rhs[n].end;" (fixed in |
|      7.4.2m).  */ |
|   res.end = rhs[n].end; |
|   res.start = rhs[n].end; |
| |
|   /* Skip the empty symbols at the start of the right-hand side.  The |
|      ones at its end need no care: an empty symbol ends where its |
|      predecessor ends.  */ |
|   int first = 1; |
|   while (first <= n && equal_boundaries (rhs[first].start, rhs[first].end)) |
|     ++first; |
|   if (first <= n) |
|     res.start = rhs[first].start; |
| |
|   return res; |
| } |
| |
| /* Remove the braces around CODE, whose first and last characters |
|    must be '{' and '}'.  CODE is modified in place (its last character |
|    becomes the terminating NUL); the result points to its second |
|    character.  */ |
| static |
| char *strip_braces (char *code) |
| { |
|   size_t const len = strlen (code); |
|   code[len - 1] = '\0'; |
|   return &code[1]; |
| } |
| |
| /* Translate CODE, located at LOC, and return the result.  CODE is |
|    handled as plain code if PLAIN, as a symbol action otherwise.  The |
|    latest string of the scanner (expected to be CODE) is released.  */ |
| static |
| char const * |
| translate_code (char *code, location loc, bool plain) |
| { |
|   code_props props; |
|   if (!plain) |
|     code_props_symbol_action_init (&props, code, loc); |
|   else |
|     code_props_plain_init (&props, code, loc); |
|   code_props_translate_code (&props); |
| |
|   gram_scanner_last_string_free (); |
|   return props.code; |
| } |
| |
| /* Translate as plain code the contents of CODE, a braced code located |
|    at LOC: same as translate_code, once the braces are stripped.  */ |
| static |
| char const * |
| translate_code_braceless (char *code, location loc) |
| { |
|   char *contents = strip_braces (code); |
|   return translate_code (contents, loc, true); |
| } |
| |
| /* Register DECL, a braced formal argument located at LOC, as a |
|    lex-param and/or as a parse-param, according to TYPE. |
| |
|    The name of the argument is the last identifier found in DECL; it |
|    is an error if there is none.  DECL is modified in place (its |
|    braces, and the blanks just inside them, are stripped), and the |
|    latest string of the scanner is released.  */ |
| static void |
| add_param (param_type type, char *decl, location loc) |
| { |
|   /* The characters of identifiers; the digits come last because they |
|      cannot start one.  */ |
|   static char const ident_chars[26 + 26 + 1 + 10 + 1] = |
|     "abcdefghijklmnopqrstuvwxyz" |
|     "ABCDEFGHIJKLMNOPQRSTUVWXYZ" |
|     "_" |
|     "0123456789"; |
|   enum |
|     { |
|       IDENT_ANY = sizeof ident_chars - 1, |
|       IDENT_START = IDENT_ANY - 10 |
|     }; |
| |
|   /* Where the last identifier of DECL starts, if there is one.  */ |
|   char const *name_start = NULL; |
| |
|   /* Visit all the characters but the last one.  */ |
|   char *cursor = decl; |
|   while (cursor[1]) |
|     { |
|       bool const at_word_start |
|         = cursor == decl || ! memchr (ident_chars, cursor[-1], IDENT_ANY); |
|       if (at_word_start && memchr (ident_chars, cursor[0], IDENT_START)) |
|         name_start = cursor; |
|       ++cursor; |
|     } |
| |
|   /* CURSOR is on the closing brace: drop it, and the blanks before |
|      it...  */ |
|   --cursor; |
|   while (c_isspace ((unsigned char) *cursor)) |
|     --cursor; |
|   cursor[1] = '\0'; |
|   /* ... then skip the opening brace, and the blanks after it.  */ |
|   ++decl; |
|   while (c_isspace ((unsigned char) *decl)) |
|     ++decl; |
| |
|   if (name_start) |
|     { |
|       char *name = xmemdup0 (name_start, strspn (name_start, ident_chars)); |
|       if (type & param_lex) |
|         muscle_pair_list_grow ("lex_param", decl, name); |
|       if (type & param_parse) |
|         muscle_pair_list_grow ("parse_param", decl, name); |
|       free (name); |
|     } |
|   else |
|     complain (&loc, complaint, _("missing identifier in parameter declaration")); |
| |
|   gram_scanner_last_string_free (); |
| } |
| |
| |
| /* Handle a %header directive: request the generation of a header. |
|    VALUE, when not NULL, is the quoted name of that header: a copy of |
|    its unquoted form is stored in spec_header_file, and the latest |
|    string of the scanner is released.  */ |
| static void |
| handle_header (char const *value) |
| { |
|   header_flag = true; |
|   if (!value) |
|     return; |
| |
|   char *name = unquote (value); |
|   spec_header_file = xstrdup (name); |
|   gram_scanner_last_string_free (); |
|   unquote_free (name); |
| } |
| |
| |
| static void |
| handle_error_verbose (location const *loc, char const *directive) |
| { |
| bison_directive (loc, directive); |
| muscle_percent_define_insert (directive, *loc, muscle_keyword, "", |
| MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE); |
| } |
| |
| |
| /* Handle a %file-prefix directive.  LOC is the location of the whole |
|    directive, DIR_LOC that of its name, DIRECTIVE its spelling, and |
|    VALUE_QUOTED its quoted argument. |
| |
|    The first occurrence sets spec_file_prefix; the following ones are |
|    reported as duplicates.  An accepted occurrence that is not spelled |
|    "%file-prefix" is reported as deprecated.  */ |
| static void |
| handle_file_prefix (location const *loc, |
|                     location const *dir_loc, |
|                     char const *directive, char const *value_quoted) |
| { |
|   char *value = unquote (value_quoted); |
|   bison_directive (loc, directive); |
| |
|   if (!location_empty (spec_file_prefix_loc)) |
|     { |
|       /* Already given: complain only about the duplication.  */ |
|       duplicate_directive (directive, spec_file_prefix_loc, *loc); |
|       return; |
|     } |
| |
|   spec_file_prefix_loc = *loc; |
|   spec_file_prefix = value; |
| |
|   if (STRNEQ (directive, "%file-prefix")) |
|     deprecated_directive (dir_loc, directive, "%file-prefix"); |
| } |
| |
| /* Handle a %language directive located at LOC: select the language |
|    whose quoted name is LANG, with the priority of the grammar |
|    file.  */ |
| static void |
| handle_language (location const *loc, char const *lang) |
| { |
|   char *name = unquote (lang); |
|   language_argmatch (name, grammar_prio, *loc); |
| } |
| |
| |
| /* Handle a %name-prefix directive.  LOC is the location of the whole |
|    directive, DIRECTIVE its spelling, and VALUE_QUOTED its quoted |
|    argument. |
| |
|    The first occurrence sets spec_name_prefix, and is reported as |
|    deprecated in favor of "%define api.prefix {VALUE}".  The following |
|    ones are reported as duplicates of the first one.  */ |
| static void |
| handle_name_prefix (location const *loc, |
|                     char const *directive, char const *value_quoted) |
| { |
|   char *value = unquote (value_quoted); |
|   bison_directive (loc, directive); |
| |
|   /* The directive as shown in the diagnostics.  asnprintf uses the |
|      given buffer when it is large enough, and allocates otherwise: |
|      free the result only in the latter case.  */ |
|   char buf1[1024]; |
|   size_t len1 = sizeof (buf1); |
|   char *old = asnprintf (buf1, &len1, "%s\"%s\"", directive, value); |
|   if (!old) |
|     xalloc_die (); |
| |
|   if (location_empty (spec_name_prefix_loc)) |
|     { |
|       spec_name_prefix = value; |
|       spec_name_prefix_loc = *loc; |
| |
|       char buf2[1024]; |
|       size_t len2 = sizeof (buf2); |
|       char *new = asnprintf (buf2, &len2, "%%define api.prefix {%s}", value); |
|       if (!new) |
|         xalloc_die (); |
|       deprecated_directive (loc, old, new); |
|       if (new != buf2) |
|         free (new); |
|     } |
|   else |
|     /* Point to the previous %name-prefix, not to a %file-prefix.  */ |
|     duplicate_directive (old, spec_name_prefix_loc, *loc); |
| |
|   if (old != buf1) |
|     free (old); |
| } |
| |
| |
| /* Handle a %pure-parser directive, spelled DIRECTIVE and located at |
|    LOC: report it as deprecated in favor of "%define api.pure", and |
|    define api.pure with an empty keyword value.  */ |
| static void |
| handle_pure_parser (location const *loc, char const *directive) |
| { |
|   char const *const no_value = ""; |
| |
|   bison_directive (loc, directive); |
|   deprecated_directive (loc, directive, "%define api.pure"); |
|   muscle_percent_define_insert ("api.pure", *loc, |
|                                 muscle_keyword, no_value, |
|                                 MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE); |
| } |
| |
| |
| /* Handle a %require directive, whose quoted argument VERSION_QUOTED |
|    is located at LOC.  Set required_version (to 0 when the argument is |
|    not a valid version, which is complained about).  Complain and |
|    exit with EX_MISMATCH when the requirement exceeds the newest of |
|    api_version and PACKAGE_VERSION.  */ |
| static void |
| handle_require (location const *loc, char const *version_quoted) |
| { |
|   char *version = unquote (version_quoted); |
|   required_version = strversion_to_int (version); |
|   if (required_version != -1) |
|     { |
|       char const *have = |
|         strverscmp (api_version, PACKAGE_VERSION) > 0 |
|         ? api_version : PACKAGE_VERSION; |
|       if (strverscmp (version, have) > 0) |
|         { |
|           complain (loc, complaint, _("require bison %s, but have %s"), |
|                     version, have); |
|           exit (EX_MISMATCH); |
|         } |
|     } |
|   else |
|     { |
|       complain (loc, complaint, _("invalid version requirement: %s"), |
|                 version); |
|       required_version = 0; |
|     } |
|   unquote_free (version); |
|   gram_scanner_last_string_free (); |
| } |
| |
| /* Handle a %skeleton directive, whose quoted argument SKEL_QUOTED is |
|    located at LOC.  A skeleton name that contains a slash is taken |
|    relative to the directory of the grammar file: that directory is |
|    prepended, unless it is empty.  */ |
| static void |
| handle_skeleton (location const *loc, char const *skel_quoted) |
| { |
|   char const *skeleton_user = unquote (skel_quoted); |
|   if (strchr (skeleton_user, '/')) |
|     { |
|       /* The length of the directory part of grammar_file, without |
|          its trailing slashes.  */ |
|       size_t dir_length = strlen (grammar_file); |
|       for (; dir_length && grammar_file[dir_length - 1] != '/'; --dir_length) |
|         continue; |
|       for (; dir_length && grammar_file[dir_length - 1] == '/'; --dir_length) |
|         continue; |
| |
|       /* The directory, a slash, the name, and the final NUL.  */ |
|       size_t const user_size = strlen (skeleton_user) + 1; |
|       char *skeleton_build = xmalloc (dir_length + 1 + user_size); |
|       char *tail = skeleton_build; |
|       if (dir_length > 0) |
|         { |
|           memcpy (tail, grammar_file, dir_length); |
|           tail += dir_length; |
|           *tail++ = '/'; |
|         } |
|       memcpy (tail, skeleton_user, user_size); |
|       skeleton_user = uniqstr_new (skeleton_build); |
|       free (skeleton_build); |
|     } |
|   skeleton_arg (skeleton_user, grammar_prio, *loc); |
| } |
| |
| |
| /* Handle a %yacc directive located at LOC: enable the Yacc mode the |
|    first time, report a duplicate directive the following ones.  */ |
| static void |
| handle_yacc (location const *loc) |
| { |
|   char const *const directive = "%yacc"; |
|   bison_directive (loc, directive); |
|   if (!location_empty (yacc_loc)) |
|     duplicate_directive (directive, yacc_loc, *loc); |
|   else |
|     set_yacc (*loc); |
| } |
| |
| |
| /* The yyerror of this parser: issue MSG, verbatim, as a complaint |
|    located at LOC.  */ |
| static void |
| gram_error (location const *loc, char const *msg) |
| { |
|   char const *const format = "%s"; |
|   complain (loc, complaint, format, msg); |
| } |
| |
| /* Return a string that describes the character C as a character |
|    literal (e.g., 'a' -> "'a'").  The single quote is special-cased; |
|    the other characters are put between single quotes and passed to |
|    quotearg_style for escaping.  */ |
| static char const * |
| char_name (char c) |
| { |
|   if (c != '\'') |
|     { |
|       char literal[4] = { '\'', c, '\'', '\0' }; |
|       return quotearg_style (escape_quoting_style, literal); |
|     } |
|   return "'\\''"; |
| } |
| |
| /* Make SYM, located at LOC and possibly named REF, the current |
|    left-hand side.  When SYM is not NULL, LOC is also recorded as a |
|    location of SYM as a left-hand side.  */ |
| static void |
| current_lhs (symbol *sym, location loc, named_ref *ref) |
| { |
|   current_lhs_symbol = sym; |
|   current_lhs_loc = loc; |
|   if (sym != NULL) |
|     symbol_location_as_lhs_set (sym, loc); |
| |
|   /* The rules get their own deep copy of the named reference of their |
|      lhs: a single one in the grammar file may serve several rules, |
|      when they share their lhs thanks to "|".  So the copy kept here |
|      belongs to the parser only: release the previous one before |
|      storing the new one.  */ |
|   free (current_lhs_named_ref); |
|   current_lhs_named_ref = ref; |
| } |
| |
| /* Start using the class "value" on YYO, to style the semantic values |
|    in traces.  */ |
| static void |
| tron (FILE *yyo) |
| { |
|   char const *const style_class = "value"; |
|   begin_use_class (style_class, yyo); |
| } |
| |
| /* Stop using the class "value" on YYO: the counterpart of tron.  */ |
| static void |
| troff (FILE *yyo) |
| { |
|   char const *const style_class = "value"; |
|   end_use_class (style_class, yyo); |
| } |
| |
| |
| /*----------. |
| | Unquote. | |
| `----------*/ |
| |
| struct obstack obstack_for_unquote; /* Where unquote builds its results. */ |
| |
| void |
| parser_init (void) /* Set up the obstack: needed before unquote can grow it. */ |
| { |
| obstack_init (&obstack_for_unquote); |
| } |
| |
| void |
| parser_free (void) /* Free the obstack as a whole. */ |
| { |
| obstack_free (&obstack_for_unquote, 0); |
| } |
| |
| static void |
| unquote_free (char *last_string) /* Free LAST_STRING; NOTE(review): per the obstack documentation this also frees whatever was allocated on the obstack after it, hence "latest" in the prototype's comment. */ |
| { |
| obstack_free (&obstack_for_unquote, last_string); |
| } |
| |
| /* Interpret the quoted string CP (such as `"Hello, \"World\"\n\""`), |
|    and return the result, a NUL-terminated string built on |
|    obstack_for_unquote (release it with unquote_free, or with |
|    parser_free). |
| |
|    CP must start with a double quote, and its first unescaped double |
|    quote must be its last character: this is checked by assertions. |
| |
|    The escapes are decoded as in C: |
|    - the simple escapes: a, b, f, n, r, t, v, and the backslash, the |
|      double quote, the single quote and the question mark, which stand |
|      for themselves; |
|    - a backslash followed by up to three digits, read in base 8 (the |
|      second and third digits must be octal digits); |
|    - a backslash, x, and any number of hexadecimal digits. |
|    Any other escape is dropped.  */ |
| static char * |
| unquote (const char *cp) |
| { |
| #define GROW(Char) obstack_1grow (&obstack_for_unquote, Char) |
|   for (++cp; *cp && *cp != '"'; ++cp) |
|     { |
|       if (*cp != '\\') |
|         { |
|           GROW (*cp); |
|           continue; |
|         } |
| |
|       /* Skip the backslash, decode what follows.  */ |
|       ++cp; |
|       switch (*cp) |
|         { |
|         case '0': case '1': case '2': case '3': case '4': |
|         case '5': case '6': case '7': case '8': case '9': |
|           { |
|             int c = cp[0] - '0'; |
|             /* At most two more digits, octal ones only: in "\18", |
|                the 8 is a character of its own.  */ |
|             for (int i = 0; i < 2 && '0' <= cp[1] && cp[1] <= '7'; ++i) |
|               { |
|                 ++cp; |
|                 c = c * 8 + cp[0] - '0'; |
|               } |
|             GROW (c); |
|           } |
|           break; |
| |
|         case 'a': GROW ('\a'); break; |
|         case 'b': GROW ('\b'); break; |
|         case 'f': GROW ('\f'); break; |
|         case 'n': GROW ('\n'); break; |
|         case 'r': GROW ('\r'); break; |
|         case 't': GROW ('\t'); break; |
|         case 'v': GROW ('\v'); break; |
| |
|         /* These stand for themselves.  */ |
|         case '\\': case '"': case '\'': case '?': |
|           GROW (*cp); |
|           break; |
| |
|         case 'x': |
|           { |
|             int c = 0; |
|             while (c_isxdigit (cp[1])) |
|               { |
|                 ++cp; |
|                 /* 'A' and 'a' are worth 10, not 0.  */ |
|                 int digit = (c_isdigit (cp[0]) ? cp[0] - '0' |
|                              : c_isupper (cp[0]) ? cp[0] - 'A' + 10 |
|                              : cp[0] - 'a' + 10); |
|                 c = c * 16 + digit; |
|               } |
|             GROW (c); |
|           } |
|           break; |
| |
|         case '\0': |
|           /* A backslash at the very end: step back so that the loop |
|              stops on the NUL, and the assertion below fails, instead |
|              of reading past the end of CP.  */ |
|           --cp; |
|           break; |
|         } |
|     } |
|   assert (*cp == '"'); |
|   ++cp; |
|   assert (*cp == '\0'); |
| #undef GROW |
|   return obstack_finish0 (&obstack_for_unquote); |
| } |