src/parse-gram.y - platform/external/bison - Git at Google

 /* Bison Grammar Parser                             -*- C -*-

    Copyright (C) 2002-2015, 2018-2021 Free Software Foundation, Inc.

    This file is part of Bison, the GNU Compiler Compiler.

    This program is free software: you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation, either version 3 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program.  If not, see <https://www.gnu.org/licenses/>.  */

 %code requires
 {
   #include "symlist.h"
   #include "symtab.h"
 }

 %code provides
 {
   /* Initialize unquote.  */
   void parser_init (void);
   /* Deallocate storage for unquote.  */
   void parser_free (void);
 }

 %code top
 {
   /* On column 0 to please syntax-check.  */
 #include <config.h>
 }

 %code
 {
   #include "system.h"

   #include <c-ctype.h>
   #include <quotearg.h>
   #include <vasnprintf.h>
   #include <xmemdup0.h>

   #include "complain.h"
   #include "conflicts.h"
   #include "files.h"
   #include "getargs.h"
   #include "gram.h"
   #include "named-ref.h"
   #include "reader.h"
   #include "scan-code.h"
   #include "scan-gram.h"
   #include "strversion.h"

   /* Pretend to be at least that version, to check features published
      in that version while developping it.  */
   static const char* api_version = "3.8";

   static int current_prec = 0;
   static location current_lhs_loc;
   static named_ref *current_lhs_named_ref;
   static symbol *current_lhs_symbol;
   static symbol_class current_class = unknown_sym;

   /** Set the new current left-hand side symbol, possibly common
    * to several right-hand side parts of rule.
    */
   static void current_lhs (symbol *sym, location loc, named_ref *ref);

   #define YYLLOC_DEFAULT(Current, Rhs, N)         \
     (Current) = lloc_default (Rhs, N)
   static YYLTYPE lloc_default (YYLTYPE const *, int);

   #define YY_LOCATION_PRINT(File, Loc)            \
     location_print (Loc, File)

   /* Strip initial '{' and final '}' (must be first and last characters).
      Return the result.  */
   static char *strip_braces (char *code);

   /* Convert CODE by calling code_props_plain_init if PLAIN, otherwise
      code_props_symbol_action_init.  Calls
      gram_scanner_last_string_free to release the latest string from
      the scanner (should be CODE). */
   static char const *translate_code (char *code, location loc, bool plain);

   /* Convert CODE by calling code_props_plain_init after having
      stripped the first and last characters (expected to be '{', and
      '}').  Calls gram_scanner_last_string_free to release the latest
      string from the scanner (should be CODE). */
   static char const *translate_code_braceless (char *code, location loc);

   /* Handle a %header directive.  */
   static void handle_header (char const *value);

   /* Handle a %error-verbose directive.  */
   static void handle_error_verbose (location const *loc, char const *directive);

   /* Handle a %file-prefix directive.  */
   static void handle_file_prefix (location const *loc,
                                   location const *dir_loc,
                                   char const *directive, char const *value);

   /* Handle a %language directive.  */
   static void handle_language (location const *loc, char const *lang);

   /* Handle a %name-prefix directive.  */
   static void handle_name_prefix (location const *loc,
                                   char const *directive, char const *value);

   /* Handle a %pure-parser directive.  */
   static void handle_pure_parser (location const *loc, char const *directive);

   /* Handle a %require directive.  */
   static void handle_require (location const *loc, char const *version);

   /* Handle a %skeleton directive.  */
   static void handle_skeleton (location const *loc, char const *skel);

   /* Handle a %yacc directive.  */
   static void handle_yacc (location const *loc);

   /* Implementation of yyerror.  */
   static void gram_error (location const *, char const *);

   /* A string that describes a char (e.g., 'a' -> "'a'").  */
   static char const *char_name (char);

   /* Add style to semantic values in traces.  */
   static void tron (FILE *yyo);
   static void troff (FILE *yyo);

   /* Interpret a quoted string (such as `"Hello, \"World\"\n\""`).
      Manages the memory of the result.  */
   static char *unquote (const char *str);

   /* Discard the latest unquoted string.  */
   static void unquote_free (char *last_string);
 }

 %define api.header.include {"parse-gram.h"}
 %define api.prefix {gram_}
 %define api.pure full
 %define api.token.raw
 %define api.value.type union
 %define locations
 %define parse.error custom
 %define parse.lac full
 %define parse.trace
 %header
 %expect 0
 %verbose

 %initial-action
 {
   /* Bison's grammar can initial empty locations, hence a default
      location is needed. */
   boundary_set (&@$.start, grammar_file, 1, 1, 1);
   boundary_set (&@$.end, grammar_file, 1, 1, 1);
 }

 %token
   STRING              _("string")
   TSTRING             _("translatable string")

   PERCENT_TOKEN       "%token"
   PERCENT_NTERM       "%nterm"

   PERCENT_TYPE        "%type"
   PERCENT_DESTRUCTOR  "%destructor"
   PERCENT_PRINTER     "%printer"

   PERCENT_LEFT        "%left"
   PERCENT_RIGHT       "%right"
   PERCENT_NONASSOC    "%nonassoc"
   PERCENT_PRECEDENCE  "%precedence"

   PERCENT_PREC        "%prec"
   PERCENT_DPREC       "%dprec"
   PERCENT_MERGE       "%merge"

   PERCENT_CODE            "%code"
   PERCENT_DEFAULT_PREC    "%default-prec"
   PERCENT_DEFINE          "%define"
   PERCENT_ERROR_VERBOSE   "%error-verbose"
   PERCENT_EXPECT          "%expect"
   PERCENT_EXPECT_RR       "%expect-rr"
   PERCENT_FILE_PREFIX     "%file-prefix"
   PERCENT_FLAG            "%<flag>"
   PERCENT_GLR_PARSER      "%glr-parser"
   PERCENT_HEADER          "%header"
   PERCENT_INITIAL_ACTION  "%initial-action"
   PERCENT_LANGUAGE        "%language"
   PERCENT_NAME_PREFIX     "%name-prefix"
   PERCENT_NO_DEFAULT_PREC "%no-default-prec"
   PERCENT_NO_LINES        "%no-lines"
   PERCENT_NONDETERMINISTIC_PARSER "%nondeterministic-parser"
   PERCENT_OUTPUT          "%output"
   PERCENT_PURE_PARSER     "%pure-parser"
   PERCENT_REQUIRE         "%require"
   PERCENT_SKELETON        "%skeleton"
   PERCENT_START           "%start"
   PERCENT_TOKEN_TABLE     "%token-table"
   PERCENT_VERBOSE         "%verbose"
   PERCENT_YACC            "%yacc"

   BRACED_CODE       "{...}"
   BRACED_PREDICATE  "%?{...}"
   BRACKETED_ID      _("[identifier]")
   CHAR_LITERAL      _("character literal")
   COLON             ":"
   EPILOGUE          _("epilogue")
   EQUAL             "="
   ID                _("identifier")
   ID_COLON          _("identifier:")
   PERCENT_PERCENT   "%%"
   PIPE              "|"
   PROLOGUE          "%{...%}"
   SEMICOLON         ";"
   TAG               _("<tag>")
   TAG_ANY           "<*>"
   TAG_NONE          "<>"

  /* Experimental feature, don't rely on it.  */
 %code pre-printer  {tron (yyo);}
 %code post-printer {troff (yyo);}

 %type <unsigned char> CHAR_LITERAL
 %printer { fputs (char_name ($$), yyo); } <unsigned char>

 %type <char*> "{...}" "%?{...}" "%{...%}" EPILOGUE STRING TSTRING
 %printer { fputs ($$, yyo); } <char*>

 %type <uniqstr>
   BRACKETED_ID ID ID_COLON
   PERCENT_ERROR_VERBOSE PERCENT_FILE_PREFIX PERCENT_FLAG PERCENT_NAME_PREFIX
   PERCENT_PURE_PARSER
   TAG tag tag.opt variable
 %printer { fputs ($$, yyo); } <uniqstr>
 %printer { fprintf (yyo, "[%s]", $$); } BRACKETED_ID
 %printer { fprintf (yyo, "%s:", $$); } ID_COLON
 %printer { fprintf (yyo, "%%%s", $$); } PERCENT_FLAG
 %printer { fprintf (yyo, "<%s>", $$); } TAG tag

 %token <int> INT_LITERAL _("integer literal")
 %printer { fprintf (yyo, "%d", $$); } <int>

 %type <symbol*> id id_colon string_as_id symbol token_decl token_decl_for_prec
 %printer { fprintf (yyo, "%s", $$ ? $$->tag : "<NULL>"); } <symbol*>
 %printer { fprintf (yyo, "%s:", $$->tag); } id_colon

 %type <assoc> precedence_declarator

 %destructor { symbol_list_free ($$); } <symbol_list*>
 %printer { symbol_list_syms_print ($$, yyo); } <symbol_list*>

 %type <named_ref*> named_ref.opt

 /*---------.
 | %param.  |
 `---------*/
 %code requires
 {
   typedef enum
   {
     param_none   = 0,
     param_lex    = 1 << 0,
     param_parse  = 1 << 1,
     param_both   = param_lex | param_parse
   } param_type;
 };
 %code
 {
   /** Add a lex-param and/or a parse-param.
    *
    * \param type  where to push this formal argument.
    * \param decl  the formal argument.  Destroyed.
    * \param loc   the location in the source.
    */
   static void add_param (param_type type, char *decl, location loc);
   static param_type current_param = param_none;
 };
 %token <param_type> PERCENT_PARAM "%param";
 %printer
 {
   switch ($$)
     {
 #define CASE(In, Out)                                           \
       case param_ ## In: fputs ("%" #Out, yyo); break
       CASE (lex,   lex-param);
       CASE (parse, parse-param);
       CASE (both,  param);
 #undef CASE
       case param_none: aver (false); break;
     }
 } <param_type>;


                      /*==========\
                      | Grammar.  |
                      \==========*/
 %%

 input:
   prologue_declarations "%%" grammar epilogue.opt
 ;


         /*------------------------------------.
         | Declarations: before the first %%.  |
         `------------------------------------*/

 prologue_declarations:
   %empty
 | prologue_declarations prologue_declaration
 ;

 prologue_declaration:
   grammar_declaration
 | "%{...%}"
     {
       muscle_code_grow (union_seen ? "post_prologue" : "pre_prologue",
                         translate_code ($1, @1, true), @1);
       code_scanner_last_string_free ();
     }
 | "%<flag>"
     {
       muscle_percent_define_ensure ($1, @1, true);
     }
 | "%define" variable value
     {
       muscle_percent_define_insert ($2, @$, $3.kind, $3.chars,
                                     MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE);
     }
 | "%header" string.opt             { handle_header ($2); }
 | "%error-verbose"                 { handle_error_verbose (&@$, $1); }
 | "%expect" INT_LITERAL            { expected_sr_conflicts = $2; }
 | "%expect-rr" INT_LITERAL         { expected_rr_conflicts = $2; }
 | "%file-prefix" STRING            { handle_file_prefix (&@$, &@1, $1, $2); }
 | "%glr-parser"
     {
       nondeterministic_parser = true;
       glr_parser = true;
     }
 | "%initial-action" "{...}"
     {
       muscle_code_grow ("initial_action", translate_code ($2, @2, false), @2);
       code_scanner_last_string_free ();
     }
 | "%language" STRING            { handle_language (&@1, $2); }
 | "%name-prefix" STRING         { handle_name_prefix (&@$, $1, $2); }
 | "%no-lines"                   { no_lines_flag = true; }
 | "%nondeterministic-parser"    { nondeterministic_parser = true; }
 | "%output" STRING              { spec_outfile = unquote ($2); gram_scanner_last_string_free (); }
 | "%param" { current_param = $1; } params { current_param = param_none; }
 | "%pure-parser"                { handle_pure_parser (&@$, $1); }
 | "%require" STRING             { handle_require (&@2, $2); }
 | "%skeleton" STRING            { handle_skeleton (&@2, $2); }
 | "%token-table"                { token_table_flag = true; }
 | "%verbose"                    { report_flag |= report_states; }
 | "%yacc"                       { handle_yacc (&@$); }
 | error ";"                     { current_class = unknown_sym; yyerrok; }
 | /*FIXME: Err?  What is this horror doing here? */ ";"
 ;

 params:
    params "{...}"  { add_param (current_param, $2, @2); }
 | "{...}"          { add_param (current_param, $1, @1); }
 ;


 /*----------------------.
 | grammar_declaration.  |
 `----------------------*/

 grammar_declaration:
   symbol_declaration
 | "%start" symbols.1
     {
       grammar_start_symbols_add ($2);
     }
 | code_props_type "{...}" generic_symlist
     {
       code_props code;
       code_props_symbol_action_init (&code, $2, @2);
       code_props_translate_code (&code);
       {
         for (symbol_list *list = $3; list; list = list->next)
           symbol_list_code_props_set (list, $1, &code);
         symbol_list_free ($3);
       }
     }
 | "%default-prec"
     {
       default_prec = true;
     }
 | "%no-default-prec"
     {
       default_prec = false;
     }
 | "%code" "{...}"
     {
       /* Do not invoke muscle_percent_code_grow here since it invokes
          muscle_user_name_list_grow.  */
       muscle_code_grow ("percent_code()",
                         translate_code_braceless ($2, @2), @2);
       code_scanner_last_string_free ();
     }
 | "%code" ID "{...}"
     {
       muscle_percent_code_grow ($2, @2, translate_code_braceless ($3, @3), @3);
       code_scanner_last_string_free ();
     }
 ;

 %type <code_props_type> code_props_type;
 %printer { fprintf (yyo, "%s", code_props_type_string ($$)); } <code_props_type>;
 code_props_type:
   "%destructor"  { $$ = destructor; }
 | "%printer"     { $$ = printer; }
 ;

 /*---------.
 | %union.  |
 `---------*/

 %token PERCENT_UNION "%union";

 union_name:
   %empty {}
 | ID     { muscle_percent_define_insert ("api.value.union.name",
                                          @1, muscle_keyword, $1,
                                          MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE); }
 ;

 grammar_declaration:
   "%union" union_name "{...}"
     {
       union_seen = true;
       muscle_code_grow ("union_members", translate_code_braceless ($3, @3), @3);
       code_scanner_last_string_free ();
     }
 ;


 %type <symbol_list*> nterm_decls symbol_decls symbols.1
       token_decls token_decls_for_prec
       token_decl.1 token_decl_for_prec.1;
 symbol_declaration:
   "%nterm" { current_class = nterm_sym; } nterm_decls[syms]
     {
       current_class = unknown_sym;
       symbol_list_free ($syms);
     }
 | "%token" { current_class = token_sym; } token_decls[syms]
     {
       current_class = unknown_sym;
       symbol_list_free ($syms);
     }
 | "%type" { current_class = pct_type_sym; } symbol_decls[syms]
     {
       current_class = unknown_sym;
       symbol_list_free ($syms);
     }
 | precedence_declarator token_decls_for_prec[syms]
     {
       ++current_prec;
       for (symbol_list *list = $syms; list; list = list->next)
         symbol_precedence_set (list->content.sym, current_prec, $1, @1);
       symbol_list_free ($syms);
     }
 ;

 precedence_declarator:
   "%left"       { $$ = left_assoc; }
 | "%right"      { $$ = right_assoc; }
 | "%nonassoc"   { $$ = non_assoc; }
 | "%precedence" { $$ = precedence_assoc; }
 ;

 %type <char*> string.opt;
 string.opt:
   %empty  { $$ = NULL; }
 | STRING  { $$ = $1; }
 ;

 tag.opt:
   %empty { $$ = NULL; }
 | TAG    { $$ = $1; }
 ;

 %type <symbol_list*> generic_symlist generic_symlist_item;
 generic_symlist:
   generic_symlist_item
 | generic_symlist generic_symlist_item   { $$ = symbol_list_append ($1, $2); }
 ;

 generic_symlist_item:
   symbol    { $$ = symbol_list_sym_new ($1, @1); }
 | tag       { $$ = symbol_list_type_new ($1, @1); }
 ;

 tag:
   TAG
 | "<*>" { $$ = uniqstr_new ("*"); }
 | "<>"  { $$ = uniqstr_new (""); }
 ;

 /*-----------------------.
 | nterm_decls (%nterm).  |
 `-----------------------*/

 // A non empty list of possibly tagged symbols for %nterm.
 //
 // Can easily be defined like symbol_decls but restricted to ID, but
 // using token_decls allows to reduce the number of rules, and also to
 // make nicer error messages on "%nterm 'a'" or '%nterm FOO "foo"'.
 nterm_decls:
   token_decls
 ;

 /*-----------------------------------.
 | token_decls (%token, and %nterm).  |
 `-----------------------------------*/

 // A non empty list of possibly tagged symbols for %token or %nterm.
 token_decls:
   token_decl.1[syms]
     {
       $$ = $syms;
     }
 | TAG token_decl.1[syms]
     {
       $$ = symbol_list_type_set ($syms, $TAG);
     }
 | token_decls TAG token_decl.1[syms]
     {
       $$ = symbol_list_append ($1, symbol_list_type_set ($syms, $TAG));
     }
 ;

 // One or more symbol declarations for %token or %nterm.
 token_decl.1:
   token_decl                { $$ = symbol_list_sym_new ($1, @1); }
 | token_decl.1 token_decl   { $$ = symbol_list_append ($1, symbol_list_sym_new ($2, @2)); }

 // One symbol declaration for %token or %nterm.
 token_decl:
   id int.opt[num] alias
     {
       $$ = $id;
       symbol_class_set ($id, current_class, @id, true);
       if (0 <= $num)
         symbol_code_set ($id, $num, @num);
       if ($alias)
         symbol_make_alias ($id, $alias, @alias);
     }
 ;

 %type <int> int.opt;
 int.opt:
   %empty  { $$ = -1; }
 | INT_LITERAL
 ;

 %type <symbol*> alias;
 alias:
   %empty         { $$ = NULL; }
 | string_as_id   { $$ = $1; }
 | TSTRING
     {
       $$ = symbol_get ($1, @1);
       symbol_class_set ($$, token_sym, @1, false);
       $$->translatable = true;
     }
 ;


 /*-------------------------------------.
 | token_decls_for_prec (%left, etc.).  |
 `-------------------------------------*/

 // A non empty list of possibly tagged tokens for precedence declaration.
 //
 // Similar to %token (token_decls), but in '%left FOO 1 "foo"', it treats
 // FOO and "foo" as two different symbols instead of aliasing them.
 token_decls_for_prec:
   token_decl_for_prec.1[syms]
     {
       $$ = $syms;
     }
 | TAG token_decl_for_prec.1[syms]
     {
       $$ = symbol_list_type_set ($syms, $TAG);
     }
 | token_decls_for_prec TAG token_decl_for_prec.1[syms]
     {
       $$ = symbol_list_append ($1, symbol_list_type_set ($syms, $TAG));
     }
 ;

 // One or more token declarations for precedence declaration.
 token_decl_for_prec.1:
   token_decl_for_prec
     { $$ = symbol_list_sym_new ($1, @1); }
 | token_decl_for_prec.1 token_decl_for_prec
     { $$ = symbol_list_append ($1, symbol_list_sym_new ($2, @2)); }

 // One token declaration for precedence declaration.
 token_decl_for_prec:
   id int.opt[num]
     {
       $$ = $id;
       symbol_class_set ($id, token_sym, @id, false);
       if (0 <= $num)
         symbol_code_set ($id, $num, @num);
     }
 | string_as_id
 ;


 /*-----------------------------------.
 | symbol_decls (argument of %type).  |
 `-----------------------------------*/

 // A non empty list of typed symbols (for %type).
 symbol_decls:
   symbols.1[syms]
     {
       $$ = $syms;
     }
 | TAG symbols.1[syms]
     {
       $$ = symbol_list_type_set ($syms, $TAG);
     }
 | symbol_decls TAG symbols.1[syms]
     {
       $$ = symbol_list_append ($1, symbol_list_type_set ($syms, $TAG));
     }
 ;

 // One or more symbols.
 symbols.1:
   symbol
     {
       if (current_class != unknown_sym)
         symbol_class_set ($symbol, current_class, @symbol, false);
       $$ = symbol_list_sym_new ($symbol, @symbol);
     }
   | symbols.1 symbol
     {
       if (current_class != unknown_sym)
         symbol_class_set ($symbol, current_class, @symbol, false);
       $$ = symbol_list_append ($1, symbol_list_sym_new ($symbol, @symbol));
     }
 ;

         /*------------------------------------------.
         | The grammar section: between the two %%.  |
         `------------------------------------------*/

 grammar:
   rules_or_grammar_declaration
 | grammar rules_or_grammar_declaration
 ;

 /* As a Bison extension, one can use the grammar declarations in the
    body of the grammar.  */
 rules_or_grammar_declaration:
   rules
 | grammar_declaration ";"
 | error ";"
     {
       yyerrok;
     }
 ;

 rules:
   id_colon named_ref.opt { current_lhs ($1, @1, $2); } ":" rhses.1
     {
       /* Free the current lhs. */
       current_lhs (0, @1, 0);
     }
 ;

 rhses.1:
   rhs                { grammar_current_rule_end (@rhs); }
 | rhses.1 "|" rhs    { grammar_current_rule_end (@rhs); }
 | rhses.1 ";"
 ;

 %token PERCENT_EMPTY "%empty";
 rhs:
   %empty
     { grammar_current_rule_begin (current_lhs_symbol, current_lhs_loc,
                                   current_lhs_named_ref); }
 | rhs symbol named_ref.opt
     { grammar_current_rule_symbol_append ($2, @2, $3); }
 | rhs tag.opt "{...}"[action] named_ref.opt[name]
     { grammar_current_rule_action_append ($action, @action, $name, $[tag.opt]); }
 | rhs "%?{...}"
     { grammar_current_rule_predicate_append ($2, @2); }
 | rhs "%empty"
     { grammar_current_rule_empty_set (@2); }
 | rhs "%prec" symbol
     { grammar_current_rule_prec_set ($3, @3); }
 | rhs "%dprec" INT_LITERAL
     { grammar_current_rule_dprec_set ($3, @3); }
 | rhs "%merge" TAG
     { grammar_current_rule_merge_set ($3, @3); }
 | rhs "%expect" INT_LITERAL
     { grammar_current_rule_expect_sr ($3, @3); }
 | rhs "%expect-rr" INT_LITERAL
     { grammar_current_rule_expect_rr ($3, @3); }
 ;

 named_ref.opt:
   %empty         { $$ = NULL; }
 | BRACKETED_ID   { $$ = named_ref_new ($1, @1); }
 ;


 /*---------------------.
 | variable and value.  |
 `---------------------*/

 variable:
   ID
 ;

 /* Some content or empty by default. */
 %code requires {
   #include "muscle-tab.h"
   typedef struct
   {
     char const *chars;
     muscle_kind kind;
   } value_type;
 };
 %type <value_type> value;
 %printer
 {
   switch ($$.kind)
     {
     case muscle_code:    fprintf (yyo,  "{%s}",  $$.chars); break;
     case muscle_keyword: fprintf (yyo,   "%s",   $$.chars); break;
     case muscle_string:  fprintf (yyo, "\"%s\"", $$.chars); break;
     }
 } <value_type>;

 value:
   %empty  { $$.kind = muscle_keyword; $$.chars = ""; }
 | ID      { $$.kind = muscle_keyword; $$.chars = $1; }
 | STRING  { $$.kind = muscle_string;  $$.chars = unquote ($1); gram_scanner_last_string_free ();}
 | "{...}" { $$.kind = muscle_code;    $$.chars = strip_braces ($1); gram_scanner_last_string_free (); }
 ;


 /*--------------.
 | Identifiers.  |
 `--------------*/

 /* Identifiers are returned as uniqstr values by the scanner.
    Depending on their use, we may need to make them genuine symbols.  */

 id:
   ID
     { $$ = symbol_from_uniqstr ($1, @1); }
 | CHAR_LITERAL
     {
       const char *var = "api.token.raw";
       if (current_class == nterm_sym)
         {
           complain (&@1, complaint,
                     _("character literals cannot be nonterminals"));
           YYERROR;
         }
       if (muscle_percent_define_ifdef (var))
         {
           complain (&@1, complaint,
                     _("character literals cannot be used together"
                     " with %s"), var);
           location loc = muscle_percent_define_get_loc (var);
           subcomplain (&loc, complaint, _("definition of %s"), var);
         }
       $$ = symbol_get (char_name ($1), @1);
       symbol_class_set ($$, token_sym, @1, false);
       symbol_code_set ($$, $1, @1);
     }
 ;

 id_colon:
   ID_COLON { $$ = symbol_from_uniqstr ($1, @1); }
 ;


 symbol:
   id
 | string_as_id
 ;

 /* A string used as an ID.  */
 string_as_id:
   STRING
     {
       $$ = symbol_get ($1, @1);
       symbol_class_set ($$, token_sym, @1, false);
     }
 ;

 epilogue.opt:
   %empty
 | "%%" EPILOGUE
     {
       muscle_code_grow ("epilogue", translate_code ($2, @2, true), @2);
       code_scanner_last_string_free ();
     }
 ;

 %%

 int
 yyreport_syntax_error (const yypcontext_t *ctx)
 {
   int res = 0;
   /* Arguments of format: reported tokens (one for the "unexpected",
      one per "expected"). */
   enum { ARGS_MAX = 5 };
   const char *argv[ARGS_MAX];
   int argc = 0;
   yysymbol_kind_t unexpected = yypcontext_token (ctx);
   if (unexpected != YYSYMBOL_YYEMPTY)
     {
       argv[argc++] = yysymbol_name (unexpected);
       yysymbol_kind_t expected[ARGS_MAX - 1];
       int nexpected = yypcontext_expected_tokens (ctx, expected, ARGS_MAX - 1);
       if (nexpected < 0)
         res = nexpected;
       else
         for (int i = 0; i < nexpected; ++i)
           argv[argc++] = yysymbol_name (expected[i]);
     }
   syntax_error (*yypcontext_location (ctx), argc, argv);
   return res;
 }


 /* Return the location of the left-hand side of a rule whose
    right-hand side is RHS[1] ... RHS[N].  Ignore empty nonterminals in
    the right-hand side, and return an empty location equal to the end
    boundary of RHS[0] if the right-hand side is empty.  */

 static YYLTYPE
 lloc_default (YYLTYPE const *rhs, int n)
 {
   YYLTYPE loc;

   /* SGI MIPSpro 7.4.1m miscompiles "loc.start = loc.end = rhs[n].end;".
      The bug is fixed in 7.4.2m, but play it safe for now.  */
   loc.start = rhs[n].end;
   loc.end = rhs[n].end;

   /* Ignore empty nonterminals the start of the right-hand side.
      Do not bother to ignore them at the end of the right-hand side,
      since empty nonterminals have the same end as their predecessors.  */
   for (int i = 1; i <= n; i++)
     if (! equal_boundaries (rhs[i].start, rhs[i].end))
       {
         loc.start = rhs[i].start;
         break;
       }

   return loc;
 }

 static
 char *strip_braces (char *code)
 {
   code[strlen (code) - 1] = 0;
   return code + 1;
 }

 static
 char const *
 translate_code (char *code, location loc, bool plain)
 {
   code_props plain_code;
   if (plain)
     code_props_plain_init (&plain_code, code, loc);
   else
     code_props_symbol_action_init (&plain_code, code, loc);
   code_props_translate_code (&plain_code);
   gram_scanner_last_string_free ();
   return plain_code.code;
 }

 static
 char const *
 translate_code_braceless (char *code, location loc)
 {
   return translate_code (strip_braces (code), loc, true);
 }

 static void
 add_param (param_type type, char *decl, location loc)
 {
   static char const alphanum[26 + 26 + 1 + 10 + 1] =
     "abcdefghijklmnopqrstuvwxyz"
     "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
     "_"
     "0123456789";

   char const *name_start = NULL;
   {
     char *p;
     /* Stop on last actual character.  */
     for (p = decl; p[1]; p++)
       if ((p == decl
            || ! memchr (alphanum, p[-1], sizeof alphanum - 1))
           && memchr (alphanum, p[0], sizeof alphanum - 10 - 1))
         name_start = p;

     /* Strip the surrounding '{' and '}', and any blanks just inside
        the braces.  */
     --p;
     while (c_isspace ((unsigned char) *p))
       --p;
     p[1] = '\0';
     ++decl;
     while (c_isspace ((unsigned char) *decl))
       ++decl;
   }

   if (! name_start)
     complain (&loc, complaint, _("missing identifier in parameter declaration"));
   else
     {
       char *name = xmemdup0 (name_start, strspn (name_start, alphanum));
       if (type & param_lex)
         muscle_pair_list_grow ("lex_param", decl, name);
       if (type & param_parse)
         muscle_pair_list_grow ("parse_param", decl, name);
       free (name);
     }

   gram_scanner_last_string_free ();
 }


 static void
 handle_header (char const *value)
 {
   header_flag = true;
   if (value)
     {
       char *file = unquote (value);
       spec_header_file = xstrdup (file);
       gram_scanner_last_string_free ();
       unquote_free (file);
     }
 }


 static void
 handle_error_verbose (location const *loc, char const *directive)
 {
   bison_directive (loc, directive);
   muscle_percent_define_insert (directive, *loc, muscle_keyword, "",
                                 MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE);
 }


 static void
 handle_file_prefix (location const *loc,
                     location const *dir_loc,
                     char const *directive, char const *value_quoted)
 {
   char *value = unquote (value_quoted);
   bison_directive (loc, directive);
   bool warned = false;

   if (location_empty (spec_file_prefix_loc))
     {
       spec_file_prefix_loc = *loc;
       spec_file_prefix = value;
     }
   else
     {
       duplicate_directive (directive, spec_file_prefix_loc, *loc);
       warned = true;
     }

   if (!warned
       && STRNEQ (directive, "%file-prefix"))
     deprecated_directive (dir_loc, directive, "%file-prefix");
 }

 static void
 handle_language (location const *loc, char const *lang)
 {
   language_argmatch (unquote (lang), grammar_prio, *loc);
 }


 static void
 handle_name_prefix (location const *loc,
                     char const *directive, char const *value_quoted)
 {
   char *value = unquote (value_quoted);
   bison_directive (loc, directive);

   char buf1[1024];
   size_t len1 = sizeof (buf1);
   char *old = asnprintf (buf1, &len1, "%s\"%s\"", directive, value);
   if (!old)
     xalloc_die ();

   if (location_empty (spec_name_prefix_loc))
     {
       spec_name_prefix = value;
       spec_name_prefix_loc = *loc;

       char buf2[1024];
       size_t len2 = sizeof (buf2);
       char *new = asnprintf (buf2, &len2, "%%define api.prefix {%s}", value);
       if (!new)
         xalloc_die ();
       deprecated_directive (loc, old, new);
       if (new != buf2)
         free (new);
     }
   else
     duplicate_directive (old, spec_file_prefix_loc, *loc);

   if (old != buf1)
     free (old);
 }


 static void
 handle_pure_parser (location const *loc, char const *directive)
 {
   bison_directive (loc, directive);
   deprecated_directive (loc, directive, "%define api.pure");
   muscle_percent_define_insert ("api.pure", *loc, muscle_keyword, "",
                                 MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE);
 }


 static void
 handle_require (location const *loc, char const *version_quoted)
 {
   char *version = unquote (version_quoted);
   required_version = strversion_to_int (version);
   if (required_version == -1)
     {
       complain (loc, complaint, _("invalid version requirement: %s"),
                 version);
       required_version = 0;
     }
   else
     {
       const char* package_version =
         0 < strverscmp (api_version, PACKAGE_VERSION)
         ? api_version : PACKAGE_VERSION;
       if (0 < strverscmp (version, package_version))
         {
           complain (loc, complaint, _("require bison %s, but have %s"),
                     version, package_version);
           exit (EX_MISMATCH);
         }
     }
   unquote_free (version);
   gram_scanner_last_string_free ();
 }

 static void
 handle_skeleton (location const *loc, char const *skel_quoted)
 {
   char *skel = unquote (skel_quoted);
   char const *skeleton_user = skel;
   if (strchr (skeleton_user, '/'))
     {
       size_t dir_length = strlen (grammar_file);
       while (dir_length && grammar_file[dir_length - 1] != '/')
         --dir_length;
       while (dir_length && grammar_file[dir_length - 1] == '/')
         --dir_length;
       char *skeleton_build =
         xmalloc (dir_length + 1 + strlen (skeleton_user) + 1);
       if (dir_length > 0)
         {
           memcpy (skeleton_build, grammar_file, dir_length);
           skeleton_build[dir_length++] = '/';
         }
       strcpy (skeleton_build + dir_length, skeleton_user);
       skeleton_user = uniqstr_new (skeleton_build);
       free (skeleton_build);
     }
   skeleton_arg (skeleton_user, grammar_prio, *loc);
 }


 static void
 handle_yacc (location const *loc)
 {
   const char *directive = "%yacc";
   bison_directive (loc, directive);
   if (location_empty (yacc_loc))
     set_yacc (*loc);
   else
     duplicate_directive (directive, yacc_loc, *loc);
 }


 static void
 gram_error (location const *loc, char const *msg)
 {
   complain (loc, complaint, "%s", msg);
 }

 static char const *
 char_name (char c)
 {
   if (c == '\'')
     return "'\\''";
   else
     {
       char buf[4];
       buf[0] = '\''; buf[1] = c; buf[2] = '\''; buf[3] = '\0';
       return quotearg_style (escape_quoting_style, buf);
     }
 }

 static void
 current_lhs (symbol *sym, location loc, named_ref *ref)
 {
   current_lhs_symbol = sym;
   current_lhs_loc = loc;
   if (sym)
     symbol_location_as_lhs_set (sym, loc);
   /* In order to simplify memory management, named references for lhs
      are always assigned by deep copy into the current symbol_list
      node.  This is because a single named-ref in the grammar may
      result in several uses when the user factors lhs between several
      rules using "|".  Therefore free the parser's original copy.  */
   free (current_lhs_named_ref);
   current_lhs_named_ref = ref;
 }

 static void tron (FILE *yyo)
 {
   begin_use_class ("value", yyo);
 }

 static void troff (FILE *yyo)
 {
   end_use_class ("value", yyo);
 }


 /*----------.
 | Unquote.  |
 `----------*/

 struct obstack obstack_for_unquote;

 void
 parser_init (void)
 {
   obstack_init (&obstack_for_unquote);
 }

 void
 parser_free (void)
 {
   obstack_free (&obstack_for_unquote, 0);
 }

 static void
 unquote_free (char *last_string)
 {
   obstack_free (&obstack_for_unquote, last_string);
 }

 static char *
 unquote (const char *cp)
 {
 #define GROW(Char)                              \
   obstack_1grow (&obstack_for_unquote, Char);
   for (++cp; *cp && *cp != '"'; ++cp)
     switch (*cp)
       {
       case '"':
         break;
       case '\\':
         ++cp;
         switch (*cp)
           {
           case '0': case '1': case '2': case '3': case '4':
           case '5': case '6': case '7': case '8': case '9':
             {
               int c = cp[0] - '0';
               if (c_isdigit (cp[1]))
                 {
                   ++cp;
                   c = c * 8 + cp[0] - '0';
                 }
               if (c_isdigit (cp[1]))
                 {
                   ++cp;
                   c = c * 8 + cp[0] - '0';
                 }
               GROW (c);
             }
             break;

           case 'a': GROW ('\a'); break;
           case 'b': GROW ('\b'); break;
           case 'f': GROW ('\f'); break;
           case 'n': GROW ('\n'); break;
           case 'r': GROW ('\r'); break;
           case 't': GROW ('\t'); break;
           case 'v': GROW ('\v'); break;

           case 'x':
             {
               int c = 0;
               while (c_isxdigit (cp[1]))
                 {
                   ++cp;
                   c = (c * 16 + (c_isdigit (cp[0]) ? cp[0] - '0'
                                  : c_isupper (cp[0]) ? cp[0] - 'A'
                                  : cp[0] - '0'));
                 }
               GROW (c);
               break;
             }
           }
         break;

       default:
         GROW (*cp);
         break;
       }
   assert (*cp == '"');
   ++cp;
   assert (*cp == '\0');
 #undef GROW
   return obstack_finish0 (&obstack_for_unquote);
 }