/* Bison Grammar Parser -*- C -*- Copyright (C) 2002-2015, 2018-2022 Free Software Foundation, Inc. This file is part of Bison, the GNU Compiler Compiler. This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program. If not, see . */ %code requires { #include "symlist.h" #include "symtab.h" } %code provides { /* Initialize unquote. */ void parser_init (void); /* Deallocate storage for unquote. */ void parser_free (void); } %code top { /* On column 0 to please syntax-check. */ #include } %code { #include "system.h" #include #include #include #include #include "complain.h" #include "conflicts.h" #include "files.h" #include "getargs.h" #include "gram.h" #include "named-ref.h" #include "reader.h" #include "scan-code.h" #include "scan-gram.h" #include "strversion.h" /* Pretend to be at least that version, to check features published in that version while developping it. */ static const char* api_version = "3.8"; static int current_prec = 0; static location current_lhs_loc; static named_ref *current_lhs_named_ref; static symbol *current_lhs_symbol; static symbol_class current_class = unknown_sym; /** Set the new current left-hand side symbol, possibly common * to several right-hand side parts of rule. */ static void current_lhs (symbol *sym, location loc, named_ref *ref); #define YYLLOC_DEFAULT(Current, Rhs, N) \ (Current) = lloc_default (Rhs, N) static YYLTYPE lloc_default (YYLTYPE const *, int); #define YY_LOCATION_PRINT(File, Loc) \ location_print (Loc, File) /* Strip initial '{' and final '}' (must be first and last characters). Return the result. */ static char *strip_braces (char *code); /* Convert CODE by calling code_props_plain_init if PLAIN, otherwise code_props_symbol_action_init. Calls gram_scanner_last_string_free to release the latest string from the scanner (should be CODE). */ static char const *translate_code (char *code, location loc, bool plain); /* Convert CODE by calling code_props_plain_init after having stripped the first and last characters (expected to be '{', and '}'). Calls gram_scanner_last_string_free to release the latest string from the scanner (should be CODE). */ static char const *translate_code_braceless (char *code, location loc); /* Handle a %header directive. */ static void handle_header (char const *value); /* Handle a %error-verbose directive. */ static void handle_error_verbose (location const *loc, char const *directive); /* Handle a %file-prefix directive. */ static void handle_file_prefix (location const *loc, location const *dir_loc, char const *directive, char const *value); /* Handle a %language directive. */ static void handle_language (location const *loc, char const *lang); /* Handle a %name-prefix directive. */ static void handle_name_prefix (location const *loc, char const *directive, char const *value); /* Handle a %pure-parser directive. */ static void handle_pure_parser (location const *loc, char const *directive); /* Handle a %require directive. */ static void handle_require (location const *loc, char const *version); /* Handle a %skeleton directive. */ static void handle_skeleton (location const *loc, char const *skel); /* Handle a %yacc directive. */ static void handle_yacc (location const *loc); /* Implementation of yyerror. */ static void gram_error (location const *, char const *); /* A string that describes a char (e.g., 'a' -> "'a'"). */ static char const *char_name (char); /* Add style to semantic values in traces. */ static void tron (FILE *yyo); static void troff (FILE *yyo); /* Interpret a quoted string (such as `"Hello, \"World\"\n\""`). Manages the memory of the result. */ static char *unquote (const char *str); /* Discard the latest unquoted string. */ static void unquote_free (char *last_string); } %define api.header.include {"parse-gram.h"} %define api.prefix {gram_} %define api.pure full %define api.token.raw %define api.value.type union %define locations %define parse.error custom %define parse.lac full %define parse.trace %header %expect 0 %verbose %initial-action { /* Bison's grammar can initial empty locations, hence a default location is needed. */ boundary_set (&@$.start, grammar_file, 1, 1, 1); boundary_set (&@$.end, grammar_file, 1, 1, 1); } %token STRING _("string") TSTRING _("translatable string") PERCENT_TOKEN "%token" PERCENT_NTERM "%nterm" PERCENT_TYPE "%type" PERCENT_DESTRUCTOR "%destructor" PERCENT_PRINTER "%printer" PERCENT_LEFT "%left" PERCENT_RIGHT "%right" PERCENT_NONASSOC "%nonassoc" PERCENT_PRECEDENCE "%precedence" PERCENT_PREC "%prec" PERCENT_DPREC "%dprec" PERCENT_MERGE "%merge" PERCENT_CODE "%code" PERCENT_DEFAULT_PREC "%default-prec" PERCENT_DEFINE "%define" PERCENT_ERROR_VERBOSE "%error-verbose" PERCENT_EXPECT "%expect" PERCENT_EXPECT_RR "%expect-rr" PERCENT_FILE_PREFIX "%file-prefix" PERCENT_FLAG "%" PERCENT_GLR_PARSER "%glr-parser" PERCENT_HEADER "%header" PERCENT_INITIAL_ACTION "%initial-action" PERCENT_LANGUAGE "%language" PERCENT_NAME_PREFIX "%name-prefix" PERCENT_NO_DEFAULT_PREC "%no-default-prec" PERCENT_NO_LINES "%no-lines" PERCENT_NONDETERMINISTIC_PARSER "%nondeterministic-parser" PERCENT_OUTPUT "%output" PERCENT_PURE_PARSER "%pure-parser" PERCENT_REQUIRE "%require" PERCENT_SKELETON "%skeleton" PERCENT_START "%start" PERCENT_TOKEN_TABLE "%token-table" PERCENT_VERBOSE "%verbose" PERCENT_YACC "%yacc" BRACED_CODE "{...}" BRACED_PREDICATE "%?{...}" BRACKETED_ID _("[identifier]") CHAR_LITERAL _("character literal") COLON ":" EPILOGUE _("epilogue") EQUAL "=" ID _("identifier") ID_COLON _("identifier:") PERCENT_PERCENT "%%" PIPE "|" PROLOGUE "%{...%}" SEMICOLON ";" TAG _("") TAG_ANY "<*>" TAG_NONE "<>" /* Experimental feature, don't rely on it. */ %code pre-printer {tron (yyo);} %code post-printer {troff (yyo);} %type CHAR_LITERAL %printer { fputs (char_name ($$), yyo); } %type "{...}" "%?{...}" "%{...%}" EPILOGUE STRING TSTRING %printer { fputs ($$, yyo); } %type BRACKETED_ID ID ID_COLON PERCENT_ERROR_VERBOSE PERCENT_FILE_PREFIX PERCENT_FLAG PERCENT_NAME_PREFIX PERCENT_PURE_PARSER TAG tag tag.opt variable %printer { fputs ($$, yyo); } %printer { fprintf (yyo, "[%s]", $$); } BRACKETED_ID %printer { fprintf (yyo, "%s:", $$); } ID_COLON %printer { fprintf (yyo, "%%%s", $$); } PERCENT_FLAG %printer { fprintf (yyo, "<%s>", $$); } TAG tag %token INT_LITERAL _("integer literal") %printer { fprintf (yyo, "%d", $$); } %type id id_colon string_as_id symbol token_decl token_decl_for_prec %printer { fprintf (yyo, "%s", $$ ? $$->tag : ""); } %printer { fprintf (yyo, "%s:", $$->tag); } id_colon %type precedence_declarator %destructor { symbol_list_free ($$); } %printer { symbol_list_syms_print ($$, yyo); } %type named_ref.opt /*---------. | %param. | `---------*/ %code requires { typedef enum { param_none = 0, param_lex = 1 << 0, param_parse = 1 << 1, param_both = param_lex | param_parse } param_type; }; %code { /** Add a lex-param and/or a parse-param. * * \param type where to push this formal argument. * \param decl the formal argument. Destroyed. * \param loc the location in the source. */ static void add_param (param_type type, char *decl, location loc); static param_type current_param = param_none; }; %token PERCENT_PARAM "%param"; %printer { switch ($$) { #define CASE(In, Out) \ case param_ ## In: fputs ("%" #Out, yyo); break CASE (lex, lex-param); CASE (parse, parse-param); CASE (both, param); #undef CASE case param_none: aver (false); break; } } ; /*==========\ | Grammar. | \==========*/ %% input: prologue_declarations "%%" grammar epilogue.opt ; /*------------------------------------. | Declarations: before the first %%. | `------------------------------------*/ prologue_declarations: %empty | prologue_declarations prologue_declaration ; prologue_declaration: grammar_declaration | "%{...%}" { muscle_code_grow (union_seen ? "post_prologue" : "pre_prologue", translate_code ($1, @1, true), @1); code_scanner_last_string_free (); } | "%" { muscle_percent_define_ensure ($1, @1, true); } | "%define" variable value { muscle_percent_define_insert ($2, @$, $3.kind, $3.chars, MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE); } | "%header" string.opt { handle_header ($2); } | "%error-verbose" { handle_error_verbose (&@$, $1); } | "%expect" INT_LITERAL { expected_sr_conflicts = $2; } | "%expect-rr" INT_LITERAL { expected_rr_conflicts = $2; } | "%file-prefix" STRING { handle_file_prefix (&@$, &@1, $1, $2); } | "%glr-parser" { nondeterministic_parser = true; glr_parser = true; } | "%initial-action" "{...}" { muscle_code_grow ("initial_action", translate_code ($2, @2, false), @2); code_scanner_last_string_free (); } | "%language" STRING { handle_language (&@1, $2); } | "%name-prefix" STRING { handle_name_prefix (&@$, $1, $2); } | "%no-lines" { no_lines_flag = true; } | "%nondeterministic-parser" { nondeterministic_parser = true; } | "%output" STRING { spec_outfile = unquote ($2); gram_scanner_last_string_free (); } | "%param" { current_param = $1; } params { current_param = param_none; } | "%pure-parser" { handle_pure_parser (&@$, $1); } | "%require" STRING { handle_require (&@2, $2); } | "%skeleton" STRING { handle_skeleton (&@2, $2); } | "%token-table" { token_table_flag = true; } | "%verbose" { report_flag |= report_states; } | "%yacc" { handle_yacc (&@$); } | error ";" { current_class = unknown_sym; yyerrok; } | /*FIXME: Err? What is this horror doing here? */ ";" ; params: params "{...}" { add_param (current_param, $2, @2); } | "{...}" { add_param (current_param, $1, @1); } ; /*----------------------. | grammar_declaration. | `----------------------*/ grammar_declaration: symbol_declaration | "%start" symbols.1 { grammar_start_symbols_add ($2); } | code_props_type "{...}" generic_symlist { code_props code; code_props_symbol_action_init (&code, $2, @2); code_props_translate_code (&code); { for (symbol_list *list = $3; list; list = list->next) symbol_list_code_props_set (list, $1, &code); symbol_list_free ($3); } } | "%default-prec" { default_prec = true; } | "%no-default-prec" { default_prec = false; } | "%code" "{...}" { /* Do not invoke muscle_percent_code_grow here since it invokes muscle_user_name_list_grow. */ muscle_code_grow ("percent_code()", translate_code_braceless ($2, @2), @2); code_scanner_last_string_free (); } | "%code" ID "{...}" { muscle_percent_code_grow ($2, @2, translate_code_braceless ($3, @3), @3); code_scanner_last_string_free (); } ; %type code_props_type; %printer { fprintf (yyo, "%s", code_props_type_string ($$)); } ; code_props_type: "%destructor" { $$ = destructor; } | "%printer" { $$ = printer; } ; /*---------. | %union. | `---------*/ %token PERCENT_UNION "%union"; union_name: %empty {} | ID { muscle_percent_define_insert ("api.value.union.name", @1, muscle_keyword, $1, MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE); } ; grammar_declaration: "%union" union_name "{...}" { union_seen = true; muscle_code_grow ("union_members", translate_code_braceless ($3, @3), @3); code_scanner_last_string_free (); } ; %type nterm_decls symbol_decls symbols.1 token_decls token_decls_for_prec token_decl.1 token_decl_for_prec.1; symbol_declaration: "%nterm" { current_class = nterm_sym; } nterm_decls[syms] { current_class = unknown_sym; symbol_list_free ($syms); } | "%token" { current_class = token_sym; } token_decls[syms] { current_class = unknown_sym; symbol_list_free ($syms); } | "%type" { current_class = pct_type_sym; } symbol_decls[syms] { current_class = unknown_sym; symbol_list_free ($syms); } | precedence_declarator token_decls_for_prec[syms] { ++current_prec; for (symbol_list *list = $syms; list; list = list->next) symbol_precedence_set (list->content.sym, current_prec, $1, @1); symbol_list_free ($syms); } ; precedence_declarator: "%left" { $$ = left_assoc; } | "%right" { $$ = right_assoc; } | "%nonassoc" { $$ = non_assoc; } | "%precedence" { $$ = precedence_assoc; } ; %type string.opt; string.opt: %empty { $$ = NULL; } | STRING { $$ = $1; } ; tag.opt: %empty { $$ = NULL; } | TAG { $$ = $1; } ; %type generic_symlist generic_symlist_item; generic_symlist: generic_symlist_item | generic_symlist generic_symlist_item { $$ = symbol_list_append ($1, $2); } ; generic_symlist_item: symbol { $$ = symbol_list_sym_new ($1, @1); } | tag { $$ = symbol_list_type_new ($1, @1); } ; tag: TAG | "<*>" { $$ = uniqstr_new ("*"); } | "<>" { $$ = uniqstr_new (""); } ; /*-----------------------. | nterm_decls (%nterm). | `-----------------------*/ // A non empty list of possibly tagged symbols for %nterm. // // Can easily be defined like symbol_decls but restricted to ID, but // using token_decls allows to reduce the number of rules, and also to // make nicer error messages on "%nterm 'a'" or '%nterm FOO "foo"'. nterm_decls: token_decls ; /*-----------------------------------. | token_decls (%token, and %nterm). | `-----------------------------------*/ // A non empty list of possibly tagged symbols for %token or %nterm. token_decls: token_decl.1[syms] { $$ = $syms; } | TAG token_decl.1[syms] { $$ = symbol_list_type_set ($syms, $TAG); } | token_decls TAG token_decl.1[syms] { $$ = symbol_list_append ($1, symbol_list_type_set ($syms, $TAG)); } ; // One or more symbol declarations for %token or %nterm. token_decl.1: token_decl { $$ = symbol_list_sym_new ($1, @1); } | token_decl.1 token_decl { $$ = symbol_list_append ($1, symbol_list_sym_new ($2, @2)); } // One symbol declaration for %token or %nterm. token_decl: id int.opt[num] alias { $$ = $id; symbol_class_set ($id, current_class, @id, true); if (0 <= $num) symbol_code_set ($id, $num, @num); if ($alias) symbol_make_alias ($id, $alias, @alias); } ; %type int.opt; int.opt: %empty { $$ = -1; } | INT_LITERAL ; %type alias; alias: %empty { $$ = NULL; } | string_as_id { $$ = $1; } | TSTRING { $$ = symbol_get ($1, @1); symbol_class_set ($$, token_sym, @1, false); $$->translatable = true; } ; /*-------------------------------------. | token_decls_for_prec (%left, etc.). | `-------------------------------------*/ // A non empty list of possibly tagged tokens for precedence declaration. // // Similar to %token (token_decls), but in '%left FOO 1 "foo"', it treats // FOO and "foo" as two different symbols instead of aliasing them. token_decls_for_prec: token_decl_for_prec.1[syms] { $$ = $syms; } | TAG token_decl_for_prec.1[syms] { $$ = symbol_list_type_set ($syms, $TAG); } | token_decls_for_prec TAG token_decl_for_prec.1[syms] { $$ = symbol_list_append ($1, symbol_list_type_set ($syms, $TAG)); } ; // One or more token declarations for precedence declaration. token_decl_for_prec.1: token_decl_for_prec { $$ = symbol_list_sym_new ($1, @1); } | token_decl_for_prec.1 token_decl_for_prec { $$ = symbol_list_append ($1, symbol_list_sym_new ($2, @2)); } // One token declaration for precedence declaration. token_decl_for_prec: id int.opt[num] { $$ = $id; symbol_class_set ($id, token_sym, @id, false); if (0 <= $num) symbol_code_set ($id, $num, @num); } | string_as_id ; /*-----------------------------------. | symbol_decls (argument of %type). | `-----------------------------------*/ // A non empty list of typed symbols (for %type). symbol_decls: symbols.1[syms] { $$ = $syms; } | TAG symbols.1[syms] { $$ = symbol_list_type_set ($syms, $TAG); } | symbol_decls TAG symbols.1[syms] { $$ = symbol_list_append ($1, symbol_list_type_set ($syms, $TAG)); } ; // One or more symbols. symbols.1: symbol { if (current_class != unknown_sym) symbol_class_set ($symbol, current_class, @symbol, false); $$ = symbol_list_sym_new ($symbol, @symbol); } | symbols.1 symbol { if (current_class != unknown_sym) symbol_class_set ($symbol, current_class, @symbol, false); $$ = symbol_list_append ($1, symbol_list_sym_new ($symbol, @symbol)); } ; /*------------------------------------------. | The grammar section: between the two %%. | `------------------------------------------*/ grammar: rules_or_grammar_declaration | grammar rules_or_grammar_declaration ; /* As a Bison extension, one can use the grammar declarations in the body of the grammar. */ rules_or_grammar_declaration: rules | grammar_declaration ";" | error ";" { yyerrok; } ; rules: id_colon named_ref.opt { current_lhs ($1, @1, $2); } ":" rhses.1 { /* Free the current lhs. */ current_lhs (0, @1, 0); } ; rhses.1: rhs { grammar_current_rule_end (@rhs); } | rhses.1 "|" rhs { grammar_current_rule_end (@rhs); } | rhses.1 ";" ; %token PERCENT_EMPTY "%empty"; rhs: %empty { grammar_current_rule_begin (current_lhs_symbol, current_lhs_loc, current_lhs_named_ref); } | rhs symbol named_ref.opt { grammar_current_rule_symbol_append ($2, @2, $3); } | rhs tag.opt "{...}"[action] named_ref.opt[name] { grammar_current_rule_action_append ($action, @action, $name, $[tag.opt]); } | rhs "%?{...}" { grammar_current_rule_predicate_append ($2, @2); } | rhs "%empty" { grammar_current_rule_empty_set (@2); } | rhs "%prec" symbol { grammar_current_rule_prec_set ($3, @3); } | rhs "%dprec" INT_LITERAL { grammar_current_rule_dprec_set ($3, @3); } | rhs "%merge" TAG { grammar_current_rule_merge_set ($3, @3); } | rhs "%expect" INT_LITERAL { grammar_current_rule_expect_sr ($3, @3); } | rhs "%expect-rr" INT_LITERAL { grammar_current_rule_expect_rr ($3, @3); } ; named_ref.opt: %empty { $$ = NULL; } | BRACKETED_ID { $$ = named_ref_new ($1, @1); } ; /*---------------------. | variable and value. | `---------------------*/ variable: ID ; /* Some content or empty by default. */ %code requires { #include "muscle-tab.h" typedef struct { char const *chars; muscle_kind kind; } value_type; }; %type value; %printer { switch ($$.kind) { case muscle_code: fprintf (yyo, "{%s}", $$.chars); break; case muscle_keyword: fprintf (yyo, "%s", $$.chars); break; case muscle_string: fprintf (yyo, "\"%s\"", $$.chars); break; } } ; value: %empty { $$.kind = muscle_keyword; $$.chars = ""; } | ID { $$.kind = muscle_keyword; $$.chars = $1; } | STRING { $$.kind = muscle_string; $$.chars = unquote ($1); gram_scanner_last_string_free ();} | "{...}" { $$.kind = muscle_code; $$.chars = strip_braces ($1); gram_scanner_last_string_free (); } ; /*--------------. | Identifiers. | `--------------*/ /* Identifiers are returned as uniqstr values by the scanner. Depending on their use, we may need to make them genuine symbols. */ id: ID { $$ = symbol_from_uniqstr ($1, @1); } | CHAR_LITERAL { const char *var = "api.token.raw"; if (current_class == nterm_sym) { complain (&@1, complaint, _("character literals cannot be nonterminals")); YYERROR; } if (muscle_percent_define_ifdef (var)) { complain (&@1, complaint, _("character literals cannot be used together" " with %s"), var); location loc = muscle_percent_define_get_loc (var); subcomplain (&loc, complaint, _("definition of %s"), var); } $$ = symbol_get (char_name ($1), @1); symbol_class_set ($$, token_sym, @1, false); symbol_code_set ($$, $1, @1); } ; id_colon: ID_COLON { $$ = symbol_from_uniqstr ($1, @1); } ; symbol: id | string_as_id ; /* A string used as an ID. */ string_as_id: STRING { $$ = symbol_get ($1, @1); symbol_class_set ($$, token_sym, @1, false); } ; epilogue.opt: %empty | "%%" EPILOGUE { muscle_code_grow ("epilogue", translate_code ($2, @2, true), @2); code_scanner_last_string_free (); } ; %% int yyreport_syntax_error (const yypcontext_t *ctx) { int res = 0; /* Arguments of format: reported tokens (one for the "unexpected", one per "expected"). */ enum { ARGS_MAX = 5 }; const char *argv[ARGS_MAX]; int argc = 0; yysymbol_kind_t unexpected = yypcontext_token (ctx); if (unexpected != YYSYMBOL_YYEMPTY) { argv[argc++] = yysymbol_name (unexpected); yysymbol_kind_t expected[ARGS_MAX - 1]; int nexpected = yypcontext_expected_tokens (ctx, expected, ARGS_MAX - 1); if (nexpected < 0) res = nexpected; else for (int i = 0; i < nexpected; ++i) argv[argc++] = yysymbol_name (expected[i]); } syntax_error (*yypcontext_location (ctx), argc, argv); return res; } /* Return the location of the left-hand side of a rule whose right-hand side is RHS[1] ... RHS[N]. Ignore empty nonterminals in the right-hand side, and return an empty location equal to the end boundary of RHS[0] if the right-hand side is empty. */ static YYLTYPE lloc_default (YYLTYPE const *rhs, int n) { YYLTYPE loc; /* SGI MIPSpro 7.4.1m miscompiles "loc.start = loc.end = rhs[n].end;". The bug is fixed in 7.4.2m, but play it safe for now. */ loc.start = rhs[n].end; loc.end = rhs[n].end; /* Ignore empty nonterminals the start of the right-hand side. Do not bother to ignore them at the end of the right-hand side, since empty nonterminals have the same end as their predecessors. */ for (int i = 1; i <= n; i++) if (! equal_boundaries (rhs[i].start, rhs[i].end)) { loc.start = rhs[i].start; break; } return loc; } static char *strip_braces (char *code) { code[strlen (code) - 1] = 0; return code + 1; } static char const * translate_code (char *code, location loc, bool plain) { code_props plain_code; if (plain) code_props_plain_init (&plain_code, code, loc); else code_props_symbol_action_init (&plain_code, code, loc); code_props_translate_code (&plain_code); gram_scanner_last_string_free (); return plain_code.code; } static char const * translate_code_braceless (char *code, location loc) { return translate_code (strip_braces (code), loc, true); } static void add_param (param_type type, char *decl, location loc) { static char const alphanum[26 + 26 + 1 + 10 + 1] = "abcdefghijklmnopqrstuvwxyz" "ABCDEFGHIJKLMNOPQRSTUVWXYZ" "_" "0123456789"; char const *name_start = NULL; { char *p; /* Stop on last actual character. */ for (p = decl; p[1]; p++) if ((p == decl || ! memchr (alphanum, p[-1], sizeof alphanum - 1)) && memchr (alphanum, p[0], sizeof alphanum - 10 - 1)) name_start = p; /* Strip the surrounding '{' and '}', and any blanks just inside the braces. */ --p; while (c_isspace (*p)) --p; p[1] = '\0'; ++decl; while (c_isspace (*decl)) ++decl; } if (! name_start) complain (&loc, complaint, _("missing identifier in parameter declaration")); else { char *name = xmemdup0 (name_start, strspn (name_start, alphanum)); if (type & param_lex) muscle_pair_list_grow ("lex_param", decl, name); if (type & param_parse) muscle_pair_list_grow ("parse_param", decl, name); free (name); } gram_scanner_last_string_free (); } static void handle_header (char const *value) { header_flag = true; if (value) { char *file = unquote (value); spec_header_file = xstrdup (file); gram_scanner_last_string_free (); unquote_free (file); } } static void handle_error_verbose (location const *loc, char const *directive) { bison_directive (loc, directive); muscle_percent_define_insert (directive, *loc, muscle_keyword, "", MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE); } static void handle_file_prefix (location const *loc, location const *dir_loc, char const *directive, char const *value_quoted) { char *value = unquote (value_quoted); bison_directive (loc, directive); bool warned = false; if (location_empty (spec_file_prefix_loc)) { spec_file_prefix_loc = *loc; spec_file_prefix = value; } else { duplicate_directive (directive, spec_file_prefix_loc, *loc); warned = true; } if (!warned && STRNEQ (directive, "%file-prefix")) deprecated_directive (dir_loc, directive, "%file-prefix"); } static void handle_language (location const *loc, char const *lang) { language_argmatch (unquote (lang), grammar_prio, *loc); } static void handle_name_prefix (location const *loc, char const *directive, char const *value_quoted) { char *value = unquote (value_quoted); bison_directive (loc, directive); char buf1[1024]; size_t len1 = sizeof (buf1); char *old = asnprintf (buf1, &len1, "%s\"%s\"", directive, value); if (!old) xalloc_die (); if (location_empty (spec_name_prefix_loc)) { spec_name_prefix = value; spec_name_prefix_loc = *loc; char buf2[1024]; size_t len2 = sizeof (buf2); char *new = asnprintf (buf2, &len2, "%%define api.prefix {%s}", value); if (!new) xalloc_die (); deprecated_directive (loc, old, new); if (new != buf2) free (new); } else duplicate_directive (old, spec_file_prefix_loc, *loc); if (old != buf1) free (old); } static void handle_pure_parser (location const *loc, char const *directive) { bison_directive (loc, directive); deprecated_directive (loc, directive, "%define api.pure"); muscle_percent_define_insert ("api.pure", *loc, muscle_keyword, "", MUSCLE_PERCENT_DEFINE_GRAMMAR_FILE); } static void handle_require (location const *loc, char const *version_quoted) { char *version = unquote (version_quoted); required_version = strversion_to_int (version); if (required_version == -1) { complain (loc, complaint, _("invalid version requirement: %s"), version); required_version = 0; } else { const char* package_version = 0 < strverscmp (api_version, PACKAGE_VERSION) ? api_version : PACKAGE_VERSION; if (0 < strverscmp (version, package_version)) { complain (loc, complaint, _("require bison %s, but have %s"), version, package_version); exit (EX_MISMATCH); } } unquote_free (version); gram_scanner_last_string_free (); } static void handle_skeleton (location const *loc, char const *skel_quoted) { char *skel = unquote (skel_quoted); char const *skeleton_user = skel; if (strchr (skeleton_user, '/')) { size_t dir_length = strlen (grammar_file); while (dir_length && grammar_file[dir_length - 1] != '/') --dir_length; while (dir_length && grammar_file[dir_length - 1] == '/') --dir_length; char *skeleton_build = xmalloc (dir_length + 1 + strlen (skeleton_user) + 1); if (dir_length > 0) { memcpy (skeleton_build, grammar_file, dir_length); skeleton_build[dir_length++] = '/'; } strcpy (skeleton_build + dir_length, skeleton_user); skeleton_user = uniqstr_new (skeleton_build); free (skeleton_build); } skeleton_arg (skeleton_user, grammar_prio, *loc); } static void handle_yacc (location const *loc) { const char *directive = "%yacc"; bison_directive (loc, directive); if (location_empty (yacc_loc)) set_yacc (*loc); else duplicate_directive (directive, yacc_loc, *loc); } static void gram_error (location const *loc, char const *msg) { complain (loc, complaint, "%s", msg); } static char const * char_name (char c) { if (c == '\'') return "'\\''"; else { char buf[4]; buf[0] = '\''; buf[1] = c; buf[2] = '\''; buf[3] = '\0'; return quotearg_style (escape_quoting_style, buf); } } static void current_lhs (symbol *sym, location loc, named_ref *ref) { current_lhs_symbol = sym; current_lhs_loc = loc; if (sym) symbol_location_as_lhs_set (sym, loc); /* In order to simplify memory management, named references for lhs are always assigned by deep copy into the current symbol_list node. This is because a single named-ref in the grammar may result in several uses when the user factors lhs between several rules using "|". Therefore free the parser's original copy. */ free (current_lhs_named_ref); current_lhs_named_ref = ref; } static void tron (FILE *yyo) { begin_use_class ("value", yyo); } static void troff (FILE *yyo) { end_use_class ("value", yyo); } /*----------. | Unquote. | `----------*/ struct obstack obstack_for_unquote; void parser_init (void) { obstack_init (&obstack_for_unquote); } void parser_free (void) { obstack_free (&obstack_for_unquote, 0); } static void unquote_free (char *last_string) { obstack_free (&obstack_for_unquote, last_string); } static char * unquote (const char *cp) { #define GROW(Char) \ obstack_1grow (&obstack_for_unquote, Char); for (++cp; *cp && *cp != '"'; ++cp) switch (*cp) { case '"': break; case '\\': ++cp; switch (*cp) { case '0': case '1': case '2': case '3': case '4': case '5': case '6': case '7': case '8': case '9': { int c = cp[0] - '0'; if (c_isdigit (cp[1])) { ++cp; c = c * 8 + cp[0] - '0'; } if (c_isdigit (cp[1])) { ++cp; c = c * 8 + cp[0] - '0'; } GROW (c); } break; case 'a': GROW ('\a'); break; case 'b': GROW ('\b'); break; case 'f': GROW ('\f'); break; case 'n': GROW ('\n'); break; case 'r': GROW ('\r'); break; case 't': GROW ('\t'); break; case 'v': GROW ('\v'); break; case 'x': { int c = 0; while (c_isxdigit (cp[1])) { ++cp; c = (c * 16 + (c_isdigit (cp[0]) ? cp[0] - '0' : c_isupper (cp[0]) ? cp[0] - 'A' : cp[0] - '0')); } GROW (c); break; } } break; default: GROW (*cp); break; } assert (*cp == '"'); ++cp; assert (*cp == '\0'); #undef GROW return obstack_finish0 (&obstack_for_unquote); }