mirror of
https://git.savannah.gnu.org/git/bison.git
synced 2026-03-09 20:33:03 +00:00
* src/muscle_tab.h, src/muscle_tab.c: Rename as... * src/muscle-tab.h, src/muscle-tab.c: these. * src/getargs.c, src/local.mk, src/main.c, src/output.c, * src/parse-gram.y, src/reader.c, src/scan-code.l: Adjust.
518 lines
14 KiB
C
518 lines
14 KiB
C
/* Bison Action Scanner -*- C -*-
|
|
|
|
Copyright (C) 2006, 2007, 2008, 2009 Free Software Foundation, Inc.
|
|
|
|
This file is part of Bison, the GNU Compiler Compiler.
|
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>. */
|
|
|
|
%option debug nodefault nounput noyywrap never-interactive
|
|
%option prefix="code_" outfile="lex.yy.c"
|
|
|
|
%{
|
|
/* Work around a bug in flex 2.5.31. See Debian bug 333231
|
|
<http://bugs.debian.org/cgi-bin/bugreport.cgi?bug=333231>. */
|
|
#undef code_wrap
|
|
#define code_wrap() 1
|
|
|
|
#define FLEX_PREFIX(Id) code_ ## Id
|
|
#include <src/flex-scanner.h>
|
|
|
|
#include <src/complain.h>
|
|
#include <src/reader.h>
|
|
#include <src/getargs.h>
|
|
#include <get-errno.h>
|
|
#include <quote.h>
|
|
#include <src/muscle-tab.h>
|
|
#include <src/scan-code.h>
|
|
#include <src/symlist.h>
|
|
|
|
/* The current calling start condition: SC_RULE_ACTION or
|
|
SC_SYMBOL_ACTION. */
|
|
# define YY_DECL static char *code_lex (code_props *self, int sc_context)
|
|
YY_DECL;
|
|
|
|
#define YY_USER_ACTION location_compute (loc, &loc->end, yytext, yyleng);
|
|
|
|
static void handle_action_dollar (symbol_list *rule, char *cp,
|
|
location dollar_loc);
|
|
static void handle_action_at (symbol_list *rule, char *cp, location at_loc);
|
|
static location the_location;
|
|
static location *loc = &the_location;
|
|
|
|
/* A string representing the most recent translation. */
|
|
static char *last_string;
|
|
|
|
/* True if an untyped $$ or $n was seen. */
|
|
static bool untyped_var_seen;
|
|
%}
|
|
/* C and C++ comments in code. */
|
|
%x SC_COMMENT SC_LINE_COMMENT
|
|
/* Strings and characters in code. */
|
|
%x SC_STRING SC_CHARACTER
|
|
/* Whether in a rule or symbol action. Specifies the translation
|
|
of $ and @. */
|
|
%x SC_RULE_ACTION SC_SYMBOL_ACTION
|
|
|
|
|
|
/* POSIX says that a tag must be both an id and a C union member, but
|
|
historically almost any character is allowed in a tag. We disallow
|
|
NUL and newline, as this simplifies our implementation. */
|
|
tag [^\0\n>]+
|
|
|
|
/* Zero or more instances of backslash-newline. Following GCC, allow
|
|
white space between the backslash and the newline. */
|
|
splice (\\[ \f\t\v]*\n)*
|
|
|
|
%%
|
|
|
|
%{
|
|
/* Nesting level of the current code in braces. */
|
|
int braces_level = 0;
|
|
|
|
/* Whether a semicolon is probably needed.
|
|
The heuristic is that a semicolon is not needed after `{', `}', `;',
|
|
or a C preprocessor directive, and that whitespaces and comments
|
|
do not affect this flag.
|
|
Note that `{' does not need a semicolon because of `{}'.
|
|
A semicolon may be needed before a cpp direcive, but don't bother. */
|
|
bool need_semicolon = false;
|
|
|
|
/* Whether in a C preprocessor directive. Don't use a start condition
|
|
for this because, at the end of strings and comments, we still need
|
|
to know whether we're in a directive. */
|
|
bool in_cpp = false;
|
|
|
|
/* This scanner is special: it is invoked only once, henceforth
|
|
is expected to return only once. This initialization is
|
|
therefore done once per action to translate. */
|
|
aver (sc_context == SC_SYMBOL_ACTION
|
|
|| sc_context == SC_RULE_ACTION
|
|
|| sc_context == INITIAL);
|
|
BEGIN sc_context;
|
|
%}
|
|
|
|
/*------------------------------------------------------------.
|
|
| Scanning a C comment. The initial `/ *' is already eaten. |
|
|
`------------------------------------------------------------*/
|
|
|
|
<SC_COMMENT>
|
|
{
|
|
"*"{splice}"/" STRING_GROW; BEGIN sc_context;
|
|
}
|
|
|
|
|
|
/*--------------------------------------------------------------.
|
|
| Scanning a line comment. The initial `//' is already eaten. |
|
|
`--------------------------------------------------------------*/
|
|
|
|
<SC_LINE_COMMENT>
|
|
{
|
|
"\n" STRING_GROW; BEGIN sc_context;
|
|
{splice} STRING_GROW;
|
|
}
|
|
|
|
|
|
/*--------------------------------------------.
|
|
| Scanning user-code characters and strings. |
|
|
`--------------------------------------------*/
|
|
|
|
<SC_CHARACTER,SC_STRING>
|
|
{
|
|
{splice}|\\{splice}. STRING_GROW;
|
|
}
|
|
|
|
<SC_CHARACTER>
|
|
{
|
|
"'" STRING_GROW; BEGIN sc_context;
|
|
}
|
|
|
|
<SC_STRING>
|
|
{
|
|
"\"" STRING_GROW; BEGIN sc_context;
|
|
}
|
|
|
|
|
|
<SC_RULE_ACTION,SC_SYMBOL_ACTION>{
|
|
"'" {
|
|
STRING_GROW;
|
|
BEGIN SC_CHARACTER;
|
|
need_semicolon = true;
|
|
}
|
|
"\"" {
|
|
STRING_GROW;
|
|
BEGIN SC_STRING;
|
|
need_semicolon = true;
|
|
}
|
|
"/"{splice}"*" {
|
|
STRING_GROW;
|
|
BEGIN SC_COMMENT;
|
|
}
|
|
"/"{splice}"/" {
|
|
STRING_GROW;
|
|
BEGIN SC_LINE_COMMENT;
|
|
}
|
|
}
|
|
|
|
<SC_RULE_ACTION>
|
|
{
|
|
"$"("<"{tag}">")?(-?[0-9]+|"$") {
|
|
handle_action_dollar (self->rule, yytext, *loc);
|
|
need_semicolon = true;
|
|
}
|
|
"@"(-?[0-9]+|"$") {
|
|
handle_action_at (self->rule, yytext, *loc);
|
|
need_semicolon = true;
|
|
}
|
|
|
|
"$" {
|
|
warn_at (*loc, _("stray `$'"));
|
|
obstack_sgrow (&obstack_for_string, "$][");
|
|
need_semicolon = true;
|
|
}
|
|
"@" {
|
|
warn_at (*loc, _("stray `@'"));
|
|
obstack_sgrow (&obstack_for_string, "@@");
|
|
need_semicolon = true;
|
|
}
|
|
"[" {
|
|
obstack_sgrow (&obstack_for_string, "@{");
|
|
need_semicolon = true;
|
|
}
|
|
"]" {
|
|
obstack_sgrow (&obstack_for_string, "@}");
|
|
need_semicolon = true;
|
|
}
|
|
|
|
";" STRING_GROW; need_semicolon = false;
|
|
"{" STRING_GROW; ++braces_level; need_semicolon = false;
|
|
"}" {
|
|
bool outer_brace = --braces_level == 0;
|
|
|
|
/* As an undocumented Bison extension, append `;' before the last
|
|
brace in braced code, so that the user code can omit trailing
|
|
`;'. But do not append `;' if emulating Yacc, since Yacc does
|
|
not append one. */
|
|
if (outer_brace && !yacc_flag && language_prio == default_prio
|
|
&& skeleton_prio == default_prio && need_semicolon && ! in_cpp)
|
|
{
|
|
warn_at (*loc, _("a `;' might be needed at the end of action code"));
|
|
warn_at (*loc, _("future versions of Bison will not add the `;'"));
|
|
obstack_1grow (&obstack_for_string, ';');
|
|
}
|
|
|
|
STRING_GROW;
|
|
need_semicolon = false;
|
|
}
|
|
|
|
/* Preprocessing directives should only be recognized at the beginning
|
|
of lines, allowing whitespace including comments, but in C/C++,
|
|
`#' can only be the start of preprocessor directives or within
|
|
`#define' directives anyway, so don't bother with begin of line. */
|
|
"#" STRING_GROW; in_cpp = true;
|
|
|
|
{splice} STRING_GROW;
|
|
[\n\r] STRING_GROW; if (in_cpp) in_cpp = need_semicolon = false;
|
|
[ \t\f] STRING_GROW;
|
|
. STRING_GROW; need_semicolon = true;
|
|
}
|
|
|
|
<SC_SYMBOL_ACTION>
|
|
{
|
|
"$$" {
|
|
obstack_sgrow (&obstack_for_string, "]b4_dollar_dollar[");
|
|
self->is_value_used = true;
|
|
}
|
|
"@$" {
|
|
obstack_sgrow (&obstack_for_string, "]b4_at_dollar[");
|
|
muscle_percent_define_ensure("locations", the_location, true);
|
|
}
|
|
}
|
|
|
|
|
|
/*-----------------------------------------.
|
|
| Escape M4 quoting characters in C code. |
|
|
`-----------------------------------------*/
|
|
|
|
<*>
|
|
{
|
|
\$ obstack_sgrow (&obstack_for_string, "$][");
|
|
\@ obstack_sgrow (&obstack_for_string, "@@");
|
|
\[ obstack_sgrow (&obstack_for_string, "@{");
|
|
\] obstack_sgrow (&obstack_for_string, "@}");
|
|
}
|
|
|
|
/*-----------------------------------------------------.
|
|
| By default, grow the string obstack with the input. |
|
|
`-----------------------------------------------------*/
|
|
|
|
<*>.|\n STRING_GROW;
|
|
|
|
/* End of processing. */
|
|
<*><<EOF>> {
|
|
STRING_FINISH;
|
|
return last_string;
|
|
}
|
|
|
|
%%
|
|
|
|
/* Keeps track of the maximum number of semantic values to the left of
|
|
a handle (those referenced by $0, $-1, etc.) are required by the
|
|
semantic actions of this grammar. */
|
|
int max_left_semantic_context = 0;
|
|
|
|
|
|
/*------------------------------------------------------------------.
|
|
| TEXT is pointing to a wannabee semantic value (i.e., a `$'). |
|
|
| |
|
|
| Possible inputs: $[<TYPENAME>]($|integer) |
|
|
| |
|
|
| Output to OBSTACK_FOR_STRING a reference to this semantic value. |
|
|
`------------------------------------------------------------------*/
|
|
|
|
static void
|
|
handle_action_dollar (symbol_list *rule, char *text, location dollar_loc)
|
|
{
|
|
char const *type_name = NULL;
|
|
char *cp = text + 1;
|
|
symbol_list *effective_rule;
|
|
int effective_rule_length;
|
|
|
|
if (rule->midrule_parent_rule)
|
|
{
|
|
effective_rule = rule->midrule_parent_rule;
|
|
effective_rule_length = rule->midrule_parent_rhs_index - 1;
|
|
}
|
|
else
|
|
{
|
|
effective_rule = rule;
|
|
effective_rule_length = symbol_list_length (rule->next);
|
|
}
|
|
|
|
/* Get the type name if explicit. */
|
|
if (*cp == '<')
|
|
{
|
|
type_name = ++cp;
|
|
while (*cp != '>')
|
|
++cp;
|
|
*cp = '\0';
|
|
++cp;
|
|
if (untyped_var_seen)
|
|
complain_at (dollar_loc, _("explicit type given in untyped grammar"));
|
|
tag_seen = true;
|
|
}
|
|
|
|
if (*cp == '$')
|
|
{
|
|
if (!type_name)
|
|
type_name = symbol_list_n_type_name_get (rule, dollar_loc, 0);
|
|
|
|
if (!type_name)
|
|
{
|
|
if (union_seen | tag_seen)
|
|
{
|
|
if (rule->midrule_parent_rule)
|
|
complain_at (dollar_loc,
|
|
_("$$ for the midrule at $%d of `%s'"
|
|
" has no declared type"),
|
|
rule->midrule_parent_rhs_index,
|
|
effective_rule->content.sym->tag);
|
|
else
|
|
complain_at (dollar_loc, _("$$ of `%s' has no declared type"),
|
|
rule->content.sym->tag);
|
|
}
|
|
else
|
|
untyped_var_seen = true;
|
|
type_name = "";
|
|
}
|
|
|
|
obstack_fgrow1 (&obstack_for_string,
|
|
"]b4_lhs_value([%s])[", type_name);
|
|
rule->action_props.is_value_used = true;
|
|
}
|
|
else
|
|
{
|
|
long int num = strtol (cp, NULL, 10);
|
|
|
|
if (1 - INT_MAX + effective_rule_length <= num
|
|
&& num <= effective_rule_length)
|
|
{
|
|
int n = num;
|
|
if (max_left_semantic_context < 1 - n)
|
|
max_left_semantic_context = 1 - n;
|
|
if (!type_name && 0 < n)
|
|
type_name =
|
|
symbol_list_n_type_name_get (effective_rule, dollar_loc, n);
|
|
if (!type_name)
|
|
{
|
|
if (union_seen | tag_seen)
|
|
complain_at (dollar_loc, _("$%d of `%s' has no declared type"),
|
|
n, effective_rule->content.sym->tag);
|
|
else
|
|
untyped_var_seen = true;
|
|
type_name = "";
|
|
}
|
|
|
|
obstack_fgrow3 (&obstack_for_string,
|
|
"]b4_rhs_value(%d, %d, [%s])[",
|
|
effective_rule_length, n, type_name);
|
|
if (n > 0)
|
|
symbol_list_n_get (effective_rule, n)->action_props.is_value_used =
|
|
true;
|
|
}
|
|
else
|
|
complain_at (dollar_loc, _("integer out of range: %s"), quote (text));
|
|
}
|
|
}
|
|
|
|
|
|
/*------------------------------------------------------.
|
|
| TEXT is a location token (i.e., a `@...'). Output to |
|
|
| OBSTACK_FOR_STRING a reference to this location. |
|
|
`------------------------------------------------------*/
|
|
|
|
static void
|
|
handle_action_at (symbol_list *rule, char *text, location at_loc)
|
|
{
|
|
char *cp = text + 1;
|
|
int effective_rule_length =
|
|
(rule->midrule_parent_rule
|
|
? rule->midrule_parent_rhs_index - 1
|
|
: symbol_list_length (rule->next));
|
|
|
|
muscle_percent_define_ensure("locations", at_loc, true);
|
|
|
|
if (*cp == '$')
|
|
obstack_sgrow (&obstack_for_string, "]b4_lhs_location[");
|
|
else
|
|
{
|
|
long int num = strtol (cp, NULL, 10);
|
|
|
|
if (1 - INT_MAX + effective_rule_length <= num
|
|
&& num <= effective_rule_length)
|
|
{
|
|
int n = num;
|
|
obstack_fgrow2 (&obstack_for_string, "]b4_rhs_location(%d, %d)[",
|
|
effective_rule_length, n);
|
|
}
|
|
else
|
|
complain_at (at_loc, _("integer out of range: %s"), quote (text));
|
|
}
|
|
}
|
|
|
|
|
|
/*-------------------------.
|
|
| Initialize the scanner. |
|
|
`-------------------------*/
|
|
|
|
/* Translate the dollars and ats in \a self, in the context \a sc_context
|
|
(SC_RULE_ACTION, SC_SYMBOL_ACTION, INITIAL). */
|
|
|
|
static char const *
|
|
translate_action (code_props *self, int sc_context)
|
|
{
|
|
char *res;
|
|
static bool initialized = false;
|
|
if (!initialized)
|
|
{
|
|
obstack_init (&obstack_for_string);
|
|
yy_flex_debug = 0;
|
|
initialized = true;
|
|
}
|
|
|
|
loc->start = loc->end = self->location.start;
|
|
yy_switch_to_buffer (yy_scan_string (self->code));
|
|
res = code_lex (self, sc_context);
|
|
yy_delete_buffer (YY_CURRENT_BUFFER);
|
|
|
|
return res;
|
|
}
|
|
|
|
/*------------------------------------------------------------------------.
|
|
| Implementation of the public interface as documented in "scan-code.h". |
|
|
`------------------------------------------------------------------------*/
|
|
|
|
void
|
|
code_props_none_init (code_props *self)
|
|
{
|
|
*self = code_props_none;
|
|
}
|
|
|
|
code_props const code_props_none = CODE_PROPS_NONE_INIT;
|
|
|
|
void
|
|
code_props_plain_init (code_props *self, char const *code, location code_loc)
|
|
{
|
|
self->kind = CODE_PROPS_PLAIN;
|
|
self->code = code;
|
|
self->location = code_loc;
|
|
self->is_value_used = false;
|
|
self->rule = NULL;
|
|
}
|
|
|
|
void
|
|
code_props_symbol_action_init (code_props *self, char const *code,
|
|
location code_loc)
|
|
{
|
|
self->kind = CODE_PROPS_SYMBOL_ACTION;
|
|
self->code = code;
|
|
self->location = code_loc;
|
|
self->is_value_used = false;
|
|
self->rule = NULL;
|
|
}
|
|
|
|
void
|
|
code_props_rule_action_init (code_props *self, char const *code,
|
|
location code_loc, symbol_list *rule)
|
|
{
|
|
self->kind = CODE_PROPS_RULE_ACTION;
|
|
self->code = code;
|
|
self->location = code_loc;
|
|
self->is_value_used = false;
|
|
self->rule = rule;
|
|
}
|
|
|
|
void
|
|
code_props_translate_code (code_props *self)
|
|
{
|
|
switch (self->kind)
|
|
{
|
|
case CODE_PROPS_NONE:
|
|
break;
|
|
case CODE_PROPS_PLAIN:
|
|
self->code = translate_action (self, INITIAL);
|
|
break;
|
|
case CODE_PROPS_SYMBOL_ACTION:
|
|
self->code = translate_action (self, SC_SYMBOL_ACTION);
|
|
break;
|
|
case CODE_PROPS_RULE_ACTION:
|
|
self->code = translate_action (self, SC_RULE_ACTION);
|
|
break;
|
|
}
|
|
}
|
|
|
|
void
|
|
code_scanner_last_string_free (void)
|
|
{
|
|
STRING_FREE;
|
|
}
|
|
|
|
void
|
|
code_scanner_free (void)
|
|
{
|
|
obstack_free (&obstack_for_string, 0);
|
|
/* Reclaim Flex's buffers. */
|
|
yylex_destroy ();
|
|
}
|