Baptiste Daroussin 0c8de5b03c Update to byacc 20140409
Among all the modifications, this new byacc also solves a 14 year old bug [1]

PR:		bin/23254 [1]
Submitted by:	marka@nominum.com [1]
MFC after:	3 weeks
2014-04-23 05:57:45 +00:00

3307 lines
57 KiB
C

/* $Id: reader.c,v 1.47 2014/04/09 21:09:27 tom Exp $ */
#include "defs.h"
/* The line size must be a positive integer. One hundred was chosen */
/* because few lines in Yacc input grammars exceed 100 characters. */
/* Note that if a line exceeds LINESIZE characters, the line buffer */
/* will be expanded to accommodate it. */
#define LINESIZE 100
/* Bracketing characters the reader tests for while scanning the grammar. */
#define L_CURL '{'
#define R_CURL '}'
#define L_PAREN '('
#define R_PAREN ')'
#define L_BRAC '['
#define R_BRAC ']'
/* the maximum number of arguments (inherited attributes) to a non-terminal */
/* this is a hard limit, but seems more than adequate */
#define MAXARGS 20
static void start_rule(bucket *bp, int s_lineno);
#if defined(YYBTYACC)
static void copy_destructor(void);
static char *process_destructor_XX(char *code, char *tag);
#endif
/* Scratch buffer filled one character at a time by cachec(): */
/* cinc is the next write index, cache_size the allocated size. */
static char *cache;
static int cinc, cache_size;
/* Table of interned type tags maintained by cache_tag(): ntags entries */
/* are in use, tagmax are allocated.  havetags is set once a tag is seen. */
int ntags;
static int tagmax, havetags;
static char **tag_table;
/* Latched by get_line() when the input file is exhausted. */
static char saw_eof;
/* Set by copy_union() once a %union has been copied. */
char unionized;
/* line is the current input line (ends in '\n', not NUL-terminated); */
/* cptr is the scan position within it; linesize is its allocated size. */
char *cptr, *line;
static int linesize;
/* Start symbol, set by declare_start() or advance_to_start(). */
static bucket *goal;
/* Current precedence level, bumped by declare_tokens(). */
static Value_t prec;
/* Counter used by insert_empty_rule() to name generated "$$N" symbols. */
static int gensym;
/* Nonzero while the most recent rule component was an action. */
static char last_was_action;
/* pitem holds the right-hand-side items of all rules (0 separates rules); */
/* maxitems is its allocated length. */
static int maxitems;
static bucket **pitem;
/* plhs holds the left-hand-side symbol of each rule; maxrules is its */
/* allocated length. */
static int maxrules;
static bucket **plhs;
/* NOTE(review): not referenced in the visible part of this file; */
/* presumably used when symbol names are packed later -- confirm. */
static size_t name_pool_size;
static char *name_pool;
/* printf format used to emit #line directives (line number, file name). */
char line_format[] = "#line %d \"%s\"\n";
/* Heads of the linked lists built by copy_param() for %lex-param and */
/* %parse-param. */
param *lex_param;
param *parse_param;
#if defined(YYBTYACC)
int destructor = 0; /* =1 if at least one %destructor */
/* Destructor buckets, indexed by the three constants below.  The */
/* TYPE_SPECIFIED slot heads a list chained through bucket->link, one */
/* entry per type tag (see lookup_type_destructor()). */
static bucket *default_destructor[3] =
{0, 0, 0};
#define UNTYPED_DEFAULT 0
#define TYPED_DEFAULT 1
#define TYPE_SPECIFIED 2
static bucket *
lookup_type_destructor(char *tag)
{
char name[1024] = "\0";
bucket *bp, **bpp = &default_destructor[TYPE_SPECIFIED];
while ((bp = *bpp) != NULL)
{
if (bp->tag == tag)
return (bp);
bpp = &bp->link;
}
*bpp = bp = make_bucket(strcat(strcpy(name, tag), " destructor"));
bp->tag = tag;
return (bp);
}
#endif /* defined(YYBTYACC) */
/*
 * Append the character `c' to the scratch cache.  When the write index
 * has reached the allocated size, the buffer is first enlarged by 256
 * bytes.
 */
static void
cachec(int c)
{
    assert(cinc >= 0);

    if (cache_size <= cinc)
    {
        cache_size += 256;
        cache = TREALLOC(char, cache, cache_size);
        NO_SPACE(cache);
    }

    cache[cinc++] = (char)c;
}
/*
 * Read the next input line into the global `line' buffer and point
 * `cptr' at its first character.
 *
 * The stored line always ends with '\n' (one is supplied when the file
 * ends without it); no NUL terminator is written.  Once the input is
 * exhausted the buffer is freed, `line' and `cptr' are set to 0 and
 * `saw_eof' is latched so later calls return immediately.
 */
static void
get_line(void)
{
FILE *f = input_file;
int c;
int i;
/* nothing left to read: release the buffer and signal EOF via line == 0 */
if (saw_eof || (c = getc(f)) == EOF)
{
if (line)
{
FREE(line);
line = 0;
}
cptr = 0;
saw_eof = 1;
return;
}
/* start every line with a default-sized buffer, discarding one that */
/* was grown for an earlier long line */
if (line == 0 || linesize != (LINESIZE + 1))
{
if (line)
FREE(line);
linesize = LINESIZE + 1;
line = TMALLOC(char, linesize);
NO_SPACE(line);
}
i = 0;
++lineno;
for (;;)
{
line[i] = (char)c;
if (c == '\n')
break;
/* grow before reading the next character so line[i] is always valid */
if (++i >= linesize)
{
linesize += LINESIZE;
line = TREALLOC(char, line, linesize);
NO_SPACE(line);
}
c = getc(f);
if (c == EOF)
{
/* last line had no newline: supply one */
line[i] = '\n';
saw_eof = 1;
break;
}
}
cptr = line;
return;
}
/*
 * Return a freshly allocated copy of the current input line, up to and
 * including its terminating '\n' (no NUL is appended).  Returns 0 when
 * there is no current line.  The caller owns the copy.
 */
static char *
dup_line(void)
{
    size_t len, k;
    char *copy;

    if (line == 0)
        return (0);

    /* count the characters before the newline, then include the newline */
    for (len = 0; line[len] != '\n'; ++len)
        continue;
    ++len;

    copy = TMALLOC(char, len);
    NO_SPACE(copy);
    for (k = 0; k < len; ++k)
        copy[k] = line[k];
    return (copy);
}
/*
 * Skip a C-style comment.  On entry `cptr' points at the opening
 * slash-star; on return it points just past the closing star-slash.
 * Further input lines are read as needed.  If the input ends first,
 * unterminated_comment() is called with the position where the comment
 * began.
 */
static void
skip_comment(void)
{
char *s;
/* remember where the comment started, for the error report */
int st_lineno = lineno;
char *st_line = dup_line();
char *st_cptr = st_line + (cptr - line);
/* step over the two-character opener */
s = cptr + 2;
for (;;)
{
if (*s == '*' && s[1] == '/')
{
cptr = s + 2;
FREE(st_line);
return;
}
if (*s == '\n')
{
get_line();
if (line == 0)
unterminated_comment(st_lineno, st_line, st_cptr);
s = cptr;
}
else
++s;
}
}
/*
 * Return the next significant input character without consuming it;
 * `cptr' is left pointing at that character.
 *
 * Blanks, form feeds, carriage returns, vertical tabs, commas and
 * semicolons are skipped, as are newlines (by reading further lines)
 * and both C-style and "//" comments.  A backslash is reported as '%'.
 * Returns EOF when the input is exhausted.
 */
static int
nextc(void)
{
char *s;
if (line == 0)
{
get_line();
if (line == 0)
return (EOF);
}
s = cptr;
for (;;)
{
switch (*s)
{
case '\n':
get_line();
if (line == 0)
return (EOF);
s = cptr;
break;
case ' ':
case '\t':
case '\f':
case '\r':
case '\v':
case ',':
case ';':
++s;
break;
case '\\':
/* backslash is accepted as a synonym for '%' */
cptr = s;
return ('%');
case '/':
if (s[1] == '*')
{
cptr = s;
skip_comment();
s = cptr;
break;
}
else if (s[1] == '/')
{
/* "//" comment: discard the rest of the line */
get_line();
if (line == 0)
return (EOF);
s = cptr;
break;
}
/* FALLTHRU */
default:
cptr = s;
return (*s);
}
}
}
/* *INDENT-OFF* */
/*
 * Directive names (as written after '%', lower-cased, with '_' mapped
 * to '-') and the token code each one yields.
 *
 * keyword() looks names up with bsearch(), so the entries must stay
 * sorted in strcmp() order.  `name' must remain the first member:
 * the search key handed to compare_keys() is a plain string.
 */
static struct keyword
{
char name[13];
int token;
}
keywords[] = {
{ "binary", NONASSOC },
#if defined(YYBTYACC)
{ "destructor", DESTRUCTOR },
#endif
{ "expect", EXPECT },
{ "expect-rr", EXPECT_RR },
{ "ident", IDENT },
{ "left", LEFT },
{ "lex-param", LEX_PARAM },
#if defined(YYBTYACC)
{ "locations", LOCATIONS },
#endif
{ "nonassoc", NONASSOC },
{ "parse-param", PARSE_PARAM },
{ "pure-parser", PURE_PARSER },
{ "right", RIGHT },
{ "start", START },
{ "term", TOKEN },
{ "token", TOKEN },
{ "token-table", TOKEN_TABLE },
{ "type", TYPE },
{ "union", UNION },
{ "yacc", POSIX_YACC },
};
/* *INDENT-ON* */
/*
 * bsearch() comparison callback for the keyword table: orders two
 * entries by their `name' strings using strcmp().
 */
static int
compare_keys(const void *a, const void *b)
{
    const char *lhs = ((const struct keyword *)a)->name;
    const char *rhs = ((const struct keyword *)b)->name;

    return strcmp(lhs, rhs);
}
/*
 * Decode the directive that follows the '%' (or '\') at `cptr'.
 *
 * An alphabetic directive name is folded to lower case, '_' is treated
 * as '-', and the result is looked up in the keyword table.  Otherwise
 * the single-character forms are recognized: %{ (TEXT), %% or %\ (MARK),
 * %< (LEFT), %> (RIGHT), %0 (TOKEN) and %2 (NONASSOC).
 *
 * Returns the token code.  An unrecognized directive is reported through
 * syntax_error(); -1 is returned should that call return.
 *
 * Characters are passed to the <ctype.h> classifiers through UCH(),
 * because plain char may be negative and such values are not valid
 * arguments to those functions.
 */
static int
keyword(void)
{
    int c;
    char *t_cptr = cptr;
    struct keyword *key;

    c = *++cptr;
    if (isalpha(UCH(c)))
    {
        cinc = 0;
        for (;;)
        {
            if (isalpha(UCH(c)))
            {
                if (isupper(UCH(c)))
                    c = tolower(UCH(c));
                cachec(c);
            }
            else if (isdigit(UCH(c))
                     || c == '-'
                     || c == '.'
                     || c == '$')
            {
                cachec(c);
            }
            else if (c == '_')
            {
                /* treat keywords spelled with '_' as if it were '-' */
                cachec('-');
            }
            else
            {
                break;
            }
            c = *++cptr;
        }
        cachec(NUL);

        /* the cached name serves directly as the search key */
        if ((key = bsearch(cache, keywords,
                           sizeof(keywords) / sizeof(*key),
                           sizeof(*key), compare_keys)))
            return key->token;
    }
    else
    {
        ++cptr;
        if (c == L_CURL)
            return (TEXT);
        if (c == '%' || c == '\\')
            return (MARK);
        if (c == '<')
            return (LEFT);
        if (c == '>')
            return (RIGHT);
        if (c == '0')
            return (TOKEN);
        if (c == '2')
            return (NONASSOC);
    }
    syntax_error(lineno, line, t_cptr);
    return (-1);
}
/*
 * Handle an %ident directive: the next token must be a double-quoted
 * string, which is written to output_file as a `#ident "..."' line.
 * If the input line ends before the closing quote, the quote is
 * supplied in the output.
 */
static void
copy_ident(void)
{
int c;
FILE *f = output_file;
c = nextc();
if (c == EOF)
unexpected_EOF();
if (c != '"')
syntax_error(lineno, line, cptr);
++outline;
fprintf(f, "#ident \"");
for (;;)
{
c = *++cptr;
if (c == '\n')
{
/* unterminated on this line: close the string ourselves */
fprintf(f, "\"\n");
return;
}
putc(c, f);
if (c == '"')
{
putc('\n', f);
++cptr;
return;
}
}
}
/*
 * Collect the remainder of a quoted string or character literal.
 *
 * On entry `cptr' points just past the opening quote character `quote'.
 * Characters are gathered up to and including the matching close quote,
 * and the result of msdone() is returned (callers in this file release
 * it with free()).  A backslash and the character after it are copied
 * as-is; backslash-newline continues the string on the next input line.
 * An unescaped newline or end of input is reported through
 * unterminated_string().
 */
static char *
copy_string(int quote)
{
struct mstring *temp = msnew();
int c;
int s_lineno = lineno;
char *s_line = dup_line();
/* -1: point the error position at the opening quote */
char *s_cptr = s_line + (cptr - line - 1);
for (;;)
{
c = *cptr++;
mputc(temp, c);
if (c == quote)
{
FREE(s_line);
return msdone(temp);
}
if (c == '\n')
unterminated_string(s_lineno, s_line, s_cptr);
if (c == '\\')
{
c = *cptr++;
mputc(temp, c);
if (c == '\n')
{
get_line();
if (line == 0)
unterminated_string(s_lineno, s_line, s_cptr);
}
}
}
}
/*
 * Collect a comment whose leading '/' has already been consumed.
 *
 * On entry `cptr' points at the character after that '/'.
 *  - If it is another '/', the rest of the line is gathered as a
 *    C-style comment body: a '*' is emitted first, a space is inserted
 *    after any '*' that is directly followed by '/', and a closing
 *    star-slash is appended.  `cptr' is left at the newline.
 *  - If it is '*', the comment is gathered through its closing
 *    star-slash, reading further lines as needed; end of input is
 *    reported through unterminated_comment().
 *  - Otherwise nothing is gathered.
 * Returns the result of msdone() (callers in this file free() it).
 */
static char *
copy_comment(void)
{
struct mstring *temp = msnew();
int c;
c = *cptr;
if (c == '/')
{
mputc(temp, '*');
while ((c = *++cptr) != '\n')
{
mputc(temp, c);
/* keep an embedded star-slash from ending the rewritten comment */
if (c == '*' && cptr[1] == '/')
mputc(temp, ' ');
}
mputc(temp, '*');
mputc(temp, '/');
}
else if (c == '*')
{
int c_lineno = lineno;
char *c_line = dup_line();
/* -1: point the error position at the '/' consumed by the caller */
char *c_cptr = c_line + (cptr - line - 1);
mputc(temp, c);
++cptr;
for (;;)
{
c = *cptr++;
mputc(temp, c);
if (c == '*' && *cptr == '/')
{
mputc(temp, '/');
++cptr;
FREE(c_line);
return msdone(temp);
}
if (c == '\n')
{
get_line();
if (line == 0)
unterminated_comment(c_lineno, c_line, c_cptr);
}
}
}
return msdone(temp);
}
/*
 * Copy a %{ ... %} block to text_file.
 *
 * On entry `cptr' points just past the "%{".  A #line directive is
 * written first unless lflag is set.  String literals and comments are
 * copied through copy_string() and copy_comment(), so a "%}" inside
 * them does not end the block.  The block ends at "%}" (or "\}"); end of
 * input before that is reported through unterminated_text().
 */
static void
copy_text(void)
{
int c;
FILE *f = text_file;
/* nonzero when output since the last newline would leave a partial line */
int need_newline = 0;
int t_lineno = lineno;
char *t_line = dup_line();
/* -2: point the error position at the "%{" */
char *t_cptr = t_line + (cptr - line - 2);
/* nothing follows "%{" on its line: start copying from the next line */
if (*cptr == '\n')
{
get_line();
if (line == 0)
unterminated_text(t_lineno, t_line, t_cptr);
}
if (!lflag)
fprintf(f, line_format, lineno, input_file_name);
loop:
c = *cptr++;
switch (c)
{
case '\n':
putc('\n', f);
need_newline = 0;
get_line();
if (line)
goto loop;
unterminated_text(t_lineno, t_line, t_cptr);
case '\'':
case '"':
putc(c, f);
{
char *s = copy_string(c);
fputs(s, f);
free(s);
}
need_newline = 1;
goto loop;
case '/':
putc(c, f);
{
char *s = copy_comment();
fputs(s, f);
free(s);
}
need_newline = 1;
goto loop;
case '%':
case '\\':
if (*cptr == R_CURL)
{
if (need_newline)
putc('\n', f);
++cptr;
FREE(t_line);
return;
}
/* FALLTHRU */
default:
putc(c, f);
need_newline = 1;
goto loop;
}
}
/*
 * Write the string `s' to text_file and, when dflag is set, to
 * union_file as well.
 */
static void
puts_both(const char *s)
{
    fputs(s, text_file);
    if (!dflag)
        return;
    fputs(s, union_file);
}
/*
 * Write the character `c' to text_file and, when dflag is set, to
 * union_file as well.
 */
static void
putc_both(int c)
{
    putc(c, text_file);
    if (!dflag)
        return;
    putc(c, union_file);
}
/*
 * Copy a %union declaration, emitting it as `typedef union ... YYSTYPE;'
 * guarded by YYSTYPE_IS_DECLARED.
 *
 * Output goes to text_file and, when dflag is set, also to union_file
 * (see puts_both()/putc_both()); the #line directive goes to text_file
 * only.  A second %union is reported through over_unionized().  The
 * union body ends at the '}' that balances the first '{'; strings and
 * comments are copied through copy_string()/copy_comment() so braces
 * inside them are not counted.  End of input before the closing brace
 * is reported through unterminated_union().
 */
static void
copy_union(void)
{
int c;
int depth;
int u_lineno = lineno;
char *u_line = dup_line();
/* -6: step back over the six characters of "%union" */
char *u_cptr = u_line + (cptr - line - 6);
if (unionized)
over_unionized(cptr - 6);
unionized = 1;
if (!lflag)
fprintf(text_file, line_format, lineno, input_file_name);
puts_both("#ifdef YYSTYPE\n");
puts_both("#undef YYSTYPE_IS_DECLARED\n");
puts_both("#define YYSTYPE_IS_DECLARED 1\n");
puts_both("#endif\n");
puts_both("#ifndef YYSTYPE_IS_DECLARED\n");
puts_both("#define YYSTYPE_IS_DECLARED 1\n");
puts_both("typedef union");
depth = 0;
loop:
c = *cptr++;
putc_both(c);
switch (c)
{
case '\n':
get_line();
if (line == 0)
unterminated_union(u_lineno, u_line, u_cptr);
goto loop;
case L_CURL:
++depth;
goto loop;
case R_CURL:
/* the brace that closes the outermost level ends the union */
if (--depth == 0)
{
puts_both(" YYSTYPE;\n");
puts_both("#endif /* !YYSTYPE_IS_DECLARED */\n");
FREE(u_line);
return;
}
goto loop;
case '\'':
case '"':
{
char *s = copy_string(c);
puts_both(s);
free(s);
}
goto loop;
case '/':
{
char *s = copy_comment();
puts_both(s);
free(s);
}
goto loop;
default:
goto loop;
}
}
/*
* Keep a linked list of parameters
*/
/*
 * Parse the `{ type name }' argument of a %lex-param or %parse-param
 * directive and append it to the matching parameter list.
 *
 * k selects the list: LEX_PARAM appends to lex_param, anything else to
 * parse_param.
 *
 * The text between the braces is split into three strings: the type
 * (everything before the name), the name (the trailing identifier), and
 * an optional trailing array suffix in square brackets (type2).  The
 * type string keeps ownership of the working buffer.
 *
 * Malformed input is reported through syntax_error(), missing_brace()
 * or unexpected_EOF().
 *
 * Input lines end in '\n' and carry no NUL terminator, so the scan for
 * the closing brace treats a newline as a missing brace as well.
 * Without that check a declaration lacking '}' on its line would read
 * past the end of the line buffer and write past the end of `buf'.
 */
static void
copy_param(int k)
{
    char *buf;
    int c;
    param *head, *p;
    int i;
    int name, type2;

    c = nextc();
    if (c == EOF)
        unexpected_EOF();
    if (c != L_CURL)
        goto out;
    cptr++;

    c = nextc();
    if (c == EOF)
        unexpected_EOF();
    if (c == R_CURL)
        goto out;

    /* the declaration lies within the current line, so linesize suffices */
    buf = TMALLOC(char, linesize);
    NO_SPACE(buf);

    for (i = 0; (c = *cptr++) != R_CURL; i++)
    {
        if (c == '\0' || c == '\n')
            missing_brace();
        if (c == EOF)
            unexpected_EOF();
        buf[i] = (char)c;
    }

    if (i == 0)
        goto out;

    /* terminate, then trim trailing white space */
    buf[i--] = '\0';
    while (i > 0 && isspace(UCH(buf[i])))
        buf[i--] = '\0';

    if (buf[i] == ']')
    {
        /* trailing array suffix: back up to its opening bracket */
        int level = 1;
        while (i >= 0 && level > 0 && buf[i] != '[')
        {
            if (buf[i] == ']')
                ++level;
            else if (buf[i] == '[')
                --level;
            i--;
        }
        if (i <= 0)
            unexpected_EOF();
        type2 = i--;
    }
    else
    {
        type2 = i + 1;
    }

    /* back up over the parameter name */
    while (i > 0 && (isalnum(UCH(buf[i])) ||
                     UCH(buf[i]) == '_'))
        i--;

    /* the name must be preceded by white space or a '*' */
    if (!isspace(UCH(buf[i])) && buf[i] != '*')
        goto out;

    name = i + 1;

    p = TMALLOC(param, 1);
    NO_SPACE(p);

    /* cut the buffer from the right: suffix, then name, leaving the type */
    p->type2 = strdup(buf + type2);
    NO_SPACE(p->type2);

    buf[type2] = '\0';
    p->name = strdup(buf + name);
    NO_SPACE(p->name);

    buf[name] = '\0';
    p->type = buf;

    if (k == LEX_PARAM)
        head = lex_param;
    else
        head = parse_param;

    if (head != NULL)
    {
        while (head->next)
            head = head->next;
        head->next = p;
    }
    else
    {
        if (k == LEX_PARAM)
            lex_param = p;
        else
            parse_param = p;
    }
    p->next = NULL;
    return;

  out:
    syntax_error(lineno, line, cptr);
}
/*
 * Return the numeric value (0..15) of the hexadecimal digit `c', or -1
 * if `c' is not a hexadecimal digit.  Both letter cases are accepted.
 */
static int
hexval(int c)
{
    int digit = -1;

    if ('0' <= c && c <= '9')
        digit = c - '0';
    else if ('A' <= c && c <= 'F')
        digit = 10 + (c - 'A');
    else if ('a' <= c && c <= 'f')
        digit = 10 + (c - 'a');

    return (digit);
}
/*
 * Read a quoted literal token ('c' or "string") starting at `cptr' and
 * return its symbol-table entry.
 *
 * The literal is decoded first (octal, hex and the usual C escapes;
 * backslash-newline continues on the next line), then re-encoded into a
 * canonical spelling that is used as the symbol name: single-character
 * literals are wrapped in single quotes, all others in double quotes,
 * and non-printing characters are written as escapes.  The bucket's
 * class is set to TERM; for a single-character literal whose value is
 * still UNDEFINED the value becomes that character code.
 *
 * An unescaped newline or end of input is reported through
 * unterminated_string(); an escape whose value exceeds MAXCHAR, or an
 * \x with no hex digit, through illegal_character().
 */
static bucket *
get_literal(void)
{
int c, quote;
int i;
int n;
char *s;
bucket *bp;
int s_lineno = lineno;
char *s_line = dup_line();
char *s_cptr = s_line + (cptr - line);
quote = *cptr++;
cinc = 0;
/* pass 1: decode the literal's characters into the cache */
for (;;)
{
c = *cptr++;
if (c == quote)
break;
if (c == '\n')
unterminated_string(s_lineno, s_line, s_cptr);
if (c == '\\')
{
/* position of the backslash, for error reports */
char *c_cptr = cptr - 1;
c = *cptr++;
switch (c)
{
case '\n':
get_line();
if (line == 0)
unterminated_string(s_lineno, s_line, s_cptr);
continue;
case '0':
case '1':
case '2':
case '3':
case '4':
case '5':
case '6':
case '7':
/* up to three octal digits */
n = c - '0';
c = *cptr;
if (IS_OCTAL(c))
{
n = (n << 3) + (c - '0');
c = *++cptr;
if (IS_OCTAL(c))
{
n = (n << 3) + (c - '0');
++cptr;
}
}
if (n > MAXCHAR)
illegal_character(c_cptr);
c = n;
break;
case 'x':
/* one or more hex digits */
c = *cptr++;
n = hexval(c);
if (n < 0 || n >= 16)
illegal_character(c_cptr);
for (;;)
{
c = *cptr;
i = hexval(c);
if (i < 0 || i >= 16)
break;
++cptr;
n = (n << 4) + i;
if (n > MAXCHAR)
illegal_character(c_cptr);
}
c = n;
break;
case 'a':
c = 7;
break;
case 'b':
c = '\b';
break;
case 'f':
c = '\f';
break;
case 'n':
c = '\n';
break;
case 'r':
c = '\r';
break;
case 't':
c = '\t';
break;
case 'v':
c = '\v';
break;
/* any other escaped character stands for itself */
}
}
cachec(c);
}
FREE(s_line);
/* save the decoded bytes; the cache is reused for the canonical name */
n = cinc;
s = TMALLOC(char, n);
NO_SPACE(s);
for (i = 0; i < n; ++i)
s[i] = cache[i];
/* pass 2: build the canonical quoted spelling */
cinc = 0;
if (n == 1)
cachec('\'');
else
cachec('"');
for (i = 0; i < n; ++i)
{
c = UCH(s[i]);
/* escape backslashes and the quote character chosen above */
if (c == '\\' || c == cache[0])
{
cachec('\\');
cachec(c);
}
else if (isprint(c))
cachec(c);
else
{
cachec('\\');
switch (c)
{
case 7:
cachec('a');
break;
case '\b':
cachec('b');
break;
case '\f':
cachec('f');
break;
case '\n':
cachec('n');
break;
case '\r':
cachec('r');
break;
case '\t':
cachec('t');
break;
case '\v':
cachec('v');
break;
default:
/* three-digit octal escape */
cachec(((c >> 6) & 7) + '0');
cachec(((c >> 3) & 7) + '0');
cachec((c & 7) + '0');
break;
}
}
}
if (n == 1)
cachec('\'');
else
cachec('"');
cachec(NUL);
bp = lookup(cache);
bp->class = TERM;
if (n == 1 && bp->value == UNDEFINED)
bp->value = UCH(*s);
FREE(s);
return (bp);
}
/*
 * Return 1 if `name' is reserved, otherwise 0.  The reserved names are
 * ".", "$accept", "$end", and any name consisting of "$$" followed by
 * one or more decimal digits.
 */
static int
is_reserved(char *name)
{
    static const char *const fixed[] = { ".", "$accept", "$end" };
    size_t k;
    char *digits;

    for (k = 0; k < sizeof(fixed) / sizeof(fixed[0]); ++k)
    {
        if (strcmp(name, fixed[k]) == 0)
            return (1);
    }

    /* remaining case: "$$" plus digits only */
    if (name[0] != '$' || name[1] != '$' || !isdigit(UCH(name[2])))
        return (0);

    digits = name + 3;
    while (isdigit(UCH(*digits)))
        ++digits;

    return (*digits == NUL) ? 1 : 0;
}
/*
 * Read the identifier starting at `cptr' (characters accepted by
 * IS_IDENT) and return its symbol-table entry via lookup().  `cptr' is
 * left at the first character after the name.  A reserved name is
 * reported through used_reserved().
 */
static bucket *
get_name(void)
{
    int c = *cptr;

    cinc = 0;
    while (IS_IDENT(c))
    {
        cachec(c);
        c = *++cptr;
    }
    cachec(NUL);

    if (is_reserved(cache))
        used_reserved(cache);

    return (lookup(cache));
}
/*
 * Read the unsigned decimal number starting at `cptr' and return its
 * value; `cptr' is left at the first non-digit.  Returns 0 if `cptr'
 * does not point at a digit.
 *
 * Each character is passed to isdigit() through UCH(), because plain
 * char may be negative and such values are not valid arguments to the
 * <ctype.h> functions.
 */
static Value_t
get_number(void)
{
    int c;
    Value_t n;

    n = 0;
    for (c = *cptr; isdigit(UCH(c)); c = *++cptr)
        n = (Value_t) (10 * n + (c - '0'));

    return (n);
}
/*
 * Intern a type tag: return the tag_table entry equal to the first
 * `len' characters of `tag', adding a new entry if there is none.
 *
 * Because equal tags share one table entry, callers may compare the
 * returned pointers directly.
 *
 * `len' is first reduced to the number of characters that precede any
 * NUL within tag[0..len).  get_tag() passes a count that includes the
 * terminator it cached; without the reduction, comparing such a key
 * against a shorter entry examined tag_table[i][len], one byte past the
 * end of that entry's allocation.  After the reduction every compared
 * prefix character is non-NUL, so index `len' always lies within the
 * entry's string.
 */
static char *
cache_tag(char *tag, size_t len)
{
    int i;
    char *s;
    size_t n;

    for (n = 0; n < len && tag[n] != NUL; ++n)
        continue;
    len = n;

    for (i = 0; i < ntags; ++i)
    {
        if (strncmp(tag, tag_table[i], len) == 0 &&
            tag_table[i][len] == NUL)
            return (tag_table[i]);
    }

    /* grow the table 16 slots at a time */
    if (ntags >= tagmax)
    {
        tagmax += 16;
        tag_table =
            (tag_table
             ? TREALLOC(char *, tag_table, tagmax)
             : TMALLOC(char *, tagmax));
        NO_SPACE(tag_table);
    }

    s = TMALLOC(char, len + 1);
    NO_SPACE(s);

    strncpy(s, tag, len);
    s[len] = 0;
    tag_table[ntags++] = s;
    return s;
}
/*
 * Read a type tag of the form <name> and return its interned string
 * from cache_tag().
 *
 * On entry `cptr' points at the '<'; on return it points just past the
 * '>'.  The name must start with a letter, '_' or '$' and continues
 * with IS_IDENT characters.  Anything else, including a missing '>', is
 * reported through illegal_tag().  Sets havetags.
 */
static char *
get_tag(void)
{
int c;
int t_lineno = lineno;
char *t_line = dup_line();
char *t_cptr = t_line + (cptr - line);
/* step over the '<' */
++cptr;
c = nextc();
if (c == EOF)
unexpected_EOF();
if (!isalpha(c) && c != '_' && c != '$')
illegal_tag(t_lineno, t_line, t_cptr);
cinc = 0;
do
{
cachec(c);
c = *++cptr;
}
while (IS_IDENT(c));
cachec(NUL);
c = nextc();
if (c == EOF)
unexpected_EOF();
if (c != '>')
illegal_tag(t_lineno, t_line, t_cptr);
++cptr;
FREE(t_line);
havetags = 1;
/* note: cinc also counts the NUL cached above */
return cache_tag(cache, (size_t) cinc);
}
#if defined(YYBTYACC)
/*
 * Scan the identifier starting at `cptr' (letters, digits, '_' and '$')
 * and return its interned string from cache_tag().  `cptr' is left at
 * the first character after the identifier.
 *
 * Characters are passed to isalnum() through UCH(), because plain char
 * may be negative and such values are not valid arguments to the
 * <ctype.h> functions.
 */
static char *
scan_id(void)
{
    char *b = cptr;

    while (isalnum(UCH(*cptr)) || *cptr == '_' || *cptr == '$')
        cptr++;
    return cache_tag(b, (size_t) (cptr - b));
}
#endif
/*
 * Handle %token, %left, %right and %nonassoc.
 *
 * `assoc' is the directive's token code.  For anything but TOKEN a new
 * precedence level is started and each listed symbol receives that
 * level and associativity.  An optional <tag> applies to every symbol
 * in the list, and each symbol may be followed by an explicit numeric
 * value.  The list ends at the first character that cannot start a name
 * or literal.  Conflicting redeclarations produce warnings.
 */
static void
declare_tokens(int assoc)
{
int c;
bucket *bp;
Value_t value;
char *tag = 0;
if (assoc != TOKEN)
++prec;
c = nextc();
if (c == EOF)
unexpected_EOF();
if (c == '<')
{
tag = get_tag();
c = nextc();
if (c == EOF)
unexpected_EOF();
}
for (;;)
{
if (isalpha(c) || c == '_' || c == '.' || c == '$')
bp = get_name();
else if (c == '\'' || c == '"')
bp = get_literal();
else
return;
/* the start symbol may not be declared as a token */
if (bp == goal)
tokenized_start(bp->name);
bp->class = TERM;
if (tag)
{
/* tags are interned, so pointer comparison suffices */
if (bp->tag && tag != bp->tag)
retyped_warning(bp->name);
bp->tag = tag;
}
if (assoc != TOKEN)
{
if (bp->prec && prec != bp->prec)
reprec_warning(bp->name);
bp->assoc = (Assoc_t) assoc;
bp->prec = prec;
}
c = nextc();
if (c == EOF)
unexpected_EOF();
/* optional explicit token value */
if (isdigit(c))
{
value = get_number();
if (bp->value != UNDEFINED && value != bp->value)
revalued_warning(bp->name);
bp->value = value;
c = nextc();
if (c == EOF)
unexpected_EOF();
}
}
}
/*
* %expect requires special handling
* as it really isn't part of the yacc
* grammar only a flag for yacc proper.
*/
/*
 * Handle %expect and %expect-rr: read the number that follows on the
 * same line and store it in SRexpect (for EXPECT) or RRexpect
 * (otherwise).  Only white space may precede the number; a newline or
 * any other character before it is reported through syntax_error().
 */
static void
declare_expect(int assoc)
{
int c;
if (assoc != EXPECT && assoc != EXPECT_RR)
++prec;
/*
 * Stay away from nextc - doesn't
 * detect EOL and will read to EOF.
 */
c = *++cptr;
if (c == EOF)
unexpected_EOF();
for (;;)
{
if (isdigit(c))
{
if (assoc == EXPECT)
SRexpect = get_number();
else
RRexpect = get_number();
break;
}
/*
 * Looking for number before EOL.
 * Spaces, tabs, and numbers are ok,
 * words, punc., etc. are syntax errors.
 */
else if (c == '\n' || isalpha(c) || !isspace(c))
{
syntax_error(lineno, line, cptr);
}
else
{
c = *++cptr;
if (c == EOF)
unexpected_EOF();
}
}
}
#if defined(YYBTYACC)
/*
 * Read the parenthesized list of argument type tags that follows a
 * nonterminal in a %type declaration, e.g. `name(<t1> <t2>)', and
 * record it in the bucket `bp'.
 *
 * On entry `cptr' points at the '('; on return it points just past the
 * ')'.  bp->args is set to the number of tags, bp->argtags to the tags,
 * and bp->argnames to an array of NULLs.  A symbol whose argument count
 * was already set (args >= 0) triggers retyped_warning().
 *
 * At most MAXARGS tags fit in the local array; a longer list is
 * rejected through syntax_error() before anything is stored past the
 * end.  As with the other checks in this loop, syntax_error() is relied
 * on not to return.
 */
static void
declare_argtypes(bucket *bp)
{
    char *tags[MAXARGS];
    int args = 0, c;

    if (bp->args >= 0)
        retyped_warning(bp->name);
    cptr++;                     /* skip open paren */
    for (;;)
    {
        c = nextc();
        if (c == EOF)
            unexpected_EOF();
        if (c != '<')
            syntax_error(lineno, line, cptr);
        if (args >= MAXARGS)
            syntax_error(lineno, line, cptr);
        tags[args++] = get_tag();
        c = nextc();
        if (c == R_PAREN)
            break;
        if (c == EOF)
            unexpected_EOF();
    }
    cptr++;                     /* skip close paren */
    bp->args = args;
    bp->argnames = TMALLOC(char *, args);
    NO_SPACE(bp->argnames);
    bp->argtags = CALLOC(sizeof(char *), args + 1);
    NO_SPACE(bp->argtags);
    while (--args >= 0)
    {
        bp->argtags[args] = tags[args];
        bp->argnames[args] = NULL;
    }
}
#endif
/*
 * Handle %type: an optional <tag> followed by a list of names and
 * literals, each of which receives the tag.  The list ends at the first
 * character that cannot start a name or literal.  A symbol that already
 * carries a different tag produces retyped_warning().
 *
 * With YYBTYACC, a name may be followed by a parenthesized list of
 * argument tags (see declare_argtypes()); otherwise its argument count
 * is set to 0.
 */
static void
declare_types(void)
{
int c;
bucket *bp;
char *tag = NULL;
c = nextc();
if (c == EOF)
unexpected_EOF();
if (c == '<')
tag = get_tag();
for (;;)
{
c = nextc();
if (c == EOF)
unexpected_EOF();
if (isalpha(c) || c == '_' || c == '.' || c == '$')
{
bp = get_name();
#if defined(YYBTYACC)
if (nextc() == L_PAREN)
declare_argtypes(bp);
else
bp->args = 0;
#endif
}
else if (c == '\'' || c == '"')
{
bp = get_literal();
#if defined(YYBTYACC)
bp->args = 0;
#endif
}
else
return;
if (tag)
{
/* tags are interned, so pointer comparison suffices */
if (bp->tag && tag != bp->tag)
retyped_warning(bp->name);
bp->tag = tag;
}
}
}
/*
 * Handle %start: read the symbol name that follows and record it as the
 * grammar's goal.  A name that is already a terminal is reported
 * through terminal_start(); replacing an earlier, different goal
 * produces restarted_warning().
 */
static void
declare_start(void)
{
    bucket *sym;
    int ch = nextc();

    if (ch == EOF)
        unexpected_EOF();
    if (!(isalpha(ch) || ch == '_' || ch == '.' || ch == '$'))
        syntax_error(lineno, line, cptr);

    sym = get_name();
    if (sym->class == TERM)
        terminal_start(sym->name);
    if (goal != 0 && goal != sym)
        restarted_warning();
    goal = sym;
}
/*
 * Read the declarations section of the grammar file.
 *
 * Allocates the scratch cache, then repeatedly expects a '%' directive
 * and dispatches on it until the %% mark is seen.  End of input before
 * the mark is reported through unexpected_EOF(); anything other than a
 * directive through syntax_error().
 */
static void
read_declarations(void)
{
int c, k;
cache_size = 256;
cache = TMALLOC(char, cache_size);
NO_SPACE(cache);
for (;;)
{
c = nextc();
if (c == EOF)
unexpected_EOF();
if (c != '%')
syntax_error(lineno, line, cptr);
switch (k = keyword())
{
case MARK:
/* %% ends the declarations section */
return;
case IDENT:
copy_ident();
break;
case TEXT:
copy_text();
break;
case UNION:
copy_union();
break;
case TOKEN:
case LEFT:
case RIGHT:
case NONASSOC:
declare_tokens(k);
break;
case EXPECT:
case EXPECT_RR:
declare_expect(k);
break;
case TYPE:
declare_types();
break;
case START:
declare_start();
break;
case PURE_PARSER:
pure_parser = 1;
break;
case PARSE_PARAM:
case LEX_PARAM:
copy_param(k);
break;
case TOKEN_TABLE:
token_table = 1;
break;
#if defined(YYBTYACC)
case LOCATIONS:
locations = 1;
break;
case DESTRUCTOR:
destructor = 1;
copy_destructor();
break;
#endif
case POSIX_YACC:
/* noop for bison compatibility. byacc is already designed to be posix
 * yacc compatible. */
break;
}
}
}
/*
 * Allocate the item and rule tables with their initial capacities and
 * fill in the leading entries: the first four items are 0, and the
 * first three rules have a 0 left-hand side, precedence 0 and
 * associativity TOKEN.  nitems starts at 4 and nrules at 3.
 */
static void
initialize_grammar(void)
{
    int k;

    maxitems = 300;
    pitem = TMALLOC(bucket *, maxitems);
    NO_SPACE(pitem);
    for (k = 0; k < 4; ++k)
        pitem[k] = 0;
    nitems = 4;

    maxrules = 100;
    plhs = TMALLOC(bucket *, maxrules);
    NO_SPACE(plhs);
    rprec = TMALLOC(Value_t, maxrules);
    NO_SPACE(rprec);
    rassoc = TMALLOC(Assoc_t, maxrules);
    NO_SPACE(rassoc);
    for (k = 0; k < 3; ++k)
    {
        plhs[k] = 0;
        rprec[k] = 0;
        rassoc[k] = TOKEN;
    }
    nrules = 3;
}
/*
 * Enlarge the item table by 300 entries.
 */
static void
expand_items(void)
{
    maxitems = maxitems + 300;
    pitem = TREALLOC(bucket *, pitem, maxitems);
    NO_SPACE(pitem);
}
/*
 * Enlarge the three per-rule tables (left-hand sides, precedences and
 * associativities) by 100 entries each.
 */
static void
expand_rules(void)
{
    maxrules = maxrules + 100;

    plhs = TREALLOC(bucket *, plhs, maxrules);
    NO_SPACE(plhs);

    rprec = TREALLOC(Value_t, rprec, maxrules);
    NO_SPACE(rprec);

    rassoc = TREALLOC(Assoc_t, rassoc, maxrules);
    NO_SPACE(rassoc);
}
/* set immediately prior to where copy_args() could be called, and incremented by
the various routines that will rescan the argument list as appropriate */
static int rescan_lineno;
#if defined(YYBTYACC)
/*
 * Collect a parenthesized argument list.
 *
 * On entry `cptr' points just past the opening '('; on return it points
 * just past the matching ')'.  Top-level commas (outside quotes and
 * nested parentheses) are replaced by NUL bytes, so the returned buffer
 * holds the arguments as consecutive strings.  If `alen' is non-NULL it
 * receives the number of arguments, which is one more than the number
 * of top-level commas.  Returns the result of msdone().
 *
 * End of input inside the list is reported through
 * unterminated_string() or unterminated_arglist().
 */
static char *
copy_args(int *alen)
{
struct mstring *s = msnew();
int depth = 0, len = 1;
char c, quote = 0;
int a_lineno = lineno;
char *a_line = dup_line();
/* -1: point the error position at the opening parenthesis */
char *a_cptr = a_line + (cptr - line - 1);
while ((c = *cptr++) != R_PAREN || depth || quote)
{
if (c == ',' && !quote && !depth)
{
/* argument separator */
len++;
mputc(s, 0);
continue;
}
mputc(s, c);
if (c == '\n')
{
get_line();
if (!line)
{
if (quote)
unterminated_string(a_lineno, a_line, a_cptr);
else
unterminated_arglist(a_lineno, a_line, a_cptr);
}
}
else if (quote)
{
if (c == quote)
quote = 0;
else if (c == '\\')
{
/* copy the escaped character, unless it is a newline */
if (*cptr != '\n')
mputc(s, *cptr++);
}
}
else
{
if (c == L_PAREN)
depth++;
else if (c == R_PAREN)
depth--;
else if (c == '\"' || c == '\'')
quote = c;
}
}
if (alen)
*alen = len;
FREE(a_line);
return msdone(s);
}
/*
 * Parse an identifier from the string `p'.
 *
 * Leading white space is skipped, counting newlines in rescan_lineno.
 * The identifier must start with a letter or '_' and continues with
 * letters, digits, '_' or '$'.  If `save' is non-NULL it receives the
 * interned identifier from cache_tag().
 *
 * Returns a pointer just past the identifier, or NULL if none is
 * present.
 *
 * Characters are passed to the <ctype.h> classifiers through UCH(),
 * because plain char may be negative and such values are not valid
 * arguments to those functions.
 */
static char *
parse_id(char *p, char **save)
{
    char *b;

    while (isspace(UCH(*p)))
        if (*p++ == '\n')
            rescan_lineno++;
    if (!isalpha(UCH(*p)) && *p != '_')
        return NULL;
    b = p;
    while (isalnum(UCH(*p)) || *p == '_' || *p == '$')
        p++;
    if (save)
    {
        *save = cache_tag(b, (size_t) (p - b));
    }
    return p;
}
/*
 * Parse an optionally negative decimal integer from the string `p'.
 *
 * Leading white space is skipped, counting newlines in rescan_lineno.
 * If `save' is non-NULL it receives the value.
 *
 * Returns a pointer just past the digits, or NULL if no digit is
 * present.
 *
 * Characters are passed to the <ctype.h> classifiers through UCH(),
 * because plain char may be negative and such values are not valid
 * arguments to those functions.
 */
static char *
parse_int(char *p, int *save)
{
    int neg = 0, val = 0;

    while (isspace(UCH(*p)))
        if (*p++ == '\n')
            rescan_lineno++;
    if (*p == '-')
    {
        neg = 1;
        p++;
    }
    if (!isdigit(UCH(*p)))
        return NULL;
    while (isdigit(UCH(*p)))
        val = val * 10 + *p++ - '0';
    if (neg)
        val = -val;
    if (save)
        *save = val;
    return p;
}
/*
 * Record the formal arguments of nonterminal `a' from `args', a buffer
 * of `argslen' consecutive NUL-terminated strings as produced by
 * copy_args().
 *
 * Each argument has the form `$name' or `$<tag>name'.  If `a' already
 * has arguments this is treated as a redeclaration: the count and tags
 * are checked against the earlier ones (warnings on mismatch) and the
 * names are overwritten.  Otherwise the name and tag arrays are
 * allocated here.  Malformed arguments are reported through
 * bad_formals().  `args' is freed at the end of the full parse.
 */
static void
parse_arginfo(bucket *a, char *args, int argslen)
{
char *p = args, *tmp;
int i, redec = 0;
if (a->args > 0)
{
if (a->args != argslen)
arg_number_disagree_warning(rescan_lineno, a->name);
redec = 1;
}
else
{
if ((a->args = argslen) == 0)
return;
a->argnames = TMALLOC(char *, argslen);
NO_SPACE(a->argnames);
a->argtags = TMALLOC(char *, argslen);
NO_SPACE(a->argtags);
}
if (!args)
return;
for (i = 0; i < argslen; i++)
{
while (isspace(*p))
if (*p++ == '\n')
rescan_lineno++;
/* every formal starts with '$' */
if (*p++ != '$')
bad_formals();
while (isspace(*p))
if (*p++ == '\n')
rescan_lineno++;
/* optional <tag> */
if (*p == '<')
{
havetags = 1;
if (!(p = parse_id(p + 1, &tmp)))
bad_formals();
while (isspace(*p))
if (*p++ == '\n')
rescan_lineno++;
if (*p++ != '>')
bad_formals();
if (redec)
{
/* tags are interned, so pointer comparison suffices */
if (a->argtags[i] != tmp)
arg_type_disagree_warning(rescan_lineno, i + 1, a->name);
}
else
a->argtags[i] = tmp;
}
else if (!redec)
a->argtags[i] = NULL;
if (!(p = parse_id(p, &a->argnames[i])))
bad_formals();
while (isspace(*p))
if (*p++ == '\n')
rescan_lineno++;
/* must now be at this argument's NUL; step over it */
if (*p++)
bad_formals();
}
free(args);
}
/*
 * Translate one actual-argument expression into C code that assigns it
 * to yyval.
 *
 * `*theptr' points at the NUL-terminated argument text; on return it
 * points at that terminating NUL.  `yyvaltag', if non-NULL, is the
 * union member of yyval to assign to.  Returns the result of msdone().
 *
 * Within the text, $N, $-N, $<tag>N and $name are rewritten as
 * references into yystack.l_mark[], with a `.tag' suffix when a tag is
 * known.  A '@' is reported through at_error().
 */
static char *
compile_arg(char **theptr, char *yyvaltag)
{
char *p = *theptr;
struct mstring *c = msnew();
int i, j, n;
Value_t *offsets = NULL, maxoffset;
bucket **rhs;
/* walk back over the current rule's items: n counts all of them, */
/* maxoffset only those that are not ARGUMENT symbols */
maxoffset = 0;
n = 0;
for (i = nitems - 1; pitem[i]; --i)
{
n++;
if (pitem[i]->class != ARGUMENT)
maxoffset++;
}
if (maxoffset > 0)
{
offsets = TMALLOC(Value_t, maxoffset + 1);
NO_SPACE(offsets);
}
/* offsets[k] is the stack offset (relative to the last item) of the */
/* k-th item that is not an ARGUMENT symbol */
for (j = 0, i++; i < nitems; i++)
if (pitem[i]->class != ARGUMENT)
offsets[++j] = (Value_t) (i - nitems + 1);
rhs = pitem + nitems - 1;
if (yyvaltag)
msprintf(c, "yyval.%s = ", yyvaltag);
else
msprintf(c, "yyval = ");
while (*p)
{
if (*p == '$')
{
char *tag = NULL;
/* optional explicit <tag> */
if (*++p == '<')
if (!(p = parse_id(++p, &tag)) || *p++ != '>')
illegal_tag(rescan_lineno, NULL, NULL);
if (isdigit(*p) || *p == '-')
{
/* positional reference */
int val;
if (!(p = parse_int(p, &val)))
dollar_error(rescan_lineno, NULL, NULL);
if (val <= 0)
i = val - n;
else if (val > maxoffset)
{
dollar_warning(rescan_lineno, val);
i = val - maxoffset;
}
else
{
i = offsets[val];
if (!tag && !(tag = rhs[i]->tag) && havetags)
untyped_rhs(val, rhs[i]->name);
}
msprintf(c, "yystack.l_mark[%d]", i);
if (tag)
msprintf(c, ".%s", tag);
else if (havetags)
unknown_rhs(val);
}
else if (isalpha(*p) || *p == '_')
{
/* reference to a formal argument of the rule's left-hand side */
char *arg;
if (!(p = parse_id(p, &arg)))
dollar_error(rescan_lineno, NULL, NULL);
/* names are interned, so pointer comparison suffices */
for (i = plhs[nrules]->args - 1; i >= 0; i--)
if (arg == plhs[nrules]->argnames[i])
break;
if (i < 0)
unknown_arg_warning(rescan_lineno, "$", arg, NULL, NULL);
else if (!tag)
tag = plhs[nrules]->argtags[i];
msprintf(c, "yystack.l_mark[%d]", i - plhs[nrules]->args + 1
- n);
if (tag)
msprintf(c, ".%s", tag);
else if (havetags)
untyped_arg_warning(rescan_lineno, "$", arg);
}
else
dollar_error(rescan_lineno, NULL, NULL);
}
else if (*p == '@')
{
at_error(rescan_lineno, NULL, NULL);
}
else
{
if (*p == '\n')
rescan_lineno++;
mputc(c, *p++);
}
}
*theptr = p;
if (maxoffset > 0)
FREE(offsets);
return msdone(c);
}
/*
 * Hash table mapping compiled argument code to the rule number that was
 * generated for it.  Each of the ARG_CACHE_SIZE slots heads a chain of
 * entries linked through `next'.
 */
#define ARG_CACHE_SIZE 1024
static struct arg_cache
{
struct arg_cache *next;
char *code;
int rule;
}
*arg_cache[ARG_CACHE_SIZE];
/*
 * Look `code' up in the argument cache.  Returns the rule number stored
 * for an entry that strnscmp() reports as equal, or -1 if there is
 * none.
 */
static int
lookup_arg_cache(char *code)
{
    struct arg_cache *node = arg_cache[strnshash(code) % ARG_CACHE_SIZE];

    for (; node != NULL; node = node->next)
    {
        if (strnscmp(node->code, code) == 0)
            return node->rule;
    }
    return -1;
}
/*
 * Add a (code, rule) pair to the argument cache, at the head of the
 * chain for code's hash slot.  The entry stores the `code' pointer
 * itself, not a copy.
 */
static void
insert_arg_cache(char *code, int rule)
{
    struct arg_cache *node = NEW(struct arg_cache);
    int slot;

    NO_SPACE(node);
    slot = strnshash(code) % ARG_CACHE_SIZE;

    node->code = code;
    node->rule = rule;
    node->next = arg_cache[slot];
    arg_cache[slot] = node;
}
/*
 * Release every entry of the argument cache, together with the code
 * string each one holds, and reset all slots to NULL.
 */
static void
clean_arg_cache(void)
{
    struct arg_cache *cur, *following;
    int slot;

    for (slot = 0; slot < ARG_CACHE_SIZE; slot++)
    {
        cur = arg_cache[slot];
        while (cur)
        {
            /* read the link before the node is released */
            following = cur->next;
            free(cur->code);
            FREE(cur);
            cur = following;
        }
        arg_cache[slot] = NULL;
    }
}
#endif
/*
 * Position the reader at the first grammar rule.
 *
 * Any %{ ... %} blocks and %start directives that follow the %% mark
 * are processed first; a second %% is reported through no_grammar() and
 * any other directive through syntax_error().  The name of the first
 * rule is then read; if no start symbol has been declared it becomes
 * the goal.  With YYBTYACC an optional parenthesized formal-argument
 * list may follow the name.  The ':' must come next; the rule is opened
 * with start_rule() and `cptr' is left just past the ':'.
 *
 * The check on the first character of the rule name used to test '_'
 * twice; the second test is now '$', so a '$'-initial name is accepted
 * here as it is by declare_start(), declare_tokens() and
 * declare_types().
 */
static void
advance_to_start(void)
{
    int c;
    bucket *bp;
    char *s_cptr;
    int s_lineno;
#if defined(YYBTYACC)
    char *args = NULL;
    int argslen = 0;
#endif

    for (;;)
    {
        c = nextc();
        if (c != '%')
            break;
        s_cptr = cptr;
        switch (keyword())
        {
        case MARK:
            no_grammar();
            /* NOTE(review): presumably no_grammar() does not return */

        case TEXT:
            copy_text();
            break;

        case START:
            declare_start();
            break;

        default:
            syntax_error(lineno, line, s_cptr);
        }
    }

    c = nextc();
    if (!isalpha(c) && c != '_' && c != '.' && c != '$')
        syntax_error(lineno, line, cptr);
    bp = get_name();
    if (goal == 0)
    {
        if (bp->class == TERM)
            terminal_start(bp->name);
        goal = bp;
    }

    s_lineno = lineno;
    c = nextc();
    if (c == EOF)
        unexpected_EOF();
    rescan_lineno = lineno;     /* line# for possible inherited args rescan */
#if defined(YYBTYACC)
    if (c == L_PAREN)
    {
        ++cptr;
        args = copy_args(&argslen);
        NO_SPACE(args);
        c = nextc();
    }
#endif
    if (c != ':')
        syntax_error(lineno, line, cptr);
    start_rule(bp, s_lineno);
#if defined(YYBTYACC)
    parse_arginfo(bp, args, argslen);
#endif
    ++cptr;
}
/*
 * Open a new rule whose left-hand side is `bp'.  `s_lineno' is the line
 * reported if `bp' turns out to be a terminal.  The symbol becomes a
 * NONTERM, its index is set to this rule's number if it has none yet,
 * and the rule's precedence and associativity are initialized to
 * UNDEFINED and TOKEN.
 */
static void
start_rule(bucket *bp, int s_lineno)
{
    if (bp->class == TERM)
        terminal_lhs(s_lineno);
    bp->class = NONTERM;

    if (bp->index == 0)
        bp->index = nrules;

    if (maxrules <= nrules)
        expand_rules();

    plhs[nrules] = bp;
    rprec[nrules] = UNDEFINED;
    rassoc[nrules] = TOKEN;
}
/*
 * Close the current rule.
 *
 * If the rule does not end in an action and its left-hand side has a
 * type tag, default_action_warning() is issued unless the first
 * right-hand-side symbol carries the same tag.  The rule's item list is
 * then terminated with a 0 entry and nrules is advanced.
 */
static void
end_rule(void)
{
int i;
if (!last_was_action && plhs[nrules]->tag)
{
if (pitem[nitems - 1])
{
/* back up to the 0 entry that precedes this rule's items */
for (i = nitems - 1; (i > 0) && pitem[i]; --i)
continue;
if (pitem[i + 1] == 0 || pitem[i + 1]->tag != plhs[nrules]->tag)
default_action_warning();
}
else
{
/* empty right-hand side */
default_action_warning();
}
}
last_was_action = 0;
if (nitems >= maxitems)
expand_items();
pitem[nitems] = 0;
++nitems;
++nrules;
}
/*
 * Insert a generated empty rule ahead of the rule being read.
 *
 * A new symbol named "$$N" (N from gensym) is created with class ACTION
 * and the tag of the current left-hand side, and is appended to the
 * symbol list.  The current rule's items are shifted up one slot so
 * that an empty item list sits in front of them, and the new symbol is
 * appended to the current rule's items.  In the rule tables the new
 * rule takes the current slot and the rule being read moves to the
 * next one.
 */
static void
insert_empty_rule(void)
{
bucket *bp, **bpp;
assert(cache);
sprintf(cache, "$$%d", ++gensym);
bp = make_bucket(cache);
last_symbol->next = bp;
last_symbol = bp;
bp->tag = plhs[nrules]->tag;
bp->class = ACTION;
#if defined(YYBTYACC)
bp->args = 0;
#endif
/* two more items: the empty rule's terminator and the new symbol */
nitems = (Value_t) (nitems + 2);
if (nitems > maxitems)
expand_items();
bpp = pitem + nitems - 1;
*bpp-- = bp;
/* shift the current rule's items (and the 0 before them) up by one */
while ((bpp[0] = bpp[-1]) != 0)
--bpp;
if (++nrules >= maxrules)
expand_rules();
/* the rule being read moves up; the generated rule takes its old slot */
plhs[nrules] = plhs[nrules - 1];
plhs[nrules - 1] = bp;
rprec[nrules] = rprec[nrules - 1];
rprec[nrules - 1] = 0;
rassoc[nrules] = rassoc[nrules - 1];
rassoc[nrules - 1] = TOKEN;
}
#if defined(YYBTYACC)
/*
 * Add an item that computes one actual argument.
 *
 * `arg' is the NUL-terminated argument text and `tag' the type tag of
 * the corresponding formal.  The text is compiled with compile_arg().
 * If the same code has not been generated before, a new action case is
 * written to action_file and an empty rule of class ARGUMENT is
 * inserted for it; otherwise the symbol of the previously generated
 * rule is appended to the current rule's items and the duplicate code
 * is freed.
 *
 * Returns a pointer just past the argument's terminating NUL.
 */
static char *
insert_arg_rule(char *arg, char *tag)
{
int line_number = rescan_lineno;
/* compile_arg() advances arg to the terminating NUL */
char *code = compile_arg(&arg, tag);
int rule = lookup_arg_cache(code);
FILE *f = action_file;
if (rule < 0)
{
rule = nrules;
/* the cache keeps the code pointer, so it is not freed here */
insert_arg_cache(code, rule);
fprintf(f, "case %d:\n", rule - 2);
if (!lflag)
fprintf(f, line_format, line_number, input_file_name);
fprintf(f, "%s;\n", code);
fprintf(f, "break;\n");
insert_empty_rule();
plhs[rule]->tag = tag;
plhs[rule]->class = ARGUMENT;
}
else
{
if (++nitems > maxitems)
expand_items();
pitem[nitems - 1] = plhs[rule];
free(code);
}
return arg + 1;
}
#endif
/*
 * Read one symbol (name or literal) in the rules section.
 *
 * If the symbol is followed by ':' it is the left-hand side of a new
 * rule: the current rule is closed and the new one opened.  Otherwise
 * the symbol is appended to the current rule's items, after inserting
 * an empty rule if the previous component was an action.
 *
 * With YYBTYACC a parenthesized argument list may follow the symbol.
 * For a left-hand side it gives the formal arguments; for a
 * right-hand-side symbol each actual argument is turned into an item by
 * insert_arg_rule(), and argument counts and tags are checked against
 * the symbol's declaration.
 */
static void
add_symbol(void)
{
int c;
bucket *bp;
int s_lineno = lineno;
#if defined(YYBTYACC)
char *args = NULL;
int argslen = 0;
#endif
c = *cptr;
if (c == '\'' || c == '"')
bp = get_literal();
else
bp = get_name();
c = nextc();
rescan_lineno = lineno; /* line# for possible inherited args rescan */
#if defined(YYBTYACC)
if (c == L_PAREN)
{
++cptr;
args = copy_args(&argslen);
NO_SPACE(args);
c = nextc();
}
#endif
if (c == ':')
{
/* the symbol starts a new rule */
end_rule();
start_rule(bp, s_lineno);
#if defined(YYBTYACC)
parse_arginfo(bp, args, argslen);
#endif
++cptr;
return;
}
if (last_was_action)
insert_empty_rule();
last_was_action = 0;
#if defined(YYBTYACC)
/* first use of an undeclared symbol fixes its argument count */
if (bp->args < 0)
bp->args = argslen;
/* first symbol of the rule used without arguments: the left-hand */
/* side's own arguments are checked against it instead */
if (argslen == 0 && bp->args > 0 && pitem[nitems - 1] == NULL)
{
int i;
if (plhs[nrules]->args != bp->args)
wrong_number_args_warning("default ", bp->name);
for (i = bp->args - 1; i >= 0; i--)
if (plhs[nrules]->argtags[i] != bp->argtags[i])
wrong_type_for_arg_warning(i + 1, bp->name);
}
else if (bp->args != argslen)
wrong_number_args_warning("", bp->name);
if (bp->args > 0 && argslen > 0)
{
char *ap;
int i;
/* one generated item per actual argument */
for (ap = args, i = 0; i < argslen; i++)
ap = insert_arg_rule(ap, bp->argtags[i]);
free(args);
}
#endif /* defined(YYBTYACC) */
if (++nitems > maxitems)
expand_items();
pitem[nitems - 1] = bp;
}
/*
 * Return a pointer to the first character of `s' that is not white
 * space, or to the terminating NUL if there is none.
 */
static char *
after_blanks(char *s)
{
    for (; *s != '\0'; ++s)
    {
        if (!isspace(UCH(*s)))
            break;
    }
    return s;
}
static void
copy_action(void)
{
int c;
int i, j, n;
int depth;
#if defined(YYBTYACC)
int trialaction = 0;
int haveyyval = 0;
#endif
char *tag;
FILE *f = action_file;
int a_lineno = lineno;
char *a_line = dup_line();
char *a_cptr = a_line + (cptr - line);
Value_t *offsets = NULL, maxoffset;
bucket **rhs;
if (last_was_action)
insert_empty_rule();
last_was_action = 1;
fprintf(f, "case %d:\n", nrules - 2);
#if defined(YYBTYACC)
if (backtrack)
{
if (*cptr != L_BRAC)
fprintf(f, " if (!yytrial)\n");
else
trialaction = 1;
}
#endif
if (!lflag)
fprintf(f, line_format, lineno, input_file_name);
if (*cptr == '=')
++cptr;
/* avoid putting curly-braces in first column, to ease editing */
if (*after_blanks(cptr) == L_CURL)
{
putc('\t', f);
cptr = after_blanks(cptr);
}
maxoffset = 0;
n = 0;
for (i = nitems - 1; pitem[i]; --i)
{
++n;
if (pitem[i]->class != ARGUMENT)
maxoffset++;
}
if (maxoffset > 0)
{
offsets = TMALLOC(Value_t, maxoffset + 1);
NO_SPACE(offsets);
}
for (j = 0, i++; i < nitems; i++)
{
if (pitem[i]->class != ARGUMENT)
{
offsets[++j] = (Value_t) (i - nitems + 1);
}
}
rhs = pitem + nitems - 1;
depth = 0;
loop:
c = *cptr;
if (c == '$')
{
if (cptr[1] == '<')
{
int d_lineno = lineno;
char *d_line = dup_line();
char *d_cptr = d_line + (cptr - line);
++cptr;
tag = get_tag();
c = *cptr;
if (c == '$')
{
fprintf(f, "yyval.%s", tag);
++cptr;
FREE(d_line);
goto loop;
}
else if (isdigit(c))
{
i = get_number();
if (i == 0)
fprintf(f, "yystack.l_mark[%d].%s", -n, tag);
else if (i > maxoffset)
{
dollar_warning(d_lineno, i);
fprintf(f, "yystack.l_mark[%d].%s", i - maxoffset, tag);
}
else if (offsets)
fprintf(f, "yystack.l_mark[%d].%s", offsets[i], tag);
FREE(d_line);
goto loop;
}
else if (c == '-' && isdigit(UCH(cptr[1])))
{
++cptr;
i = -get_number() - n;
fprintf(f, "yystack.l_mark[%d].%s", i, tag);
FREE(d_line);
goto loop;
}
#if defined(YYBTYACC)
else if (isalpha(c) || c == '_')
{
char *arg = scan_id();
for (i = plhs[nrules]->args - 1; i >= 0; i--)
if (arg == plhs[nrules]->argnames[i])
break;
if (i < 0)
unknown_arg_warning(d_lineno, "$", arg, d_line, d_cptr);
fprintf(f, "yystack.l_mark[%d].%s", i - plhs[nrules]->args +
1 - n, tag);
FREE(d_line);
goto loop;
}
#endif
else
dollar_error(d_lineno, d_line, d_cptr);
}
else if (cptr[1] == '$')
{
if (havetags)
{
tag = plhs[nrules]->tag;
if (tag == 0)
untyped_lhs();
fprintf(f, "yyval.%s", tag);
}
else
fprintf(f, "yyval");
cptr += 2;
#if defined(YYBTYACC)
haveyyval = 1;
#endif
goto loop;
}
else if (isdigit(UCH(cptr[1])))
{
++cptr;
i = get_number();
if (havetags)
{
if (i <= 0 || i > maxoffset)
unknown_rhs(i);
tag = rhs[offsets[i]]->tag;
if (tag == 0)
untyped_rhs(i, rhs[offsets[i]]->name);
fprintf(f, "yystack.l_mark[%d].%s", offsets[i], tag);
}
else
{
if (i == 0)
fprintf(f, "yystack.l_mark[%d]", -n);
else if (i > maxoffset)
{
dollar_warning(lineno, i);
fprintf(f, "yystack.l_mark[%d]", i - maxoffset);
}
else if (offsets)
fprintf(f, "yystack.l_mark[%d]", offsets[i]);
}
goto loop;
}
else if (cptr[1] == '-')
{
cptr += 2;
i = get_number();
if (havetags)
unknown_rhs(-i);
fprintf(f, "yystack.l_mark[%d]", -i - n);
goto loop;
}
#if defined(YYBTYACC)
else if (isalpha(cptr[1]) || cptr[1] == '_')
{
char *arg;
++cptr;
arg = scan_id();
for (i = plhs[nrules]->args - 1; i >= 0; i--)
if (arg == plhs[nrules]->argnames[i])
break;
if (i < 0)
unknown_arg_warning(lineno, "$", arg, line, cptr);
tag = (i < 0 ? NULL : plhs[nrules]->argtags[i]);
fprintf(f, "yystack.l_mark[%d]", i - plhs[nrules]->args + 1 - n);
if (tag)
fprintf(f, ".%s", tag);
else if (havetags)
untyped_arg_warning(lineno, "$", arg);
goto loop;
}
#endif
}
#if defined(YYBTYACC)
if (c == '@')
{
if (!locations)
{
int l_lineno = lineno;
char *l_line = dup_line();
char *l_cptr = l_line + (cptr - line);
syntax_error(l_lineno, l_line, l_cptr);
}
if (cptr[1] == '$')
{
fprintf(f, "yyloc");
cptr += 2;
goto loop;
}
else if (isdigit(UCH(cptr[1])))
{
++cptr;
i = get_number();
if (i == 0)
fprintf(f, "yystack.p_mark[%d]", -n);
else if (i > maxoffset)
{
at_warning(lineno, i);
fprintf(f, "yystack.p_mark[%d]", i - maxoffset);
}
else if (offsets)
fprintf(f, "yystack.p_mark[%d]", offsets[i]);
goto loop;
}
}
#endif
if (isalpha(c) || c == '_' || c == '$')
{
do
{
putc(c, f);
c = *++cptr;
}
while (isalnum(c) || c == '_' || c == '$');
goto loop;
}
++cptr;
#if defined(YYBTYACC)
if (backtrack)
{
if (trialaction && c == L_BRAC && depth == 0)
{
++depth;
putc(L_CURL, f);
goto loop;
}
if (trialaction && c == R_BRAC && depth == 1)
{
--depth;
putc(R_CURL, f);
c = nextc();
if (c == L_BRAC && !haveyyval)
{
goto loop;
}
if (c == L_CURL && !haveyyval)
{
fprintf(f, " if (!yytrial)\n");
if (!lflag)
fprintf(f, line_format, lineno, input_file_name);
trialaction = 0;
goto loop;
}
fprintf(f, "\nbreak;\n");
FREE(a_line);
if (maxoffset > 0)
FREE(offsets);
return;
}
}
#endif
putc(c, f);
switch (c)
{
case '\n':
get_line();
if (line)
goto loop;
unterminated_action(a_lineno, a_line, a_cptr);
case ';':
if (depth > 0)
goto loop;
fprintf(f, "\nbreak;\n");
free(a_line);
if (maxoffset > 0)
FREE(offsets);
return;
#if defined(YYBTYACC)
case L_BRAC:
if (backtrack)
++depth;
goto loop;
case R_BRAC:
if (backtrack)
--depth;
goto loop;
#endif
case L_CURL:
++depth;
goto loop;
case R_CURL:
if (--depth > 0)
goto loop;
#if defined(YYBTYACC)
if (backtrack)
{
c = nextc();
if (c == L_BRAC && !haveyyval)
{
trialaction = 1;
goto loop;
}
if (c == L_CURL && !haveyyval)
{
fprintf(f, " if (!yytrial)\n");
if (!lflag)
fprintf(f, line_format, lineno, input_file_name);
goto loop;
}
}
#endif
fprintf(f, "\nbreak;\n");
free(a_line);
if (maxoffset > 0)
FREE(offsets);
return;
case '\'':
case '"':
{
char *s = copy_string(c);
fputs(s, f);
free(s);
}
goto loop;
case '/':
{
char *s = copy_comment();
fputs(s, f);
free(s);
}
goto loop;
default:
goto loop;
}
}
#if defined(YYBTYACC)
/*
 * Collect the code of a destructor declaration and attach it to every
 * symbol or type tag listed after it.
 *
 * After skipping blanks, 'cptr' must point at the opening '{' of the code;
 * anything else is reported through syntax_error().  The code is copied, up
 * to and including the matching '}', into an mstring with these rewrites:
 *
 *   $<tag>$   ->  (*val).tag
 *   $$        ->  kept as "$$" (replaced later by process_destructor_XX())
 *   @$        ->  (*loc)   (syntax error unless 'locations' is set)
 *
 * Quoted strings and comments are handed to copy_string()/copy_comment().
 *
 * The targets that follow the code decide where the text is stored:
 *
 *   <>      "untyped default" bucket; "$$" replaced immediately
 *   <*>     "typed default" bucket; a raw copy is kept
 *   <tag>   per-type bucket from lookup_type_destructor(); "$$" replaced
 *   name    the symbol's own bucket; a raw copy is kept
 *
 * A target that already has a destructor only produces
 * destructor_redeclared_warning(); its existing text is left alone.
 */
static void
copy_destructor(void)
{
    int c;
    int depth;
    char *tag;
    bucket *bp;
    struct mstring *destructor_text = msnew();
    char *code_text;
    int a_lineno;
    char *a_line;
    char *a_cptr;

    if (!lflag)
        msprintf(destructor_text, line_format, lineno, input_file_name);

    cptr = after_blanks(cptr);
    if (*cptr == L_CURL)
        /* avoid putting curly-braces in first column, to ease editing */
        mputc(destructor_text, '\t');
    else
        syntax_error(lineno, line, cptr);

    /* remember where the code starts; used by the diagnostics below */
    a_lineno = lineno;
    a_line = dup_line();
    a_cptr = a_line + (cptr - line);

    depth = 0;
  loop:
    c = *cptr;
    if (c == '$')
    {
        if (cptr[1] == '<')
        {
            /* private copy of the line so an error can point at the '$' */
            int d_lineno = lineno;
            char *d_line = dup_line();
            char *d_cptr = d_line + (cptr - line);

            ++cptr;
            tag = get_tag();
            c = *cptr;
            if (c == '$')
            {
                msprintf(destructor_text, "(*val).%s", tag);
                ++cptr;
                FREE(d_line);
                goto loop;
            }
            else
                dollar_error(d_lineno, d_line, d_cptr);
        }
        else if (cptr[1] == '$')
        {
            /* process '$$' later; replacement is context dependent */
            msprintf(destructor_text, "$$");
            cptr += 2;
            goto loop;
        }
    }
    if (c == '@' && cptr[1] == '$')
    {
        if (!locations)
        {
            int l_lineno = lineno;
            char *l_line = dup_line();
            char *l_cptr = l_line + (cptr - line);

            syntax_error(l_lineno, l_line, l_cptr);
        }
        msprintf(destructor_text, "(*loc)");
        cptr += 2;
        goto loop;
    }
    /*
     * Copy a whole identifier in one go.  'c' was read from a plain char,
     * so it is converted to unsigned char before reaching <ctype.h>:
     * passing a negative value other than EOF is undefined behaviour.
     */
    if (isalpha((unsigned char)c) || c == '_' || c == '$')
    {
        do
        {
            mputc(destructor_text, c);
            c = *++cptr;
        }
        while (isalnum((unsigned char)c) || c == '_' || c == '$');
        goto loop;
    }
    ++cptr;
    mputc(destructor_text, c);
    switch (c)
    {
    case '\n':
        get_line();
        if (line)
            goto loop;
        unterminated_action(a_lineno, a_line, a_cptr);
        /* FALLTHROUGH - reached only if unterminated_action() returns */

    case L_CURL:
        ++depth;
        goto loop;

    case R_CURL:
        if (--depth > 0)
            goto loop;
        goto process_symbols;

    case '\'':
    case '"':
        {
            char *s = copy_string(c);

            msprintf(destructor_text, "%s", s);
            free(s);
        }
        goto loop;

    case '/':
        {
            char *s = copy_comment();

            msprintf(destructor_text, "%s", s);
            free(s);
        }
        goto loop;

    default:
        goto loop;
    }

  process_symbols:
    code_text = msdone(destructor_text);
    for (;;)
    {
        c = nextc();
        if (c == EOF)
            unexpected_EOF();
        if (c == '<')
        {
            if (cptr[1] == '>')
            {   /* "no semantic type" default destructor */
                cptr += 2;
                if ((bp = default_destructor[UNTYPED_DEFAULT]) == NULL)
                {
                    static char untyped_default[] = "<>";

                    bp = make_bucket("untyped default");
                    bp->tag = untyped_default;
                    default_destructor[UNTYPED_DEFAULT] = bp;
                }
                if (bp->destructor != NULL)
                    destructor_redeclared_warning(a_lineno, a_line, a_cptr);
                else
                    /* replace "$$" with "(*val)" in destructor code */
                    bp->destructor = process_destructor_XX(code_text, NULL);
            }
            else if (cptr[1] == '*' && cptr[2] == '>')
            {   /* "no per-symbol or per-type" default destructor */
                cptr += 3;
                if ((bp = default_destructor[TYPED_DEFAULT]) == NULL)
                {
                    static char typed_default[] = "<*>";

                    bp = make_bucket("typed default");
                    bp->tag = typed_default;
                    default_destructor[TYPED_DEFAULT] = bp;
                }
                if (bp->destructor != NULL)
                    destructor_redeclared_warning(a_lineno, a_line, a_cptr);
                else
                {
                    /* postpone re-processing destructor $$s until end of grammar spec */
                    bp->destructor = TMALLOC(char, strlen(code_text) + 1);
                    NO_SPACE(bp->destructor);
                    strcpy(bp->destructor, code_text);
                }
            }
            else
            {   /* "semantic type" default destructor */
                tag = get_tag();
                bp = lookup_type_destructor(tag);
                if (bp->destructor != NULL)
                    destructor_redeclared_warning(a_lineno, a_line, a_cptr);
                else
                    /* replace "$$" with "(*val).tag" in destructor code */
                    bp->destructor = process_destructor_XX(code_text, tag);
            }
        }
        else if (isalpha(c) || c == '_' || c == '.' || c == '$')
        {   /* "symbol" destructor */
            bp = get_name();
            if (bp->destructor != NULL)
                destructor_redeclared_warning(a_lineno, a_line, a_cptr);
            else
            {
                /* postpone re-processing destructor $$s until end of grammar spec */
                bp->destructor = TMALLOC(char, strlen(code_text) + 1);
                NO_SPACE(bp->destructor);
                strcpy(bp->destructor, code_text);
            }
        }
        else
            break;              /* anything else ends the target list */
    }
    /* every target received its own copy, so the scratch buffers can go */
    free(a_line);
    free(code_text);
}
/*
 * Return a new string holding 'code' with every "$$" that lies outside
 * quoted strings and block comments replaced by "(*val)" (when 'tag' is
 * NULL) or "(*val).tag".
 *
 * 'code' is only read.  Copying stops after the '}' that closes the
 * outermost '{'; as a safety net it also stops at the terminating NUL, so
 * unbalanced text (for instance a '"' inside the file name of a leading
 * #line directive) cannot make the scan run past the end of the buffer.
 */
static char *
process_destructor_XX(char *code, char *tag)
{
    int c;
    int quote;
    int depth;
    struct mstring *new_code = msnew();
    char *codeptr = code;

    depth = 0;
  loop:                         /* step thru code */
    c = *codeptr;
    if (c == '\0')
        return msdone(new_code);        /* unbalanced input: stop here */
    if (c == '$' && codeptr[1] == '$')
    {
        codeptr += 2;
        if (tag == NULL)
            msprintf(new_code, "(*val)");
        else
            msprintf(new_code, "(*val).%s", tag);
        goto loop;
    }
    /*
     * Copy identifiers whole.  'c' comes from a plain char, so convert it
     * to unsigned char before calling <ctype.h>; a negative argument other
     * than EOF is undefined behaviour.
     */
    if (isalpha((unsigned char)c) || c == '_' || c == '$')
    {
        do
        {
            mputc(new_code, c);
            c = *++codeptr;
        }
        while (isalnum((unsigned char)c) || c == '_' || c == '$');
        goto loop;
    }
    ++codeptr;
    mputc(new_code, c);
    switch (c)
    {
    case L_CURL:
        ++depth;
        goto loop;

    case R_CURL:
        if (--depth > 0)
            goto loop;
        return msdone(new_code);

    case '\'':
    case '"':
        /* copy a quoted string verbatim, honouring backslash escapes */
        quote = c;
        for (;;)
        {
            if (*codeptr == '\0')
                goto loop;      /* unterminated: let the top of loop finish */
            c = *codeptr++;
            mputc(new_code, c);
            if (c == quote)
                goto loop;
            if (c == '\\')
            {
                if (*codeptr == '\0')
                    goto loop;
                c = *codeptr++;
                mputc(new_code, c);
            }
        }

    case '/':
        c = *codeptr;
        if (c == '*')
        {
            /* copy a block comment verbatim through its closing marker */
            mputc(new_code, c);
            ++codeptr;
            for (;;)
            {
                if (*codeptr == '\0')
                    goto loop;  /* unterminated: let the top of loop finish */
                c = *codeptr++;
                mputc(new_code, c);
                if (c == '*' && *codeptr == '/')
                {
                    mputc(new_code, '/');
                    ++codeptr;
                    goto loop;
                }
            }
        }
        goto loop;

    default:
        goto loop;
    }
}
#endif /* defined(YYBTYACC) */
static int
mark_symbol(void)
{
int c;
bucket *bp = NULL;
c = cptr[1];
if (c == '%' || c == '\\')
{
cptr += 2;
return (1);
}
if (c == '=')
cptr += 2;
else if ((c == 'p' || c == 'P') &&
((c = cptr[2]) == 'r' || c == 'R') &&
((c = cptr[3]) == 'e' || c == 'E') &&
((c = cptr[4]) == 'c' || c == 'C') &&
((c = cptr[5], !IS_IDENT(c))))
cptr += 5;
else
syntax_error(lineno, line, cptr);
c = nextc();
if (isalpha(c) || c == '_' || c == '.' || c == '$')
bp = get_name();
else if (c == '\'' || c == '"')
bp = get_literal();
else
{
syntax_error(lineno, line, cptr);
}
if (rprec[nrules] != UNDEFINED && bp->prec != rprec[nrules])
prec_redeclared();
rprec[nrules] = bp->prec;
rassoc[nrules] = bp->assoc;
return (0);
}
/*
 * Read the rules section.  The next significant character decides what is
 * parsed: a symbol (add_symbol), an action (copy_action), an alternative
 * introduced by '|' (a new rule with the same left-hand side as the previous
 * one), or a '%' mark (mark_symbol).  Reading stops at end of input or when
 * mark_symbol() returns non-zero; the rule in progress is then closed.
 */
static void
read_grammar(void)
{
    int ch;

    initialize_grammar();
    advance_to_start();

    while ((ch = nextc()) != EOF)
    {
        int begins_action;

#if defined(YYBTYACC)
        begins_action = (ch == L_CURL || ch == '='
                         || (backtrack && ch == L_BRAC));
#else
        begins_action = (ch == L_CURL || ch == '=');
#endif

        if (isalpha(ch) || ch == '_' || ch == '.' || ch == '$'
            || ch == '\'' || ch == '"')
        {
            add_symbol();
        }
        else if (begins_action)
        {
            copy_action();
        }
        else if (ch == '|')
        {
            end_rule();
            start_rule(plhs[nrules - 1], 0);
            ++cptr;
        }
        else if (ch == '%')
        {
            if (mark_symbol())
                break;
        }
        else
        {
            syntax_error(lineno, line, cptr);
        }
    }
    end_rule();

#if defined(YYBTYACC)
    /* the goal symbol may not take arguments */
    if (goal->args > 0)
        start_requires_args(goal->name);
#endif
}
/*
 * Release the 'ntags' strings stored in tag_table and then the table itself.
 * Does nothing when no table was ever allocated.
 */
static void
free_tags(void)
{
    if (tag_table != 0)
    {
        int n = 0;

        while (n < ntags)
        {
            assert(tag_table[n]);
            FREE(tag_table[n]);
            ++n;
        }
        FREE(tag_table);
    }
}
/*
 * Move every symbol name into one contiguous allocation, 'name_pool'.
 *
 * Layout: "$accept" at offset 0, "$end" right after it (offset 8), then the
 * names of all symbols in list order, each with its terminating NUL.  The
 * individually allocated names are freed and each bucket is pointed at its
 * copy inside the pool.
 */
static void
pack_names(void)
{
    bucket *sym;
    char *dst;

    /* sizeof counts the NUL: 8 for "$accept" plus 5 for "$end" gives 13 */
    name_pool_size = sizeof("$accept") + sizeof("$end");
    for (sym = first_symbol; sym != 0; sym = sym->next)
        name_pool_size += strlen(sym->name) + 1;

    name_pool = TMALLOC(char, name_pool_size);
    NO_SPACE(name_pool);

    strcpy(name_pool, "$accept");
    strcpy(name_pool + sizeof("$accept"), "$end");

    dst = name_pool + sizeof("$accept") + sizeof("$end");
    for (sym = first_symbol; sym != 0; sym = sym->next)
    {
        char *old_name = sym->name;
        size_t bytes = strlen(old_name) + 1;

        strcpy(dst, old_name);
        FREE(old_name);
        sym->name = dst;
        dst += bytes;
    }
}
/*
 * Report symbols that were used but never given a class.  An UNKNOWN goal is
 * passed to undefined_goal(); any other UNKNOWN symbol gets a warning and is
 * turned into a terminal.
 */
static void
check_symbols(void)
{
    bucket *sym;

    if (goal->class == UNKNOWN)
    {
        undefined_goal(goal->name);
    }

    sym = first_symbol;
    while (sym != 0)
    {
        if (sym->class == UNKNOWN)
        {
            undefined_symbol_warning(sym->name);
            sym->class = TERM;
        }
        sym = sym->next;
    }
}
/*
 * Store in '*des' a newly allocated copy of 'src' in which every backslash
 * and double quote is preceded by a backslash.  When 'src' is a null
 * pointer, '*des' is set to that same null pointer and nothing is allocated.
 */
static void
protect_string(char *src, char **des)
{
    unsigned need;
    char *in;
    char *out;

    *des = src;
    if (src == 0)
        return;

    /* first pass: one byte per character, two for escaped ones, plus NUL */
    need = 1;
    for (in = src; *in != '\0'; ++in)
    {
        if (*in == '\\' || *in == '"')
            need += 2;
        else
            need += 1;
    }

    *des = out = TMALLOC(char, need);
    NO_SPACE(out);

    /* second pass: copy, inserting the escapes */
    for (in = src; *in != '\0'; ++in)
    {
        if (*in == '\\' || *in == '"')
            *out++ = '\\';
        *out++ = *in;
    }
    *out = '\0';
}
/*
 * Number all symbols and build the parallel symbol_* tables from the bucket
 * list.
 *
 * Table layout: index 0 is the entry named name_pool + 8 ("$end", see
 * pack_names), indexes 1 .. ntokens-1 are the terminals in list order,
 * index start_symbol (== ntokens) is the entry named name_pool ("$accept"),
 * start_symbol + 1 is the goal symbol, and the remaining non-terminals
 * follow in list order.
 */
static void
pack_symbols(void)
{
bucket *bp;
bucket **v;
Value_t i, j, k, n;
#if defined(YYBTYACC)
Value_t max_tok_pval;
#endif
/* count symbols and tokens; the initial 2 and 1 account for slot 0 and the
 * start_symbol slot, which are filled in by hand further down */
nsyms = 2;
ntokens = 1;
for (bp = first_symbol; bp; bp = bp->next)
{
++nsyms;
if (bp->class == TERM)
++ntokens;
}
start_symbol = (Value_t) ntokens;
nvars = (Value_t) (nsyms - ntokens);
symbol_name = TMALLOC(char *, nsyms);
NO_SPACE(symbol_name);
symbol_value = TMALLOC(Value_t, nsyms);
NO_SPACE(symbol_value);
symbol_prec = TMALLOC(Value_t, nsyms);
NO_SPACE(symbol_prec);
symbol_assoc = TMALLOC(char, nsyms);
NO_SPACE(symbol_assoc);
#if defined(YYBTYACC)
symbol_pval = TMALLOC(Value_t, nsyms);
NO_SPACE(symbol_pval);
/* destructor tables exist only when a destructor was declared; CALLOC
 * leaves every slot a null pointer */
if (destructor)
{
symbol_destructor = CALLOC(sizeof(char *), nsyms);
NO_SPACE(symbol_destructor);
symbol_type_tag = CALLOC(sizeof(char *), nsyms);
NO_SPACE(symbol_type_tag);
}
#endif
/* v[] is a scratch array: terminals go to 1 .. ntokens-1, everything else
 * to start_symbol+1 .. nsyms-1; v[0] and v[start_symbol] stay empty */
v = TMALLOC(bucket *, nsyms);
NO_SPACE(v);
v[0] = 0;
v[start_symbol] = 0;
i = 1;
j = (Value_t) (start_symbol + 1);
for (bp = first_symbol; bp; bp = bp->next)
{
if (bp->class == TERM)
v[i++] = bp;
else
v[j++] = bp;
}
assert(i == ntokens && j == nsyms);
/* a terminal's index is its position in v[] */
for (i = 1; i < ntokens; ++i)
v[i]->index = i;
/* the goal always gets the first non-terminal index; the others are
 * numbered after it.  i == ntokens here, so ++i skips the empty
 * v[start_symbol] slot */
goal->index = (Index_t) (start_symbol + 1);
k = (Value_t) (start_symbol + 2);
while (++i < nsyms)
if (v[i] != goal)
{
v[i]->index = k;
++k;
}
/* non-terminal values: 0 for the goal, 1, 2, ... for the rest */
goal->value = 0;
k = 1;
for (i = (Value_t) (start_symbol + 1); i < nsyms; ++i)
{
if (v[i] != goal)
{
v[i]->value = k;
++k;
}
}
/* collect the token values above 256 that are already taken, kept sorted
 * in ascending order (insertion sort); symbol_value[0 .. k-1] is used as
 * scratch space here and is overwritten with the real values below */
k = 0;
for (i = 1; i < ntokens; ++i)
{
n = v[i]->value;
if (n > 256)
{
for (j = k++; j > 0 && symbol_value[j - 1] > n; --j)
symbol_value[j] = symbol_value[j - 1];
symbol_value[j] = n;
}
}
/* the first terminal defaults to 256 */
assert(v[1] != 0);
if (v[1]->value == UNDEFINED)
v[1]->value = 256;
/* every other terminal without a value gets the next number from 257 on
 * that does not appear in the sorted list of taken values */
j = 0;
n = 257;
for (i = 2; i < ntokens; ++i)
{
if (v[i]->value == UNDEFINED)
{
while (j < k && n == symbol_value[j])
{
while (++j < k && n == symbol_value[j])
continue;
++n;
}
v[i]->value = n;
++n;
}
}
/* entry 0: the name stored at name_pool + 8 */
symbol_name[0] = name_pool + 8;
symbol_value[0] = 0;
symbol_prec[0] = 0;
symbol_assoc[0] = TOKEN;
#if defined(YYBTYACC)
symbol_pval[0] = 0;
max_tok_pval = 0;
#endif
/* terminals; also track the largest token value for the pval numbering */
for (i = 1; i < ntokens; ++i)
{
symbol_name[i] = v[i]->name;
symbol_value[i] = v[i]->value;
symbol_prec[i] = v[i]->prec;
symbol_assoc[i] = v[i]->assoc;
#if defined(YYBTYACC)
symbol_pval[i] = v[i]->value;
if (symbol_pval[i] > max_tok_pval)
max_tok_pval = symbol_pval[i];
if (destructor)
{
symbol_destructor[i] = v[i]->destructor;
symbol_type_tag[i] = v[i]->tag;
}
#endif
}
/* entry start_symbol: the name stored at the start of name_pool */
symbol_name[start_symbol] = name_pool;
symbol_value[start_symbol] = -1;
symbol_prec[start_symbol] = 0;
symbol_assoc[start_symbol] = TOKEN;
#if defined(YYBTYACC)
symbol_pval[start_symbol] = (Value_t) (max_tok_pval + 1);
#endif
/* non-terminals are stored at their assigned index, not at their position
 * in v[]; i == ntokens here, so ++i again skips v[start_symbol] */
for (++i; i < nsyms; ++i)
{
k = v[i]->index;
symbol_name[k] = v[i]->name;
symbol_value[k] = v[i]->value;
symbol_prec[k] = v[i]->prec;
symbol_assoc[k] = v[i]->assoc;
#if defined(YYBTYACC)
/* pvals of non-terminals continue after the largest token pval */
symbol_pval[k] = (Value_t) ((max_tok_pval + 1) + v[i]->value + 1);
if (destructor)
{
symbol_destructor[k] = v[i]->destructor;
symbol_type_tag[k] = v[i]->tag;
}
#endif
}
/* with gflag set, also keep a copy of each name with backslashes and
 * double quotes escaped (see protect_string) */
if (gflag)
{
symbol_pname = TMALLOC(char *, nsyms);
NO_SPACE(symbol_pname);
for (i = 0; i < nsyms; ++i)
protect_string(symbol_name[i], &(symbol_pname[i]));
}
FREE(v);
}
static void
pack_grammar(void)
{
int i;
Value_t j;
Assoc_t assoc;
Value_t prec2;
ritem = TMALLOC(Value_t, nitems);
NO_SPACE(ritem);
rlhs = TMALLOC(Value_t, nrules);
NO_SPACE(rlhs);
rrhs = TMALLOC(Value_t, nrules + 1);
NO_SPACE(rrhs);
rprec = TREALLOC(Value_t, rprec, nrules);
NO_SPACE(rprec);
rassoc = TREALLOC(Assoc_t, rassoc, nrules);
NO_SPACE(rassoc);
ritem[0] = -1;
ritem[1] = goal->index;
ritem[2] = 0;
ritem[3] = -2;
rlhs[0] = 0;
rlhs[1] = 0;
rlhs[2] = start_symbol;
rrhs[0] = 0;
rrhs[1] = 0;
rrhs[2] = 1;
j = 4;
for (i = 3; i < nrules; ++i)
{
#if defined(YYBTYACC)
if (plhs[i]->args > 0)
{
if (plhs[i]->argnames)
{
FREE(plhs[i]->argnames);
plhs[i]->argnames = NULL;
}
if (plhs[i]->argtags)
{
FREE(plhs[i]->argtags);
plhs[i]->argtags = NULL;
}
}
#endif /* defined(YYBTYACC) */
rlhs[i] = plhs[i]->index;
rrhs[i] = j;
assoc = TOKEN;
prec2 = 0;
while (pitem[j])
{
ritem[j] = pitem[j]->index;
if (pitem[j]->class == TERM)
{
prec2 = pitem[j]->prec;
assoc = pitem[j]->assoc;
}
++j;
}
ritem[j] = (Value_t) - i;
++j;
if (rprec[i] == UNDEFINED)
{
rprec[i] = prec2;
rassoc[i] = assoc;
}
}
rrhs[i] = j;
FREE(plhs);
FREE(pitem);
#if defined(YYBTYACC)
clean_arg_cache();
#endif
}
static void
print_grammar(void)
{
int i, k;
size_t j, spacing = 0;
FILE *f = verbose_file;
if (!vflag)
return;
k = 1;
for (i = 2; i < nrules; ++i)
{
if (rlhs[i] != rlhs[i - 1])
{
if (i != 2)
fprintf(f, "\n");
fprintf(f, "%4d %s :", i - 2, symbol_name[rlhs[i]]);
spacing = strlen(symbol_name[rlhs[i]]) + 1;
}
else
{
fprintf(f, "%4d ", i - 2);
j = spacing;
while (j-- != 0)
putc(' ', f);
putc('|', f);
}
while (ritem[k] >= 0)
{
fprintf(f, " %s", symbol_name[ritem[k]]);
++k;
}
++k;
putc('\n', f);
}
}
#if defined(YYBTYACC)
/*
 * Give every symbol from index 2 on its final destructor text and release
 * the buckets that held the default destructors.
 *
 * For a symbol without a destructor of its own:
 *   - no type tag:  a copy of the <> destructor, if one was declared;
 *   - type tag:     a copy of that type's destructor if there is one,
 *                   otherwise the <*> destructor with "$$" replaced for
 *                   this tag, if one was declared.
 * For a symbol with its own destructor, the stored raw text has its "$$"
 * replaced; the raw text is freed afterwards, since overwriting the slot
 * without freeing it would leak that allocation.
 */
static void
finalize_destructors(void)
{
    int i;
    bucket *bp;
    char *tag;

    for (i = 2; i < nsyms; ++i)
    {
        tag = symbol_type_tag[i];
        if (symbol_destructor[i] == NULL)
        {
            if (tag == NULL)
            {   /* use <> destructor, if there is one */
                if ((bp = default_destructor[UNTYPED_DEFAULT]) != NULL)
                {
                    symbol_destructor[i] = TMALLOC(char,
                                                   strlen(bp->destructor) + 1);
                    NO_SPACE(symbol_destructor[i]);
                    strcpy(symbol_destructor[i], bp->destructor);
                }
            }
            else
            {   /* use type destructor for this tag, if there is one */
                bp = lookup_type_destructor(tag);
                if (bp->destructor != NULL)
                {
                    symbol_destructor[i] = TMALLOC(char,
                                                   strlen(bp->destructor) + 1);
                    NO_SPACE(symbol_destructor[i]);
                    strcpy(symbol_destructor[i], bp->destructor);
                }
                else
                {   /* use <*> destructor, if there is one */
                    if ((bp = default_destructor[TYPED_DEFAULT]) != NULL)
                        /* replace "$$" with "(*val).tag" in destructor code */
                        symbol_destructor[i]
                            = process_destructor_XX(bp->destructor, tag);
                }
            }
        }
        else
        {   /* replace "$$" with "(*val)[.tag]" in destructor code */
            char *raw_text = symbol_destructor[i];

            symbol_destructor[i] = process_destructor_XX(raw_text, tag);
            /*
             * process_destructor_XX() only reads its input and returns a
             * new string, so the raw copy made when the destructor was
             * declared is no longer referenced from this table.
             * NOTE(review): reader() has already called free_symbols() at
             * this point, so the buckets should hold no other live
             * reference - confirm.
             */
            FREE(raw_text);
        }
    }
    /* 'symbol_type_tag[]' elements are freed by 'free_tags()' */
    DO_FREE(symbol_type_tag);   /* no longer needed */
    if ((bp = default_destructor[UNTYPED_DEFAULT]) != NULL)
    {
        FREE(bp->name);
        /* 'bp->tag' is a static value, don't free */
        FREE(bp->destructor);
        FREE(bp);
    }
    if ((bp = default_destructor[TYPED_DEFAULT]) != NULL)
    {
        FREE(bp->name);
        /* 'bp->tag' is a static value, don't free */
        FREE(bp->destructor);
        FREE(bp);
    }
    if ((bp = default_destructor[TYPE_SPECIFIED]) != NULL)
    {
        bucket *p;

        /* the per-type buckets form a list chained through 'link' */
        for (; bp; bp = p)
        {
            p = bp->link;
            FREE(bp->name);
            /* 'bp->tag' freed by 'free_tags()' */
            FREE(bp->destructor);
            FREE(bp);
        }
    }
}
#endif /* defined(YYBTYACC) */
/*
 * Entry point of this file: read the whole grammar specification and leave
 * the packed symbol and rule tables behind.  The order of the calls below
 * matters; each step consumes what the previous ones produced.
 */
void
reader(void)
{
write_section(code_file, banner);
create_symbol_table();
read_declarations();
read_grammar();
free_symbol_table();
/* gather all names into name_pool, then settle symbols still UNKNOWN */
pack_names();
check_symbols();
/* build the symbol_* tables, then the ritem/rlhs/rrhs rule tables */
pack_symbols();
pack_grammar();
free_symbols();
/* writes to verbose_file only when vflag is set */
print_grammar();
#if defined(YYBTYACC)
/* 'destructor' is non-zero if at least one %destructor was seen */
if (destructor)
finalize_destructors();
#endif
/* must come after finalize_destructors(), which still reads the tags */
free_tags();
}
#ifdef NO_LEAKS
/*
 * Free every node of a 'param' list together with its type, name and type2
 * strings.  Returns a null pointer so the caller can reset its list head in
 * the same statement.
 */
static param *
free_declarations(param * list)
{
    param *node;
    param *following;

    for (node = list; node != 0; node = following)
    {
        following = node->next;
        free(node->type);
        free(node->name);
        free(node->type2);
        free(node);
    }
    return node;
}
/*
 * Release the storage this file still holds: the two parameter lists, the
 * input line and cache buffers, the packed rule tables and the symbol
 * tables.  The releases are independent of one another.
 */
void
reader_leaks(void)
{
    /* parameter declaration lists */
    parse_param = free_declarations(parse_param);
    lex_param = free_declarations(lex_param);

    /* input buffers */
    DO_FREE(cache);
    DO_FREE(line);

    /* packed rule tables */
    DO_FREE(ritem);
    DO_FREE(rlhs);
    DO_FREE(rrhs);
    DO_FREE(rprec);
    DO_FREE(rassoc);

    /* symbol tables and the pool their names live in */
    DO_FREE(symbol_name);
    DO_FREE(symbol_value);
    DO_FREE(symbol_prec);
    DO_FREE(symbol_assoc);
    DO_FREE(name_pool);
#if defined(YYBTYACC)
    DO_FREE(symbol_pval);
    DO_FREE(symbol_destructor);
    DO_FREE(symbol_type_tag);
#endif
}
#endif