1 /* YACC grammar for Modula-2 expressions, for GDB.
2 Copyright (C) 1986-2017 Free Software Foundation, Inc.
3 Generated from expread.y (now c-exp.y) and contributed by the Department
4 of Computer Science at the State University of New York at Buffalo, 1991.
6 This file is part of GDB.
8 This program is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 3 of the License, or
11 (at your option) any later version.
13 This program is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with this program. If not, see <http://www.gnu.org/licenses/>. */
21 /* Parse a Modula-2 expression from text in a string,
22 and return the result as a struct expression pointer.
23 That structure contains arithmetic operations in reverse polish,
24 with constants represented by operations that are followed by special data.
25 See expression.h for the details of the format.
26 What is important here is that it can be built up sequentially
27 during the process of parsing; the lower levels of the tree always
28 come first in the result.
30 Note that calls to malloc and realloc in this file are transformed to
31 xmalloc and xrealloc respectively by the same sed command in the
32 makefile that remaps any other malloc/realloc inserted by the parser
33 generator. Doing this with #defines and trying to control the interaction
34 with include files (<malloc.h> and <stdlib.h> for example) just became
35 too messy, particularly when such includes can be inserted at random
36 times by the parser generator. */
41 #include "expression.h"
44 #include "parser-defs.h"
46 #include "bfd.h" /* Required by objfiles.h. */
47 #include "symfile.h" /* Required by objfiles.h. */
48 #include "objfiles.h" /* For have_full_symbols and have_partial_symbols */
51 #define parse_type(ps) builtin_type (parse_gdbarch (ps))
52 #define parse_m2_type(ps) builtin_m2_type (parse_gdbarch (ps))
54 /* Remap normal yacc parser interface names (yyparse, yylex, yyerror,
56 #define GDB_YY_REMAP_PREFIX m2_
59 /* The state of the parser, used internally when we are parsing the
62 static struct parser_state *pstate = NULL;
66 static int yylex (void);
68 void yyerror (const char *);
70 static int parse_number (int);
72 /* The sign of the number being parsed. */
73 static int number_sign = 1;
77 /* Although the yacc "value" of an expression is not used,
78 since the result is stored in the structure being created,
79 other node types do have values. */
90 const struct block *bval;
91 enum exp_opcode opcode;
92 struct internalvar *ivar;
98 %type <voidval> exp type_exp start set
99 %type <voidval> variable
104 %token <lval> INT HEX ERROR
105 %token <ulval> UINT M2_TRUE M2_FALSE CHAR
108 /* Both NAME and TYPENAME tokens represent symbols in the input,
109 and both convey their data as strings.
110 But a TYPENAME is a string that happens to be defined as a typedef
111 or builtin type name (such as int or char)
112 and a NAME is any other symbol.
114 Contexts where this distinction is not important can use the
115 nonterminal "name", which matches either NAME or TYPENAME. */
118 %token <sval> NAME BLOCKNAME IDENT VARNAME
119 %token <sval> TYPENAME
121 %token SIZE CAP ORD HIGH ABS MIN_FUNC MAX_FUNC FLOAT_FUNC VAL CHR ODD TRUNC
123 %token INC DEC INCL EXCL
125 /* The GDB scope operator */
128 %token <voidval> INTERNAL_VAR
134 %left '<' '>' LEQ GEQ '=' NOTEQUAL '#' IN
136 %left LOGICAL_AND '&'
139 %left '*' '/' DIV MOD
141 %right '^' DOT '[' '('
144 /* This is not an actual token ; it is used for precedence.
156 { write_exp_elt_opcode (pstate, OP_TYPE);
157 write_exp_elt_type (pstate, $1);
158 write_exp_elt_opcode (pstate, OP_TYPE);
164 exp : exp '^' %prec UNARY
165 { write_exp_elt_opcode (pstate, UNOP_IND); }
169 { number_sign = -1; }
172 write_exp_elt_opcode (pstate, UNOP_NEG); }
175 exp : '+' exp %prec UNARY
176 { write_exp_elt_opcode (pstate, UNOP_PLUS); }
179 exp : not_exp exp %prec UNARY
180 { write_exp_elt_opcode (pstate, UNOP_LOGICAL_NOT); }
187 exp : CAP '(' exp ')'
188 { write_exp_elt_opcode (pstate, UNOP_CAP); }
191 exp : ORD '(' exp ')'
192 { write_exp_elt_opcode (pstate, UNOP_ORD); }
195 exp : ABS '(' exp ')'
196 { write_exp_elt_opcode (pstate, UNOP_ABS); }
199 exp : HIGH '(' exp ')'
200 { write_exp_elt_opcode (pstate, UNOP_HIGH); }
203 exp : MIN_FUNC '(' type ')'
204 { write_exp_elt_opcode (pstate, UNOP_MIN);
205 write_exp_elt_type (pstate, $3);
206 write_exp_elt_opcode (pstate, UNOP_MIN); }
209 exp : MAX_FUNC '(' type ')'
210 { write_exp_elt_opcode (pstate, UNOP_MAX);
211 write_exp_elt_type (pstate, $3);
212 write_exp_elt_opcode (pstate, UNOP_MAX); }
215 exp : FLOAT_FUNC '(' exp ')'
216 { write_exp_elt_opcode (pstate, UNOP_FLOAT); }
219 exp : VAL '(' type ',' exp ')'
220 { write_exp_elt_opcode (pstate, BINOP_VAL);
221 write_exp_elt_type (pstate, $3);
222 write_exp_elt_opcode (pstate, BINOP_VAL); }
225 exp : CHR '(' exp ')'
226 { write_exp_elt_opcode (pstate, UNOP_CHR); }
229 exp : ODD '(' exp ')'
230 { write_exp_elt_opcode (pstate, UNOP_ODD); }
233 exp : TRUNC '(' exp ')'
234 { write_exp_elt_opcode (pstate, UNOP_TRUNC); }
237 exp : TSIZE '(' exp ')'
238 { write_exp_elt_opcode (pstate, UNOP_SIZEOF); }
241 exp : SIZE exp %prec UNARY
242 { write_exp_elt_opcode (pstate, UNOP_SIZEOF); }
246 exp : INC '(' exp ')'
247 { write_exp_elt_opcode (pstate, UNOP_PREINCREMENT); }
250 exp : INC '(' exp ',' exp ')'
251 { write_exp_elt_opcode (pstate, BINOP_ASSIGN_MODIFY);
252 write_exp_elt_opcode (pstate, BINOP_ADD);
253 write_exp_elt_opcode (pstate,
254 BINOP_ASSIGN_MODIFY); }
257 exp : DEC '(' exp ')'
258 { write_exp_elt_opcode (pstate, UNOP_PREDECREMENT);}
261 exp : DEC '(' exp ',' exp ')'
262 { write_exp_elt_opcode (pstate, BINOP_ASSIGN_MODIFY);
263 write_exp_elt_opcode (pstate, BINOP_SUB);
264 write_exp_elt_opcode (pstate,
265 BINOP_ASSIGN_MODIFY); }
269 { write_exp_elt_opcode (pstate, STRUCTOP_STRUCT);
270 write_exp_string (pstate, $3);
271 write_exp_elt_opcode (pstate, STRUCTOP_STRUCT); }
278 { error (_("Sets are not implemented."));}
281 exp : INCL '(' exp ',' exp ')'
282 { error (_("Sets are not implemented."));}
285 exp : EXCL '(' exp ',' exp ')'
286 { error (_("Sets are not implemented."));}
289 set : '{' arglist '}'
290 { error (_("Sets are not implemented."));}
291 | type '{' arglist '}'
292 { error (_("Sets are not implemented."));}
296 /* Modula-2 array subscript notation [a,b,c...] */
298 /* This function just saves the number of arguments
299 that follow in the list. It is *not* specific to
302 non_empty_arglist ']' %prec DOT
303 { write_exp_elt_opcode (pstate, MULTI_SUBSCRIPT);
304 write_exp_elt_longcst (pstate,
305 (LONGEST) end_arglist());
306 write_exp_elt_opcode (pstate, MULTI_SUBSCRIPT); }
309 exp : exp '[' exp ']'
310 { write_exp_elt_opcode (pstate, BINOP_SUBSCRIPT); }
314 /* This is to save the value of arglist_len
315 being accumulated by an outer function call. */
316 { start_arglist (); }
317 arglist ')' %prec DOT
318 { write_exp_elt_opcode (pstate, OP_FUNCALL);
319 write_exp_elt_longcst (pstate,
320 (LONGEST) end_arglist ());
321 write_exp_elt_opcode (pstate, OP_FUNCALL); }
331 arglist : arglist ',' exp %prec ABOVE_COMMA
341 : non_empty_arglist ',' exp %prec ABOVE_COMMA
346 exp : '{' type '}' exp %prec UNARY
347 { write_exp_elt_opcode (pstate, UNOP_MEMVAL);
348 write_exp_elt_type (pstate, $2);
349 write_exp_elt_opcode (pstate, UNOP_MEMVAL); }
352 exp : type '(' exp ')' %prec UNARY
353 { write_exp_elt_opcode (pstate, UNOP_CAST);
354 write_exp_elt_type (pstate, $1);
355 write_exp_elt_opcode (pstate, UNOP_CAST); }
362 /* Binary operators in order of decreasing precedence. Note that some
363 of these operators are overloaded! (i.e., sets) */
367 { write_exp_elt_opcode (pstate, BINOP_REPEAT); }
371 { write_exp_elt_opcode (pstate, BINOP_MUL); }
375 { write_exp_elt_opcode (pstate, BINOP_DIV); }
379 { write_exp_elt_opcode (pstate, BINOP_INTDIV); }
383 { write_exp_elt_opcode (pstate, BINOP_REM); }
387 { write_exp_elt_opcode (pstate, BINOP_ADD); }
391 { write_exp_elt_opcode (pstate, BINOP_SUB); }
395 { write_exp_elt_opcode (pstate, BINOP_EQUAL); }
398 exp : exp NOTEQUAL exp
399 { write_exp_elt_opcode (pstate, BINOP_NOTEQUAL); }
401 { write_exp_elt_opcode (pstate, BINOP_NOTEQUAL); }
405 { write_exp_elt_opcode (pstate, BINOP_LEQ); }
409 { write_exp_elt_opcode (pstate, BINOP_GEQ); }
413 { write_exp_elt_opcode (pstate, BINOP_LESS); }
417 { write_exp_elt_opcode (pstate, BINOP_GTR); }
420 exp : exp LOGICAL_AND exp
421 { write_exp_elt_opcode (pstate, BINOP_LOGICAL_AND); }
425 { write_exp_elt_opcode (pstate, BINOP_LOGICAL_OR); }
429 { write_exp_elt_opcode (pstate, BINOP_ASSIGN); }
436 { write_exp_elt_opcode (pstate, OP_BOOL);
437 write_exp_elt_longcst (pstate, (LONGEST) $1);
438 write_exp_elt_opcode (pstate, OP_BOOL); }
442 { write_exp_elt_opcode (pstate, OP_BOOL);
443 write_exp_elt_longcst (pstate, (LONGEST) $1);
444 write_exp_elt_opcode (pstate, OP_BOOL); }
448 { write_exp_elt_opcode (pstate, OP_LONG);
449 write_exp_elt_type (pstate,
450 parse_m2_type (pstate)->builtin_int);
451 write_exp_elt_longcst (pstate, (LONGEST) $1);
452 write_exp_elt_opcode (pstate, OP_LONG); }
457 write_exp_elt_opcode (pstate, OP_LONG);
458 write_exp_elt_type (pstate,
459 parse_m2_type (pstate)
461 write_exp_elt_longcst (pstate, (LONGEST) $1);
462 write_exp_elt_opcode (pstate, OP_LONG);
467 { write_exp_elt_opcode (pstate, OP_LONG);
468 write_exp_elt_type (pstate,
469 parse_m2_type (pstate)
471 write_exp_elt_longcst (pstate, (LONGEST) $1);
472 write_exp_elt_opcode (pstate, OP_LONG); }
477 { write_exp_elt_opcode (pstate, OP_DOUBLE);
478 write_exp_elt_type (pstate,
479 parse_m2_type (pstate)
481 write_exp_elt_dblcst (pstate, $1);
482 write_exp_elt_opcode (pstate, OP_DOUBLE); }
488 exp : SIZE '(' type ')' %prec UNARY
489 { write_exp_elt_opcode (pstate, OP_LONG);
490 write_exp_elt_type (pstate,
491 parse_type (pstate)->builtin_int);
492 write_exp_elt_longcst (pstate,
493 (LONGEST) TYPE_LENGTH ($3));
494 write_exp_elt_opcode (pstate, OP_LONG); }
498 { write_exp_elt_opcode (pstate, OP_M2_STRING);
499 write_exp_string (pstate, $1);
500 write_exp_elt_opcode (pstate, OP_M2_STRING); }
503 /* This will be used for extensions later, such as adding modules. */
505 { $$ = SYMBOL_BLOCK_VALUE($1); }
510 = lookup_symbol (copy_name ($1),
511 expression_context_block,
512 VAR_DOMAIN, 0).symbol;
517 /* GDB scope operator */
518 fblock : block COLONCOLON BLOCKNAME
520 = lookup_symbol (copy_name ($3), $1,
521 VAR_DOMAIN, 0).symbol;
522 if (!tem || SYMBOL_CLASS (tem) != LOC_BLOCK)
523 error (_("No function \"%s\" in specified context."),
529 /* Useful for assigning to PROCEDURE variables */
531 { write_exp_elt_opcode (pstate, OP_VAR_VALUE);
532 write_exp_elt_block (pstate, NULL);
533 write_exp_elt_sym (pstate, $1);
534 write_exp_elt_opcode (pstate, OP_VAR_VALUE); }
537 /* GDB internal ($foo) variable */
538 variable: INTERNAL_VAR
541 /* GDB scope operator */
542 variable: block COLONCOLON NAME
543 { struct block_symbol sym
544 = lookup_symbol (copy_name ($3), $1,
548 error (_("No symbol \"%s\" in specified context."),
550 if (symbol_read_needs_frame (sym.symbol))
552 if (innermost_block == 0
553 || contained_in (sym.block,
555 innermost_block = sym.block;
558 write_exp_elt_opcode (pstate, OP_VAR_VALUE);
559 write_exp_elt_block (pstate, sym.block);
560 write_exp_elt_sym (pstate, sym.symbol);
561 write_exp_elt_opcode (pstate, OP_VAR_VALUE); }
564 /* Base case for variables. */
566 { struct block_symbol sym;
567 struct field_of_this_result is_a_field_of_this;
569 sym = lookup_symbol (copy_name ($1),
570 expression_context_block,
572 &is_a_field_of_this);
576 if (symbol_read_needs_frame (sym.symbol))
578 if (innermost_block == 0 ||
579 contained_in (sym.block,
581 innermost_block = sym.block;
584 write_exp_elt_opcode (pstate, OP_VAR_VALUE);
585 write_exp_elt_block (pstate, sym.block);
586 write_exp_elt_sym (pstate, sym.symbol);
587 write_exp_elt_opcode (pstate, OP_VAR_VALUE);
591 struct bound_minimal_symbol msymbol;
592 char *arg = copy_name ($1);
595 lookup_bound_minimal_symbol (arg);
596 if (msymbol.minsym != NULL)
597 write_exp_msymbol (pstate, msymbol);
598 else if (!have_full_symbols () && !have_partial_symbols ())
599 error (_("No symbol table is loaded. Use the \"symbol-file\" command."));
601 error (_("No symbol \"%s\" in current context."),
609 { $$ = lookup_typename (parse_language (pstate),
610 parse_gdbarch (pstate),
612 expression_context_block, 0); }
618 /* Take care of parsing a number (anything that starts with a digit).
619 Set yylval and return the token type; update lexptr.
620 OLEN is the number of characters in it. */
622 /*** Needs some error checking for the float case ***/
625 parse_number (int olen)
627 const char *p = lexptr;
631 int base = input_radix;
633 int unsigned_p = number_sign == 1 ? 1 : 0;
640 else if(p[len-1] == 'C' || p[len-1] == 'B')
643 ischar = p[len-1] == 'C';
647 /* Scan the number */
648 for (c = 0; c < len; c++)
650 if (p[c] == '.' && base == 10)
652 /* It's a float since it contains a point. */
653 yylval.dval = atof (p);
657 if (p[c] == '.' && base != 10)
658 error (_("Floating point numbers must be base 10."));
659 if (base == 10 && (p[c] < '0' || p[c] > '9'))
660 error (_("Invalid digit \'%c\' in number."),p[c]);
667 if( base == 8 && (c == '8' || c == '9'))
668 error (_("Invalid digit \'%c\' in octal number."),c);
669 if (c >= '0' && c <= '9')
673 if (base == 16 && c >= 'A' && c <= 'F')
681 if(!unsigned_p && number_sign == 1 && (prevn >= n))
682 unsigned_p=1; /* Try something unsigned */
683 /* Don't do the range check if n==i and i==0, since that special
684 case will give an overflow error. */
685 if(RANGE_CHECK && n!=i && i)
687 if((unsigned_p && (unsigned)prevn >= (unsigned)n) ||
688 ((!unsigned_p && number_sign==-1) && -prevn <= -n))
689 range_error (_("Overflow on numeric constant."));
695 if(*p == 'B' || *p == 'C' || *p == 'H')
696 lexptr++; /* Advance past B,C or H */
703 else if ( unsigned_p && number_sign == 1)
708 else if((unsigned_p && (n<0))) {
709 range_error (_("Overflow on numeric constant -- number too large."));
710 /* But, this can return if range_check == range_warn. */
725 { {'<', '>'}, NOTEQUAL },
726 { {':', '='}, ASSIGN },
729 { {':', ':'}, COLONCOLON },
733 /* Some specific keywords */
740 static struct keyword keytab[] =
743 {"IN", IN },/* Note space after IN */
744 {"AND", LOGICAL_AND},
762 {"FLOAT", FLOAT_FUNC },
768 /* Read one token, getting characters through lexptr. */
770 /* This is where we will check to make sure that the language and the
771 operators used are compatible */
779 const char *tokstart;
784 prev_lexptr = lexptr;
789 /* See if it is a special token of length 2 */
790 for( i = 0 ; i < (int) (sizeof tokentab2 / sizeof tokentab2[0]) ; i++)
791 if (strncmp (tokentab2[i].name, tokstart, 2) == 0)
794 return tokentab2[i].token;
797 switch (c = *tokstart)
814 if (paren_depth == 0)
821 if (comma_terminates && paren_depth == 0)
827 /* Might be a floating point number. */
828 if (lexptr[1] >= '0' && lexptr[1] <= '9')
829 break; /* Falls into number code. */
836 /* These are character tokens that appear as-is in the YACC grammar */
859 for (namelen = 1; (c = tokstart[namelen]) != quote && c != '\0'; namelen++)
862 c = tokstart[++namelen];
863 if (c >= '0' && c <= '9')
865 c = tokstart[++namelen];
866 if (c >= '0' && c <= '9')
867 c = tokstart[++namelen];
871 error (_("Unterminated string or character constant."));
872 yylval.sval.ptr = tokstart + 1;
873 yylval.sval.length = namelen - 1;
874 lexptr += namelen + 1;
876 if(namelen == 2) /* Single character */
878 yylval.ulval = tokstart[1];
885 /* Is it a number? */
886 /* Note: We have already dealt with the case of the token '.'.
887 See case '.' above. */
888 if ((c >= '0' && c <= '9'))
891 int got_dot = 0, got_e = 0;
892 const char *p = tokstart;
897 if (!got_e && (*p == 'e' || *p == 'E'))
899 else if (!got_dot && *p == '.')
901 else if (got_e && (p[-1] == 'e' || p[-1] == 'E')
902 && (*p == '-' || *p == '+'))
903 /* This is the sign of the exponent, not the end of the
906 else if ((*p < '0' || *p > '9') &&
907 (*p < 'A' || *p > 'F') &&
908 (*p != 'H')) /* Modula-2 hexadecimal number */
911 toktype = parse_number (p - tokstart);
912 if (toktype == ERROR)
914 char *err_copy = (char *) alloca (p - tokstart + 1);
916 memcpy (err_copy, tokstart, p - tokstart);
917 err_copy[p - tokstart] = 0;
918 error (_("Invalid number \"%s\"."), err_copy);
924 if (!(c == '_' || c == '$'
925 || (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z')))
926 /* We must have come across a bad character (e.g. ';'). */
927 error (_("Invalid character '%c' in expression."), c);
929 /* It's a name. See how long it is. */
931 for (c = tokstart[namelen];
932 (c == '_' || c == '$' || (c >= '0' && c <= '9')
933 || (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z'));
934 c = tokstart[++namelen])
937 /* The token "if" terminates the expression and is NOT
938 removed from the input stream. */
939 if (namelen == 2 && tokstart[0] == 'i' && tokstart[1] == 'f')
946 /* Lookup special keywords */
947 for(i = 0 ; i < (int) (sizeof(keytab) / sizeof(keytab[0])) ; i++)
948 if (namelen == strlen (keytab[i].keyw)
949 && strncmp (tokstart, keytab[i].keyw, namelen) == 0)
950 return keytab[i].token;
952 yylval.sval.ptr = tokstart;
953 yylval.sval.length = namelen;
955 if (*tokstart == '$')
957 write_dollar_variable (pstate, yylval.sval);
961 /* Use token-type BLOCKNAME for symbols that happen to be defined as
962 functions. Otherwise,
963 use token-type TYPENAME for symbols that happen to be defined
964 currently as names of types, and NAME for other symbols.
965 The caller is not constrained to care about the distinction. */
969 char *tmp = copy_name (yylval.sval);
972 if (lookup_symtab (tmp))
974 sym = lookup_symbol (tmp, expression_context_block, VAR_DOMAIN, 0).symbol;
975 if (sym && SYMBOL_CLASS (sym) == LOC_BLOCK)
977 if (lookup_typename (parse_language (pstate), parse_gdbarch (pstate),
978 copy_name (yylval.sval),
979 expression_context_block, 1))
984 switch(SYMBOL_CLASS (sym))
990 case LOC_REGPARM_ADDR:
993 case LOC_CONST_BYTES:
994 case LOC_OPTIMIZED_OUT:
1005 error (_("internal: Undefined class in m2lex()"));
1008 case LOC_UNRESOLVED:
1009 error (_("internal: Unforseen case in m2lex()"));
1012 error (_("unhandled token in m2lex()"));
1018 /* Built-in BOOLEAN type. This is sort of a hack. */
1019 if (strncmp (tokstart, "TRUE", 4) == 0)
1024 else if (strncmp (tokstart, "FALSE", 5) == 0)
1031 /* Must be another type of name... */
1037 m2_parse (struct parser_state *par_state)
1039 /* Setting up the parser state. */
1040 scoped_restore pstate_restore = make_scoped_restore (&pstate);
1041 gdb_assert (par_state != NULL);
1048 yyerror (const char *msg)
1051 lexptr = prev_lexptr;
1053 error (_("A %s in expression, near `%s'."), (msg ? msg : "error"), lexptr);