1 /* YACC parser for Pascal expressions, for GDB.
3 Free Software Foundation, Inc.
5 This file is part of GDB.
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 2 of the License, or
10 (at your option) any later version.
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with this program; if not, write to the Free Software
19 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
21 /* This file is derived from c-exp.y */
23 /* Parse a Pascal expression from text in a string,
24 and return the result as a struct expression pointer.
25 That structure contains arithmetic operations in reverse polish,
26 with constants represented by operations that are followed by special data.
27 See expression.h for the details of the format.
28 What is important here is that it can be built up sequentially
29 during the process of parsing; the lower levels of the tree always
30 come first in the result.
32 Note that malloc's and realloc's in this file are transformed to
33 xmalloc and xrealloc respectively by the same sed command in the
34 makefile that remaps any other malloc/realloc inserted by the parser
35 generator. Doing this with #defines and trying to control the interaction
36 with include files (<malloc.h> and <stdlib.h> for example) just became
37 too messy, particularly when such includes can be inserted at random
38 times by the parser generator. */
40 /* Known bugs or limitations:
41 - pascal string operations are not supported at all.
42 - there are some problems with boolean types.
43 - Pascal-style hexadecimal constants are not supported
44 because they conflict with the internal variables format.
45 Probably also lots of other problems, less well defined PM */
49 #include "gdb_string.h"
51 #include "expression.h"
53 #include "parser-defs.h"
56 #include "bfd.h" /* Required by objfiles.h. */
57 #include "symfile.h" /* Required by objfiles.h. */
58 #include "objfiles.h" /* For have_full_symbols and have_partial_symbols */
60 /* Remap normal yacc parser interface names (yyparse, yylex, yyerror, etc),
61 as well as gratuitously global symbol names, so we can have multiple
62 yacc generated parsers in gdb. Note that these are only the variables
63 produced by yacc. If other parser generators (bison, byacc, etc) produce
64 additional global names that conflict at link time, then those parser
65 generators need to be fixed instead of adding those names to this list. */
67 #define yymaxdepth pascal_maxdepth
68 #define yyparse pascal_parse
69 #define yylex pascal_lex
70 #define yyerror pascal_error
71 #define yylval pascal_lval
72 #define yychar pascal_char
73 #define yydebug pascal_debug
74 #define yypact pascal_pact
75 #define yyr1 pascal_r1
76 #define yyr2 pascal_r2
77 #define yydef pascal_def
78 #define yychk pascal_chk
79 #define yypgo pascal_pgo
80 #define yyact pascal_act
81 #define yyexca pascal_exca
82 #define yyerrflag pascal_errflag
83 #define yynerrs pascal_nerrs
84 #define yyps pascal_ps
85 #define yypv pascal_pv
87 #define yy_yys pascal_yys
88 #define yystate pascal_state
89 #define yytmp pascal_tmp
91 #define yy_yyv pascal_yyv
92 #define yyval pascal_val
93 #define yylloc pascal_lloc
94 #define yyreds pascal_reds /* With YYDEBUG defined */
95 #define yytoks pascal_toks /* With YYDEBUG defined */
96 #define yyname pascal_name /* With YYDEBUG defined */
97 #define yyrule pascal_rule /* With YYDEBUG defined */
98 #define yylhs pascal_yylhs
99 #define yylen pascal_yylen
100 #define yydefred pascal_yydefred
101 #define yydgoto pascal_yydgoto
102 #define yysindex pascal_yysindex
103 #define yyrindex pascal_yyrindex
104 #define yygindex pascal_yygindex
105 #define yytable pascal_yytable
106 #define yycheck pascal_yycheck
109 #define YYDEBUG 1 /* Default to yydebug support */
112 #define YYFPRINTF parser_fprintf
116 static int yylex (void);
121 static char * uptok (char *, int);
124 /* Although the yacc "value" of an expression is not used,
125 since the result is stored in the structure being created,
126 other node types do have values. */
143 struct symtoken ssym;
146 enum exp_opcode opcode;
147 struct internalvar *ivar;
154 /* YYSTYPE gets defined by %union */
156 parse_number (char *, int, int, YYSTYPE *);
158 static struct type *current_type;
160 static void push_current_type ();
161 static void pop_current_type ();
162 static int search_field;
165 %type <voidval> exp exp1 type_exp start normal_start variable qualified_name
166 %type <tval> type typebase
167 /* %type <bval> block */
169 /* Fancy type parsing. */
172 %token <typed_val_int> INT
173 %token <typed_val_float> FLOAT
175 /* Both NAME and TYPENAME tokens represent symbols in the input,
176 and both convey their data as strings.
177 But a TYPENAME is a string that happens to be defined as a typedef
178 or builtin type name (such as int or char)
179 and a NAME is any other symbol.
180 Contexts where this distinction is not important can use the
181 nonterminal "name", which matches either NAME or TYPENAME. */
184 %token <sval> FIELDNAME
185 %token <ssym> NAME /* BLOCKNAME defined below to give it higher precedence. */
186 %token <tsym> TYPENAME
188 %type <ssym> name_not_typename
190 /* A NAME_OR_INT is a symbol which is not known in the symbol table,
191 but which would parse as a valid number in the current input radix.
192 E.g. "c" when input_radix==16. Depending on the parse, it will be
193 turned into a name or into a number. */
195 %token <ssym> NAME_OR_INT
197 %token STRUCT CLASS SIZEOF COLONCOLON
200 /* Special type cases, put in to allow the parser to distinguish different
203 %token <voidval> VARIABLE
208 %token <lval> TRUE FALSE
218 %left '<' '>' LEQ GEQ
219 %left LSH RSH DIV MOD
223 %right UNARY INCREMENT DECREMENT
224 %right ARROW '.' '[' '('
226 %token <ssym> BLOCKNAME
233 start : { current_type = NULL;
244 { write_exp_elt_opcode(OP_TYPE);
245 write_exp_elt_type($1);
246 write_exp_elt_opcode(OP_TYPE);
247 current_type = $1; } ;
249 /* Expressions, including the comma operator. */
252 { write_exp_elt_opcode (BINOP_COMMA); }
255 /* Expressions, not including the comma operator. */
256 exp : exp '^' %prec UNARY
257 { write_exp_elt_opcode (UNOP_IND);
259 current_type = TYPE_TARGET_TYPE (current_type); }
261 exp : '@' exp %prec UNARY
262 { write_exp_elt_opcode (UNOP_ADDR);
264 current_type = TYPE_POINTER_TYPE (current_type); }
266 exp : '-' exp %prec UNARY
267 { write_exp_elt_opcode (UNOP_NEG); }
270 exp : NOT exp %prec UNARY
271 { write_exp_elt_opcode (UNOP_LOGICAL_NOT); }
274 exp : INCREMENT '(' exp ')' %prec UNARY
275 { write_exp_elt_opcode (UNOP_PREINCREMENT); }
278 exp : DECREMENT '(' exp ')' %prec UNARY
279 { write_exp_elt_opcode (UNOP_PREDECREMENT); }
282 exp : exp '.' { search_field = 1; }
285 { write_exp_elt_opcode (STRUCTOP_STRUCT);
286 write_exp_string ($4);
287 write_exp_elt_opcode (STRUCTOP_STRUCT);
290 { while (TYPE_CODE (current_type) == TYPE_CODE_PTR)
291 current_type = TYPE_TARGET_TYPE (current_type);
292 current_type = lookup_struct_elt_type (
293 current_type, $4.ptr, false); };
296 /* We need to save the current_type value */
299 arrayfieldindex = is_pascal_string_type (
300 current_type, NULL, NULL,
301 NULL, NULL, &arrayname);
304 struct stoken stringsval;
305 stringsval.ptr = alloca (strlen (arrayname) + 1);
306 stringsval.length = strlen (arrayname);
307 strcpy (stringsval.ptr, arrayname);
308 current_type = TYPE_FIELD_TYPE (current_type,
309 arrayfieldindex - 1);
310 write_exp_elt_opcode (STRUCTOP_STRUCT);
311 write_exp_string (stringsval);
312 write_exp_elt_opcode (STRUCTOP_STRUCT);
314 push_current_type (); }
316 { pop_current_type ();
317 write_exp_elt_opcode (BINOP_SUBSCRIPT);
319 current_type = TYPE_TARGET_TYPE (current_type); }
322 /* This is to save the value of arglist_len
323 being accumulated by an outer function call. */
324 { push_current_type ();
326 arglist ')' %prec ARROW
327 { write_exp_elt_opcode (OP_FUNCALL);
328 write_exp_elt_longcst ((LONGEST) end_arglist ());
329 write_exp_elt_opcode (OP_FUNCALL);
330 pop_current_type (); }
336 | arglist ',' exp %prec ABOVE_COMMA
340 exp : type '(' exp ')' %prec UNARY
341 { write_exp_elt_opcode (UNOP_CAST);
342 write_exp_elt_type ($1);
343 write_exp_elt_opcode (UNOP_CAST);
351 /* Binary operators in order of decreasing precedence. */
354 { write_exp_elt_opcode (BINOP_MUL); }
358 { write_exp_elt_opcode (BINOP_DIV); }
362 { write_exp_elt_opcode (BINOP_INTDIV); }
366 { write_exp_elt_opcode (BINOP_REM); }
370 { write_exp_elt_opcode (BINOP_ADD); }
374 { write_exp_elt_opcode (BINOP_SUB); }
378 { write_exp_elt_opcode (BINOP_LSH); }
382 { write_exp_elt_opcode (BINOP_RSH); }
386 { write_exp_elt_opcode (BINOP_EQUAL); }
389 exp : exp NOTEQUAL exp
390 { write_exp_elt_opcode (BINOP_NOTEQUAL); }
394 { write_exp_elt_opcode (BINOP_LEQ); }
398 { write_exp_elt_opcode (BINOP_GEQ); }
402 { write_exp_elt_opcode (BINOP_LESS); }
406 { write_exp_elt_opcode (BINOP_GTR); }
410 { write_exp_elt_opcode (BINOP_BITWISE_AND); }
414 { write_exp_elt_opcode (BINOP_BITWISE_XOR); }
418 { write_exp_elt_opcode (BINOP_BITWISE_IOR); }
422 { write_exp_elt_opcode (BINOP_ASSIGN); }
426 { write_exp_elt_opcode (OP_BOOL);
427 write_exp_elt_longcst ((LONGEST) $1);
428 write_exp_elt_opcode (OP_BOOL); }
432 { write_exp_elt_opcode (OP_BOOL);
433 write_exp_elt_longcst ((LONGEST) $1);
434 write_exp_elt_opcode (OP_BOOL); }
438 { write_exp_elt_opcode (OP_LONG);
439 write_exp_elt_type ($1.type);
440 write_exp_elt_longcst ((LONGEST)($1.val));
441 write_exp_elt_opcode (OP_LONG); }
446 parse_number ($1.stoken.ptr, $1.stoken.length, 0, &val);
447 write_exp_elt_opcode (OP_LONG);
448 write_exp_elt_type (val.typed_val_int.type);
449 write_exp_elt_longcst ((LONGEST)val.typed_val_int.val);
450 write_exp_elt_opcode (OP_LONG);
456 { write_exp_elt_opcode (OP_DOUBLE);
457 write_exp_elt_type ($1.type);
458 write_exp_elt_dblcst ($1.dval);
459 write_exp_elt_opcode (OP_DOUBLE); }
466 /* Already written by write_dollar_variable. */
469 exp : SIZEOF '(' type ')' %prec UNARY
470 { write_exp_elt_opcode (OP_LONG);
471 write_exp_elt_type (builtin_type_int);
473 write_exp_elt_longcst ((LONGEST) TYPE_LENGTH ($3));
474 write_exp_elt_opcode (OP_LONG); }
478 { /* C strings are converted into array constants with
479 an explicit null byte added at the end. Thus
480 the array upper bound is the string length.
481 There is no such thing in C as a completely empty
483 char *sp = $1.ptr; int count = $1.length;
486 write_exp_elt_opcode (OP_LONG);
487 write_exp_elt_type (builtin_type_char);
488 write_exp_elt_longcst ((LONGEST)(*sp++));
489 write_exp_elt_opcode (OP_LONG);
491 write_exp_elt_opcode (OP_LONG);
492 write_exp_elt_type (builtin_type_char);
493 write_exp_elt_longcst ((LONGEST)'\0');
494 write_exp_elt_opcode (OP_LONG);
495 write_exp_elt_opcode (OP_ARRAY);
496 write_exp_elt_longcst ((LONGEST) 0);
497 write_exp_elt_longcst ((LONGEST) ($1.length));
498 write_exp_elt_opcode (OP_ARRAY); }
503 { write_exp_elt_opcode (OP_THIS);
504 write_exp_elt_opcode (OP_THIS); }
507 /* end of object pascal. */
512 $$ = SYMBOL_BLOCK_VALUE ($1.sym);
516 lookup_symtab (copy_name ($1.stoken));
518 $$ = BLOCKVECTOR_BLOCK (BLOCKVECTOR (tem), STATIC_BLOCK);
520 error ("No file or function \"%s\".",
521 copy_name ($1.stoken));
526 block : block COLONCOLON name
528 = lookup_symbol (copy_name ($3), $1,
529 VAR_NAMESPACE, (int *) NULL,
530 (struct symtab **) NULL);
531 if (!tem || SYMBOL_CLASS (tem) != LOC_BLOCK)
532 error ("No function \"%s\" in specified context.",
534 $$ = SYMBOL_BLOCK_VALUE (tem); }
537 variable: block COLONCOLON name
538 { struct symbol *sym;
539 sym = lookup_symbol (copy_name ($3), $1,
540 VAR_NAMESPACE, (int *) NULL,
541 (struct symtab **) NULL);
543 error ("No symbol \"%s\" in specified context.",
546 write_exp_elt_opcode (OP_VAR_VALUE);
547 /* block_found is set by lookup_symbol. */
548 write_exp_elt_block (block_found);
549 write_exp_elt_sym (sym);
550 write_exp_elt_opcode (OP_VAR_VALUE); }
553 qualified_name: typebase COLONCOLON name
555 struct type *type = $1;
556 if (TYPE_CODE (type) != TYPE_CODE_STRUCT
557 && TYPE_CODE (type) != TYPE_CODE_UNION)
558 error ("`%s' is not defined as an aggregate type.",
561 write_exp_elt_opcode (OP_SCOPE);
562 write_exp_elt_type (type);
563 write_exp_string ($3);
564 write_exp_elt_opcode (OP_SCOPE);
568 variable: qualified_name
571 char *name = copy_name ($2);
573 struct minimal_symbol *msymbol;
576 lookup_symbol (name, (const struct block *) NULL,
577 VAR_NAMESPACE, (int *) NULL,
578 (struct symtab **) NULL);
581 write_exp_elt_opcode (OP_VAR_VALUE);
582 write_exp_elt_block (NULL);
583 write_exp_elt_sym (sym);
584 write_exp_elt_opcode (OP_VAR_VALUE);
588 msymbol = lookup_minimal_symbol (name, NULL, NULL);
591 write_exp_msymbol (msymbol,
592 lookup_function_type (builtin_type_int),
596 if (!have_full_symbols () && !have_partial_symbols ())
597 error ("No symbol table is loaded. Use the \"file\" command.");
599 error ("No symbol \"%s\" in current context.", name);
603 variable: name_not_typename
604 { struct symbol *sym = $1.sym;
608 if (symbol_read_needs_frame (sym))
610 if (innermost_block == 0 ||
611 contained_in (block_found,
613 innermost_block = block_found;
616 write_exp_elt_opcode (OP_VAR_VALUE);
617 /* We want to use the selected frame, not
618 another more inner frame which happens to
619 be in the same block. */
620 write_exp_elt_block (NULL);
621 write_exp_elt_sym (sym);
622 write_exp_elt_opcode (OP_VAR_VALUE);
623 current_type = sym->type; }
624 else if ($1.is_a_field_of_this)
626 struct value * this_val;
627 struct type * this_type;
628 /* Object pascal: it hangs off of `this'. Must
629 not inadvertently convert from a method call
631 if (innermost_block == 0 ||
632 contained_in (block_found, innermost_block))
633 innermost_block = block_found;
634 write_exp_elt_opcode (OP_THIS);
635 write_exp_elt_opcode (OP_THIS);
636 write_exp_elt_opcode (STRUCTOP_PTR);
637 write_exp_string ($1.stoken);
638 write_exp_elt_opcode (STRUCTOP_PTR);
639 /* we need type of this */
640 this_val = value_of_this (0);
642 this_type = this_val->type;
646 current_type = lookup_struct_elt_type (
648 $1.stoken.ptr, false);
654 struct minimal_symbol *msymbol;
655 register char *arg = copy_name ($1.stoken);
658 lookup_minimal_symbol (arg, NULL, NULL);
661 write_exp_msymbol (msymbol,
662 lookup_function_type (builtin_type_int),
665 else if (!have_full_symbols () && !have_partial_symbols ())
666 error ("No symbol table is loaded. Use the \"file\" command.");
668 error ("No symbol \"%s\" in current context.",
669 copy_name ($1.stoken));
678 /* We used to try to recognize more pointer to member types here, but
679 that didn't work (shift/reduce conflicts meant that these rules never
680 got executed). The problem is that
681 int (foo::bar::baz::bizzle)
682 is a function type but
683 int (foo::bar::baz::bizzle::*)
684 is a pointer to member type. Stroustrup loses again! */
687 | typebase COLONCOLON '*'
688 { $$ = lookup_member_type (builtin_type_int, $1); }
691 typebase /* Implements (approximately): (type-qualifier)* type-specifier */
695 { $$ = lookup_struct (copy_name ($2),
696 expression_context_block); }
698 { $$ = lookup_struct (copy_name ($2),
699 expression_context_block); }
700 /* "const" and "volatile" are currently ignored. A type qualifier
701 after the type is handled in the ptype rule. I think these could
705 name : NAME { $$ = $1.stoken; }
706 | BLOCKNAME { $$ = $1.stoken; }
707 | TYPENAME { $$ = $1.stoken; }
708 | NAME_OR_INT { $$ = $1.stoken; }
711 name_not_typename : NAME
713 /* These would be useful if name_not_typename was useful, but it is just
714 a fake for "variable", so these cause reduce/reduce conflicts because
715 the parser can't tell whether NAME_OR_INT is a name_not_typename (=variable,
716 =exp) or just an exp. If name_not_typename was ever used in an lvalue
717 context where only a name could occur, this might be useful.
724 /* Take care of parsing a number (anything that starts with a digit).
725 Set yylval and return the token type; update lexptr.
726 LEN is the number of characters in it. */
728 /*** Needs some error checking for the float case ***/
731 parse_number (p, len, parsed_float, putithere)
737 /* FIXME: Shouldn't these be unsigned? We don't deal with negative values
738 here, and we do kind of silly things like cast to unsigned. */
739 register LONGEST n = 0;
740 register LONGEST prevn = 0;
745 register int base = input_radix;
748 /* Number of "L" suffixes encountered. */
751 /* We have found a "L" or "U" suffix. */
752 int found_suffix = 0;
755 struct type *signed_type;
756 struct type *unsigned_type;
760 /* It's a float since it contains a point or an exponent. */
762 int num = 0; /* number of tokens scanned by scanf */
763 char saved_char = p[len];
765 p[len] = 0; /* null-terminate the token */
766 if (sizeof (putithere->typed_val_float.dval) <= sizeof (float))
767 num = sscanf (p, "%g%c", (float *) &putithere->typed_val_float.dval,&c);
768 else if (sizeof (putithere->typed_val_float.dval) <= sizeof (double))
769 num = sscanf (p, "%lg%c", (double *) &putithere->typed_val_float.dval,&c);
772 #ifdef SCANF_HAS_LONG_DOUBLE
773 num = sscanf (p, "%Lg%c", &putithere->typed_val_float.dval,&c);
775 /* Scan it into a double, then assign it to the long double.
776 This at least wins with values representable in the range
779 num = sscanf (p, "%lg%c", &temp,&c);
780 putithere->typed_val_float.dval = temp;
783 p[len] = saved_char; /* restore the input stream */
784 if (num != 1) /* check scanf found ONLY a float ... */
786 /* See if it has `f' or `l' suffix (float or long double). */
788 c = tolower (p[len - 1]);
791 putithere->typed_val_float.type = builtin_type_float;
793 putithere->typed_val_float.type = builtin_type_long_double;
794 else if (isdigit (c) || c == '.')
795 putithere->typed_val_float.type = builtin_type_double;
802 /* Handle base-switching prefixes 0x, 0t, 0d, 0 */
836 if (c >= 'A' && c <= 'Z')
838 if (c != 'l' && c != 'u')
840 if (c >= '0' && c <= '9')
848 if (base > 10 && c >= 'a' && c <= 'f')
852 n += i = c - 'a' + 10;
865 return ERROR; /* Char not a digit */
868 return ERROR; /* Invalid digit in this base */
870 /* Portably test for overflow (only works for nonzero values, so make
871 a second check for zero). FIXME: Can't we just make n and prevn
872 unsigned and avoid this? */
873 if (c != 'l' && c != 'u' && (prevn >= n) && n != 0)
874 unsigned_p = 1; /* Try something unsigned */
876 /* Portably test for unsigned overflow.
877 FIXME: This check is wrong; for example it doesn't find overflow
878 on 0x123456789 when LONGEST is 32 bits. */
879 if (c != 'l' && c != 'u' && n != 0)
881 if ((unsigned_p && (ULONGEST) prevn >= (ULONGEST) n))
882 error ("Numeric constant too large.");
887 /* An integer constant is an int, a long, or a long long. An L
888 suffix forces it to be long; an LL suffix forces it to be long
889 long. If not forced to a larger size, it gets the first type of
890 the above that it fits in. To figure out whether it fits, we
891 shift it right and see whether anything remains. Note that we
892 can't shift sizeof (LONGEST) * HOST_CHAR_BIT bits or more in one
893 operation, because many compilers will warn about such a shift
894 (which always produces a zero result). Sometimes TARGET_INT_BIT
895 or TARGET_LONG_BIT will be that big, sometimes not. To deal with
896 the case where it is we just always shift the value more than
897 once, with fewer bits each time. */
899 un = (ULONGEST)n >> 2;
901 && (un >> (TARGET_INT_BIT - 2)) == 0)
903 high_bit = ((ULONGEST)1) << (TARGET_INT_BIT-1);
905 /* A large decimal (not hex or octal) constant (between INT_MAX
906 and UINT_MAX) is a long or unsigned long, according to ANSI,
907 never an unsigned int, but this code treats it as unsigned
908 int. This probably should be fixed. GCC gives a warning on
911 unsigned_type = builtin_type_unsigned_int;
912 signed_type = builtin_type_int;
915 && (un >> (TARGET_LONG_BIT - 2)) == 0)
917 high_bit = ((ULONGEST)1) << (TARGET_LONG_BIT-1);
918 unsigned_type = builtin_type_unsigned_long;
919 signed_type = builtin_type_long;
924 if (sizeof (ULONGEST) * HOST_CHAR_BIT < TARGET_LONG_LONG_BIT)
925 /* A long long does not fit in a LONGEST. */
926 shift = (sizeof (ULONGEST) * HOST_CHAR_BIT - 1);
928 shift = (TARGET_LONG_LONG_BIT - 1);
929 high_bit = (ULONGEST) 1 << shift;
930 unsigned_type = builtin_type_unsigned_long_long;
931 signed_type = builtin_type_long_long;
934 putithere->typed_val_int.val = n;
936 /* If the high bit of the worked out type is set then this number
937 has to be unsigned. */
939 if (unsigned_p || (n & high_bit))
941 putithere->typed_val_int.type = unsigned_type;
945 putithere->typed_val_int.type = signed_type;
955 struct type_push *next;
958 static struct type_push *tp_top = NULL;
960 static void push_current_type ()
962 struct type_push *tpnew;
963 tpnew = (struct type_push *) malloc (sizeof (struct type_push));
964 tpnew->next = tp_top;
965 tpnew->stored = current_type;
970 static void pop_current_type ()
972 struct type_push *tp = tp_top;
975 current_type = tp->stored;
985 enum exp_opcode opcode;
988 static const struct token tokentab3[] =
990 {"shr", RSH, BINOP_END},
991 {"shl", LSH, BINOP_END},
992 {"and", ANDAND, BINOP_END},
993 {"div", DIV, BINOP_END},
994 {"not", NOT, BINOP_END},
995 {"mod", MOD, BINOP_END},
996 {"inc", INCREMENT, BINOP_END},
997 {"dec", DECREMENT, BINOP_END},
998 {"xor", XOR, BINOP_END}
1001 static const struct token tokentab2[] =
1003 {"or", OR, BINOP_END},
1004 {"<>", NOTEQUAL, BINOP_END},
1005 {"<=", LEQ, BINOP_END},
1006 {">=", GEQ, BINOP_END},
1007 {":=", ASSIGN, BINOP_END},
1008 {"::", COLONCOLON, BINOP_END} };
1010 /* Allocate uppercased var */
1011 /* make an uppercased copy of tokstart */
1012 static char * uptok (tokstart, namelen)
1017 char *uptokstart = (char *)malloc(namelen+1);
1018 for (i = 0;i <= namelen;i++)
1020 if ((tokstart[i]>='a' && tokstart[i]<='z'))
1021 uptokstart[i] = tokstart[i]-('a'-'A');
1023 uptokstart[i] = tokstart[i];
1025 uptokstart[namelen]='\0';
1028 /* Read one token, getting characters through lexptr. */
1041 int explen, tempbufindex;
1042 static char *tempbuf;
1043 static int tempbufsize;
1047 prev_lexptr = lexptr;
1050 explen = strlen (lexptr);
1051 /* See if it is a special token of length 3. */
1053 for (i = 0; i < sizeof (tokentab3) / sizeof (tokentab3[0]); i++)
1054 if (strncasecmp (tokstart, tokentab3[i].operator, 3) == 0
1055 && (!isalpha (tokentab3[i].operator[0]) || explen == 3
1056 || (!isalpha (tokstart[3]) && !isdigit (tokstart[3]) && tokstart[3] != '_')))
1059 yylval.opcode = tokentab3[i].opcode;
1060 return tokentab3[i].token;
1063 /* See if it is a special token of length 2. */
1065 for (i = 0; i < sizeof (tokentab2) / sizeof (tokentab2[0]); i++)
1066 if (strncasecmp (tokstart, tokentab2[i].operator, 2) == 0
1067 && (!isalpha (tokentab2[i].operator[0]) || explen == 2
1068 || (!isalpha (tokstart[2]) && !isdigit (tokstart[2]) && tokstart[2] != '_')))
1071 yylval.opcode = tokentab2[i].opcode;
1072 return tokentab2[i].token;
1075 switch (c = *tokstart)
1087 /* We either have a character constant ('0' or '\177' for example)
1088 or we have a quoted symbol reference ('foo(int,int)' in object pascal
1093 c = parse_escape (&lexptr);
1095 error ("Empty character constant.");
1097 yylval.typed_val_int.val = c;
1098 yylval.typed_val_int.type = builtin_type_char;
1103 namelen = skip_quoted (tokstart) - tokstart;
1106 lexptr = tokstart + namelen;
1107 if (lexptr[-1] != '\'')
1108 error ("Unmatched single quote.");
1111 uptokstart = uptok(tokstart,namelen);
1114 error ("Invalid character constant.");
1124 if (paren_depth == 0)
1131 if (comma_terminates && paren_depth == 0)
1137 /* Might be a floating point number. */
1138 if (lexptr[1] < '0' || lexptr[1] > '9')
1139 goto symbol; /* Nope, must be a symbol. */
1140 /* FALL THRU into number case. */
1153 /* It's a number. */
1154 int got_dot = 0, got_e = 0, toktype;
1155 register char *p = tokstart;
1156 int hex = input_radix > 10;
1158 if (c == '0' && (p[1] == 'x' || p[1] == 'X'))
1163 else if (c == '0' && (p[1]=='t' || p[1]=='T' || p[1]=='d' || p[1]=='D'))
1171 /* This test includes !hex because 'e' is a valid hex digit
1172 and thus does not indicate a floating point number when
1173 the radix is hex. */
1174 if (!hex && !got_e && (*p == 'e' || *p == 'E'))
1175 got_dot = got_e = 1;
1176 /* This test does not include !hex, because a '.' always indicates
1177 a decimal floating point number regardless of the radix. */
1178 else if (!got_dot && *p == '.')
1180 else if (got_e && (p[-1] == 'e' || p[-1] == 'E')
1181 && (*p == '-' || *p == '+'))
1182 /* This is the sign of the exponent, not the end of the
1185 /* We will take any letters or digits. parse_number will
1186 complain if past the radix, or if L or U are not final. */
1187 else if ((*p < '0' || *p > '9')
1188 && ((*p < 'a' || *p > 'z')
1189 && (*p < 'A' || *p > 'Z')))
1192 toktype = parse_number (tokstart, p - tokstart, got_dot|got_e, &yylval);
1193 if (toktype == ERROR)
1195 char *err_copy = (char *) alloca (p - tokstart + 1);
1197 memcpy (err_copy, tokstart, p - tokstart);
1198 err_copy[p - tokstart] = 0;
1199 error ("Invalid number \"%s\".", err_copy);
1230 /* Build the gdb internal form of the input string in tempbuf,
1231 translating any standard C escape forms seen. Note that the
1232 buffer is null byte terminated *only* for the convenience of
1233 debugging gdb itself and printing the buffer contents when
1234 the buffer contains no embedded nulls. Gdb does not depend
1235 upon the buffer being null byte terminated, it uses the length
1236 string instead. This allows gdb to handle C strings (as well
1237 as strings in other languages) with embedded null bytes */
1239 tokptr = ++tokstart;
1243 /* Grow the static temp buffer if necessary, including allocating
1244 the first one on demand. */
1245 if (tempbufindex + 1 >= tempbufsize)
1247 tempbuf = (char *) realloc (tempbuf, tempbufsize += 64);
1254 /* Do nothing, loop will terminate. */
1258 c = parse_escape (&tokptr);
1263 tempbuf[tempbufindex++] = c;
1266 tempbuf[tempbufindex++] = *tokptr++;
1269 } while ((*tokptr != '"') && (*tokptr != '\0'));
1270 if (*tokptr++ != '"')
1272 error ("Unterminated string in expression.");
1274 tempbuf[tempbufindex] = '\0'; /* See note above */
1275 yylval.sval.ptr = tempbuf;
1276 yylval.sval.length = tempbufindex;
1281 if (!(c == '_' || c == '$'
1282 || (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z')))
1283 /* We must have come across a bad character (e.g. ';'). */
1284 error ("Invalid character '%c' in expression.", c);
1286 /* It's a name. See how long it is. */
1288 for (c = tokstart[namelen];
1289 (c == '_' || c == '$' || (c >= '0' && c <= '9')
1290 || (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z') || c == '<');)
1292 /* Template parameter lists are part of the name.
1293 FIXME: This mishandles `print $a<4&&$a>3'. */
1297 int nesting_level = 1;
1298 while (tokstart[++i])
1300 if (tokstart[i] == '<')
1302 else if (tokstart[i] == '>')
1304 if (--nesting_level == 0)
1308 if (tokstart[i] == '>')
1314 /* do NOT uppercase internals because of registers !!! */
1315 c = tokstart[++namelen];
1318 uptokstart = uptok(tokstart,namelen);
1320 /* The token "if" terminates the expression and is NOT
1321 removed from the input stream. */
1322 if (namelen == 2 && uptokstart[0] == 'I' && uptokstart[1] == 'F')
1331 /* Catch specific keywords. Should be done with a data structure. */
1335 if (STREQ (uptokstart, "OBJECT"))
1337 if (STREQ (uptokstart, "RECORD"))
1339 if (STREQ (uptokstart, "SIZEOF"))
1343 if (STREQ (uptokstart, "CLASS"))
1345 if (STREQ (uptokstart, "FALSE"))
1352 if (STREQ (uptokstart, "TRUE"))
1357 if (STREQ (uptokstart, "SELF"))
1359 /* Here we search for 'this', as it is
1360 inserted in FPC stabs debug info.  */
1361 static const char this_name[] =
1362 { /* CPLUS_MARKER,*/ 't', 'h', 'i', 's', '\0' };
1364 if (lookup_symbol (this_name, expression_context_block,
1365 VAR_NAMESPACE, (int *) NULL,
1366 (struct symtab **) NULL))
1374 yylval.sval.ptr = tokstart;
1375 yylval.sval.length = namelen;
1377 if (*tokstart == '$')
1379 /* $ is the normal prefix for Pascal hexadecimal values,
1380 but this conflicts with the GDB use for debugger variables,
1381 so to enter a hexadecimal value in an expression
1382 we still need to use the C syntax, e.g. 0xff.  */
1383 write_dollar_variable (yylval.sval);
1387 /* Use token-type BLOCKNAME for symbols that happen to be defined as
1388 functions or symtabs. If this is not so, then ...
1389 Use token-type TYPENAME for symbols that happen to be defined
1390 currently as names of types; NAME for other symbols.
1391 The caller is not constrained to care about the distinction. */
1393 char *tmp = copy_name (yylval.sval);
1395 int is_a_field_of_this = 0;
1400 if (search_field && current_type)
1401 is_a_field = (lookup_struct_elt_type (current_type, tmp, 1) != NULL);
1405 sym = lookup_symbol (tmp, expression_context_block,
1407 &is_a_field_of_this,
1408 (struct symtab **) NULL);
1409 /* second chance uppercased (as Free Pascal does). */
1410 if (!sym && !is_a_field_of_this && !is_a_field)
1412 for (i = 0; i <= namelen; i++)
1414 if ((tmp[i] >= 'a' && tmp[i] <= 'z'))
1415 tmp[i] -= ('a'-'A');
1417 if (search_field && current_type)
1418 is_a_field = (lookup_struct_elt_type (current_type, tmp, 1) != NULL);
1422 sym = lookup_symbol (tmp, expression_context_block,
1424 &is_a_field_of_this,
1425 (struct symtab **) NULL);
1426 if (sym || is_a_field_of_this || is_a_field)
1427 for (i = 0; i <= namelen; i++)
1429 if ((tokstart[i] >= 'a' && tokstart[i] <= 'z'))
1430 tokstart[i] -= ('a'-'A');
1433 /* Third chance Capitalized (as GPC does). */
1434 if (!sym && !is_a_field_of_this && !is_a_field)
1436 for (i = 0; i <= namelen; i++)
1440 if ((tmp[i] >= 'a' && tmp[i] <= 'z'))
1441 tmp[i] -= ('a'-'A');
1444 if ((tmp[i] >= 'A' && tmp[i] <= 'Z'))
1445 tmp[i] -= ('A'-'a');
1447 if (search_field && current_type)
1448 is_a_field = (lookup_struct_elt_type (current_type, tmp, 1) != NULL);
1452 sym = lookup_symbol (tmp, expression_context_block,
1454 &is_a_field_of_this,
1455 (struct symtab **) NULL);
1456 if (sym || is_a_field_of_this || is_a_field)
1457 for (i = 0; i <= namelen; i++)
1461 if ((tokstart[i] >= 'a' && tokstart[i] <= 'z'))
1462 tokstart[i] -= ('a'-'A');
1465 if ((tokstart[i] >= 'A' && tokstart[i] <= 'Z'))
1466 tokstart[i] -= ('A'-'a');
1472 tempbuf = (char *) realloc (tempbuf, namelen + 1);
1473 strncpy (tempbuf, tokstart, namelen); tempbuf [namelen] = 0;
1474 yylval.sval.ptr = tempbuf;
1475 yylval.sval.length = namelen;
1478 /* Call lookup_symtab, not lookup_partial_symtab, in case there are
1479 no psymtabs (coff, xcoff, or some future change to blow away the
1480 psymtabs once symbols are read). */
1481 if ((sym && SYMBOL_CLASS (sym) == LOC_BLOCK) ||
1482 lookup_symtab (tmp))
1484 yylval.ssym.sym = sym;
1485 yylval.ssym.is_a_field_of_this = is_a_field_of_this;
1488 if (sym && SYMBOL_CLASS (sym) == LOC_TYPEDEF)
1491 /* Despite the following flaw, we need to keep this code enabled.
1492 Because we can get called from check_stub_method, if we don't
1493 handle nested types then it screws many operations in any
1494 program which uses nested types. */
1495 /* In "A::x", if x is a member function of A and there happens
1496 to be a type (nested or not, since the stabs don't make that
1497 distinction) named x, then this code incorrectly thinks we
1498 are dealing with nested types rather than a member function. */
1502 struct symbol *best_sym;
1504 /* Look ahead to detect nested types. This probably should be
1505 done in the grammar, but trying seemed to introduce a lot
1506 of shift/reduce and reduce/reduce conflicts. It's possible
1507 that it could be done, though. Or perhaps a non-grammar, but
1508 less ad hoc, approach would work well. */
1510 /* Since we do not currently have any way of distinguishing
1511 a nested type from a non-nested one (the stabs don't tell
1512 us whether a type is nested), we just ignore the
1519 /* Skip whitespace. */
1520 while (*p == ' ' || *p == '\t' || *p == '\n')
1522 if (*p == ':' && p[1] == ':')
1524 /* Skip the `::'. */
1526 /* Skip whitespace. */
1527 while (*p == ' ' || *p == '\t' || *p == '\n')
1530 while (*p == '_' || *p == '$' || (*p >= '0' && *p <= '9')
1531 || (*p >= 'a' && *p <= 'z')
1532 || (*p >= 'A' && *p <= 'Z'))
1536 struct symbol *cur_sym;
1537 /* As big as the whole rest of the expression, which is
1538 at least big enough. */
1539 char *ncopy = alloca (strlen (tmp)+strlen (namestart)+3);
1543 memcpy (tmp1, tmp, strlen (tmp));
1544 tmp1 += strlen (tmp);
1545 memcpy (tmp1, "::", 2);
1547 memcpy (tmp1, namestart, p - namestart);
1548 tmp1[p - namestart] = '\0';
1549 cur_sym = lookup_symbol (ncopy, expression_context_block,
1550 VAR_NAMESPACE, (int *) NULL,
1551 (struct symtab **) NULL);
1554 if (SYMBOL_CLASS (cur_sym) == LOC_TYPEDEF)
1572 yylval.tsym.type = SYMBOL_TYPE (best_sym);
1574 yylval.tsym.type = SYMBOL_TYPE (sym);
1578 if ((yylval.tsym.type = lookup_primitive_typename (tmp)) != 0)
1581 /* Input names that aren't symbols but ARE valid hex numbers,
1582 when the input radix permits them, can be names or numbers
1583 depending on the parse. Note we support radixes > 16 here. */
1585 ((tokstart[0] >= 'a' && tokstart[0] < 'a' + input_radix - 10) ||
1586 (tokstart[0] >= 'A' && tokstart[0] < 'A' + input_radix - 10)))
1588 YYSTYPE newlval; /* Its value is ignored. */
1589 hextype = parse_number (tokstart, namelen, 0, &newlval);
1592 yylval.ssym.sym = sym;
1593 yylval.ssym.is_a_field_of_this = is_a_field_of_this;
1599 /* Any other kind of symbol */
1600 yylval.ssym.sym = sym;
1601 yylval.ssym.is_a_field_of_this = is_a_field_of_this;
1611 lexptr = prev_lexptr;
1613 error ("A %s in expression, near `%s'.", (msg ? msg : "error"), lexptr);