1 /* YACC parser for D expressions, for GDB.
3 Copyright (C) 2014-2017 Free Software Foundation, Inc.
5 This file is part of GDB.
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3 of the License, or
10 (at your option) any later version.
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with this program. If not, see <http://www.gnu.org/licenses/>. */
20 /* This file is derived from c-exp.y, jv-exp.y. */
22 /* Parse a D expression from text in a string,
23 and return the result as a struct expression pointer.
24 That structure contains arithmetic operations in reverse polish,
25 with constants represented by operations that are followed by special data.
26 See expression.h for the details of the format.
27 What is important here is that it can be built up sequentially
28 during the process of parsing; the lower levels of the tree always
29 come first in the result.
31 Note that malloc's and realloc's in this file are transformed to
32 xmalloc and xrealloc respectively by the same sed command in the
33 makefile that remaps any other malloc/realloc inserted by the parser
34 generator. Doing this with #defines and trying to control the interaction
35 with include files (<malloc.h> and <stdlib.h> for example) just became
36 too messy, particularly when such includes can be inserted at random
37 times by the parser generator. */
43 #include "expression.h"
45 #include "parser-defs.h"
49 #include "bfd.h" /* Required by objfiles.h. */
50 #include "symfile.h" /* Required by objfiles.h. */
51 #include "objfiles.h" /* For have_full_symbols and have_partial_symbols */
55 #define parse_type(ps) builtin_type (parse_gdbarch (ps))
56 #define parse_d_type(ps) builtin_d_type (parse_gdbarch (ps))
58 /* Remap normal yacc parser interface names (yyparse, yylex, yyerror,
60 #define GDB_YY_REMAP_PREFIX d_
63 /* The state of the parser, used internally when we are parsing the
66 static struct parser_state *pstate = NULL;
70 static int yylex (void);
72 void yyerror (char *);
74 static int type_aggregate_p (struct type *);
78 /* Although the yacc "value" of an expression is not used,
79 since the result is stored in the structure being created,
80 other node types do have values. */
94 struct typed_stoken tsval;
101 enum exp_opcode opcode;
102 struct stoken_vector svec;
106 /* YYSTYPE gets defined by %union */
107 static int parse_number (struct parser_state *, const char *,
108 int, int, YYSTYPE *);
111 %token <sval> IDENTIFIER UNKNOWN_NAME
112 %token <tsym> TYPENAME
113 %token <voidval> COMPLETE
115 /* A NAME_OR_INT is a symbol which is not known in the symbol table,
116 but which would parse as a valid number in the current input radix.
117 E.g. "c" when input_radix==16. Depending on the parse, it will be
118 turned into a name or into a number. */
120 %token <sval> NAME_OR_INT
122 %token <typed_val_int> INTEGER_LITERAL
123 %token <typed_val_float> FLOAT_LITERAL
124 %token <tsval> CHARACTER_LITERAL
125 %token <tsval> STRING_LITERAL
127 %type <svec> StringExp
128 %type <tval> BasicType TypeExp
129 %type <sval> IdentifierExp
130 %type <ival> ArrayLiteral
135 /* Keywords that have a constant value. */
136 %token TRUE_KEYWORD FALSE_KEYWORD NULL_KEYWORD
137 /* Class 'super' accessor. */
140 %token CAST_KEYWORD SIZEOF_KEYWORD
141 %token TYPEOF_KEYWORD TYPEID_KEYWORD
143 /* Comparison keywords. */
144 /* Type storage classes. */
145 %token IMMUTABLE_KEYWORD CONST_KEYWORD SHARED_KEYWORD
146 /* Non-scalar type keywords. */
147 %token STRUCT_KEYWORD UNION_KEYWORD
148 %token CLASS_KEYWORD INTERFACE_KEYWORD
149 %token ENUM_KEYWORD TEMPLATE_KEYWORD
150 %token DELEGATE_KEYWORD FUNCTION_KEYWORD
152 %token <sval> DOLLAR_VARIABLE
154 %token <opcode> ASSIGN_MODIFY
157 %right '=' ASSIGN_MODIFY
164 %left EQUAL NOTEQUAL '<' '>' LEQ GEQ
169 %left IDENTITY NOTIDENTITY
170 %right INCREMENT DECREMENT
182 /* Expressions, including the comma operator. */
190 | AssignExpression ',' CommaExpression
191 { write_exp_elt_opcode (pstate, BINOP_COMMA); }
195 ConditionalExpression
196 | ConditionalExpression '=' AssignExpression
197 { write_exp_elt_opcode (pstate, BINOP_ASSIGN); }
198 | ConditionalExpression ASSIGN_MODIFY AssignExpression
199 { write_exp_elt_opcode (pstate, BINOP_ASSIGN_MODIFY);
200 write_exp_elt_opcode (pstate, $2);
201 write_exp_elt_opcode (pstate, BINOP_ASSIGN_MODIFY); }
204 ConditionalExpression:
206 | OrOrExpression '?' Expression ':' ConditionalExpression
207 { write_exp_elt_opcode (pstate, TERNOP_COND); }
212 | OrOrExpression OROR AndAndExpression
213 { write_exp_elt_opcode (pstate, BINOP_LOGICAL_OR); }
218 | AndAndExpression ANDAND OrExpression
219 { write_exp_elt_opcode (pstate, BINOP_LOGICAL_AND); }
224 | OrExpression '|' XorExpression
225 { write_exp_elt_opcode (pstate, BINOP_BITWISE_IOR); }
230 | XorExpression '^' AndExpression
231 { write_exp_elt_opcode (pstate, BINOP_BITWISE_XOR); }
236 | AndExpression '&' CmpExpression
237 { write_exp_elt_opcode (pstate, BINOP_BITWISE_AND); }
248 ShiftExpression EQUAL ShiftExpression
249 { write_exp_elt_opcode (pstate, BINOP_EQUAL); }
250 | ShiftExpression NOTEQUAL ShiftExpression
251 { write_exp_elt_opcode (pstate, BINOP_NOTEQUAL); }
255 ShiftExpression IDENTITY ShiftExpression
256 { write_exp_elt_opcode (pstate, BINOP_EQUAL); }
257 | ShiftExpression NOTIDENTITY ShiftExpression
258 { write_exp_elt_opcode (pstate, BINOP_NOTEQUAL); }
262 ShiftExpression '<' ShiftExpression
263 { write_exp_elt_opcode (pstate, BINOP_LESS); }
264 | ShiftExpression LEQ ShiftExpression
265 { write_exp_elt_opcode (pstate, BINOP_LEQ); }
266 | ShiftExpression '>' ShiftExpression
267 { write_exp_elt_opcode (pstate, BINOP_GTR); }
268 | ShiftExpression GEQ ShiftExpression
269 { write_exp_elt_opcode (pstate, BINOP_GEQ); }
274 | ShiftExpression LSH AddExpression
275 { write_exp_elt_opcode (pstate, BINOP_LSH); }
276 | ShiftExpression RSH AddExpression
277 { write_exp_elt_opcode (pstate, BINOP_RSH); }
282 | AddExpression '+' MulExpression
283 { write_exp_elt_opcode (pstate, BINOP_ADD); }
284 | AddExpression '-' MulExpression
285 { write_exp_elt_opcode (pstate, BINOP_SUB); }
286 | AddExpression '~' MulExpression
287 { write_exp_elt_opcode (pstate, BINOP_CONCAT); }
292 | MulExpression '*' UnaryExpression
293 { write_exp_elt_opcode (pstate, BINOP_MUL); }
294 | MulExpression '/' UnaryExpression
295 { write_exp_elt_opcode (pstate, BINOP_DIV); }
296 | MulExpression '%' UnaryExpression
297 { write_exp_elt_opcode (pstate, BINOP_REM); }
301 { write_exp_elt_opcode (pstate, UNOP_ADDR); }
302 | INCREMENT UnaryExpression
303 { write_exp_elt_opcode (pstate, UNOP_PREINCREMENT); }
304 | DECREMENT UnaryExpression
305 { write_exp_elt_opcode (pstate, UNOP_PREDECREMENT); }
306 | '*' UnaryExpression
307 { write_exp_elt_opcode (pstate, UNOP_IND); }
308 | '-' UnaryExpression
309 { write_exp_elt_opcode (pstate, UNOP_NEG); }
310 | '+' UnaryExpression
311 { write_exp_elt_opcode (pstate, UNOP_PLUS); }
312 | '!' UnaryExpression
313 { write_exp_elt_opcode (pstate, UNOP_LOGICAL_NOT); }
314 | '~' UnaryExpression
315 { write_exp_elt_opcode (pstate, UNOP_COMPLEMENT); }
316 | TypeExp '.' SIZEOF_KEYWORD
317 { write_exp_elt_opcode (pstate, UNOP_SIZEOF); }
323 CAST_KEYWORD '(' TypeExp ')' UnaryExpression
324 { write_exp_elt_opcode (pstate, UNOP_CAST_TYPE); }
325 /* C style cast is illegal D, but is still recognised in
326 the grammar, so we keep this around for convenience. */
327 | '(' TypeExp ')' UnaryExpression
328 { write_exp_elt_opcode (pstate, UNOP_CAST_TYPE); }
334 | PostfixExpression HATHAT UnaryExpression
335 { write_exp_elt_opcode (pstate, BINOP_EXP); }
340 | PostfixExpression '.' COMPLETE
342 mark_struct_expression (pstate);
343 write_exp_elt_opcode (pstate, STRUCTOP_STRUCT);
346 write_exp_string (pstate, s);
347 write_exp_elt_opcode (pstate, STRUCTOP_STRUCT); }
348 | PostfixExpression '.' IDENTIFIER
349 { write_exp_elt_opcode (pstate, STRUCTOP_STRUCT);
350 write_exp_string (pstate, $3);
351 write_exp_elt_opcode (pstate, STRUCTOP_STRUCT); }
352 | PostfixExpression '.' IDENTIFIER COMPLETE
353 { mark_struct_expression (pstate);
354 write_exp_elt_opcode (pstate, STRUCTOP_STRUCT);
355 write_exp_string (pstate, $3);
356 write_exp_elt_opcode (pstate, STRUCTOP_STRUCT); }
357 | PostfixExpression '.' SIZEOF_KEYWORD
358 { write_exp_elt_opcode (pstate, UNOP_SIZEOF); }
359 | PostfixExpression INCREMENT
360 { write_exp_elt_opcode (pstate, UNOP_POSTINCREMENT); }
361 | PostfixExpression DECREMENT
362 { write_exp_elt_opcode (pstate, UNOP_POSTDECREMENT); }
371 | ArgumentList ',' AssignExpression
382 PostfixExpression '('
383 { start_arglist (); }
385 { write_exp_elt_opcode (pstate, OP_FUNCALL);
386 write_exp_elt_longcst (pstate, (LONGEST) end_arglist ());
387 write_exp_elt_opcode (pstate, OP_FUNCALL); }
391 PostfixExpression '[' ArgumentList ']'
392 { if (arglist_len > 0)
394 write_exp_elt_opcode (pstate, MULTI_SUBSCRIPT);
395 write_exp_elt_longcst (pstate, (LONGEST) arglist_len);
396 write_exp_elt_opcode (pstate, MULTI_SUBSCRIPT);
399 write_exp_elt_opcode (pstate, BINOP_SUBSCRIPT);
404 PostfixExpression '[' ']'
405 { /* Do nothing. */ }
406 | PostfixExpression '[' AssignExpression DOTDOT AssignExpression ']'
407 { write_exp_elt_opcode (pstate, TERNOP_SLICE); }
412 { /* Do nothing. */ }
414 { struct bound_minimal_symbol msymbol;
415 char *copy = copy_name ($1);
416 struct field_of_this_result is_a_field_of_this;
417 struct block_symbol sym;
419 /* Handle VAR, which could be local or global. */
420 sym = lookup_symbol (copy, expression_context_block, VAR_DOMAIN,
421 &is_a_field_of_this);
422 if (sym.symbol && SYMBOL_CLASS (sym.symbol) != LOC_TYPEDEF)
424 if (symbol_read_needs_frame (sym.symbol))
426 if (innermost_block == 0
427 || contained_in (sym.block, innermost_block))
428 innermost_block = sym.block;
431 write_exp_elt_opcode (pstate, OP_VAR_VALUE);
432 write_exp_elt_block (pstate, sym.block);
433 write_exp_elt_sym (pstate, sym.symbol);
434 write_exp_elt_opcode (pstate, OP_VAR_VALUE);
436 else if (is_a_field_of_this.type != NULL)
438 /* It hangs off of `this'. Must not inadvertently convert from a
439 method call to data ref. */
440 if (innermost_block == 0
441 || contained_in (sym.block, innermost_block))
442 innermost_block = sym.block;
443 write_exp_elt_opcode (pstate, OP_THIS);
444 write_exp_elt_opcode (pstate, OP_THIS);
445 write_exp_elt_opcode (pstate, STRUCTOP_PTR);
446 write_exp_string (pstate, $1);
447 write_exp_elt_opcode (pstate, STRUCTOP_PTR);
451 /* Lookup foreign name in global static symbols. */
452 msymbol = lookup_bound_minimal_symbol (copy);
453 if (msymbol.minsym != NULL)
454 write_exp_msymbol (pstate, msymbol);
455 else if (!have_full_symbols () && !have_partial_symbols ())
456 error (_("No symbol table is loaded. Use the \"file\" command"));
458 error (_("No symbol \"%s\" in current context."), copy);
461 | TypeExp '.' IdentifierExp
462 { struct type *type = check_typedef ($1);
464 /* Check if the qualified name is in the global
465 context. However if the symbol has not already
466 been resolved, it's not likely to be found. */
467 if (TYPE_CODE (type) == TYPE_CODE_MODULE)
469 struct bound_minimal_symbol msymbol;
470 struct block_symbol sym;
471 const char *type_name = TYPE_SAFE_NAME (type);
472 int type_name_len = strlen (type_name);
475 name = xstrprintf ("%.*s.%.*s",
476 type_name_len, type_name,
478 make_cleanup (xfree, name);
481 lookup_symbol (name, (const struct block *) NULL,
485 write_exp_elt_opcode (pstate, OP_VAR_VALUE);
486 write_exp_elt_block (pstate, sym.block);
487 write_exp_elt_sym (pstate, sym.symbol);
488 write_exp_elt_opcode (pstate, OP_VAR_VALUE);
492 msymbol = lookup_bound_minimal_symbol (name);
493 if (msymbol.minsym != NULL)
494 write_exp_msymbol (pstate, msymbol);
495 else if (!have_full_symbols () && !have_partial_symbols ())
496 error (_("No symbol table is loaded. Use the \"file\" command."));
498 error (_("No symbol \"%s\" in current context."), name);
501 /* Check if the qualified name resolves as a member
502 of an aggregate or an enum type. */
503 if (!type_aggregate_p (type))
504 error (_("`%s' is not defined as an aggregate type."),
505 TYPE_SAFE_NAME (type));
507 write_exp_elt_opcode (pstate, OP_SCOPE);
508 write_exp_elt_type (pstate, type);
509 write_exp_string (pstate, $3);
510 write_exp_elt_opcode (pstate, OP_SCOPE);
513 { write_dollar_variable (pstate, $1); }
516 parse_number (pstate, $1.ptr, $1.length, 0, &val);
517 write_exp_elt_opcode (pstate, OP_LONG);
518 write_exp_elt_type (pstate, val.typed_val_int.type);
519 write_exp_elt_longcst (pstate,
520 (LONGEST) val.typed_val_int.val);
521 write_exp_elt_opcode (pstate, OP_LONG); }
523 { struct type *type = parse_d_type (pstate)->builtin_void;
524 type = lookup_pointer_type (type);
525 write_exp_elt_opcode (pstate, OP_LONG);
526 write_exp_elt_type (pstate, type);
527 write_exp_elt_longcst (pstate, (LONGEST) 0);
528 write_exp_elt_opcode (pstate, OP_LONG); }
530 { write_exp_elt_opcode (pstate, OP_BOOL);
531 write_exp_elt_longcst (pstate, (LONGEST) 1);
532 write_exp_elt_opcode (pstate, OP_BOOL); }
534 { write_exp_elt_opcode (pstate, OP_BOOL);
535 write_exp_elt_longcst (pstate, (LONGEST) 0);
536 write_exp_elt_opcode (pstate, OP_BOOL); }
538 { write_exp_elt_opcode (pstate, OP_LONG);
539 write_exp_elt_type (pstate, $1.type);
540 write_exp_elt_longcst (pstate, (LONGEST)($1.val));
541 write_exp_elt_opcode (pstate, OP_LONG); }
543 { write_exp_elt_opcode (pstate, OP_DOUBLE);
544 write_exp_elt_type (pstate, $1.type);
545 write_exp_elt_dblcst (pstate, $1.dval);
546 write_exp_elt_opcode (pstate, OP_DOUBLE); }
548 { struct stoken_vector vec;
551 write_exp_string_vector (pstate, $1.type, &vec); }
554 write_exp_string_vector (pstate, 0, &$1);
555 for (i = 0; i < $1.len; ++i)
556 free ($1.tokens[i].ptr);
559 { write_exp_elt_opcode (pstate, OP_ARRAY);
560 write_exp_elt_longcst (pstate, (LONGEST) 0);
561 write_exp_elt_longcst (pstate, (LONGEST) $1 - 1);
562 write_exp_elt_opcode (pstate, OP_ARRAY); }
563 | TYPEOF_KEYWORD '(' Expression ')'
564 { write_exp_elt_opcode (pstate, OP_TYPEOF); }
568 '[' ArgumentList_opt ']'
569 { $$ = arglist_len; }
578 { /* We copy the string here, and not in the
579 lexer, to guarantee that we do not leak a
580 string. Note that we follow the
581 NUL-termination convention of the
583 struct typed_stoken *vec = XNEW (struct typed_stoken);
588 vec->length = $1.length;
589 vec->ptr = (char *) malloc ($1.length + 1);
590 memcpy (vec->ptr, $1.ptr, $1.length + 1);
592 | StringExp STRING_LITERAL
593 { /* Note that we NUL-terminate here, but just
598 = XRESIZEVEC (struct typed_stoken, $$.tokens, $$.len);
600 p = (char *) malloc ($2.length + 1);
601 memcpy (p, $2.ptr, $2.length + 1);
603 $$.tokens[$$.len - 1].type = $2.type;
604 $$.tokens[$$.len - 1].length = $2.length;
605 $$.tokens[$$.len - 1].ptr = p;
611 { /* Do nothing. */ }
613 { write_exp_elt_opcode (pstate, OP_TYPE);
614 write_exp_elt_type (pstate, $1);
615 write_exp_elt_opcode (pstate, OP_TYPE); }
616 | BasicType BasicType2
617 { $$ = follow_types ($1);
618 write_exp_elt_opcode (pstate, OP_TYPE);
619 write_exp_elt_type (pstate, $$);
620 write_exp_elt_opcode (pstate, OP_TYPE);
626 { push_type (tp_pointer); }
628 { push_type (tp_pointer); }
629 | '[' INTEGER_LITERAL ']'
630 { push_type_int ($2.val);
631 push_type (tp_array); }
632 | '[' INTEGER_LITERAL ']' BasicType2
633 { push_type_int ($2.val);
634 push_type (tp_array); }
644 /* Return true if the type is aggregate-like. */
647 type_aggregate_p (struct type *type)
649 return (TYPE_CODE (type) == TYPE_CODE_STRUCT
650 || TYPE_CODE (type) == TYPE_CODE_UNION
651 || TYPE_CODE (type) == TYPE_CODE_MODULE
652 || (TYPE_CODE (type) == TYPE_CODE_ENUM
653 && TYPE_DECLARED_CLASS (type)));
656 /* Take care of parsing a number (anything that starts with a digit).
657 Set yylval and return the token type; update lexptr.
658 LEN is the number of characters in it. */
660 /*** Needs some error checking for the float case ***/
663 parse_number (struct parser_state *ps, const char *p,
664 int len, int parsed_float, YYSTYPE *putithere)
672 int base = input_radix;
676 /* We have found a "L" or "U" suffix. */
677 int found_suffix = 0;
680 struct type *signed_type;
681 struct type *unsigned_type;
689 /* Strip out all embedded '_' before passing to parse_float. */
690 s = (char *) alloca (len + 1);
701 if (! parse_float (s, len, &putithere->typed_val_float.dval, &suffix))
704 suffix_len = s + len - suffix;
708 putithere->typed_val_float.type
709 = parse_d_type (ps)->builtin_double;
711 else if (suffix_len == 1)
713 /* Check suffix for `f', `l', or `i' (float, real, or idouble). */
714 if (tolower (*suffix) == 'f')
716 putithere->typed_val_float.type
717 = parse_d_type (ps)->builtin_float;
719 else if (tolower (*suffix) == 'l')
721 putithere->typed_val_float.type
722 = parse_d_type (ps)->builtin_real;
724 else if (tolower (*suffix) == 'i')
726 putithere->typed_val_float.type
727 = parse_d_type (ps)->builtin_idouble;
732 else if (suffix_len == 2)
734 /* Check suffix for `fi' or `li' (ifloat or ireal). */
735 if (tolower (suffix[0]) == 'f' && tolower (suffix[1] == 'i'))
737 putithere->typed_val_float.type
738 = parse_d_type (ps)->builtin_ifloat;
740 else if (tolower (suffix[0]) == 'l' && tolower (suffix[1] == 'i'))
742 putithere->typed_val_float.type
743 = parse_d_type (ps)->builtin_ireal;
751 return FLOAT_LITERAL;
754 /* Handle base-switching prefixes 0x, 0b, 0 */
787 continue; /* Ignore embedded '_'. */
788 if (c >= 'A' && c <= 'Z')
790 if (c != 'l' && c != 'u')
792 if (c >= '0' && c <= '9')
800 if (base > 10 && c >= 'a' && c <= 'f')
804 n += i = c - 'a' + 10;
806 else if (c == 'l' && long_p == 0)
811 else if (c == 'u' && unsigned_p == 0)
817 return ERROR; /* Char not a digit */
820 return ERROR; /* Invalid digit in this base. */
821 /* Portably test for integer overflow. */
822 if (c != 'l' && c != 'u')
824 ULONGEST n2 = prevn * base;
825 if ((n2 / base != prevn) || (n2 + i < prevn))
826 error (_("Numeric constant too large."));
831 /* An integer constant is an int or a long. An L suffix forces it to
832 be long, and a U suffix forces it to be unsigned. To figure out
833 whether it fits, we shift it right and see whether anything remains.
834 Note that we can't shift sizeof (LONGEST) * HOST_CHAR_BIT bits or
835 more in one operation, because many compilers will warn about such a
836 shift (which always produces a zero result). To deal with the case
837 where it is we just always shift the value more than once, with fewer
839 un = (ULONGEST) n >> 2;
840 if (long_p == 0 && (un >> 30) == 0)
842 high_bit = ((ULONGEST) 1) << 31;
843 signed_type = parse_d_type (ps)->builtin_int;
844 /* For decimal notation, keep the sign of the worked out type. */
845 if (base == 10 && !unsigned_p)
846 unsigned_type = parse_d_type (ps)->builtin_long;
848 unsigned_type = parse_d_type (ps)->builtin_uint;
853 if (sizeof (ULONGEST) * HOST_CHAR_BIT < 64)
854 /* A long long does not fit in a LONGEST. */
855 shift = (sizeof (ULONGEST) * HOST_CHAR_BIT - 1);
858 high_bit = (ULONGEST) 1 << shift;
859 signed_type = parse_d_type (ps)->builtin_long;
860 unsigned_type = parse_d_type (ps)->builtin_ulong;
863 putithere->typed_val_int.val = n;
865 /* If the high bit of the worked out type is set then this number
866 has to be unsigned_type. */
867 if (unsigned_p || (n & high_bit))
868 putithere->typed_val_int.type = unsigned_type;
870 putithere->typed_val_int.type = signed_type;
872 return INTEGER_LITERAL;
875 /* Temporary obstack used for holding strings. */
876 static struct obstack tempbuf;
877 static int tempbuf_init;
879 /* Parse a string or character literal from TOKPTR. The string or
880 character may be wide or unicode. *OUTPTR is set to just after the
881 end of the literal in the input string. The resulting token is
882 stored in VALUE. This returns a token value, either STRING or
883 CHAR, depending on what was parsed. *HOST_CHARS is set to the
884 number of host characters in the literal. */
887 parse_string_or_char (const char *tokptr, const char **outptr,
888 struct typed_stoken *value, int *host_chars)
892 /* Build the gdb internal form of the input string in tempbuf. Note
893 that the buffer is null byte terminated *only* for the
894 convenience of debugging gdb itself and printing the buffer
895 contents when the buffer contains no embedded nulls. Gdb does
896 not depend upon the buffer being null byte terminated, it uses
897 the length string instead. This allows gdb to handle C strings
898 (as well as strings in other languages) with embedded null
904 obstack_free (&tempbuf, NULL);
905 obstack_init (&tempbuf);
907 /* Skip the quote. */
919 *host_chars += c_parse_escape (&tokptr, &tempbuf);
925 obstack_1grow (&tempbuf, c);
927 /* FIXME: this does the wrong thing with multi-byte host
928 characters. We could use mbrlen here, but that would
929 make "set host-charset" a bit less useful. */
934 if (*tokptr != quote)
936 if (quote == '"' || quote == '`')
937 error (_("Unterminated string in expression."));
939 error (_("Unmatched single quote."));
943 /* FIXME: should instead use own language string_type enum
944 and handle D-specific string suffixes here. */
946 value->type = C_CHAR;
948 value->type = C_STRING;
950 value->ptr = (char *) obstack_base (&tempbuf);
951 value->length = obstack_object_size (&tempbuf);
955 return quote == '\'' ? CHARACTER_LITERAL : STRING_LITERAL;
962 enum exp_opcode opcode;
965 static const struct token tokentab3[] =
967 {"^^=", ASSIGN_MODIFY, BINOP_EXP},
968 {"<<=", ASSIGN_MODIFY, BINOP_LSH},
969 {">>=", ASSIGN_MODIFY, BINOP_RSH},
972 static const struct token tokentab2[] =
974 {"+=", ASSIGN_MODIFY, BINOP_ADD},
975 {"-=", ASSIGN_MODIFY, BINOP_SUB},
976 {"*=", ASSIGN_MODIFY, BINOP_MUL},
977 {"/=", ASSIGN_MODIFY, BINOP_DIV},
978 {"%=", ASSIGN_MODIFY, BINOP_REM},
979 {"|=", ASSIGN_MODIFY, BINOP_BITWISE_IOR},
980 {"&=", ASSIGN_MODIFY, BINOP_BITWISE_AND},
981 {"^=", ASSIGN_MODIFY, BINOP_BITWISE_XOR},
982 {"++", INCREMENT, BINOP_END},
983 {"--", DECREMENT, BINOP_END},
984 {"&&", ANDAND, BINOP_END},
985 {"||", OROR, BINOP_END},
986 {"^^", HATHAT, BINOP_END},
987 {"<<", LSH, BINOP_END},
988 {">>", RSH, BINOP_END},
989 {"==", EQUAL, BINOP_END},
990 {"!=", NOTEQUAL, BINOP_END},
991 {"<=", LEQ, BINOP_END},
992 {">=", GEQ, BINOP_END},
993 {"..", DOTDOT, BINOP_END},
996 /* Identifier-like tokens. */
997 static const struct token ident_tokens[] =
999 {"is", IDENTITY, BINOP_END},
1000 {"!is", NOTIDENTITY, BINOP_END},
1002 {"cast", CAST_KEYWORD, OP_NULL},
1003 {"const", CONST_KEYWORD, OP_NULL},
1004 {"immutable", IMMUTABLE_KEYWORD, OP_NULL},
1005 {"shared", SHARED_KEYWORD, OP_NULL},
1006 {"super", SUPER_KEYWORD, OP_NULL},
1008 {"null", NULL_KEYWORD, OP_NULL},
1009 {"true", TRUE_KEYWORD, OP_NULL},
1010 {"false", FALSE_KEYWORD, OP_NULL},
1012 {"init", INIT_KEYWORD, OP_NULL},
1013 {"sizeof", SIZEOF_KEYWORD, OP_NULL},
1014 {"typeof", TYPEOF_KEYWORD, OP_NULL},
1015 {"typeid", TYPEID_KEYWORD, OP_NULL},
1017 {"delegate", DELEGATE_KEYWORD, OP_NULL},
1018 {"function", FUNCTION_KEYWORD, OP_NULL},
1019 {"struct", STRUCT_KEYWORD, OP_NULL},
1020 {"union", UNION_KEYWORD, OP_NULL},
1021 {"class", CLASS_KEYWORD, OP_NULL},
1022 {"interface", INTERFACE_KEYWORD, OP_NULL},
1023 {"enum", ENUM_KEYWORD, OP_NULL},
1024 {"template", TEMPLATE_KEYWORD, OP_NULL},
1027 /* This is set if a NAME token appeared at the very end of the input
1028 string, with no whitespace separating the name from the EOF. This
1029 is used only when parsing to do field name completion. */
1030 static int saw_name_at_eof;
1032 /* This is set if the previously-returned token was a structure operator.
1033 This is used only when parsing to do field name completion. */
1034 static int last_was_structop;
1036 /* Read one token, getting characters through lexptr. */
1039 lex_one_token (struct parser_state *par_state)
1044 const char *tokstart;
1045 int saw_structop = last_was_structop;
1048 last_was_structop = 0;
1052 prev_lexptr = lexptr;
1055 /* See if it is a special token of length 3. */
1056 for (i = 0; i < sizeof tokentab3 / sizeof tokentab3[0]; i++)
1057 if (strncmp (tokstart, tokentab3[i].oper, 3) == 0)
1060 yylval.opcode = tokentab3[i].opcode;
1061 return tokentab3[i].token;
1064 /* See if it is a special token of length 2. */
1065 for (i = 0; i < sizeof tokentab2 / sizeof tokentab2[0]; i++)
1066 if (strncmp (tokstart, tokentab2[i].oper, 2) == 0)
1069 yylval.opcode = tokentab2[i].opcode;
1070 return tokentab2[i].token;
1073 switch (c = *tokstart)
1076 /* If we're parsing for field name completion, and the previous
1077 token allows such completion, return a COMPLETE token.
1078 Otherwise, we were already scanning the original text, and
1079 we're really done. */
1080 if (saw_name_at_eof)
1082 saw_name_at_eof = 0;
1085 else if (saw_structop)
1104 if (paren_depth == 0)
1111 if (comma_terminates && paren_depth == 0)
1117 /* Might be a floating point number. */
1118 if (lexptr[1] < '0' || lexptr[1] > '9')
1120 if (parse_completion)
1121 last_was_structop = 1;
1122 goto symbol; /* Nope, must be a symbol. */
1124 /* FALL THRU into number case. */
1137 /* It's a number. */
1138 int got_dot = 0, got_e = 0, toktype;
1139 const char *p = tokstart;
1140 int hex = input_radix > 10;
1142 if (c == '0' && (p[1] == 'x' || p[1] == 'X'))
1150 /* Hex exponents start with 'p', because 'e' is a valid hex
1151 digit and thus does not indicate a floating point number
1152 when the radix is hex. */
1153 if ((!hex && !got_e && tolower (p[0]) == 'e')
1154 || (hex && !got_e && tolower (p[0] == 'p')))
1155 got_dot = got_e = 1;
1156 /* A '.' always indicates a decimal floating point number
1157 regardless of the radix. If we have a '..' then its the
1158 end of the number and the beginning of a slice. */
1159 else if (!got_dot && (p[0] == '.' && p[1] != '.'))
1161 /* This is the sign of the exponent, not the end of the number. */
1162 else if (got_e && (tolower (p[-1]) == 'e' || tolower (p[-1]) == 'p')
1163 && (*p == '-' || *p == '+'))
1165 /* We will take any letters or digits, ignoring any embedded '_'.
1166 parse_number will complain if past the radix, or if L or U are
1168 else if ((*p < '0' || *p > '9') && (*p != '_')
1169 && ((*p < 'a' || *p > 'z') && (*p < 'A' || *p > 'Z')))
1173 toktype = parse_number (par_state, tokstart, p - tokstart,
1174 got_dot|got_e, &yylval);
1175 if (toktype == ERROR)
1177 char *err_copy = (char *) alloca (p - tokstart + 1);
1179 memcpy (err_copy, tokstart, p - tokstart);
1180 err_copy[p - tokstart] = 0;
1181 error (_("Invalid number \"%s\"."), err_copy);
1189 const char *p = &tokstart[1];
1190 size_t len = strlen ("entry");
1192 while (isspace (*p))
1194 if (strncmp (p, "entry", len) == 0 && !isalnum (p[len])
1228 int result = parse_string_or_char (tokstart, &lexptr, &yylval.tsval,
1230 if (result == CHARACTER_LITERAL)
1233 error (_("Empty character constant."));
1234 else if (host_len > 2 && c == '\'')
1237 namelen = lexptr - tokstart - 1;
1240 else if (host_len > 1)
1241 error (_("Invalid character constant."));
1247 if (!(c == '_' || c == '$'
1248 || (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z')))
1249 /* We must have come across a bad character (e.g. ';'). */
1250 error (_("Invalid character '%c' in expression"), c);
1252 /* It's a name. See how long it is. */
1254 for (c = tokstart[namelen];
1255 (c == '_' || c == '$' || (c >= '0' && c <= '9')
1256 || (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z'));)
1257 c = tokstart[++namelen];
1259 /* The token "if" terminates the expression and is NOT
1260 removed from the input stream. */
1261 if (namelen == 2 && tokstart[0] == 'i' && tokstart[1] == 'f')
1264 /* For the same reason (breakpoint conditions), "thread N"
1265 terminates the expression. "thread" could be an identifier, but
1266 an identifier is never followed by a number without intervening
1267 punctuation. "task" is similar. Handle abbreviations of these,
1268 similarly to breakpoint.c:find_condition_and_thread. */
1270 && (strncmp (tokstart, "thread", namelen) == 0
1271 || strncmp (tokstart, "task", namelen) == 0)
1272 && (tokstart[namelen] == ' ' || tokstart[namelen] == '\t'))
1274 const char *p = tokstart + namelen + 1;
1276 while (*p == ' ' || *p == '\t')
1278 if (*p >= '0' && *p <= '9')
1286 yylval.sval.ptr = tokstart;
1287 yylval.sval.length = namelen;
1289 /* Catch specific keywords. */
1290 copy = copy_name (yylval.sval);
1291 for (i = 0; i < sizeof ident_tokens / sizeof ident_tokens[0]; i++)
1292 if (strcmp (copy, ident_tokens[i].oper) == 0)
1294 /* It is ok to always set this, even though we don't always
1295 strictly need to. */
1296 yylval.opcode = ident_tokens[i].opcode;
1297 return ident_tokens[i].token;
1300 if (*tokstart == '$')
1301 return DOLLAR_VARIABLE;
1304 = language_lookup_primitive_type (parse_language (par_state),
1305 parse_gdbarch (par_state), copy);
1306 if (yylval.tsym.type != NULL)
1309 /* Input names that aren't symbols but ARE valid hex numbers,
1310 when the input radix permits them, can be names or numbers
1311 depending on the parse. Note we support radixes > 16 here. */
1312 if ((tokstart[0] >= 'a' && tokstart[0] < 'a' + input_radix - 10)
1313 || (tokstart[0] >= 'A' && tokstart[0] < 'A' + input_radix - 10))
1315 YYSTYPE newlval; /* Its value is ignored. */
1316 int hextype = parse_number (par_state, tokstart, namelen, 0, &newlval);
1317 if (hextype == INTEGER_LITERAL)
1321 if (parse_completion && *lexptr == '\0')
1322 saw_name_at_eof = 1;
1327 /* An object of this type is pushed on a FIFO by the "outer" lexer. */
1334 DEF_VEC_O (token_and_value);
1336 /* A FIFO of tokens that have been read but not yet returned to the
1338 static VEC (token_and_value) *token_fifo;
1340 /* Non-zero if the lexer should return tokens from the FIFO. */
1343 /* Temporary storage for yylex; this holds symbol names as they are
1345 static struct obstack name_obstack;
1347 /* Classify an IDENTIFIER token. The contents of the token are in `yylval'.
1348 Updates yylval and returns the new token type. BLOCK is the block
1349 in which lookups start; this can be NULL to mean the global scope. */
1352 classify_name (struct parser_state *par_state, const struct block *block)
1354 struct block_symbol sym;
1356 struct field_of_this_result is_a_field_of_this;
1358 copy = copy_name (yylval.sval);
1360 sym = lookup_symbol (copy, block, VAR_DOMAIN, &is_a_field_of_this);
1361 if (sym.symbol && SYMBOL_CLASS (sym.symbol) == LOC_TYPEDEF)
1363 yylval.tsym.type = SYMBOL_TYPE (sym.symbol);
1366 else if (sym.symbol == NULL)
1368 /* Look-up first for a module name, then a type. */
1369 sym = lookup_symbol (copy, block, MODULE_DOMAIN, NULL);
1370 if (sym.symbol == NULL)
1371 sym = lookup_symbol (copy, block, STRUCT_DOMAIN, NULL);
1373 if (sym.symbol != NULL)
1375 yylval.tsym.type = SYMBOL_TYPE (sym.symbol);
1379 return UNKNOWN_NAME;
1385 /* Like classify_name, but used by the inner loop of the lexer, when a
1386 name might have already been seen. CONTEXT is the context type, or
1387 NULL if this is the first component of a name. */
1390 classify_inner_name (struct parser_state *par_state,
1391 const struct block *block, struct type *context)
1396 if (context == NULL)
1397 return classify_name (par_state, block);
1399 type = check_typedef (context);
1400 if (!type_aggregate_p (type))
1403 copy = copy_name (yylval.ssym.stoken);
1404 yylval.ssym.sym = d_lookup_nested_symbol (type, copy, block);
1406 if (yylval.ssym.sym.symbol == NULL)
1409 if (SYMBOL_CLASS (yylval.ssym.sym.symbol) == LOC_TYPEDEF)
1411 yylval.tsym.type = SYMBOL_TYPE (yylval.ssym.sym.symbol);
1418 /* The outer level of a two-level lexer. This calls the inner lexer
1419 to return tokens. It then either returns these tokens, or
1420 aggregates them into a larger token. This lets us work around a
1421 problem in our parsing approach, where the parser could not
1422 distinguish between qualified names and qualified types at the
1428 token_and_value current;
1430 struct type *context_type = NULL;
1431 int last_to_examine, next_to_examine, checkpoint;
1432 const struct block *search_block;
1434 if (popping && !VEC_empty (token_and_value, token_fifo))
1438 /* Read the first token and decide what to do. */
1439 current.token = lex_one_token (pstate);
1440 if (current.token != IDENTIFIER && current.token != '.')
1441 return current.token;
1443 /* Read any sequence of alternating "." and identifier tokens into
1445 current.value = yylval;
1446 VEC_safe_push (token_and_value, token_fifo, ¤t);
1447 last_was_dot = current.token == '.';
1451 current.token = lex_one_token (pstate);
1452 current.value = yylval;
1453 VEC_safe_push (token_and_value, token_fifo, ¤t);
1455 if ((last_was_dot && current.token != IDENTIFIER)
1456 || (!last_was_dot && current.token != '.'))
1459 last_was_dot = !last_was_dot;
1463 /* We always read one extra token, so compute the number of tokens
1464 to examine accordingly. */
1465 last_to_examine = VEC_length (token_and_value, token_fifo) - 2;
1466 next_to_examine = 0;
1468 current = *VEC_index (token_and_value, token_fifo, next_to_examine);
1471 /* If we are not dealing with a typename, now is the time to find out. */
1472 if (current.token == IDENTIFIER)
1474 yylval = current.value;
1475 current.token = classify_name (pstate, expression_context_block);
1476 current.value = yylval;
1479 /* If the IDENTIFIER is not known, it could be a package symbol,
1480 first try building up a name until we find the qualified module. */
1481 if (current.token == UNKNOWN_NAME)
1483 obstack_free (&name_obstack, obstack_base (&name_obstack));
1484 obstack_grow (&name_obstack, current.value.sval.ptr,
1485 current.value.sval.length);
1489 while (next_to_examine <= last_to_examine)
1491 token_and_value *next;
1493 next = VEC_index (token_and_value, token_fifo, next_to_examine);
1496 if (next->token == IDENTIFIER && last_was_dot)
1498 /* Update the partial name we are constructing. */
1499 obstack_grow_str (&name_obstack, ".");
1500 obstack_grow (&name_obstack, next->value.sval.ptr,
1501 next->value.sval.length);
1503 yylval.sval.ptr = (char *) obstack_base (&name_obstack);
1504 yylval.sval.length = obstack_object_size (&name_obstack);
1506 current.token = classify_name (pstate, expression_context_block);
1507 current.value = yylval;
1509 /* We keep going until we find a TYPENAME. */
1510 if (current.token == TYPENAME)
1512 /* Install it as the first token in the FIFO. */
1513 VEC_replace (token_and_value, token_fifo, 0, ¤t);
1514 VEC_block_remove (token_and_value, token_fifo, 1,
1515 next_to_examine - 1);
1519 else if (next->token == '.' && !last_was_dot)
1523 /* We've reached the end of the name. */
1528 /* Reset our current token back to the start, if we found nothing
1529 this means that we will just jump to do pop. */
1530 current = *VEC_index (token_and_value, token_fifo, 0);
1531 next_to_examine = 1;
1533 if (current.token != TYPENAME && current.token != '.')
1536 obstack_free (&name_obstack, obstack_base (&name_obstack));
1538 if (current.token == '.')
1539 search_block = NULL;
1542 gdb_assert (current.token == TYPENAME);
1543 search_block = expression_context_block;
1544 obstack_grow (&name_obstack, current.value.sval.ptr,
1545 current.value.sval.length);
1546 context_type = current.value.tsym.type;
1550 last_was_dot = current.token == '.';
1552 while (next_to_examine <= last_to_examine)
1554 token_and_value *next;
1556 next = VEC_index (token_and_value, token_fifo, next_to_examine);
1559 if (next->token == IDENTIFIER && last_was_dot)
1563 yylval = next->value;
1564 classification = classify_inner_name (pstate, search_block,
1566 /* We keep going until we either run out of names, or until
1567 we have a qualified name which is not a type. */
1568 if (classification != TYPENAME && classification != IDENTIFIER)
1571 /* Accept up to this token. */
1572 checkpoint = next_to_examine;
1574 /* Update the partial name we are constructing. */
1575 if (context_type != NULL)
1577 /* We don't want to put a leading "." into the name. */
1578 obstack_grow_str (&name_obstack, ".");
1580 obstack_grow (&name_obstack, next->value.sval.ptr,
1581 next->value.sval.length);
1583 yylval.sval.ptr = (char *) obstack_base (&name_obstack);
1584 yylval.sval.length = obstack_object_size (&name_obstack);
1585 current.value = yylval;
1586 current.token = classification;
1590 if (classification == IDENTIFIER)
1593 context_type = yylval.tsym.type;
1595 else if (next->token == '.' && !last_was_dot)
1599 /* We've reached the end of the name. */
1604 /* If we have a replacement token, install it as the first token in
1605 the FIFO, and delete the other constituent tokens. */
1608 VEC_replace (token_and_value, token_fifo, 0, ¤t);
1610 VEC_block_remove (token_and_value, token_fifo, 1, checkpoint - 1);
1614 current = *VEC_index (token_and_value, token_fifo, 0);
1615 VEC_ordered_remove (token_and_value, token_fifo, 0);
1616 yylval = current.value;
1617 return current.token;
1621 d_parse (struct parser_state *par_state)
1624 struct cleanup *back_to;
1626 /* Setting up the parser state. */
1627 gdb_assert (par_state != NULL);
1630 back_to = make_cleanup (null_cleanup, NULL);
1632 make_cleanup_restore_integer (&yydebug);
1633 make_cleanup_clear_parser_state (&pstate);
1634 yydebug = parser_debug;
1636 /* Initialize some state used by the lexer. */
1637 last_was_structop = 0;
1638 saw_name_at_eof = 0;
1640 VEC_free (token_and_value, token_fifo);
1642 obstack_init (&name_obstack);
1643 make_cleanup_obstack_free (&name_obstack);
1645 result = yyparse ();
1646 do_cleanups (back_to);
1654 lexptr = prev_lexptr;
1656 error (_("A %s in expression, near `%s'."), (msg ? msg : "error"), lexptr);