1 /* YACC grammar for Chill expressions, for GDB.
2 Copyright 1992, 1993, 1994 Free Software Foundation, Inc.
4 This file is part of GDB.
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, write to the Free Software
18 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. */
20 /* Parse a Chill expression from text in a string,
21 and return the result as a struct expression pointer.
22 That structure contains arithmetic operations in reverse polish,
23 with constants represented by operations that are followed by special data.
24 See expression.h for the details of the format.
25 What is important here is that it can be built up sequentially
26 during the process of parsing; the lower levels of the tree always
27 come first in the result.
29 Note that malloc's and realloc's in this file are transformed to
30 xmalloc and xrealloc respectively by the same sed command in the
31 makefile that remaps any other malloc/realloc inserted by the parser
32 generator. Doing this with #defines and trying to control the interaction
33 with include files (<malloc.h> and <stdlib.h> for example) just became
34 too messy, particularly when such includes can be inserted at random
35 times by the parser generator.
37 Also note that the language accepted by this parser is more liberal
38 than the one accepted by an actual Chill compiler. For example, the
39 language rule that a simple name string can not be one of the reserved
40 simple name strings is not enforced (e.g "case" is not treated as a
41 reserved name). Another example is that Chill is a strongly typed
42 language, and certain expressions that violate the type constraints
43 may still be evaluated if gdb can do so in a meaningful manner, while
44 such expressions would be rejected by the compiler. The reason for
45 this more liberal behavior is the philosophy that the debugger
46 is intended to be a tool that is used by the programmer when things
47 go wrong, and as such, it should provide as few artificial barriers
48 to it's use as possible. If it can do something meaningful, even
49 something that violates language contraints that are enforced by the
50 compiler, it should do so without complaint.
59 #include "expression.h"
62 #include "parser-defs.h"
64 #include "bfd.h" /* Required by objfiles.h. */
65 #include "symfile.h" /* Required by objfiles.h. */
66 #include "objfiles.h" /* For have_full_symbols and have_partial_symbols */
68 /* Remap normal yacc parser interface names (yyparse, yylex, yyerror, etc),
69 as well as gratuitiously global symbol names, so we can have multiple
70 yacc generated parsers in gdb. Note that these are only the variables
71 produced by yacc. If other parser generators (bison, byacc, etc) produce
72 additional global names that conflict at link time, then those parser
73 generators need to be fixed instead of adding those names to this list. */
75 #define yymaxdepth chill_maxdepth
76 #define yyparse chill_parse
77 #define yylex chill_lex
78 #define yyerror chill_error
79 #define yylval chill_lval
80 #define yychar chill_char
81 #define yydebug chill_debug
82 #define yypact chill_pact
85 #define yydef chill_def
86 #define yychk chill_chk
87 #define yypgo chill_pgo
88 #define yyact chill_act
89 #define yyexca chill_exca
90 #define yyerrflag chill_errflag
91 #define yynerrs chill_nerrs
95 #define yy_yys chill_yys
96 #define yystate chill_state
97 #define yytmp chill_tmp
99 #define yy_yyv chill_yyv
100 #define yyval chill_val
101 #define yylloc chill_lloc
102 #define yyreds chill_reds /* With YYDEBUG defined */
103 #define yytoks chill_toks /* With YYDEBUG defined */
104 #define yylhs chill_yylhs
105 #define yylen chill_yylen
106 #define yydefred chill_yydefred
107 #define yydgoto chill_yydgoto
108 #define yysindex chill_yysindex
109 #define yyrindex chill_yyrindex
110 #define yygindex chill_yygindex
111 #define yytable chill_yytable
112 #define yycheck chill_yycheck
115 #define YYDEBUG 0 /* Default to no yydebug support */
119 yyparse PARAMS ((void));
122 yylex PARAMS ((void));
125 yyerror PARAMS ((char *));
129 /* Although the yacc "value" of an expression is not used,
130 since the result is stored in the structure being created,
131 other node types do have values. */
136 unsigned LONGEST ulval;
146 struct symtoken ssym;
149 enum exp_opcode opcode;
150 struct internalvar *ivar;
156 %token <voidval> FIXME_01
157 %token <voidval> FIXME_02
158 %token <voidval> FIXME_03
159 %token <voidval> FIXME_04
160 %token <voidval> FIXME_05
161 %token <voidval> FIXME_06
162 %token <voidval> FIXME_07
163 %token <voidval> FIXME_08
164 %token <voidval> FIXME_09
165 %token <voidval> FIXME_10
166 %token <voidval> FIXME_11
167 %token <voidval> FIXME_12
168 %token <voidval> FIXME_13
169 %token <voidval> FIXME_14
170 %token <voidval> FIXME_15
171 %token <voidval> FIXME_16
172 %token <voidval> FIXME_17
173 %token <voidval> FIXME_18
174 %token <voidval> FIXME_19
175 %token <voidval> FIXME_20
176 %token <voidval> FIXME_21
177 %token <voidval> FIXME_22
178 %token <voidval> FIXME_24
179 %token <voidval> FIXME_25
180 %token <voidval> FIXME_26
181 %token <voidval> FIXME_27
182 %token <voidval> FIXME_28
183 %token <voidval> FIXME_29
184 %token <voidval> FIXME_30
186 %token <typed_val> INTEGER_LITERAL
187 %token <ulval> BOOLEAN_LITERAL
188 %token <typed_val> CHARACTER_LITERAL
189 %token <dval> FLOAT_LITERAL
190 %token <ssym> GENERAL_PROCEDURE_NAME
191 %token <ssym> LOCATION_NAME
192 %token <voidval> SET_LITERAL
193 %token <voidval> EMPTINESS_LITERAL
194 %token <sval> CHARACTER_STRING_LITERAL
195 %token <sval> BIT_STRING_LITERAL
196 %token <tsym> TYPENAME
197 %token <sval> FIELD_NAME
202 %token <voidval> CASE
204 %token <voidval> ESAC
205 %token <voidval> LOGIOR
206 %token <voidval> ORIF
207 %token <voidval> LOGXOR
208 %token <voidval> LOGAND
209 %token <voidval> ANDIF
211 %token <voidval> NOTEQUAL
221 %token <voidval> SLASH_SLASH
225 %token <voidval> POINTER
226 %token <voidval> RECEIVE
233 %token <voidval> THEN
234 %token <voidval> ELSE
236 %token <voidval> ELSIF
237 %token <voidval> ILLEGAL_TOKEN
239 %token <voidval> PRED
240 %token <voidval> SUCC
242 %token <voidval> CARD
243 %token <voidval> MAX_TOKEN
244 %token <voidval> MIN_TOKEN
245 %token <voidval> SIZE
246 %token <voidval> UPPER
247 %token <voidval> LOWER
248 %token <voidval> LENGTH
249 %token <voidval> ARRAY
251 /* Tokens which are not Chill tokens used in expressions, but rather GDB
252 specific things that we recognize in the same context as Chill tokens
253 (register names for example). */
255 %token <lval> GDB_REGNAME /* Machine register name */
256 %token <lval> GDB_LAST /* Value history */
257 %token <ivar> GDB_VARIABLE /* Convenience variable */
258 %token <voidval> GDB_ASSIGNMENT /* Assign value to somewhere */
260 %type <voidval> access_name
261 %type <voidval> primitive_value
262 %type <voidval> value_name
263 %type <voidval> literal
264 %type <voidval> tuple
265 %type <voidval> slice
266 %type <voidval> expression_conversion
267 %type <voidval> value_procedure_call
268 %type <voidval> value_built_in_routine_call
269 %type <voidval> chill_value_built_in_routine_call
270 %type <voidval> start_expression
271 %type <voidval> zero_adic_operator
272 %type <voidval> parenthesised_expression
273 %type <voidval> value
274 %type <voidval> undefined_value
275 %type <voidval> expression
276 %type <voidval> conditional_expression
277 %type <voidval> then_alternative
278 %type <voidval> else_alternative
279 %type <voidval> sub_expression
280 %type <voidval> value_case_alternative
281 %type <voidval> operand_0
282 %type <voidval> operand_1
283 %type <voidval> operand_2
284 %type <voidval> operand_3
285 %type <voidval> operand_4
286 %type <voidval> operand_5
287 %type <voidval> operand_6
288 %type <voidval> synonym_name
289 %type <voidval> value_enumeration_name
290 %type <voidval> value_do_with_name
291 %type <voidval> value_receive_name
292 %type <voidval> expression_list
293 %type <tval> mode_argument
294 %type <voidval> array_mode_name
295 %type <voidval> string_mode_name
296 %type <voidval> variant_structure_mode_name
297 %type <voidval> boolean_expression
298 %type <voidval> case_selector_list
299 %type <voidval> subexpression
300 %type <voidval> case_label_specification
301 %type <voidval> buffer_location
302 %type <voidval> single_assignment_action
303 %type <tsym> mode_name
312 { write_exp_elt_opcode(OP_TYPE);
313 write_exp_elt_type($1.type);
314 write_exp_elt_opcode(OP_TYPE);}
327 undefined_value : FIXME_01
335 access_name : LOCATION_NAME
337 write_exp_elt_opcode (OP_VAR_VALUE);
338 write_exp_elt_block (NULL);
339 write_exp_elt_sym ($1.sym);
340 write_exp_elt_opcode (OP_VAR_VALUE);
342 | GDB_LAST /* gdb specific */
344 write_exp_elt_opcode (OP_LAST);
345 write_exp_elt_longcst ($1);
346 write_exp_elt_opcode (OP_LAST);
348 | GDB_REGNAME /* gdb specific */
350 write_exp_elt_opcode (OP_REGISTER);
351 write_exp_elt_longcst ($1);
352 write_exp_elt_opcode (OP_REGISTER);
354 | GDB_VARIABLE /* gdb specific */
356 write_exp_elt_opcode (OP_INTERNALVAR);
357 write_exp_elt_intern ($1);
358 write_exp_elt_opcode (OP_INTERNALVAR);
368 expression_list : expression
372 | expression_list ',' expression
378 maybe_expression_list: /* EMPTY */
388 primitive_value_lparen: primitive_value '('
389 /* This is to save the value of arglist_len
390 being accumulated for each dimension. */
391 { start_arglist (); }
395 { $$ = end_arglist (); }
400 | primitive_value_lparen maybe_expression_list rparen
402 write_exp_elt_opcode (MULTI_SUBSCRIPT);
403 write_exp_elt_longcst ($3);
404 write_exp_elt_opcode (MULTI_SUBSCRIPT);
406 | primitive_value FIELD_NAME
407 { write_exp_elt_opcode (STRUCTOP_STRUCT);
408 write_exp_string ($2);
409 write_exp_elt_opcode (STRUCTOP_STRUCT);
411 | primitive_value POINTER
413 write_exp_elt_opcode (UNOP_IND);
415 | primitive_value POINTER mode_name
417 write_exp_elt_opcode (UNOP_CAST);
418 write_exp_elt_type (lookup_pointer_type ($3.type));
419 write_exp_elt_opcode (UNOP_CAST);
420 write_exp_elt_opcode (UNOP_IND);
438 | expression_conversion
442 | value_procedure_call
446 | value_built_in_routine_call
458 | parenthesised_expression
466 value_name : synonym_name
470 | value_enumeration_name
482 | GENERAL_PROCEDURE_NAME
484 write_exp_elt_opcode (OP_VAR_VALUE);
485 write_exp_elt_block (NULL);
486 write_exp_elt_sym ($1.sym);
487 write_exp_elt_opcode (OP_VAR_VALUE);
493 literal : INTEGER_LITERAL
495 write_exp_elt_opcode (OP_LONG);
496 write_exp_elt_type ($1.type);
497 write_exp_elt_longcst ((LONGEST) ($1.val));
498 write_exp_elt_opcode (OP_LONG);
502 write_exp_elt_opcode (OP_BOOL);
503 write_exp_elt_longcst ((LONGEST) $1);
504 write_exp_elt_opcode (OP_BOOL);
508 write_exp_elt_opcode (OP_LONG);
509 write_exp_elt_type ($1.type);
510 write_exp_elt_longcst ((LONGEST) ($1.val));
511 write_exp_elt_opcode (OP_LONG);
515 write_exp_elt_opcode (OP_DOUBLE);
516 write_exp_elt_type (builtin_type_double);
517 write_exp_elt_dblcst ($1);
518 write_exp_elt_opcode (OP_DOUBLE);
526 struct type *void_ptr_type
527 = lookup_pointer_type (builtin_type_void);
528 write_exp_elt_opcode (OP_LONG);
529 write_exp_elt_type (void_ptr_type);
530 write_exp_elt_longcst (0);
531 write_exp_elt_opcode (OP_LONG);
533 | CHARACTER_STRING_LITERAL
535 write_exp_elt_opcode (OP_STRING);
536 write_exp_string ($1);
537 write_exp_elt_opcode (OP_STRING);
541 write_exp_elt_opcode (OP_BITSTRING);
542 write_exp_bitstring ($1);
543 write_exp_elt_opcode (OP_BITSTRING);
549 tuple_element : expression
550 | named_record_element
553 named_record_element: FIELD_NAME ',' named_record_element
554 { write_exp_elt_opcode (OP_LABELED);
555 write_exp_string ($1);
556 write_exp_elt_opcode (OP_LABELED);
558 | FIELD_NAME ':' expression
559 { write_exp_elt_opcode (OP_LABELED);
560 write_exp_string ($1);
561 write_exp_elt_opcode (OP_LABELED);
565 tuple_elements : tuple_element
569 | tuple_elements ',' tuple_element
575 maybe_tuple_elements : tuple_elements
580 { start_arglist (); }
581 maybe_tuple_elements ']'
583 write_exp_elt_opcode (OP_ARRAY);
584 write_exp_elt_longcst ((LONGEST) 0);
585 write_exp_elt_longcst ((LONGEST) end_arglist () - 1);
586 write_exp_elt_opcode (OP_ARRAY);
590 { start_arglist (); }
591 maybe_tuple_elements ']'
593 write_exp_elt_opcode (OP_ARRAY);
594 write_exp_elt_longcst ((LONGEST) 0);
595 write_exp_elt_longcst ((LONGEST) end_arglist () - 1);
596 write_exp_elt_opcode (OP_ARRAY);
598 write_exp_elt_opcode (UNOP_CAST);
599 write_exp_elt_type ($1.type);
600 write_exp_elt_opcode (UNOP_CAST);
608 slice: primitive_value_lparen expression ':' expression rparen
610 write_exp_elt_opcode (TERNOP_SLICE);
612 | primitive_value_lparen expression UP expression rparen
614 write_exp_elt_opcode (TERNOP_SLICE_COUNT);
620 expression_conversion: mode_name parenthesised_expression
622 write_exp_elt_opcode (UNOP_CAST);
623 write_exp_elt_type ($1.type);
624 write_exp_elt_opcode (UNOP_CAST);
626 | ARRAY '(' ')' mode_name parenthesised_expression
627 /* This is pseudo-Chill, similar to C's '(TYPE[])EXPR'
628 which casts to an artificial array. */
630 struct type *range_type
631 = create_range_type ((struct type *) NULL,
632 builtin_type_int, 0, 0);
633 struct type *array_type
634 = create_array_type ((struct type *) NULL,
635 $4.type, range_type);
636 TYPE_ARRAY_UPPER_BOUND_TYPE(array_type)
637 = BOUND_CANNOT_BE_DETERMINED;
638 write_exp_elt_opcode (UNOP_CAST);
639 write_exp_elt_type (array_type);
640 write_exp_elt_opcode (UNOP_CAST);
646 value_procedure_call: FIXME_05
654 value_built_in_routine_call: chill_value_built_in_routine_call
662 start_expression: FIXME_06
665 } /* Not in GNU-Chill */
670 zero_adic_operator: FIXME_07
678 parenthesised_expression: '(' expression ')'
686 expression : operand_0
690 | single_assignment_action
694 | conditional_expression
700 conditional_expression : IF boolean_expression then_alternative else_alternative FI
704 | CASE case_selector_list OF value_case_alternative ELSE sub_expression ESAC
710 then_alternative: THEN subexpression
716 else_alternative: ELSE subexpression
720 | ELSIF boolean_expression then_alternative else_alternative
726 sub_expression : expression
732 value_case_alternative: case_label_specification ':' sub_expression ';'
740 operand_0 : operand_1
744 | operand_0 LOGIOR operand_1
746 write_exp_elt_opcode (BINOP_BITWISE_IOR);
748 | operand_0 ORIF operand_1
752 | operand_0 LOGXOR operand_1
754 write_exp_elt_opcode (BINOP_BITWISE_XOR);
760 operand_1 : operand_2
764 | operand_1 LOGAND operand_2
766 write_exp_elt_opcode (BINOP_BITWISE_AND);
768 | operand_1 ANDIF operand_2
776 operand_2 : operand_3
780 | operand_2 '=' operand_3
782 write_exp_elt_opcode (BINOP_EQUAL);
784 | operand_2 NOTEQUAL operand_3
786 write_exp_elt_opcode (BINOP_NOTEQUAL);
788 | operand_2 '>' operand_3
790 write_exp_elt_opcode (BINOP_GTR);
792 | operand_2 GTR operand_3
794 write_exp_elt_opcode (BINOP_GEQ);
796 | operand_2 '<' operand_3
798 write_exp_elt_opcode (BINOP_LESS);
800 | operand_2 LEQ operand_3
802 write_exp_elt_opcode (BINOP_LEQ);
804 | operand_2 IN operand_3
806 write_exp_elt_opcode (BINOP_IN);
813 operand_3 : operand_4
817 | operand_3 '+' operand_4
819 write_exp_elt_opcode (BINOP_ADD);
821 | operand_3 '-' operand_4
823 write_exp_elt_opcode (BINOP_SUB);
825 | operand_3 SLASH_SLASH operand_4
827 write_exp_elt_opcode (BINOP_CONCAT);
833 operand_4 : operand_5
837 | operand_4 '*' operand_5
839 write_exp_elt_opcode (BINOP_MUL);
841 | operand_4 '/' operand_5
843 write_exp_elt_opcode (BINOP_DIV);
845 | operand_4 MOD operand_5
847 write_exp_elt_opcode (BINOP_MOD);
849 | operand_4 REM operand_5
851 write_exp_elt_opcode (BINOP_REM);
857 operand_5 : operand_6
863 write_exp_elt_opcode (UNOP_NEG);
867 write_exp_elt_opcode (UNOP_LOGICAL_NOT);
869 | parenthesised_expression literal
870 /* We require the string operand to be a literal, to avoid some
871 nasty parsing ambiguities. */
873 write_exp_elt_opcode (BINOP_CONCAT);
879 operand_6 : POINTER primitive_value
881 write_exp_elt_opcode (UNOP_ADDR);
883 | RECEIVE buffer_location
896 single_assignment_action :
897 primitive_value GDB_ASSIGNMENT value
899 write_exp_elt_opcode (BINOP_ASSIGN);
905 chill_value_built_in_routine_call :
906 NUM '(' expression ')'
910 | PRED '(' expression ')'
914 | SUCC '(' expression ')'
918 | ABS '(' expression ')'
922 | CARD '(' expression ')'
926 | MAX_TOKEN '(' expression ')'
930 | MIN_TOKEN '(' expression ')'
934 | SIZE '(' expression ')'
935 { write_exp_elt_opcode (UNOP_SIZEOF); }
936 | SIZE '(' mode_argument ')'
937 { write_exp_elt_opcode (OP_LONG);
938 write_exp_elt_type (builtin_type_int);
939 write_exp_elt_longcst ((LONGEST) TYPE_LENGTH ($3));
940 write_exp_elt_opcode (OP_LONG); }
941 | LOWER '(' mode_argument ')'
942 { write_lower_upper_value (UNOP_LOWER, $3); }
943 | UPPER '(' mode_argument ')'
944 { write_lower_upper_value (UNOP_UPPER, $3); }
945 | LOWER '(' expression ')'
946 { write_exp_elt_opcode (UNOP_LOWER); }
947 | UPPER '(' expression ')'
948 { write_exp_elt_opcode (UNOP_UPPER); }
949 | LENGTH '(' expression ')'
950 { write_exp_elt_opcode (UNOP_LENGTH); }
953 mode_argument : mode_name
957 | array_mode_name '(' expression ')'
961 | string_mode_name '(' expression ')'
965 | variant_structure_mode_name '(' expression_list ')'
974 /* Things which still need productions... */
976 array_mode_name : FIXME_08 { $$ = 0; }
977 string_mode_name : FIXME_09 { $$ = 0; }
978 variant_structure_mode_name: FIXME_10 { $$ = 0; }
979 synonym_name : FIXME_11 { $$ = 0; }
980 value_enumeration_name : FIXME_12 { $$ = 0; }
981 value_do_with_name : FIXME_13 { $$ = 0; }
982 value_receive_name : FIXME_14 { $$ = 0; }
983 boolean_expression : FIXME_26 { $$ = 0; }
984 case_selector_list : FIXME_27 { $$ = 0; }
985 subexpression : FIXME_28 { $$ = 0; }
986 case_label_specification: FIXME_29 { $$ = 0; }
987 buffer_location : FIXME_30 { $$ = 0; }
991 /* Implementation of a dynamically expandable buffer for processing input
992 characters acquired through lexptr and building a value to return in
995 static char *tempbuf; /* Current buffer contents */
996 static int tempbufsize; /* Size of allocated buffer */
997 static int tempbufindex; /* Current index into buffer */
999 #define GROWBY_MIN_SIZE 64 /* Minimum amount to grow buffer by */
1001 #define CHECKBUF(size) \
1003 if (tempbufindex + (size) >= tempbufsize) \
1005 growbuf_by_size (size); \
1009 /* Grow the static temp buffer if necessary, including allocating the first one
1013 growbuf_by_size (count)
1018 growby = max (count, GROWBY_MIN_SIZE);
1019 tempbufsize += growby;
1020 if (tempbuf == NULL)
1022 tempbuf = (char *) malloc (tempbufsize);
1026 tempbuf = (char *) realloc (tempbuf, tempbufsize);
1030 /* Try to consume a simple name string token. If successful, returns
1031 a pointer to a nullbyte terminated copy of the name that can be used
1032 in symbol table lookups. If not successful, returns NULL. */
1035 match_simple_name_string ()
1037 char *tokptr = lexptr;
1039 if (isalpha (*tokptr) || *tokptr == '_')
1044 } while (isalnum (*tokptr) || (*tokptr == '_'));
1045 yylval.sval.ptr = lexptr;
1046 yylval.sval.length = tokptr - lexptr;
1048 result = copy_name (yylval.sval);
1054 /* Start looking for a value composed of valid digits as set by the base
1055 in use. Note that '_' characters are valid anywhere, in any quantity,
1056 and are simply ignored. Since we must find at least one valid digit,
1057 or reject this token as an integer literal, we keep track of how many
1058 digits we have encountered. */
1061 decode_integer_value (base, tokptrptr, ivalptr)
1066 char *tokptr = *tokptrptr;
1070 while (*tokptr != '\0')
1074 temp = tolower (temp);
1080 case '0': case '1': case '2': case '3': case '4':
1081 case '5': case '6': case '7': case '8': case '9':
1084 case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
1100 /* Found something not in domain for current base. */
1101 tokptr--; /* Unconsume what gave us indigestion. */
1106 /* If we didn't find any digits, then we don't have a valid integer
1107 value, so reject the entire token. Otherwise, update the lexical
1108 scan pointer, and return non-zero for success. */
1116 *tokptrptr = tokptr;
1122 decode_integer_literal (valptr, tokptrptr)
1126 char *tokptr = *tokptrptr;
1129 int explicit_base = 0;
1131 /* Look for an explicit base specifier, which is optional. */
1164 /* If we found an explicit base ensure that the character after the
1165 explicit base is a single quote. */
1167 if (explicit_base && (*tokptr++ != '\''))
1172 /* Attempt to decode whatever follows as an integer value in the
1173 indicated base, updating the token pointer in the process and
1174 computing the value into ival. Also, if we have an explicit
1175 base, then the next character must not be a single quote, or we
1176 have a bitstring literal, so reject the entire token in this case.
1177 Otherwise, update the lexical scan pointer, and return non-zero
1180 if (!decode_integer_value (base, &tokptr, &ival))
1184 else if (explicit_base && (*tokptr == '\''))
1191 *tokptrptr = tokptr;
1196 /* If it wasn't for the fact that floating point values can contain '_'
1197 characters, we could just let strtod do all the hard work by letting it
1198 try to consume as much of the current token buffer as possible and
1199 find a legal conversion. Unfortunately we need to filter out the '_'
1200 characters before calling strtod, which we do by copying the other
1201 legal chars to a local buffer to be converted. However since we also
1202 need to keep track of where the last unconsumed character in the input
1203 buffer is, we have transfer only as many characters as may compose a
1204 legal floating point value. */
1207 match_float_literal ()
1209 char *tokptr = lexptr;
1213 extern double strtod ();
1215 /* Make local buffer in which to build the string to convert. This is
1216 required because underscores are valid in chill floating point numbers
1217 but not in the string passed to strtod to convert. The string will be
1218 no longer than our input string. */
1220 copy = buf = (char *) alloca (strlen (tokptr) + 1);
1222 /* Transfer all leading digits to the conversion buffer, discarding any
1225 while (isdigit (*tokptr) || *tokptr == '_')
1234 /* Now accept either a '.', or one of [eEdD]. Dot is legal regardless
1235 of whether we found any leading digits, and we simply accept it and
1236 continue on to look for the fractional part and/or exponent. One of
1237 [eEdD] is legal only if we have seen digits, and means that there
1238 is no fractional part. If we find neither of these, then this is
1239 not a floating point number, so return failure. */
1244 /* Accept and then look for fractional part and/or exponent. */
1257 goto collect_exponent;
1265 /* We found a '.', copy any fractional digits to the conversion buffer, up
1266 to the first nondigit, non-underscore character. */
1268 while (isdigit (*tokptr) || *tokptr == '_')
1277 /* Look for an exponent, which must start with one of [eEdD]. If none
1278 is found, jump directly to trying to convert what we have collected
1295 /* Accept an optional '-' or '+' following one of [eEdD]. */
1298 if (*tokptr == '+' || *tokptr == '-')
1300 *copy++ = *tokptr++;
1303 /* Now copy an exponent into the conversion buffer. Note that at the
1304 moment underscores are *not* allowed in exponents. */
1306 while (isdigit (*tokptr))
1308 *copy++ = *tokptr++;
1311 /* If we transfered any chars to the conversion buffer, try to interpret its
1312 contents as a floating point value. If any characters remain, then we
1313 must not have a valid floating point string. */
1319 dval = strtod (buf, ©);
1324 return (FLOAT_LITERAL);
1330 /* Recognize a string literal. A string literal is a sequence
1331 of characters enclosed in matching single or double quotes, except that
1332 a single character inside single quotes is a character literal, which
1333 we reject as a string literal. To embed the terminator character inside
1334 a string, it is simply doubled (I.E. "this""is""one""string") */
1337 match_string_literal ()
1339 char *tokptr = lexptr;
1341 for (tempbufindex = 0, tokptr++; *tokptr != '\0'; tokptr++)
1344 if (*tokptr == *lexptr)
1346 if (*(tokptr + 1) == *lexptr)
1355 tempbuf[tempbufindex++] = *tokptr;
1357 if (*tokptr == '\0' /* no terminator */
1358 || (tempbufindex == 1 && *tokptr == '\'')) /* char literal */
1364 tempbuf[tempbufindex] = '\0';
1365 yylval.sval.ptr = tempbuf;
1366 yylval.sval.length = tempbufindex;
1368 return (CHARACTER_STRING_LITERAL);
1372 /* Recognize a character literal. A character literal is single character
1373 or a control sequence, enclosed in single quotes. A control sequence
1374 is a comma separated list of one or more integer literals, enclosed
1375 in parenthesis and introduced with a circumflex character.
1377 EX: 'a' '^(7)' '^(7,8)'
1379 As a GNU chill extension, the syntax C'xx' is also recognized as a
1380 character literal, where xx is a hex value for the character.
1382 Note that more than a single character, enclosed in single quotes, is
1385 Also note that the control sequence form is not in GNU Chill since it
1386 is ambiguous with the string literal form using single quotes. I.E.
1387 is '^(7)' a character literal or a string literal. In theory it it
1388 possible to tell by context, but GNU Chill doesn't accept the control
1389 sequence form, so neither do we (for now the code is disabled).
1391 Returns CHARACTER_LITERAL if a match is found.
1395 match_character_literal ()
1397 char *tokptr = lexptr;
1400 if ((*tokptr == 'c' || *tokptr == 'C') && (*(tokptr + 1) == '\''))
1402 /* We have a GNU chill extension form, so skip the leading "C'",
1403 decode the hex value, and then ensure that we have a trailing
1404 single quote character. */
1406 if (!decode_integer_value (16, &tokptr, &ival) || (*tokptr != '\''))
1412 else if (*tokptr == '\'')
1416 /* Determine which form we have, either a control sequence or the
1417 single character form. */
1419 if ((*tokptr == '^') && (*(tokptr + 1) == '('))
1421 #if 0 /* Disable, see note above. -fnf */
1422 /* Match and decode a control sequence. Return zero if we don't
1423 find a valid integer literal, or if the next unconsumed character
1424 after the integer literal is not the trailing ')'.
1425 FIXME: We currently don't handle the multiple integer literal
1428 if (!decode_integer_literal (&ival, &tokptr) || (*tokptr++ != ')'))
1441 /* The trailing quote has not yet been consumed. If we don't find
1442 it, then we have no match. */
1444 if (*tokptr++ != '\'')
1451 /* Not a character literal. */
1454 yylval.typed_val.val = ival;
1455 yylval.typed_val.type = builtin_type_chill_char;
1457 return (CHARACTER_LITERAL);
1460 /* Recognize an integer literal, as specified in Z.200 sec 5.2.4.2.
1461 Note that according to 5.2.4.2, a single "_" is also a valid integer
1462 literal, however GNU-chill requires there to be at least one "digit"
1463 in any integer literal. */
1466 match_integer_literal ()
1468 char *tokptr = lexptr;
1471 if (!decode_integer_literal (&ival, &tokptr))
1477 yylval.typed_val.val = ival;
1478 yylval.typed_val.type = builtin_type_int;
1480 return (INTEGER_LITERAL);
1484 /* Recognize a bit-string literal, as specified in Z.200 sec 5.2.4.8
1485 Note that according to 5.2.4.8, a single "_" is also a valid bit-string
1486 literal, however GNU-chill requires there to be at least one "digit"
1487 in any bit-string literal. */
1490 match_bitstring_literal ()
1492 register char *tokptr = lexptr;
1502 /* Look for the required explicit base specifier. */
1523 /* Ensure that the character after the explicit base is a single quote. */
1525 if (*tokptr++ != '\'')
1530 while (*tokptr != '\0' && *tokptr != '\'')
1533 if (isupper (digit))
1534 digit = tolower (digit);
1540 case '0': case '1': case '2': case '3': case '4':
1541 case '5': case '6': case '7': case '8': case '9':
1544 case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
1552 if (digit >= 1 << bits_per_char)
1554 /* Found something not in domain for current base. */
1559 /* Extract bits from digit, packing them into the bitstring byte. */
1560 int k = TARGET_BYTE_ORDER == BIG_ENDIAN ? bits_per_char - 1 : 0;
1561 for (; TARGET_BYTE_ORDER == BIG_ENDIAN ? k >= 0 : k < bits_per_char;
1562 TARGET_BYTE_ORDER == BIG_ENDIAN ? k-- : k++)
1565 if (digit & (1 << k))
1567 tempbuf[tempbufindex] |=
1568 (TARGET_BYTE_ORDER == BIG_ENDIAN)
1569 ? (1 << (HOST_CHAR_BIT - 1 - bitoffset))
1573 if (bitoffset == HOST_CHAR_BIT)
1578 tempbuf[tempbufindex] = 0;
1584 /* Verify that we consumed everything up to the trailing single quote,
1585 and that we found some bits (IE not just underbars). */
1587 if (*tokptr++ != '\'')
1593 yylval.sval.ptr = tempbuf;
1594 yylval.sval.length = bitcount;
1596 return (BIT_STRING_LITERAL);
1600 /* Recognize tokens that start with '$'. These include:
1602 $regname A native register name or a "standard
1604 Return token GDB_REGNAME.
1606 $variable A convenience variable with a name chosen
1608 Return token GDB_VARIABLE.
1610 $digits Value history with index <digits>, starting
1611 from the first value which has index 1.
1614 $$digits Value history with index <digits> relative
1615 to the last value. I.E. $$0 is the last
1616 value, $$1 is the one previous to that, $$2
1617 is the one previous to $$1, etc.
1618 Return token GDB_LAST.
1620 $ | $0 | $$0 The last value in the value history.
1621 Return token GDB_LAST.
1623 $$ An abbreviation for the second to the last
1624 value in the value history, I.E. $$1
1625 Return token GDB_LAST.
1627 Note that we currently assume that register names and convenience
1628 variables follow the convention of starting with a letter or '_'.
1633 match_dollar_tokens ()
1641 /* We will always have a successful match, even if it is just for
1642 a single '$', the abbreviation for $$0. So advance lexptr. */
1646 if (*tokptr == '_' || isalpha (*tokptr))
1648 /* Look for a match with a native register name, usually something
1649 like "r0" for example. */
1651 for (regno = 0; regno < NUM_REGS; regno++)
1653 namelength = strlen (reg_names[regno]);
1654 if (STREQN (tokptr, reg_names[regno], namelength)
1655 && !isalnum (tokptr[namelength]))
1657 yylval.lval = regno;
1658 lexptr += namelength;
1659 return (GDB_REGNAME);
1663 /* Look for a match with a standard register name, usually something
1664 like "pc", which gdb always recognizes as the program counter
1665 regardless of what the native register name is. */
1667 for (regno = 0; regno < num_std_regs; regno++)
1669 namelength = strlen (std_regs[regno].name);
1670 if (STREQN (tokptr, std_regs[regno].name, namelength)
1671 && !isalnum (tokptr[namelength]))
1673 yylval.lval = std_regs[regno].regnum;
1674 lexptr += namelength;
1675 return (GDB_REGNAME);
1679 /* Attempt to match against a convenience variable. Note that
1680 this will always succeed, because if no variable of that name
1681 already exists, the lookup_internalvar will create one for us.
1682 Also note that both lexptr and tokptr currently point to the
1683 start of the input string we are trying to match, and that we
1684 have already tested the first character for non-numeric, so we
1685 don't have to treat it specially. */
1687 while (*tokptr == '_' || isalnum (*tokptr))
1691 yylval.sval.ptr = lexptr;
1692 yylval.sval.length = tokptr - lexptr;
1693 yylval.ivar = lookup_internalvar (copy_name (yylval.sval));
1695 return (GDB_VARIABLE);
1698 /* Since we didn't match against a register name or convenience
1699 variable, our only choice left is a history value. */
1713 /* Attempt to decode more characters as an integer value giving
1714 the index in the history list. If successful, the value will
1715 overwrite ival (currently 0 or 1), and if not, ival will be
1716 left alone, which is good since it is currently correct for
1717 the '$' or '$$' case. */
1719 decode_integer_literal (&ival, &tokptr);
1720 yylval.lval = negate ? -ival : ival;
1731 static const struct token idtokentab[] =
1734 { "length", LENGTH },
1745 { "max", MAX_TOKEN },
1746 { "min", MIN_TOKEN },
1755 { "null", EMPTINESS_LITERAL }
1758 static const struct token tokentab2[] =
1760 { ":=", GDB_ASSIGNMENT },
1761 { "//", SLASH_SLASH },
1768 /* Read one token, getting characters through lexptr. */
1769 /* This is where we will check to make sure that the language and the
1770 operators used are compatible. */
1780 /* Skip over any leading whitespace. */
1781 while (isspace (*lexptr))
1785 /* Look for special single character cases which can't be the first
1786 character of some other multicharacter token. */
1803 /* Look for characters which start a particular kind of multicharacter
1804 token, such as a character literal, register name, convenience
1805 variable name, string literal, etc. */
1810 /* First try to match a string literal, which is any
1811 sequence of characters enclosed in matching single or double
1812 quotes, except that a single character inside single quotes
1813 is a character literal, so we have to catch that case also. */
1814 token = match_string_literal ();
1819 if (*lexptr == '\'')
1821 token = match_character_literal ();
1830 token = match_character_literal ();
1837 token = match_dollar_tokens ();
1844 /* See if it is a special token of length 2. */
1845 for (i = 0; i < sizeof (tokentab2) / sizeof (tokentab2[0]); i++)
1847 if (STREQN (lexptr, tokentab2[i].operator, 2))
1850 return (tokentab2[i].token);
1853 /* Look for single character cases which which could be the first
1854 character of some other multicharacter token, but aren't, or we
1855 would already have found it. */
1865 /* Look for a float literal before looking for an integer literal, so
1866 we match as much of the input stream as possible. */
1867 token = match_float_literal ();
1872 token = match_bitstring_literal ();
1877 token = match_integer_literal ();
1883 /* Try to match a simple name string, and if a match is found, then
1884 further classify what sort of name it is and return an appropriate
1885 token. Note that attempting to match a simple name string consumes
1886 the token from lexptr, so we can't back out if we later find that
1887 we can't classify what sort of name it is. */
1889 inputname = match_simple_name_string ();
1891 if (inputname != NULL)
1893 char *simplename = (char*) alloca (strlen (inputname) + 1);
1895 char *dptr = simplename, *sptr = inputname;
1896 for (; *sptr; sptr++)
1897 *dptr++ = isupper (*sptr) ? tolower(*sptr) : *sptr;
1900 /* See if it is a reserved identifier. */
1901 for (i = 0; i < sizeof (idtokentab) / sizeof (idtokentab[0]); i++)
1903 if (STREQ (simplename, idtokentab[i].operator))
1905 return (idtokentab[i].token);
1909 /* Look for other special tokens. */
1910 if (STREQ (simplename, "true"))
1913 return (BOOLEAN_LITERAL);
1915 if (STREQ (simplename, "false"))
1918 return (BOOLEAN_LITERAL);
1921 sym = lookup_symbol (inputname, expression_context_block,
1922 VAR_NAMESPACE, (int *) NULL,
1923 (struct symtab **) NULL);
1924 if (sym == NULL && strcmp (inputname, simplename) != 0)
1926 sym = lookup_symbol (simplename, expression_context_block,
1927 VAR_NAMESPACE, (int *) NULL,
1928 (struct symtab **) NULL);
1932 yylval.ssym.stoken.ptr = NULL;
1933 yylval.ssym.stoken.length = 0;
1934 yylval.ssym.sym = sym;
1935 yylval.ssym.is_a_field_of_this = 0; /* FIXME, C++'ism */
1936 switch (SYMBOL_CLASS (sym))
1939 /* Found a procedure name. */
1940 return (GENERAL_PROCEDURE_NAME);
1942 /* Found a global or local static variable. */
1943 return (LOCATION_NAME);
1948 case LOC_REGPARM_ADDR:
1952 case LOC_BASEREG_ARG:
1953 if (innermost_block == NULL
1954 || contained_in (block_found, innermost_block))
1956 innermost_block = block_found;
1958 return (LOCATION_NAME);
1962 return (LOCATION_NAME);
1965 yylval.tsym.type = SYMBOL_TYPE (sym);
1968 case LOC_CONST_BYTES:
1969 case LOC_OPTIMIZED_OUT:
1970 error ("Symbol \"%s\" names no location.", inputname);
1974 else if (!have_full_symbols () && !have_partial_symbols ())
1976 error ("No symbol table is loaded. Use the \"file\" command.");
1980 error ("No symbol \"%s\" in current context.", inputname);
1984 /* Catch single character tokens which are not part of some
1989 case '.': /* Not float for example. */
1991 while (isspace (*lexptr)) lexptr++;
1992 inputname = match_simple_name_string ();
1998 return (ILLEGAL_TOKEN);
2002 write_lower_upper_value (opcode, type)
2003 enum exp_opcode opcode; /* Either UNOP_LOWER or UNOP_UPPER */
2006 extern LONGEST type_lower_upper ();
2007 struct type *result_type;
2008 LONGEST val = type_lower_upper (opcode, type, &result_type);
2009 write_exp_elt_opcode (OP_LONG);
2010 write_exp_elt_type (result_type);
2011 write_exp_elt_longcst (val);
2012 write_exp_elt_opcode (OP_LONG);
2019 error ("A %s in expression, near `%s'.", (msg ? msg : "error"), lexptr);