]> git.ipfire.org Git - thirdparty/binutils-gdb.git/blob - gdb/parse.c
import gdb-1999-06-07 snapshot
[thirdparty/binutils-gdb.git] / gdb / parse.c
1 /* Parse expressions for GDB.
2 Copyright (C) 1986, 89, 90, 91, 94, 98, 1999 Free Software Foundation, Inc.
3 Modified from expread.y by the Department of Computer Science at the
4 State University of New York at Buffalo, 1991.
5
6 This file is part of GDB.
7
8 This program is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 2 of the License, or
11 (at your option) any later version.
12
13 This program is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
17
18 You should have received a copy of the GNU General Public License
19 along with this program; if not, write to the Free Software
20 Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */
21
22 /* Parse an expression from text in a string,
23 and return the result as a struct expression pointer.
24 That structure contains arithmetic operations in reverse polish,
25 with constants represented by operations that are followed by special data.
26 See expression.h for the details of the format.
27 What is important here is that it can be built up sequentially
28 during the process of parsing; the lower levels of the tree always
29 come first in the result. */
30
31 #include <ctype.h>
32
33 #include "defs.h"
34 #include "gdb_string.h"
35 #include "symtab.h"
36 #include "gdbtypes.h"
37 #include "frame.h"
38 #include "expression.h"
39 #include "value.h"
40 #include "command.h"
41 #include "language.h"
42 #include "parser-defs.h"
43 #include "gdbcmd.h"
44 #include "symfile.h" /* for overlay functions */
45 \f
46 /* Global variables declared in parser-defs.h (and commented there). */
47 struct expression *expout;
48 int expout_size;
49 int expout_ptr;
50 struct block *expression_context_block;
51 struct block *innermost_block;
52 int arglist_len;
53 union type_stack_elt *type_stack;
54 int type_stack_depth, type_stack_size;
55 char *lexptr;
56 char *namecopy;
57 int paren_depth;
58 int comma_terminates;
59 \f
60 static int expressiondebug = 0;
61
62 extern int hp_som_som_object_present;
63
64 static void
65 free_funcalls PARAMS ((void));
66
67 static void
68 prefixify_expression PARAMS ((struct expression *));
69
70 static void
71 prefixify_subexp PARAMS ((struct expression *, struct expression *, int, int));
72
73 void _initialize_parse PARAMS ((void));
74
75 /* Data structure for saving values of arglist_len for function calls whose
76 arguments contain other function calls. */
77
78 struct funcall
79 {
80 struct funcall *next;
81 int arglist_len;
82 };
83
84 static struct funcall *funcall_chain;
85
86 /* Assign machine-independent names to certain registers
87 (unless overridden by the REGISTER_NAMES table) */
88
89 unsigned num_std_regs = 0;
90 struct std_regs *std_regs;
91
92 /* The generic method for targets to specify how their registers are
93 named. The mapping can be derived from three sources:
94 REGISTER_NAME; std_regs; or a target specific alias hook. */
95
96 int
97 target_map_name_to_register (str, len)
98 char *str;
99 int len;
100 {
101 int i;
102
103 /* First try target specific aliases. We try these first because on some
104 systems standard names can be context dependent (eg. $pc on a
105 multiprocessor can be could be any of several PCs). */
106 #ifdef REGISTER_NAME_ALIAS_HOOK
107 i = REGISTER_NAME_ALIAS_HOOK (str, len);
108 if (i >= 0)
109 return i;
110 #endif
111
112 /* Search architectural register name space. */
113 for (i = 0; i < NUM_REGS; i++)
114 if (REGISTER_NAME (i) && len == strlen (REGISTER_NAME (i))
115 && STREQN (str, REGISTER_NAME (i), len))
116 {
117 return i;
118 }
119
120 /* Try standard aliases */
121 for (i = 0; i < num_std_regs; i++)
122 if (std_regs[i].name && len == strlen (std_regs[i].name)
123 && STREQN (str, std_regs[i].name, len))
124 {
125 return std_regs[i].regnum;
126 }
127
128 return -1;
129 }
130
131 /* Begin counting arguments for a function call,
132 saving the data about any containing call. */
133
134 void
135 start_arglist ()
136 {
137 register struct funcall *new;
138
139 new = (struct funcall *) xmalloc (sizeof (struct funcall));
140 new->next = funcall_chain;
141 new->arglist_len = arglist_len;
142 arglist_len = 0;
143 funcall_chain = new;
144 }
145
146 /* Return the number of arguments in a function call just terminated,
147 and restore the data for the containing function call. */
148
149 int
150 end_arglist ()
151 {
152 register int val = arglist_len;
153 register struct funcall *call = funcall_chain;
154 funcall_chain = call->next;
155 arglist_len = call->arglist_len;
156 free ((PTR)call);
157 return val;
158 }
159
160 /* Free everything in the funcall chain.
161 Used when there is an error inside parsing. */
162
163 static void
164 free_funcalls ()
165 {
166 register struct funcall *call, *next;
167
168 for (call = funcall_chain; call; call = next)
169 {
170 next = call->next;
171 free ((PTR)call);
172 }
173 }
174 \f
175 /* This page contains the functions for adding data to the struct expression
176 being constructed. */
177
178 /* Add one element to the end of the expression. */
179
180 /* To avoid a bug in the Sun 4 compiler, we pass things that can fit into
181 a register through here */
182
183 void
184 write_exp_elt (expelt)
185 union exp_element expelt;
186 {
187 if (expout_ptr >= expout_size)
188 {
189 expout_size *= 2;
190 expout = (struct expression *)
191 xrealloc ((char *) expout, sizeof (struct expression)
192 + EXP_ELEM_TO_BYTES (expout_size));
193 }
194 expout->elts[expout_ptr++] = expelt;
195 }
196
197 void
198 write_exp_elt_opcode (expelt)
199 enum exp_opcode expelt;
200 {
201 union exp_element tmp;
202
203 tmp.opcode = expelt;
204
205 write_exp_elt (tmp);
206 }
207
208 void
209 write_exp_elt_sym (expelt)
210 struct symbol *expelt;
211 {
212 union exp_element tmp;
213
214 tmp.symbol = expelt;
215
216 write_exp_elt (tmp);
217 }
218
219 void
220 write_exp_elt_block (b)
221 struct block *b;
222 {
223 union exp_element tmp;
224 tmp.block = b;
225 write_exp_elt (tmp);
226 }
227
228 void
229 write_exp_elt_longcst (expelt)
230 LONGEST expelt;
231 {
232 union exp_element tmp;
233
234 tmp.longconst = expelt;
235
236 write_exp_elt (tmp);
237 }
238
239 void
240 write_exp_elt_dblcst (expelt)
241 DOUBLEST expelt;
242 {
243 union exp_element tmp;
244
245 tmp.doubleconst = expelt;
246
247 write_exp_elt (tmp);
248 }
249
250 void
251 write_exp_elt_type (expelt)
252 struct type *expelt;
253 {
254 union exp_element tmp;
255
256 tmp.type = expelt;
257
258 write_exp_elt (tmp);
259 }
260
261 void
262 write_exp_elt_intern (expelt)
263 struct internalvar *expelt;
264 {
265 union exp_element tmp;
266
267 tmp.internalvar = expelt;
268
269 write_exp_elt (tmp);
270 }
271
272 /* Add a string constant to the end of the expression.
273
274 String constants are stored by first writing an expression element
275 that contains the length of the string, then stuffing the string
276 constant itself into however many expression elements are needed
277 to hold it, and then writing another expression element that contains
278 the length of the string. I.E. an expression element at each end of
279 the string records the string length, so you can skip over the
280 expression elements containing the actual string bytes from either
281 end of the string. Note that this also allows gdb to handle
282 strings with embedded null bytes, as is required for some languages.
283
284 Don't be fooled by the fact that the string is null byte terminated,
285 this is strictly for the convenience of debugging gdb itself. Gdb
286 Gdb does not depend up the string being null terminated, since the
287 actual length is recorded in expression elements at each end of the
288 string. The null byte is taken into consideration when computing how
289 many expression elements are required to hold the string constant, of
290 course. */
291
292
293 void
294 write_exp_string (str)
295 struct stoken str;
296 {
297 register int len = str.length;
298 register int lenelt;
299 register char *strdata;
300
301 /* Compute the number of expression elements required to hold the string
302 (including a null byte terminator), along with one expression element
303 at each end to record the actual string length (not including the
304 null byte terminator). */
305
306 lenelt = 2 + BYTES_TO_EXP_ELEM (len + 1);
307
308 /* Ensure that we have enough available expression elements to store
309 everything. */
310
311 if ((expout_ptr + lenelt) >= expout_size)
312 {
313 expout_size = max (expout_size * 2, expout_ptr + lenelt + 10);
314 expout = (struct expression *)
315 xrealloc ((char *) expout, (sizeof (struct expression)
316 + EXP_ELEM_TO_BYTES (expout_size)));
317 }
318
319 /* Write the leading length expression element (which advances the current
320 expression element index), then write the string constant followed by a
321 terminating null byte, and then write the trailing length expression
322 element. */
323
324 write_exp_elt_longcst ((LONGEST) len);
325 strdata = (char *) &expout->elts[expout_ptr];
326 memcpy (strdata, str.ptr, len);
327 *(strdata + len) = '\0';
328 expout_ptr += lenelt - 2;
329 write_exp_elt_longcst ((LONGEST) len);
330 }
331
332 /* Add a bitstring constant to the end of the expression.
333
334 Bitstring constants are stored by first writing an expression element
335 that contains the length of the bitstring (in bits), then stuffing the
336 bitstring constant itself into however many expression elements are
337 needed to hold it, and then writing another expression element that
338 contains the length of the bitstring. I.E. an expression element at
339 each end of the bitstring records the bitstring length, so you can skip
340 over the expression elements containing the actual bitstring bytes from
341 either end of the bitstring. */
342
343 void
344 write_exp_bitstring (str)
345 struct stoken str;
346 {
347 register int bits = str.length; /* length in bits */
348 register int len = (bits + HOST_CHAR_BIT - 1) / HOST_CHAR_BIT;
349 register int lenelt;
350 register char *strdata;
351
352 /* Compute the number of expression elements required to hold the bitstring,
353 along with one expression element at each end to record the actual
354 bitstring length in bits. */
355
356 lenelt = 2 + BYTES_TO_EXP_ELEM (len);
357
358 /* Ensure that we have enough available expression elements to store
359 everything. */
360
361 if ((expout_ptr + lenelt) >= expout_size)
362 {
363 expout_size = max (expout_size * 2, expout_ptr + lenelt + 10);
364 expout = (struct expression *)
365 xrealloc ((char *) expout, (sizeof (struct expression)
366 + EXP_ELEM_TO_BYTES (expout_size)));
367 }
368
369 /* Write the leading length expression element (which advances the current
370 expression element index), then write the bitstring constant, and then
371 write the trailing length expression element. */
372
373 write_exp_elt_longcst ((LONGEST) bits);
374 strdata = (char *) &expout->elts[expout_ptr];
375 memcpy (strdata, str.ptr, len);
376 expout_ptr += lenelt - 2;
377 write_exp_elt_longcst ((LONGEST) bits);
378 }
379
380 /* Add the appropriate elements for a minimal symbol to the end of
381 the expression. The rationale behind passing in text_symbol_type and
382 data_symbol_type was so that Modula-2 could pass in WORD for
383 data_symbol_type. Perhaps it still is useful to have those types vary
384 based on the language, but they no longer have names like "int", so
385 the initial rationale is gone. */
386
387 static struct type *msym_text_symbol_type;
388 static struct type *msym_data_symbol_type;
389 static struct type *msym_unknown_symbol_type;
390
391 void
392 write_exp_msymbol (msymbol, text_symbol_type, data_symbol_type)
393 struct minimal_symbol *msymbol;
394 struct type *text_symbol_type;
395 struct type *data_symbol_type;
396 {
397 CORE_ADDR addr;
398
399 write_exp_elt_opcode (OP_LONG);
400 write_exp_elt_type (lookup_pointer_type (builtin_type_void));
401
402 addr = SYMBOL_VALUE_ADDRESS (msymbol);
403 if (overlay_debugging)
404 addr = symbol_overlayed_address (addr, SYMBOL_BFD_SECTION (msymbol));
405 write_exp_elt_longcst ((LONGEST) addr);
406
407 write_exp_elt_opcode (OP_LONG);
408
409 write_exp_elt_opcode (UNOP_MEMVAL);
410 switch (msymbol -> type)
411 {
412 case mst_text:
413 case mst_file_text:
414 case mst_solib_trampoline:
415 write_exp_elt_type (msym_text_symbol_type);
416 break;
417
418 case mst_data:
419 case mst_file_data:
420 case mst_bss:
421 case mst_file_bss:
422 write_exp_elt_type (msym_data_symbol_type);
423 break;
424
425 default:
426 write_exp_elt_type (msym_unknown_symbol_type);
427 break;
428 }
429 write_exp_elt_opcode (UNOP_MEMVAL);
430 }
431 \f
432 /* Recognize tokens that start with '$'. These include:
433
434 $regname A native register name or a "standard
435 register name".
436
437 $variable A convenience variable with a name chosen
438 by the user.
439
440 $digits Value history with index <digits>, starting
441 from the first value which has index 1.
442
443 $$digits Value history with index <digits> relative
444 to the last value. I.E. $$0 is the last
445 value, $$1 is the one previous to that, $$2
446 is the one previous to $$1, etc.
447
448 $ | $0 | $$0 The last value in the value history.
449
450 $$ An abbreviation for the second to the last
451 value in the value history, I.E. $$1
452
453 */
454
455 void
456 write_dollar_variable (str)
457 struct stoken str;
458 {
459 /* Handle the tokens $digits; also $ (short for $0) and $$ (short for $$1)
460 and $$digits (equivalent to $<-digits> if you could type that). */
461
462 struct symbol * sym = NULL;
463 struct minimal_symbol * msym = NULL;
464
465 int negate = 0;
466 int i = 1;
467 /* Double dollar means negate the number and add -1 as well.
468 Thus $$ alone means -1. */
469 if (str.length >= 2 && str.ptr[1] == '$')
470 {
471 negate = 1;
472 i = 2;
473 }
474 if (i == str.length)
475 {
476 /* Just dollars (one or two) */
477 i = - negate;
478 goto handle_last;
479 }
480 /* Is the rest of the token digits? */
481 for (; i < str.length; i++)
482 if (!(str.ptr[i] >= '0' && str.ptr[i] <= '9'))
483 break;
484 if (i == str.length)
485 {
486 i = atoi (str.ptr + 1 + negate);
487 if (negate)
488 i = - i;
489 goto handle_last;
490 }
491
492 /* Handle tokens that refer to machine registers:
493 $ followed by a register name. */
494 i = target_map_name_to_register( str.ptr + 1, str.length - 1 );
495 if( i >= 0 )
496 goto handle_register;
497
498 /* On HP-UX, certain system routines (millicode) have names beginning
499 with $ or $$, e.g. $$dyncall, which handles inter-space procedure
500 calls on PA-RISC. Check for those, first. */
501
502 sym = lookup_symbol (copy_name (str), (struct block *) NULL,
503 VAR_NAMESPACE, (int *) NULL, (struct symtab **) NULL);
504 if (sym)
505 {
506 write_exp_elt_opcode (OP_VAR_VALUE);
507 write_exp_elt_block (block_found); /* set by lookup_symbol */
508 write_exp_elt_sym (sym);
509 write_exp_elt_opcode (OP_VAR_VALUE);
510 return;
511 }
512 msym = lookup_minimal_symbol (copy_name (str), NULL, NULL);
513 if (msym)
514 {
515 write_exp_msymbol (msym,
516 lookup_function_type (builtin_type_int),
517 builtin_type_int);
518 return;
519 }
520
521 /* Any other names starting in $ are debugger internal variables. */
522
523 write_exp_elt_opcode (OP_INTERNALVAR);
524 write_exp_elt_intern (lookup_internalvar (copy_name (str) + 1));
525 write_exp_elt_opcode (OP_INTERNALVAR);
526 return;
527 handle_last:
528 write_exp_elt_opcode (OP_LAST);
529 write_exp_elt_longcst ((LONGEST) i);
530 write_exp_elt_opcode (OP_LAST);
531 return;
532 handle_register:
533 write_exp_elt_opcode (OP_REGISTER);
534 write_exp_elt_longcst (i);
535 write_exp_elt_opcode (OP_REGISTER);
536 return;
537 }
538
539
540 /* Parse a string that is possibly a namespace / nested class
541 specification, i.e., something of the form A::B::C::x. Input
542 (NAME) is the entire string; LEN is the current valid length; the
543 output is a string, TOKEN, which points to the largest recognized
544 prefix which is a series of namespaces or classes. CLASS_PREFIX is
545 another output, which records whether a nested class spec was
546 recognized (= 1) or a fully qualified variable name was found (=
547 0). ARGPTR is side-effected (if non-NULL) to point to beyond the
548 string recognized and consumed by this routine.
549
550 The return value is a pointer to the symbol for the base class or
551 variable if found, or NULL if not found. Callers must check this
552 first -- if NULL, the outputs may not be correct.
553
554 This function is used c-exp.y. This is used specifically to get
555 around HP aCC (and possibly other compilers), which insists on
556 generating names with embedded colons for namespace or nested class
557 members.
558
559 (Argument LEN is currently unused. 1997-08-27)
560
561 Callers must free memory allocated for the output string TOKEN. */
562
563 static const char coloncolon[2] = {':',':'};
564
565 struct symbol *
566 parse_nested_classes_for_hpacc (name, len, token, class_prefix, argptr)
567 char * name;
568 int len;
569 char ** token;
570 int * class_prefix;
571 char ** argptr;
572 {
573 /* Comment below comes from decode_line_1 which has very similar
574 code, which is called for "break" command parsing. */
575
576 /* We have what looks like a class or namespace
577 scope specification (A::B), possibly with many
578 levels of namespaces or classes (A::B::C::D).
579
580 Some versions of the HP ANSI C++ compiler (as also possibly
581 other compilers) generate class/function/member names with
582 embedded double-colons if they are inside namespaces. To
583 handle this, we loop a few times, considering larger and
584 larger prefixes of the string as though they were single
585 symbols. So, if the initially supplied string is
586 A::B::C::D::foo, we have to look up "A", then "A::B",
587 then "A::B::C", then "A::B::C::D", and finally
588 "A::B::C::D::foo" as single, monolithic symbols, because
589 A, B, C or D may be namespaces.
590
591 Note that namespaces can nest only inside other
592 namespaces, and not inside classes. So we need only
593 consider *prefixes* of the string; there is no need to look up
594 "B::C" separately as a symbol in the previous example. */
595
596 register char * p;
597 char * start, * end;
598 char * prefix = NULL;
599 char * tmp;
600 struct symbol * sym_class = NULL;
601 struct symbol * sym_var = NULL;
602 struct type * t;
603 register int i;
604 int colons_found = 0;
605 int prefix_len = 0;
606 int done = 0;
607 char * q;
608
609 /* Check for HP-compiled executable -- in other cases
610 return NULL, and caller must default to standard GDB
611 behaviour. */
612
613 if (!hp_som_som_object_present)
614 return (struct symbol *) NULL;
615
616 p = name;
617
618 /* Skip over whitespace and possible global "::" */
619 while (*p && (*p == ' ' || *p == '\t')) p++;
620 if (p[0] == ':' && p[1] == ':')
621 p += 2;
622 while (*p && (*p == ' ' || *p == '\t')) p++;
623
624 while (1)
625 {
626 /* Get to the end of the next namespace or class spec. */
627 /* If we're looking at some non-token, fail immediately */
628 start = p;
629 if (!(isalpha (*p) || *p == '$' || *p == '_'))
630 return (struct symbol *) NULL;
631 p++;
632 while (*p && (isalnum (*p) || *p == '$' || *p == '_')) p++;
633
634 if (*p == '<')
635 {
636 /* If we have the start of a template specification,
637 scan right ahead to its end */
638 q = find_template_name_end (p);
639 if (q)
640 p = q;
641 }
642
643 end = p;
644
645 /* Skip over "::" and whitespace for next time around */
646 while (*p && (*p == ' ' || *p == '\t')) p++;
647 if (p[0] == ':' && p[1] == ':')
648 p += 2;
649 while (*p && (*p == ' ' || *p == '\t')) p++;
650
651 /* Done with tokens? */
652 if (!*p || !(isalpha (*p) || *p == '$' || *p == '_'))
653 done = 1;
654
655 tmp = (char *) alloca (prefix_len + end - start + 3);
656 if (prefix)
657 {
658 memcpy (tmp, prefix, prefix_len);
659 memcpy (tmp + prefix_len, coloncolon, 2);
660 memcpy (tmp + prefix_len + 2, start, end - start);
661 tmp[prefix_len + 2 + end - start] = '\000';
662 }
663 else
664 {
665 memcpy (tmp, start, end - start);
666 tmp[end - start] = '\000';
667 }
668
669 prefix = tmp;
670 prefix_len = strlen (prefix);
671
672 /* See if the prefix we have now is something we know about */
673
674 if (!done)
675 {
676 /* More tokens to process, so this must be a class/namespace */
677 sym_class = lookup_symbol (prefix, 0, STRUCT_NAMESPACE,
678 0, (struct symtab **) NULL);
679 }
680 else
681 {
682 /* No more tokens, so try as a variable first */
683 sym_var = lookup_symbol (prefix, 0, VAR_NAMESPACE,
684 0, (struct symtab **) NULL);
685 /* If failed, try as class/namespace */
686 if (!sym_var)
687 sym_class = lookup_symbol (prefix, 0, STRUCT_NAMESPACE,
688 0, (struct symtab **) NULL);
689 }
690
691 if (sym_var ||
692 (sym_class &&
693 (t = check_typedef (SYMBOL_TYPE (sym_class)),
694 (TYPE_CODE (t) == TYPE_CODE_STRUCT
695 || TYPE_CODE (t) == TYPE_CODE_UNION))))
696 {
697 /* We found a valid token */
698 *token = (char *) xmalloc (prefix_len + 1 );
699 memcpy (*token, prefix, prefix_len);
700 (*token)[prefix_len] = '\000';
701 break;
702 }
703
704 /* No variable or class/namespace found, no more tokens */
705 if (done)
706 return (struct symbol *) NULL;
707 }
708
709 /* Out of loop, so we must have found a valid token */
710 if (sym_var)
711 *class_prefix = 0;
712 else
713 *class_prefix = 1;
714
715 if (argptr)
716 *argptr = done ? p : end;
717
718 return sym_var ? sym_var : sym_class; /* found */
719 }
720
721 char *
722 find_template_name_end (p)
723 char * p;
724 {
725 int depth = 1;
726 int just_seen_right = 0;
727 int just_seen_colon = 0;
728 int just_seen_space = 0;
729
730 if (!p || (*p != '<'))
731 return 0;
732
733 while (*++p)
734 {
735 switch (*p)
736 {
737 case '\'': case '\"':
738 case '{': case '}':
739 /* In future, may want to allow these?? */
740 return 0;
741 case '<':
742 depth++; /* start nested template */
743 if (just_seen_colon || just_seen_right || just_seen_space)
744 return 0; /* but not after : or :: or > or space */
745 break;
746 case '>':
747 if (just_seen_colon || just_seen_right)
748 return 0; /* end a (nested?) template */
749 just_seen_right = 1; /* but not after : or :: */
750 if (--depth == 0) /* also disallow >>, insist on > > */
751 return ++p; /* if outermost ended, return */
752 break;
753 case ':':
754 if (just_seen_space || (just_seen_colon > 1))
755 return 0; /* nested class spec coming up */
756 just_seen_colon++; /* we allow :: but not :::: */
757 break;
758 case ' ':
759 break;
760 default:
761 if (!((*p >= 'a' && *p <= 'z') || /* allow token chars */
762 (*p >= 'A' && *p <= 'Z') ||
763 (*p >= '0' && *p <= '9') ||
764 (*p == '_') || (*p == ',') || /* commas for template args */
765 (*p == '&') || (*p == '*') || /* pointer and ref types */
766 (*p == '(') || (*p == ')') || /* function types */
767 (*p == '[') || (*p == ']') )) /* array types */
768 return 0;
769 }
770 if (*p != ' ')
771 just_seen_space = 0;
772 if (*p != ':')
773 just_seen_colon = 0;
774 if (*p != '>')
775 just_seen_right = 0;
776 }
777 return 0;
778 }
779
780
781 \f
782 /* Return a null-terminated temporary copy of the name
783 of a string token. */
784
785 char *
786 copy_name (token)
787 struct stoken token;
788 {
789 memcpy (namecopy, token.ptr, token.length);
790 namecopy[token.length] = 0;
791 return namecopy;
792 }
793 \f
794 /* Reverse an expression from suffix form (in which it is constructed)
795 to prefix form (in which we can conveniently print or execute it). */
796
797 static void
798 prefixify_expression (expr)
799 register struct expression *expr;
800 {
801 register int len =
802 sizeof (struct expression) + EXP_ELEM_TO_BYTES (expr->nelts);
803 register struct expression *temp;
804 register int inpos = expr->nelts, outpos = 0;
805
806 temp = (struct expression *) alloca (len);
807
808 /* Copy the original expression into temp. */
809 memcpy (temp, expr, len);
810
811 prefixify_subexp (temp, expr, inpos, outpos);
812 }
813
814 /* Return the number of exp_elements in the subexpression of EXPR
815 whose last exp_element is at index ENDPOS - 1 in EXPR. */
816
817 int
818 length_of_subexp (expr, endpos)
819 register struct expression *expr;
820 register int endpos;
821 {
822 register int oplen = 1;
823 register int args = 0;
824 register int i;
825
826 if (endpos < 1)
827 error ("?error in length_of_subexp");
828
829 i = (int) expr->elts[endpos - 1].opcode;
830
831 switch (i)
832 {
833 /* C++ */
834 case OP_SCOPE:
835 oplen = longest_to_int (expr->elts[endpos - 2].longconst);
836 oplen = 5 + BYTES_TO_EXP_ELEM (oplen + 1);
837 break;
838
839 case OP_LONG:
840 case OP_DOUBLE:
841 case OP_VAR_VALUE:
842 oplen = 4;
843 break;
844
845 case OP_TYPE:
846 case OP_BOOL:
847 case OP_LAST:
848 case OP_REGISTER:
849 case OP_INTERNALVAR:
850 oplen = 3;
851 break;
852
853 case OP_COMPLEX:
854 oplen = 1;
855 args = 2;
856 break;
857
858 case OP_FUNCALL:
859 case OP_F77_UNDETERMINED_ARGLIST:
860 oplen = 3;
861 args = 1 + longest_to_int (expr->elts[endpos - 2].longconst);
862 break;
863
864 case UNOP_MAX:
865 case UNOP_MIN:
866 oplen = 3;
867 break;
868
869 case BINOP_VAL:
870 case UNOP_CAST:
871 case UNOP_MEMVAL:
872 oplen = 3;
873 args = 1;
874 break;
875
876 case UNOP_ABS:
877 case UNOP_CAP:
878 case UNOP_CHR:
879 case UNOP_FLOAT:
880 case UNOP_HIGH:
881 case UNOP_ODD:
882 case UNOP_ORD:
883 case UNOP_TRUNC:
884 oplen = 1;
885 args = 1;
886 break;
887
888 case OP_LABELED:
889 case STRUCTOP_STRUCT:
890 case STRUCTOP_PTR:
891 args = 1;
892 /* fall through */
893 case OP_M2_STRING:
894 case OP_STRING:
895 case OP_NAME:
896 case OP_EXPRSTRING:
897 oplen = longest_to_int (expr->elts[endpos - 2].longconst);
898 oplen = 4 + BYTES_TO_EXP_ELEM (oplen + 1);
899 break;
900
901 case OP_BITSTRING:
902 oplen = longest_to_int (expr->elts[endpos - 2].longconst);
903 oplen = (oplen + HOST_CHAR_BIT - 1) / HOST_CHAR_BIT;
904 oplen = 4 + BYTES_TO_EXP_ELEM (oplen);
905 break;
906
907 case OP_ARRAY:
908 oplen = 4;
909 args = longest_to_int (expr->elts[endpos - 2].longconst);
910 args -= longest_to_int (expr->elts[endpos - 3].longconst);
911 args += 1;
912 break;
913
914 case TERNOP_COND:
915 case TERNOP_SLICE:
916 case TERNOP_SLICE_COUNT:
917 args = 3;
918 break;
919
920 /* Modula-2 */
921 case MULTI_SUBSCRIPT:
922 oplen = 3;
923 args = 1 + longest_to_int (expr->elts[endpos- 2].longconst);
924 break;
925
926 case BINOP_ASSIGN_MODIFY:
927 oplen = 3;
928 args = 2;
929 break;
930
931 /* C++ */
932 case OP_THIS:
933 oplen = 2;
934 break;
935
936 default:
937 args = 1 + (i < (int) BINOP_END);
938 }
939
940 while (args > 0)
941 {
942 oplen += length_of_subexp (expr, endpos - oplen);
943 args--;
944 }
945
946 return oplen;
947 }
948
949 /* Copy the subexpression ending just before index INEND in INEXPR
950 into OUTEXPR, starting at index OUTBEG.
951 In the process, convert it from suffix to prefix form. */
952
953 static void
954 prefixify_subexp (inexpr, outexpr, inend, outbeg)
955 register struct expression *inexpr;
956 struct expression *outexpr;
957 register int inend;
958 int outbeg;
959 {
960 register int oplen = 1;
961 register int args = 0;
962 register int i;
963 int *arglens;
964 enum exp_opcode opcode;
965
966 /* Compute how long the last operation is (in OPLEN),
967 and also how many preceding subexpressions serve as
968 arguments for it (in ARGS). */
969
970 opcode = inexpr->elts[inend - 1].opcode;
971 switch (opcode)
972 {
973 /* C++ */
974 case OP_SCOPE:
975 oplen = longest_to_int (inexpr->elts[inend - 2].longconst);
976 oplen = 5 + BYTES_TO_EXP_ELEM (oplen + 1);
977 break;
978
979 case OP_LONG:
980 case OP_DOUBLE:
981 case OP_VAR_VALUE:
982 oplen = 4;
983 break;
984
985 case OP_TYPE:
986 case OP_BOOL:
987 case OP_LAST:
988 case OP_REGISTER:
989 case OP_INTERNALVAR:
990 oplen = 3;
991 break;
992
993 case OP_COMPLEX:
994 oplen = 1;
995 args = 2;
996 break;
997
998 case OP_FUNCALL:
999 case OP_F77_UNDETERMINED_ARGLIST:
1000 oplen = 3;
1001 args = 1 + longest_to_int (inexpr->elts[inend - 2].longconst);
1002 break;
1003
1004 case UNOP_MIN:
1005 case UNOP_MAX:
1006 oplen = 3;
1007 break;
1008
1009 case UNOP_CAST:
1010 case UNOP_MEMVAL:
1011 oplen = 3;
1012 args = 1;
1013 break;
1014
1015 case UNOP_ABS:
1016 case UNOP_CAP:
1017 case UNOP_CHR:
1018 case UNOP_FLOAT:
1019 case UNOP_HIGH:
1020 case UNOP_ODD:
1021 case UNOP_ORD:
1022 case UNOP_TRUNC:
1023 oplen=1;
1024 args=1;
1025 break;
1026
1027 case STRUCTOP_STRUCT:
1028 case STRUCTOP_PTR:
1029 case OP_LABELED:
1030 args = 1;
1031 /* fall through */
1032 case OP_M2_STRING:
1033 case OP_STRING:
1034 case OP_NAME:
1035 case OP_EXPRSTRING:
1036 oplen = longest_to_int (inexpr->elts[inend - 2].longconst);
1037 oplen = 4 + BYTES_TO_EXP_ELEM (oplen + 1);
1038 break;
1039
1040 case OP_BITSTRING:
1041 oplen = longest_to_int (inexpr->elts[inend - 2].longconst);
1042 oplen = (oplen + HOST_CHAR_BIT - 1) / HOST_CHAR_BIT;
1043 oplen = 4 + BYTES_TO_EXP_ELEM (oplen);
1044 break;
1045
1046 case OP_ARRAY:
1047 oplen = 4;
1048 args = longest_to_int (inexpr->elts[inend - 2].longconst);
1049 args -= longest_to_int (inexpr->elts[inend - 3].longconst);
1050 args += 1;
1051 break;
1052
1053 case TERNOP_COND:
1054 case TERNOP_SLICE:
1055 case TERNOP_SLICE_COUNT:
1056 args = 3;
1057 break;
1058
1059 case BINOP_ASSIGN_MODIFY:
1060 oplen = 3;
1061 args = 2;
1062 break;
1063
1064 /* Modula-2 */
1065 case MULTI_SUBSCRIPT:
1066 oplen = 3;
1067 args = 1 + longest_to_int (inexpr->elts[inend - 2].longconst);
1068 break;
1069
1070 /* C++ */
1071 case OP_THIS:
1072 oplen = 2;
1073 break;
1074
1075 default:
1076 args = 1 + ((int) opcode < (int) BINOP_END);
1077 }
1078
1079 /* Copy the final operator itself, from the end of the input
1080 to the beginning of the output. */
1081 inend -= oplen;
1082 memcpy (&outexpr->elts[outbeg], &inexpr->elts[inend],
1083 EXP_ELEM_TO_BYTES (oplen));
1084 outbeg += oplen;
1085
1086 /* Find the lengths of the arg subexpressions. */
1087 arglens = (int *) alloca (args * sizeof (int));
1088 for (i = args - 1; i >= 0; i--)
1089 {
1090 oplen = length_of_subexp (inexpr, inend);
1091 arglens[i] = oplen;
1092 inend -= oplen;
1093 }
1094
1095 /* Now copy each subexpression, preserving the order of
1096 the subexpressions, but prefixifying each one.
1097 In this loop, inend starts at the beginning of
1098 the expression this level is working on
1099 and marches forward over the arguments.
1100 outbeg does similarly in the output. */
1101 for (i = 0; i < args; i++)
1102 {
1103 oplen = arglens[i];
1104 inend += oplen;
1105 prefixify_subexp (inexpr, outexpr, inend, outbeg);
1106 outbeg += oplen;
1107 }
1108 }
1109 \f
1110 /* This page contains the two entry points to this file. */
1111
1112 /* Read an expression from the string *STRINGPTR points to,
1113 parse it, and return a pointer to a struct expression that we malloc.
1114 Use block BLOCK as the lexical context for variable names;
1115 if BLOCK is zero, use the block of the selected stack frame.
1116 Meanwhile, advance *STRINGPTR to point after the expression,
1117 at the first nonwhite character that is not part of the expression
1118 (possibly a null character).
1119
1120 If COMMA is nonzero, stop if a comma is reached. */
1121
1122 struct expression *
1123 parse_exp_1 (stringptr, block, comma)
1124 char **stringptr;
1125 struct block *block;
1126 int comma;
1127 {
1128 struct cleanup *old_chain;
1129
1130 lexptr = *stringptr;
1131
1132 paren_depth = 0;
1133 type_stack_depth = 0;
1134
1135 comma_terminates = comma;
1136
1137 if (lexptr == 0 || *lexptr == 0)
1138 error_no_arg ("expression to compute");
1139
1140 old_chain = make_cleanup ((make_cleanup_func) free_funcalls, 0);
1141 funcall_chain = 0;
1142
1143 expression_context_block = block ? block : get_selected_block ();
1144
1145 namecopy = (char *) alloca (strlen (lexptr) + 1);
1146 expout_size = 10;
1147 expout_ptr = 0;
1148 expout = (struct expression *)
1149 xmalloc (sizeof (struct expression) + EXP_ELEM_TO_BYTES (expout_size));
1150 expout->language_defn = current_language;
1151 make_cleanup ((make_cleanup_func) free_current_contents, &expout);
1152
1153 if (current_language->la_parser ())
1154 current_language->la_error (NULL);
1155
1156 discard_cleanups (old_chain);
1157
1158 /* Record the actual number of expression elements, and then
1159 reallocate the expression memory so that we free up any
1160 excess elements. */
1161
1162 expout->nelts = expout_ptr;
1163 expout = (struct expression *)
1164 xrealloc ((char *) expout,
1165 sizeof (struct expression) + EXP_ELEM_TO_BYTES (expout_ptr));;
1166
1167 /* Convert expression from postfix form as generated by yacc
1168 parser, to a prefix form. */
1169
1170 if (expressiondebug)
1171 dump_prefix_expression (expout, gdb_stdout,
1172 "before conversion to prefix form");
1173
1174 prefixify_expression (expout);
1175
1176 if (expressiondebug)
1177 dump_postfix_expression (expout, gdb_stdout,
1178 "after conversion to prefix form");
1179
1180 *stringptr = lexptr;
1181 return expout;
1182 }
1183
1184 /* Parse STRING as an expression, and complain if this fails
1185 to use up all of the contents of STRING. */
1186
1187 struct expression *
1188 parse_expression (string)
1189 char *string;
1190 {
1191 register struct expression *exp;
1192 exp = parse_exp_1 (&string, 0, 0);
1193 if (*string)
1194 error ("Junk after end of expression.");
1195 return exp;
1196 }
1197 \f
1198 /* Stuff for maintaining a stack of types. Currently just used by C, but
1199 probably useful for any language which declares its types "backwards". */
1200
1201 void
1202 push_type (tp)
1203 enum type_pieces tp;
1204 {
1205 if (type_stack_depth == type_stack_size)
1206 {
1207 type_stack_size *= 2;
1208 type_stack = (union type_stack_elt *)
1209 xrealloc ((char *) type_stack, type_stack_size * sizeof (*type_stack));
1210 }
1211 type_stack[type_stack_depth++].piece = tp;
1212 }
1213
1214 void
1215 push_type_int (n)
1216 int n;
1217 {
1218 if (type_stack_depth == type_stack_size)
1219 {
1220 type_stack_size *= 2;
1221 type_stack = (union type_stack_elt *)
1222 xrealloc ((char *) type_stack, type_stack_size * sizeof (*type_stack));
1223 }
1224 type_stack[type_stack_depth++].int_val = n;
1225 }
1226
1227 enum type_pieces
1228 pop_type ()
1229 {
1230 if (type_stack_depth)
1231 return type_stack[--type_stack_depth].piece;
1232 return tp_end;
1233 }
1234
1235 int
1236 pop_type_int ()
1237 {
1238 if (type_stack_depth)
1239 return type_stack[--type_stack_depth].int_val;
1240 /* "Can't happen". */
1241 return 0;
1242 }
1243
1244 /* Pop the type stack and return the type which corresponds to FOLLOW_TYPE
1245 as modified by all the stuff on the stack. */
1246 struct type *
1247 follow_types (follow_type)
1248 struct type *follow_type;
1249 {
1250 int done = 0;
1251 int array_size;
1252 struct type *range_type;
1253
1254 while (!done)
1255 switch (pop_type ())
1256 {
1257 case tp_end:
1258 done = 1;
1259 break;
1260 case tp_pointer:
1261 follow_type = lookup_pointer_type (follow_type);
1262 break;
1263 case tp_reference:
1264 follow_type = lookup_reference_type (follow_type);
1265 break;
1266 case tp_array:
1267 array_size = pop_type_int ();
1268 /* FIXME-type-allocation: need a way to free this type when we are
1269 done with it. */
1270 range_type =
1271 create_range_type ((struct type *) NULL,
1272 builtin_type_int, 0,
1273 array_size >= 0 ? array_size - 1 : 0);
1274 follow_type =
1275 create_array_type ((struct type *) NULL,
1276 follow_type, range_type);
1277 if (array_size < 0)
1278 TYPE_ARRAY_UPPER_BOUND_TYPE(follow_type)
1279 = BOUND_CANNOT_BE_DETERMINED;
1280 break;
1281 case tp_function:
1282 /* FIXME-type-allocation: need a way to free this type when we are
1283 done with it. */
1284 follow_type = lookup_function_type (follow_type);
1285 break;
1286 }
1287 return follow_type;
1288 }
1289 \f
1290 static void build_parse PARAMS ((void));
1291 static void
1292 build_parse ()
1293 {
1294 int i;
1295
1296 msym_text_symbol_type =
1297 init_type (TYPE_CODE_FUNC, 1, 0, "<text variable, no debug info>", NULL);
1298 TYPE_TARGET_TYPE (msym_text_symbol_type) = builtin_type_int;
1299 msym_data_symbol_type =
1300 init_type (TYPE_CODE_INT, TARGET_INT_BIT / HOST_CHAR_BIT, 0,
1301 "<data variable, no debug info>", NULL);
1302 msym_unknown_symbol_type =
1303 init_type (TYPE_CODE_INT, 1, 0,
1304 "<variable (not text or data), no debug info>",
1305 NULL);
1306
1307 /* create the std_regs table */
1308
1309 num_std_regs = 0;
1310 #ifdef PC_REGNUM
1311 if (PC_REGNUM >= 0)
1312 num_std_regs++;
1313 #endif
1314 #ifdef FP_REGNUM
1315 if (FP_REGNUM >= 0)
1316 num_std_regs++;
1317 #endif
1318 #ifdef FP_REGNUM
1319 if (SP_REGNUM >= 0)
1320 num_std_regs++;
1321 #endif
1322 #ifdef PS_REGNUM
1323 if (PS_REGNUM >= 0)
1324 num_std_regs++;
1325 #endif
1326 /* create an empty table */
1327 std_regs = xmalloc ((num_std_regs + 1) * sizeof *std_regs);
1328 i = 0;
1329 /* fill it in */
1330 #ifdef PC_REGNUM
1331 std_regs[i].name = "pc";
1332 std_regs[i].regnum = PC_REGNUM;
1333 i++;
1334 #endif
1335 #ifdef FP_REGNUM
1336 std_regs[i].name = "fp";
1337 std_regs[i].regnum = FP_REGNUM;
1338 i++;
1339 #endif
1340 #ifdef SP_REGNUM
1341 std_regs[i].name = "sp";
1342 std_regs[i].regnum = SP_REGNUM;
1343 i++;
1344 #endif
1345 #ifdef PS_REGNUM
1346 std_regs[i].name = "ps";
1347 std_regs[i].regnum = PS_REGNUM;
1348 i++;
1349 #endif
1350 memset (&std_regs[i], 0, sizeof (std_regs[i]));
1351 }
1352
1353 void
1354 _initialize_parse ()
1355 {
1356 type_stack_size = 80;
1357 type_stack_depth = 0;
1358 type_stack = (union type_stack_elt *)
1359 xmalloc (type_stack_size * sizeof (*type_stack));
1360
1361 build_parse ();
1362
1363 add_show_from_set (
1364 add_set_cmd ("expressiondebug", class_maintenance, var_zinteger,
1365 (char *)&expressiondebug,
1366 "Set expression debugging.\n\
1367 When non-zero, the internal representation of expressions will be printed.",
1368 &setlist),
1369 &showlist);
1370 }