* parser-defs.h (write_exp_msymbol): Remove TEXT_SYMBOL_TYPE
[deliverable/binutils-gdb.git] / gdb / ada-lex.l
CommitLineData
14f9c5c9 1/* FLEX lexer for Ada expressions, for GDB.
9b254dd1 2 Copyright (C) 1994, 1997, 1998, 2000, 2001, 2002, 2003, 2007, 2008
14f9c5c9
AS
3 Free Software Foundation, Inc.
4
5This file is part of GDB.
6
7This program is free software; you can redistribute it and/or modify
8it under the terms of the GNU General Public License as published by
9the Free Software Foundation; either version 2 of the License, or
10(at your option) any later version.
11
12This program is distributed in the hope that it will be useful,
13but WITHOUT ANY WARRANTY; without even the implied warranty of
14MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15GNU General Public License for more details.
16
17You should have received a copy of the GNU General Public License
18along with this program; if not, write to the Free Software
197e01b6
EZ
19Foundation, Inc., 51 Franklin Street, Fifth Floor,
20Boston, MA 02110-1301, USA. */
14f9c5c9
AS
21
22/*----------------------------------------------------------------------*/
23
24/* The converted version of this file is to be included in ada-exp.y, */
25/* the Ada parser for gdb. The function yylex obtains characters from */
26/* the global pointer lexptr. It returns a syntactic category for */
27/* each successive token and places a semantic value into yylval */
28/* (ada-lval), defined by the parser. */
29
14f9c5c9
AS
/* Named sub-patterns used by the rules section.  Because of
   "%option case-insensitive" further down, the lower-case letter ranges
   in these patterns also match upper-case input.  */
30DIG [0-9]
/* NUM10: a run of decimal digits that may contain underscores after the
   first digit.  */
31NUM10 ({DIG}({DIG}|_)*)
32HEXDIG [0-9a-f]
/* NUM16: like NUM10, but built from HEXDIG.  */
33NUM16 ({HEXDIG}({HEXDIG}|_)*)
34OCTDIG [0-7]
35LETTER [a-z_]
/* ID: a LETTER followed by LETTERs and DIGs, either bare or wrapped in
   angle brackets.  */
36ID ({LETTER}({LETTER}|{DIG})*|"<"{LETTER}({LETTER}|{DIG})*">")
37WHITE [ \t\n]
/* TICK: a single quote followed by optional whitespace.  */
38TICK ("'"{WHITE}*)
/* GRAPHIC: the characters accepted inside character and string literals
   by the rules below.  */
39GRAPHIC [a-z0-9 #&'()*+,-./:;<>=_|!$%?@\[\]\\^`{}~]
/* OPER: operator symbols and operator keywords; the name rule accepts
   one of these between double quotes as a name component.  */
40OPER ([-+*/=<>&]|"<="|">="|"**"|"/="|"and"|"or"|"xor"|"not"|"mod"|"rem"|"abs")
41
/* EXP requires an explicit sign after the e; POSEXP accepts only an
   optional plus sign.  */
42EXP (e[+-]{NUM10})
43POSEXP (e"+"?{NUM10})
44
45%{
4c4b4cd2 46
14f9c5c9
AS
/* Size in bytes of numbuf, the staging buffer for numeric literals.  */
47#define NUMERAL_WIDTH 256
/* Mask with only the most significant bit of a LONGEST-sized word set.  */
48#define LONGEST_SIGN ((ULONGEST) 1 << (sizeof(LONGEST) * HOST_CHAR_BIT - 1))
49
4c4b4cd2
PH
50/* Temporary staging for numeric literals. */
51static char numbuf[NUMERAL_WIDTH];
/* NOTE(review): canonicalizeNumeral takes no length argument, so nothing
   visible in this file limits a literal to NUMERAL_WIDTH - 1 characters;
   confirm that token length is bounded elsewhere.  */
52 static void canonicalizeNumeral (char *s1, const char *);
52ce6436 53static struct stoken processString (const char*, int);
4c4b4cd2
PH
54static int processInt (const char *, const char *, const char *);
55static int processReal (const char *);
52ce6436 56static struct stoken processId (const char *, int);
4c4b4cd2
PH
57static int processAttribute (const char *);
58static int find_dot_all (const char *);
14f9c5c9
AS
59
/* Make the generated scanner a file-local function taking no
   arguments.  */
60#undef YY_DECL
4c4b4cd2 61#define YY_DECL static int yylex ( void )
14f9c5c9
AS
62
/* Feed the scanner one character per call from the global lexptr,
   advancing lexptr past it.  A NUL byte is reported as end of input
   (YY_NULL) and is not consumed.  MAX_SIZE is unused.  */
63#undef YY_INPUT
64#define YY_INPUT(BUF, RESULT, MAX_SIZE) \
65 if ( *lexptr == '\000' ) \
66 (RESULT) = YY_NULL; \
67 else \
68 { \
69 *(BUF) = *lexptr; \
70 (RESULT) = 1; \
71 lexptr += 1; \
72 }
73
/* NOTE(review): this repeats the find_dot_all prototype already given
   above; one of the two is redundant.  */
4c4b4cd2 74static int find_dot_all (const char *);
14f9c5c9
AS
75
76%}
77
7dc1ef8d
PH
78%option case-insensitive interactive nodefault
79
/* BEFORE_QUAL_QUOTE is entered by the name rule when a name is directly
   followed by a quote; in that state a lone quote is returned as a token
   and the state is reset to INITIAL.  The character-literal rules are
   restricted to INITIAL.  */
52ce6436 80%s BEFORE_QUAL_QUOTE
14f9c5c9
AS
81
82%%
83
 /* Whitespace between tokens is discarded.  */
84{WHITE} { }
85
 /* Two dashes followed by the rest of the line: scanning stops here
    (yyterminate).  */
86"--".* { yyterminate(); }
87
4c4b4cd2
PH
 /* Decimal integer with exponent.  The literal is normalized into numbuf
    (underscores dropped, letters lower-cased), then the digits and the
    text following the last e are handed to processInt separately.  */
88{NUM10}{POSEXP} {
89 canonicalizeNumeral (numbuf, yytext);
14f9c5c9
AS
90 return processInt (NULL, numbuf, strrchr(numbuf, 'e')+1);
91 }
92
4c4b4cd2
PH
 /* Plain decimal integer: default base, no exponent.  */
93{NUM10} {
94 canonicalizeNumeral (numbuf, yytext);
14f9c5c9
AS
95 return processInt (NULL, numbuf, NULL);
96 }
97
98{NUM10}"#"{HEXDIG}({HEXDIG}|_)*"#"{POSEXP} {
99 canonicalizeNumeral (numbuf, yytext);
100 return processInt (numbuf,
4c4b4cd2 101 strchr (numbuf, '#') + 1,
14f9c5c9
AS
102 strrchr(numbuf, '#') + 1);
103 }
104
 /* Based integer without exponent: the base is read from the start of
    numbuf and the digits from just after the first # character.  */
105{NUM10}"#"{HEXDIG}({HEXDIG}|_)*"#" {
106 canonicalizeNumeral (numbuf, yytext);
107 return processInt (numbuf, strchr (numbuf, '#') + 1, NULL);
108 }
109
 /* Hexadecimal literal with a 0x prefix: the prefix is skipped and
    base 16 is passed explicitly.  */
110"0x"{HEXDIG}+ {
111 canonicalizeNumeral (numbuf, yytext+2);
112 return processInt ("16#", numbuf, NULL);
113 }
114
115
 /* Decimal real literals, with and without a signed exponent.  */
116{NUM10}"."{NUM10}{EXP} {
4c4b4cd2 117 canonicalizeNumeral (numbuf, yytext);
14f9c5c9
AS
118 return processReal (numbuf);
119 }
120
121{NUM10}"."{NUM10} {
4c4b4cd2 122 canonicalizeNumeral (numbuf, yytext);
14f9c5c9
AS
123 return processReal (numbuf);
124 }
125
 /* Based real literals are recognized only so that a specific error can
    be reported.  */
126{NUM10}"#"{NUM16}"."{NUM16}"#"{EXP} {
e1d5a0d2 127 error (_("Based real literals not implemented yet."));
14f9c5c9
AS
128 }
129
130{NUM10}"#"{NUM16}"."{NUM16}"#" {
e1d5a0d2 131 error (_("Based real literals not implemented yet."));
14f9c5c9
AS
132 }
133
 /* Character literal holding one graphic character or a double quote.
    Active only in the INITIAL state.  */
134<INITIAL>"'"({GRAPHIC}|\")"'" {
72d5681a 135 yylval.typed_val.type = type_char ();
14f9c5c9
AS
136 yylval.typed_val.val = yytext[1];
137 return CHARLIT;
138 }
139
 /* Character literal written as two hexadecimal digits inside bracket
    and double-quote delimiters; yytext+3 is the first hex digit.
    NOTE(review): the %2x conversion stores through a pointer to int,
    while the C standard specifies unsigned int for %x.  */
140<INITIAL>"'[\""{HEXDIG}{2}"\"]'" {
141 int v;
72d5681a 142 yylval.typed_val.type = type_char ();
14f9c5c9
AS
143 sscanf (yytext+3, "%2x", &v);
144 yylval.typed_val.val = v;
145 return CHARLIT;
146 }
147
52ce6436
PH
 /* String literal.  The surrounding double quotes are stripped before
    the contents are passed to processString.  */
148\"({GRAPHIC}|"[\""({HEXDIG}{2}|\")"\"]")*\" {
149 yylval.sval = processString (yytext+1, yyleng-2);
14f9c5c9
AS
150 return STRING;
151 }
152
 /* A double quote that did not start a well-formed string literal.  */
52ce6436 153\" {
e1d5a0d2 154 error (_("ill-formed or non-terminated string literal"));
14f9c5c9
AS
155 }
156
14f9c5c9 157
4c4b4cd2
PH
 /* The word "if" ends the expression: lexptr is moved back until it
    points at the letter i, the scanner is reset, and 0 is returned.
    NOTE(review): presumably this leaves the "if" for the caller to
    parse -- confirm against the callers of the parser.  */
158if {
159 while (*lexptr != 'i' && *lexptr != 'I')
160 lexptr -= 1;
161 yyrestart(NULL);
14f9c5c9
AS
162 return 0;
163 }
164
165 /* ADA KEYWORDS */
166
167abs { return ABS; }
168and { return _AND_; }
169else { return ELSE; }
170in { return IN; }
171mod { return MOD; }
172new { return NEW; }
173not { return NOT; }
174null { return NULL_PTR; }
175or { return OR; }
52ce6436 176others { return OTHERS; }
14f9c5c9
AS
177rem { return REM; }
178then { return THEN; }
179xor { return XOR; }
180
690cc4eb
PH
181 /* BOOLEAN "KEYWORDS" */
182
183 /* True and False are not keywords in Ada, but rather enumeration constants.
184 However, the boolean type is no longer represented as an enum, so True
185 and False are no longer defined in symbol tables. We compromise by
186 making them keywords (when bare). */
187
188true { return TRUEKEYWORD; }
189false { return FALSEKEYWORD; }
190
14f9c5c9
AS
191 /* ATTRIBUTES */
192
 /* NOTE(review): TICK may match whitespace after the quote, and yytext+1
    skips only the quote, so that whitespace is part of the string handed
    to processAttribute.  */
193{TICK}[a-zA-Z][a-zA-Z]+ { return processAttribute (yytext+1); }
194
195 /* PUNCTUATION */
196
197"=>" { return ARROW; }
198".." { return DOTDOT; }
199"**" { return STARSTAR; }
200":=" { return ASSIGN; }
201"/=" { return NOTEQUAL; }
202"<=" { return LEQ; }
203">=" { return GEQ; }
204
 /* After a name that was followed by a quote (see the name rule), the
    quote itself is returned as a token and the state goes back to
    INITIAL.  */
205<BEFORE_QUAL_QUOTE>"'" { BEGIN INITIAL; return '\''; }
206
207[-&*+./:<>=|;\[\]] { return yytext[0]; }
208
 /* A comma outside all parentheses ends the expression when
    comma_terminates is set: the comma is given back (lexptr -= 1), the
    scanner is reset, and 0 is returned.  */
209"," { if (paren_depth == 0 && comma_terminates)
210 {
211 lexptr -= 1;
212 yyrestart(NULL);
213 return 0;
214 }
4c4b4cd2 215 else
14f9c5c9
AS
216 return ',';
217 }
218
 /* paren_depth counts currently open parentheses.  A closing parenthesis
    with none open is given back and ends the expression in the same way
    as a terminating comma.  */
219"(" { paren_depth += 1; return '('; }
4c4b4cd2 220")" { if (paren_depth == 0)
14f9c5c9
AS
221 {
222 lexptr -= 1;
223 yyrestart(NULL);
224 return 0;
225 }
4c4b4cd2 226 else
14f9c5c9 227 {
4c4b4cd2 228 paren_depth -= 1;
14f9c5c9
AS
229 return ')';
230 }
231 }
232
233"."{WHITE}*all { return DOT_ALL; }
234
 /* A dot followed by an identifier: the identifier text after the dot is
    canonicalized by processId.  */
4c4b4cd2 235"."{WHITE}*{ID} {
52ce6436 236 yylval.sval = processId (yytext+1, yyleng-1);
4c4b4cd2 237 return DOT_ID;
14f9c5c9
AS
238 }
239
 /* Possibly dotted name, optionally followed by a quote.  If the match
    contains a ".all" component (as located by find_dot_all), everything
    from that dot onward is given back with yyless.  Otherwise, if the
    match ends in a quote, the quote is given back and the scanner
    enters BEFORE_QUAL_QUOTE so that the quote is returned as its own
    token.  What remains in yytext is canonicalized by processId.  */
4c4b4cd2 240{ID}({WHITE}*"."{WHITE}*({ID}|\"{OPER}\"))*(" "*"'")? {
14f9c5c9 241 int all_posn = find_dot_all (yytext);
14f9c5c9 242
4c4b4cd2 243 if (all_posn == -1 && yytext[yyleng-1] == '\'')
14f9c5c9 244 {
52ce6436
PH
245 BEGIN BEFORE_QUAL_QUOTE;
246 yyless (yyleng-1);
14f9c5c9 247 }
52ce6436 248 else if (all_posn >= 0)
14f9c5c9 249 yyless (all_posn);
52ce6436
PH
250 yylval.sval = processId (yytext, yyleng);
251 return NAME;
252 }
14f9c5c9 253
14f9c5c9 254
52ce6436 255 /* GDB EXPRESSION CONSTRUCTS */
14f9c5c9
AS
256
 /* Text in single quotes followed by a double colon: the two colons are
    given back with yyless and the quoted text is returned as a NAME.  */
257"'"[^']+"'"{WHITE}*:: {
52ce6436
PH
258 yyless (yyleng - 2);
259 yylval.sval = processId (yytext, yyleng);
260 return NAME;
14f9c5c9
AS
261 }
262
52ce6436 263"::" { return COLONCOLON; }
14f9c5c9
AS
264
265[{}@] { return yytext[0]; }
266
14f9c5c9
AS
267 /* REGISTERS AND GDB CONVENIENCE VARIABLES */
268
 /* The token value points directly at yytext (no copy is made) and
    includes the leading dollar sign.  */
4c4b4cd2 269"$"({LETTER}|{DIG}|"$")* {
14f9c5c9
AS
270 yylval.sval.ptr = yytext;
271 yylval.sval.length = yyleng;
4c4b4cd2 272 return SPECIAL_VARIABLE;
14f9c5c9
AS
273 }
274
275 /* CATCH-ALL ERROR CASE */
276
e1d5a0d2 277. { error (_("Invalid character '%s' in expression."), yytext); }
14f9c5c9
AS
278%%
279
280#include <ctype.h>
19c1ef65 281#include "gdb_string.h"
14f9c5c9 282
52ce6436
PH
283/* Initialize the lexer for processing new expression. */
284
14f9c5c9 285void
4c4b4cd2 286lexer_init (FILE *inp)
14f9c5c9
AS
287{
288 BEGIN INITIAL;
289 yyrestart (inp);
290}
291
292
/* Copy S2 to S1, removing all underscores, and downcasing all letters.
   S1 is always NUL-terminated on return.  No bound is checked: S1 must
   have room for strlen (S2) + 1 bytes.  */

static void
canonicalizeNumeral (char *s1, const char *s2)
{
  for (; *s2 != '\000'; s2 += 1)
    {
      if (*s2 != '_')
	{
	  /* The <ctype.h> functions require a value representable as
	     unsigned char (or EOF); a plain char may be negative.  */
	  *s1 = (char) tolower ((unsigned char) *s2);
	  s1 += 1;
	}
    }
  s1[0] = '\000';
}
308
14f9c5c9
AS
309/* Interprets the prefix of NUM that consists of digits of the given BASE
310 as an integer of that BASE, with the string EXP as an exponent.
311 Puts value in yylval, and returns INT, if the string is valid. Causes
4c4b4cd2 312 an error if the number is improperly formated. BASE, if NULL, defaults
52ce6436
PH
313 to "10", and EXP to "1". The EXP does not contain a leading 'e' or 'E'.
314 */
14f9c5c9
AS
315
316static int
4c4b4cd2 317processInt (const char *base0, const char *num0, const char *exp0)
14f9c5c9
AS
318{
319 ULONGEST result;
320 long exp;
321 int base;
322
4c4b4cd2 323 char *trailer;
14f9c5c9
AS
324
325 if (base0 == NULL)
326 base = 10;
327 else
4c4b4cd2
PH
328 {
329 base = strtol (base0, (char **) NULL, 10);
14f9c5c9 330 if (base < 2 || base > 16)
e1d5a0d2 331 error (_("Invalid base: %d."), base);
14f9c5c9
AS
332 }
333
334 if (exp0 == NULL)
335 exp = 0;
336 else
4c4b4cd2 337 exp = strtol(exp0, (char **) NULL, 10);
14f9c5c9
AS
338
339 errno = 0;
4c4b4cd2 340 result = strtoulst (num0, (const char **) &trailer, base);
14f9c5c9 341 if (errno == ERANGE)
e1d5a0d2 342 error (_("Integer literal out of range"));
14f9c5c9 343 if (isxdigit(*trailer))
e1d5a0d2 344 error (_("Invalid digit `%c' in based literal"), *trailer);
14f9c5c9 345
4c4b4cd2 346 while (exp > 0)
14f9c5c9
AS
347 {
348 if (result > (ULONG_MAX / base))
e1d5a0d2 349 error (_("Integer literal out of range"));
14f9c5c9
AS
350 result *= base;
351 exp -= 1;
352 }
4c4b4cd2 353
9a76efb6 354 if ((result >> (gdbarch_int_bit (current_gdbarch)-1)) == 0)
72d5681a 355 yylval.typed_val.type = type_int ();
9a76efb6 356 else if ((result >> (gdbarch_long_bit (current_gdbarch)-1)) == 0)
72d5681a 357 yylval.typed_val.type = type_long ();
9a76efb6 358 else if (((result >> (gdbarch_long_bit (current_gdbarch)-1)) >> 1) == 0)
14f9c5c9
AS
359 {
360 /* We have a number representable as an unsigned integer quantity.
4c4b4cd2 361 For consistency with the C treatment, we will treat it as an
14f9c5c9 362 anonymous modular (unsigned) quantity. Alas, the types are such
4c4b4cd2 363 that we need to store .val as a signed quantity. Sorry
14f9c5c9
AS
364 for the mess, but C doesn't officially guarantee that a simple
365 assignment does the trick (no, it doesn't; read the reference manual).
366 */
367 yylval.typed_val.type = builtin_type_unsigned_long;
368 if (result & LONGEST_SIGN)
4c4b4cd2
PH
369 yylval.typed_val.val =
370 (LONGEST) (result & ~LONGEST_SIGN)
14f9c5c9
AS
371 - (LONGEST_SIGN>>1) - (LONGEST_SIGN>>1);
372 else
373 yylval.typed_val.val = (LONGEST) result;
374 return INT;
375 }
4c4b4cd2 376 else
72d5681a 377 yylval.typed_val.type = type_long_long ();
14f9c5c9
AS
378
379 yylval.typed_val.val = (LONGEST) result;
380 return INT;
381}
382
383static int
4c4b4cd2 384processReal (const char *num0)
14f9c5c9 385{
689e4e2d 386 sscanf (num0, "%" DOUBLEST_SCAN_FORMAT, &yylval.typed_val_float.dval);
14f9c5c9 387
72d5681a 388 yylval.typed_val_float.type = type_float ();
ea06eb3d
UW
389 if (sizeof(DOUBLEST) >= gdbarch_double_bit (current_gdbarch)
390 / TARGET_CHAR_BIT)
72d5681a 391 yylval.typed_val_float.type = type_double ();
ea06eb3d
UW
392 if (sizeof(DOUBLEST) >= gdbarch_long_double_bit (current_gdbarch)
393 / TARGET_CHAR_BIT)
72d5681a 394 yylval.typed_val_float.type = type_long_double ();
14f9c5c9
AS
395
396 return FLOAT;
397}
398
52ce6436
PH
399
400/* Store a canonicalized version of NAME0[0..LEN-1] in yylval.ssym. The
401 resulting string is valid until the next call to ada_parse. It differs
402 from NAME0 in that:
403 + Characters between '...' or <...> are transfered verbatim to
404 yylval.ssym.
405 + <, >, and trailing "'" characters in quoted sequences are removed
406 (a leading quote is preserved to indicate that the name is not to be
407 GNAT-encoded).
408 + Unquoted whitespace is removed.
409 + Unquoted alphabetic characters are mapped to lower case.
410 Result is returned as a struct stoken, but for convenience, the string
411 is also null-terminated. Result string valid until the next call of
412 ada_parse.
413 */
414static struct stoken
4c4b4cd2 415processId (const char *name0, int len)
14f9c5c9 416{
4c4b4cd2 417 char *name = obstack_alloc (&temp_parse_space, len + 11);
14f9c5c9 418 int i0, i;
52ce6436 419 struct stoken result;
4c4b4cd2 420
14f9c5c9
AS
421 while (len > 0 && isspace (name0[len-1]))
422 len -= 1;
423 i = i0 = 0;
4c4b4cd2 424 while (i0 < len)
14f9c5c9
AS
425 {
426 if (isalnum (name0[i0]))
427 {
428 name[i] = tolower (name0[i0]);
429 i += 1; i0 += 1;
430 }
4c4b4cd2 431 else switch (name0[i0])
14f9c5c9
AS
432 {
433 default:
434 name[i] = name0[i0];
435 i += 1; i0 += 1;
436 break;
437 case ' ': case '\t':
438 i0 += 1;
439 break;
440 case '\'':
52ce6436 441 do
14f9c5c9
AS
442 {
443 name[i] = name0[i0];
444 i += 1; i0 += 1;
445 }
52ce6436 446 while (i0 < len && name0[i0] != '\'');
14f9c5c9
AS
447 i0 += 1;
448 break;
449 case '<':
450 i0 += 1;
451 while (i0 < len && name0[i0] != '>')
452 {
453 name[i] = name0[i0];
454 i += 1; i0 += 1;
455 }
456 i0 += 1;
457 break;
458 }
459 }
460 name[i] = '\000';
461
52ce6436
PH
462 result.ptr = name;
463 result.length = i;
464 return result;
14f9c5c9
AS
465}
466
52ce6436
PH
467/* Return TEXT[0..LEN-1], a string literal without surrounding quotes,
468 with special hex character notations replaced with characters.
469 Result valid until the next call to ada_parse. */
14f9c5c9 470
52ce6436
PH
471static struct stoken
472processString (const char *text, int len)
14f9c5c9 473{
52ce6436
PH
474 const char *p;
475 char *q;
476 const char *lim = text + len;
477 struct stoken result;
478
479 q = result.ptr = obstack_alloc (&temp_parse_space, len);
480 p = text;
481 while (p < lim)
14f9c5c9 482 {
52ce6436
PH
483 if (p[0] == '[' && p[1] == '"' && p+2 < lim)
484 {
485 if (p[2] == '"') /* "...["""]... */
486 {
487 *q = '"';
488 p += 4;
489 }
490 else
491 {
492 int chr;
493 sscanf (p+2, "%2x", &chr);
494 *q = (char) chr;
495 p += 5;
496 }
497 }
498 else
499 *q = *p;
500 q += 1;
501 p += 1;
502 }
503 result.length = q - result.ptr;
504 return result;
14f9c5c9
AS
505}
506
/* Returns the position within STR of the '.' in a
   '.{WHITE}*all' component of a dotted name, or -1 if there is none.
   "all" is matched without regard to case, as the lexer itself is
   case-insensitive, and must not be followed by a letter, digit or
   underscore.
   Note: we actually don't need this routine, since 'all' can never be an
   Ada identifier.  Thus, looking up foo.all or foo.all.x as a name
   must fail, and will eventually be interpreted as (foo).all or
   (foo).all.x.  However, this does avoid an extraneous lookup.  */

static int
find_dot_all (const char *str)
{
  int i;

  for (i = 0; str[i] != '\000'; i += 1)
    {
      int j;

      if (str[i] != '.')
	continue;

      /* Look ahead with a separate index so that the outer scan never
	 steps past the terminating NUL when STR ends right after the
	 dot (and any whitespace).  */
      j = i + 1;
      while (isspace ((unsigned char) str[j]))
	j += 1;

      /* The && chain stops at the first mismatch, so a NUL inside the
	 three-letter window ends the test before anything beyond it is
	 read.  */
      if (tolower ((unsigned char) str[j]) == 'a'
	  && tolower ((unsigned char) str[j + 1]) == 'l'
	  && tolower ((unsigned char) str[j + 2]) == 'l'
	  && !isalnum ((unsigned char) str[j + 3])
	  && str[j + 3] != '_')
	return i;
    }
  return -1;
}
14f9c5c9
AS
533
/* Returns non-zero iff string SUBSEQ matches a subsequence of STR, ignoring
   case.  An empty SUBSEQ matches any STR.

   Matching each character of SUBSEQ at its earliest possible position in
   STR is sufficient, so a single left-to-right pass decides the answer
   in time linear in the length of STR.  */

static int
subseqMatch (const char *subseq, const char *str)
{
  for (; *subseq != '\0'; str += 1)
    {
      if (*str == '\0')
	return 0;
      /* Cast for <ctype.h>: a plain char may be negative.  */
      if (tolower ((unsigned char) *subseq) == tolower ((unsigned char) *str))
	subseq += 1;
    }
  return 1;
}
14f9c5c9 549
4c4b4cd2
PH
550
551static struct { const char *name; int code; }
14f9c5c9
AS
552attributes[] = {
553 { "address", TICK_ADDRESS },
554 { "unchecked_access", TICK_ACCESS },
555 { "unrestricted_access", TICK_ACCESS },
556 { "access", TICK_ACCESS },
557 { "first", TICK_FIRST },
558 { "last", TICK_LAST },
559 { "length", TICK_LENGTH },
560 { "max", TICK_MAX },
561 { "min", TICK_MIN },
562 { "modulus", TICK_MODULUS },
563 { "pos", TICK_POS },
564 { "range", TICK_RANGE },
565 { "size", TICK_SIZE },
566 { "tag", TICK_TAG },
567 { "val", TICK_VAL },
568 { NULL, -1 }
569};
570
571/* Return the syntactic code corresponding to the attribute name or
572 abbreviation STR. */
573
574static int
4c4b4cd2 575processAttribute (const char *str)
14f9c5c9
AS
576{
577 int i, k;
578
579 for (i = 0; attributes[i].code != -1; i += 1)
580 if (strcasecmp (str, attributes[i].name) == 0)
581 return attributes[i].code;
582
583 for (i = 0, k = -1; attributes[i].code != -1; i += 1)
4c4b4cd2 584 if (subseqMatch (str, attributes[i].name))
14f9c5c9
AS
585 {
586 if (k == -1)
587 k = i;
4c4b4cd2 588 else
e1d5a0d2 589 error (_("ambiguous attribute name: `%s'"), str);
14f9c5c9
AS
590 }
591 if (k == -1)
e1d5a0d2 592 error (_("unrecognized attribute: `%s'"), str);
14f9c5c9
AS
593
594 return attributes[k].code;
595}
596
/* End-of-input hook for the generated scanner.  Always returns 1, which
   in flex means there is no further input to switch to.  */

int
yywrap (void)
{
  return 1;
}
23485554
PH
602
603/* Dummy definition to suppress warnings about unused static definitions. */
604typedef void (*dummy_function) ();
605dummy_function ada_flex_use[] =
606{
375c0479 607 (dummy_function) yyunput
23485554 608};
This page took 0.426865 seconds and 4 git commands to generate.