]> gcc.gnu.org Git - gcc.git/blame - gcc/c-lex.c
(yylex): Integer constant is unsigned for purposes of
[gcc.git] / gcc / c-lex.c
CommitLineData
d45cf215 1/* Lexical analyzer for C and Objective C.
e8bbfc4e
RK
2 Copyright (C) 1987, 1988, 1989, 1992 Free Software Foundation, Inc.
3
4This file is part of GNU CC.
5
6GNU CC is free software; you can redistribute it and/or modify
7it under the terms of the GNU General Public License as published by
8the Free Software Foundation; either version 2, or (at your option)
9any later version.
10
11GNU CC is distributed in the hope that it will be useful,
12but WITHOUT ANY WARRANTY; without even the implied warranty of
13MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14GNU General Public License for more details.
15
16You should have received a copy of the GNU General Public License
17along with GNU CC; see the file COPYING. If not, write to
18the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */
19
20
21#include <stdio.h>
22#include <errno.h>
23#include <setjmp.h>
24
25#include "config.h"
26#include "rtl.h"
27#include "tree.h"
28#include "input.h"
29#include "c-lex.h"
30#include "c-tree.h"
31#include "flags.h"
32#include "c-parse.h"
33
34#ifdef MULTIBYTE_CHARS
35#include <stdlib.h>
36#include <locale.h>
37#endif
38
39#ifndef errno
40extern int errno;
41#endif
42
43/* The elements of `ridpointers' are identifier nodes
44 for the reserved type names and storage classes.
45 It is indexed by a RID_... value. */
46tree ridpointers[(int) RID_MAX];
47
48/* Cause the `yydebug' variable to be defined. */
49#define YYDEBUG 1
50
51/* the declaration found for the last IDENTIFIER token read in.
52 yylex must look this up to detect typedefs, which get token type TYPENAME,
53 so it is left around in case the identifier is not a typedef but is
54 used in a context which makes it a reference to a variable. */
55tree lastiddecl;
56
57/* Nonzero enables objc features. */
58
59int doing_objc_thang;
60
61extern tree lookup_interface ();
62
63extern int yydebug;
64
65/* File used for outputting assembler code. */
66extern FILE *asm_out_file;
67
68#ifndef WCHAR_TYPE_SIZE
69#ifdef INT_TYPE_SIZE
70#define WCHAR_TYPE_SIZE INT_TYPE_SIZE
71#else
72#define WCHAR_TYPE_SIZE BITS_PER_WORD
73#endif
74#endif
75
76/* Number of bytes in a wide character. */
77#define WCHAR_BYTES (WCHAR_TYPE_SIZE / BITS_PER_UNIT)
78
79static int maxtoken; /* Current nominal length of token buffer. */
80char *token_buffer; /* Pointer to token buffer.
81 Actual allocated length is maxtoken + 2.
82 This is not static because objc-parse.y uses it. */
83
84/* Nonzero if end-of-file has been seen on input. */
85static int end_of_file;
86
87/* Buffered-back input character; faster than using ungetc. */
88static int nextchar = -1;
89
90int check_newline ();
91
92/* Nonzero tells yylex to ignore \ in string constants. */
93static int ignore_escape_flag = 0;
94\f
95/* C code produced by gperf version 2.5 (GNU C++ version) */
96/* Command-line: gperf -p -j1 -i 1 -g -o -t -N is_reserved_word -k1,3,$ c-parse.gperf */
97struct resword { char *name; short token; enum rid rid; };
98
99#define TOTAL_KEYWORDS 53
100#define MIN_WORD_LENGTH 2
101#define MAX_WORD_LENGTH 13
102#define MIN_HASH_VALUE 7
103#define MAX_HASH_VALUE 102
104/* maximum key range = 96, duplicates = 0 */
105
106#ifdef __GNUC__
107__inline
108#endif
109static unsigned int
110hash (str, len)
111 register char *str;
112 register int unsigned len;
113{
114 static unsigned char asso_values[] =
115 {
116 103, 103, 103, 103, 103, 103, 103, 103, 103, 103,
117 103, 103, 103, 103, 103, 103, 103, 103, 103, 103,
118 103, 103, 103, 103, 103, 103, 103, 103, 103, 103,
119 103, 103, 103, 103, 103, 103, 103, 103, 103, 103,
120 103, 103, 103, 103, 103, 103, 103, 103, 103, 103,
121 103, 103, 103, 103, 103, 103, 103, 103, 103, 103,
122 103, 103, 103, 103, 103, 103, 103, 103, 103, 103,
123 103, 103, 103, 103, 103, 103, 103, 103, 103, 103,
124 103, 103, 103, 103, 103, 103, 103, 103, 103, 103,
125 103, 103, 103, 103, 103, 1, 103, 2, 1, 24,
126 1, 5, 19, 39, 16, 13, 103, 1, 25, 1,
127 34, 34, 24, 103, 13, 12, 1, 45, 24, 7,
128 103, 103, 2, 103, 103, 103, 103, 103,
129 };
130 register int hval = len;
131
132 switch (hval)
133 {
134 default:
135 case 3:
136 hval += asso_values[str[2]];
137 case 2:
138 case 1:
139 hval += asso_values[str[0]];
140 }
141 return hval + asso_values[str[len - 1]];
142}
143
144#ifdef __GNUC__
145__inline
146#endif
147struct resword *
148is_reserved_word (str, len)
149 register char *str;
150 register unsigned int len;
151{
152 static struct resword wordlist[] =
153 {
154 {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",},
d45cf215 155 {"asm", ASM_KEYWORD, NORID},
e8bbfc4e 156 {"",},
d45cf215 157 {"__asm", ASM_KEYWORD, NORID},
e8bbfc4e 158 {"",},
d45cf215 159 {"__asm__", ASM_KEYWORD, NORID},
e8bbfc4e
RK
160 {"break", BREAK, NORID},
161 {"__typeof__", TYPEOF, NORID},
162 {"",},
163 {"__alignof__", ALIGNOF, NORID},
164 {"",},
165 {"__attribute__", ATTRIBUTE, NORID},
166 {"int", TYPESPEC, RID_INT},
167 {"__attribute", ATTRIBUTE, NORID},
168 {"__extension__", EXTENSION, NORID},
169 {"",},
170 {"__signed", TYPESPEC, RID_SIGNED},
171 {"",},
172 {"__signed__", TYPESPEC, RID_SIGNED},
173 {"__inline__", SCSPEC, RID_INLINE},
174 {"else", ELSE, NORID},
175 {"__inline", SCSPEC, RID_INLINE},
176 {"default", DEFAULT, NORID},
177 {"__typeof", TYPEOF, NORID},
178 {"while", WHILE, NORID},
179 {"__alignof", ALIGNOF, NORID},
180 {"struct", STRUCT, NORID},
181 {"__const", TYPE_QUAL, RID_CONST},
182 {"if", IF, NORID},
183 {"__const__", TYPE_QUAL, RID_CONST},
184 {"__label__", LABEL, NORID},
185 {"do", DO, NORID},
186 {"__volatile__", TYPE_QUAL, RID_VOLATILE},
187 {"sizeof", SIZEOF, NORID},
188 {"__volatile", TYPE_QUAL, RID_VOLATILE},
189 {"auto", SCSPEC, RID_AUTO},
190 {"void", TYPESPEC, RID_VOID},
191 {"char", TYPESPEC, RID_CHAR},
192 {"static", SCSPEC, RID_STATIC},
193 {"case", CASE, NORID},
194 {"extern", SCSPEC, RID_EXTERN},
195 {"switch", SWITCH, NORID},
196 {"for", FOR, NORID},
197 {"inline", SCSPEC, RID_INLINE},
198 {"typeof", TYPEOF, NORID},
199 {"typedef", SCSPEC, RID_TYPEDEF},
200 {"short", TYPESPEC, RID_SHORT},
201 {"",},
202 {"return", RETURN, NORID},
203 {"enum", ENUM, NORID},
204 {"",},
205 {"double", TYPESPEC, RID_DOUBLE},
206 {"signed", TYPESPEC, RID_SIGNED},
207 {"float", TYPESPEC, RID_FLOAT},
208 {"",}, {"",},
209 {"volatile", TYPE_QUAL, RID_VOLATILE},
210 {"",},
211 {"const", TYPE_QUAL, RID_CONST},
212 {"",},
213 {"unsigned", TYPESPEC, RID_UNSIGNED},
214 {"",}, {"",}, {"",}, {"",},
215 {"continue", CONTINUE, NORID},
216 {"",},
217 {"register", SCSPEC, RID_REGISTER},
218 {"",}, {"",}, {"",}, {"",},
219 {"goto", GOTO, NORID},
220 {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",},
221 {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",}, {"",},
222
223 {"union", UNION, NORID},
224 {"",}, {"",}, {"",}, {"",},
225 {"long", TYPESPEC, RID_LONG},
226 };
227
228 if (len <= MAX_WORD_LENGTH && len >= MIN_WORD_LENGTH)
229 {
230 register int key = hash (str, len);
231
232 if (key <= MAX_HASH_VALUE && key >= 0)
233 {
234 register char *s = wordlist[key].name;
235
236 if (*s == *str && !strcmp (str + 1, s + 1))
237 return &wordlist[key];
238 }
239 }
240 return 0;
241}
242\f
243/* Return something to represent absolute declarators containing a *.
244 TARGET is the absolute declarator that the * contains.
245 TYPE_QUALS is a list of modifiers such as const or volatile
246 to apply to the pointer type, represented as identifiers.
247
248 We return an INDIRECT_REF whose "contents" are TARGET
249 and whose type is the modifier list. */
250
251tree
252make_pointer_declarator (type_quals, target)
253 tree type_quals, target;
254{
255 return build1 (INDIRECT_REF, type_quals, target);
256}
257\f
258void
259init_lex ()
260{
261 /* Make identifier nodes long enough for the language-specific slots. */
262 set_identifier_size (sizeof (struct lang_identifier));
263
264 /* Start it at 0, because check_newline is called at the very beginning
265 and will increment it to 1. */
266 lineno = 0;
267
268#ifdef MULTIBYTE_CHARS
269 /* Change to the native locale for multibyte conversions. */
270 setlocale (LC_CTYPE, "");
271#endif
272
273 maxtoken = 40;
274 token_buffer = (char *) xmalloc (maxtoken + 2);
275
276 ridpointers[(int) RID_INT] = get_identifier ("int");
277 ridpointers[(int) RID_CHAR] = get_identifier ("char");
278 ridpointers[(int) RID_VOID] = get_identifier ("void");
279 ridpointers[(int) RID_FLOAT] = get_identifier ("float");
280 ridpointers[(int) RID_DOUBLE] = get_identifier ("double");
281 ridpointers[(int) RID_SHORT] = get_identifier ("short");
282 ridpointers[(int) RID_LONG] = get_identifier ("long");
283 ridpointers[(int) RID_UNSIGNED] = get_identifier ("unsigned");
284 ridpointers[(int) RID_SIGNED] = get_identifier ("signed");
285 ridpointers[(int) RID_INLINE] = get_identifier ("inline");
286 ridpointers[(int) RID_CONST] = get_identifier ("const");
287 ridpointers[(int) RID_VOLATILE] = get_identifier ("volatile");
288 ridpointers[(int) RID_AUTO] = get_identifier ("auto");
289 ridpointers[(int) RID_STATIC] = get_identifier ("static");
290 ridpointers[(int) RID_EXTERN] = get_identifier ("extern");
291 ridpointers[(int) RID_TYPEDEF] = get_identifier ("typedef");
292 ridpointers[(int) RID_REGISTER] = get_identifier ("register");
293
294 /* Some options inhibit certain reserved words.
295 Clear those words out of the hash table so they won't be recognized. */
296#define UNSET_RESERVED_WORD(STRING) \
297 do { struct resword *s = is_reserved_word (STRING, sizeof (STRING) - 1); \
298 if (s) s->name = ""; } while (0)
299
300 if (flag_traditional)
301 {
302 UNSET_RESERVED_WORD ("const");
303 UNSET_RESERVED_WORD ("volatile");
304 UNSET_RESERVED_WORD ("typeof");
305 UNSET_RESERVED_WORD ("signed");
306 UNSET_RESERVED_WORD ("inline");
307 }
308 if (flag_no_asm)
309 {
310 UNSET_RESERVED_WORD ("asm");
311 UNSET_RESERVED_WORD ("typeof");
312 UNSET_RESERVED_WORD ("inline");
313 }
314}
315
316void
317reinit_parse_for_function ()
318{
319}
320\f
321/* Function used when yydebug is set, to print a token in more detail. */
322
323void
324yyprint (file, yychar, yylval)
325 FILE *file;
326 int yychar;
327 YYSTYPE yylval;
328{
329 tree t;
330 switch (yychar)
331 {
332 case IDENTIFIER:
333 case TYPENAME:
334 t = yylval.ttype;
335 if (IDENTIFIER_POINTER (t))
336 fprintf (file, " `%s'", IDENTIFIER_POINTER (t));
337 break;
338
339 case CONSTANT:
340 t = yylval.ttype;
341 if (TREE_CODE (t) == INTEGER_CST)
8d9bfdc5
RK
342 fprintf (file,
343#if HOST_BITS_PER_WIDE_INT == 64
344#if HOST_BITS_PER_WIDE_INT != HOST_BITS_PER_INT
345 " 0x%lx%016lx",
346#else
347 " 0x%x%016x",
348#endif
349#else
350#if HOST_BITS_PER_WIDE_INT != HOST_BITS_PER_INT
351 " 0x%lx%08lx",
352#else
353 " 0x%x%08x",
354#endif
355#endif
356 TREE_INT_CST_HIGH (t), TREE_INT_CST_LOW (t));
e8bbfc4e
RK
357 break;
358 }
359}
360
361\f
362/* If C is not whitespace, return C.
363 Otherwise skip whitespace and return first nonwhite char read. */
364
365static int
366skip_white_space (c)
367 register int c;
368{
0dcd8cee 369 static int newline_warning = 0;
e8bbfc4e
RK
370
371 for (;;)
372 {
373 switch (c)
374 {
0dcd8cee
RS
375 /* We don't recognize comments here, because
376 cpp output can include / and * consecutively as operators.
377 Also, there's no need, since cpp removes all comments. */
e8bbfc4e
RK
378
379 case '\n':
380 c = check_newline ();
381 break;
382
383 case ' ':
384 case '\t':
385 case '\f':
e8bbfc4e
RK
386 case '\v':
387 case '\b':
388 c = getc (finput);
389 break;
390
0dcd8cee
RS
391 case '\r':
392 /* ANSI C says the effects of a carriage return in a source file
393 are undefined. */
394 if (pedantic && !newline_warning)
395 {
396 warning ("carriage return in source file");
397 warning ("(we only warn about the first carriage return)");
398 newline_warning = 1;
399 }
400 c = getc (finput);
401 break;
402
e8bbfc4e
RK
403 case '\\':
404 c = getc (finput);
405 if (c == '\n')
406 lineno++;
407 else
408 error ("stray '\\' in program");
409 c = getc (finput);
410 break;
411
412 default:
413 return (c);
414 }
415 }
416}
417
418/* Skips all of the white space at the current location in the input file.
419 Must use and reset nextchar if it has the next character. */
420
421void
422position_after_white_space ()
423{
424 register int c;
425
426 if (nextchar != -1)
427 c = nextchar, nextchar = -1;
428 else
429 c = getc (finput);
430
431 ungetc (skip_white_space (c), finput);
432}
433
434/* Make the token buffer longer, preserving the data in it.
435 P should point to just beyond the last valid character in the old buffer.
436 The value we return is a pointer to the new buffer
437 at a place corresponding to P. */
438
439static char *
440extend_token_buffer (p)
441 char *p;
442{
443 int offset = p - token_buffer;
444
445 maxtoken = maxtoken * 2 + 10;
446 token_buffer = (char *) xrealloc (token_buffer, maxtoken + 2);
447
448 return token_buffer + offset;
449}
450\f
451/* At the beginning of a line, increment the line number
452 and process any #-directive on this line.
453 If the line is a #-directive, read the entire line and return a newline.
454 Otherwise, return the line's first non-whitespace character. */
455
456int
457check_newline ()
458{
459 register int c;
460 register int token;
461
462 lineno++;
463
464 /* Read first nonwhite char on the line. */
465
466 c = getc (finput);
467 while (c == ' ' || c == '\t')
468 c = getc (finput);
469
470 if (c != '#')
471 {
472 /* If not #, return it so caller will use it. */
473 return c;
474 }
475
476 /* Read first nonwhite char after the `#'. */
477
478 c = getc (finput);
479 while (c == ' ' || c == '\t')
480 c = getc (finput);
481
482 /* If a letter follows, then if the word here is `line', skip
483 it and ignore it; otherwise, ignore the line, with an error
484 if the word isn't `pragma', `ident', `define', or `undef'. */
485
486 if ((c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z'))
487 {
488 if (c == 'p')
489 {
490 if (getc (finput) == 'r'
491 && getc (finput) == 'a'
492 && getc (finput) == 'g'
493 && getc (finput) == 'm'
494 && getc (finput) == 'a'
495 && ((c = getc (finput)) == ' ' || c == '\t' || c == '\n'))
496 {
ca5b800a 497#ifdef HANDLE_SYSV_PRAGMA
a3100298 498 return handle_sysv_pragma (finput, c);
ca5b800a 499#endif /* HANDLE_SYSV_PRAGMA */
e8bbfc4e
RK
500#ifdef HANDLE_PRAGMA
501 HANDLE_PRAGMA (finput);
502#endif /* HANDLE_PRAGMA */
503 goto skipline;
504 }
505 }
506
507 else if (c == 'd')
508 {
509 if (getc (finput) == 'e'
510 && getc (finput) == 'f'
511 && getc (finput) == 'i'
512 && getc (finput) == 'n'
513 && getc (finput) == 'e'
514 && ((c = getc (finput)) == ' ' || c == '\t' || c == '\n'))
515 {
516#ifdef DWARF_DEBUGGING_INFO
517 if ((debug_info_level == DINFO_LEVEL_VERBOSE)
518 && (write_symbols == DWARF_DEBUG))
519 dwarfout_define (lineno, get_directive_line (finput));
520#endif /* DWARF_DEBUGGING_INFO */
521 goto skipline;
522 }
523 }
524 else if (c == 'u')
525 {
526 if (getc (finput) == 'n'
527 && getc (finput) == 'd'
528 && getc (finput) == 'e'
529 && getc (finput) == 'f'
530 && ((c = getc (finput)) == ' ' || c == '\t' || c == '\n'))
531 {
532#ifdef DWARF_DEBUGGING_INFO
533 if ((debug_info_level == DINFO_LEVEL_VERBOSE)
534 && (write_symbols == DWARF_DEBUG))
535 dwarfout_undef (lineno, get_directive_line (finput));
536#endif /* DWARF_DEBUGGING_INFO */
537 goto skipline;
538 }
539 }
540 else if (c == 'l')
541 {
542 if (getc (finput) == 'i'
543 && getc (finput) == 'n'
544 && getc (finput) == 'e'
545 && ((c = getc (finput)) == ' ' || c == '\t'))
546 goto linenum;
547 }
548 else if (c == 'i')
549 {
550 if (getc (finput) == 'd'
551 && getc (finput) == 'e'
552 && getc (finput) == 'n'
553 && getc (finput) == 't'
554 && ((c = getc (finput)) == ' ' || c == '\t'))
555 {
556 /* #ident. The pedantic warning is now in cccp.c. */
557
558 /* Here we have just seen `#ident '.
559 A string constant should follow. */
560
561 while (c == ' ' || c == '\t')
562 c = getc (finput);
563
564 /* If no argument, ignore the line. */
565 if (c == '\n')
566 return c;
567
568 ungetc (c, finput);
569 token = yylex ();
570 if (token != STRING
571 || TREE_CODE (yylval.ttype) != STRING_CST)
572 {
573 error ("invalid #ident");
574 goto skipline;
575 }
576
577 if (!flag_no_ident)
578 {
579#ifdef ASM_OUTPUT_IDENT
580 ASM_OUTPUT_IDENT (asm_out_file, TREE_STRING_POINTER (yylval.ttype));
581#endif
582 }
583
584 /* Skip the rest of this line. */
585 goto skipline;
586 }
587 }
588
589 error ("undefined or invalid # directive");
590 goto skipline;
591 }
592
593linenum:
594 /* Here we have either `#line' or `# <nonletter>'.
595 In either case, it should be a line number; a digit should follow. */
596
597 while (c == ' ' || c == '\t')
598 c = getc (finput);
599
600 /* If the # is the only nonwhite char on the line,
601 just ignore it. Check the new newline. */
602 if (c == '\n')
603 return c;
604
605 /* Something follows the #; read a token. */
606
607 ungetc (c, finput);
608 token = yylex ();
609
610 if (token == CONSTANT
611 && TREE_CODE (yylval.ttype) == INTEGER_CST)
612 {
613 int old_lineno = lineno;
614 int used_up = 0;
615 /* subtract one, because it is the following line that
616 gets the specified number */
617
618 int l = TREE_INT_CST_LOW (yylval.ttype) - 1;
619
620 /* Is this the last nonwhite stuff on the line? */
621 c = getc (finput);
622 while (c == ' ' || c == '\t')
623 c = getc (finput);
624 if (c == '\n')
625 {
626 /* No more: store the line number and check following line. */
627 lineno = l;
628 return c;
629 }
630 ungetc (c, finput);
631
632 /* More follows: it must be a string constant (filename). */
633
634 /* Read the string constant, but don't treat \ as special. */
635 ignore_escape_flag = 1;
636 token = yylex ();
637 ignore_escape_flag = 0;
638
639 if (token != STRING || TREE_CODE (yylval.ttype) != STRING_CST)
640 {
641 error ("invalid #line");
642 goto skipline;
643 }
644
645 input_filename
646 = (char *) permalloc (TREE_STRING_LENGTH (yylval.ttype) + 1);
647 strcpy (input_filename, TREE_STRING_POINTER (yylval.ttype));
648 lineno = l;
649
650 /* Each change of file name
651 reinitializes whether we are now in a system header. */
652 in_system_header = 0;
653
654 if (main_input_filename == 0)
655 main_input_filename = input_filename;
656
657 /* Is this the last nonwhite stuff on the line? */
658 c = getc (finput);
659 while (c == ' ' || c == '\t')
660 c = getc (finput);
661 if (c == '\n')
662 return c;
663 ungetc (c, finput);
664
665 token = yylex ();
666 used_up = 0;
667
668 /* `1' after file name means entering new file.
669 `2' after file name means just left a file. */
670
671 if (token == CONSTANT
672 && TREE_CODE (yylval.ttype) == INTEGER_CST)
673 {
674 if (TREE_INT_CST_LOW (yylval.ttype) == 1)
675 {
676 /* Pushing to a new file. */
677 struct file_stack *p
678 = (struct file_stack *) xmalloc (sizeof (struct file_stack));
679 input_file_stack->line = old_lineno;
680 p->next = input_file_stack;
681 p->name = input_filename;
682 input_file_stack = p;
683 input_file_stack_tick++;
684#ifdef DWARF_DEBUGGING_INFO
685 if (debug_info_level == DINFO_LEVEL_VERBOSE
686 && write_symbols == DWARF_DEBUG)
687 dwarfout_start_new_source_file (input_filename);
688#endif /* DWARF_DEBUGGING_INFO */
689
690 used_up = 1;
691 }
692 else if (TREE_INT_CST_LOW (yylval.ttype) == 2)
693 {
694 /* Popping out of a file. */
695 if (input_file_stack->next)
696 {
697 struct file_stack *p = input_file_stack;
698 input_file_stack = p->next;
699 free (p);
700 input_file_stack_tick++;
701#ifdef DWARF_DEBUGGING_INFO
702 if (debug_info_level == DINFO_LEVEL_VERBOSE
703 && write_symbols == DWARF_DEBUG)
704 dwarfout_resume_previous_source_file (input_file_stack->line);
705#endif /* DWARF_DEBUGGING_INFO */
706 }
707 else
708 error ("#-lines for entering and leaving files don't match");
709
710 used_up = 1;
711 }
712 }
713
714 /* If we have handled a `1' or a `2',
715 see if there is another number to read. */
716 if (used_up)
717 {
718 /* Is this the last nonwhite stuff on the line? */
719 c = getc (finput);
720 while (c == ' ' || c == '\t')
721 c = getc (finput);
722 if (c == '\n')
723 return c;
724 ungetc (c, finput);
725
726 token = yylex ();
727 used_up = 0;
728 }
729
730 /* `3' after file name means this is a system header file. */
731
732 if (token == CONSTANT
733 && TREE_CODE (yylval.ttype) == INTEGER_CST
734 && TREE_INT_CST_LOW (yylval.ttype) == 3)
735 in_system_header = 1;
736 }
737 else
738 error ("invalid #-line");
739
740 /* skip the rest of this line. */
741 skipline:
742 if (c == '\n')
743 return c;
744 while ((c = getc (finput)) != EOF && c != '\n');
745 return c;
746}
747\f
ca5b800a
RS
748#ifdef HANDLE_SYSV_PRAGMA
749
750/* Handle a #pragma directive. INPUT is the current input stream,
a3100298
TW
751 and C is a character to reread. Processes the entire input line
752 and returns a character for the caller to reread: either \n or EOF. */
ca5b800a
RS
753
754/* This function has to be in this file, in order to get at
755 the token types. */
756
757int
758handle_sysv_pragma (input, c)
759 FILE *input;
760 int c;
761{
a3100298 762 for (;;)
ca5b800a 763 {
a3100298
TW
764 while (c == ' ' || c == '\t')
765 c = getc (input);
766 if (c == '\n' || c == EOF)
767 {
768 handle_pragma_token (0, 0);
769 return c;
770 }
771 ungetc (c, input);
772 switch (yylex ())
773 {
774 case IDENTIFIER:
775 case TYPENAME:
776 case STRING:
777 case CONSTANT:
778 handle_pragma_token (token_buffer, yylval.ttype);
779 break;
780 default:
781 handle_pragma_token (token_buffer, 0);
782 }
783 if (nextchar >= 0)
784 c = nextchar, nextchar = -1;
785 else
786 c = getc (input);
ca5b800a 787 }
ca5b800a
RS
788}
789
790#endif /* HANDLE_SYSV_PRAGMA */
791\f
e8bbfc4e
RK
792#define isalnum(char) ((char >= 'a' && char <= 'z') || (char >= 'A' && char <= 'Z') || (char >= '0' && char <= '9'))
793#define isdigit(char) (char >= '0' && char <= '9')
794#define ENDFILE -1 /* token that represents end-of-file */
795
796/* Read an escape sequence, returning its equivalent as a character,
797 or -1 if it is backslash-newline. */
798
799static int
800readescape ()
801{
802 register int c = getc (finput);
803 register int code;
804 register unsigned count;
805 unsigned firstdig;
8696da34 806 int nonnull;
e8bbfc4e
RK
807
808 switch (c)
809 {
810 case 'x':
811 if (warn_traditional)
812 warning ("the meaning of `\\x' varies with -traditional");
813
814 if (flag_traditional)
815 return c;
816
817 code = 0;
818 count = 0;
8696da34 819 nonnull = 0;
e8bbfc4e
RK
820 while (1)
821 {
822 c = getc (finput);
823 if (!(c >= 'a' && c <= 'f')
824 && !(c >= 'A' && c <= 'F')
825 && !(c >= '0' && c <= '9'))
826 {
827 ungetc (c, finput);
828 break;
829 }
830 code *= 16;
831 if (c >= 'a' && c <= 'f')
832 code += c - 'a' + 10;
833 if (c >= 'A' && c <= 'F')
834 code += c - 'A' + 10;
835 if (c >= '0' && c <= '9')
836 code += c - '0';
8696da34
RS
837 if (code != 0 || count != 0)
838 {
839 if (count == 0)
840 firstdig = code;
841 count++;
842 }
843 nonnull = 1;
e8bbfc4e 844 }
8696da34 845 if (! nonnull)
e8bbfc4e
RK
846 error ("\\x used with no following hex digits");
847 else if ((count - 1) * 4 >= TYPE_PRECISION (integer_type_node)
848 || (count > 1
849 && ((1 << (TYPE_PRECISION (integer_type_node) - (count - 1) * 4))
850 <= firstdig)))
851 pedwarn ("hex escape out of range");
852 return code;
853
854 case '0': case '1': case '2': case '3': case '4':
855 case '5': case '6': case '7':
856 code = 0;
857 count = 0;
858 while ((c <= '7') && (c >= '0') && (count++ < 3))
859 {
860 code = (code * 8) + (c - '0');
861 c = getc (finput);
862 }
863 ungetc (c, finput);
864 return code;
865
866 case '\\': case '\'': case '"':
867 return c;
868
869 case '\n':
870 lineno++;
871 return -1;
872
873 case 'n':
874 return TARGET_NEWLINE;
875
876 case 't':
877 return TARGET_TAB;
878
879 case 'r':
880 return TARGET_CR;
881
882 case 'f':
883 return TARGET_FF;
884
885 case 'b':
886 return TARGET_BS;
887
888 case 'a':
889 if (warn_traditional)
890 warning ("the meaning of `\\a' varies with -traditional");
891
892 if (flag_traditional)
893 return c;
894 return TARGET_BELL;
895
896 case 'v':
897#if 0 /* Vertical tab is present in common usage compilers. */
898 if (flag_traditional)
899 return c;
900#endif
901 return TARGET_VT;
902
903 case 'E':
904 pedwarn ("non-ANSI-standard escape sequence, `\\E'");
905 return 033;
906
907 case '?':
908 return c;
909
910 /* `\(', etc, are used at beginning of line to avoid confusing Emacs. */
911 case '(':
912 case '{':
913 case '[':
914 if (pedantic)
915 pedwarn ("non-ANSI escape sequence `\\%c'", c);
916 return c;
917 }
7e6b19dc 918 if (c >= 040 && c < 0177)
e8bbfc4e
RK
919 pedwarn ("unknown escape sequence `\\%c'", c);
920 else
921 pedwarn ("unknown escape sequence: `\\' followed by char code 0x%x", c);
922 return c;
923}
924\f
925void
926yyerror (string)
927 char *string;
928{
929 char buf[200];
930
931 strcpy (buf, string);
932
933 /* We can't print string and character constants well
934 because the token_buffer contains the result of processing escapes. */
935 if (end_of_file)
936 strcat (buf, " at end of input");
937 else if (token_buffer[0] == 0)
938 strcat (buf, " at null character");
939 else if (token_buffer[0] == '"')
940 strcat (buf, " before string constant");
941 else if (token_buffer[0] == '\'')
942 strcat (buf, " before character constant");
943 else if (token_buffer[0] < 040 || (unsigned char) token_buffer[0] >= 0177)
944 sprintf (buf + strlen (buf), " before character 0%o",
945 (unsigned char) token_buffer[0]);
946 else
947 strcat (buf, " before `%s'");
948
949 error (buf, token_buffer);
950}
951
952#if 0
953
954struct try_type
955{
956 tree *node_var;
957 char unsigned_flag;
958 char long_flag;
959 char long_long_flag;
960};
961
962struct try_type type_sequence[] =
963{
964 { &integer_type_node, 0, 0, 0},
965 { &unsigned_type_node, 1, 0, 0},
966 { &long_integer_type_node, 0, 1, 0},
967 { &long_unsigned_type_node, 1, 1, 0},
968 { &long_long_integer_type_node, 0, 1, 1},
969 { &long_long_unsigned_type_node, 1, 1, 1}
970};
971#endif /* 0 */
972\f
973int
974yylex ()
975{
976 register int c;
977 register char *p;
978 register int value;
979 int wide_flag = 0;
980
981 if (nextchar >= 0)
982 c = nextchar, nextchar = -1;
983 else
984 c = getc (finput);
985
986 /* Effectively do c = skip_white_space (c)
987 but do it faster in the usual cases. */
988 while (1)
989 switch (c)
990 {
e8bbfc4e
RK
991 case ' ':
992 case '\t':
993 case '\f':
994 case '\v':
995 case '\b':
996 c = getc (finput);
997 break;
998
80f5b9d8
RS
999 case '\r':
1000 /* Call skip_white_space so we can warn if appropriate. */
1001
e8bbfc4e
RK
1002 case '\n':
1003 case '/':
1004 case '\\':
1005 c = skip_white_space (c);
1006 default:
1007 goto found_nonwhite;
1008 }
1009 found_nonwhite:
1010
1011 token_buffer[0] = c;
1012 token_buffer[1] = 0;
1013
1014/* yylloc.first_line = lineno; */
1015
1016 switch (c)
1017 {
1018 case EOF:
1019 end_of_file = 1;
1020 token_buffer[0] = 0;
1021 value = ENDFILE;
1022 break;
1023
1024 case '$':
1025 if (dollars_in_ident)
1026 goto letter;
1027 return '$';
1028
1029 case 'L':
1030 /* Capital L may start a wide-string or wide-character constant. */
1031 {
1032 register int c = getc (finput);
1033 if (c == '\'')
1034 {
1035 wide_flag = 1;
1036 goto char_constant;
1037 }
1038 if (c == '"')
1039 {
1040 wide_flag = 1;
1041 goto string_constant;
1042 }
1043 ungetc (c, finput);
1044 }
1045 goto letter;
1046
1047 case '@':
1048 if (!doing_objc_thang)
1049 {
1050 value = c;
1051 break;
1052 }
1053 p = token_buffer;
1054 *p++ = '@';
1055 c = getc (finput);
1056 while (isalnum (c) || c == '_')
1057 {
1058 if (p >= token_buffer + maxtoken)
1059 p = extend_token_buffer (p);
1060
1061 *p++ = c;
1062 c = getc (finput);
1063 }
1064
1065 *p = 0;
1066 nextchar = c;
1067 value = recognize_objc_keyword (token_buffer + 1);
1068 if (value != 0)
1069 break;
1070 error ("invalid Objective C keyword `%s'", token_buffer);
1071 /* Cause a syntax error--1 is not a valid token type. */
1072 value = 1;
1073 break;
1074
1075 case 'A': case 'B': case 'C': case 'D': case 'E':
1076 case 'F': case 'G': case 'H': case 'I': case 'J':
1077 case 'K': case 'M': case 'N': case 'O':
1078 case 'P': case 'Q': case 'R': case 'S': case 'T':
1079 case 'U': case 'V': case 'W': case 'X': case 'Y':
1080 case 'Z':
1081 case 'a': case 'b': case 'c': case 'd': case 'e':
1082 case 'f': case 'g': case 'h': case 'i': case 'j':
1083 case 'k': case 'l': case 'm': case 'n': case 'o':
1084 case 'p': case 'q': case 'r': case 's': case 't':
1085 case 'u': case 'v': case 'w': case 'x': case 'y':
1086 case 'z':
1087 case '_':
1088 letter:
1089 p = token_buffer;
1090 while (isalnum (c) || c == '_' || c == '$' || c == '@')
1091 {
1092 if (p >= token_buffer + maxtoken)
1093 p = extend_token_buffer (p);
1094 if (c == '$' && ! dollars_in_ident)
1095 break;
1096
1097 *p++ = c;
1098 c = getc (finput);
1099 }
1100
1101 *p = 0;
1102 nextchar = c;
1103
1104 value = IDENTIFIER;
1105 yylval.itype = 0;
1106
1107 /* Try to recognize a keyword. Uses minimum-perfect hash function */
1108
1109 {
1110 register struct resword *ptr;
1111
1112 if (ptr = is_reserved_word (token_buffer, p - token_buffer))
1113 {
1114 if (ptr->rid)
1115 yylval.ttype = ridpointers[(int) ptr->rid];
1116 value = (int) ptr->token;
1117
1118 /* Even if we decided to recognize asm, still perhaps warn. */
1119 if (pedantic
d45cf215 1120 && (value == ASM_KEYWORD || value == TYPEOF
e8bbfc4e
RK
1121 || ptr->rid == RID_INLINE)
1122 && token_buffer[0] != '_')
1123 pedwarn ("ANSI does not permit the keyword `%s'",
1124 token_buffer);
1125 }
1126 }
1127
1128 /* If we did not find a keyword, look for an identifier
1129 (or a typename). */
1130
1131 if (value == IDENTIFIER)
1132 {
1133 yylval.ttype = get_identifier (token_buffer);
1134 lastiddecl = lookup_name (yylval.ttype);
1135
1136 if (lastiddecl != 0 && TREE_CODE (lastiddecl) == TYPE_DECL)
1137 value = TYPENAME;
6dbf678a
RS
1138 /* A user-invisible read-only initialized variable
1139 should be replaced by its value.
1140 We handle only strings since that's the only case used in C. */
1141 else if (lastiddecl != 0 && TREE_CODE (lastiddecl) == VAR_DECL
1142 && DECL_IGNORED_P (lastiddecl)
1143 && TREE_READONLY (lastiddecl)
1144 && DECL_INITIAL (lastiddecl) != 0
1145 && TREE_CODE (DECL_INITIAL (lastiddecl)) == STRING_CST)
1146 {
1147 yylval.ttype = DECL_INITIAL (lastiddecl);
1148 value = STRING;
1149 }
e8bbfc4e
RK
1150 else if (doing_objc_thang)
1151 {
1152 tree objc_interface_decl = lookup_interface (yylval.ttype);
1153
1154 if (objc_interface_decl)
1155 {
1156 value = CLASSNAME;
1157 yylval.ttype = objc_interface_decl;
1158 }
1159 }
1160 }
1161
1162 break;
1163
1164 case '0': case '1': case '2': case '3': case '4':
1165 case '5': case '6': case '7': case '8': case '9':
1166 case '.':
1167 {
1168 int base = 10;
1169 int count = 0;
1170 int largest_digit = 0;
1171 int numdigits = 0;
1172 /* for multi-precision arithmetic,
4ca827d0
RS
1173 we actually store only HOST_BITS_PER_CHAR bits in each part.
1174 The number of parts is chosen so as to be sufficient to hold
9b0995aa
RK
1175 the enough bits to fit into the two HOST_WIDE_INTs that contain
1176 the integer value (this is always at least as many bits as are
1177 in a target `long long' value, but may be wider). */
1178#define TOTAL_PARTS ((HOST_BITS_PER_WIDE_INT / HOST_BITS_PER_CHAR) * 2 + 2)
4ca827d0 1179 int parts[TOTAL_PARTS];
e8bbfc4e
RK
1180 int overflow = 0;
1181
1182 enum anon1 { NOT_FLOAT, AFTER_POINT, TOO_MANY_POINTS} floatflag
1183 = NOT_FLOAT;
1184
4ca827d0
RS
1185 for (count = 0; count < TOTAL_PARTS; count++)
1186 parts[count] = 0;
e8bbfc4e
RK
1187
1188 p = token_buffer;
1189 *p++ = c;
1190
1191 if (c == '0')
1192 {
1193 *p++ = (c = getc (finput));
1194 if ((c == 'x') || (c == 'X'))
1195 {
1196 base = 16;
1197 *p++ = (c = getc (finput));
1198 }
1199 /* Leading 0 forces octal unless the 0 is the only digit. */
1200 else if (c >= '0' && c <= '9')
1201 {
1202 base = 8;
1203 numdigits++;
1204 }
1205 else
1206 numdigits++;
1207 }
1208
1209 /* Read all the digits-and-decimal-points. */
1210
1211 while (c == '.'
1212 || (isalnum (c) && (c != 'l') && (c != 'L')
1213 && (c != 'u') && (c != 'U')
1214 && (floatflag == NOT_FLOAT || ((c != 'f') && (c != 'F')))))
1215 {
1216 if (c == '.')
1217 {
1218 if (base == 16)
1219 error ("floating constant may not be in radix 16");
1220 if (floatflag == AFTER_POINT)
1221 {
1222 error ("malformed floating constant");
1223 floatflag = TOO_MANY_POINTS;
1224 }
1225 else
1226 floatflag = AFTER_POINT;
1227
1228 base = 10;
1229 *p++ = c = getc (finput);
1230 /* Accept '.' as the start of a floating-point number
1231 only when it is followed by a digit.
1232 Otherwise, unread the following non-digit
1233 and use the '.' as a structural token. */
1234 if (p == token_buffer + 2 && !isdigit (c))
1235 {
1236 if (c == '.')
1237 {
1238 c = getc (finput);
1239 if (c == '.')
1240 {
1241 *p++ = c;
1242 *p = 0;
1243 return ELLIPSIS;
1244 }
1245 error ("parse error at `..'");
1246 }
1247 ungetc (c, finput);
1248 token_buffer[1] = 0;
1249 value = '.';
1250 goto done;
1251 }
1252 }
1253 else
1254 {
1255 /* It is not a decimal point.
1256 It should be a digit (perhaps a hex digit). */
1257
1258 if (isdigit (c))
1259 {
1260 c = c - '0';
1261 }
1262 else if (base <= 10)
1263 {
1264 if ((c&~040) == 'E')
1265 {
1266 base = 10;
1267 floatflag = AFTER_POINT;
1268 break; /* start of exponent */
1269 }
1270 error ("nondigits in number and not hexadecimal");
1271 c = 0;
1272 }
1273 else if (c >= 'a')
1274 {
1275 c = c - 'a' + 10;
1276 }
1277 else
1278 {
1279 c = c - 'A' + 10;
1280 }
1281 if (c >= largest_digit)
1282 largest_digit = c;
1283 numdigits++;
1284
4ca827d0 1285 for (count = 0; count < TOTAL_PARTS; count++)
e8bbfc4e 1286 {
4ca827d0 1287 parts[count] *= base;
e8bbfc4e
RK
1288 if (count)
1289 {
4ca827d0
RS
1290 parts[count]
1291 += (parts[count-1] >> HOST_BITS_PER_CHAR);
1292 parts[count-1]
1293 &= (1 << HOST_BITS_PER_CHAR) - 1;
e8bbfc4e 1294 }
4ca827d0
RS
1295 else
1296 parts[0] += c;
e8bbfc4e
RK
1297 }
1298
4ca827d0
RS
1299 /* If the extra highest-order part ever gets anything in it,
1300 the number is certainly too big. */
1301 if (parts[TOTAL_PARTS - 1] != 0)
1302 overflow = 1;
e8bbfc4e
RK
1303
1304 if (p >= token_buffer + maxtoken - 3)
1305 p = extend_token_buffer (p);
1306 *p++ = (c = getc (finput));
1307 }
1308 }
1309
1310 if (numdigits == 0)
1311 error ("numeric constant with no digits");
1312
1313 if (largest_digit >= base)
1314 error ("numeric constant contains digits beyond the radix");
1315
1316 /* Remove terminating char from the token buffer and delimit the string */
1317 *--p = 0;
1318
1319 if (floatflag != NOT_FLOAT)
1320 {
1321 tree type = double_type_node;
63ea33ce 1322 int garbage_chars = 0, exceeds_double = 0;
e8bbfc4e
RK
1323 REAL_VALUE_TYPE value;
1324 jmp_buf handler;
1325
1326 /* Read explicit exponent if any, and put it in tokenbuf. */
1327
1328 if ((c == 'e') || (c == 'E'))
1329 {
1330 if (p >= token_buffer + maxtoken - 3)
1331 p = extend_token_buffer (p);
1332 *p++ = c;
1333 c = getc (finput);
1334 if ((c == '+') || (c == '-'))
1335 {
1336 *p++ = c;
1337 c = getc (finput);
1338 }
1339 if (! isdigit (c))
1340 error ("floating constant exponent has no digits");
1341 while (isdigit (c))
1342 {
1343 if (p >= token_buffer + maxtoken - 3)
1344 p = extend_token_buffer (p);
1345 *p++ = c;
1346 c = getc (finput);
1347 }
1348 }
1349
1350 *p = 0;
1351 errno = 0;
1352
1353 /* Convert string to a double, checking for overflow. */
1354 if (setjmp (handler))
1355 {
1356 error ("floating constant out of range");
1357 value = dconst0;
1358 }
1359 else
1360 {
1361 set_float_handler (handler);
1362 value = REAL_VALUE_ATOF (token_buffer);
8d9bfdc5 1363 set_float_handler (NULL_PTR);
e8bbfc4e
RK
1364 }
1365#ifdef ERANGE
e53c841d 1366 if (errno == ERANGE && !flag_traditional && pedantic)
e8bbfc4e
RK
1367 {
1368 char *p1 = token_buffer;
1369 /* Check for "0.0" and variants;
7b6327ae 1370 SunOS 4 spuriously returns ERANGE for them. */
e8bbfc4e
RK
1371 while (*p1 == '0') p1++;
1372 if (*p1 == '.')
1373 {
1374 p1++;
1375 while (*p1 == '0') p1++;
1376 }
1377 if (*p1 == 'e' || *p1 == 'E')
1378 {
1379 /* with significand==0, ignore the exponent */
1380 p1++;
1381 while (*p1 != 0) p1++;
1382 }
1383 /* ERANGE is also reported for underflow,
1384 so test the value to distinguish overflow from that. */
1385 if (*p1 != 0 && (value > 1.0 || value < -1.0))
63ea33ce
RS
1386 {
1387 pedwarn ("floating point number exceeds range of `double'");
1388 exceeds_double = 1;
1389 }
e8bbfc4e
RK
1390 }
1391#endif
1392
1393 /* Read the suffixes to choose a data type. */
63ea33ce
RS
1394 switch (c)
1395 {
1396 case 'f': case 'F':
1397 type = float_type_node;
1398 value = REAL_VALUE_TRUNCATE (TYPE_MODE (type), value);
1399 if (REAL_VALUE_ISINF (value) && ! exceeds_double && pedantic)
1400 pedwarn ("floating point number exceeds range of `float'");
1401 garbage_chars = -1;
1402 break;
1403
1404 case 'l': case 'L':
1405 type = long_double_type_node;
1406 garbage_chars = -1;
1407 break;
1408 }
1409 /* Note: garbage_chars is -1 if first char is *not* garbage. */
1410 while (isalnum (c))
e8bbfc4e 1411 {
e8bbfc4e
RK
1412 if (p >= token_buffer + maxtoken - 3)
1413 p = extend_token_buffer (p);
1414 *p++ = c;
1415 c = getc (finput);
63ea33ce 1416 garbage_chars++;
e8bbfc4e 1417 }
63ea33ce
RS
1418 if (garbage_chars > 0)
1419 error ("garbage at end of number");
e8bbfc4e
RK
1420
1421 /* Create a node with determined type and value. */
1422 yylval.ttype = build_real (type, value);
1423
1424 ungetc (c, finput);
1425 *p = 0;
1426 }
1427 else
1428 {
1429 tree traditional_type, ansi_type, type;
8d9bfdc5 1430 HOST_WIDE_INT high, low;
e8bbfc4e
RK
1431 int spec_unsigned = 0;
1432 int spec_long = 0;
1433 int spec_long_long = 0;
1434 int bytes, warn, i;
1435
1436 while (1)
1437 {
1438 if (c == 'u' || c == 'U')
1439 {
1440 if (spec_unsigned)
1441 error ("two `u's in integer constant");
1442 spec_unsigned = 1;
1443 }
1444 else if (c == 'l' || c == 'L')
1445 {
1446 if (spec_long)
1447 {
1448 if (spec_long_long)
1449 error ("three `l's in integer constant");
1450 else if (pedantic)
1451 pedwarn ("ANSI C forbids long long integer constants");
1452 spec_long_long = 1;
1453 }
1454 spec_long = 1;
1455 }
1456 else
1457 {
1458 if (isalnum (c))
1459 {
1460 error ("garbage at end of number");
1461 while (isalnum (c))
1462 {
1463 if (p >= token_buffer + maxtoken - 3)
1464 p = extend_token_buffer (p);
1465 *p++ = c;
1466 c = getc (finput);
1467 }
1468 }
1469 break;
1470 }
1471 if (p >= token_buffer + maxtoken - 3)
1472 p = extend_token_buffer (p);
1473 *p++ = c;
1474 c = getc (finput);
1475 }
1476
1477 ungetc (c, finput);
1478
1479 /* If the constant is not long long and it won't fit in an
1480 unsigned long, or if the constant is long long and won't fit
1481 in an unsigned long long, then warn that the constant is out
1482 of range. */
1483
1484 /* ??? This assumes that long long and long integer types are
1485 a multiple of 8 bits. This better than the original code
1486 though which assumed that long was exactly 32 bits and long
1487 long was exactly 64 bits. */
1488
1489 if (spec_long_long)
1490 bytes = TYPE_PRECISION (long_long_integer_type_node) / 8;
1491 else
1492 bytes = TYPE_PRECISION (long_integer_type_node) / 8;
1493
4ca827d0
RS
1494 warn = overflow;
1495 for (i = bytes; i < TOTAL_PARTS; i++)
1496 if (parts[i])
1497 warn = 1;
1498 if (warn)
1499 pedwarn ("integer constant out of range");
e8bbfc4e
RK
1500
1501 /* This is simplified by the fact that our constant
1502 is always positive. */
8d9bfdc5
RK
1503
1504 high = low = 0;
1505
1506 for (i = 0; i < HOST_BITS_PER_WIDE_INT / HOST_BITS_PER_CHAR; i++)
1507 {
1508 high |= ((HOST_WIDE_INT) parts[i + (HOST_BITS_PER_WIDE_INT
1509 / HOST_BITS_PER_CHAR)]
1510 << (i * HOST_BITS_PER_CHAR));
1511 low |= (HOST_WIDE_INT) parts[i] << (i * HOST_BITS_PER_CHAR);
1512 }
1513
1514 yylval.ttype = build_int_2 (low, high);
5a9085c7 1515 TREE_TYPE (yylval.ttype) = long_long_unsigned_type_node;
e8bbfc4e 1516
e8bbfc4e
RK
1517 /* If warn_traditional, calculate both the ANSI type and the
1518 traditional type, then see if they disagree.
1519 Otherwise, calculate only the type for the dialect in use. */
1520 if (warn_traditional || flag_traditional)
1521 {
1522 /* Calculate the traditional type. */
1523 /* Traditionally, any constant is signed;
1524 but if unsigned is specified explicitly, obey that.
1525 Use the smallest size with the right number of bits,
1526 except for one special case with decimal constants. */
1527 if (! spec_long && base != 10
1528 && int_fits_type_p (yylval.ttype, unsigned_type_node))
1529 traditional_type = (spec_unsigned ? unsigned_type_node
1530 : integer_type_node);
1531 /* A decimal constant must be long
1532 if it does not fit in type int.
1533 I think this is independent of whether
1534 the constant is signed. */
1535 else if (! spec_long && base == 10
1536 && int_fits_type_p (yylval.ttype, integer_type_node))
1537 traditional_type = (spec_unsigned ? unsigned_type_node
1538 : integer_type_node);
4ca827d0 1539 else if (! spec_long_long)
e8bbfc4e
RK
1540 traditional_type = (spec_unsigned ? long_unsigned_type_node
1541 : long_integer_type_node);
1542 else
1543 traditional_type = (spec_unsigned
1544 ? long_long_unsigned_type_node
1545 : long_long_integer_type_node);
1546 }
1547 if (warn_traditional || ! flag_traditional)
1548 {
1549 /* Calculate the ANSI type. */
1550 if (! spec_long && ! spec_unsigned
1551 && int_fits_type_p (yylval.ttype, integer_type_node))
1552 ansi_type = integer_type_node;
1553 else if (! spec_long && (base != 10 || spec_unsigned)
1554 && int_fits_type_p (yylval.ttype, unsigned_type_node))
1555 ansi_type = unsigned_type_node;
1556 else if (! spec_unsigned && !spec_long_long
1557 && int_fits_type_p (yylval.ttype, long_integer_type_node))
1558 ansi_type = long_integer_type_node;
4ca827d0 1559 else if (! spec_long_long)
e8bbfc4e
RK
1560 ansi_type = long_unsigned_type_node;
1561 else if (! spec_unsigned
a120b788
RS
1562 /* Verify value does not overflow into sign bit. */
1563 && TREE_INT_CST_HIGH (yylval.ttype) >= 0
e8bbfc4e
RK
1564 && int_fits_type_p (yylval.ttype,
1565 long_long_integer_type_node))
1566 ansi_type = long_long_integer_type_node;
1567 else
1568 ansi_type = long_long_unsigned_type_node;
1569 }
1570
1571 type = flag_traditional ? traditional_type : ansi_type;
1572
1573 if (warn_traditional && traditional_type != ansi_type)
1574 {
1575 if (TYPE_PRECISION (traditional_type)
1576 != TYPE_PRECISION (ansi_type))
1577 warning ("width of integer constant changes with -traditional");
1578 else if (TREE_UNSIGNED (traditional_type)
1579 != TREE_UNSIGNED (ansi_type))
1580 warning ("integer constant is unsigned in ANSI C, signed with -traditional");
a3ee5899
JW
1581 else
1582 warning ("width of integer constant may change on other systems with -traditional");
e8bbfc4e 1583 }
e8bbfc4e 1584
4ca827d0
RS
1585 if (!flag_traditional && !int_fits_type_p (yylval.ttype, type)
1586 && !warn)
88d92ca5
RS
1587 pedwarn ("integer constant out of range");
1588
c832a30e
RS
1589 if (base == 10 && ! spec_unsigned && TREE_UNSIGNED (type))
1590 warning ("integer constant is so large that it is unsigned");
1591
88dd95c1
RS
1592 if (flag_traditional && !int_fits_type_p (yylval.ttype, type))
1593 /* The traditional constant 0x80000000 is signed
1594 but doesn't fit in the range of int.
1595 This will change it to -0x80000000, which does fit. */
1596 {
1597 TREE_TYPE (yylval.ttype) = unsigned_type (type);
1598 yylval.ttype = convert (type, yylval.ttype);
1599 }
1600 else
1601 TREE_TYPE (yylval.ttype) = type;
1602
e8bbfc4e
RK
1603 *p = 0;
1604 }
1605
1606 value = CONSTANT; break;
1607 }
1608
1609 case '\'':
1610 char_constant:
1611 {
1612 register int result = 0;
a2543283 1613 register int num_chars = 0;
e8bbfc4e
RK
1614 unsigned width = TYPE_PRECISION (char_type_node);
1615 int max_chars;
1616
1617 if (wide_flag)
1618 {
1619 width = WCHAR_TYPE_SIZE;
1620#ifdef MULTIBYTE_CHARS
1621 max_chars = MB_CUR_MAX;
1622#else
1623 max_chars = 1;
1624#endif
1625 }
1626 else
1627 max_chars = TYPE_PRECISION (integer_type_node) / width;
1628
1629 while (1)
1630 {
1631 tryagain:
1632
1633 c = getc (finput);
1634
1635 if (c == '\'' || c == EOF)
1636 break;
1637
1638 if (c == '\\')
1639 {
1640 c = readescape ();
1641 if (c < 0)
1642 goto tryagain;
1643 if (width < HOST_BITS_PER_INT
1644 && (unsigned) c >= (1 << width))
1645 pedwarn ("escape sequence out of range for character");
1646 }
1647 else if (c == '\n')
1648 {
1649 if (pedantic)
1650 pedwarn ("ANSI C forbids newline in character constant");
1651 lineno++;
1652 }
1653
1654 num_chars++;
1655 if (num_chars > maxtoken - 4)
1656 extend_token_buffer (token_buffer);
1657
1658 token_buffer[num_chars] = c;
1659
1660 /* Merge character into result; ignore excess chars. */
1661 if (num_chars < max_chars + 1)
1662 {
1663 if (width < HOST_BITS_PER_INT)
1664 result = (result << width) | (c & ((1 << width) - 1));
1665 else
1666 result = c;
1667 }
1668 }
1669
1670 token_buffer[num_chars + 1] = '\'';
1671 token_buffer[num_chars + 2] = 0;
1672
1673 if (c != '\'')
1674 error ("malformatted character constant");
1675 else if (num_chars == 0)
1676 error ("empty character constant");
1677 else if (num_chars > max_chars)
1678 {
1679 num_chars = max_chars;
1680 error ("character constant too long");
1681 }
1682 else if (num_chars != 1 && ! flag_traditional)
1683 warning ("multi-character character constant");
1684
1685 /* If char type is signed, sign-extend the constant. */
1686 if (! wide_flag)
1687 {
1688 int num_bits = num_chars * width;
1689 if (TREE_UNSIGNED (char_type_node)
1690 || ((result >> (num_bits - 1)) & 1) == 0)
1691 yylval.ttype
8d9bfdc5
RK
1692 = build_int_2 (result & ((unsigned HOST_WIDE_INT) ~0
1693 >> (HOST_BITS_PER_WIDE_INT - num_bits)),
e8bbfc4e
RK
1694 0);
1695 else
1696 yylval.ttype
8d9bfdc5
RK
1697 = build_int_2 (result | ~((unsigned HOST_WIDE_INT) ~0
1698 >> (HOST_BITS_PER_WIDE_INT - num_bits)),
e8bbfc4e
RK
1699 -1);
1700 }
1701 else
1702 {
1703#ifdef MULTIBYTE_CHARS
1704 /* Set the initial shift state and convert the next sequence. */
1705 result = 0;
1706 /* In all locales L'\0' is zero and mbtowc will return zero,
1707 so don't use it. */
1708 if (num_chars > 1
1709 || (num_chars == 1 && token_buffer[1] != '\0'))
1710 {
1711 wchar_t wc;
8d9bfdc5 1712 (void) mbtowc (NULL_PTR, NULL_PTR, 0);
e8bbfc4e
RK
1713 if (mbtowc (& wc, token_buffer + 1, num_chars) == num_chars)
1714 result = wc;
1715 else
1716 warning ("Ignoring invalid multibyte character");
1717 }
1718#endif
1719 yylval.ttype = build_int_2 (result, 0);
1720 }
1721
1722 TREE_TYPE (yylval.ttype) = integer_type_node;
1723 value = CONSTANT;
1724 break;
1725 }
1726
1727 case '"':
1728 string_constant:
1729 {
1730 c = getc (finput);
1731 p = token_buffer + 1;
1732
1733 while (c != '"' && c >= 0)
1734 {
1735 /* ignore_escape_flag is set for reading the filename in #line. */
1736 if (!ignore_escape_flag && c == '\\')
1737 {
1738 c = readescape ();
1739 if (c < 0)
1740 goto skipnewline;
1741 if (!wide_flag
1742 && TYPE_PRECISION (char_type_node) < HOST_BITS_PER_INT
1743 && c >= (1 << TYPE_PRECISION (char_type_node)))
1744 pedwarn ("escape sequence out of range for character");
1745 }
1746 else if (c == '\n')
1747 {
1748 if (pedantic)
1749 pedwarn ("ANSI C forbids newline in string constant");
1750 lineno++;
1751 }
1752
1753 if (p == token_buffer + maxtoken)
1754 p = extend_token_buffer (p);
1755 *p++ = c;
1756
1757 skipnewline:
1758 c = getc (finput);
1759 }
1760 *p = 0;
1761
1762 /* We have read the entire constant.
1763 Construct a STRING_CST for the result. */
1764
1765 if (wide_flag)
1766 {
1767 /* If this is a L"..." wide-string, convert the multibyte string
1768 to a wide character string. */
1769 char *widep = (char *) alloca ((p - token_buffer) * WCHAR_BYTES);
1770 int len;
1771
1772#ifdef MULTIBYTE_CHARS
1773 len = mbstowcs ((wchar_t *) widep, token_buffer + 1, p - token_buffer);
1774 if ((unsigned) len >= (p - token_buffer))
1775 {
1776 warning ("Ignoring invalid multibyte string");
1777 len = 0;
1778 }
1779 bzero (widep + (len * WCHAR_BYTES), WCHAR_BYTES);
1780#else
1781 {
1782 union { long l; char c[sizeof (long)]; } u;
1783 int big_endian;
1784 char *wp, *cp;
1785
1786 /* Determine whether host is little or big endian. */
1787 u.l = 1;
1788 big_endian = u.c[sizeof (long) - 1];
1789 wp = widep + (big_endian ? WCHAR_BYTES - 1 : 0);
1790
1791 bzero (widep, (p - token_buffer) * WCHAR_BYTES);
1792 for (cp = token_buffer + 1; cp < p; cp++)
1793 *wp = *cp, wp += WCHAR_BYTES;
1794 len = p - token_buffer - 1;
1795 }
1796#endif
1797 yylval.ttype = build_string ((len + 1) * WCHAR_BYTES, widep);
1798 TREE_TYPE (yylval.ttype) = wchar_array_type_node;
1799 }
1800 else
1801 {
1802 yylval.ttype = build_string (p - token_buffer, token_buffer + 1);
1803 TREE_TYPE (yylval.ttype) = char_array_type_node;
1804 }
1805
1806 *p++ = '"';
1807 *p = 0;
1808
1809 value = STRING; break;
1810 }
1811
1812 case '+':
1813 case '-':
1814 case '&':
1815 case '|':
1816 case '<':
1817 case '>':
1818 case '*':
1819 case '/':
1820 case '%':
1821 case '^':
1822 case '!':
1823 case '=':
1824 {
1825 register int c1;
1826
1827 combine:
1828
1829 switch (c)
1830 {
1831 case '+':
1832 yylval.code = PLUS_EXPR; break;
1833 case '-':
1834 yylval.code = MINUS_EXPR; break;
1835 case '&':
1836 yylval.code = BIT_AND_EXPR; break;
1837 case '|':
1838 yylval.code = BIT_IOR_EXPR; break;
1839 case '*':
1840 yylval.code = MULT_EXPR; break;
1841 case '/':
1842 yylval.code = TRUNC_DIV_EXPR; break;
1843 case '%':
1844 yylval.code = TRUNC_MOD_EXPR; break;
1845 case '^':
1846 yylval.code = BIT_XOR_EXPR; break;
1847 case LSHIFT:
1848 yylval.code = LSHIFT_EXPR; break;
1849 case RSHIFT:
1850 yylval.code = RSHIFT_EXPR; break;
1851 case '<':
1852 yylval.code = LT_EXPR; break;
1853 case '>':
1854 yylval.code = GT_EXPR; break;
1855 }
1856
1857 token_buffer[1] = c1 = getc (finput);
1858 token_buffer[2] = 0;
1859
1860 if (c1 == '=')
1861 {
1862 switch (c)
1863 {
1864 case '<':
1865 value = ARITHCOMPARE; yylval.code = LE_EXPR; goto done;
1866 case '>':
1867 value = ARITHCOMPARE; yylval.code = GE_EXPR; goto done;
1868 case '!':
1869 value = EQCOMPARE; yylval.code = NE_EXPR; goto done;
1870 case '=':
1871 value = EQCOMPARE; yylval.code = EQ_EXPR; goto done;
1872 }
1873 value = ASSIGN; goto done;
1874 }
1875 else if (c == c1)
1876 switch (c)
1877 {
1878 case '+':
1879 value = PLUSPLUS; goto done;
1880 case '-':
1881 value = MINUSMINUS; goto done;
1882 case '&':
1883 value = ANDAND; goto done;
1884 case '|':
1885 value = OROR; goto done;
1886 case '<':
1887 c = LSHIFT;
1888 goto combine;
1889 case '>':
1890 c = RSHIFT;
1891 goto combine;
1892 }
1893 else if ((c == '-') && (c1 == '>'))
1894 { value = POINTSAT; goto done; }
1895 ungetc (c1, finput);
1896 token_buffer[1] = 0;
1897
1898 if ((c == '<') || (c == '>'))
1899 value = ARITHCOMPARE;
1900 else value = c;
1901 goto done;
1902 }
1903
1904 case 0:
1905 /* Don't make yyparse think this is eof. */
1906 value = 1;
1907 break;
1908
1909 default:
1910 value = c;
1911 }
1912
1913done:
1914/* yylloc.last_line = lineno; */
1915
1916 return value;
1917}
1918
d45cf215 1919/* Sets the value of the 'yydebug' variable to VALUE.
e8bbfc4e
RK
1920 This is a function so we don't have to have YYDEBUG defined
1921 in order to build the compiler. */
1922
1923void
1924set_yydebug (value)
1925 int value;
1926{
1927#if YYDEBUG != 0
1928 yydebug = value;
1929#else
1930 warning ("YYDEBUG not defined.");
1931#endif
1932}
This page took 0.610112 seconds and 5 git commands to generate.