/* Definitions for CPP library.
- Copyright (C) 1995, 96-99, 2000 Free Software Foundation, Inc.
+ Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001
+ Free Software Foundation, Inc.
Written by Per Bothner, 1994-95.
This program is free software; you can redistribute it and/or modify it
extern "C" {
#endif
+/* For complex reasons, cpp_reader is also typedefed in c-pragma.h. */
+#ifndef _C_PRAGMA_H
typedef struct cpp_reader cpp_reader;
+#endif
typedef struct cpp_buffer cpp_buffer;
typedef struct cpp_options cpp_options;
-typedef struct cpp_printer cpp_printer;
typedef struct cpp_token cpp_token;
-typedef struct cpp_toklist cpp_toklist;
typedef struct cpp_string cpp_string;
typedef struct cpp_hashnode cpp_hashnode;
+typedef struct cpp_macro cpp_macro;
+typedef struct cpp_lexer_pos cpp_lexer_pos;
+typedef struct cpp_lookahead cpp_lookahead;
+typedef struct cpp_callbacks cpp_callbacks;
+
+struct answer;
+struct file_name_map_list;
/* The first two groups, apart from '=', can appear in preprocessor
expressions. This allows a lookup table to be implemented in
the same order as their counterparts without the '=', like ">>". */
/* Positions in the table. */
-#define CPP_LAST_EQ CPP_LSHIFT
+#define CPP_LAST_EQ CPP_MAX
#define CPP_FIRST_DIGRAPH CPP_HASH
+#define CPP_LAST_PUNCTUATOR CPP_DOT_STAR
#define TTYPE_TABLE \
- T(CPP_EQ = 0, "=") \
- T(CPP_NOT, "!") \
- T(CPP_GREATER, ">") /* compare */ \
- T(CPP_LESS, "<") \
- T(CPP_PLUS, "+") /* math */ \
- T(CPP_MINUS, "-") \
- T(CPP_MULT, "*") \
- T(CPP_DIV, "/") \
- T(CPP_MOD, "%") \
- T(CPP_AND, "&") /* bit ops */ \
- T(CPP_OR, "|") \
- T(CPP_XOR, "^") \
- T(CPP_RSHIFT, ">>") \
- T(CPP_LSHIFT, "<<") \
+ OP(CPP_EQ = 0, "=") \
+ OP(CPP_NOT, "!") \
+ OP(CPP_GREATER, ">") /* compare */ \
+ OP(CPP_LESS, "<") \
+ OP(CPP_PLUS, "+") /* math */ \
+ OP(CPP_MINUS, "-") \
+ OP(CPP_MULT, "*") \
+ OP(CPP_DIV, "/") \
+ OP(CPP_MOD, "%") \
+ OP(CPP_AND, "&") /* bit ops */ \
+ OP(CPP_OR, "|") \
+ OP(CPP_XOR, "^") \
+ OP(CPP_RSHIFT, ">>") \
+ OP(CPP_LSHIFT, "<<") \
+ OP(CPP_MIN, "<?") /* extension */ \
+ OP(CPP_MAX, ">?") \
\
- T(CPP_COMPL, "~") \
- T(CPP_AND_AND, "&&") /* logical */ \
- T(CPP_OR_OR, "||") \
- T(CPP_QUERY, "?") \
- T(CPP_COLON, ":") \
- T(CPP_COMMA, ",") /* grouping */ \
- T(CPP_OPEN_PAREN, "(") \
- T(CPP_CLOSE_PAREN, ")") \
- T(CPP_EQ_EQ, "==") /* compare */ \
- T(CPP_NOT_EQ, "!=") \
- T(CPP_GREATER_EQ, ">=") \
- T(CPP_LESS_EQ, "<=") \
+ OP(CPP_COMPL, "~") \
+ OP(CPP_AND_AND, "&&") /* logical */ \
+ OP(CPP_OR_OR, "||") \
+ OP(CPP_QUERY, "?") \
+ OP(CPP_COLON, ":") \
+ OP(CPP_COMMA, ",") /* grouping */ \
+ OP(CPP_OPEN_PAREN, "(") \
+ OP(CPP_CLOSE_PAREN, ")") \
+ OP(CPP_EQ_EQ, "==") /* compare */ \
+ OP(CPP_NOT_EQ, "!=") \
+ OP(CPP_GREATER_EQ, ">=") \
+ OP(CPP_LESS_EQ, "<=") \
\
- T(CPP_PLUS_EQ, "+=") /* math */ \
- T(CPP_MINUS_EQ, "-=") \
- T(CPP_MULT_EQ, "*=") \
- T(CPP_DIV_EQ, "/=") \
- T(CPP_MOD_EQ, "%=") \
- T(CPP_AND_EQ, "&=") /* bit ops */ \
- T(CPP_OR_EQ, "|=") \
- T(CPP_XOR_EQ, "^=") \
- T(CPP_RSHIFT_EQ, ">>=") \
- T(CPP_LSHIFT_EQ, "<<=") \
+ OP(CPP_PLUS_EQ, "+=") /* math */ \
+ OP(CPP_MINUS_EQ, "-=") \
+ OP(CPP_MULT_EQ, "*=") \
+ OP(CPP_DIV_EQ, "/=") \
+ OP(CPP_MOD_EQ, "%=") \
+ OP(CPP_AND_EQ, "&=") /* bit ops */ \
+ OP(CPP_OR_EQ, "|=") \
+ OP(CPP_XOR_EQ, "^=") \
+ OP(CPP_RSHIFT_EQ, ">>=") \
+ OP(CPP_LSHIFT_EQ, "<<=") \
+ OP(CPP_MIN_EQ, "<?=") /* extension */ \
+ OP(CPP_MAX_EQ, ">?=") \
/* Digraphs together, beginning with CPP_FIRST_DIGRAPH. */ \
- T(CPP_HASH, "#") /* digraphs */ \
- T(CPP_PASTE, "##") \
- T(CPP_OPEN_SQUARE, "[") \
- T(CPP_CLOSE_SQUARE, "]") \
- T(CPP_OPEN_BRACE, "{") \
- T(CPP_CLOSE_BRACE, "}") \
- /* The remainder of the punctuation. Order is not significant. */ \
- T(CPP_SEMICOLON, ";") /* structure */ \
- T(CPP_ELLIPSIS, "...") \
- T(CPP_BACKSLASH, "\\") \
- T(CPP_PLUS_PLUS, "++") /* increment */ \
- T(CPP_MINUS_MINUS, "--") \
- T(CPP_DEREF, "->") /* accessors */ \
- T(CPP_DOT, ".") \
- T(CPP_SCOPE, "::") \
- T(CPP_DEREF_STAR, "->*") \
- T(CPP_DOT_STAR, ".*") \
- T(CPP_MIN, "<?") /* extension */ \
- T(CPP_MAX, ">?") \
- T(CPP_PLACEMARKER, "") /* Placemarker token. */ \
- C(CPP_OTHER, 0) /* stray punctuation */ \
+ OP(CPP_HASH, "#") /* digraphs */ \
+ OP(CPP_PASTE, "##") \
+ OP(CPP_OPEN_SQUARE, "[") \
+ OP(CPP_CLOSE_SQUARE, "]") \
+ OP(CPP_OPEN_BRACE, "{") \
+ OP(CPP_CLOSE_BRACE, "}") \
+ /* The remainder of the punctuation. Order is not significant. */ \
+ OP(CPP_SEMICOLON, ";") /* structure */ \
+ OP(CPP_ELLIPSIS, "...") \
+ OP(CPP_PLUS_PLUS, "++") /* increment */ \
+ OP(CPP_MINUS_MINUS, "--") \
+ OP(CPP_DEREF, "->") /* accessors */ \
+ OP(CPP_DOT, ".") \
+ OP(CPP_SCOPE, "::") \
+ OP(CPP_DEREF_STAR, "->*") \
+ OP(CPP_DOT_STAR, ".*") \
+\
+ TK(CPP_NAME, SPELL_IDENT) /* word */ \
+ TK(CPP_INT, SPELL_STRING) /* 23 */ \
+ TK(CPP_FLOAT, SPELL_STRING) /* 3.14159 */ \
+ TK(CPP_NUMBER, SPELL_STRING) /* 34_be+ta */ \
+\
+ TK(CPP_CHAR, SPELL_STRING) /* 'char' */ \
+ TK(CPP_WCHAR, SPELL_STRING) /* L'char' */ \
+ TK(CPP_OTHER, SPELL_CHAR) /* stray punctuation */ \
\
- I(CPP_NAME, 0) /* word */ \
- S(CPP_INT, 0) /* 23 */ \
- S(CPP_FLOAT, 0) /* 3.14159 */ \
- S(CPP_NUMBER, 0) /* 34_be+ta */ \
- S(CPP_CHAR, 0) /* 'char' */ \
- S(CPP_WCHAR, 0) /* L'char' */ \
- S(CPP_STRING, 0) /* "string" */ \
- S(CPP_WSTRING, 0) /* L"string" */ \
+ TK(CPP_STRING, SPELL_STRING) /* "string" */ \
+ TK(CPP_WSTRING, SPELL_STRING) /* L"string" */ \
+ TK(CPP_OSTRING, SPELL_STRING) /* @"string" - Objective C */ \
+ TK(CPP_HEADER_NAME, SPELL_STRING) /* <stdio.h> in #include */ \
\
- S(CPP_COMMENT, 0) /* Only if output comments. */ \
- N(CPP_MACRO_ARG, 0) /* Macro argument. */ \
- N(CPP_EOF, 0) /* End of file. */ \
- S(CPP_HEADER_NAME, 0) /* <stdio.h> in #include */
-
-#define T(e, s) e,
-#define I(e, s) e,
-#define S(e, s) e,
-#define C(e, s) e,
-#define N(e, s) e,
+ TK(CPP_COMMENT, SPELL_STRING) /* Only if output comments. */ \
+ TK(CPP_MACRO_ARG, SPELL_NONE) /* Macro argument. */ \
+ OP(CPP_EOF, "EOL") /* End of line or file. */
+
+#define OP(e, s) e,
+#define TK(e, s) e,
enum cpp_ttype
{
TTYPE_TABLE
N_TTYPES
};
-#undef T
-#undef I
-#undef S
-#undef C
-#undef N
+#undef OP
+#undef TK
+
+/* C language kind, used when calling cpp_create_reader. */
+enum c_lang {CLK_GNUC89 = 0, CLK_GNUC99, CLK_STDC89, CLK_STDC94, CLK_STDC99,
+ CLK_GNUCXX, CLK_CXX98, CLK_OBJC, CLK_OBJCXX, CLK_ASM};
/* Payload of a NUMBER, FLOAT, STRING, or COMMENT token. */
struct cpp_string
/* Flags for the cpp_token structure. */
#define PREV_WHITE (1 << 0) /* If whitespace before this token. */
-#define BOL (1 << 1) /* Beginning of logical line. */
-#define DIGRAPH (1 << 2) /* If it was a digraph. */
-#define STRINGIFY_ARG (1 << 3) /* If macro argument to be stringified. */
-#define PASTE_LEFT (1 << 4) /* If on LHS of a ## operator. */
-#define PASTED (1 << 5) /* The result of a ## operator. */
+#define DIGRAPH (1 << 1) /* If it was a digraph. */
+#define STRINGIFY_ARG (1 << 2) /* If macro argument to be stringified. */
+#define PASTE_LEFT (1 << 3) /* If on LHS of a ## operator. */
+#define NAMED_OP (1 << 4) /* C++ named operators. */
+#define NO_EXPAND (1 << 5) /* Do not macro-expand this token. */
+#define AVOID_LPASTE (1 << 6) /* Check left for accidental pastes. */
/* A preprocessing token. This has been carefully packed and should
- occupy 16 bytes on 32-bit hosts and 24 bytes on 64-bit hosts. */
+ occupy 12 bytes on 32-bit hosts and 16 bytes on 64-bit hosts. */
struct cpp_token
{
- unsigned int line; /* starting line number of this token */
- unsigned short col; /* starting column of this token */
ENUM_BITFIELD(cpp_ttype) type : CHAR_BIT; /* token type */
unsigned char flags; /* flags - see above */
union
{
- HOST_WIDEST_INT integer; /* an integer */
- struct cpp_hashnode *node; /* an identifier */
- struct cpp_string str; /* a string, or number */
- unsigned int aux; /* argument no. for a CPP_MACRO_ARG, or
- character represented by CPP_OTHER. */
+ struct cpp_hashnode *node; /* An identifier. */
+ struct cpp_string str; /* A string, or number. */
+ unsigned int arg_no; /* Argument no. for a CPP_MACRO_ARG. */
+ unsigned char c; /* Character represented by CPP_OTHER. */
} val;
};
-/* cpp_toklist flags. */
-#define LIST_OFFSET (1 << 0)
-#define VAR_ARGS (1 << 1)
-#define GNU_REST_ARGS (1 << 2) /* Set in addition to VAR_ARGS. */
-#define BEG_OF_FILE (1 << 3)
-
-struct directive; /* These are deliberately incomplete. */
-struct answer;
-struct macro_args;
-struct cpp_context;
-
-struct cpp_toklist
+/* The position of a token in the current file. */
+struct cpp_lexer_pos
{
- cpp_token *tokens; /* actual tokens as an array */
- unsigned int tokens_used; /* tokens used */
- unsigned int tokens_cap; /* tokens allocated */
-
- unsigned char *namebuf; /* names buffer */
- unsigned int name_used; /* _bytes_ used */
- unsigned int name_cap; /* _bytes_ allocated */
-
- /* If the list represents a directive, this points to it. */
- const struct directive *directive;
-
- const char *file; /* in file name */
- unsigned int line; /* starting line number */
-
- unsigned short params_len; /* length of macro parameter names. */
-
- short int paramc; /* no. of macro params (-1 = obj-like). */
-
- /* Per-list flags, see above */
- unsigned short flags;
+ unsigned int line;
+ unsigned int output_line;
+ unsigned short col;
};
-struct cpp_buffer
+typedef struct cpp_token_with_pos cpp_token_with_pos;
+struct cpp_token_with_pos
{
- const unsigned char *cur; /* current position */
- const unsigned char *rlimit; /* end of valid data */
- const unsigned char *buf; /* entire buffer */
- const unsigned char *line_base; /* start of current line */
-
- struct cpp_buffer *prev;
-
- /* Filename specified with #line command. */
- const char *nominal_fname;
-
- /* Actual directory of this file, used only for "" includes */
- struct file_name_list *actual_dir;
-
- /* Pointer into the include table. Used for include_next and
- to record control macros. */
- struct include_file *inc;
-
- /* Value of if_stack at start of this file.
- Used to prohibit unmatched #endif (etc) in an include file. */
- struct if_stack *if_stack;
-
- /* Line number at line_base (above). */
- unsigned int lineno;
-
- /* True if we have already warned about C++ comments in this file.
- The warning happens only for C89 extended mode with -pedantic on,
- or for -Wtraditional, and only once per file (otherwise it would
- be far too noisy). */
- char warned_cplusplus_comments;
-
- /* True if this buffer's data is mmapped. */
- char mapped;
+ cpp_token token;
+ cpp_lexer_pos pos;
};
-struct file_name_map_list;
-struct htab;
+/* Token lookahead. */
+struct cpp_lookahead
+{
+ struct cpp_lookahead *next;
+ cpp_token_with_pos *tokens;
+ cpp_lexer_pos pos;
+ unsigned int cur, count, cap;
+};
-/* Maximum nesting of cpp_buffers. We use a static limit, partly for
- efficiency, and partly to limit runaway recursion. */
-#define CPP_STACK_MAX 200
+/* A standalone character. We may want to make it unsigned for the
+ same reason we use unsigned char - to avoid signedness issues. */
+typedef int cppchar_t;
/* Values for opts.dump_macros.
dump_only means inhibit output of the preprocessed text
being written to stdout. */
const char *deps_file;
- /* Target-name to write with the dependency information. */
- char *deps_target;
-
/* Search paths for include files. */
struct file_name_list *quote_include; /* First dir to search for "file" */
struct file_name_list *bracket_include;/* First dir to search for <file> */
const char *include_prefix;
unsigned int include_prefix_len;
+ /* -fleading-underscore sets this to "_". */
+ const char *user_label_prefix;
+
+ /* The language we're preprocessing. */
+ enum c_lang lang;
+
/* Non-0 means -v, so print the full set of include dirs. */
unsigned char verbose;
/* Nonzero means handle #import, for objective C. */
unsigned char objc;
- /* Nonzero means this is an assembly file, so ignore unrecognized
- directives and the "# 33" form of #line, both of which are
- probably comments. Also, permit unbalanced ' strings (again,
- likely to be in comments). */
- unsigned char lang_asm;
-
/* Nonzero means don't copy comments into the output file. */
unsigned char discard_comments;
/* Nonzero means process the ISO digraph sequences. */
unsigned char digraphs;
+ /* Nonzero means to allow hexadecimal floats and LL suffixes. */
+ unsigned char extended_numbers;
+
/* Nonzero means print the names of included files rather than the
preprocessed output. 1 means just the #include "...", 2 means
#include <...> as well. */
unsigned char print_deps;
+ /* Nonzero if phony targets are created for each header. */
+ unsigned char deps_phony_targets;
+
/* Nonzero if missing .h files in -M output are assumed to be
generated files and not errors. */
unsigned char print_deps_missing_files;
/* Nonzero means don't print warning messages. */
unsigned char inhibit_warnings;
+ /* Nonzero means don't suppress warnings from system headers. */
+ unsigned char warn_system_headers;
+
/* Nonzero means don't print error messages. Has no option to
select it, but can be set by a user of cpplib (e.g. fix-header). */
unsigned char inhibit_errors;
traditional C. */
unsigned char warn_traditional;
- /* Nonzero means warn if ## is applied to two tokens that cannot be
- pasted together. */
- unsigned char warn_paste;
-
/* Nonzero means turn warnings into errors. */
unsigned char warnings_are_errors;
/* Nonzero means warn if undefined identifiers are evaluated in an #if. */
unsigned char warn_undef;
- /* Nonzero for the 1989 C Standard, including corrigenda and amendments. */
- unsigned char c89;
-
/* Nonzero for the 1999 C Standard, including corrigenda and amendments. */
unsigned char c99;
/* Nonzero means dump macros in some fashion - see above. */
unsigned char dump_macros;
- /* Nonzero means pass all #define and #undef directives which we
- actually process through to the output stream. This feature is
- used primarily to allow cc1 to record the #defines and #undefs
- for the sake of debuggers which understand about preprocessor
- macros, but it may also be useful with -E to figure out how
- symbols are defined, and where they are defined. */
- unsigned char debug_output;
-
/* Nonzero means pass #include lines through to the output. */
unsigned char dump_includes;
/* Print column number in error messages. */
unsigned char show_column;
-};
-
-/* A cpp_reader encapsulates the "state" of a pre-processor run.
- Applying cpp_get_token repeatedly yields a stream of pre-processor
- tokens. Usually, there is only one cpp_reader object active. */
-
-struct cpp_reader
-{
- /* HACK FIXME. Maybe make into cpp_printer printer later. */
- cpp_printer *printer;
- /* Top of buffer stack. */
- cpp_buffer *buffer;
+ /* Treat C++ alternate operator names specially. */
+ unsigned char operator_names;
- /* A buffer used for both for cpp_get_token's output, and also internally. */
- unsigned char *token_buffer;
- /* Allocated size of token_buffer. CPP_RESERVE allocates space. */
- unsigned int token_buffer_size;
- /* End of the written part of token_buffer. */
- unsigned char *limit;
-
- /* Error counter for exit code */
- unsigned int errors;
-
- /* Line and column where a newline was first seen in a string constant. */
- unsigned int multiline_string_line;
- unsigned int multiline_string_column;
-
- /* Current depth in #include directives that use <...>. */
- unsigned int system_include_depth;
-
- /* Current depth of buffer stack. */
- unsigned int buffer_stack_depth;
-
- /* Current depth in #include directives. */
- unsigned int include_depth;
-
- /* Hash table of macros and assertions. See cpphash.c */
- struct htab *hashtab;
-
- /* Tree of other included files. See cppfiles.c */
- struct splay_tree_s *all_include_files;
-
- /* Chain of `actual directory' file_name_list entries,
- for "" inclusion. */
- struct file_name_list *actual_dirs;
-
- /* Current maximum length of directory names in the search path
- for include files. (Altered as we get more of them.) */
- unsigned int max_include_len;
-
- /* Potential controlling macro for the current buffer. This is only
- live between the #endif and the end of file, and there can only
- be one at a time, so it is per-reader not per-buffer. */
- const cpp_hashnode *potential_control_macro;
-
- /* Token column position adjustment owing to tabs in whitespace. */
- unsigned int col_adjust;
-
- /* Token list used to store logical lines with new lexer. */
- cpp_toklist token_list;
-
- /* Temporary token store. */
- cpp_token **temp_tokens;
- unsigned int temp_cap;
- unsigned int temp_alloced;
- unsigned int temp_used;
-
- /* Date and time tokens. Calculated together if either is requested. */
- cpp_token *date;
- cpp_token *time;
-
- /* The # of a the current directive. It may not be first in line if
- we append, and finding it is tedious. */
- const cpp_token *first_directive_token;
-
- /* Context stack. Used for macro expansion and for determining
- which macros are disabled. */
- unsigned int context_cap;
- unsigned int cur_context;
- unsigned int no_expand_level;
- unsigned int paste_level;
- struct cpp_context *contexts;
-
- /* Current arguments when scanning arguments. Used for pointer
- fix-up. */
- struct macro_args *args;
-
- /* Buffer of -M output. */
- struct deps *deps;
-
- /* Obstack holding all macro hash nodes. This never shrinks.
- See cpphash.c */
- struct obstack *hash_ob;
-
- /* Obstack holding buffer and conditional structures. This is a
- real stack. See cpplib.c */
- struct obstack *buffer_ob;
-
- /* User visible options. */
- struct cpp_options opts;
-
- /* Nonzero means we have printed (while error reporting) a list of
- containing files that matches the current status. */
- unsigned char input_stack_listing_current;
-
- /* We're printed a warning recommending against using #import. */
- unsigned char import_warning;
-
- /* True after cpp_start_read completes. Used to inhibit some
- warnings while parsing the command line. */
- unsigned char done_initializing;
-
- /* True if we are skipping a failed conditional group. */
- unsigned char skipping;
-
- /* True if we need to save parameter spellings - only if -pedantic,
- or we might need to write out definitions. */
- unsigned char save_parameter_spellings;
-
- /* If we're in lex_line. */
- unsigned char in_lex_line;
+ /* True if --help, --version or --target-help appeared in the
+ options. Stand-alone CPP should then bail out after option
+ parsing; drivers might want to continue printing help. */
+ unsigned char help_only;
+};
- /* True if output_line_command needs to output a newline. */
- unsigned char need_newline;
+/* Reason for a file change. It is recorded in the cpp_file_change
+ structure below, which is passed to the file_change call back. */
+enum cpp_fc_reason {FC_ENTER = 0, FC_LEAVE, FC_RENAME};
- /* Special nodes - identifiers with predefined significance to the
- preprocessor. */
- struct spec_nodes *spec_nodes;
+struct cpp_file_loc
+{
+ const char *filename;
+ unsigned int lineno;
};
-/* struct cpp_printer encapsulates state used to convert the stream of
- tokens coming from cpp_get_token back into a text file. Not
- everyone wants to do that, hence we separate the function. */
+typedef struct cpp_file_change cpp_file_change;
+struct cpp_file_change
+{
+ struct cpp_file_loc from; /* Line of #include or #line. */
+ struct cpp_file_loc to; /* Line after #include or #line, or start. */
+ enum cpp_fc_reason reason; /* Reason for change. */
+ unsigned char sysp; /* Nonzero if system header. */
+ unsigned char externc; /* Nonzero if wrapper needed. */
+};
-struct cpp_printer
+/* Call backs. */
+struct cpp_callbacks
{
- FILE *outf; /* stream to write to */
- const char *last_fname; /* previous file name */
- unsigned int last_id; /* did we just push? */
- unsigned int lineno; /* line currently being written */
- unsigned int written; /* low water mark in token buffer */
+ void (*file_change) PARAMS ((cpp_reader *, const cpp_file_change *));
+ void (*include) PARAMS ((cpp_reader *, const unsigned char *,
+ const cpp_token *));
+ void (*define) PARAMS ((cpp_reader *, cpp_hashnode *));
+ void (*undef) PARAMS ((cpp_reader *, cpp_hashnode *));
+ void (*poison) PARAMS ((cpp_reader *));
+ void (*ident) PARAMS ((cpp_reader *, const cpp_string *));
+ void (*def_pragma) PARAMS ((cpp_reader *));
};
#define CPP_FATAL_LIMIT 1000
/* True if we have seen a "fatal" error. */
-#define CPP_FATAL_ERRORS(READER) ((READER)->errors >= CPP_FATAL_LIMIT)
-
-/* Macros for manipulating the token_buffer. */
-
-/* Number of characters currently in PFILE's output buffer. */
-#define CPP_WRITTEN(PFILE) ((size_t)((PFILE)->limit - (PFILE)->token_buffer))
-#define CPP_PWRITTEN(PFILE) ((PFILE)->limit)
-#define CPP_ADJUST_WRITTEN(PFILE,DELTA) ((PFILE)->limit += (DELTA))
-#define CPP_SET_WRITTEN(PFILE,N) ((PFILE)->limit = (PFILE)->token_buffer + (N))
-
-#define CPP_OPTION(PFILE, OPTION) ((PFILE)->opts.OPTION)
-#define CPP_BUFFER(PFILE) ((PFILE)->buffer)
-#define CPP_BUF_LINE(BUF) ((BUF)->lineno)
-#define CPP_BUF_COLUMN(BUF, CUR) ((CUR) - (BUF)->line_base + pfile->col_adjust)
-#define CPP_BUF_COL(BUF) CPP_BUF_COLUMN(BUF, (BUF)->cur)
+#define CPP_FATAL_ERRORS(PFILE) (cpp_errors (PFILE) >= CPP_FATAL_LIMIT)
/* Name under which this program was invoked. */
extern const char *progname;
-/* The structure of a node in the hash table. The hash table
- has entries for all tokens defined by #define commands (type T_MACRO),
- plus some special tokens like __LINE__ (these each have their own
- type, and the appropriate code is run when that type of node is seen.
- It does not contain control words like "#define", which are recognized
- by a separate piece of code. */
-
-/* different flavors of hash nodes */
+/* Where does this buffer come from? A faked include, a source file,
+ a builtin macro, a command-line option, or a _Pragma operator. */
+enum cpp_buffer_type {BUF_FAKE, BUF_FILE, BUF_BUILTIN,
+ BUF_CL_OPTION, BUF_PRAGMA};
+
+/* The structure of a node in the hash table. The hash table has
+ entries for all identifiers: either macros defined by #define
+ commands (type NT_MACRO), assertions created with #assert
+ (NT_ASSERTION), or neither of the above (NT_VOID). Builtin macros
+ like __LINE__ are flagged NODE_BUILTIN. Poisoned identifiers are
+ flagged NODE_POISONED. NODE_OPERATOR (C++ only) indicates an
+ identifier that behaves like an operator such as "xor".
+ NODE_DIAGNOSTIC is for speed in lex_token: it indicates a
+ diagnostic may be required for this node. Currently this only
+ applies to __VA_ARGS__ and poisoned identifiers. */
+
+/* Hash node flags. */
+#define NODE_OPERATOR (1 << 0) /* C++ named operator. */
+#define NODE_POISONED (1 << 1) /* Poisoned identifier. */
+#define NODE_BUILTIN (1 << 2) /* Builtin macro. */
+#define NODE_DIAGNOSTIC (1 << 3) /* Possible diagnostic when lexed. */
+
+/* Different flavors of hash node. */
enum node_type
{
- T_VOID = 0, /* no definition yet */
- T_SPECLINE, /* `__LINE__' */
- T_DATE, /* `__DATE__' */
- T_FILE, /* `__FILE__' */
- T_BASE_FILE, /* `__BASE_FILE__' */
- T_INCLUDE_LEVEL, /* `__INCLUDE_LEVEL__' */
- T_TIME, /* `__TIME__' */
- T_STDC, /* `__STDC__' */
- T_POISON, /* poisoned identifier */
- T_MACRO, /* a macro, either object-like or function-like */
- T_ASSERTION /* predicate for #assert */
+ NT_VOID = 0, /* No definition yet. */
+ NT_MACRO, /* A macro of some form. */
+ NT_ASSERTION /* Predicate for #assert. */
+};
+
+/* Different flavors of builtin macro. */
+enum builtin_type
+{
+ BT_SPECLINE = 0, /* `__LINE__' */
+ BT_DATE, /* `__DATE__' */
+ BT_FILE, /* `__FILE__' */
+ BT_BASE_FILE, /* `__BASE_FILE__' */
+ BT_INCLUDE_LEVEL, /* `__INCLUDE_LEVEL__' */
+ BT_TIME, /* `__TIME__' */
+ BT_STDC, /* `__STDC__' */
+ BT_WEAK /* Whether or not G++ supports weak
+ symbols. */
};
/* There is a slot in the hashnode for use by front ends when integrated
struct cpp_hashnode
{
- unsigned int hash; /* cached hash value */
- unsigned short length; /* length of name */
- ENUM_BITFIELD(node_type) type : 8; /* node type */
+ const unsigned char *name; /* Null-terminated name. */
+ unsigned int hash; /* Cached hash value. */
+ unsigned short length; /* Length of name excluding null. */
+ unsigned short arg_index; /* Macro argument index. */
+ unsigned char directive_index; /* Index into directive table. */
+ ENUM_BITFIELD(node_type) type : 8; /* Node type. */
+ unsigned char flags; /* Node flags. */
union
{
- const cpp_toklist *expansion; /* a macro's replacement list. */
- struct answer *answers; /* answers to an assertion. */
+ cpp_macro *macro; /* If a macro. */
+ struct answer *answers; /* Answers to an assertion. */
+ enum cpp_ttype operator; /* Code for a named operator. */
+ enum builtin_type builtin; /* Code for a builtin macro. */
} value;
-
- union tree_node *fe_value; /* front end value */
-
- const unsigned char name[1]; /* name[length] */
};
+/* Call this first to get a handle to pass to other functions. */
+extern cpp_reader *cpp_create_reader PARAMS ((enum c_lang));
+
+/* Call this to release the handle. Any use of the handle after this
+ function returns is invalid. Returns cpp_errors (pfile). */
+extern int cpp_destroy PARAMS ((cpp_reader *));
+
+/* Call these to get pointers to the options and callback structures
+ for a given reader. These pointers are good until you call
+ cpp_finish on that reader. You can either edit the callbacks
+ through the pointer returned from cpp_get_callbacks, or set them
+ with cpp_set_callbacks. */
+extern cpp_options *cpp_get_options PARAMS ((cpp_reader *));
+extern cpp_callbacks *cpp_get_callbacks PARAMS ((cpp_reader *));
+extern void cpp_set_callbacks PARAMS ((cpp_reader *, cpp_callbacks *));
+
+/* Now call cpp_handle_option to handle one switch, or
+ cpp_handle_options to handle several. The return value is the
+ number of arguments used. If cpp_handle_options returns without
+ using all arguments, it couldn't understand the next switch. When
+ there are no switches left, you must call cpp_post_options before
+ calling cpp_start_read. Only after cpp_post_options are the
+ contents of the cpp_options structure reliable. */
extern int cpp_handle_options PARAMS ((cpp_reader *, int, char **));
extern int cpp_handle_option PARAMS ((cpp_reader *, int, char **));
-extern void cpp_reader_init PARAMS ((cpp_reader *));
-extern cpp_printer *cpp_printer_init PARAMS ((cpp_reader *, cpp_printer *));
-extern int cpp_start_read PARAMS ((cpp_reader *, cpp_printer *, const char *));
-extern void cpp_output_tokens PARAMS ((cpp_reader *, cpp_printer *,
- unsigned int));
-extern void cpp_finish PARAMS ((cpp_reader *, cpp_printer *));
-extern void cpp_cleanup PARAMS ((cpp_reader *));
-
-extern const cpp_token *cpp_get_token PARAMS ((cpp_reader *));
+extern void cpp_post_options PARAMS ((cpp_reader *));
+
+/* Error count. */
+extern unsigned int cpp_errors PARAMS ((cpp_reader *));
+
+extern unsigned int cpp_token_len PARAMS ((const cpp_token *));
+extern unsigned char *cpp_token_as_text PARAMS ((cpp_reader *,
+ const cpp_token *));
+extern unsigned char *cpp_spell_token PARAMS ((cpp_reader *, const cpp_token *,
+ unsigned char *));
+extern void cpp_register_pragma PARAMS ((cpp_reader *,
+ const char *, const char *,
+ void (*) PARAMS ((cpp_reader *))));
+extern void cpp_register_pragma_space PARAMS ((cpp_reader *, const char *));
+
+extern int cpp_start_read PARAMS ((cpp_reader *, const char *));
+extern void cpp_finish PARAMS ((cpp_reader *));
+extern int cpp_avoid_paste PARAMS ((cpp_reader *, const cpp_token *,
+ const cpp_token *));
+extern enum cpp_ttype cpp_can_paste PARAMS ((cpp_reader *, const cpp_token *,
+ const cpp_token *, int *));
+extern void cpp_get_token PARAMS ((cpp_reader *, cpp_token *));
+extern const cpp_lexer_pos *cpp_get_line PARAMS ((cpp_reader *));
+extern const unsigned char *cpp_macro_definition PARAMS ((cpp_reader *,
+ const cpp_hashnode *));
extern void cpp_define PARAMS ((cpp_reader *, const char *));
extern void cpp_assert PARAMS ((cpp_reader *, const char *));
extern void cpp_undef PARAMS ((cpp_reader *, const char *));
extern void cpp_unassert PARAMS ((cpp_reader *, const char *));
-extern void cpp_free_token_list PARAMS ((cpp_toklist *));
+extern cpp_buffer *cpp_push_buffer PARAMS ((cpp_reader *,
+ const unsigned char *, size_t,
+ enum cpp_buffer_type,
+ const char *));
+extern cpp_buffer *cpp_pop_buffer PARAMS ((cpp_reader *));
+extern int cpp_defined PARAMS ((cpp_reader *, const unsigned char *, int));
/* N.B. The error-message-printer prototypes have not been nicely
formatted because exgettext needs to see 'msgid' on the same line
ATTRIBUTE_PRINTF_4;
extern void cpp_pedwarn_with_file_and_line PARAMS ((cpp_reader *, const char *, int, int, const char *msgid, ...))
ATTRIBUTE_PRINTF_5;
-extern void cpp_error_from_errno PARAMS ((cpp_reader *, const char *));
-extern void cpp_notice_from_errno PARAMS ((cpp_reader *, const char *));
+extern void cpp_error_from_errno PARAMS ((cpp_reader *, const char *));
+extern void cpp_notice_from_errno PARAMS ((cpp_reader *, const char *));
/* In cpplex.c */
-extern cpp_buffer *cpp_push_buffer PARAMS ((cpp_reader *,
- const unsigned char *, long));
-extern cpp_buffer *cpp_pop_buffer PARAMS ((cpp_reader *));
-extern void cpp_scan_buffer PARAMS ((cpp_reader *, cpp_printer *));
-extern void cpp_scan_buffer_nooutput PARAMS ((cpp_reader *));
-extern int cpp_scan_line PARAMS ((cpp_reader *));
extern int cpp_ideq PARAMS ((const cpp_token *,
const char *));
+extern void cpp_output_line PARAMS ((cpp_reader *, FILE *));
+extern void cpp_output_token PARAMS ((const cpp_token *, FILE *));
+extern const char *cpp_type2name PARAMS ((enum cpp_ttype));
/* In cpphash.c */
-extern int cpp_defined PARAMS ((cpp_reader *,
- const unsigned char *, int));
extern cpp_hashnode *cpp_lookup PARAMS ((cpp_reader *,
- const unsigned char *, int));
+ const unsigned char *, size_t));
+extern void cpp_forall_identifiers PARAMS ((cpp_reader *,
+ int (*) PARAMS ((cpp_reader *,
+ cpp_hashnode *,
+ void *)),
+ void *));
+
+/* In cppmacro.c */
+extern void cpp_scan_buffer_nooutput PARAMS ((cpp_reader *, int));
+extern void cpp_start_lookahead PARAMS ((cpp_reader *));
+extern void cpp_stop_lookahead PARAMS ((cpp_reader *, int));
/* In cppfiles.c */
-extern int cpp_included PARAMS ((cpp_reader *, const char *));
-extern int cpp_read_file PARAMS ((cpp_reader *, const char *));
-extern void cpp_make_system_header PARAMS ((cpp_reader *,
- cpp_buffer *, int));
+extern int cpp_included PARAMS ((cpp_reader *, const char *));
+extern void cpp_make_system_header PARAMS ((cpp_reader *, int, int));
#ifdef __cplusplus
}