2c6e3f5540
* charset.c (cpp_init_iconv): Initialize utf8_cset_desc. (_cpp_destroy_iconv): Destroy utf8_cset_desc, char16_cset_desc and char32_cset_desc. (converter_for_type): Handle CPP_UTF8STRING. (cpp_interpret_string): Handle CPP_UTF8STRING and raw-strings. * directives.c (get__Pragma_string): Handle CPP_UTF8STRING. (parse_include): Reject raw strings. * include/cpplib.h (CPP_UTF8STRING): New token type. * internal.h (struct cpp_reader): Add utf8_cset_desc field. * lex.c (lex_raw_string): New function. (lex_string): Handle u8 string literals, call lex_raw_string for raw string literals. (_cpp_lex_direct): Call lex_string even for u8" and {,u,U,L,u8}R" sequences. * macro.c (stringify_arg): Handle CPP_UTF8STRING. * c-common.c (c_parse_error): Handle CPP_UTF8STRING. * c-lex.c (c_lex_with_flags): Likewise. Test C_LEX_STRING_NO_JOIN instead of C_LEX_RAW_STRINGS. (lex_string): Handle CPP_UTF8STRING. * c-parser.c (c_parser_postfix_expression): Likewise. * c-pragma.h (C_LEX_RAW_STRINGS): Rename to ... (C_LEX_STRING_NO_JOIN): ... this. * parser.c (cp_lexer_print_token, cp_parser_is_string_literal, cp_parser_string_literal, cp_parser_primary_expression): Likewise. (cp_lexer_get_preprocessor_token): Use C_LEX_STRING_JOIN instead of C_LEX_RAW_STRINGS. * gcc.dg/raw-string-1.c: New test. * gcc.dg/raw-string-2.c: New test. * gcc.dg/raw-string-3.c: New test. * gcc.dg/raw-string-4.c: New test. * gcc.dg/raw-string-5.c: New test. * gcc.dg/raw-string-6.c: New test. * gcc.dg/raw-string-7.c: New test. * gcc.dg/utf8-1.c: New test. * gcc.dg/utf8-2.c: New test. * gcc.dg/utf-badconcat2.c: New test. * gcc.dg/utf-dflt2.c: New test. * gcc.dg/cpp/include6.c: New test. * g++.dg/ext/raw-string-1.C: New test. * g++.dg/ext/raw-string-2.C: New test. * g++.dg/ext/raw-string-3.C: New test. * g++.dg/ext/raw-string-4.C: New test. * g++.dg/ext/raw-string-5.C: New test. * g++.dg/ext/raw-string-6.C: New test. * g++.dg/ext/raw-string-7.C: New test. * g++.dg/ext/utf8-1.C: New test. * g++.dg/ext/utf8-2.C: New test. * g++.dg/ext/utf-badconcat2.C: New test. * g++.dg/ext/utf-dflt2.C: New test. From-SVN: r152995
944 lines
34 KiB
C++
944 lines
34 KiB
C++
/* Definitions for CPP library.
|
|
Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003,
|
|
2004, 2005, 2007, 2008, 2009
|
|
Free Software Foundation, Inc.
|
|
Written by Per Bothner, 1994-95.
|
|
|
|
This program is free software; you can redistribute it and/or modify it
|
|
under the terms of the GNU General Public License as published by the
|
|
Free Software Foundation; either version 3, or (at your option) any
|
|
later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; see the file COPYING3. If not see
|
|
<http://www.gnu.org/licenses/>.
|
|
|
|
In other words, you are welcome to use, share and improve this program.
|
|
You are forbidden to forbid anyone else to use, share and improve
|
|
what you give them. Help stamp out software-hoarding! */
|
|
#ifndef LIBCPP_CPPLIB_H
|
|
#define LIBCPP_CPPLIB_H
|
|
|
|
#include <sys/types.h>
|
|
#include "symtab.h"
|
|
#include "line-map.h"
|
|
|
|
typedef struct cpp_reader cpp_reader;
|
|
typedef struct cpp_buffer cpp_buffer;
|
|
typedef struct cpp_options cpp_options;
|
|
typedef struct cpp_token cpp_token;
|
|
typedef struct cpp_string cpp_string;
|
|
typedef struct cpp_hashnode cpp_hashnode;
|
|
typedef struct cpp_macro cpp_macro;
|
|
typedef struct cpp_callbacks cpp_callbacks;
|
|
typedef struct cpp_dir cpp_dir;
|
|
|
|
struct answer;
|
|
struct _cpp_file;
|
|
|
|
/* The first three groups, apart from '=', can appear in preprocessor
|
|
expressions (+= and -= are used to indicate unary + and - resp.).
|
|
This allows a lookup table to be implemented in _cpp_parse_expr.
|
|
|
|
The first group, to CPP_LAST_EQ, can be immediately followed by an
|
|
'='. The lexer needs operators ending in '=', like ">>=", to be in
|
|
the same order as their counterparts without the '=', like ">>".
|
|
|
|
See the cpp_operator table optab in expr.c if you change the order or
|
|
add or remove anything in the first group. */
|
|
|
|
#define TTYPE_TABLE \
|
|
OP(EQ, "=") \
|
|
OP(NOT, "!") \
|
|
OP(GREATER, ">") /* compare */ \
|
|
OP(LESS, "<") \
|
|
OP(PLUS, "+") /* math */ \
|
|
OP(MINUS, "-") \
|
|
OP(MULT, "*") \
|
|
OP(DIV, "/") \
|
|
OP(MOD, "%") \
|
|
OP(AND, "&") /* bit ops */ \
|
|
OP(OR, "|") \
|
|
OP(XOR, "^") \
|
|
OP(RSHIFT, ">>") \
|
|
OP(LSHIFT, "<<") \
|
|
\
|
|
OP(COMPL, "~") \
|
|
OP(AND_AND, "&&") /* logical */ \
|
|
OP(OR_OR, "||") \
|
|
OP(QUERY, "?") \
|
|
OP(COLON, ":") \
|
|
OP(COMMA, ",") /* grouping */ \
|
|
OP(OPEN_PAREN, "(") \
|
|
OP(CLOSE_PAREN, ")") \
|
|
TK(EOF, NONE) \
|
|
OP(EQ_EQ, "==") /* compare */ \
|
|
OP(NOT_EQ, "!=") \
|
|
OP(GREATER_EQ, ">=") \
|
|
OP(LESS_EQ, "<=") \
|
|
\
|
|
/* These two are unary + / - in preprocessor expressions. */ \
|
|
OP(PLUS_EQ, "+=") /* math */ \
|
|
OP(MINUS_EQ, "-=") \
|
|
\
|
|
OP(MULT_EQ, "*=") \
|
|
OP(DIV_EQ, "/=") \
|
|
OP(MOD_EQ, "%=") \
|
|
OP(AND_EQ, "&=") /* bit ops */ \
|
|
OP(OR_EQ, "|=") \
|
|
OP(XOR_EQ, "^=") \
|
|
OP(RSHIFT_EQ, ">>=") \
|
|
OP(LSHIFT_EQ, "<<=") \
|
|
/* Digraphs together, beginning with CPP_FIRST_DIGRAPH. */ \
|
|
OP(HASH, "#") /* digraphs */ \
|
|
OP(PASTE, "##") \
|
|
OP(OPEN_SQUARE, "[") \
|
|
OP(CLOSE_SQUARE, "]") \
|
|
OP(OPEN_BRACE, "{") \
|
|
OP(CLOSE_BRACE, "}") \
|
|
/* The remainder of the punctuation. Order is not significant. */ \
|
|
OP(SEMICOLON, ";") /* structure */ \
|
|
OP(ELLIPSIS, "...") \
|
|
OP(PLUS_PLUS, "++") /* increment */ \
|
|
OP(MINUS_MINUS, "--") \
|
|
OP(DEREF, "->") /* accessors */ \
|
|
OP(DOT, ".") \
|
|
OP(SCOPE, "::") \
|
|
OP(DEREF_STAR, "->*") \
|
|
OP(DOT_STAR, ".*") \
|
|
OP(ATSIGN, "@") /* used in Objective-C */ \
|
|
\
|
|
TK(NAME, IDENT) /* word */ \
|
|
TK(AT_NAME, IDENT) /* @word - Objective-C */ \
|
|
TK(NUMBER, LITERAL) /* 34_be+ta */ \
|
|
\
|
|
TK(CHAR, LITERAL) /* 'char' */ \
|
|
TK(WCHAR, LITERAL) /* L'char' */ \
|
|
TK(CHAR16, LITERAL) /* u'char' */ \
|
|
TK(CHAR32, LITERAL) /* U'char' */ \
|
|
TK(OTHER, LITERAL) /* stray punctuation */ \
|
|
\
|
|
TK(STRING, LITERAL) /* "string" */ \
|
|
TK(WSTRING, LITERAL) /* L"string" */ \
|
|
TK(STRING16, LITERAL) /* u"string" */ \
|
|
TK(STRING32, LITERAL) /* U"string" */ \
|
|
TK(UTF8STRING, LITERAL) /* u8"string" */ \
|
|
TK(OBJC_STRING, LITERAL) /* @"string" - Objective-C */ \
|
|
TK(HEADER_NAME, LITERAL) /* <stdio.h> in #include */ \
|
|
\
|
|
TK(COMMENT, LITERAL) /* Only if output comments. */ \
|
|
/* SPELL_LITERAL happens to DTRT. */ \
|
|
TK(MACRO_ARG, NONE) /* Macro argument. */ \
|
|
TK(PRAGMA, NONE) /* Only for deferred pragmas. */ \
|
|
TK(PRAGMA_EOL, NONE) /* End-of-line for deferred pragmas. */ \
|
|
TK(PADDING, NONE) /* Whitespace for -E. */
|
|
|
|
#define OP(e, s) CPP_ ## e,
|
|
#define TK(e, s) CPP_ ## e,
|
|
enum cpp_ttype
|
|
{
|
|
TTYPE_TABLE
|
|
N_TTYPES,
|
|
|
|
/* Positions in the table. */
|
|
CPP_LAST_EQ = CPP_LSHIFT,
|
|
CPP_FIRST_DIGRAPH = CPP_HASH,
|
|
CPP_LAST_PUNCTUATOR= CPP_ATSIGN,
|
|
CPP_LAST_CPP_OP = CPP_LESS_EQ
|
|
};
|
|
#undef OP
|
|
#undef TK
|
|
|
|
/* C language kind, used when calling cpp_create_reader. */
|
|
enum c_lang {CLK_GNUC89 = 0, CLK_GNUC99, CLK_STDC89, CLK_STDC94, CLK_STDC99,
|
|
CLK_GNUCXX, CLK_CXX98, CLK_GNUCXX0X, CLK_CXX0X, CLK_ASM};
|
|
|
|
/* Payload of a NUMBER, STRING, CHAR or COMMENT token. */
|
|
struct GTY(()) cpp_string {
|
|
unsigned int len;
|
|
const unsigned char *text;
|
|
};
|
|
|
|
/* Flags for the cpp_token structure. */
|
|
#define PREV_WHITE (1 << 0) /* If whitespace before this token. */
|
|
#define DIGRAPH (1 << 1) /* If it was a digraph. */
|
|
#define STRINGIFY_ARG (1 << 2) /* If macro argument to be stringified. */
|
|
#define PASTE_LEFT (1 << 3) /* If on LHS of a ## operator. */
|
|
#define NAMED_OP (1 << 4) /* C++ named operators. */
|
|
#define NO_EXPAND (1 << 5) /* Do not macro-expand this token. */
|
|
#define BOL (1 << 6) /* Token at beginning of line. */
|
|
#define PURE_ZERO (1 << 7) /* Single 0 digit, used by the C++ frontend,
|
|
set in c-lex.c. */
|
|
#define SP_DIGRAPH (1 << 8) /* # or ## token was a digraph. */
|
|
#define SP_PREV_WHITE (1 << 9) /* If whitespace before a ##
|
|
operator, or before this token
|
|
after a # operator. */
|
|
|
|
/* Specify which field, if any, of the cpp_token union is used. */
|
|
|
|
enum cpp_token_fld_kind {
|
|
CPP_TOKEN_FLD_NODE,
|
|
CPP_TOKEN_FLD_SOURCE,
|
|
CPP_TOKEN_FLD_STR,
|
|
CPP_TOKEN_FLD_ARG_NO,
|
|
CPP_TOKEN_FLD_TOKEN_NO,
|
|
CPP_TOKEN_FLD_PRAGMA,
|
|
CPP_TOKEN_FLD_NONE
|
|
};
|
|
|
|
/* A macro argument in the cpp_token union. */
|
|
struct GTY(()) cpp_macro_arg {
|
|
/* Argument number. */
|
|
unsigned int arg_no;
|
|
};
|
|
|
|
/* An identifier in the cpp_token union. */
|
|
struct GTY(()) cpp_identifier {
|
|
/* The canonical (UTF-8) spelling of the identifier. */
|
|
cpp_hashnode *
|
|
GTY ((nested_ptr (union tree_node,
|
|
"%h ? CPP_HASHNODE (GCC_IDENT_TO_HT_IDENT (%h)) : NULL",
|
|
"%h ? HT_IDENT_TO_GCC_IDENT (HT_NODE (%h)) : NULL")))
|
|
node;
|
|
};
|
|
|
|
/* A preprocessing token. This has been carefully packed and should
|
|
occupy 16 bytes on 32-bit hosts and 24 bytes on 64-bit hosts. */
|
|
struct GTY(()) cpp_token {
|
|
source_location src_loc; /* Location of first char of token. */
|
|
ENUM_BITFIELD(cpp_ttype) type : CHAR_BIT; /* token type */
|
|
unsigned short flags; /* flags - see above */
|
|
|
|
union cpp_token_u
|
|
{
|
|
/* An identifier. */
|
|
struct cpp_identifier GTY ((tag ("CPP_TOKEN_FLD_NODE"))) node;
|
|
|
|
/* Inherit padding from this token. */
|
|
cpp_token * GTY ((tag ("CPP_TOKEN_FLD_SOURCE"))) source;
|
|
|
|
/* A string, or number. */
|
|
struct cpp_string GTY ((tag ("CPP_TOKEN_FLD_STR"))) str;
|
|
|
|
/* Argument no. for a CPP_MACRO_ARG. */
|
|
struct cpp_macro_arg GTY ((tag ("CPP_TOKEN_FLD_ARG_NO"))) macro_arg;
|
|
|
|
/* Original token no. for a CPP_PASTE (from a sequence of
|
|
consecutive paste tokens in a macro expansion). */
|
|
unsigned int GTY ((tag ("CPP_TOKEN_FLD_TOKEN_NO"))) token_no;
|
|
|
|
/* Caller-supplied identifier for a CPP_PRAGMA. */
|
|
unsigned int GTY ((tag ("CPP_TOKEN_FLD_PRAGMA"))) pragma;
|
|
} GTY ((desc ("cpp_token_val_index (&%1)"))) val;
|
|
};
|
|
|
|
/* Say which field is in use. */
|
|
extern enum cpp_token_fld_kind cpp_token_val_index (cpp_token *tok);
|
|
|
|
/* A type wide enough to hold any multibyte source character.
|
|
cpplib's character constant interpreter requires an unsigned type.
|
|
Also, a typedef for the signed equivalent.
|
|
The width of this type is capped at 32 bits; there do exist targets
|
|
where wchar_t is 64 bits, but only in a non-default mode, and there
|
|
would be no meaningful interpretation for a wchar_t value greater
|
|
than 2^32 anyway -- the widest wide-character encoding around is
|
|
ISO 10646, which stops at 2^31. */
|
|
#if CHAR_BIT * SIZEOF_INT >= 32
|
|
# define CPPCHAR_SIGNED_T int
|
|
#elif CHAR_BIT * SIZEOF_LONG >= 32
|
|
# define CPPCHAR_SIGNED_T long
|
|
#else
|
|
# error "Cannot find a least-32-bit signed integer type"
|
|
#endif
|
|
typedef unsigned CPPCHAR_SIGNED_T cppchar_t;
|
|
typedef CPPCHAR_SIGNED_T cppchar_signed_t;
|
|
|
|
/* Style of header dependencies to generate. */
|
|
enum cpp_deps_style { DEPS_NONE = 0, DEPS_USER, DEPS_SYSTEM };
|
|
|
|
/* The possible normalization levels, from most restrictive to least. */
|
|
enum cpp_normalize_level {
|
|
/* In NFKC. */
|
|
normalized_KC = 0,
|
|
/* In NFC. */
|
|
normalized_C,
|
|
/* In NFC, except for subsequences where being in NFC would make
|
|
the identifier invalid. */
|
|
normalized_identifier_C,
|
|
/* Not normalized at all. */
|
|
normalized_none
|
|
};
|
|
|
|
/* This structure is nested inside struct cpp_reader, and
|
|
carries all the options visible to the command line. */
|
|
struct cpp_options
|
|
{
|
|
/* Characters between tab stops. */
|
|
unsigned int tabstop;
|
|
|
|
/* The language we're preprocessing. */
|
|
enum c_lang lang;
|
|
|
|
/* Nonzero means use extra default include directories for C++. */
|
|
unsigned char cplusplus;
|
|
|
|
/* Nonzero means handle cplusplus style comments. */
|
|
unsigned char cplusplus_comments;
|
|
|
|
/* Nonzero means define __OBJC__, treat @ as a special token, use
|
|
the OBJC[PLUS]_INCLUDE_PATH environment variable, and allow
|
|
"#import". */
|
|
unsigned char objc;
|
|
|
|
/* Nonzero means don't copy comments into the output file. */
|
|
unsigned char discard_comments;
|
|
|
|
/* Nonzero means don't copy comments into the output file during
|
|
macro expansion. */
|
|
unsigned char discard_comments_in_macro_exp;
|
|
|
|
/* Nonzero means process the ISO trigraph sequences. */
|
|
unsigned char trigraphs;
|
|
|
|
/* Nonzero means process the ISO digraph sequences. */
|
|
unsigned char digraphs;
|
|
|
|
/* Nonzero means to allow hexadecimal floats and LL suffixes. */
|
|
unsigned char extended_numbers;
|
|
|
|
/* Nonzero means process u/U prefix literals (UTF-16/32). */
|
|
unsigned char uliterals;
|
|
|
|
/* Nonzero means print names of header files (-H). */
|
|
unsigned char print_include_names;
|
|
|
|
/* Nonzero means complain about deprecated features. */
|
|
unsigned char warn_deprecated;
|
|
|
|
/* Nonzero means warn if slash-star appears in a comment. */
|
|
unsigned char warn_comments;
|
|
|
|
/* Nonzero means warn if a user-supplied include directory does not
|
|
exist. */
|
|
unsigned char warn_missing_include_dirs;
|
|
|
|
/* Nonzero means warn if there are any trigraphs. */
|
|
unsigned char warn_trigraphs;
|
|
|
|
/* Nonzero means warn about multicharacter charconsts. */
|
|
unsigned char warn_multichar;
|
|
|
|
/* Nonzero means warn about various incompatibilities with
|
|
traditional C. */
|
|
unsigned char warn_traditional;
|
|
|
|
/* Nonzero means warn about long long numeric constants. */
|
|
unsigned char warn_long_long;
|
|
|
|
/* Nonzero means warn about text after an #endif (or #else). */
|
|
unsigned char warn_endif_labels;
|
|
|
|
/* Nonzero means warn about implicit sign changes owing to integer
|
|
promotions. */
|
|
unsigned char warn_num_sign_change;
|
|
|
|
/* Zero means don't warn about __VA_ARGS__ usage in c89 pedantic mode.
|
|
Presumably the usage is protected by the appropriate #ifdef. */
|
|
unsigned char warn_variadic_macros;
|
|
|
|
/* Nonzero means warn about builtin macros that are redefined or
|
|
explicitly undefined. */
|
|
unsigned char warn_builtin_macro_redefined;
|
|
|
|
/* Nonzero means we should look for header.gcc files that remap file
|
|
names. */
|
|
unsigned char remap;
|
|
|
|
/* Zero means dollar signs are punctuation. */
|
|
unsigned char dollars_in_ident;
|
|
|
|
/* Nonzero means UCNs are accepted in identifiers. */
|
|
unsigned char extended_identifiers;
|
|
|
|
/* True if we should warn about dollars in identifiers or numbers
|
|
for this translation unit. */
|
|
unsigned char warn_dollars;
|
|
|
|
/* Nonzero means warn if undefined identifiers are evaluated in an #if. */
|
|
unsigned char warn_undef;
|
|
|
|
/* Nonzero means warn of unused macros from the main file. */
|
|
unsigned char warn_unused_macros;
|
|
|
|
/* Nonzero for the 1999 C Standard, including corrigenda and amendments. */
|
|
unsigned char c99;
|
|
|
|
/* Nonzero if we are conforming to a specific C or C++ standard. */
|
|
unsigned char std;
|
|
|
|
/* Nonzero means give all the error messages the ANSI standard requires. */
|
|
unsigned char pedantic;
|
|
|
|
/* Nonzero means we're looking at already preprocessed code, so don't
|
|
bother trying to do macro expansion and whatnot. */
|
|
unsigned char preprocessed;
|
|
|
|
/* Print column number in error messages. */
|
|
unsigned char show_column;
|
|
|
|
/* Nonzero means handle C++ alternate operator names. */
|
|
unsigned char operator_names;
|
|
|
|
/* Nonzero means warn about use of C++ alternate operator names. */
|
|
unsigned char warn_cxx_operator_names;
|
|
|
|
/* True for traditional preprocessing. */
|
|
unsigned char traditional;
|
|
|
|
/* Holds the name of the target (execution) character set. */
|
|
const char *narrow_charset;
|
|
|
|
/* Holds the name of the target wide character set. */
|
|
const char *wide_charset;
|
|
|
|
/* Holds the name of the input character set. */
|
|
const char *input_charset;
|
|
|
|
/* The minimum permitted level of normalization before a warning
|
|
is generated. */
|
|
enum cpp_normalize_level warn_normalize;
|
|
|
|
/* True to warn about precompiled header files we couldn't use. */
|
|
bool warn_invalid_pch;
|
|
|
|
/* True if dependencies should be restored from a precompiled header. */
|
|
bool restore_pch_deps;
|
|
|
|
/* Dependency generation. */
|
|
struct
|
|
{
|
|
/* Style of header dependencies to generate. */
|
|
enum cpp_deps_style style;
|
|
|
|
/* Assume missing files are generated files. */
|
|
bool missing_files;
|
|
|
|
/* Generate phony targets for each dependency apart from the first
|
|
one. */
|
|
bool phony_targets;
|
|
|
|
/* If true, no dependency is generated on the main file. */
|
|
bool ignore_main_file;
|
|
|
|
/* If true, intend to use the preprocessor output (e.g., for compilation)
|
|
in addition to the dependency info. */
|
|
bool need_preprocessor_output;
|
|
} deps;
|
|
|
|
/* Target-specific features set by the front end or client. */
|
|
|
|
/* Precision for target CPP arithmetic, target characters, target
|
|
ints and target wide characters, respectively. */
|
|
size_t precision, char_precision, int_precision, wchar_precision;
|
|
|
|
/* True means chars (wide chars) are unsigned. */
|
|
bool unsigned_char, unsigned_wchar;
|
|
|
|
/* True if the most significant byte in a word has the lowest
|
|
address in memory. */
|
|
bool bytes_big_endian;
|
|
|
|
/* Nonzero means __STDC__ should have the value 0 in system headers. */
|
|
unsigned char stdc_0_in_system_headers;
|
|
|
|
/* True disables tokenization outside of preprocessing directives. */
|
|
bool directives_only;
|
|
};
|
|
|
|
/* Callback for header lookup for HEADER, which is the name of a
|
|
source file. It is used as a method of last resort to find headers
|
|
that are not otherwise found during the normal include processing.
|
|
The return value is the malloced name of a header to try and open,
|
|
if any, or NULL otherwise. This callback is called only if the
|
|
header is otherwise unfound. */
|
|
typedef const char *(*missing_header_cb)(cpp_reader *, const char *header, cpp_dir **);
|
|
|
|
/* Call backs to cpplib client. */
|
|
struct cpp_callbacks
|
|
{
|
|
/* Called when a new line of preprocessed output is started. */
|
|
void (*line_change) (cpp_reader *, const cpp_token *, int);
|
|
|
|
/* Called when switching to/from a new file.
|
|
The line_map is for the new file. It is NULL if there is no new file.
|
|
(In C this happens when done with <built-in>+<command line> and also
|
|
when done with a main file.) This can be used for resource cleanup. */
|
|
void (*file_change) (cpp_reader *, const struct line_map *);
|
|
|
|
void (*dir_change) (cpp_reader *, const char *);
|
|
void (*include) (cpp_reader *, unsigned int, const unsigned char *,
|
|
const char *, int, const cpp_token **);
|
|
void (*define) (cpp_reader *, unsigned int, cpp_hashnode *);
|
|
void (*undef) (cpp_reader *, unsigned int, cpp_hashnode *);
|
|
void (*ident) (cpp_reader *, unsigned int, const cpp_string *);
|
|
void (*def_pragma) (cpp_reader *, unsigned int);
|
|
int (*valid_pch) (cpp_reader *, const char *, int);
|
|
void (*read_pch) (cpp_reader *, const char *, int, const char *);
|
|
missing_header_cb missing_header;
|
|
|
|
/* Context-sensitive macro support. Returns macro (if any) that should
|
|
be expanded. */
|
|
cpp_hashnode * (*macro_to_expand) (cpp_reader *, const cpp_token *);
|
|
|
|
/* Called to emit a diagnostic. This callback receives the
|
|
translated message. */
|
|
bool (*error) (cpp_reader *, int, source_location, unsigned int,
|
|
const char *, va_list *)
|
|
ATTRIBUTE_FPTR_PRINTF(5,0);
|
|
|
|
/* Callbacks for when a macro is expanded, or tested (whether
|
|
defined or not at the time) in #ifdef, #ifndef or "defined". */
|
|
void (*used_define) (cpp_reader *, unsigned int, cpp_hashnode *);
|
|
void (*used_undef) (cpp_reader *, unsigned int, cpp_hashnode *);
|
|
/* Called before #define and #undef or other macro definition
|
|
changes are processed. */
|
|
void (*before_define) (cpp_reader *);
|
|
};
|
|
|
|
#ifdef VMS
|
|
#define INO_T_CPP ino_t ino[3]
|
|
#else
|
|
#define INO_T_CPP ino_t ino
|
|
#endif
|
|
|
|
/* Chain of directories to look for include files in. */
|
|
struct cpp_dir
|
|
{
|
|
/* NULL-terminated singly-linked list. */
|
|
struct cpp_dir *next;
|
|
|
|
/* NAME of the directory, NUL-terminated. */
|
|
char *name;
|
|
unsigned int len;
|
|
|
|
/* One if a system header, two if a system header that has extern
|
|
"C" guards for C++. */
|
|
unsigned char sysp;
|
|
|
|
/* Is this a user-supplied directory? */
|
|
bool user_supplied_p;
|
|
|
|
/* The canonicalized NAME as determined by lrealpath. This field
|
|
is only used by hosts that lack reliable inode numbers. */
|
|
char *canonical_name;
|
|
|
|
/* Mapping of file names for this directory for MS-DOS and related
|
|
platforms. A NULL-terminated array of (from, to) pairs. */
|
|
const char **name_map;
|
|
|
|
/* Routine to construct pathname, given the search path name and the
|
|
HEADER we are trying to find, return a constructed pathname to
|
|
try and open. If this is NULL, the constructed pathname is as
|
|
constructed by append_file_to_dir. */
|
|
char *(*construct) (const char *header, cpp_dir *dir);
|
|
|
|
/* The C front end uses these to recognize duplicated
|
|
directories in the search path. */
|
|
INO_T_CPP;
|
|
dev_t dev;
|
|
};
|
|
|
|
/* The structure of a node in the hash table. The hash table has
|
|
entries for all identifiers: either macros defined by #define
|
|
commands (type NT_MACRO), assertions created with #assert
|
|
(NT_ASSERTION), or neither of the above (NT_VOID). Builtin macros
|
|
like __LINE__ are flagged NODE_BUILTIN. Poisoned identifiers are
|
|
flagged NODE_POISONED. NODE_OPERATOR (C++ only) indicates an
|
|
identifier that behaves like an operator such as "xor".
|
|
NODE_DIAGNOSTIC is for speed in lex_token: it indicates a
|
|
diagnostic may be required for this node. Currently this only
|
|
applies to __VA_ARGS__, poisoned identifiers, and -Wc++-compat
|
|
warnings about NODE_OPERATOR. */
|
|
|
|
/* Hash node flags. */
|
|
#define NODE_OPERATOR (1 << 0) /* C++ named operator. */
|
|
#define NODE_POISONED (1 << 1) /* Poisoned identifier. */
|
|
#define NODE_BUILTIN (1 << 2) /* Builtin macro. */
|
|
#define NODE_DIAGNOSTIC (1 << 3) /* Possible diagnostic when lexed. */
|
|
#define NODE_WARN (1 << 4) /* Warn if redefined or undefined. */
|
|
#define NODE_DISABLED (1 << 5) /* A disabled macro. */
|
|
#define NODE_MACRO_ARG (1 << 6) /* Used during #define processing. */
|
|
#define NODE_USED (1 << 7) /* Dumped with -dU. */
|
|
#define NODE_CONDITIONAL (1 << 8) /* Conditional macro */
|
|
#define NODE_WARN_OPERATOR (1 << 9) /* Warn about C++ named operator. */
|
|
|
|
/* Different flavors of hash node. */
|
|
enum node_type
|
|
{
|
|
NT_VOID = 0, /* No definition yet. */
|
|
NT_MACRO, /* A macro of some form. */
|
|
NT_ASSERTION /* Predicate for #assert. */
|
|
};
|
|
|
|
/* Different flavors of builtin macro. _Pragma is an operator, but we
|
|
handle it with the builtin code for efficiency reasons. */
|
|
enum cpp_builtin_type
|
|
{
|
|
BT_SPECLINE = 0, /* `__LINE__' */
|
|
BT_DATE, /* `__DATE__' */
|
|
BT_FILE, /* `__FILE__' */
|
|
BT_BASE_FILE, /* `__BASE_FILE__' */
|
|
BT_INCLUDE_LEVEL, /* `__INCLUDE_LEVEL__' */
|
|
BT_TIME, /* `__TIME__' */
|
|
BT_STDC, /* `__STDC__' */
|
|
BT_PRAGMA, /* `_Pragma' operator */
|
|
BT_TIMESTAMP, /* `__TIMESTAMP__' */
|
|
BT_COUNTER /* `__COUNTER__' */
|
|
};
|
|
|
|
#define CPP_HASHNODE(HNODE) ((cpp_hashnode *) (HNODE))
|
|
#define HT_NODE(NODE) ((ht_identifier *) (NODE))
|
|
#define NODE_LEN(NODE) HT_LEN (&(NODE)->ident)
|
|
#define NODE_NAME(NODE) HT_STR (&(NODE)->ident)
|
|
|
|
/* Specify which field, if any, of the union is used. */
|
|
|
|
enum {
|
|
NTV_MACRO,
|
|
NTV_ANSWER,
|
|
NTV_BUILTIN,
|
|
NTV_ARGUMENT,
|
|
NTV_NONE
|
|
};
|
|
|
|
#define CPP_HASHNODE_VALUE_IDX(HNODE) \
|
|
((HNODE.flags & NODE_MACRO_ARG) ? NTV_ARGUMENT \
|
|
: HNODE.type == NT_MACRO ? ((HNODE.flags & NODE_BUILTIN) \
|
|
? NTV_BUILTIN : NTV_MACRO) \
|
|
: HNODE.type == NT_ASSERTION ? NTV_ANSWER \
|
|
: NTV_NONE)
|
|
|
|
/* The common part of an identifier node shared amongst all 3 C front
|
|
ends. Also used to store CPP identifiers, which are a superset of
|
|
identifiers in the grammatical sense. */
|
|
|
|
union GTY(()) _cpp_hashnode_value {
|
|
/* If a macro. */
|
|
cpp_macro * GTY((tag ("NTV_MACRO"))) macro;
|
|
/* Answers to an assertion. */
|
|
struct answer * GTY ((tag ("NTV_ANSWER"))) answers;
|
|
/* Code for a builtin macro. */
|
|
enum cpp_builtin_type GTY ((tag ("NTV_BUILTIN"))) builtin;
|
|
/* Macro argument index. */
|
|
unsigned short GTY ((tag ("NTV_ARGUMENT"))) arg_index;
|
|
};
|
|
|
|
struct GTY(()) cpp_hashnode {
|
|
struct ht_identifier ident;
|
|
unsigned int is_directive : 1;
|
|
unsigned int directive_index : 7; /* If is_directive,
|
|
then index into directive table.
|
|
Otherwise, a NODE_OPERATOR. */
|
|
unsigned char rid_code; /* Rid code - for front ends. */
|
|
ENUM_BITFIELD(node_type) type : 6; /* CPP node type. */
|
|
unsigned int flags : 10; /* CPP flags. */
|
|
|
|
union _cpp_hashnode_value GTY ((desc ("CPP_HASHNODE_VALUE_IDX (%1)"))) value;
|
|
};
|
|
|
|
/* Call this first to get a handle to pass to other functions.
|
|
|
|
If you want cpplib to manage its own hashtable, pass in a NULL
|
|
pointer. Otherwise you should pass in an initialized hash table
|
|
that cpplib will share; this technique is used by the C front
|
|
ends. */
|
|
extern cpp_reader *cpp_create_reader (enum c_lang, struct ht *,
|
|
struct line_maps *);
|
|
|
|
/* Reset the cpp_reader's line_map. This is only used after reading a
|
|
PCH file. */
|
|
extern void cpp_set_line_map (cpp_reader *, struct line_maps *);
|
|
|
|
/* Call this to change the selected language standard (e.g. because of
|
|
command line options). */
|
|
extern void cpp_set_lang (cpp_reader *, enum c_lang);
|
|
|
|
/* Set the include paths. */
|
|
extern void cpp_set_include_chains (cpp_reader *, cpp_dir *, cpp_dir *, int);
|
|
|
|
/* Call these to get pointers to the options, callback, and deps
|
|
structures for a given reader. These pointers are good until you
|
|
call cpp_finish on that reader. You can either edit the callbacks
|
|
through the pointer returned from cpp_get_callbacks, or set them
|
|
with cpp_set_callbacks. */
|
|
extern cpp_options *cpp_get_options (cpp_reader *);
|
|
extern cpp_callbacks *cpp_get_callbacks (cpp_reader *);
|
|
extern void cpp_set_callbacks (cpp_reader *, cpp_callbacks *);
|
|
extern struct deps *cpp_get_deps (cpp_reader *);
|
|
|
|
/* This function reads the file, but does not start preprocessing. It
|
|
returns the name of the original file; this is the same as the
|
|
input file, except for preprocessed input. This will generate at
|
|
least one file change callback, and possibly a line change callback
|
|
too. If there was an error opening the file, it returns NULL. */
|
|
extern const char *cpp_read_main_file (cpp_reader *, const char *);
|
|
|
|
/* Set up built-ins with special behavior. Use cpp_init_builtins()
|
|
instead unless your know what you are doing. */
|
|
extern void cpp_init_special_builtins (cpp_reader *);
|
|
|
|
/* Set up built-ins like __FILE__. */
|
|
extern void cpp_init_builtins (cpp_reader *, int);
|
|
|
|
/* This is called after options have been parsed, and partially
|
|
processed. */
|
|
extern void cpp_post_options (cpp_reader *);
|
|
|
|
/* Set up translation to the target character set. */
|
|
extern void cpp_init_iconv (cpp_reader *);
|
|
|
|
/* Call this to finish preprocessing. If you requested dependency
|
|
generation, pass an open stream to write the information to,
|
|
otherwise NULL. It is your responsibility to close the stream. */
|
|
extern void cpp_finish (cpp_reader *, FILE *deps_stream);
|
|
|
|
/* Call this to release the handle at the end of preprocessing. Any
|
|
use of the handle after this function returns is invalid. */
|
|
extern void cpp_destroy (cpp_reader *);
|
|
|
|
extern unsigned int cpp_token_len (const cpp_token *);
|
|
extern unsigned char *cpp_token_as_text (cpp_reader *, const cpp_token *);
|
|
extern unsigned char *cpp_spell_token (cpp_reader *, const cpp_token *,
|
|
unsigned char *, bool);
|
|
extern void cpp_register_pragma (cpp_reader *, const char *, const char *,
|
|
void (*) (cpp_reader *), bool);
|
|
extern void cpp_register_deferred_pragma (cpp_reader *, const char *,
|
|
const char *, unsigned, bool, bool);
|
|
extern int cpp_avoid_paste (cpp_reader *, const cpp_token *,
|
|
const cpp_token *);
|
|
extern const cpp_token *cpp_get_token (cpp_reader *);
|
|
extern const cpp_token *cpp_get_token_with_location (cpp_reader *,
|
|
source_location *);
|
|
extern const unsigned char *cpp_macro_definition (cpp_reader *,
|
|
const cpp_hashnode *);
|
|
extern void _cpp_backup_tokens (cpp_reader *, unsigned int);
|
|
extern const cpp_token *cpp_peek_token (cpp_reader *, int);
|
|
|
|
/* Evaluate a CPP_*CHAR* token. */
|
|
extern cppchar_t cpp_interpret_charconst (cpp_reader *, const cpp_token *,
|
|
unsigned int *, int *);
|
|
/* Evaluate a vector of CPP_*STRING* tokens. */
|
|
extern bool cpp_interpret_string (cpp_reader *,
|
|
const cpp_string *, size_t,
|
|
cpp_string *, enum cpp_ttype);
|
|
extern bool cpp_interpret_string_notranslate (cpp_reader *,
|
|
const cpp_string *, size_t,
|
|
cpp_string *, enum cpp_ttype);
|
|
|
|
/* Convert a host character constant to the execution character set. */
|
|
extern cppchar_t cpp_host_to_exec_charset (cpp_reader *, cppchar_t);
|
|
|
|
/* Used to register macros and assertions, perhaps from the command line.
|
|
The text is the same as the command line argument. */
|
|
extern void cpp_define (cpp_reader *, const char *);
|
|
extern void cpp_define_formatted (cpp_reader *pfile,
|
|
const char *fmt, ...) ATTRIBUTE_PRINTF_2;
|
|
extern void cpp_assert (cpp_reader *, const char *);
|
|
extern void cpp_undef (cpp_reader *, const char *);
|
|
extern void cpp_unassert (cpp_reader *, const char *);
|
|
|
|
extern cpp_macro *cpp_push_definition (cpp_reader *, const char *);
|
|
extern void cpp_pop_definition (cpp_reader *, const char *, cpp_macro *);
|
|
|
|
/* Undefine all macros and assertions. */
|
|
extern void cpp_undef_all (cpp_reader *);
|
|
|
|
extern cpp_buffer *cpp_push_buffer (cpp_reader *, const unsigned char *,
|
|
size_t, int);
|
|
extern int cpp_defined (cpp_reader *, const unsigned char *, int);
|
|
|
|
/* A preprocessing number. Code assumes that any unused high bits of
|
|
the double integer are set to zero. */
|
|
typedef unsigned HOST_WIDE_INT cpp_num_part;
|
|
typedef struct cpp_num cpp_num;
|
|
struct cpp_num
|
|
{
|
|
cpp_num_part high;
|
|
cpp_num_part low;
|
|
bool unsignedp; /* True if value should be treated as unsigned. */
|
|
bool overflow; /* True if the most recent calculation overflowed. */
|
|
};
|
|
|
|
/* cpplib provides two interfaces for interpretation of preprocessing
|
|
numbers.
|
|
|
|
cpp_classify_number categorizes numeric constants according to
|
|
their field (integer, floating point, or invalid), radix (decimal,
|
|
octal, hexadecimal), and type suffixes. */
|
|
|
|
#define CPP_N_CATEGORY 0x000F
|
|
#define CPP_N_INVALID 0x0000
|
|
#define CPP_N_INTEGER 0x0001
|
|
#define CPP_N_FLOATING 0x0002
|
|
|
|
#define CPP_N_WIDTH 0x00F0
|
|
#define CPP_N_SMALL 0x0010 /* int, float, shrot _Fract/Accum */
|
|
#define CPP_N_MEDIUM 0x0020 /* long, double, long _Fract/_Accum. */
|
|
#define CPP_N_LARGE 0x0040 /* long long, long double,
|
|
long long _Fract/Accum. */
|
|
|
|
#define CPP_N_WIDTH_MD 0xF0000 /* machine defined. */
|
|
#define CPP_N_MD_W 0x10000
|
|
#define CPP_N_MD_Q 0x20000
|
|
|
|
#define CPP_N_RADIX 0x0F00
|
|
#define CPP_N_DECIMAL 0x0100
|
|
#define CPP_N_HEX 0x0200
|
|
#define CPP_N_OCTAL 0x0400
|
|
#define CPP_N_BINARY 0x0800
|
|
|
|
#define CPP_N_UNSIGNED 0x1000 /* Properties. */
|
|
#define CPP_N_IMAGINARY 0x2000
|
|
#define CPP_N_DFLOAT 0x4000
|
|
#define CPP_N_DEFAULT 0x8000
|
|
|
|
#define CPP_N_FRACT 0x100000 /* Fract types. */
|
|
#define CPP_N_ACCUM 0x200000 /* Accum types. */
|
|
|
|
/* Classify a CPP_NUMBER token. The return value is a combination of
|
|
the flags from the above sets. */
|
|
extern unsigned cpp_classify_number (cpp_reader *, const cpp_token *);
|
|
|
|
/* Evaluate a token classified as category CPP_N_INTEGER. */
|
|
extern cpp_num cpp_interpret_integer (cpp_reader *, const cpp_token *,
|
|
unsigned int type);
|
|
|
|
/* Sign extend a number, with PRECISION significant bits and all
|
|
others assumed clear, to fill out a cpp_num structure. */
|
|
cpp_num cpp_num_sign_extend (cpp_num, size_t);
|
|
|
|
/* Diagnostic levels. To get a diagnostic without associating a
|
|
position in the translation unit with it, use cpp_error_with_line
|
|
with a line number of zero. */
|
|
|
|
/* Warning, an error with -Werror. */
|
|
#define CPP_DL_WARNING 0x00
|
|
/* Same as CPP_DL_WARNING, except it is not suppressed in system headers. */
|
|
#define CPP_DL_WARNING_SYSHDR 0x01
|
|
/* Warning, an error with -pedantic-errors or -Werror. */
|
|
#define CPP_DL_PEDWARN 0x02
|
|
/* An error. */
|
|
#define CPP_DL_ERROR 0x03
|
|
/* An internal consistency check failed. Prints "internal error: ",
|
|
otherwise the same as CPP_DL_ERROR. */
|
|
#define CPP_DL_ICE 0x04
|
|
/* An informative note following a warning. */
|
|
#define CPP_DL_NOTE 0x05
|
|
/* A fatal error. */
|
|
#define CPP_DL_FATAL 0x06
|
|
|
|
/* Output a diagnostic of some kind. */
|
|
extern bool cpp_error (cpp_reader *, int, const char *msgid, ...)
|
|
ATTRIBUTE_PRINTF_3;
|
|
|
|
/* Output a diagnostic with "MSGID: " preceding the
|
|
error string of errno. No location is printed. */
|
|
extern bool cpp_errno (cpp_reader *, int, const char *msgid);
|
|
|
|
/* Same as cpp_error, except additionally specifies a position as a
|
|
(translation unit) physical line and physical column. If the line is
|
|
zero, then no location is printed. */
|
|
extern bool cpp_error_with_line (cpp_reader *, int, source_location, unsigned,
|
|
const char *msgid, ...) ATTRIBUTE_PRINTF_5;
|
|
|
|
/* In lex.c */
|
|
extern int cpp_ideq (const cpp_token *, const char *);
|
|
extern void cpp_output_line (cpp_reader *, FILE *);
|
|
extern unsigned char *cpp_output_line_to_string (cpp_reader *,
|
|
const unsigned char *);
|
|
extern void cpp_output_token (const cpp_token *, FILE *);
|
|
extern const char *cpp_type2name (enum cpp_ttype, unsigned char flags);
|
|
/* Returns the value of an escape sequence, truncated to the correct
|
|
target precision. PSTR points to the input pointer, which is just
|
|
after the backslash. LIMIT is how much text we have. WIDE is true
|
|
if the escape sequence is part of a wide character constant or
|
|
string literal. Handles all relevant diagnostics. */
|
|
extern cppchar_t cpp_parse_escape (cpp_reader *, const unsigned char ** pstr,
|
|
const unsigned char *limit, int wide);
|
|
|
|
/* Structure used to hold a comment block at a given location in the
|
|
source code. */
|
|
|
|
typedef struct
|
|
{
|
|
/* Text of the comment including the terminators. */
|
|
char *comment;
|
|
|
|
/* source location for the given comment. */
|
|
source_location sloc;
|
|
} cpp_comment;
|
|
|
|
/* Structure holding all comments for a given cpp_reader. */
|
|
|
|
typedef struct
|
|
{
|
|
/* table of comment entries. */
|
|
cpp_comment *entries;
|
|
|
|
/* number of actual entries entered in the table. */
|
|
int count;
|
|
|
|
/* number of entries allocated currently. */
|
|
int allocated;
|
|
} cpp_comment_table;
|
|
|
|
/* Returns the table of comments encountered by the preprocessor. This
|
|
table is only populated when pfile->state.save_comments is true. */
|
|
extern cpp_comment_table *cpp_get_comments (cpp_reader *);
|
|
|
|
/* In hash.c */
|
|
|
|
/* Lookup an identifier in the hashtable. Puts the identifier in the
|
|
table if it is not already there. */
|
|
extern cpp_hashnode *cpp_lookup (cpp_reader *, const unsigned char *,
|
|
unsigned int);
|
|
|
|
typedef int (*cpp_cb) (cpp_reader *, cpp_hashnode *, void *);
|
|
extern void cpp_forall_identifiers (cpp_reader *, cpp_cb, void *);
|
|
|
|
/* In macro.c */
|
|
extern void cpp_scan_nooutput (cpp_reader *);
|
|
extern int cpp_sys_macro_p (cpp_reader *);
|
|
extern unsigned char *cpp_quote_string (unsigned char *, const unsigned char *,
|
|
unsigned int);
|
|
|
|
/* In files.c */
|
|
extern bool cpp_included (cpp_reader *, const char *);
|
|
extern bool cpp_included_before (cpp_reader *, const char *, source_location);
|
|
extern void cpp_make_system_header (cpp_reader *, int, int);
|
|
extern bool cpp_push_include (cpp_reader *, const char *);
|
|
extern void cpp_change_file (cpp_reader *, enum lc_reason, const char *);
|
|
extern const char *cpp_get_path (struct _cpp_file *);
|
|
extern cpp_dir *cpp_get_dir (struct _cpp_file *);
|
|
extern cpp_buffer *cpp_get_buffer (cpp_reader *);
|
|
extern struct _cpp_file *cpp_get_file (cpp_buffer *);
|
|
extern cpp_buffer *cpp_get_prev (cpp_buffer *);
|
|
extern void cpp_clear_file_cache (cpp_reader *);
|
|
|
|
/* In pch.c */
|
|
struct save_macro_data;
|
|
extern int cpp_save_state (cpp_reader *, FILE *);
|
|
extern int cpp_write_pch_deps (cpp_reader *, FILE *);
|
|
extern int cpp_write_pch_state (cpp_reader *, FILE *);
|
|
extern int cpp_valid_state (cpp_reader *, const char *, int);
|
|
extern void cpp_prepare_state (cpp_reader *, struct save_macro_data **);
|
|
extern int cpp_read_state (cpp_reader *, const char *, FILE *,
|
|
struct save_macro_data *);
|
|
|
|
#endif /* ! LIBCPP_CPPLIB_H */
|