1 /* Definitions for CPP library. 2 Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 3 2004, 2005, 2007, 2008, 2009 4 Free Software Foundation, Inc. 5 Written by Per Bothner, 1994-95. 6 7 This program is free software; you can redistribute it and/or modify it 8 under the terms of the GNU General Public License as published by the 9 Free Software Foundation; either version 3, or (at your option) any 10 later version. 11 12 This program is distributed in the hope that it will be useful, 13 but WITHOUT ANY WARRANTY; without even the implied warranty of 14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 15 GNU General Public License for more details. 16 17 You should have received a copy of the GNU General Public License 18 along with this program; see the file COPYING3. If not see 19 <http://www.gnu.org/licenses/>. 20 21 In other words, you are welcome to use, share and improve this program. 22 You are forbidden to forbid anyone else to use, share and improve 23 what you give them. Help stamp out software-hoarding! */ 24 #ifndef LIBCPP_CPPLIB_H 25 #define LIBCPP_CPPLIB_H 26 27 #include <sys/types.h> 28 #include "symtab.h" 29 #include "line-map.h" 30 31 #ifdef __cplusplus 32 extern "C" { 33 #endif 34 35 typedef struct cpp_reader cpp_reader; 36 typedef struct cpp_buffer cpp_buffer; 37 typedef struct cpp_options cpp_options; 38 typedef struct cpp_token cpp_token; 39 typedef struct cpp_string cpp_string; 40 typedef struct cpp_hashnode cpp_hashnode; 41 typedef struct cpp_macro cpp_macro; 42 typedef struct cpp_callbacks cpp_callbacks; 43 typedef struct cpp_dir cpp_dir; 44 45 struct answer; 46 struct _cpp_file; 47 48 /* The first three groups, apart from '=', can appear in preprocessor 49 expressions (+= and -= are used to indicate unary + and - resp.). 50 This allows a lookup table to be implemented in _cpp_parse_expr. 51 52 The first group, to CPP_LAST_EQ, can be immediately followed by an 53 '='. The lexer needs operators ending in '=', like ">>=", to be in 54 the same order as their counterparts without the '=', like ">>". 55 56 See the cpp_operator table optab in expr.c if you change the order or 57 add or remove anything in the first group. */ 58 59 #define TTYPE_TABLE \ 60 OP(EQ, "=") \ 61 OP(NOT, "!") \ 62 OP(GREATER, ">") /* compare */ \ 63 OP(LESS, "<") \ 64 OP(PLUS, "+") /* math */ \ 65 OP(MINUS, "-") \ 66 OP(MULT, "*") \ 67 OP(DIV, "/") \ 68 OP(MOD, "%") \ 69 OP(AND, "&") /* bit ops */ \ 70 OP(OR, "|") \ 71 OP(XOR, "^") \ 72 OP(RSHIFT, ">>") \ 73 OP(LSHIFT, "<<") \ 74 \ 75 OP(COMPL, "~") \ 76 OP(AND_AND, "&&") /* logical */ \ 77 OP(OR_OR, "||") \ 78 OP(QUERY, "?") \ 79 OP(COLON, ":") \ 80 OP(COMMA, ",") /* grouping */ \ 81 OP(OPEN_PAREN, "(") \ 82 OP(CLOSE_PAREN, ")") \ 83 TK(EOF, NONE) \ 84 OP(EQ_EQ, "==") /* compare */ \ 85 OP(NOT_EQ, "!=") \ 86 OP(GREATER_EQ, ">=") \ 87 OP(LESS_EQ, "<=") \ 88 \ 89 /* These two are unary + / - in preprocessor expressions. */ \ 90 OP(PLUS_EQ, "+=") /* math */ \ 91 OP(MINUS_EQ, "-=") \ 92 \ 93 OP(MULT_EQ, "*=") \ 94 OP(DIV_EQ, "/=") \ 95 OP(MOD_EQ, "%=") \ 96 OP(AND_EQ, "&=") /* bit ops */ \ 97 OP(OR_EQ, "|=") \ 98 OP(XOR_EQ, "^=") \ 99 OP(RSHIFT_EQ, ">>=") \ 100 OP(LSHIFT_EQ, "<<=") \ 101 /* Digraphs together, beginning with CPP_FIRST_DIGRAPH. */ \ 102 OP(HASH, "#") /* digraphs */ \ 103 OP(PASTE, "##") \ 104 OP(OPEN_SQUARE, "[") \ 105 OP(CLOSE_SQUARE, "]") \ 106 OP(OPEN_BRACE, "{") \ 107 OP(CLOSE_BRACE, "}") \ 108 /* The remainder of the punctuation. Order is not significant. */ \ 109 OP(SEMICOLON, ";") /* structure */ \ 110 OP(ELLIPSIS, "...") \ 111 OP(PLUS_PLUS, "++") /* increment */ \ 112 OP(MINUS_MINUS, "--") \ 113 OP(DEREF, "->") /* accessors */ \ 114 OP(DOT, ".") \ 115 OP(SCOPE, "::") \ 116 OP(DEREF_STAR, "->*") \ 117 OP(DOT_STAR, ".*") \ 118 OP(ATSIGN, "@") /* used in Objective-C */ \ 119 \ 120 TK(NAME, IDENT) /* word */ \ 121 TK(AT_NAME, IDENT) /* @word - Objective-C */ \ 122 TK(NUMBER, LITERAL) /* 34_be+ta */ \ 123 \ 124 TK(CHAR, LITERAL) /* 'char' */ \ 125 TK(WCHAR, LITERAL) /* L'char' */ \ 126 TK(CHAR16, LITERAL) /* u'char' */ \ 127 TK(CHAR32, LITERAL) /* U'char' */ \ 128 TK(OTHER, LITERAL) /* stray punctuation */ \ 129 \ 130 TK(STRING, LITERAL) /* "string" */ \ 131 TK(WSTRING, LITERAL) /* L"string" */ \ 132 TK(STRING16, LITERAL) /* u"string" */ \ 133 TK(STRING32, LITERAL) /* U"string" */ \ 134 TK(OBJC_STRING, LITERAL) /* @"string" - Objective-C */ \ 135 TK(HEADER_NAME, LITERAL) /* <stdio.h> in #include */ \ 136 \ 137 TK(COMMENT, LITERAL) /* Only if output comments. */ \ 138 /* SPELL_LITERAL happens to DTRT. */ \ 139 TK(MACRO_ARG, NONE) /* Macro argument. */ \ 140 TK(PRAGMA, NONE) /* Only for deferred pragmas. */ \ 141 TK(PRAGMA_EOL, NONE) /* End-of-line for deferred pragmas. */ \ 142 TK(PADDING, NONE) /* Whitespace for -E. */ 143 144 #define OP(e, s) CPP_ ## e, 145 #define TK(e, s) CPP_ ## e, 146 enum cpp_ttype 147 { 148 TTYPE_TABLE 149 N_TTYPES, 150 151 /* Positions in the table. */ 152 CPP_LAST_EQ = CPP_LSHIFT, 153 CPP_FIRST_DIGRAPH = CPP_HASH, 154 CPP_LAST_PUNCTUATOR= CPP_ATSIGN, 155 CPP_LAST_CPP_OP = CPP_LESS_EQ 156 }; 157 #undef OP 158 #undef TK 159 160 /* C language kind, used when calling cpp_create_reader. */ 161 enum c_lang {CLK_GNUC89 = 0, CLK_GNUC99, CLK_STDC89, CLK_STDC94, CLK_STDC99, 162 CLK_GNUCXX, CLK_CXX98, CLK_GNUCXX0X, CLK_CXX0X, CLK_ASM}; 163 164 /* Payload of a NUMBER, STRING, CHAR or COMMENT token. */ 165 struct cpp_string GTY(()) 166 { 167 unsigned int len; 168 const unsigned char *text; 169 }; 170 171 /* Flags for the cpp_token structure. */ 172 #define PREV_WHITE (1 << 0) /* If whitespace before this token. */ 173 #define DIGRAPH (1 << 1) /* If it was a digraph. */ 174 #define STRINGIFY_ARG (1 << 2) /* If macro argument to be stringified. */ 175 #define PASTE_LEFT (1 << 3) /* If on LHS of a ## operator. */ 176 #define NAMED_OP (1 << 4) /* C++ named operators. */ 177 #define NO_EXPAND (1 << 5) /* Do not macro-expand this token. */ 178 #define BOL (1 << 6) /* Token at beginning of line. */ 179 #define PURE_ZERO (1 << 7) /* Single 0 digit, used by the C++ frontend, 180 set in c-lex.c. */ 181 182 /* Specify which field, if any, of the cpp_token union is used. */ 183 184 enum cpp_token_fld_kind { 185 CPP_TOKEN_FLD_NODE, 186 CPP_TOKEN_FLD_SOURCE, 187 CPP_TOKEN_FLD_STR, 188 CPP_TOKEN_FLD_ARG_NO, 189 CPP_TOKEN_FLD_PRAGMA, 190 CPP_TOKEN_FLD_NONE 191 }; 192 193 /* A preprocessing token. This has been carefully packed and should 194 occupy 16 bytes on 32-bit hosts and 24 bytes on 64-bit hosts. */ 195 struct cpp_token GTY(()) 196 { 197 source_location src_loc; /* Location of first char of token. */ 198 ENUM_BITFIELD(cpp_ttype) type : CHAR_BIT; /* token type */ 199 unsigned char flags; /* flags - see above */ 200 201 union cpp_token_u 202 { 203 /* An identifier. */ 204 cpp_hashnode * 205 GTY ((nested_ptr (union tree_node, 206 "%h ? CPP_HASHNODE (GCC_IDENT_TO_HT_IDENT (%h)) : NULL", 207 "%h ? HT_IDENT_TO_GCC_IDENT (HT_NODE (%h)) : NULL"), 208 tag ("CPP_TOKEN_FLD_NODE"))) 209 node; 210 211 /* Inherit padding from this token. */ 212 cpp_token * GTY ((tag ("CPP_TOKEN_FLD_SOURCE"))) source; 213 214 /* A string, or number. */ 215 struct cpp_string GTY ((tag ("CPP_TOKEN_FLD_STR"))) str; 216 217 /* Argument no. for a CPP_MACRO_ARG. */ 218 unsigned int GTY ((tag ("CPP_TOKEN_FLD_ARG_NO"))) arg_no; 219 220 /* Caller-supplied identifier for a CPP_PRAGMA. */ 221 unsigned int GTY ((tag ("CPP_TOKEN_FLD_PRAGMA"))) pragma; 222 } GTY ((desc ("cpp_token_val_index (&%1)"))) val; 223 }; 224 225 /* Say which field is in use. */ 226 extern enum cpp_token_fld_kind cpp_token_val_index (cpp_token *tok); 227 228 /* A type wide enough to hold any multibyte source character. 229 cpplib's character constant interpreter requires an unsigned type. 230 Also, a typedef for the signed equivalent. 231 The width of this type is capped at 32 bits; there do exist targets 232 where wchar_t is 64 bits, but only in a non-default mode, and there 233 would be no meaningful interpretation for a wchar_t value greater 234 than 2^32 anyway -- the widest wide-character encoding around is 235 ISO 10646, which stops at 2^31. */ 236 #if CHAR_BIT * SIZEOF_INT >= 32 237 # define CPPCHAR_SIGNED_T int 238 #elif CHAR_BIT * SIZEOF_LONG >= 32 239 # define CPPCHAR_SIGNED_T long 240 #else 241 # error "Cannot find a least-32-bit signed integer type" 242 #endif 243 typedef unsigned CPPCHAR_SIGNED_T cppchar_t; 244 typedef CPPCHAR_SIGNED_T cppchar_signed_t; 245 246 /* Style of header dependencies to generate. */ 247 enum cpp_deps_style { DEPS_NONE = 0, DEPS_USER, DEPS_SYSTEM }; 248 249 /* The possible normalization levels, from most restrictive to least. */ 250 enum cpp_normalize_level { 251 /* In NFKC. */ 252 normalized_KC = 0, 253 /* In NFC. */ 254 normalized_C, 255 /* In NFC, except for subsequences where being in NFC would make 256 the identifier invalid. */ 257 normalized_identifier_C, 258 /* Not normalized at all. */ 259 normalized_none 260 }; 261 262 /* This structure is nested inside struct cpp_reader, and 263 carries all the options visible to the command line. */ 264 struct cpp_options 265 { 266 /* Characters between tab stops. */ 267 unsigned int tabstop; 268 269 /* The language we're preprocessing. */ 270 enum c_lang lang; 271 272 /* Nonzero means use extra default include directories for C++. */ 273 unsigned char cplusplus; 274 275 /* Nonzero means handle cplusplus style comments. */ 276 unsigned char cplusplus_comments; 277 278 /* Nonzero means define __OBJC__, treat @ as a special token, use 279 the OBJC[PLUS]_INCLUDE_PATH environment variable, and allow 280 "#import". */ 281 unsigned char objc; 282 283 /* Nonzero means don't copy comments into the output file. */ 284 unsigned char discard_comments; 285 286 /* Nonzero means don't copy comments into the output file during 287 macro expansion. */ 288 unsigned char discard_comments_in_macro_exp; 289 290 /* Nonzero means process the ISO trigraph sequences. */ 291 unsigned char trigraphs; 292 293 /* Nonzero means process the ISO digraph sequences. */ 294 unsigned char digraphs; 295 296 /* Nonzero means to allow hexadecimal floats and LL suffixes. */ 297 unsigned char extended_numbers; 298 299 /* Nonzero means process u/U prefix literals (UTF-16/32). */ 300 unsigned char uliterals; 301 302 /* Nonzero means print names of header files (-H). */ 303 unsigned char print_include_names; 304 305 /* Nonzero means cpp_pedwarn causes a hard error. */ 306 unsigned char pedantic_errors; 307 308 /* Nonzero means don't print warning messages. */ 309 unsigned char inhibit_warnings; 310 311 /* Nonzero means complain about deprecated features. */ 312 unsigned char warn_deprecated; 313 314 /* Nonzero means don't suppress warnings from system headers. */ 315 unsigned char warn_system_headers; 316 317 /* Nonzero means don't print error messages. Has no option to 318 select it, but can be set by a user of cpplib (e.g. fix-header). */ 319 unsigned char inhibit_errors; 320 321 /* Nonzero means warn if slash-star appears in a comment. */ 322 unsigned char warn_comments; 323 324 /* Nonzero means warn if a user-supplied include directory does not 325 exist. */ 326 unsigned char warn_missing_include_dirs; 327 328 /* Nonzero means warn if there are any trigraphs. */ 329 unsigned char warn_trigraphs; 330 331 /* Nonzero means warn about multicharacter charconsts. */ 332 unsigned char warn_multichar; 333 334 /* Nonzero means warn about various incompatibilities with 335 traditional C. */ 336 unsigned char warn_traditional; 337 338 /* Nonzero means warn about long long numeric constants. */ 339 unsigned char warn_long_long; 340 341 /* Nonzero means warn about text after an #endif (or #else). */ 342 unsigned char warn_endif_labels; 343 344 /* Nonzero means warn about implicit sign changes owing to integer 345 promotions. */ 346 unsigned char warn_num_sign_change; 347 348 /* Zero means don't warn about __VA_ARGS__ usage in c89 pedantic mode. 349 Presumably the usage is protected by the appropriate #ifdef. */ 350 unsigned char warn_variadic_macros; 351 352 /* Nonzero means warn about builtin macros that are redefined or 353 explicitly undefined. */ 354 unsigned char warn_builtin_macro_redefined; 355 356 /* Nonzero means turn warnings into errors. */ 357 unsigned char warnings_are_errors; 358 359 /* Nonzero means we should look for header.gcc files that remap file 360 names. */ 361 unsigned char remap; 362 363 /* Zero means dollar signs are punctuation. */ 364 unsigned char dollars_in_ident; 365 366 /* Nonzero means UCNs are accepted in identifiers. */ 367 unsigned char extended_identifiers; 368 369 /* True if we should warn about dollars in identifiers or numbers 370 for this translation unit. */ 371 unsigned char warn_dollars; 372 373 /* Nonzero means warn if undefined identifiers are evaluated in an #if. */ 374 unsigned char warn_undef; 375 376 /* Nonzero means warn of unused macros from the main file. */ 377 unsigned char warn_unused_macros; 378 379 /* Nonzero for the 1999 C Standard, including corrigenda and amendments. */ 380 unsigned char c99; 381 382 /* Nonzero if we are conforming to a specific C or C++ standard. */ 383 unsigned char std; 384 385 /* Nonzero means give all the error messages the ANSI standard requires. */ 386 unsigned char pedantic; 387 388 /* Nonzero means we're looking at already preprocessed code, so don't 389 bother trying to do macro expansion and whatnot. */ 390 unsigned char preprocessed; 391 392 /* Print column number in error messages. */ 393 unsigned char show_column; 394 395 /* Nonzero means handle C++ alternate operator names. */ 396 unsigned char operator_names; 397 398 /* True for traditional preprocessing. */ 399 unsigned char traditional; 400 401 /* Holds the name of the target (execution) character set. */ 402 const char *narrow_charset; 403 404 /* Holds the name of the target wide character set. */ 405 const char *wide_charset; 406 407 /* Holds the name of the input character set. */ 408 const char *input_charset; 409 410 /* The minimum permitted level of normalization before a warning 411 is generated. */ 412 enum cpp_normalize_level warn_normalize; 413 414 /* True to warn about precompiled header files we couldn't use. */ 415 bool warn_invalid_pch; 416 417 /* True if dependencies should be restored from a precompiled header. */ 418 bool restore_pch_deps; 419 420 /* Dependency generation. */ 421 struct 422 { 423 /* Style of header dependencies to generate. */ 424 enum cpp_deps_style style; 425 426 /* Assume missing files are generated files. */ 427 bool missing_files; 428 429 /* Generate phony targets for each dependency apart from the first 430 one. */ 431 bool phony_targets; 432 433 /* If true, no dependency is generated on the main file. */ 434 bool ignore_main_file; 435 436 /* If true, intend to use the preprocessor output (e.g., for compilation) 437 in addition to the dependency info. */ 438 bool need_preprocessor_output; 439 } deps; 440 441 /* Target-specific features set by the front end or client. */ 442 443 /* Precision for target CPP arithmetic, target characters, target 444 ints and target wide characters, respectively. */ 445 size_t precision, char_precision, int_precision, wchar_precision; 446 447 /* True means chars (wide chars) are unsigned. */ 448 bool unsigned_char, unsigned_wchar; 449 450 /* True if the most significant byte in a word has the lowest 451 address in memory. */ 452 bool bytes_big_endian; 453 454 /* Nonzero means __STDC__ should have the value 0 in system headers. */ 455 unsigned char stdc_0_in_system_headers; 456 457 /* True means error callback should be used for diagnostics. */ 458 bool client_diagnostic; 459 460 /* True disables tokenization outside of preprocessing directives. */ 461 bool directives_only; 462 }; 463 464 /* Callback for header lookup for HEADER, which is the name of a 465 source file. It is used as a method of last resort to find headers 466 that are not otherwise found during the normal include processing. 467 The return value is the malloced name of a header to try and open, 468 if any, or NULL otherwise. This callback is called only if the 469 header is otherwise unfound. */ 470 typedef const char *(*missing_header_cb)(cpp_reader *, const char *header, cpp_dir **); 471 472 /* Call backs to cpplib client. */ 473 struct cpp_callbacks 474 { 475 /* Called when a new line of preprocessed output is started. */ 476 void (*line_change) (cpp_reader *, const cpp_token *, int); 477 478 /* Called when switching to/from a new file. 479 The line_map is for the new file. It is NULL if there is no new file. 480 (In C this happens when done with <built-in>+<command line> and also 481 when done with a main file.) This can be used for resource cleanup. */ 482 void (*file_change) (cpp_reader *, const struct line_map *); 483 484 void (*dir_change) (cpp_reader *, const char *); 485 void (*include) (cpp_reader *, unsigned int, const unsigned char *, 486 const char *, int, const cpp_token **); 487 void (*define) (cpp_reader *, unsigned int, cpp_hashnode *); 488 void (*undef) (cpp_reader *, unsigned int, cpp_hashnode *); 489 void (*ident) (cpp_reader *, unsigned int, const cpp_string *); 490 void (*def_pragma) (cpp_reader *, unsigned int); 491 int (*valid_pch) (cpp_reader *, const char *, int); 492 void (*read_pch) (cpp_reader *, const char *, int, const char *); 493 missing_header_cb missing_header; 494 495 /* Context-sensitive macro support. Returns macro (if any) that should 496 be expanded. */ 497 cpp_hashnode * (*macro_to_expand) (cpp_reader *, const cpp_token *); 498 499 /* Called to emit a diagnostic if client_diagnostic option is true. 500 This callback receives the translated message. */ 501 void (*error) (cpp_reader *, int, const char *, va_list *) 502 ATTRIBUTE_FPTR_PRINTF(3,0); 503 504 /* Callbacks for when a macro is expanded, or tested (whether 505 defined or not at the time) in #ifdef, #ifndef or "defined". */ 506 void (*used_define) (cpp_reader *, unsigned int, cpp_hashnode *); 507 void (*used_undef) (cpp_reader *, unsigned int, cpp_hashnode *); 508 /* Called before #define and #undef or other macro definition 509 changes are processed. */ 510 void (*before_define) (cpp_reader *); 511 }; 512 513 /* Chain of directories to look for include files in. */ 514 struct cpp_dir 515 { 516 /* NULL-terminated singly-linked list. */ 517 struct cpp_dir *next; 518 519 /* NAME of the directory, NUL-terminated. */ 520 char *name; 521 unsigned int len; 522 523 /* One if a system header, two if a system header that has extern 524 "C" guards for C++. */ 525 unsigned char sysp; 526 527 /* Is this a user-supplied directory? */ 528 bool user_supplied_p; 529 530 /* The canonicalized NAME as determined by lrealpath. This field 531 is only used by hosts that lack reliable inode numbers. */ 532 char *canonical_name; 533 534 /* Mapping of file names for this directory for MS-DOS and related 535 platforms. A NULL-terminated array of (from, to) pairs. */ 536 const char **name_map; 537 538 /* Routine to construct pathname, given the search path name and the 539 HEADER we are trying to find, return a constructed pathname to 540 try and open. If this is NULL, the constructed pathname is as 541 constructed by append_file_to_dir. */ 542 char *(*construct) (const char *header, cpp_dir *dir); 543 544 /* The C front end uses these to recognize duplicated 545 directories in the search path. */ 546 ino_t ino; 547 dev_t dev; 548 }; 549 550 /* Name under which this program was invoked. */ 551 extern const char *progname; 552 553 /* The structure of a node in the hash table. The hash table has 554 entries for all identifiers: either macros defined by #define 555 commands (type NT_MACRO), assertions created with #assert 556 (NT_ASSERTION), or neither of the above (NT_VOID). Builtin macros 557 like __LINE__ are flagged NODE_BUILTIN. Poisoned identifiers are 558 flagged NODE_POISONED. NODE_OPERATOR (C++ only) indicates an 559 identifier that behaves like an operator such as "xor". 560 NODE_DIAGNOSTIC is for speed in lex_token: it indicates a 561 diagnostic may be required for this node. Currently this only 562 applies to __VA_ARGS__ and poisoned identifiers. */ 563 564 /* Hash node flags. */ 565 #define NODE_OPERATOR (1 << 0) /* C++ named operator. */ 566 #define NODE_POISONED (1 << 1) /* Poisoned identifier. */ 567 #define NODE_BUILTIN (1 << 2) /* Builtin macro. */ 568 #define NODE_DIAGNOSTIC (1 << 3) /* Possible diagnostic when lexed. */ 569 #define NODE_WARN (1 << 4) /* Warn if redefined or undefined. */ 570 #define NODE_DISABLED (1 << 5) /* A disabled macro. */ 571 #define NODE_MACRO_ARG (1 << 6) /* Used during #define processing. */ 572 #define NODE_USED (1 << 7) /* Dumped with -dU. */ 573 #define NODE_CONDITIONAL (1 << 8) /* Conditional macro */ 574 575 /* Different flavors of hash node. */ 576 enum node_type 577 { 578 NT_VOID = 0, /* No definition yet. */ 579 NT_MACRO, /* A macro of some form. */ 580 NT_ASSERTION /* Predicate for #assert. */ 581 }; 582 583 /* Different flavors of builtin macro. _Pragma is an operator, but we 584 handle it with the builtin code for efficiency reasons. */ 585 enum builtin_type 586 { 587 BT_SPECLINE = 0, /* `__LINE__' */ 588 BT_DATE, /* `__DATE__' */ 589 BT_FILE, /* `__FILE__' */ 590 BT_BASE_FILE, /* `__BASE_FILE__' */ 591 BT_INCLUDE_LEVEL, /* `__INCLUDE_LEVEL__' */ 592 BT_TIME, /* `__TIME__' */ 593 BT_STDC, /* `__STDC__' */ 594 BT_PRAGMA, /* `_Pragma' operator */ 595 BT_TIMESTAMP, /* `__TIMESTAMP__' */ 596 BT_COUNTER /* `__COUNTER__' */ 597 }; 598 599 #define CPP_HASHNODE(HNODE) ((cpp_hashnode *) (HNODE)) 600 #define HT_NODE(NODE) ((ht_identifier *) (NODE)) 601 #define NODE_LEN(NODE) HT_LEN (&(NODE)->ident) 602 #define NODE_NAME(NODE) HT_STR (&(NODE)->ident) 603 604 /* Specify which field, if any, of the union is used. */ 605 606 enum { 607 NTV_MACRO, 608 NTV_ANSWER, 609 NTV_BUILTIN, 610 NTV_ARGUMENT, 611 NTV_NONE 612 }; 613 614 #define CPP_HASHNODE_VALUE_IDX(HNODE) \ 615 ((HNODE.flags & NODE_MACRO_ARG) ? NTV_ARGUMENT \ 616 : HNODE.type == NT_MACRO ? ((HNODE.flags & NODE_BUILTIN) \ 617 ? NTV_BUILTIN : NTV_MACRO) \ 618 : HNODE.type == NT_ASSERTION ? NTV_ANSWER \ 619 : NTV_NONE) 620 621 /* The common part of an identifier node shared amongst all 3 C front 622 ends. Also used to store CPP identifiers, which are a superset of 623 identifiers in the grammatical sense. */ 624 625 union _cpp_hashnode_value GTY(()) 626 { 627 /* If a macro. */ 628 cpp_macro * GTY((tag ("NTV_MACRO"))) macro; 629 /* Answers to an assertion. */ 630 struct answer * GTY ((tag ("NTV_ANSWER"))) answers; 631 /* Code for a builtin macro. */ 632 enum builtin_type GTY ((tag ("NTV_BUILTIN"))) builtin; 633 /* Macro argument index. */ 634 unsigned short GTY ((tag ("NTV_ARGUMENT"))) arg_index; 635 }; 636 637 struct cpp_hashnode GTY(()) 638 { 639 struct ht_identifier ident; 640 unsigned int is_directive : 1; 641 unsigned int directive_index : 7; /* If is_directive, 642 then index into directive table. 643 Otherwise, a NODE_OPERATOR. */ 644 unsigned char rid_code; /* Rid code - for front ends. */ 645 ENUM_BITFIELD(node_type) type : 7; /* CPP node type. */ 646 unsigned int flags : 9; /* CPP flags. */ 647 648 union _cpp_hashnode_value GTY ((desc ("CPP_HASHNODE_VALUE_IDX (%1)"))) value; 649 }; 650 651 /* Call this first to get a handle to pass to other functions. 652 653 If you want cpplib to manage its own hashtable, pass in a NULL 654 pointer. Otherwise you should pass in an initialized hash table 655 that cpplib will share; this technique is used by the C front 656 ends. */ 657 extern cpp_reader *cpp_create_reader (enum c_lang, struct ht *, 658 struct line_maps *); 659 660 /* Reset the cpp_reader's line_map. This is only used after reading a 661 PCH file. */ 662 extern void cpp_set_line_map (cpp_reader *, struct line_maps *); 663 664 /* Call this to change the selected language standard (e.g. because of 665 command line options). */ 666 extern void cpp_set_lang (cpp_reader *, enum c_lang); 667 668 /* Set the include paths. */ 669 extern void cpp_set_include_chains (cpp_reader *, cpp_dir *, cpp_dir *, int); 670 671 /* Call these to get pointers to the options, callback, and deps 672 structures for a given reader. These pointers are good until you 673 call cpp_finish on that reader. You can either edit the callbacks 674 through the pointer returned from cpp_get_callbacks, or set them 675 with cpp_set_callbacks. */ 676 extern cpp_options *cpp_get_options (cpp_reader *); 677 extern cpp_callbacks *cpp_get_callbacks (cpp_reader *); 678 extern void cpp_set_callbacks (cpp_reader *, cpp_callbacks *); 679 extern struct deps *cpp_get_deps (cpp_reader *); 680 681 /* This function reads the file, but does not start preprocessing. It 682 returns the name of the original file; this is the same as the 683 input file, except for preprocessed input. This will generate at 684 least one file change callback, and possibly a line change callback 685 too. If there was an error opening the file, it returns NULL. */ 686 extern const char *cpp_read_main_file (cpp_reader *, const char *); 687 688 /* Set up built-ins with special behavior. Use cpp_init_builtins() 689 instead unless your know what you are doing. */ 690 extern void cpp_init_special_builtins (cpp_reader *); 691 692 /* Set up built-ins like __FILE__. */ 693 extern void cpp_init_builtins (cpp_reader *, int); 694 695 /* This is called after options have been parsed, and partially 696 processed. */ 697 extern void cpp_post_options (cpp_reader *); 698 699 /* Set up translation to the target character set. */ 700 extern void cpp_init_iconv (cpp_reader *); 701 702 /* Call this to finish preprocessing. If you requested dependency 703 generation, pass an open stream to write the information to, 704 otherwise NULL. It is your responsibility to close the stream. 705 706 Returns cpp_errors (pfile). */ 707 extern int cpp_finish (cpp_reader *, FILE *deps_stream); 708 709 /* Call this to release the handle at the end of preprocessing. Any 710 use of the handle after this function returns is invalid. Returns 711 cpp_errors (pfile). */ 712 extern void cpp_destroy (cpp_reader *); 713 714 /* Error count. */ 715 extern unsigned int cpp_errors (cpp_reader *); 716 717 extern unsigned int cpp_token_len (const cpp_token *); 718 extern unsigned char *cpp_token_as_text (cpp_reader *, const cpp_token *); 719 extern unsigned char *cpp_spell_token (cpp_reader *, const cpp_token *, 720 unsigned char *, bool); 721 extern void cpp_register_pragma (cpp_reader *, const char *, const char *, 722 void (*) (cpp_reader *), bool); 723 extern void cpp_register_deferred_pragma (cpp_reader *, const char *, 724 const char *, unsigned, bool, bool); 725 extern int cpp_avoid_paste (cpp_reader *, const cpp_token *, 726 const cpp_token *); 727 extern const cpp_token *cpp_get_token (cpp_reader *); 728 extern const cpp_token *cpp_get_token_with_location (cpp_reader *, 729 source_location *); 730 extern const unsigned char *cpp_macro_definition (cpp_reader *, 731 const cpp_hashnode *); 732 extern void _cpp_backup_tokens (cpp_reader *, unsigned int); 733 extern const cpp_token *cpp_peek_token (cpp_reader *, int); 734 735 /* Evaluate a CPP_CHAR or CPP_WCHAR token. */ 736 extern cppchar_t cpp_interpret_charconst (cpp_reader *, const cpp_token *, 737 unsigned int *, int *); 738 /* Evaluate a vector of CPP_STRING or CPP_WSTRING tokens. */ 739 extern bool cpp_interpret_string (cpp_reader *, 740 const cpp_string *, size_t, 741 cpp_string *, enum cpp_ttype); 742 extern bool cpp_interpret_string_notranslate (cpp_reader *, 743 const cpp_string *, size_t, 744 cpp_string *, enum cpp_ttype); 745 746 /* Convert a host character constant to the execution character set. */ 747 extern cppchar_t cpp_host_to_exec_charset (cpp_reader *, cppchar_t); 748 749 /* Used to register macros and assertions, perhaps from the command line. 750 The text is the same as the command line argument. */ 751 extern void cpp_define (cpp_reader *, const char *); 752 extern void cpp_define_formatted (cpp_reader *pfile, 753 const char *fmt, ...) ATTRIBUTE_PRINTF_2; 754 extern void cpp_assert (cpp_reader *, const char *); 755 extern void cpp_undef (cpp_reader *, const char *); 756 extern void cpp_unassert (cpp_reader *, const char *); 757 758 extern cpp_macro *cpp_push_definition (cpp_reader *, const char *); 759 extern void cpp_pop_definition (cpp_reader *, const char *, cpp_macro *); 760 761 /* Undefine all macros and assertions. */ 762 extern void cpp_undef_all (cpp_reader *); 763 764 extern cpp_buffer *cpp_push_buffer (cpp_reader *, const unsigned char *, 765 size_t, int); 766 extern int cpp_defined (cpp_reader *, const unsigned char *, int); 767 768 /* A preprocessing number. Code assumes that any unused high bits of 769 the double integer are set to zero. */ 770 typedef unsigned HOST_WIDE_INT cpp_num_part; 771 typedef struct cpp_num cpp_num; 772 struct cpp_num 773 { 774 cpp_num_part high; 775 cpp_num_part low; 776 bool unsignedp; /* True if value should be treated as unsigned. */ 777 bool overflow; /* True if the most recent calculation overflowed. */ 778 }; 779 780 /* cpplib provides two interfaces for interpretation of preprocessing 781 numbers. 782 783 cpp_classify_number categorizes numeric constants according to 784 their field (integer, floating point, or invalid), radix (decimal, 785 octal, hexadecimal), and type suffixes. */ 786 787 #define CPP_N_CATEGORY 0x000F 788 #define CPP_N_INVALID 0x0000 789 #define CPP_N_INTEGER 0x0001 790 #define CPP_N_FLOATING 0x0002 791 792 #define CPP_N_WIDTH 0x00F0 793 #define CPP_N_SMALL 0x0010 /* int, float, shrot _Fract/Accum */ 794 #define CPP_N_MEDIUM 0x0020 /* long, double, long _Fract/_Accum. */ 795 #define CPP_N_LARGE 0x0040 /* long long, long double, 796 long long _Fract/Accum. */ 797 798 #define CPP_N_WIDTH_MD 0xF0000 /* machine defined. */ 799 #define CPP_N_MD_W 0x10000 800 #define CPP_N_MD_Q 0x20000 801 802 #define CPP_N_RADIX 0x0F00 803 #define CPP_N_DECIMAL 0x0100 804 #define CPP_N_HEX 0x0200 805 #define CPP_N_OCTAL 0x0400 806 #define CPP_N_BINARY 0x0800 807 808 #define CPP_N_UNSIGNED 0x1000 /* Properties. */ 809 #define CPP_N_IMAGINARY 0x2000 810 #define CPP_N_DFLOAT 0x4000 811 812 #define CPP_N_FRACT 0x100000 /* Fract types. */ 813 #define CPP_N_ACCUM 0x200000 /* Accum types. */ 814 815 /* Classify a CPP_NUMBER token. The return value is a combination of 816 the flags from the above sets. */ 817 extern unsigned cpp_classify_number (cpp_reader *, const cpp_token *); 818 819 /* Evaluate a token classified as category CPP_N_INTEGER. */ 820 extern cpp_num cpp_interpret_integer (cpp_reader *, const cpp_token *, 821 unsigned int type); 822 823 /* Sign extend a number, with PRECISION significant bits and all 824 others assumed clear, to fill out a cpp_num structure. */ 825 cpp_num cpp_num_sign_extend (cpp_num, size_t); 826 827 /* Diagnostic levels. To get a diagnostic without associating a 828 position in the translation unit with it, use cpp_error_with_line 829 with a line number of zero. */ 830 831 /* Warning, an error with -Werror. */ 832 #define CPP_DL_WARNING 0x00 833 /* Same as CPP_DL_WARNING, except it is not suppressed in system headers. */ 834 #define CPP_DL_WARNING_SYSHDR 0x01 835 /* Warning, an error with -pedantic-errors or -Werror. */ 836 #define CPP_DL_PEDWARN 0x02 837 /* An error. */ 838 #define CPP_DL_ERROR 0x03 839 /* An internal consistency check failed. Prints "internal error: ", 840 otherwise the same as CPP_DL_ERROR. */ 841 #define CPP_DL_ICE 0x04 842 /* Extracts a diagnostic level from an int. */ 843 #define CPP_DL_EXTRACT(l) (l & 0xf) 844 /* Nonzero if a diagnostic level is one of the warnings. */ 845 #define CPP_DL_WARNING_P(l) (CPP_DL_EXTRACT (l) >= CPP_DL_WARNING \ 846 && CPP_DL_EXTRACT (l) <= CPP_DL_PEDWARN) 847 848 /* Output a diagnostic of some kind. */ 849 extern void cpp_error (cpp_reader *, int, const char *msgid, ...) 850 ATTRIBUTE_PRINTF_3; 851 852 /* Output a diagnostic with "MSGID: " preceding the 853 error string of errno. No location is printed. */ 854 extern void cpp_errno (cpp_reader *, int, const char *msgid); 855 856 /* Same as cpp_error, except additionally specifies a position as a 857 (translation unit) physical line and physical column. If the line is 858 zero, then no location is printed. */ 859 extern void cpp_error_with_line (cpp_reader *, int, source_location, unsigned, 860 const char *msgid, ...) ATTRIBUTE_PRINTF_5; 861 862 /* In lex.c */ 863 extern int cpp_ideq (const cpp_token *, const char *); 864 extern void cpp_output_line (cpp_reader *, FILE *); 865 extern unsigned char *cpp_output_line_to_string (cpp_reader *, 866 const unsigned char *); 867 extern void cpp_output_token (const cpp_token *, FILE *); 868 extern const char *cpp_type2name (enum cpp_ttype); 869 /* Returns the value of an escape sequence, truncated to the correct 870 target precision. PSTR points to the input pointer, which is just 871 after the backslash. LIMIT is how much text we have. WIDE is true 872 if the escape sequence is part of a wide character constant or 873 string literal. Handles all relevant diagnostics. */ 874 extern cppchar_t cpp_parse_escape (cpp_reader *, const unsigned char ** pstr, 875 const unsigned char *limit, int wide); 876 877 /* Structure used to hold a comment block at a given location in the 878 source code. */ 879 880 typedef struct 881 { 882 /* Text of the comment including the terminators. */ 883 char *comment; 884 885 /* source location for the given comment. */ 886 source_location sloc; 887 } cpp_comment; 888 889 /* Structure holding all comments for a given cpp_reader. */ 890 891 typedef struct 892 { 893 /* table of comment entries. */ 894 cpp_comment *entries; 895 896 /* number of actual entries entered in the table. */ 897 int count; 898 899 /* number of entries allocated currently. */ 900 int allocated; 901 } cpp_comment_table; 902 903 /* Returns the table of comments encountered by the preprocessor. This 904 table is only populated when pfile->state.save_comments is true. */ 905 extern cpp_comment_table *cpp_get_comments (cpp_reader *); 906 907 /* In hash.c */ 908 909 /* Lookup an identifier in the hashtable. Puts the identifier in the 910 table if it is not already there. */ 911 extern cpp_hashnode *cpp_lookup (cpp_reader *, const unsigned char *, 912 unsigned int); 913 914 typedef int (*cpp_cb) (cpp_reader *, cpp_hashnode *, void *); 915 extern void cpp_forall_identifiers (cpp_reader *, cpp_cb, void *); 916 917 /* In macro.c */ 918 extern void cpp_scan_nooutput (cpp_reader *); 919 extern int cpp_sys_macro_p (cpp_reader *); 920 extern unsigned char *cpp_quote_string (unsigned char *, const unsigned char *, 921 unsigned int); 922 923 /* In files.c */ 924 extern bool cpp_included (cpp_reader *, const char *); 925 extern bool cpp_included_before (cpp_reader *, const char *, source_location); 926 extern void cpp_make_system_header (cpp_reader *, int, int); 927 extern bool cpp_push_include (cpp_reader *, const char *); 928 extern void cpp_change_file (cpp_reader *, enum lc_reason, const char *); 929 extern const char *cpp_get_path (struct _cpp_file *); 930 extern cpp_dir *cpp_get_dir (struct _cpp_file *); 931 extern cpp_buffer *cpp_get_buffer (cpp_reader *); 932 extern struct _cpp_file *cpp_get_file (cpp_buffer *); 933 extern cpp_buffer *cpp_get_prev (cpp_buffer *); 934 extern void cpp_clear_file_cache (cpp_reader *); 935 936 /* In pch.c */ 937 struct save_macro_data; 938 extern int cpp_save_state (cpp_reader *, FILE *); 939 extern int cpp_write_pch_deps (cpp_reader *, FILE *); 940 extern int cpp_write_pch_state (cpp_reader *, FILE *); 941 extern int cpp_valid_state (cpp_reader *, const char *, int); 942 extern void cpp_prepare_state (cpp_reader *, struct save_macro_data **); 943 extern int cpp_read_state (cpp_reader *, const char *, FILE *, 944 struct save_macro_data *); 945 946 #ifdef __cplusplus 947 } 948 #endif 949 950 #endif /* ! LIBCPP_CPPLIB_H */ 951