1 /* Part of CPP library. 2 Copyright (C) 1997-2015 Free Software Foundation, Inc. 3 4 This program is free software; you can redistribute it and/or modify it 5 under the terms of the GNU General Public License as published by the 6 Free Software Foundation; either version 3, or (at your option) any 7 later version. 8 9 This program is distributed in the hope that it will be useful, 10 but WITHOUT ANY WARRANTY; without even the implied warranty of 11 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 12 GNU General Public License for more details. 13 14 You should have received a copy of the GNU General Public License 15 along with this program; see the file COPYING3. If not see 16 <http://www.gnu.org/licenses/>. */ 17 18 /* This header defines all the internal data structures and functions 19 that need to be visible across files. It should not be used outside 20 cpplib. */ 21 22 #ifndef LIBCPP_INTERNAL_H 23 #define LIBCPP_INTERNAL_H 24 25 #include "symtab.h" 26 #include "cpp-id-data.h" 27 28 #if HAVE_ICONV 29 #include <iconv.h> 30 #else 31 #define HAVE_ICONV 0 32 typedef int iconv_t; /* dummy */ 33 #endif 34 35 #ifdef __cplusplus 36 extern "C" { 37 #endif 38 39 struct directive; /* Deliberately incomplete. */ 40 struct pending_option; 41 struct op; 42 struct _cpp_strbuf; 43 44 typedef bool (*convert_f) (iconv_t, const unsigned char *, size_t, 45 struct _cpp_strbuf *); 46 struct cset_converter 47 { 48 convert_f func; 49 iconv_t cd; 50 int width; 51 }; 52 53 #define BITS_PER_CPPCHAR_T (CHAR_BIT * sizeof (cppchar_t)) 54 55 /* Test if a sign is valid within a preprocessing number. */ 56 #define VALID_SIGN(c, prevc) \ 57 (((c) == '+' || (c) == '-') && \ 58 ((prevc) == 'e' || (prevc) == 'E' \ 59 || (((prevc) == 'p' || (prevc) == 'P') \ 60 && CPP_OPTION (pfile, extended_numbers)))) 61 62 #define DIGIT_SEP(c) ((c) == '\'' && CPP_OPTION (pfile, digit_separators)) 63 64 #define CPP_OPTION(PFILE, OPTION) ((PFILE)->opts.OPTION) 65 #define CPP_BUFFER(PFILE) ((PFILE)->buffer) 66 #define CPP_BUF_COLUMN(BUF, CUR) ((CUR) - (BUF)->line_base) 67 #define CPP_BUF_COL(BUF) CPP_BUF_COLUMN(BUF, (BUF)->cur) 68 69 #define CPP_INCREMENT_LINE(PFILE, COLS_HINT) do { \ 70 const struct line_maps *line_table = PFILE->line_table; \ 71 const struct line_map *map = \ 72 LINEMAPS_LAST_ORDINARY_MAP (line_table); \ 73 linenum_type line = SOURCE_LINE (map, line_table->highest_line); \ 74 linemap_line_start (PFILE->line_table, line + 1, COLS_HINT); \ 75 } while (0) 76 77 /* Maximum nesting of cpp_buffers. We use a static limit, partly for 78 efficiency, and partly to limit runaway recursion. */ 79 #define CPP_STACK_MAX 200 80 81 /* Host alignment handling. */ 82 struct dummy 83 { 84 char c; 85 union 86 { 87 double d; 88 int *p; 89 } u; 90 }; 91 92 #define DEFAULT_ALIGNMENT offsetof (struct dummy, u) 93 #define CPP_ALIGN2(size, align) (((size) + ((align) - 1)) & ~((align) - 1)) 94 #define CPP_ALIGN(size) CPP_ALIGN2 (size, DEFAULT_ALIGNMENT) 95 96 #define _cpp_mark_macro_used(NODE) do { \ 97 if ((NODE)->type == NT_MACRO && !((NODE)->flags & NODE_BUILTIN)) \ 98 (NODE)->value.macro->used = 1; } while (0) 99 100 /* A generic memory buffer, and operations on it. */ 101 typedef struct _cpp_buff _cpp_buff; 102 struct _cpp_buff 103 { 104 struct _cpp_buff *next; 105 unsigned char *base, *cur, *limit; 106 }; 107 108 extern _cpp_buff *_cpp_get_buff (cpp_reader *, size_t); 109 extern void _cpp_release_buff (cpp_reader *, _cpp_buff *); 110 extern void _cpp_extend_buff (cpp_reader *, _cpp_buff **, size_t); 111 extern _cpp_buff *_cpp_append_extend_buff (cpp_reader *, _cpp_buff *, size_t); 112 extern void _cpp_free_buff (_cpp_buff *); 113 extern unsigned char *_cpp_aligned_alloc (cpp_reader *, size_t); 114 extern unsigned char *_cpp_unaligned_alloc (cpp_reader *, size_t); 115 116 #define BUFF_ROOM(BUFF) (size_t) ((BUFF)->limit - (BUFF)->cur) 117 #define BUFF_FRONT(BUFF) ((BUFF)->cur) 118 #define BUFF_LIMIT(BUFF) ((BUFF)->limit) 119 120 /* #include types. */ 121 enum include_type {IT_INCLUDE, IT_INCLUDE_NEXT, IT_IMPORT, IT_CMDLINE, IT_DEFAULT}; 122 123 union utoken 124 { 125 const cpp_token *token; 126 const cpp_token **ptoken; 127 }; 128 129 /* A "run" of tokens; part of a chain of runs. */ 130 typedef struct tokenrun tokenrun; 131 struct tokenrun 132 { 133 tokenrun *next, *prev; 134 cpp_token *base, *limit; 135 }; 136 137 /* Accessor macros for struct cpp_context. */ 138 #define FIRST(c) ((c)->u.iso.first) 139 #define LAST(c) ((c)->u.iso.last) 140 #define CUR(c) ((c)->u.trad.cur) 141 #define RLIMIT(c) ((c)->u.trad.rlimit) 142 143 /* This describes some additional data that is added to the macro 144 token context of type cpp_context, when -ftrack-macro-expansion is 145 on. */ 146 typedef struct 147 { 148 /* The node of the macro we are referring to. */ 149 cpp_hashnode *macro_node; 150 /* This buffer contains an array of virtual locations. The virtual 151 location at index 0 is the virtual location of the token at index 152 0 in the current instance of cpp_context; similarly for all the 153 other virtual locations. */ 154 source_location *virt_locs; 155 /* This is a pointer to the current virtual location. This is used 156 to iterate over the virtual locations while we iterate over the 157 tokens they belong to. */ 158 source_location *cur_virt_loc; 159 } macro_context; 160 161 /* The kind of tokens carried by a cpp_context. */ 162 enum context_tokens_kind { 163 /* This is the value of cpp_context::tokens_kind if u.iso.first 164 contains an instance of cpp_token **. */ 165 TOKENS_KIND_INDIRECT, 166 /* This is the value of cpp_context::tokens_kind if u.iso.first 167 contains an instance of cpp_token *. */ 168 TOKENS_KIND_DIRECT, 169 /* This is the value of cpp_context::tokens_kind when the token 170 context contains tokens resulting from macro expansion. In that 171 case struct cpp_context::macro points to an instance of struct 172 macro_context. This is used only when the 173 -ftrack-macro-expansion flag is on. */ 174 TOKENS_KIND_EXTENDED 175 }; 176 177 typedef struct cpp_context cpp_context; 178 struct cpp_context 179 { 180 /* Doubly-linked list. */ 181 cpp_context *next, *prev; 182 183 union 184 { 185 /* For ISO macro expansion. Contexts other than the base context 186 are contiguous tokens. e.g. macro expansions, expanded 187 argument tokens. */ 188 struct 189 { 190 union utoken first; 191 union utoken last; 192 } iso; 193 194 /* For traditional macro expansion. */ 195 struct 196 { 197 const unsigned char *cur; 198 const unsigned char *rlimit; 199 } trad; 200 } u; 201 202 /* If non-NULL, a buffer used for storage related to this context. 203 When the context is popped, the buffer is released. */ 204 _cpp_buff *buff; 205 206 /* If tokens_kind is TOKEN_KIND_EXTENDED, then (as we thus are in a 207 macro context) this is a pointer to an instance of macro_context. 208 Otherwise if tokens_kind is *not* TOKEN_KIND_EXTENDED, then, if 209 we are in a macro context, this is a pointer to an instance of 210 cpp_hashnode, representing the name of the macro this context is 211 for. If we are not in a macro context, then this is just NULL. 212 Note that when tokens_kind is TOKEN_KIND_EXTENDED, the memory 213 used by the instance of macro_context pointed to by this member 214 is de-allocated upon de-allocation of the instance of struct 215 cpp_context. */ 216 union 217 { 218 macro_context *mc; 219 cpp_hashnode *macro; 220 } c; 221 222 /* This determines the type of tokens held by this context. */ 223 enum context_tokens_kind tokens_kind; 224 }; 225 226 struct lexer_state 227 { 228 /* Nonzero if first token on line is CPP_HASH. */ 229 unsigned char in_directive; 230 231 /* Nonzero if we are collecting macro arguments */ 232 unsigned char collecting_args; 233 234 /* Nonzero if in a directive that will handle padding tokens itself. 235 #include needs this to avoid problems with computed include and 236 spacing between tokens. */ 237 unsigned char directive_wants_padding; 238 239 /* True if we are skipping a failed conditional group. */ 240 unsigned char skipping; 241 242 /* Nonzero if in a directive that takes angle-bracketed headers. */ 243 unsigned char angled_headers; 244 245 /* Nonzero if in a #if or #elif directive. */ 246 unsigned char in_expression; 247 248 /* Nonzero to save comments. Turned off if discard_comments, and in 249 all directives apart from #define. */ 250 unsigned char save_comments; 251 252 /* Nonzero if lexing __VA_ARGS__ is valid. */ 253 unsigned char va_args_ok; 254 255 /* Nonzero if lexing poisoned identifiers is valid. */ 256 unsigned char poisoned_ok; 257 258 /* Nonzero to prevent macro expansion. */ 259 unsigned char prevent_expansion; 260 261 /* Nonzero when parsing arguments to a function-like macro. */ 262 unsigned char parsing_args; 263 264 /* Nonzero if in a __has_include__ or __has_include_next__ statement. */ 265 unsigned char in__has_include__; 266 267 /* Nonzero if prevent_expansion is true only because output is 268 being discarded. */ 269 unsigned char discarding_output; 270 271 /* Nonzero to skip evaluating part of an expression. */ 272 unsigned int skip_eval; 273 274 /* Nonzero when handling a deferred pragma. */ 275 unsigned char in_deferred_pragma; 276 277 /* Nonzero if the deferred pragma being handled allows macro expansion. */ 278 unsigned char pragma_allow_expansion; 279 }; 280 281 /* Special nodes - identifiers with predefined significance. */ 282 struct spec_nodes 283 { 284 cpp_hashnode *n_defined; /* defined operator */ 285 cpp_hashnode *n_true; /* C++ keyword true */ 286 cpp_hashnode *n_false; /* C++ keyword false */ 287 cpp_hashnode *n__VA_ARGS__; /* C99 vararg macros */ 288 cpp_hashnode *n__has_include__; /* __has_include__ operator */ 289 cpp_hashnode *n__has_include_next__; /* __has_include_next__ operator */ 290 }; 291 292 typedef struct _cpp_line_note _cpp_line_note; 293 struct _cpp_line_note 294 { 295 /* Location in the clean line the note refers to. */ 296 const unsigned char *pos; 297 298 /* Type of note. The 9 'from' trigraph characters represent those 299 trigraphs, '\\' an escaped newline, ' ' an escaped newline with 300 intervening space, 0 represents a note that has already been handled, 301 and anything else is invalid. */ 302 unsigned int type; 303 }; 304 305 /* Represents the contents of a file cpplib has read in. */ 306 struct cpp_buffer 307 { 308 const unsigned char *cur; /* Current location. */ 309 const unsigned char *line_base; /* Start of current physical line. */ 310 const unsigned char *next_line; /* Start of to-be-cleaned logical line. */ 311 312 const unsigned char *buf; /* Entire character buffer. */ 313 const unsigned char *rlimit; /* Writable byte at end of file. */ 314 const unsigned char *to_free; /* Pointer that should be freed when 315 popping the buffer. */ 316 317 _cpp_line_note *notes; /* Array of notes. */ 318 unsigned int cur_note; /* Next note to process. */ 319 unsigned int notes_used; /* Number of notes. */ 320 unsigned int notes_cap; /* Size of allocated array. */ 321 322 struct cpp_buffer *prev; 323 324 /* Pointer into the file table; non-NULL if this is a file buffer. 325 Used for include_next and to record control macros. */ 326 struct _cpp_file *file; 327 328 /* Saved value of __TIMESTAMP__ macro - date and time of last modification 329 of the assotiated file. */ 330 const unsigned char *timestamp; 331 332 /* Value of if_stack at start of this file. 333 Used to prohibit unmatched #endif (etc) in an include file. */ 334 struct if_stack *if_stack; 335 336 /* True if we need to get the next clean line. */ 337 bool need_line; 338 339 /* True if we have already warned about C++ comments in this file. 340 The warning happens only for C89 extended mode with -pedantic on, 341 or for -Wtraditional, and only once per file (otherwise it would 342 be far too noisy). */ 343 unsigned int warned_cplusplus_comments : 1; 344 345 /* True if we don't process trigraphs and escaped newlines. True 346 for preprocessed input, command line directives, and _Pragma 347 buffers. */ 348 unsigned int from_stage3 : 1; 349 350 /* At EOF, a buffer is automatically popped. If RETURN_AT_EOF is 351 true, a CPP_EOF token is then returned. Otherwise, the next 352 token from the enclosing buffer is returned. */ 353 unsigned int return_at_eof : 1; 354 355 /* One for a system header, two for a C system header file that therefore 356 needs to be extern "C" protected in C++, and zero otherwise. */ 357 unsigned char sysp; 358 359 /* The directory of the this buffer's file. Its NAME member is not 360 allocated, so we don't need to worry about freeing it. */ 361 struct cpp_dir dir; 362 363 /* Descriptor for converting from the input character set to the 364 source character set. */ 365 struct cset_converter input_cset_desc; 366 }; 367 368 /* The list of saved macros by push_macro pragma. */ 369 struct def_pragma_macro { 370 /* Chain element to previous saved macro. */ 371 struct def_pragma_macro *next; 372 /* Name of the macro. */ 373 char *name; 374 /* The stored macro content. */ 375 unsigned char *definition; 376 377 /* Definition line number. */ 378 source_location line; 379 /* If macro defined in system header. */ 380 unsigned int syshdr : 1; 381 /* Nonzero if it has been expanded or had its existence tested. */ 382 unsigned int used : 1; 383 384 /* Mark if we save an undefined macro. */ 385 unsigned int is_undef : 1; 386 }; 387 388 /* A cpp_reader encapsulates the "state" of a pre-processor run. 389 Applying cpp_get_token repeatedly yields a stream of pre-processor 390 tokens. Usually, there is only one cpp_reader object active. */ 391 struct cpp_reader 392 { 393 /* Top of buffer stack. */ 394 cpp_buffer *buffer; 395 396 /* Overlaid buffer (can be different after processing #include). */ 397 cpp_buffer *overlaid_buffer; 398 399 /* Lexer state. */ 400 struct lexer_state state; 401 402 /* Source line tracking. */ 403 struct line_maps *line_table; 404 405 /* The line of the '#' of the current directive. */ 406 source_location directive_line; 407 408 /* Memory buffers. */ 409 _cpp_buff *a_buff; /* Aligned permanent storage. */ 410 _cpp_buff *u_buff; /* Unaligned permanent storage. */ 411 _cpp_buff *free_buffs; /* Free buffer chain. */ 412 413 /* Context stack. */ 414 struct cpp_context base_context; 415 struct cpp_context *context; 416 417 /* If in_directive, the directive if known. */ 418 const struct directive *directive; 419 420 /* Token generated while handling a directive, if any. */ 421 cpp_token directive_result; 422 423 /* When expanding a macro at top-level, this is the location of the 424 macro invocation. */ 425 source_location invocation_location; 426 427 /* This is the node representing the macro being expanded at 428 top-level. The value of this data member is valid iff 429 in_macro_expansion_p() returns TRUE. */ 430 cpp_hashnode *top_most_macro_node; 431 432 /* Nonzero if we are about to expand a macro. Note that if we are 433 really expanding a macro, the function macro_of_context returns 434 the macro being expanded and this flag is set to false. Client 435 code should use the function in_macro_expansion_p to know if we 436 are either about to expand a macro, or are actually expanding 437 one. */ 438 bool about_to_expand_macro_p; 439 440 /* Search paths for include files. */ 441 struct cpp_dir *quote_include; /* "" */ 442 struct cpp_dir *bracket_include; /* <> */ 443 struct cpp_dir no_search_path; /* No path. */ 444 445 /* Chain of all hashed _cpp_file instances. */ 446 struct _cpp_file *all_files; 447 448 struct _cpp_file *main_file; 449 450 /* File and directory hash table. */ 451 struct htab *file_hash; 452 struct htab *dir_hash; 453 struct file_hash_entry_pool *file_hash_entries; 454 455 /* Negative path lookup hash table. */ 456 struct htab *nonexistent_file_hash; 457 struct obstack nonexistent_file_ob; 458 459 /* Nonzero means don't look for #include "foo" the source-file 460 directory. */ 461 bool quote_ignores_source_dir; 462 463 /* Nonzero if any file has contained #pragma once or #import has 464 been used. */ 465 bool seen_once_only; 466 467 /* Multiple include optimization. */ 468 const cpp_hashnode *mi_cmacro; 469 const cpp_hashnode *mi_ind_cmacro; 470 bool mi_valid; 471 472 /* Lexing. */ 473 cpp_token *cur_token; 474 tokenrun base_run, *cur_run; 475 unsigned int lookaheads; 476 477 /* Nonzero prevents the lexer from re-using the token runs. */ 478 unsigned int keep_tokens; 479 480 /* Buffer to hold macro definition string. */ 481 unsigned char *macro_buffer; 482 unsigned int macro_buffer_len; 483 484 /* Descriptor for converting from the source character set to the 485 execution character set. */ 486 struct cset_converter narrow_cset_desc; 487 488 /* Descriptor for converting from the source character set to the 489 UTF-8 execution character set. */ 490 struct cset_converter utf8_cset_desc; 491 492 /* Descriptor for converting from the source character set to the 493 UTF-16 execution character set. */ 494 struct cset_converter char16_cset_desc; 495 496 /* Descriptor for converting from the source character set to the 497 UTF-32 execution character set. */ 498 struct cset_converter char32_cset_desc; 499 500 /* Descriptor for converting from the source character set to the 501 wide execution character set. */ 502 struct cset_converter wide_cset_desc; 503 504 /* Date and time text. Calculated together if either is requested. */ 505 const unsigned char *date; 506 const unsigned char *time; 507 508 /* EOF token, and a token forcing paste avoidance. */ 509 cpp_token avoid_paste; 510 cpp_token eof; 511 512 /* Opaque handle to the dependencies of mkdeps.c. */ 513 struct deps *deps; 514 515 /* Obstack holding all macro hash nodes. This never shrinks. 516 See identifiers.c */ 517 struct obstack hash_ob; 518 519 /* Obstack holding buffer and conditional structures. This is a 520 real stack. See directives.c. */ 521 struct obstack buffer_ob; 522 523 /* Pragma table - dynamic, because a library user can add to the 524 list of recognized pragmas. */ 525 struct pragma_entry *pragmas; 526 527 /* Call backs to cpplib client. */ 528 struct cpp_callbacks cb; 529 530 /* Identifier hash table. */ 531 struct ht *hash_table; 532 533 /* Expression parser stack. */ 534 struct op *op_stack, *op_limit; 535 536 /* User visible options. */ 537 struct cpp_options opts; 538 539 /* Special nodes - identifiers with predefined significance to the 540 preprocessor. */ 541 struct spec_nodes spec_nodes; 542 543 /* Whether cpplib owns the hashtable. */ 544 bool our_hashtable; 545 546 /* Traditional preprocessing output buffer (a logical line). */ 547 struct 548 { 549 unsigned char *base; 550 unsigned char *limit; 551 unsigned char *cur; 552 source_location first_line; 553 } out; 554 555 /* Used for buffer overlays by traditional.c. */ 556 const unsigned char *saved_cur, *saved_rlimit, *saved_line_base; 557 558 /* A saved list of the defined macros, for dependency checking 559 of precompiled headers. */ 560 struct cpp_savedstate *savedstate; 561 562 /* Next value of __COUNTER__ macro. */ 563 unsigned int counter; 564 565 /* Table of comments, when state.save_comments is true. */ 566 cpp_comment_table comments; 567 568 /* List of saved macros by push_macro. */ 569 struct def_pragma_macro *pushed_macros; 570 571 /* If non-null, the lexer will use this location for the next token 572 instead of getting a location from the linemap. */ 573 source_location *forced_token_location_p; 574 }; 575 576 /* Character classes. Based on the more primitive macros in safe-ctype.h. 577 If the definition of `numchar' looks odd to you, please look up the 578 definition of a pp-number in the C standard [section 6.4.8 of C99]. 579 580 In the unlikely event that characters other than \r and \n enter 581 the set is_vspace, the macro handle_newline() in lex.c must be 582 updated. */ 583 #define _dollar_ok(x) ((x) == '$' && CPP_OPTION (pfile, dollars_in_ident)) 584 585 #define is_idchar(x) (ISIDNUM(x) || _dollar_ok(x)) 586 #define is_numchar(x) ISIDNUM(x) 587 #define is_idstart(x) (ISIDST(x) || _dollar_ok(x)) 588 #define is_numstart(x) ISDIGIT(x) 589 #define is_hspace(x) ISBLANK(x) 590 #define is_vspace(x) IS_VSPACE(x) 591 #define is_nvspace(x) IS_NVSPACE(x) 592 #define is_space(x) IS_SPACE_OR_NUL(x) 593 594 /* This table is constant if it can be initialized at compile time, 595 which is the case if cpp was compiled with GCC >=2.7, or another 596 compiler that supports C99. */ 597 #if HAVE_DESIGNATED_INITIALIZERS 598 extern const unsigned char _cpp_trigraph_map[UCHAR_MAX + 1]; 599 #else 600 extern unsigned char _cpp_trigraph_map[UCHAR_MAX + 1]; 601 #endif 602 603 /* Macros. */ 604 605 static inline int cpp_in_system_header (cpp_reader *); 606 static inline int 607 cpp_in_system_header (cpp_reader *pfile) 608 { 609 return pfile->buffer ? pfile->buffer->sysp : 0; 610 } 611 #define CPP_PEDANTIC(PF) CPP_OPTION (PF, cpp_pedantic) 612 #define CPP_WTRADITIONAL(PF) CPP_OPTION (PF, cpp_warn_traditional) 613 614 static inline int cpp_in_primary_file (cpp_reader *); 615 static inline int 616 cpp_in_primary_file (cpp_reader *pfile) 617 { 618 return pfile->line_table->depth == 1; 619 } 620 621 /* In macro.c */ 622 extern void _cpp_free_definition (cpp_hashnode *); 623 extern bool _cpp_create_definition (cpp_reader *, cpp_hashnode *); 624 extern void _cpp_pop_context (cpp_reader *); 625 extern void _cpp_push_text_context (cpp_reader *, cpp_hashnode *, 626 const unsigned char *, size_t); 627 extern bool _cpp_save_parameter (cpp_reader *, cpp_macro *, cpp_hashnode *, 628 cpp_hashnode *); 629 extern bool _cpp_arguments_ok (cpp_reader *, cpp_macro *, const cpp_hashnode *, 630 unsigned int); 631 extern const unsigned char *_cpp_builtin_macro_text (cpp_reader *, 632 cpp_hashnode *); 633 extern int _cpp_warn_if_unused_macro (cpp_reader *, cpp_hashnode *, void *); 634 extern void _cpp_push_token_context (cpp_reader *, cpp_hashnode *, 635 const cpp_token *, unsigned int); 636 extern void _cpp_backup_tokens_direct (cpp_reader *, unsigned int); 637 638 /* In identifiers.c */ 639 extern void _cpp_init_hashtable (cpp_reader *, cpp_hash_table *); 640 extern void _cpp_destroy_hashtable (cpp_reader *); 641 642 /* In files.c */ 643 typedef struct _cpp_file _cpp_file; 644 extern _cpp_file *_cpp_find_file (cpp_reader *, const char *, cpp_dir *, 645 bool, int, bool); 646 extern bool _cpp_find_failed (_cpp_file *); 647 extern void _cpp_mark_file_once_only (cpp_reader *, struct _cpp_file *); 648 extern void _cpp_fake_include (cpp_reader *, const char *); 649 extern bool _cpp_stack_file (cpp_reader *, _cpp_file*, bool); 650 extern bool _cpp_stack_include (cpp_reader *, const char *, int, 651 enum include_type); 652 extern int _cpp_compare_file_date (cpp_reader *, const char *, int); 653 extern void _cpp_report_missing_guards (cpp_reader *); 654 extern void _cpp_init_files (cpp_reader *); 655 extern void _cpp_cleanup_files (cpp_reader *); 656 extern void _cpp_pop_file_buffer (cpp_reader *, struct _cpp_file *, 657 const unsigned char *); 658 extern bool _cpp_save_file_entries (cpp_reader *pfile, FILE *f); 659 extern bool _cpp_read_file_entries (cpp_reader *, FILE *); 660 extern const char *_cpp_get_file_name (_cpp_file *); 661 extern struct stat *_cpp_get_file_stat (_cpp_file *); 662 extern bool _cpp_has_header (cpp_reader *, const char *, int, 663 enum include_type); 664 665 /* In expr.c */ 666 extern bool _cpp_parse_expr (cpp_reader *, bool); 667 extern struct op *_cpp_expand_op_stack (cpp_reader *); 668 669 /* In lex.c */ 670 extern void _cpp_process_line_notes (cpp_reader *, int); 671 extern void _cpp_clean_line (cpp_reader *); 672 extern bool _cpp_get_fresh_line (cpp_reader *); 673 extern bool _cpp_skip_block_comment (cpp_reader *); 674 extern cpp_token *_cpp_temp_token (cpp_reader *); 675 extern const cpp_token *_cpp_lex_token (cpp_reader *); 676 extern cpp_token *_cpp_lex_direct (cpp_reader *); 677 extern unsigned char *_cpp_spell_ident_ucns (unsigned char *, cpp_hashnode *); 678 extern int _cpp_equiv_tokens (const cpp_token *, const cpp_token *); 679 extern void _cpp_init_tokenrun (tokenrun *, unsigned int); 680 extern cpp_hashnode *_cpp_lex_identifier (cpp_reader *, const char *); 681 extern int _cpp_remaining_tokens_num_in_context (cpp_context *); 682 extern void _cpp_init_lexer (void); 683 684 /* In init.c. */ 685 extern void _cpp_maybe_push_include_file (cpp_reader *); 686 extern const char *cpp_named_operator2name (enum cpp_ttype type); 687 688 /* In directives.c */ 689 extern int _cpp_test_assertion (cpp_reader *, unsigned int *); 690 extern int _cpp_handle_directive (cpp_reader *, int); 691 extern void _cpp_define_builtin (cpp_reader *, const char *); 692 extern char ** _cpp_save_pragma_names (cpp_reader *); 693 extern void _cpp_restore_pragma_names (cpp_reader *, char **); 694 extern int _cpp_do__Pragma (cpp_reader *); 695 extern void _cpp_init_directives (cpp_reader *); 696 extern void _cpp_init_internal_pragmas (cpp_reader *); 697 extern void _cpp_do_file_change (cpp_reader *, enum lc_reason, const char *, 698 linenum_type, unsigned int); 699 extern void _cpp_pop_buffer (cpp_reader *); 700 extern char *_cpp_bracket_include (cpp_reader *); 701 702 /* In directives.c */ 703 struct _cpp_dir_only_callbacks 704 { 705 /* Called to print a block of lines. */ 706 void (*print_lines) (int, const void *, size_t); 707 void (*maybe_print_line) (source_location); 708 }; 709 710 extern void _cpp_preprocess_dir_only (cpp_reader *, 711 const struct _cpp_dir_only_callbacks *); 712 713 /* In traditional.c. */ 714 extern bool _cpp_scan_out_logical_line (cpp_reader *, cpp_macro *, bool); 715 extern bool _cpp_read_logical_line_trad (cpp_reader *); 716 extern void _cpp_overlay_buffer (cpp_reader *pfile, const unsigned char *, 717 size_t); 718 extern void _cpp_remove_overlay (cpp_reader *); 719 extern bool _cpp_create_trad_definition (cpp_reader *, cpp_macro *); 720 extern bool _cpp_expansions_different_trad (const cpp_macro *, 721 const cpp_macro *); 722 extern unsigned char *_cpp_copy_replacement_text (const cpp_macro *, 723 unsigned char *); 724 extern size_t _cpp_replacement_text_len (const cpp_macro *); 725 726 /* In charset.c. */ 727 728 /* The normalization state at this point in the sequence. 729 It starts initialized to all zeros, and at the end 730 'level' is the normalization level of the sequence. */ 731 732 struct normalize_state 733 { 734 /* The previous starter character. */ 735 cppchar_t previous; 736 /* The combining class of the previous character (whether or not a 737 starter). */ 738 unsigned char prev_class; 739 /* The lowest normalization level so far. */ 740 enum cpp_normalize_level level; 741 }; 742 #define INITIAL_NORMALIZE_STATE { 0, 0, normalized_KC } 743 #define NORMALIZE_STATE_RESULT(st) ((st)->level) 744 745 /* We saw a character C that matches ISIDNUM(), update a 746 normalize_state appropriately. */ 747 #define NORMALIZE_STATE_UPDATE_IDNUM(st, c) \ 748 ((st)->previous = (c), (st)->prev_class = 0) 749 750 extern cppchar_t _cpp_valid_ucn (cpp_reader *, const unsigned char **, 751 const unsigned char *, int, 752 struct normalize_state *state); 753 extern void _cpp_destroy_iconv (cpp_reader *); 754 extern unsigned char *_cpp_convert_input (cpp_reader *, const char *, 755 unsigned char *, size_t, size_t, 756 const unsigned char **, off_t *); 757 extern const char *_cpp_default_encoding (void); 758 extern cpp_hashnode * _cpp_interpret_identifier (cpp_reader *pfile, 759 const unsigned char *id, 760 size_t len); 761 762 /* Utility routines and macros. */ 763 #define DSC(str) (const unsigned char *)str, sizeof str - 1 764 765 /* These are inline functions instead of macros so we can get type 766 checking. */ 767 static inline int ustrcmp (const unsigned char *, const unsigned char *); 768 static inline int ustrncmp (const unsigned char *, const unsigned char *, 769 size_t); 770 static inline size_t ustrlen (const unsigned char *); 771 static inline const unsigned char *uxstrdup (const unsigned char *); 772 static inline const unsigned char *ustrchr (const unsigned char *, int); 773 static inline int ufputs (const unsigned char *, FILE *); 774 775 /* Use a const char for the second parameter since it is usually a literal. */ 776 static inline int ustrcspn (const unsigned char *, const char *); 777 778 static inline int 779 ustrcmp (const unsigned char *s1, const unsigned char *s2) 780 { 781 return strcmp ((const char *)s1, (const char *)s2); 782 } 783 784 static inline int 785 ustrncmp (const unsigned char *s1, const unsigned char *s2, size_t n) 786 { 787 return strncmp ((const char *)s1, (const char *)s2, n); 788 } 789 790 static inline int 791 ustrcspn (const unsigned char *s1, const char *s2) 792 { 793 return strcspn ((const char *)s1, s2); 794 } 795 796 static inline size_t 797 ustrlen (const unsigned char *s1) 798 { 799 return strlen ((const char *)s1); 800 } 801 802 static inline const unsigned char * 803 uxstrdup (const unsigned char *s1) 804 { 805 return (const unsigned char *) xstrdup ((const char *)s1); 806 } 807 808 static inline const unsigned char * 809 ustrchr (const unsigned char *s1, int c) 810 { 811 return (const unsigned char *) strchr ((const char *)s1, c); 812 } 813 814 static inline int 815 ufputs (const unsigned char *s, FILE *f) 816 { 817 return fputs ((const char *)s, f); 818 } 819 820 /* In line-map.c. */ 821 822 /* Create a macro map. A macro map encodes source locations of tokens 823 that are part of a macro replacement-list, at a macro expansion 824 point. See the extensive comments of struct line_map and struct 825 line_map_macro, in line-map.h. 826 827 This map shall be created when the macro is expanded. The map 828 encodes the source location of the expansion point of the macro as 829 well as the "original" source location of each token that is part 830 of the macro replacement-list. If a macro is defined but never 831 expanded, it has no macro map. SET is the set of maps the macro 832 map should be part of. MACRO_NODE is the macro which the new macro 833 map should encode source locations for. EXPANSION is the location 834 of the expansion point of MACRO. For function-like macros 835 invocations, it's best to make it point to the closing parenthesis 836 of the macro, rather than the the location of the first character 837 of the macro. NUM_TOKENS is the number of tokens that are part of 838 the replacement-list of MACRO. */ 839 const struct line_map *linemap_enter_macro (struct line_maps *, 840 struct cpp_hashnode*, 841 source_location, 842 unsigned int); 843 844 /* Create and return a virtual location for a token that is part of a 845 macro expansion-list at a macro expansion point. See the comment 846 inside struct line_map_macro to see what an expansion-list exactly 847 is. 848 849 A call to this function must come after a call to 850 linemap_enter_macro. 851 852 MAP is the map into which the source location is created. TOKEN_NO 853 is the index of the token in the macro replacement-list, starting 854 at number 0. 855 856 ORIG_LOC is the location of the token outside of this macro 857 expansion. If the token comes originally from the macro 858 definition, it is the locus in the macro definition; otherwise it 859 is a location in the context of the caller of this macro expansion 860 (which is a virtual location or a source location if the caller is 861 itself a macro expansion or not). 862 863 MACRO_DEFINITION_LOC is the location in the macro definition, 864 either of the token itself or of a macro parameter that it 865 replaces. */ 866 source_location linemap_add_macro_token (const struct line_map *, 867 unsigned int, 868 source_location, 869 source_location); 870 871 /* Return the source line number corresponding to source location 872 LOCATION. SET is the line map set LOCATION comes from. If 873 LOCATION is the location of token that is part of the 874 expansion-list of a macro expansion return the line number of the 875 macro expansion point. */ 876 int linemap_get_expansion_line (struct line_maps *, 877 source_location); 878 879 /* Return the path of the file corresponding to source code location 880 LOCATION. 881 882 If LOCATION is the location of a token that is part of the 883 replacement-list of a macro expansion return the file path of the 884 macro expansion point. 885 886 SET is the line map set LOCATION comes from. */ 887 const char* linemap_get_expansion_filename (struct line_maps *, 888 source_location); 889 890 #ifdef __cplusplus 891 } 892 #endif 893 894 #endif /* ! LIBCPP_INTERNAL_H */ 895