* cpplib.c: Include symcat.h. Add 'origin' field to struct directive. Add origin values to DIRECTIVE_TABLE. Generate the strings and function names on the fly. Take the #sccs entry out of the table if SCCS_DIRECTIVE is not defined. (_cpp_handle_directive): Decide if the # was at the beginning of the line here. Issue -pedantic warnings for extended directives here. Warn about K+R directives with the # indented, and C89/extended directives with the # not indented, here. (do_import, do_include_next, do_warning, do_ident, do_sccs, do_assert, do_unassert): Don't issue pedantic warning here. * cpphash.h: Add CPP_WTRADITIONAL macro. * cpplib.h (struct cpp_options): Rename warn_stringify to warn_traditional; update comments. * cppinit.c (handle_option): Set warn_traditional not warn_stringify. * cpphash.c: Replace CPP_OPTION (pfile, warn_stringify) with CPP_WTRADITIONAL (pfile). * cpplex.c (_cpp_lex_token): Don't decide if directives should be ignored in -traditional mode here. * cpplex.c: Copy ISTABLE macros from cppinit.c, and adapt them to initialize speccase[] and trigraph_map[]. Delete all references to pfile->input_speccase. Always treat '?' as a special character. Remove table-initialization code from _cpp_init_input_buffer. * cpplib.h (struct cpp_reader): Remove input_speccase field. * cppinit.c (cpp_cleanup): Don't free input_speccase. From-SVN: r32860
483 lines
17 KiB
C
483 lines
17 KiB
C
/* Definitions for CPP library.
   Copyright (C) 1995, 96-99, 2000 Free Software Foundation, Inc.
   Written by Per Bothner, 1994-95.

This program is free software; you can redistribute it and/or modify it
under the terms of the GNU General Public License as published by the
Free Software Foundation; either version 2, or (at your option) any
later version.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.

 In other words, you are welcome to use, share and improve this program.
 You are forbidden to forbid anyone else to use, share and improve
 what you give them.   Help stamp out software-hoarding!  */
|
|
/* Include guard; the matching #endif is the last line of this header.  */
#ifndef __GCC_CPPLIB__
#define __GCC_CPPLIB__

#include <sys/types.h>

/* Give everything declared below C linkage when this header is
   included from C++.  The brace is closed near the end of the file.  */
#ifdef __cplusplus
extern "C" {
#endif
|
|
|
|
/* Short names for the three central structures of the library.  The
   structures themselves are defined further down in this header.  */
typedef struct cpp_reader cpp_reader;
typedef struct cpp_buffer cpp_buffer;
typedef struct cpp_options cpp_options;
|
|
|
|
/* Kinds of token.  This is the return type of cpp_get_token and
   cpp_get_non_space_token.  CPP_EOF, CPP_OTHER and CPP_COMMENT have
   explicit values (-1, 0, 1); every later enumerator is one more than
   its predecessor, so the order of this list is significant.  */
enum cpp_token
{
  CPP_EOF = -1,
  CPP_OTHER = 0,
  CPP_COMMENT = 1,
  CPP_HSPACE,
  CPP_VSPACE,		/* newlines and #line directives */
  CPP_NAME,
  CPP_MACRO,
  CPP_NUMBER,
  CPP_CHAR,
  CPP_WCHAR,
  CPP_STRING,
  CPP_WSTRING,
  CPP_DIRECTIVE,
  CPP_ASSERTION,	/* #machine(a29k) */
  CPP_STRINGIZE,	/* stringize macro argument */
  CPP_TOKPASTE,		/* paste macro arg with next/prev token */
  CPP_LPAREN,		/* "(" */
  CPP_RPAREN,		/* ")" */
  CPP_LBRACE,		/* "{" */
  CPP_RBRACE,		/* "}" */
  CPP_COMMA,		/* "," */
  CPP_SEMICOLON,	/* ";" */
  CPP_3DOTS,		/* "..." */
  CPP_POP		/* We're about to pop the buffer stack.  */
};
|
|
|
|
/* Type of the hook stored in the `cleanup' field of struct cpp_buffer:
   a function taking the buffer and the reader and returning int.
   NOTE(review): when the hook is invoked and what its return value
   means are not visible in this header -- confirm against the callers.  */
typedef int (*parse_cleanup_t) PARAMS((cpp_buffer *, cpp_reader *));
|
|
|
|
struct cpp_buffer
|
|
{
|
|
const unsigned char *cur; /* current position */
|
|
const unsigned char *rlimit; /* end of valid data */
|
|
const unsigned char *buf; /* entire buffer */
|
|
const unsigned char *alimit; /* end of allocated buffer */
|
|
const unsigned char *line_base; /* start of current line */
|
|
|
|
struct cpp_buffer *prev;
|
|
|
|
/* Filename specified with #line command. */
|
|
const char *nominal_fname;
|
|
/* Last filename specified with #line command. */
|
|
const char *last_nominal_fname;
|
|
/* Actual directory of this file, used only for "" includes */
|
|
struct file_name_list *actual_dir;
|
|
|
|
/* Pointer into the include hash table. Used for include_next and
|
|
to record control macros. */
|
|
struct ihash *ihash;
|
|
|
|
long lineno; /* Line number at CPP_LINE_BASE. */
|
|
long colno; /* Column number at CPP_LINE_BASE. */
|
|
long mark; /* Saved position for lengthy backtrack. */
|
|
parse_cleanup_t cleanup;
|
|
void *data;
|
|
|
|
/* Value of if_stack at start of this file.
|
|
Used to prohibit unmatched #endif (etc) in an include file. */
|
|
struct if_stack *if_stack;
|
|
|
|
/* True if this is a header file included using <FILENAME>. */
|
|
char system_header_p;
|
|
char seen_eof;
|
|
|
|
/* True if buffer contains escape sequences.
|
|
Currently there are two kinds:
|
|
"\r-" means following identifier should not be macro-expanded.
|
|
"\r " means a token-separator. This turns into " " in final output
|
|
if not stringizing and needed to separate tokens; otherwise nothing.
|
|
Any other two-character sequence beginning with \r is an error.
|
|
|
|
If this is NOT set, then \r is a one-character escape meaning backslash
|
|
newline. This is guaranteed not to occur in the middle of a token.
|
|
The two interpretations of \r do not conflict, because the two-character
|
|
escapes are used only in macro buffers, and backslash-newline is removed
|
|
from macro expansion text in collect_expansion and/or macarg. */
|
|
char has_escapes;
|
|
|
|
/* Used by the C++ frontend to implement redirected input (such as for
|
|
default argument and/or template parsing). */
|
|
char manual_pop;
|
|
|
|
/* True if we have already warned about C++ comments in this file.
|
|
The warning happens only for C89 extended mode with -pedantic on,
|
|
and only once per file (otherwise it would be far too noisy). */
|
|
char warned_cplusplus_comments;
|
|
};
|
|
|
|
/* Incomplete types: this header only ever uses pointers to them.  */
struct file_name_map_list;
struct htab;
|
|
|
|
/* Maximum nesting of cpp_buffers.  We use a static limit, partly for
   efficiency, and partly to limit runaway recursion.  */
#define CPP_STACK_MAX 200
|
|
|
|
/* Values for opts.dump_macros.
   dump_none (zero) means no macro dumping was requested.
   dump_only means inhibit output of the preprocessed text
             and instead output the definitions of all user-defined
             macros in a form suitable for use as input to cccp.
   dump_names means pass #define and the macro name through to output.
   dump_definitions means pass the whole definition (plus #define)
             through.  */
enum { dump_none = 0, dump_only, dump_names, dump_definitions };
|
|
|
|
/* This structure is nested inside struct cpp_reader (as its `opts'
   member; use CPP_OPTION to read a field), and carries all the
   options visible to the command line.  */
struct cpp_options
{
  /* Name of input and output files.  */
  const char *in_fname;
  const char *out_fname;

  /* Pending options - -D, -U, -A, -I, -ixxx.  */
  struct cpp_pending *pending;

  /* File name which deps are being written to.  This is 0 if deps are
     being written to stdout.  */
  const char *deps_file;

  /* Target-name to write with the dependency information.  */
  char *deps_target;

  /* Search paths for include files.  */
  struct file_name_list *quote_include;	  /* First dir to search for "file" */
  struct file_name_list *bracket_include; /* First dir to search for <file> */

  /* Map between header names and file names, used only on DOS where
     file names are limited in length.  */
  struct file_name_map_list *map_list;

  /* Directory prefix that should replace `/usr/lib/gcc-lib/TARGET/VERSION'
     in the standard include file directories.  */
  const char *include_prefix;
  unsigned int include_prefix_len;

  /* Non-0 means -v, so print the full set of include dirs.  */
  unsigned char verbose;

  /* Nonzero means use extra default include directories for C++.  */
  unsigned char cplusplus;

  /* Nonzero means handle cplusplus style comments */
  unsigned char cplusplus_comments;

  /* Nonzero means handle #import, for objective C.  */
  unsigned char objc;

  /* Nonzero means this is an assembly file, so ignore unrecognized
     directives and the "# 33" form of #line, both of which are
     probably comments.  Also, permit unbalanced ' strings (again,
     likely to be in comments).  */
  unsigned char lang_asm;

  /* Nonzero means this is Fortran, and we don't know where the
     comments are, so permit unbalanced ' strings.  Unlike lang_asm,
     this does not ignore unrecognized directives.  */
  unsigned char lang_fortran;

  /* Nonzero means handle CHILL comment syntax and output CHILL string
     delimiters for __DATE__ etc.  */
  unsigned char chill;

  /* Nonzero means don't copy comments into the output file.  */
  unsigned char discard_comments;

  /* Nonzero means process the ANSI trigraph sequences.  */
  unsigned char trigraphs;

  /* Nonzero means print the names of included files rather than the
     preprocessed output.  1 means just the #include "...", 2 means
     #include <...> as well.  */
  unsigned char print_deps;

  /* Nonzero if missing .h files in -M output are assumed to be
     generated files and not errors.  */
  unsigned char print_deps_missing_files;

  /* If true, fopen (deps_file, "a") else fopen (deps_file, "w").  */
  unsigned char print_deps_append;

  /* Nonzero means print names of header files (-H).  */
  unsigned char print_include_names;

  /* Nonzero means cpp_pedwarn causes a hard error.  */
  unsigned char pedantic_errors;

  /* Nonzero means don't print warning messages.  */
  unsigned char inhibit_warnings;

  /* Nonzero means don't print error messages.  Has no option to
     select it, but can be set by a user of cpplib (e.g. fix-header).  */
  unsigned char inhibit_errors;

  /* Nonzero means warn if slash-star appears in a comment.  */
  unsigned char warn_comments;

  /* Nonzero means warn if there are any trigraphs.  */
  unsigned char warn_trigraphs;

  /* Nonzero means warn if #import is used.  */
  unsigned char warn_import;

  /* Nonzero means warn if a macro argument is (or would be)
     stringified with -traditional, and warn about directives
     with the # indented from the beginning of the line.  */
  unsigned char warn_traditional;

  /* Nonzero means turn warnings into errors.  */
  unsigned char warnings_are_errors;

  /* Nonzero causes output not to be done, but directives such as
     #define that have side effects are still obeyed.  */
  unsigned char no_output;

  /* Nonzero means we should look for header.gcc files that remap file
     names.  */
  unsigned char remap;

  /* Nonzero means don't output line number information.  */
  unsigned char no_line_commands;

  /* Nonzero means -I- has been seen, so don't look for #include "foo"
     in the source-file directory.  */
  unsigned char ignore_srcdir;

  /* Zero means dollar signs are punctuation.  */
  unsigned char dollars_in_ident;

  /* Nonzero means try to imitate old fashioned non-ANSI preprocessor.  */
  unsigned char traditional;

  /* Nonzero means warn if undefined identifiers are evaluated in an #if.  */
  unsigned char warn_undef;

  /* Nonzero for the 1989 C Standard, including corrigenda and amendments.  */
  unsigned char c89;

  /* Nonzero for the 1999 C Standard, including corrigenda and amendments.  */
  unsigned char c99;

  /* Nonzero means give all the error messages the ANSI standard requires.  */
  unsigned char pedantic;

  /* Nonzero means we're looking at already preprocessed code, so don't
     bother trying to do macro expansion and whatnot.  */
  unsigned char preprocessed;

  /* Nonzero disables all the standard directories for headers.  */
  unsigned char no_standard_includes;

  /* Nonzero disables the C++-specific standard directories for headers.  */
  unsigned char no_standard_cplusplus_includes;

  /* Nonzero means dump macros in some fashion; the value is one of
     dump_none, dump_only, dump_names or dump_definitions.  */
  unsigned char dump_macros;

  /* Nonzero means pass all #define and #undef directives which we
     actually process through to the output stream.  This feature is
     used primarily to allow cc1 to record the #defines and #undefs
     for the sake of debuggers which understand about preprocessor
     macros, but it may also be useful with -E to figure out how
     symbols are defined, and where they are defined.  */
  unsigned char debug_output;

  /* Nonzero means pass #include lines through to the output.  */
  unsigned char dump_includes;

  /* Print column number in error messages.  */
  unsigned char show_column;
};
|
|
|
|
|
|
/* A cpp_reader encapsulates the "state" of a pre-processor run.
|
|
Applying cpp_get_token repeatedly yields a stream of pre-processor
|
|
tokens. Usually, there is only one cpp_reader object active. */
|
|
|
|
struct cpp_reader
|
|
{
|
|
cpp_buffer *buffer;
|
|
|
|
/* A buffer used for both for cpp_get_token's output, and also internally. */
|
|
unsigned char *token_buffer;
|
|
/* Allocated size of token_buffer. CPP_RESERVE allocates space. */
|
|
unsigned int token_buffer_size;
|
|
/* End of the written part of token_buffer. */
|
|
unsigned char *limit;
|
|
|
|
/* Error counter for exit code */
|
|
int errors;
|
|
|
|
/* Line where a newline was first seen in a string constant. */
|
|
int multiline_string_line;
|
|
|
|
/* Current depth in #include directives that use <...>. */
|
|
int system_include_depth;
|
|
|
|
/* Current depth of buffer stack. */
|
|
int buffer_stack_depth;
|
|
|
|
/* Hash table of macros and assertions. See cpphash.c */
|
|
struct htab *hashtab;
|
|
|
|
/* Hash table of other included files. See cppfiles.c */
|
|
struct htab *all_include_files;
|
|
|
|
/* Chain of `actual directory' file_name_list entries,
|
|
for "" inclusion. */
|
|
struct file_name_list *actual_dirs;
|
|
|
|
/* Current maximum length of directory names in the search path
|
|
for include files. (Altered as we get more of them.) */
|
|
unsigned int max_include_len;
|
|
|
|
struct if_stack *if_stack;
|
|
|
|
long lineno;
|
|
|
|
struct tm *timebuf;
|
|
|
|
/* Buffer of -M output. */
|
|
struct deps *deps;
|
|
|
|
/* A buffer used only by read_and_prescan (in cppfiles.c), which is
|
|
allocated once per cpp_reader object to keep it off the stack. */
|
|
unsigned char *input_buffer;
|
|
size_t input_buffer_len;
|
|
|
|
/* User visible options. */
|
|
struct cpp_options opts;
|
|
|
|
/* Nonzero means we have printed (while error reporting) a list of
|
|
containing files that matches the current status. */
|
|
unsigned char input_stack_listing_current;
|
|
|
|
/* If non-zero, macros are not expanded. */
|
|
unsigned char no_macro_expand;
|
|
|
|
/* If non-zero, directives cause a hard error. Used when parsing
|
|
macro arguments. */
|
|
unsigned char no_directives;
|
|
|
|
/* We're printed a warning recommending against using #import. */
|
|
unsigned char import_warning;
|
|
|
|
/* If true, characters between '<' and '>' are a single (string) token. */
|
|
unsigned char parsing_include_directive;
|
|
|
|
/* If true, # introduces an assertion (see do_assert) */
|
|
unsigned char parsing_if_directive;
|
|
|
|
/* If true, # and ## are the STRINGIZE and TOKPASTE operators */
|
|
unsigned char parsing_define_directive;
|
|
|
|
/* True if escape sequences (as described for has_escapes in
|
|
parse_buffer) should be emitted. */
|
|
unsigned char output_escapes;
|
|
|
|
/* 0: Have seen non-white-space on this line.
|
|
1: Only seen white space so far on this line.
|
|
2: Only seen white space so far in this file. */
|
|
unsigned char only_seen_white;
|
|
|
|
/* True after cpp_start_read completes. Used to inhibit some
|
|
warnings while parsing the command line. */
|
|
unsigned char done_initializing;
|
|
};
|
|
|
|
/* Value of a reader's error counter at or above which CPP_FATAL_ERRORS
   reports true.  */
#define CPP_FATAL_LIMIT 1000
/* True if we have seen a "fatal" error.  READER is a pointer to an
   object with an `errors' counter (a cpp_reader).  */
#define CPP_FATAL_ERRORS(READER) ((READER)->errors >= CPP_FATAL_LIMIT)
|
|
|
|
/* Macros for manipulating the token_buffer.  In all of them PFILE is
   a pointer to the reader and may be evaluated more than once, so it
   must not have side effects.  */

/* Number of characters currently in PFILE's output buffer.  */
#define CPP_WRITTEN(PFILE) ((size_t)((PFILE)->limit - (PFILE)->token_buffer))
/* Pointer just past the written part of the buffer.  */
#define CPP_PWRITTEN(PFILE) ((PFILE)->limit)
/* Move the end of the written part by DELTA characters.  */
#define CPP_ADJUST_WRITTEN(PFILE,DELTA) ((PFILE)->limit += (DELTA))
/* Set the number of written characters to exactly N.  */
#define CPP_SET_WRITTEN(PFILE,N) ((PFILE)->limit = (PFILE)->token_buffer + (N))

/* Access field OPTION of the options structure nested in PFILE.  */
#define CPP_OPTION(PFILE, OPTION) ((PFILE)->opts.OPTION)
/* The buffer PFILE is currently pointing at.  */
#define CPP_BUFFER(PFILE) ((PFILE)->buffer)
|
|
|
|
/* Name under which this program was invoked.  Only declared here; the
   definition must be supplied by exactly one source file.  */
extern const char *progname;
|
|
|
|
/* Command-line handling and the token-reading entry points.  The
   (int, char **) pair is presumably argc/argv -- confirm against the
   definition.  */
extern int cpp_handle_options PARAMS ((cpp_reader *, int, char **));
extern enum cpp_token cpp_get_token PARAMS ((cpp_reader *));
extern enum cpp_token cpp_get_non_space_token PARAMS ((cpp_reader *));

/* Life cycle of a reader.  */
extern void cpp_reader_init PARAMS ((cpp_reader *));
extern int cpp_start_read PARAMS ((cpp_reader *, const char *));
extern void cpp_finish PARAMS ((cpp_reader *));
extern void cpp_cleanup PARAMS ((cpp_reader *PFILE));
|
|
|
|
extern void cpp_buf_line_and_col PARAMS((cpp_buffer *, long *, long *));
|
|
extern cpp_buffer *cpp_file_buffer PARAMS((cpp_reader *));
|
|
extern void cpp_define PARAMS ((cpp_reader *, const char *));
|
|
extern void cpp_assert PARAMS ((cpp_reader *, const char *));
|
|
extern void cpp_undef PARAMS ((cpp_reader *, const char *));
|
|
extern void cpp_unassert PARAMS ((cpp_reader *, const char *));
|
|
|
|
/* N.B. The error-message-printer prototypes have not been nicely
|
|
formatted because exgettext needs to see 'msgid' on the same line
|
|
as the name of the function in order to work properly. Only the
|
|
string argument gets a name in an effort to keep the lines from
|
|
getting ridiculously oversized. */
|
|
|
|
extern void cpp_ice PARAMS ((cpp_reader *, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_2;
|
|
extern void cpp_fatal PARAMS ((cpp_reader *, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_2;
|
|
extern void cpp_error PARAMS ((cpp_reader *, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_2;
|
|
extern void cpp_warning PARAMS ((cpp_reader *, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_2;
|
|
extern void cpp_pedwarn PARAMS ((cpp_reader *, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_2;
|
|
extern void cpp_notice PARAMS ((cpp_reader *, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_2;
|
|
extern void cpp_error_with_line PARAMS ((cpp_reader *, int, int, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_4;
|
|
extern void cpp_warning_with_line PARAMS ((cpp_reader *, int, int, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_4;
|
|
extern void cpp_pedwarn_with_line PARAMS ((cpp_reader *, int, int, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_4;
|
|
extern void cpp_pedwarn_with_file_and_line PARAMS ((cpp_reader *, const char *, int, int, const char *msgid, ...))
|
|
ATTRIBUTE_PRINTF_5;
|
|
extern void cpp_error_from_errno PARAMS ((cpp_reader *, const char *));
|
|
extern void cpp_notice_from_errno PARAMS ((cpp_reader *, const char *));
|
|
|
|
/* Buffer stack manipulation, macro lookup and in-memory scanning.
   NOTE(review): the integer arguments that follow the
   `const unsigned char *' arguments are presumably byte lengths --
   confirm against the definitions.  */
extern cpp_buffer *cpp_push_buffer PARAMS ((cpp_reader *,
					    const unsigned char *, long));
extern cpp_buffer *cpp_pop_buffer PARAMS ((cpp_reader *));
extern int cpp_defined PARAMS ((cpp_reader *, const unsigned char *, int));

extern void cpp_expand_to_buffer PARAMS ((cpp_reader *,
					  const unsigned char *, int));
extern void cpp_scan_buffer PARAMS ((cpp_reader *));
|
|
|
|
/* In cppfiles.c */
|
|
extern int cpp_included PARAMS ((cpp_reader *, const char *));
|
|
extern int cpp_read_file PARAMS ((cpp_reader *, const char *));
|
|
|
|
/* Close the extern "C" block opened near the top of this header.  */
#ifdef __cplusplus
}
#endif
#endif /* __GCC_CPPLIB__ */
|