* jcf-parse.c (parse_class_file): Use linemap_line_start. (parse_source_file_1): Pass filename as extra parameter, so we can call linemap_add and set input_location here, rather than in both callers. (read_class): Pass copied filename to parse_source_file_1. Don't initialize wfl_operator - only needed for source compilation. (read_class, jcf_parse): Call linemap_add with LC_LEAVE. * lex.h: Remove a bunch of debugging macros. * lex.h (struct_java_line, struct java_error): Remove types. (JAVA_COLUMN_DELTA): Remove - use java_lexer.next_colums instead. (struct java_lc_s): Remove prev_col field. (struct java_lexer): New fields next_unicode, next_columns, and avail_unicode. New position field, and maybe token_start field. Don't need hit_eof field - use next_unicode == -1 instead. (JAVA_INTEGERAL_RANGE_ERROR): Rename to JAVA_RANGE_ERROR. (JAVA_RANGE_ERROR, JAVA_FLOAT_ANGE_ERROR): Update accordingly. * parse.h: Various changes for USE_MAPPED_LOCATION. (EXPR_WFL_EMIT_LINE_NOTE): XXX (BUILD_EXPR_WFL, EXPR_WFL_ADD_COL): Remove no-longer-used macros. (struct parser_ctxt): New file_start_location field. Remove p_line, c_line fields since we no longer save lines. Remove elc, lineno, and current_jcf fields - no longer used. * parse.y: Updates for USE_MAPPED_LOCATION and new lexer. Don't use EXPR_WFL_ADD_COL since that isn't trivial with source_location and is probably not needed anymore anyway. Use new expr_add_Location function. (SET_EXPR_LOCATION_FROM_TOKEN): New convenience macro. (java_pop_parser_context): Minor cleanup. (java_parser_context_save_global, java_parser_context_restore_global, java_pop_parser_context): Save/restore input_location as a unit. (issue_warning_error_from_context): If USE_MAPPED_LOCATION take a source_location instead of a wfl context node. (check_class_interface_creation): input_filename is not addressable. (create_artificial_method): Calling java_parser_context_save_global and java_parser_context_restore_global is overkill. Instead, temporarily set input_location from class decl. (java_layout_seen_class_methods): Set input_location from method decl. (fix_constructors): Make more robust if no EXPR_WITH_FILE_LOCATION. (finish_loop_body): Likewise. * lex.c: Updates for USE_MAPPED_LOCATION. Use build_unknwon_wfl. (java_sprint_unicode): Take a character, not index in line. (java_sneak_uncode): Replaced by java_peek_unicode. (java_unget_unicode): No longer used. (java_allocate_new_line. java_store_unicode): Removed, since we no longer remember "lines". (java_new_lexer): Update for new data structures. (java_read_char): Move unget_value checking to java_read_unicode. (java_get_unicode, java_peek_unicode, java_next_unicode): New more efficient functions that are used directly when lexing. (java_read_unicode_collapsing_terminators): No longer needed. (java_parse_end_comment, java_parse_escape_sequence, do_java_lex): Re-organize to use java_peek_unicode to avoid java_unget_unicode. (java_parse_escape_sequence): Rewrite to be simpler / more efficient. (do_java_lex): Lots of movings around to avoid java_unget_unicode, combine switch branches, and test for common token kinds earlier. (java_lex_error): Rewrite. * jv-scan.c (expand_location): New function, copied from tree.c. (main): Set ctxp->filename instead of setting input_filename directly. From-SVN: r88367
244 lines
7.9 KiB
C
244 lines
7.9 KiB
C
/* Language lexer definitions for the GNU compiler for the Java(TM) language.
|
|
Copyright (C) 1997, 1998, 1999, 2000, 2001, 2002, 2003
|
|
Free Software Foundation, Inc.
|
|
Contributed by Alexandre Petit-Bianco (apbianco@cygnus.com)
|
|
|
|
This file is part of GCC.
|
|
|
|
GCC is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 2, or (at your option)
|
|
any later version.
|
|
|
|
GCC is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with GCC; see the file COPYING. If not, write to
|
|
the Free Software Foundation, 59 Temple Place - Suite 330,
|
|
Boston, MA 02111-1307, USA.
|
|
|
|
Java and all Java-based marks are trademarks or registered trademarks
|
|
of Sun Microsystems, Inc. in the United States and other countries.
|
|
The Free Software Foundation is independent of Sun Microsystems, Inc. */
|
|
|
|
#ifndef GCC_JAVA_LEX_H
|
|
#define GCC_JAVA_LEX_H
|
|
|
|
#include "input.h"
|
|
|
|
/* Extern global variables declarations */
|
|
extern FILE *finput;
|
|
|
|
/* A Unicode character, as read from the input file */
|
|
typedef unsigned short unicode_t;
|
|
|
|
#if defined HAVE_ICONV_H && defined HAVE_ICONV
|
|
#include <iconv.h>
|
|
#endif /* HAVE_ICONV */
|
|
|
|
/* Default encoding to use if no encoding is specified. */
|
|
#define DEFAULT_ENCODING "UTF-8"
|
|
|
|
typedef struct java_lc_s GTY(()) {
|
|
int line; /* line number (1-based) */
|
|
int col; /* column number number (1-based) */
|
|
} java_lc;
|
|
|
|
struct java_lexer
|
|
{
|
|
/* The file from which we're reading. */
|
|
FILE *finput;
|
|
|
|
/* Number of consecutive backslashes we've read. */
|
|
int bs_count;
|
|
|
|
/* Next available Unicode character.
|
|
* This is post-Unicode-escape-processing. -1 if EOF. */
|
|
int next_unicode;
|
|
|
|
/* True if next_unicode is next available character, or EOF. */
|
|
bool avail_unicode;
|
|
|
|
/* Number of source columns of the previous Unicode character (next_unicode).
|
|
If next_unicode==-2, then this is the number of columns of the previous
|
|
Unicode character (most recent result of java_{get,peek}_unicode). */
|
|
int next_columns;
|
|
|
|
/* If nonzero, a value that was pushed back. This is a unicode character,
|
|
but (unlike next_unicode) is pre-'\uXXXX'-processing. It is also used
|
|
when a '\r' is *not* followed by a '\n'. */
|
|
unicode_t unget_value;
|
|
|
|
/* Name of the character encoding we're using. */
|
|
const char *encoding;
|
|
|
|
/* Current source position. */
|
|
java_lc position;
|
|
|
|
#ifndef USE_MAPPED_LOCATION
|
|
java_lc token_start; /* Error's line column info */
|
|
#endif
|
|
|
|
#ifdef HAVE_ICONV
|
|
/* Nonzero if we've read any bytes. We only recognize the
|
|
byte-order-marker (BOM) as the first word. */
|
|
unsigned int read_anything : 1;
|
|
|
|
/* Nonzero if we have to byte swap. */
|
|
unsigned int byte_swap : 1;
|
|
|
|
/* Nonzero if we're using the fallback decoder. */
|
|
unsigned int use_fallback : 1;
|
|
|
|
/* The handle for the iconv converter we're using. */
|
|
iconv_t handle;
|
|
|
|
/* Bytes we've read from the file but have not sent to iconv. */
|
|
char buffer[1024];
|
|
|
|
/* Index of first valid character in buffer, -1 if no valid
|
|
characters. */
|
|
int first;
|
|
|
|
/* Index of last valid character in buffer, plus one. -1 if no
|
|
valid characters in buffer. */
|
|
int last;
|
|
|
|
/* This is a buffer of characters already converted by iconv. We
|
|
use `char' here because we're assuming that iconv() converts to
|
|
UCS-2, and then we convert it ourselves. */
|
|
unsigned char out_buffer[1024];
|
|
|
|
/* Index of first valid output character. -1 if no valid
|
|
characters. */
|
|
int out_first;
|
|
|
|
/* Index of last valid output character, plus one. -1 if no valid
|
|
characters. */
|
|
int out_last;
|
|
|
|
#endif /* HAVE_ICONV */
|
|
};
|
|
typedef struct java_lexer java_lexer;
|
|
|
|
/* Destroy a lexer object. */
|
|
extern void java_destroy_lexer (java_lexer *);
|
|
|
|
#define JAVA_LINE_MAX 80
|
|
|
|
/* Build a location compound integer */
|
|
#ifdef USE_MAPPED_LOCATION
|
|
#define BUILD_LOCATION() input_location
|
|
#else
|
|
#define BUILD_LOCATION() ((ctxp->lexer->token_start.line << 12) \
|
|
| (ctxp->lexer->token_start.col & 0xfff))
|
|
#endif
|
|
|
|
/* Those macros are defined differently if we compile jc1-lite
|
|
(JC1_LITE defined) or jc1. */
|
|
#ifdef JC1_LITE
|
|
|
|
#define DCONST0 0
|
|
#define REAL_VALUE_TYPE int
|
|
#define GET_IDENTIFIER(S) xstrdup ((S))
|
|
#define REAL_VALUE_ATOF(LIT,MODE) 0
|
|
#define REAL_VALUE_ISINF(VALUE) 0
|
|
#define REAL_VALUE_ISNAN(VALUE) 0
|
|
#define SET_REAL_VALUE_ATOF(TARGET,SOURCE)
|
|
#define FLOAT_TYPE_NODE 0
|
|
#define DOUBLE_TYPE_NODE 0
|
|
#define SET_MODIFIER_CTX(TOKEN) java_lval->value = (TOKEN)
|
|
#define GET_TYPE_PRECISION(NODE) 4
|
|
#define BUILD_OPERATOR(TOKEN) return TOKEN
|
|
#define BUILD_OPERATOR2(TOKEN) return ASSIGN_ANY_TK
|
|
#define SET_LVAL_NODE(NODE)
|
|
#define BUILD_ID_WFL(EXP) (EXP)
|
|
#define JAVA_FLOAT_RANGE_ERROR(S) {}
|
|
#define JAVA_RANGE_ERROR(S) do { } while (0)
|
|
|
|
#else
|
|
|
|
#define DCONST0 dconst0
|
|
#define GET_IDENTIFIER(S) get_identifier ((S))
|
|
#define SET_REAL_VALUE_ATOF(TARGET,SOURCE) (TARGET) = (SOURCE)
|
|
#define FLOAT_TYPE_NODE float_type_node
|
|
#define DOUBLE_TYPE_NODE double_type_node
|
|
/* Set modifier_ctx according to TOKEN */
|
|
#define SET_MODIFIER_CTX(TOKEN) \
|
|
{ \
|
|
ctxp->modifier_ctx [(TOKEN)-PUBLIC_TK] = build_wfl_node (NULL_TREE); \
|
|
java_lval->value = (TOKEN)-PUBLIC_TK; \
|
|
}
|
|
/* Type precision for long */
|
|
#define GET_TYPE_PRECISION(NODE) TYPE_PRECISION (long_type_node) / 8;
|
|
/* Build an operator tree node and return TOKEN */
|
|
#define BUILD_OPERATOR(TOKEN) \
|
|
{ \
|
|
java_lval->operator.token = (TOKEN); \
|
|
java_lval->operator.location = BUILD_LOCATION(); \
|
|
return (TOKEN); \
|
|
}
|
|
|
|
/* Build an operator tree node but return ASSIGN_ANY_TK */
|
|
#define BUILD_OPERATOR2(TOKEN) \
|
|
{ \
|
|
java_lval->operator.token = (TOKEN); \
|
|
java_lval->operator.location = BUILD_LOCATION(); \
|
|
return ASSIGN_ANY_TK; \
|
|
}
|
|
/* Set java_lval->node and TREE_TYPE(java_lval->node) in macros */
|
|
#define SET_LVAL_NODE(NODE) java_lval->node = (NODE)
|
|
/* Wrap identifier around a wfl */
|
|
#define BUILD_ID_WFL(EXP) build_wfl_node ((EXP))
|
|
/* Special ways to report error on numeric literals */
|
|
#define JAVA_FLOAT_RANGE_ERROR(m) \
|
|
{ \
|
|
char *msg = xmalloc (100 + strlen (m)); \
|
|
sprintf (msg, "Floating point literal exceeds range of `%s'", (m)); \
|
|
JAVA_RANGE_ERROR(msg); \
|
|
free (msg); \
|
|
}
|
|
#define JAVA_RANGE_ERROR(msg) \
|
|
do { \
|
|
int save_col = ctxp->lexer->position.col; \
|
|
ctxp->lexer->position.col = number_beginning; \
|
|
java_lex_error (msg, 0); \
|
|
ctxp->lexer->position.col = save_col; \
|
|
} while (0)
|
|
|
|
#endif /* Definitions for jc1 compilation only */
|
|
|
|
/* Macros to decode character ranges */
|
|
#define RANGE(c, l, h) (((c) >= l && (c) <= h))
|
|
#define JAVA_WHITE_SPACE_P(c) (c == ' ' || c == '\t' || c == '\f')
|
|
#define JAVA_START_CHAR_P(c) ((c < 128 \
|
|
&& (ISIDST (c) || c == '$')) \
|
|
|| (c >= 128 && java_start_char_p (c)))
|
|
#define JAVA_PART_CHAR_P(c) ((c < 128 \
|
|
&& (ISIDNUM (c) \
|
|
|| c == '$' \
|
|
|| c == 0x0000 \
|
|
|| RANGE (c, 0x01, 0x08) \
|
|
|| RANGE (c, 0x0e, 0x1b) \
|
|
|| c == 0x7f)) \
|
|
|| (c >= 128 && java_part_char_p (c)))
|
|
#define JAVA_ASCII_DIGIT(c) ISDIGIT (c)
|
|
#define JAVA_ASCII_OCTDIGIT(c) RANGE (c, '0', '7')
|
|
#define JAVA_ASCII_HEXDIGIT(c) ISXDIGIT (c)
|
|
#define JAVA_ASCII_FPCHAR(c) (RANGE (c, 'd', 'f') || RANGE (c, 'D', 'F') || \
|
|
c == '.' || JAVA_ASCII_DIGIT (c))
|
|
#define JAVA_FP_SUFFIX(c) (c == 'D' || c == 'd' || c == 'f' || c == 'F')
|
|
#define JAVA_FP_EXP(c) (c == 'E' || c == 'F')
|
|
#define JAVA_FP_PM(c) (c == '-' || c == '+')
|
|
#define JAVA_ASCII_LETTER(c) ISALPHA (c)
|
|
|
|
/* Constants */
|
|
#define JAVA_READ_BUFFER 256
|
|
#define JAVA_CHAR_ERROR -2
|
|
#define UEOF -1
|
|
|
|
#endif /* ! GCC_JAVA_LEX_H */
|