[Top][All Lists]
[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
[Emacs-diffs] Changes to emacs/src/syntax.h [emacs-unicode-2]
From: |
Kenichi Handa |
Subject: |
[Emacs-diffs] Changes to emacs/src/syntax.h [emacs-unicode-2] |
Date: |
Mon, 08 Sep 2003 08:49:30 -0400 |
Index: emacs/src/syntax.h
diff -c /dev/null emacs/src/syntax.h:1.39.6.1
*** /dev/null Mon Sep 8 08:49:30 2003
--- emacs/src/syntax.h Mon Sep 8 08:48:12 2003
***************
*** 0 ****
--- 1,346 ----
+ /* Declarations having to do with GNU Emacs syntax tables.
+ Copyright (C) 1985, 93, 94, 97, 1998 Free Software Foundation, Inc.
+
+ This file is part of GNU Emacs.
+
+ GNU Emacs is free software; you can redistribute it and/or modify
+ it under the terms of the GNU General Public License as published by
+ the Free Software Foundation; either version 2, or (at your option)
+ any later version.
+
+ GNU Emacs is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with GNU Emacs; see the file COPYING. If not, write to
+ the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+ Boston, MA 02111-1307, USA. */
+
+
+ extern Lisp_Object Qsyntax_table_p;
+ extern void update_syntax_table P_ ((int, int, int, Lisp_Object)); /* Invoked by
+ the UPDATE_SYNTAX_TABLE... and SETUP_SYNTAX_TABLE... macros in this file
+ as (position, direction-or-count, 0 or 1, object). NOTE(review): the
+ argument meanings are inferred from those call sites only -- confirm
+ against the definition. */
+
+ /* The standard syntax table is stored where it will automatically
+ be used in all new buffers, namely in the syntax_table slot of
+ buffer_defaults. */
+ #define Vstandard_syntax_table buffer_defaults.syntax_table
+
+ /* A syntax table is a chartable whose elements are cons cells
+ (CODE+FLAGS . MATCHING-CHAR). MATCHING-CHAR can be nil if the char
+ is not a kind of parenthesis.
+
+ The low 8 bits of CODE+FLAGS are a code, as follows. The enumerators
+ have no explicit values, so they are numbered consecutively from 0:
+ Swhitespace is 0 and Smax is 16. */
+
+ enum syntaxcode
+ {
+ Swhitespace, /* for a whitespace character */
+ Spunct, /* for random punctuation characters */
+ Sword, /* for a word constituent */
+ Ssymbol, /* symbol constituent but not word constituent */
+ Sopen, /* for a beginning delimiter */
+ Sclose, /* for an ending delimiter */
+ Squote, /* for a prefix character like Lisp ' */
+ Sstring, /* for a string-grouping character like Lisp " */
+ Smath, /* for delimiters like $ in TeX. */
+ Sescape, /* for a character that begins a C-style escape */
+ Scharquote, /* for a character that quotes the following character */
+ Scomment, /* for a comment-starting character */
+ Sendcomment, /* for a comment-ending character */
+ Sinherit, /* use the standard syntax table for this character */
+ Scomment_fence, /* Starts/ends comment which is delimited on the
+ other side by any char with the same syntaxcode. */
+ Sstring_fence, /* Starts/ends string which is delimited on the
+ other side by any char with the same syntaxcode. */
+ Smax /* Upper bound on codes that are meaningful
+ (one more than the last real code). */
+ };
+
+ /* Set the syntax entry VAL for char C in table TABLE.
+ This is a thin wrapper around CHAR_TABLE_SET; every argument is
+ passed through parenthesized. */
+
+ #define SET_RAW_SYNTAX_ENTRY(table, c, val) \
+   CHAR_TABLE_SET ((table), (c), (val))
+
+ /* Set the syntax entry VAL for char-range RANGE in table TABLE.
+ RANGE is a cons (FROM . TO) specifying the range of characters.
+ This is a thin wrapper around Fset_char_table_range. */
+
+ #define SET_RAW_SYNTAX_ENTRY_RANGE(table, range, val) \
+   Fset_char_table_range ((table), (range), (val))
+
+ /* SYNTAX_ENTRY fetches the information from the entry for character C
+ in the current syntax table (CURRENT_SYNTAX_TABLE), or from globally
+ kept data (gl_state). Does inheritance.
+
+ When SYNTAX_ENTRY_VIA_PROPERTY is defined, SYNTAX_ENTRY (c) yields
+ gl_state.global_code if gl_state.use_global is nonzero and otherwise
+ looks C up with SYNTAX_ENTRY_INT. When it is not defined,
+ SYNTAX_ENTRY is simply another name for SYNTAX_ENTRY_INT. */
+ /* CURRENT_SYNTAX_TABLE gives the syntax table valid for the current
+ position; it is either the buffer's syntax table, or a syntax table
+ found in text properties. Concretely it expands to
+ gl_state.current_syntax_table when SYNTAX_ENTRY_VIA_PROPERTY is
+ defined, and to current_buffer->syntax_table otherwise.
+
+ SYNTAX_ENTRY_INT (c), defined after the conditional, is the plain
+ CHAR_TABLE_REF lookup of C in CURRENT_SYNTAX_TABLE. */
+
+ #ifdef SYNTAX_ENTRY_VIA_PROPERTY
+ # define SYNTAX_ENTRY(c) \
+ (gl_state.use_global ? gl_state.global_code : SYNTAX_ENTRY_INT (c))
+ # define CURRENT_SYNTAX_TABLE gl_state.current_syntax_table
+ #else
+ # define SYNTAX_ENTRY SYNTAX_ENTRY_INT
+ # define CURRENT_SYNTAX_TABLE current_buffer->syntax_table
+ #endif
+
+ #define SYNTAX_ENTRY_INT(c) CHAR_TABLE_REF (CURRENT_SYNTAX_TABLE, (c))
+
+ /* Extract the information from the entry for character C
+ in the current syntax table.
+
+ SYNTAX (c) gives the syntax code (the low 8 bits of CODE+FLAGS) as
+ an enum syntaxcode, SYNTAX_WITH_FLAGS (c) gives the whole CODE+FLAGS
+ integer, and SYNTAX_MATCH (c) gives MATCHING-CHAR. When the entry
+ is not a cons they yield Swhitespace, (int) Swhitespace and Qnil
+ respectively.
+
+ The GCC versions are statement expressions that keep the entry in a
+ block-local variable. Its name ends in an underscore so that an
+ argument expression mentioning a variable called `temp' is not
+ captured by the macro's own local. The portable versions keep the
+ entry in the global variable syntax_temp instead. */
+
+ #ifdef __GNUC__
+ #define SYNTAX(c) \
+   ({ Lisp_Object syntax_entry_; \
+      syntax_entry_ = SYNTAX_ENTRY (c); \
+      (CONSP (syntax_entry_) \
+       ? (enum syntaxcode) (XINT (XCAR (syntax_entry_)) & 0xff) \
+       : Swhitespace); })
+
+ #define SYNTAX_WITH_FLAGS(c) \
+   ({ Lisp_Object syntax_entry_; \
+      syntax_entry_ = SYNTAX_ENTRY (c); \
+      (CONSP (syntax_entry_) \
+       ? XINT (XCAR (syntax_entry_)) \
+       : (int) Swhitespace); })
+
+ #define SYNTAX_MATCH(c) \
+   ({ Lisp_Object syntax_entry_; \
+      syntax_entry_ = SYNTAX_ENTRY (c); \
+      (CONSP (syntax_entry_) \
+       ? XCDR (syntax_entry_) \
+       : Qnil); })
+ #else
+ extern Lisp_Object syntax_temp;
+ #define SYNTAX(c) \
+   (syntax_temp = SYNTAX_ENTRY ((c)), \
+    (CONSP (syntax_temp) \
+     ? (enum syntaxcode) (XINT (XCAR (syntax_temp)) & 0xff) \
+     : Swhitespace))
+
+ #define SYNTAX_WITH_FLAGS(c) \
+   (syntax_temp = SYNTAX_ENTRY ((c)), \
+    (CONSP (syntax_temp) \
+     ? XINT (XCAR (syntax_temp)) \
+     : (int) Swhitespace))
+
+ #define SYNTAX_MATCH(c) \
+   (syntax_temp = SYNTAX_ENTRY ((c)), \
+    (CONSP (syntax_temp) \
+     ? XCDR (syntax_temp) \
+     : Qnil))
+ #endif
+
+ /* Then there are seven single-bit flags that have the following meanings:
+ 1. This character is the first of a two-character comment-start sequence.
+ 2. This character is the second of a two-character comment-start sequence.
+ 3. This character is the first of a two-character comment-end sequence.
+ 4. This character is the second of a two-character comment-end sequence.
+ 5. This character is a prefix, for backward-prefix-chars.
+ 6. see below
+ 7. This character is part of a nestable comment sequence.
+ Note that any two-character sequence whose first character has flag 1
+ and whose second character has flag 2 will be interpreted as a comment start.
+
+ Flag 6 is used to discriminate between two different comment styles.
+ Languages such as C++ allow two orthogonal syntax start/end pairs
+ and flag 6 is used to determine whether a comment-end or Sendcomment
+ ends style a or b. Comment start sequences can start style a or b.
+ Style a is always the default.
+
+ Flags 1 through 7 are stored in bits 16 through 22 of CODE+FLAGS,
+ as the shift counts in the extraction macros below show.
+ */
+
+ /* These macros extract a particular flag for a given character.
+ Each one fetches the CODE+FLAGS integer of C with SYNTAX_WITH_FLAGS
+ and passes it to the SYNTAX_FLAGS_... macro of the same name, so the
+ bit positions are spelled out in one place only. The value is 0 or 1. */
+
+ #define SYNTAX_COMSTART_FIRST(c) \
+   SYNTAX_FLAGS_COMSTART_FIRST (SYNTAX_WITH_FLAGS (c))
+
+ #define SYNTAX_COMSTART_SECOND(c) \
+   SYNTAX_FLAGS_COMSTART_SECOND (SYNTAX_WITH_FLAGS (c))
+
+ #define SYNTAX_COMEND_FIRST(c) \
+   SYNTAX_FLAGS_COMEND_FIRST (SYNTAX_WITH_FLAGS (c))
+
+ #define SYNTAX_COMEND_SECOND(c) \
+   SYNTAX_FLAGS_COMEND_SECOND (SYNTAX_WITH_FLAGS (c))
+
+ #define SYNTAX_PREFIX(c) \
+   SYNTAX_FLAGS_PREFIX (SYNTAX_WITH_FLAGS (c))
+
+ #define SYNTAX_COMMENT_STYLE(c) \
+   SYNTAX_FLAGS_COMMENT_STYLE (SYNTAX_WITH_FLAGS (c))
+
+ #define SYNTAX_COMMENT_NESTED(c) \
+   SYNTAX_FLAGS_COMMENT_NESTED (SYNTAX_WITH_FLAGS (c))
+
+ /* These macros extract specific flags from an integer
+ that holds the syntax code and the flags. Each one shifts FLAGS
+ right by a fixed count (16 for COMSTART_FIRST up to 22 for
+ COMMENT_NESTED) and masks with 1, so the value is 0 or 1. */
+
+ #define SYNTAX_FLAGS_COMSTART_FIRST(flags) (((flags) >> 16) & 1)
+
+ #define SYNTAX_FLAGS_COMSTART_SECOND(flags) (((flags) >> 17) & 1)
+
+ #define SYNTAX_FLAGS_COMEND_FIRST(flags) (((flags) >> 18) & 1)
+
+ #define SYNTAX_FLAGS_COMEND_SECOND(flags) (((flags) >> 19) & 1)
+
+ #define SYNTAX_FLAGS_PREFIX(flags) (((flags) >> 20) & 1)
+
+ #define SYNTAX_FLAGS_COMMENT_STYLE(flags) (((flags) >> 21) & 1)
+
+ #define SYNTAX_FLAGS_COMMENT_NESTED(flags) (((flags) >> 22) & 1)
+
+ /* This array, indexed by a character, contains the syntax code which that
+ character signifies (as a char). For example,
+ (enum syntaxcode) syntax_spec_code['w'] is Sword.
+ The size 0400 is octal, i.e. 256 entries. */
+
+ extern unsigned char syntax_spec_code[0400];
+
+ /* Indexed by syntax code, give the letter that describes it.
+ The 16 entries match the 16 codes below Smax in enum syntaxcode. */
+
+ extern char syntax_code_spec[16];
+
+ /* Convert the byte offset BYTEPOS into a character position,
+ for the object recorded in gl_state with SETUP_SYNTAX_TABLE_FOR_OBJECT.
+
+ The value is meant for use in the UPDATE_SYNTAX_TABLE... macros.
+ These macros do nothing when parse_sexp_lookup_properties is 0,
+ so we return 0 in that case, for speed.
+
+ Otherwise the conversion depends on gl_state.object:
+ - a string: string_byte_to_char on that string;
+ - a buffer: the position relative to that buffer's BEGV, computed
+ with buf_bytepos_to_charpos;
+ - nil: the position relative to BEGV of the current buffer, computed
+ with BYTE_TO_CHAR;
+ - anything else: BYTEPOS is returned unchanged. */
+
+ #define SYNTAX_TABLE_BYTE_TO_CHAR(bytepos) \
+   (! parse_sexp_lookup_properties \
+    ? 0 \
+    : STRINGP (gl_state.object) \
+    ? string_byte_to_char (gl_state.object, (bytepos)) \
+    : BUFFERP (gl_state.object) \
+    ? (buf_bytepos_to_charpos \
+       (XBUFFER (gl_state.object), \
+        (bytepos) + BUF_BEGV_BYTE (XBUFFER (gl_state.object)) - 1) \
+       - BUF_BEGV (XBUFFER (gl_state.object)) + 1) \
+    : NILP (gl_state.object) \
+    ? BYTE_TO_CHAR ((bytepos) + BEGV_BYTE - 1) - BEGV + 1 \
+    : (bytepos))
+
+ /* Make syntax table state (gl_state) good for CHARPOS, assuming it is
+ currently good for a position before CHARPOS.
+ update_syntax_table is called only when parse_sexp_lookup_properties
+ is nonzero and CHARPOS has reached gl_state.e_property. The value
+ is 1 if that call was made and 0 otherwise. */
+
+ #define UPDATE_SYNTAX_TABLE_FORWARD(charpos) \
+   (parse_sexp_lookup_properties \
+    && (charpos) >= gl_state.e_property \
+    && (update_syntax_table ((charpos) + gl_state.offset, 1, 0, \
+                             gl_state.object), \
+        1))
+
+ /* Make syntax table state (gl_state) good for CHARPOS, assuming it is
+ currently good for a position after CHARPOS.
+ update_syntax_table is called only when parse_sexp_lookup_properties
+ is nonzero and CHARPOS lies before gl_state.b_property. The value
+ is 1 if that call was made and 0 otherwise. */
+
+ #define UPDATE_SYNTAX_TABLE_BACKWARD(charpos) \
+   (parse_sexp_lookup_properties \
+    && (charpos) < gl_state.b_property \
+    && (update_syntax_table ((charpos) + gl_state.offset, -1, 0, \
+                             gl_state.object), \
+        1))
+
+ /* Make syntax table good for CHARPOS.
+ The backward update is tried first; the forward update is tried
+ only if the backward one did nothing. The value is 1 if either
+ update ran and 0 otherwise. */
+
+ #define UPDATE_SYNTAX_TABLE(charpos) \
+   (UPDATE_SYNTAX_TABLE_BACKWARD (charpos) \
+    || UPDATE_SYNTAX_TABLE_FORWARD (charpos))
+
+ /* This macro should be called with FROM at the start of forward
+ search, or after the last position of the backward search. It
+ makes sure that the first char is picked up with correct table, so
+ one does not need to call UPDATE_SYNTAX_TABLE immediately after the
+ call.
+ Sign of COUNT gives the direction of the search.
+
+ The macro resets gl_state to cover the accessible part of the
+ current buffer (BEGV up to ZV + 1) with the buffer's own syntax
+ table. If parse_sexp_lookup_properties is nonzero, it then calls
+ update_syntax_table for FROM (when COUNT is positive) or FROM - 1
+ (otherwise), unless the search is backward and FROM is not beyond
+ BEGV.
+
+ The expansion has the form `if (1) { ... } else', so an invocation
+ must be followed by a semicolon, which becomes the empty else
+ branch.
+ */
+
+ #define SETUP_SYNTAX_TABLE(FROM, COUNT) \
+   if (1) \
+     { \
+       gl_state.b_property = BEGV; \
+       gl_state.e_property = ZV + 1; \
+       gl_state.object = Qnil; \
+       gl_state.use_global = 0; \
+       gl_state.offset = 0; \
+       gl_state.current_syntax_table = current_buffer->syntax_table; \
+       if (parse_sexp_lookup_properties) \
+         if ((COUNT) > 0 || (FROM) > BEGV) \
+           update_syntax_table ((COUNT) > 0 ? (FROM) : (FROM) - 1, (COUNT), \
+                                1, Qnil); \
+     } \
+   else
+
+ /* Same as SETUP_SYNTAX_TABLE, but in OBJECT. If OBJECT is nil, use
+ current buffer. If it is t, ignore properties altogether.
+
+ This is meant for regex.c to use. For buffers, regex.c passes arguments
+ to the UPDATE_SYNTAX_TABLE macros which are relative to BEGV.
+ So if it is a buffer (or nil, meaning the current buffer), we set the
+ offset field to BEGV - 1 and make b_property/e_property relative to
+ BEGV as well. For any other object the offset is 0; for t the
+ e_property bound is the large constant 1500000000 (NOTE(review):
+ presumably chosen so that the forward-update test never fires --
+ confirm), and for everything else it is 1 + SCHARS (OBJECT).
+
+ COUNT is parenthesized at every use so that an argument containing
+ a low-precedence operator (e.g. a conditional expression) is
+ compared and passed as a whole.
+
+ The expansion has the form `if (1) { ... } else', so an invocation
+ must be followed by a semicolon. */
+
+ #define SETUP_SYNTAX_TABLE_FOR_OBJECT(OBJECT, FROM, COUNT) \
+   if (1) \
+     { \
+       gl_state.object = (OBJECT); \
+       if (BUFFERP (gl_state.object)) \
+         { \
+           struct buffer *buf = XBUFFER (gl_state.object); \
+           gl_state.b_property = 1; \
+           gl_state.e_property = BUF_ZV (buf) - BUF_BEGV (buf) + 1; \
+           gl_state.offset = BUF_BEGV (buf) - 1; \
+         } \
+       else if (NILP (gl_state.object)) \
+         { \
+           gl_state.b_property = 1; \
+           gl_state.e_property = ZV - BEGV + 1; \
+           gl_state.offset = BEGV - 1; \
+         } \
+       else if (EQ (gl_state.object, Qt)) \
+         { \
+           gl_state.b_property = 0; \
+           gl_state.e_property = 1500000000; \
+           gl_state.offset = 0; \
+         } \
+       else \
+         { \
+           gl_state.b_property = 0; \
+           gl_state.e_property = 1 + SCHARS (gl_state.object); \
+           gl_state.offset = 0; \
+         } \
+       gl_state.use_global = 0; \
+       gl_state.current_syntax_table = current_buffer->syntax_table; \
+       if (parse_sexp_lookup_properties) \
+         update_syntax_table (((FROM) + gl_state.offset \
+                               + ((COUNT) > 0 ? 0 : -1)), \
+                              (COUNT), 1, gl_state.object); \
+     } \
+   else
+
+ struct gl_state_s /* Scanning state read and written by the SYNTAX_ENTRY,
+ UPDATE_SYNTAX_TABLE... and SETUP_SYNTAX_TABLE...
+ macros in this file. */
+ {
+ Lisp_Object object; /* The object we are scanning. */
+ int start; /* Where to stop. NOTE(review): same wording as
+ the comment on `stop'; presumably the limit for
+ backward scans -- confirm. */
+ int stop; /* Where to stop. */
+ int use_global; /* Whether to use global_code
+ or current_syntax_table (abbreviated
+ c_s_t in the comments here). */
+ Lisp_Object global_code; /* Syntax code of current char. */
+ Lisp_Object current_syntax_table; /* Syntax table for current pos. */
+ Lisp_Object old_prop; /* Syntax-table prop at prev pos. */
+ int b_property; /* First index where c_s_t is valid. */
+ int e_property; /* First index where c_s_t is
+ not valid. */
+ INTERVAL forward_i; /* Where to start lookup on forward */
+ INTERVAL backward_i; /* or backward movement. The
+ data in c_s_t is valid
+ between these intervals,
+ and possibly at the
+ intervals too, depending
+ on: (NOTE(review): this sentence
+ is left unfinished in the original
+ comment.) */
+ /* Offset for positions specified to UPDATE_SYNTAX_TABLE.
+ The UPDATE_SYNTAX_TABLE... macros add it to CHARPOS before calling
+ update_syntax_table. */
+ int offset;
+ };
+
+ extern struct gl_state_s gl_state; /* The single state object used by the macros above. */
+ extern int parse_sexp_lookup_properties; /* When zero, the UPDATE_SYNTAX_TABLE...
+ macros above do nothing. */
+ extern INTERVAL interval_of P_ ((int, Lisp_Object));
+
+ extern int scan_words P_ ((int, int));
[Prev in Thread] |
Current Thread |
[Next in Thread] |
- [Emacs-diffs] Changes to emacs/src/syntax.h [emacs-unicode-2],
Kenichi Handa <=