annotate src/regex.h @ 510:5bdbc721d46a

[xemacs-hg @ 2001-05-06 08:33:35 by ben] implement printing the selection when it's selected. force redisplay when set-charset-ccl-program called. if bytecomp or byte-optimize need recompiling, then load the .el version of them first, recompile them, and reload the .elc versions to recompile everything else (so we won't be waiting until the cows come home).
author ben
date Sun, 06 May 2001 08:33:41 +0000
parents 7039e6323819
children b39c14581166
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
1 /* Definitions for data structures and routines for the regular
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
2 expression library, version 0.12.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
3
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
4 Copyright (C) 1985, 89, 90, 91, 92, 93, 95 Free Software Foundation, Inc.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
5
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
6 This program is free software; you can redistribute it and/or modify
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
7 it under the terms of the GNU General Public License as published by
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
8 the Free Software Foundation; either version 2, or (at your option)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
9 any later version.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
10
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
11 This program is distributed in the hope that it will be useful,
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
14 GNU General Public License for more details.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
15
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
16 You should have received a copy of the GNU General Public License
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
17 along with this program; see the file COPYING. If not, write to
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
18 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
19 Boston, MA 02111-1307, USA. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
20
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
21 /* Synched up with: FSF 19.29. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
22
440
8de8e3f6228a Import from CVS: tag r21-2-28
cvs
parents: 428
diff changeset
23 #ifndef INCLUDED_regex_h_
8de8e3f6228a Import from CVS: tag r21-2-28
cvs
parents: 428
diff changeset
24 #define INCLUDED_regex_h_
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
25
446
1ccc32a20af4 Import from CVS: tag r21-2-38
cvs
parents: 442
diff changeset
26 #ifdef emacs
1ccc32a20af4 Import from CVS: tag r21-2-38
cvs
parents: 442
diff changeset
27 #define RE_TRANSLATE_TYPE Lisp_Object
1ccc32a20af4 Import from CVS: tag r21-2-38
cvs
parents: 442
diff changeset
28 #else
1ccc32a20af4 Import from CVS: tag r21-2-38
cvs
parents: 442
diff changeset
29 #define RE_TRANSLATE_TYPE char *
1ccc32a20af4 Import from CVS: tag r21-2-38
cvs
parents: 442
diff changeset
30 #endif /* emacs */
1ccc32a20af4 Import from CVS: tag r21-2-38
cvs
parents: 442
diff changeset
31
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
32 /* POSIX says that <sys/types.h> must be included (by the caller) before
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
33 <regex.h>. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
34
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
35
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
36 /* The following bits are used to determine the regexp syntax we
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
37 recognize. The not-set meaning typically corresponds to the syntax
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
38 used by Emacs (the exception is RE_INTERVAL, made for historical
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
39 reasons). The bits are given in alphabetical order, and the
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
40 definitions shifted by one from the previous bit; thus, when we add or
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
41 remove a bit, only one other definition need change. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
42 typedef unsigned reg_syntax_t;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
43
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
44 /* If this bit is not set, then \ inside a bracket expression is literal.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
45 If set, then such a \ quotes the following character. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
46 #define RE_BACKSLASH_ESCAPE_IN_LISTS (1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
47
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
48 /* If this bit is not set, then + and ? are operators, and \+ and \? are
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
49 literals.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
50 If set, then \+ and \? are operators and + and ? are literals. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
51 #define RE_BK_PLUS_QM (RE_BACKSLASH_ESCAPE_IN_LISTS << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
52
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
53 /* If this bit is set, then character classes are supported. They are:
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
54 [:alpha:], [:upper:], [:lower:], [:digit:], [:alnum:], [:xdigit:],
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
55 [:space:], [:print:], [:punct:], [:graph:], and [:cntrl:].
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
56 If not set, then character classes are not supported. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
57 #define RE_CHAR_CLASSES (RE_BK_PLUS_QM << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
58
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
59 /* If this bit is set, then ^ and $ are always anchors (outside bracket
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
60 expressions, of course).
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
61 If this bit is not set, then it depends:
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
62 ^ is an anchor if it is at the beginning of a regular
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
63 expression or after an open-group or an alternation operator;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
64 $ is an anchor if it is at the end of a regular expression, or
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
65 before a close-group or an alternation operator.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
66
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
67 This bit could be (re)combined with RE_CONTEXT_INDEP_OPS, because
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
68 POSIX draft 11.2 says that * etc. in leading positions is undefined.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
69 We already implemented a previous draft which made those constructs
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
70 invalid, though, so we haven't changed the code back. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
71 #define RE_CONTEXT_INDEP_ANCHORS (RE_CHAR_CLASSES << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
72
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
73 /* If this bit is set, then special characters are always special
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
74 regardless of where they are in the pattern.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
75 If this bit is not set, then special characters are special only in
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
76 some contexts; otherwise they are ordinary. Specifically,
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
77 * + ? and intervals are only special when not after the beginning,
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
78 open-group, or alternation operator. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
79 #define RE_CONTEXT_INDEP_OPS (RE_CONTEXT_INDEP_ANCHORS << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
80
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
81 /* If this bit is set, then *, +, ?, and { cannot be first in an re or
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
82 immediately after an alternation or begin-group operator. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
83 #define RE_CONTEXT_INVALID_OPS (RE_CONTEXT_INDEP_OPS << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
84
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
85 /* If this bit is set, then . matches newline.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
86 If not set, then it doesn't. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
87 #define RE_DOT_NEWLINE (RE_CONTEXT_INVALID_OPS << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
88
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
89 /* If this bit is set, then . doesn't match NUL.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
90 If not set, then it does. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
91 #define RE_DOT_NOT_NULL (RE_DOT_NEWLINE << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
92
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
93 /* If this bit is set, nonmatching lists [^...] do not match newline.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
94 If not set, they do. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
95 #define RE_HAT_LISTS_NOT_NEWLINE (RE_DOT_NOT_NULL << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
96
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
97 /* If this bit is set, either \{...\} or {...} defines an
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
98 interval, depending on RE_NO_BK_BRACES.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
99 If not set, \{, \}, {, and } are literals. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
100 #define RE_INTERVALS (RE_HAT_LISTS_NOT_NEWLINE << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
101
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
102 /* If this bit is set, +, ? and | aren't recognized as operators.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
103 If not set, they are. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
104 #define RE_LIMITED_OPS (RE_INTERVALS << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
105
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
106 /* If this bit is set, newline is an alternation operator.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
107 If not set, newline is literal. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
108 #define RE_NEWLINE_ALT (RE_LIMITED_OPS << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
109
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
110 /* If this bit is set, then `{...}' defines an interval, and \{ and \}
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
111 are literals.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
112 If not set, then `\{...\}' defines an interval. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
113 #define RE_NO_BK_BRACES (RE_NEWLINE_ALT << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
114
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
115 /* If this bit is set, (...) defines a group, and \( and \) are literals.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
116 If not set, \(...\) defines a group, and ( and ) are literals. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
117 #define RE_NO_BK_PARENS (RE_NO_BK_BRACES << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
118
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
119 /* If this bit is set, then \<digit> matches <digit>.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
120 If not set, then \<digit> is a back-reference. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
121 #define RE_NO_BK_REFS (RE_NO_BK_PARENS << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
122
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
123 /* If this bit is set, then | is an alternation operator, and \| is literal.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
124 If not set, then \| is an alternation operator, and | is literal. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
125 #define RE_NO_BK_VBAR (RE_NO_BK_REFS << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
126
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
127 /* If this bit is set, then an ending range point collating higher
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
128 than the starting range point, as in [z-a], is invalid.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
129 If not set, then when ending range point collates higher than the
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
130 starting range point, the range is ignored. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
131 #define RE_NO_EMPTY_RANGES (RE_NO_BK_VBAR << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
132
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
133 /* If this bit is not set, allow minimal matching:
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
134 - a*? and a+? and a?? perform shortest-possible matching (compare with a*
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
135 and a+ and a?, respectively, which perform longest-possible matching)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
136 - other juxtaposing of * + and ? is rejected.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
137 If this bit is set, consecutive * + and ?'s are collapsed in a logical
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
138 manner:
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
139 - a*? and a+? are the same as a*
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
140 - a?? is the same as a?
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
141 */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
142 #define RE_NO_MINIMAL_MATCHING (RE_NO_EMPTY_RANGES << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
143
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
144 /* If this bit is set, succeed as soon as we match the whole pattern,
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
145 without further backtracking. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
146 #define RE_NO_POSIX_BACKTRACKING (RE_NO_MINIMAL_MATCHING << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
147
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
148 /* If this bit is not set, (?:re) behaves like (re) (or \(?:re\) behaves like
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
149 \(re\)) except that the matched string is not registered. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
150 #define RE_NO_SHY_GROUPS (RE_NO_POSIX_BACKTRACKING << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
151
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
152 /* If this bit is set, then an unmatched ) is ordinary.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
153 If not set, then an unmatched ) is invalid. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
154 #define RE_UNMATCHED_RIGHT_PAREN_ORD (RE_NO_SHY_GROUPS << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
155
502
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
156 /* If this bit is set, then \22 will read as a back reference,
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
157 provided at least 22 non-shy groups have been seen so far. In all
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
158 other cases (bit not set, not 22 non-shy groups seen so far), it
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
159 reads as a back reference \2 followed by a digit 2. */
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
160 #define RE_NO_MULTI_DIGIT_BK_REFS (RE_UNMATCHED_RIGHT_PAREN_ORD << 1)
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
161
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
162 /* This global variable defines the particular regexp syntax to use (for
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
163 some interfaces). When a regexp is compiled, the syntax used is
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
164 stored in the pattern buffer, so changing this does not affect
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
165 already-compiled regexps. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
166 extern reg_syntax_t re_syntax_options;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
167
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
168 /* Define combinations of the above bits for the standard possibilities.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
169 (The [[[ comments delimit what gets put into the Texinfo file, so
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
170 don't delete them!) */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
171 /* [[[begin syntaxes]]] */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
172 #define RE_SYNTAX_EMACS RE_INTERVALS
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
173
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
174 #define RE_SYNTAX_AWK \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
175 (RE_BACKSLASH_ESCAPE_IN_LISTS | RE_DOT_NOT_NULL \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
176 | RE_NO_BK_PARENS | RE_NO_BK_REFS \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
177 | RE_NO_BK_VBAR | RE_NO_EMPTY_RANGES \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
178 | RE_UNMATCHED_RIGHT_PAREN_ORD | RE_NO_SHY_GROUPS \
502
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
179 | RE_NO_MINIMAL_MATCHING | RE_NO_MULTI_DIGIT_BK_REFS)
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
180
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
181 #define RE_SYNTAX_POSIX_AWK \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
182 (RE_SYNTAX_POSIX_EXTENDED | RE_BACKSLASH_ESCAPE_IN_LISTS)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
183
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
184 #define RE_SYNTAX_GREP \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
185 (RE_BK_PLUS_QM | RE_CHAR_CLASSES \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
186 | RE_HAT_LISTS_NOT_NEWLINE | RE_INTERVALS \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
187 | RE_NEWLINE_ALT | RE_NO_SHY_GROUPS \
502
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
188 | RE_NO_MINIMAL_MATCHING | RE_NO_MULTI_DIGIT_BK_REFS)
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
189
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
190 #define RE_SYNTAX_EGREP \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
191 (RE_CHAR_CLASSES | RE_CONTEXT_INDEP_ANCHORS \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
192 | RE_CONTEXT_INDEP_OPS | RE_HAT_LISTS_NOT_NEWLINE \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
193 | RE_NEWLINE_ALT | RE_NO_BK_PARENS \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
194 | RE_NO_BK_VBAR | RE_NO_SHY_GROUPS \
502
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
195 | RE_NO_MINIMAL_MATCHING | RE_NO_MULTI_DIGIT_BK_REFS)
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
196
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
197 #define RE_SYNTAX_POSIX_EGREP \
502
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
198 (RE_SYNTAX_EGREP | RE_INTERVALS | RE_NO_BK_BRACES | \
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
199 RE_NO_MULTI_DIGIT_BK_REFS)
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
200
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
201 /* P1003.2/D11.2, section 4.20.7.1, lines 5078ff. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
202 #define RE_SYNTAX_ED RE_SYNTAX_POSIX_BASIC
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
203
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
204 #define RE_SYNTAX_SED RE_SYNTAX_POSIX_BASIC
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
205
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
206 /* Syntax bits common to both basic and extended POSIX regex syntax. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
207 #define _RE_SYNTAX_POSIX_COMMON \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
208 (RE_CHAR_CLASSES | RE_DOT_NEWLINE | RE_DOT_NOT_NULL \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
209 | RE_INTERVALS | RE_NO_EMPTY_RANGES | RE_NO_SHY_GROUPS \
502
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
210 | RE_NO_MINIMAL_MATCHING | RE_NO_MULTI_DIGIT_BK_REFS)
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
211
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
212 #define RE_SYNTAX_POSIX_BASIC \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
213 (_RE_SYNTAX_POSIX_COMMON | RE_BK_PLUS_QM)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
214
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
215 /* Differs from ..._POSIX_BASIC only in that RE_BK_PLUS_QM becomes
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
216 RE_LIMITED_OPS, i.e., \? \+ \| are not recognized. Actually, this
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
217 isn't minimal, since other operators, such as \`, aren't disabled. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
218 #define RE_SYNTAX_POSIX_MINIMAL_BASIC \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
219 (_RE_SYNTAX_POSIX_COMMON | RE_LIMITED_OPS)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
220
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
221 #define RE_SYNTAX_POSIX_EXTENDED \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
222 (_RE_SYNTAX_POSIX_COMMON | RE_CONTEXT_INDEP_ANCHORS \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
223 | RE_CONTEXT_INDEP_OPS | RE_NO_BK_BRACES \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
224 | RE_NO_BK_PARENS | RE_NO_BK_VBAR \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
225 | RE_UNMATCHED_RIGHT_PAREN_ORD)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
226
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
227 /* Differs from ..._POSIX_EXTENDED in that RE_CONTEXT_INVALID_OPS
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
228 replaces RE_CONTEXT_INDEP_OPS and RE_NO_BK_REFS is added. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
229 #define RE_SYNTAX_POSIX_MINIMAL_EXTENDED \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
230 (_RE_SYNTAX_POSIX_COMMON | RE_CONTEXT_INDEP_ANCHORS \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
231 | RE_CONTEXT_INVALID_OPS | RE_NO_BK_BRACES \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
232 | RE_NO_BK_PARENS | RE_NO_BK_REFS \
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
233 | RE_NO_BK_VBAR | RE_UNMATCHED_RIGHT_PAREN_ORD)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
234 /* [[[end syntaxes]]] */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
235
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
236 /* Maximum number of duplicates an interval can allow. Some systems
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
237 (erroneously) define this in other header files, but we want our
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
238 value, so remove any previous define. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
239 #ifdef RE_DUP_MAX
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
240 #undef RE_DUP_MAX
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
241 #endif
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
242 #define RE_DUP_MAX ((1 << 15) - 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
243
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
244
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
245 /* POSIX `cflags' bits (i.e., information for `regcomp'). */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
246
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
247 /* If this bit is set, then use extended regular expression syntax.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
248 If not set, then use basic regular expression syntax. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
249 #define REG_EXTENDED 1
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
250
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
251 /* If this bit is set, then ignore case when matching.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
252 If not set, then case is significant. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
253 #define REG_ICASE (REG_EXTENDED << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
254
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
255 /* If this bit is set, then anchors do not match at newline
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
256 characters in the string.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
257 If not set, then anchors do match at newlines. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
258 #define REG_NEWLINE (REG_ICASE << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
259
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
260 /* If this bit is set, then report only success or fail in regexec.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
261 If not set, then returns differ between not matching and errors. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
262 #define REG_NOSUB (REG_NEWLINE << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
263
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
264
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
265 /* POSIX `eflags' bits (i.e., information for regexec). */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
266
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
267 /* If this bit is set, then the beginning-of-line operator doesn't match
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
268 the beginning of the string (presumably because it's not the
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
269 beginning of a line).
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
270 If not set, then the beginning-of-line operator does match the
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
271 beginning of the string. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
272 #define REG_NOTBOL 1
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
273
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
274 /* Like REG_NOTBOL, except for the end-of-line. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
275 #define REG_NOTEOL (1 << 1)
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
276
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
277
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
278 /* If any error codes are removed, changed, or added, update the
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
279 `re_error_msg' table in regex.c. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
280 typedef enum
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
281 {
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
282 REG_NOERROR = 0, /* Success. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
283 REG_NOMATCH, /* Didn't find a match (for regexec). */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
284
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
285 /* POSIX regcomp return error codes. (In the order listed in the
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
286 standard.) */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
287 REG_BADPAT, /* Invalid pattern. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
288 REG_ECOLLATE, /* Not implemented. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
289 REG_ECTYPE, /* Invalid character class name. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
290 REG_EESCAPE, /* Trailing backslash. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
291 REG_ESUBREG, /* Invalid back reference. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
292 REG_EBRACK, /* Unmatched left bracket. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
293 REG_EPAREN, /* Parenthesis imbalance. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
294 REG_EBRACE, /* Unmatched \{. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
295 REG_BADBR, /* Invalid contents of \{\}. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
296 REG_ERANGE, /* Invalid range end. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
297 REG_ESPACE, /* Ran out of memory. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
298 REG_BADRPT, /* No preceding re for repetition op. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
299
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
300 /* Error codes we've added. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
301 REG_EEND, /* Premature end. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
302 REG_ESIZE, /* Compiled pattern bigger than 2^16 bytes. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
303 REG_ERPAREN /* Unmatched ) or \); not returned from regcomp. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
304 #ifdef emacs
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
305 ,REG_ESYNTAX /* Invalid syntax designator. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
306 #endif
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
307 #ifdef MULE
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
308 ,REG_ERANGESPAN /* Ranges may not span charsets. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
309 ,REG_ECATEGORY /* Invalid category designator */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
310 #endif
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
311 } reg_errcode_t;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
312
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
313 /* This data structure represents a compiled pattern. Before calling
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
314 the pattern compiler, the fields `buffer', `allocated', `fastmap',
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
315 `translate', and `no_sub' can be set. After the pattern has been
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
316 compiled, the `re_nsub' field is available. All other fields are
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
317 private to the regex routines. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
318
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
319 struct re_pattern_buffer
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
320 {
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
321 /* [[[begin pattern_buffer]]] */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
322 /* Space that holds the compiled pattern. It is declared as
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
323 `unsigned char *' because its elements are
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
324 sometimes used as array indexes. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
325 unsigned char *buffer;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
326
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
327 /* Number of bytes to which `buffer' points. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
328 unsigned long allocated;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
329
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
330 /* Number of bytes actually used in `buffer'. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
331 unsigned long used;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
332
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
333 /* Syntax setting with which the pattern was compiled. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
334 reg_syntax_t syntax;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
335
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
336 /* Pointer to a fastmap, if any, otherwise zero. re_search uses
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
337 the fastmap, if there is one, to skip over impossible
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
338 starting points for matches. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
339 char *fastmap;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
340
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
341 /* Either a translate table to apply to all characters before
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
342 comparing them, or zero for no translation. The translation
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
343 is applied to a pattern when it is compiled and to a string
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
344 when it is matched. */
446
1ccc32a20af4 Import from CVS: tag r21-2-38
cvs
parents: 442
diff changeset
345 RE_TRANSLATE_TYPE translate;
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
346
502
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
347 /* Number of returnable groups found by the compiler. (This does
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
348 not count shy groups.) */
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
349 size_t re_nsub;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
350
502
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
351 /* Total number of groups found by the compiler. (Including
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
352 shy ones.) */
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
353 int re_ngroups;
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
354
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
355 /* Zero if this pattern cannot match the empty string, one else.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
356 Well, in truth it's used only in `re_search_2', to see
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
357 whether or not we should use the fastmap, so we don't set
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
358 this absolutely perfectly; see `re_compile_fastmap' (the
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
359 `duplicate' case). */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
360 unsigned can_be_null : 1;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
361
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
362 /* If REGS_UNALLOCATED, allocate space in the `regs' structure
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
363 for `max (RE_NREGS, re_nsub + 1)' groups.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
364 If REGS_REALLOCATE, reallocate space if necessary.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
365 If REGS_FIXED, use what's there. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
366 #define REGS_UNALLOCATED 0
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
367 #define REGS_REALLOCATE 1
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
368 #define REGS_FIXED 2
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
369 unsigned regs_allocated : 2;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
370
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
371 /* Set to zero when `regex_compile' compiles a pattern; set to one
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
372 by `re_compile_fastmap' if it updates the fastmap. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
373 unsigned fastmap_accurate : 1;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
374
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
375 /* If set, `re_match_2' does not return information about
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
376 subexpressions. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
377 unsigned no_sub : 1;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
378
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
379 /* If set, a beginning-of-line anchor doesn't match at the
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
380 beginning of the string. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
381 unsigned not_bol : 1;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
382
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
383 /* Similarly for an end-of-line anchor. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
384 unsigned not_eol : 1;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
385
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
386 /* If true, an anchor at a newline matches. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
387 unsigned newline_anchor : 1;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
388
502
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
389 unsigned warned_about_incompatible_back_references : 1;
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
390
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
391 /* Mapping between back references and groups (may not be
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
392 equivalent with shy groups). */
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
393 int *external_to_internal_register;
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
394
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
395 int external_to_internal_register_size;
7039e6323819 [xemacs-hg @ 2001-05-04 22:41:46 by ben]
ben
parents: 446
diff changeset
396
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
397 /* [[[end pattern_buffer]]] */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
398 };
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
399
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
400 typedef struct re_pattern_buffer regex_t;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
401
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
402 /* Type for byte offsets within the string. POSIX mandates this. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
403 typedef int regoff_t;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
404
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
405
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
406 /* This is the structure we store register match data in. See
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
407 regex.texinfo for a full description of what registers match. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
408 struct re_registers
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
409 {
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
410 unsigned num_regs;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
411 regoff_t *start;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
412 regoff_t *end;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
413 };
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
414
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
415
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
416 /* If `regs_allocated' is REGS_UNALLOCATED in the pattern buffer,
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
417 `re_match_2' returns information about at least this many registers
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
418 the first time a `regs' structure is passed. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
419 #ifndef RE_NREGS
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
420 #define RE_NREGS 30
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
421 #endif
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
422
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
423
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
424 /* POSIX specification for registers. Aside from the different names than
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
425 `re_registers', POSIX uses an array of structures, instead of a
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
426 structure of arrays. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
427 typedef struct
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
428 {
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
429 regoff_t rm_so; /* Byte offset from string's start to substring's start. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
430 regoff_t rm_eo; /* Byte offset from string's start to substring's end. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
431 } regmatch_t;
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
432
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
433 /* Declarations for routines. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
434
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
435 /* Sets the current default syntax to SYNTAX, and return the old syntax.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
436 You can also simply assign to the `re_syntax_options' variable. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
437 reg_syntax_t re_set_syntax (reg_syntax_t syntax);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
438
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
439 /* Compile the regular expression PATTERN, with length LENGTH
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
440 and syntax given by the global `re_syntax_options', into the buffer
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
441 BUFFER. Return NULL if successful, and an error string if not. */
442
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
442 const char *re_compile_pattern (const char *pattern, int length,
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
443 struct re_pattern_buffer *buffer);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
444
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
445
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
446 /* Compile a fastmap for the compiled pattern in BUFFER; used to
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
447 accelerate searches. Return 0 if successful and -2 if was an
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
448 internal error. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
449 int re_compile_fastmap (struct re_pattern_buffer *buffer);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
450
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
451
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
452 /* Search in the string STRING (with length LENGTH) for the pattern
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
453 compiled into BUFFER. Start searching at position START, for RANGE
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
454 characters. Return the starting position of the match, -1 for no
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
455 match, or -2 for an internal error. Also return register
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
456 information in REGS (if REGS and BUFFER->no_sub are nonzero). */
442
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
457 int re_search (struct re_pattern_buffer *buffer, const char *string,
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
458 int length, int start, int range,
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
459 struct re_registers *regs);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
460
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
461
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
462 /* Like `re_search', but search in the concatenation of STRING1 and
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
463 STRING2. Also, stop searching at index START + STOP. */
442
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
464 int re_search_2 (struct re_pattern_buffer *buffer, const char *string1,
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
465 int length1, const char *string2, int length2, int start,
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
466 int range, struct re_registers *regs, int stop);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
467
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
468
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
469 /* Like `re_search', but return how many characters in STRING the regexp
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
470 in BUFFER matched, starting at position START. */
442
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
471 int re_match (struct re_pattern_buffer *buffer, const char *string,
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
472 int length, int start, struct re_registers *regs);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
473
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
474
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
475 /* Relates to `re_match' as `re_search_2' relates to `re_search'. */
442
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
476 int re_match_2 (struct re_pattern_buffer *buffer, const char *string1,
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
477 int length1, const char *string2, int length2,
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
478 int start, struct re_registers *regs, int stop);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
479
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
480
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
481 /* Set REGS to hold NUM_REGS registers, storing them in STARTS and
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
482 ENDS. Subsequent matches using BUFFER and REGS will use this memory
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
483 for recording register information. STARTS and ENDS must be
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
484 allocated with malloc, and must each be at least `NUM_REGS * sizeof
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
485 (regoff_t)' bytes long.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
486
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
487 If NUM_REGS == 0, then subsequent matches should allocate their own
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
488 register data.
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
489
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
490 Unless this function is called, the first search or match using
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
491 PATTERN_BUFFER will allocate its own register data, without
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
492 freeing the old data. */
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
493 void re_set_registers (struct re_pattern_buffer *buffer,
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
494 struct re_registers *regs, unsigned num_regs,
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
495 regoff_t *starts, regoff_t *ends);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
496
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
497 #ifdef _REGEX_RE_COMP
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
498 /* 4.2 bsd compatibility. */
442
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
499 char *re_comp (const char *);
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
500 int re_exec (const char *);
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
501 #endif
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
502
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
503 /* POSIX compatibility. */
442
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
504 int regcomp (regex_t *preg, const char *pattern, int cflags);
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
505 int regexec (const regex_t *preg, const char *string, size_t nmatch,
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
506 regmatch_t pmatch[], int eflags);
442
abe6d1db359e Import from CVS: tag r21-2-36
cvs
parents: 440
diff changeset
507 size_t regerror (int errcode, const regex_t *preg, char *errbuf,
428
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
508 size_t errbuf_size);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
509 void regfree (regex_t *preg);
3ecd8885ac67 Import from CVS: tag r21-2-22
cvs
parents:
diff changeset
510
440
8de8e3f6228a Import from CVS: tag r21-2-28
cvs
parents: 428
diff changeset
511 #endif /* INCLUDED_regex_h_ */