428
|
1 /* Header file for the buffer manipulation primitives.
|
|
2 Copyright (C) 1985, 1986, 1992, 1993, 1994, 1995
|
|
3 Free Software Foundation, Inc.
|
|
4 Copyright (C) 1995 Sun Microsystems, Inc.
|
771
|
5 Copyright (C) 2001, 2002 Ben Wing.
|
428
|
6
|
|
7 This file is part of XEmacs.
|
|
8
|
|
9 XEmacs is free software; you can redistribute it and/or modify it
|
|
10 under the terms of the GNU General Public License as published by the
|
|
11 Free Software Foundation; either version 2, or (at your option) any
|
|
12 later version.
|
|
13
|
|
14 XEmacs is distributed in the hope that it will be useful, but WITHOUT
|
|
15 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
16 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
17 for more details.
|
|
18
|
|
19 You should have received a copy of the GNU General Public License
|
|
20 along with XEmacs; see the file COPYING. If not, write to
|
|
21 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
22 Boston, MA 02111-1307, USA. */
|
|
23
|
|
24 /* Synched up with: FSF 19.30. */
|
|
25
|
|
26 /* Authorship:
|
|
27
|
|
28 FSF: long ago.
|
|
29 JWZ: separated out bufslots.h, early in Lemacs.
|
|
30 Ben Wing: almost completely rewritten for Mule, 19.12.
|
|
31 */
|
|
32
|
440
|
33 #ifndef INCLUDED_buffer_h_
|
|
34 #define INCLUDED_buffer_h_
|
428
|
35
|
446
|
36 #include "casetab.h"
|
|
37 #include "chartab.h"
|
|
38
|
428
|
39 /************************************************************************/
|
|
40 /* */
|
|
41 /* definition of Lisp buffer object */
|
|
42 /* */
|
|
43 /************************************************************************/
|
|
44
|
665
|
45 /* Note: we keep both Bytebpos and Charbpos versions of some of the
|
428
|
46 important buffer positions because they are accessed so much.
|
|
47 If we didn't do this, we would constantly be invalidating the
|
665
|
48 charbpos<->bytebpos cache under Mule.
|
428
|
49
|
|
50 Note that under non-Mule, both versions will always be the
|
|
51 same so we don't really need to keep track of them. But it
|
|
52 simplifies the logic to go ahead and do so all the time and
|
|
53 the memory loss is insignificant. */
|
|
54
|
|
55 /* Formerly, it didn't much matter what went inside the struct buffer_text
|
|
56 and what went outside it. Now it does, with the advent of "indirect
|
|
57 buffers" that share text with another buffer. An indirect buffer
|
|
58 shares the same *text* as another buffer, but has its own buffer-local
|
|
59 variables, its own accessible region, and its own markers and extents.
|
|
60 (Due to the nature of markers, it doesn't actually matter much whether
|
|
61 we stick them inside or out of the struct buffer_text -- the user won't
|
|
62 notice any difference -- but we go ahead and put them outside for
|
|
63 consistency and overall saneness of algorithm.)
|
|
64
|
|
65 FSFmacs gets away with not maintaining any "children" pointers from
|
|
66 a buffer to the indirect buffers that refer to it by putting the
|
|
67 markers inside of the struct buffer_text, using markers to keep track
|
|
68 of BEGV and ZV in indirect buffers, and relying on the fact that
|
|
69 all intervals (text properties and overlays) use markers for their
|
|
70 start and end points. We don't do this for extents (markers are
|
|
71 inefficient anyway and take up space), so we have to maintain
|
|
72 children pointers. This is not terribly hard, though, and the
|
|
73 code to maintain this is just like the code already present in
|
|
74 extent-parent and extent-children.
|
|
75 */
|
|
76
|
|
77 struct buffer_text
|
|
78 {
|
867
|
79 Ibyte *beg; /* Actual address of buffer contents. */
|
665
|
80 Bytebpos gpt; /* Index of gap in buffer. */
|
|
81 Bytebpos z; /* Index of end of buffer. */
|
|
82 Charbpos bufz; /* Equivalent as a Charbpos. */
|
|
83 Bytecount gap_size;/* Size of buffer's gap */
|
|
84 Bytecount end_gap_size;/* Size of buffer's end gap */
|
428
|
85 long modiff; /* This counts buffer-modification events
|
|
86 for this buffer. It is incremented for
|
|
87 each such event, and never otherwise
|
|
88 changed. */
|
|
89 long save_modiff; /* Previous value of modiff, as of last
|
|
90 time buffer visited or saved a file. */
|
|
91
|
|
92 #ifdef MULE
|
771
|
93 /* We keep track of a "known" region for very fast access. This
|
|
94 information is text-only so it goes here. We update this at each
|
|
95 change to the buffer, so if it's entirely ASCII, these will always
|
|
96 contain the minimum and maximum positions of the buffer. */
|
665
|
97 Charbpos mule_bufmin, mule_bufmax;
|
|
98 Bytebpos mule_bytmin, mule_bytmax;
|
428
|
99 int mule_shifter, mule_three_p;
|
|
100
|
|
101 /* And we also cache 16 positions for fairly fast access near those
|
|
102 positions. */
|
665
|
103 Charbpos mule_charbpos_cache[16];
|
|
104 Bytebpos mule_bytebpos_cache[16];
|
771
|
105
|
826
|
106 /* True if all chars fit into one byte;
|
|
107 == (format == FORMAT_8_BIT_FIXED ||
|
|
108 (format == FORMAT_DEFAULT && num_ascii_chars == bufz - 1))
|
|
109 kept around to speed up (slightly?) the byte-char conversion routines. */
|
|
110 int entirely_one_byte_p;
|
|
111 /* Number of ASCII chars in buffer (0 - 127) */
|
|
112 Charcount num_ascii_chars;
|
|
113 /* Number of chars in buffer that would fit in an 8-bit-fixed buffer. */
|
|
114 Charcount num_8_bit_fixed_chars;
|
|
115 /* Number of chars in buffer that would fit in an 16-bit-fixed buffer. */
|
|
116 Charcount num_16_bit_fixed_chars;
|
|
117
|
|
118 /* Currently we only handle 8 bit fixed and default */
|
|
119 Internal_Format format;
|
428
|
120 #endif
|
|
121
|
|
122 /* Similar to the above, we keep track of positions for which line
|
|
123 number has last been calculated. See line-number.c. */
|
|
124 Lisp_Object line_number_cache;
|
|
125
|
|
126 /* Change data that goes with the text. */
|
|
127 struct buffer_text_change_data *changes;
|
|
128 };
|
|
129
|
|
130 struct buffer
|
|
131 {
|
|
132 struct lcrecord_header header;
|
|
133
|
|
134 /* This structure holds the coordinates of the buffer contents
|
|
135 in ordinary buffers. In indirect buffers, this is not used. */
|
|
136 struct buffer_text own_text;
|
|
137
|
|
138 /* This points to the `struct buffer_text' that is used for this buffer.
|
|
139 In an ordinary buffer, this is the own_text field above.
|
|
140 In an indirect buffer, this is the own_text field of another buffer. */
|
|
141 struct buffer_text *text;
|
|
142
|
665
|
143 Bytebpos pt; /* Position of point in buffer. */
|
|
144 Charbpos bufpt; /* Equivalent as a Charbpos. */
|
|
145 Bytebpos begv; /* Index of beginning of accessible range. */
|
|
146 Charbpos bufbegv; /* Equivalent as a Charbpos. */
|
|
147 Bytebpos zv; /* Index of end of accessible range. */
|
|
148 Charbpos bufzv; /* Equivalent as a Charbpos. */
|
428
|
149
|
|
150 int face_change; /* This is set when a change in how the text should
|
|
151 be displayed (e.g., font, color) is made. */
|
|
152
|
448
|
153 /* Whether buffer specific face is specified. */
|
|
154 int buffer_local_face_property;
|
|
155
|
428
|
156 /* change data indicating what portion of the text has changed
|
|
157 since the last time this was reset. Used by redisplay.
|
|
158 Logically we should keep this with the text structure, but
|
|
159 redisplay resets it for each buffer individually and we don't
|
|
160 want interference between an indirect buffer and its base
|
|
161 buffer. */
|
|
162 struct each_buffer_change_data *changes;
|
|
163
|
|
164 #ifdef REGION_CACHE_NEEDS_WORK
|
|
165 /* If the long line scan cache is enabled (i.e. the buffer-local
|
|
166 variable cache-long-line-scans is non-nil), newline_cache
|
|
167 points to the newline cache, and width_run_cache points to the
|
|
168 width run cache.
|
|
169
|
|
170 The newline cache records which stretches of the buffer are
|
|
171 known *not* to contain newlines, so that they can be skipped
|
|
172 quickly when we search for newlines.
|
|
173
|
|
174 The width run cache records which stretches of the buffer are
|
|
175 known to contain characters whose widths are all the same. If
|
|
176 the width run cache maps a character to a value > 0, that value
|
|
177 is the character's width; if it maps a character to zero, we
|
|
178 don't know what its width is. This allows compute_motion to
|
|
179 process such regions very quickly, using algebra instead of
|
|
180 inspecting each character. See also width_table, below. */
|
|
181 struct region_cache *newline_cache;
|
|
182 struct region_cache *width_run_cache;
|
|
183 #endif /* REGION_CACHE_NEEDS_WORK */
|
|
184
|
|
185 /* The markers that refer to this buffer. This is actually a single
|
|
186 marker -- successive elements in its marker `chain' are the other
|
|
187 markers referring to this buffer */
|
440
|
188 Lisp_Marker *markers;
|
428
|
189
|
|
190 /* The buffer's extent info. This is its own type, an extent-info
|
|
191 object (done this way for ease in marking / finalizing). */
|
|
192 Lisp_Object extent_info;
|
|
193
|
826
|
194 /* The buffer's syntax cache. This caches a known region where the
|
|
195 `syntax-table' property is unchanged, for quick lookup in the routines
|
|
196 that scan a buffer looking for a particular syntax (regex routines,
|
|
197 parse-partial-sexp, etc.). */
|
|
198 struct syntax_cache *syntax_cache;
|
|
199
|
428
|
200 /* ----------------------------------------------------------------- */
|
|
201 /* All the stuff above this line is the responsibility of insdel.c,
|
826
|
202 with some help from marker.c, extents.c and syntax.c.
|
428
|
203 All the stuff below this line is the responsibility of buffer.c. */
|
|
204
|
|
205 /* In an indirect buffer, this points to the base buffer.
|
|
206 In an ordinary buffer, it is 0.
|
|
207 We DO mark through this slot. */
|
|
208 struct buffer *base_buffer;
|
|
209
|
|
210 /* List of indirect buffers whose base is this buffer.
|
|
211 If we are an indirect buffer, this will be nil.
|
|
212 Do NOT mark through this. */
|
|
213 Lisp_Object indirect_children;
|
|
214
|
|
215 /* Flags saying which DEFVAR_PER_BUFFER variables
|
|
216 are local to this buffer. */
|
|
217 int local_var_flags;
|
|
218
|
|
219 /* Set to the modtime of the visited file when read or written.
|
|
220 -1 means visited file was nonexistent.
|
|
221 0 means visited file modtime unknown; in no case complain
|
|
222 about any mismatch on next save attempt. */
|
|
223 int modtime;
|
|
224
|
|
225 /* the value of text->modiff at the last auto-save. */
|
442
|
226 long auto_save_modified;
|
428
|
227
|
|
228 /* The time at which we detected a failure to auto-save,
|
|
229 Or -1 if we didn't have a failure. */
|
|
230 int auto_save_failure_time;
|
|
231
|
|
232 /* Position in buffer at which display started
|
|
233 the last time this buffer was displayed. */
|
|
234 int last_window_start;
|
|
235
|
|
236 /* Everything from here down must be a Lisp_Object */
|
|
237
|
1204
|
238 #define MARKED_SLOT(x) Lisp_Object x;
|
428
|
239 #include "bufslots.h"
|
|
240 #undef MARKED_SLOT
|
|
241 };
|
|
242
|
|
243 DECLARE_LRECORD (buffer, struct buffer);
|
|
244 #define XBUFFER(x) XRECORD (x, buffer, struct buffer)
|
617
|
245 #define wrap_buffer(p) wrap_record (p, buffer)
|
428
|
246 #define BUFFERP(x) RECORDP (x, buffer)
|
|
247 #define CHECK_BUFFER(x) CHECK_RECORD (x, buffer)
|
|
248 #define CONCHECK_BUFFER(x) CONCHECK_RECORD (x, buffer)
|
|
249
|
|
250 #define BUFFER_LIVE_P(b) (!NILP ((b)->name))
|
|
251
|
|
252 #define CHECK_LIVE_BUFFER(x) do { \
|
|
253 CHECK_BUFFER (x); \
|
|
254 if (!BUFFER_LIVE_P (XBUFFER (x))) \
|
|
255 dead_wrong_type_argument (Qbuffer_live_p, (x)); \
|
|
256 } while (0)
|
|
257
|
|
258 #define CONCHECK_LIVE_BUFFER(x) do { \
|
|
259 CONCHECK_BUFFER (x); \
|
|
260 if (!BUFFER_LIVE_P (XBUFFER (x))) \
|
|
261 x = wrong_type_argument (Qbuffer_live_p, (x)); \
|
|
262 } while (0)
|
|
263
|
|
264
|
|
265 #define BUFFER_BASE_BUFFER(b) ((b)->base_buffer ? (b)->base_buffer : (b))
|
|
266
|
|
267 /* Map over buffers sharing the same text as MPS_BUF. MPS_BUFVAR is a
|
|
268 variable that gets the buffer values (beginning with the base
|
|
269 buffer, then the children), and MPS_BUFCONS should be a temporary
|
|
270 Lisp_Object variable. */
|
647
|
271 #define MAP_INDIRECT_BUFFERS(mps_buf, mps_bufvar, mps_bufcons) \
|
|
272 for (mps_bufcons = Qunbound, \
|
|
273 mps_bufvar = BUFFER_BASE_BUFFER (mps_buf); \
|
|
274 UNBOUNDP (mps_bufcons) ? \
|
|
275 (mps_bufcons = mps_bufvar->indirect_children, \
|
|
276 1) \
|
|
277 : (!NILP (mps_bufcons) \
|
|
278 && (mps_bufvar = XBUFFER (XCAR (mps_bufcons)), 1) \
|
|
279 && (mps_bufcons = XCDR (mps_bufcons), 1)); \
|
428
|
280 )
|
|
281
|
|
282
|
826
|
283 /* All macros below follow the three golden rules of macros (see text.h),
|
|
284 with the following exception:
|
|
285
|
|
286 -- 'struct buffer *' arguments can be evaluated more than once.
|
|
287 */
|
|
288
|
428
|
289 /*----------------------------------------------------------------------*/
|
|
290 /* Accessor macros for important positions in a buffer */
|
|
291 /*----------------------------------------------------------------------*/
|
|
292
|
|
293 /* We put them here because some stuff below wants them before the
|
|
294 place where we would normally put them. */
|
|
295
|
|
296 /* None of these are lvalues. Use the settor macros below to change
|
|
297 the positions. */
|
|
298
|
|
299 /* Beginning of buffer. */
|
826
|
300 #define BYTE_BUF_BEG(buf) ((Bytebpos) 1)
|
665
|
301 #define BUF_BEG(buf) ((Charbpos) 1)
|
428
|
302
|
|
303 /* Beginning of accessible range of buffer. */
|
826
|
304 #define BYTE_BUF_BEGV(buf) ((buf)->begv + 0)
|
428
|
305 #define BUF_BEGV(buf) ((buf)->bufbegv + 0)
|
|
306
|
|
307 /* End of accessible range of buffer. */
|
826
|
308 #define BYTE_BUF_ZV(buf) ((buf)->zv + 0)
|
428
|
309 #define BUF_ZV(buf) ((buf)->bufzv + 0)
|
|
310
|
|
311 /* End of buffer. */
|
826
|
312 #define BYTE_BUF_Z(buf) ((buf)->text->z + 0)
|
428
|
313 #define BUF_Z(buf) ((buf)->text->bufz + 0)
|
|
314
|
|
315 /* Point. */
|
826
|
316 #define BYTE_BUF_PT(buf) ((buf)->pt + 0)
|
428
|
317 #define BUF_PT(buf) ((buf)->bufpt + 0)
|
|
318
|
826
|
319 /* Internal format of buffer. */
|
|
320 #ifdef MULE
|
|
321 #define BUF_FORMAT(buf) ((buf)->text->format)
|
|
322 #else
|
|
323 #define BUF_FORMAT(buf) FORMAT_DEFAULT
|
|
324 #endif
|
|
325
|
428
|
326 /*----------------------------------------------------------------------*/
|
826
|
327 /* Validating byte positions */
|
428
|
328 /*----------------------------------------------------------------------*/
|
|
329
|
826
|
330 /* Address of byte at position POS in buffer, no error checking. */
|
|
331 DECLARE_INLINE_HEADER (
|
867
|
332 Ibyte *
|
826
|
333 BYTE_BUF_BYTE_ADDRESS_NO_VERIFY (struct buffer *buf, Bytebpos pos)
|
|
334 )
|
428
|
335 {
|
|
336 return (buf->text->beg +
|
|
337 ((pos >= buf->text->gpt ? (pos + buf->text->gap_size) : pos)
|
|
338 - 1));
|
|
339 }
|
|
340
|
826
|
341 /* Given a byte position, does it point to the beginning of a character?
|
|
342 */
|
|
343 #ifdef MULE
|
|
344 DECLARE_INLINE_HEADER (
|
|
345 int
|
|
346 VALID_BYTEBPOS_P (struct buffer *buf, Bytebpos x)
|
|
347 )
|
428
|
348 {
|
826
|
349 switch (BUF_FORMAT (buf))
|
|
350 {
|
|
351 case FORMAT_DEFAULT:
|
867
|
352 return ibyte_first_byte_p (*BYTE_BUF_BYTE_ADDRESS_NO_VERIFY (buf, x));
|
826
|
353 case FORMAT_16_BIT_FIXED:
|
|
354 return ((x - 1) & 1) == 0;
|
|
355 case FORMAT_32_BIT_FIXED:
|
|
356 return ((x - 1) & 3) == 0;
|
|
357 default:
|
|
358 return 1;
|
|
359 }
|
428
|
360 }
|
|
361 #else
|
665
|
362 # define VALID_BYTEBPOS_P(buf, x) 1
|
428
|
363 #endif
|
|
364
|
826
|
365 /* If error-checking is enabled, assert that the given char position is
|
|
366 within range. Otherwise, do nothing.
|
|
367 */
|
|
368 # define ASSERT_VALID_CHARBPOS_UNSAFE(buf, x) do { \
|
|
369 text_checking_assert (BUFFER_LIVE_P (buf)); \
|
|
370 text_checking_assert ((x) >= BUF_BEG (buf) && x <= BUF_Z (buf)); \
|
428
|
371 } while (0)
|
826
|
372
|
|
373 /* If error-checking is enabled, assert that the given byte position is
|
|
374 within range and points to the beginning of a character or to the end of
|
|
375 the buffer. Otherwise, do nothing.
|
|
376 */
|
|
377 # define ASSERT_VALID_BYTEBPOS_UNSAFE(buf, x) do { \
|
|
378 text_checking_assert (BUFFER_LIVE_P (buf)); \
|
|
379 text_checking_assert ((x) >= BYTE_BUF_BEG (buf) && x <= BYTE_BUF_Z (buf)); \
|
|
380 text_checking_assert (VALID_BYTEBPOS_P (buf, x)); \
|
428
|
381 } while (0)
|
826
|
382
|
|
383 /* If error-checking is enabled, assert that the given byte position is
|
|
384 within range and satisfies ASSERT_VALID_BYTEBPOS() and also does not
|
|
385 refer to the beginning of the buffer. (i.e. movement backwards is OK.)
|
|
386 Otherwise, do nothing.
|
|
387 */
|
|
388 # define ASSERT_VALID_BYTEBPOS_BACKWARD_UNSAFE(buf, x) do { \
|
|
389 text_checking_assert (BUFFER_LIVE_P (buf)); \
|
|
390 text_checking_assert ((x) > BYTE_BUF_BEG (buf) && x <= BYTE_BUF_Z (buf)); \
|
|
391 text_checking_assert (VALID_BYTEBPOS_P (buf, x)); \
|
428
|
392 } while (0)
|
|
393
|
826
|
394 /* If error-checking is enabled, assert that the given byte position is
|
|
395 within range and satisfies ASSERT_VALID_BYTEBPOS() and also does not
|
|
396 refer to the end of the buffer. (i.e. movement forwards is OK.)
|
|
397 Otherwise, do nothing.
|
|
398 */
|
|
399 # define ASSERT_VALID_BYTEBPOS_FORWARD_UNSAFE(buf, x) do { \
|
|
400 text_checking_assert (BUFFER_LIVE_P (buf)); \
|
|
401 text_checking_assert ((x) >= BYTE_BUF_BEG (buf) && x < BYTE_BUF_Z (buf)); \
|
|
402 text_checking_assert (VALID_BYTEBPOS_P (buf, x)); \
|
|
403 } while (0)
|
428
|
404
|
|
405 #ifdef MULE
|
826
|
406 /* Make sure that the given byte position is pointing to the beginning of a
|
|
407 character. If not, back up until this is the case. Note that there are
|
|
408 not too many places where it is legitimate to do this sort of thing.
|
|
409 It's an error if you're passed an "invalid" byte position.
|
|
410 */
|
|
411 # define VALIDATE_BYTEBPOS_BACKWARD(buf, x) do { \
|
|
412 switch (BUF_FORMAT (buf)) \
|
|
413 { \
|
|
414 case FORMAT_DEFAULT: \
|
|
415 { \
|
867
|
416 Ibyte *VBB_ptr = BYTE_BUF_BYTE_ADDRESS_NO_VERIFY (buf, x); \
|
|
417 while (!ibyte_first_byte_p (*VBB_ptr)) \
|
826
|
418 VBB_ptr--, (x)--; \
|
|
419 } \
|
|
420 break; \
|
|
421 case FORMAT_16_BIT_FIXED: \
|
|
422 if (((x - 1) & 1) != 0) \
|
|
423 x--; \
|
|
424 break; \
|
|
425 case FORMAT_32_BIT_FIXED: \
|
|
426 while (((x - 1) & 3) != 0) \
|
|
427 x--; \
|
|
428 break; \
|
|
429 default: \
|
|
430 break; \
|
|
431 } \
|
428
|
432 } while (0)
|
|
433 #else
|
665
|
434 # define VALIDATE_BYTEBPOS_BACKWARD(buf, x)
|
428
|
435 #endif
|
|
436
|
|
437 #ifdef MULE
|
826
|
438 /* Make sure that the given byte position is pointing to the beginning of a
|
|
439 character. If not, move forward until this is the case. Note that
|
|
440 there are not too many places where it is legitimate to do this sort of
|
|
441 thing. It's an error if you're passed an "invalid" byte position.
|
|
442 */
|
|
443 # define VALIDATE_BYTEBPOS_FORWARD(buf, x) do { \
|
|
444 switch (BUF_FORMAT (buf)) \
|
|
445 { \
|
|
446 case FORMAT_DEFAULT: \
|
|
447 { \
|
867
|
448 Ibyte *VBF_ptr = BYTE_BUF_BYTE_ADDRESS_NO_VERIFY (buf, x); \
|
|
449 while (!ibyte_first_byte_p (*VBF_ptr)) \
|
826
|
450 VBF_ptr++, (x)++; \
|
|
451 } \
|
|
452 break; \
|
|
453 case FORMAT_16_BIT_FIXED: \
|
|
454 if (((x - 1) & 1) != 0) \
|
|
455 x++; \
|
|
456 break; \
|
|
457 case FORMAT_32_BIT_FIXED: \
|
|
458 while (((x - 1) & 3) != 0) \
|
|
459 x++; \
|
|
460 break; \
|
|
461 default: \
|
|
462 break; \
|
|
463 } \
|
428
|
464 } while (0)
|
|
465 #else
|
665
|
466 # define VALIDATE_BYTEBPOS_FORWARD(buf, x)
|
428
|
467 #endif
|
|
468
|
826
|
469 /*----------------------------------------------------------------------*/
|
|
470 /* Working with byte positions */
|
|
471 /*----------------------------------------------------------------------*/
|
|
472
|
|
473
|
|
474 /* Given a byte position (assumed to point at the beginning of a
|
|
475 character), modify that value so it points to the beginning of the next
|
|
476 character.
|
|
477
|
|
478 Note that in the simplest case (no MULE, no ERROR_CHECK_TEXT),
|
|
479 this crap reduces down to simply (x)++. */
|
428
|
480
|
665
|
481 #define INC_BYTEBPOS(buf, x) do \
|
428
|
482 { \
|
826
|
483 ASSERT_VALID_BYTEBPOS_FORWARD_UNSAFE (buf, x); \
|
428
|
484 /* Note that we do the increment first to \
|
|
485 make sure that the pointer in \
|
665
|
486 VALIDATE_BYTEBPOS_FORWARD() ends up on \
|
428
|
487 the correct side of the gap */ \
|
|
488 (x)++; \
|
665
|
489 VALIDATE_BYTEBPOS_FORWARD (buf, x); \
|
428
|
490 } while (0)
|
|
491
|
826
|
492 /* Given a byte position (assumed to point at the beginning of a
|
|
493 character), modify that value so it points to the beginning of the
|
867
|
494 previous character. Unlike for DEC_IBYTEPTR(), we can do all the
|
826
|
495 assert()s because there are sentinels at the beginning of the gap and
|
|
496 the end of the buffer.
|
|
497
|
|
498 Note that in the simplest case (no MULE, no ERROR_CHECK_TEXT), this
|
|
499 crap reduces down to simply (x)--. */
|
428
|
500
|
665
|
501 #define DEC_BYTEBPOS(buf, x) do \
|
428
|
502 { \
|
771
|
503 ASSERT_VALID_BYTEBPOS_BACKWARD_UNSAFE (buf, x); \
|
428
|
504 /* Note that we do the decrement first to \
|
|
505 make sure that the pointer in \
|
665
|
506 VALIDATE_BYTEBPOS_BACKWARD() ends up on \
|
428
|
507 the correct side of the gap */ \
|
|
508 (x)--; \
|
665
|
509 VALIDATE_BYTEBPOS_BACKWARD (buf, x); \
|
428
|
510 } while (0)
|
|
511
|
826
|
512 DECLARE_INLINE_HEADER (
|
|
513 Bytebpos
|
2333
|
514 prev_bytebpos (struct buffer *USED_IF_MULE_OR_CHECK_TEXT (buf), Bytebpos x)
|
826
|
515 )
|
428
|
516 {
|
665
|
517 DEC_BYTEBPOS (buf, x);
|
428
|
518 return x;
|
|
519 }
|
|
520
|
826
|
521 DECLARE_INLINE_HEADER (
|
|
522 Bytebpos
|
2333
|
523 next_bytebpos (struct buffer *USED_IF_MULE_OR_CHECK_TEXT (buf), Bytebpos x)
|
826
|
524 )
|
428
|
525 {
|
665
|
526 INC_BYTEBPOS (buf, x);
|
428
|
527 return x;
|
|
528 }
|
|
529
|
826
|
530 /* A constant representing an invalid Bytebpos. Valid Bytebposes
|
|
531 can never have this value. */
|
|
532
|
665
|
533 #define BYTEBPOS_INVALID ((Bytebpos) -1)
|
428
|
534
|
|
535 /*----------------------------------------------------------------------*/
|
826
|
536 /* Converting between byte and character positions */
|
428
|
537 /*----------------------------------------------------------------------*/
|
|
538
|
|
539 #ifdef MULE
|
|
540
|
|
541 /* The basic algorithm we use is to keep track of a known region of
|
771
|
542 characters in each buffer, all of which are of the same width. We keep
|
|
543 track of the boundaries of the region in both Charbpos and Bytebpos
|
|
544 coordinates and also keep track of the char width, which is 1 - 4 bytes.
|
|
545 If the position we're translating is not in the known region, then we
|
|
546 invoke a function to update the known region to surround the position in
|
|
547 question. This assumes locality of reference, which is usually the
|
|
548 case.
|
|
549
|
|
550 Note that the function to update the known region can be simple or
|
|
551 complicated depending on how much information we cache. In addition to
|
|
552 the known region, we always cache the correct conversions for point,
|
|
553 BEGV, and ZV, and in addition to this we cache 16 positions where the
|
|
554 conversion is known. We only look in the cache or update it when we
|
|
555 need to move the known region more than a certain amount (currently 50
|
|
556 chars), and then we throw away a "random" value and replace it with the
|
|
557 newly calculated value.
|
|
558
|
|
559 Finally, we maintain an extra flag that tracks whether the buffer is
|
|
560 entirely ASCII, to speed up the conversions even more. This flag is
|
|
561 actually of dubious value because in an entirely-ASCII buffer the known
|
|
562 region will always span the entire buffer (in fact, we update the flag
|
|
563 based on this fact), and so all we're saving is a few machine cycles.
|
428
|
564
|
771
|
565 A potentially smarter method than what we do with known regions and
|
|
566 cached positions would be to keep some sort of pseudo-extent layer over
|
|
567 the buffer; maybe keep track of the charbpos/bytebpos correspondence at the
|
|
568 beginning of each line, which would allow us to do a binary search over
|
|
569 the pseudo-extents to narrow things down to the correct line, at which
|
|
570 point you could use a linear movement method. This would also mesh well
|
|
571 with efficiently implementing a line-numbering scheme. However, you
|
|
572 have to weigh the amount of time spent updating the cache vs. the
|
|
573 savings that result from it. In reality, we modify the buffer far less
|
|
574 often than we access it, so a cache of this sort that provides
|
|
575 guaranteed LOG (N) performance (or perhaps N * LOG (N), if we set a
|
|
576 maximum on the cache size) would indeed be a win, particularly in very
|
|
577 large buffers. If we ever implement this, we should probably set a
|
|
578 reasonably high minimum below which we use the old method, because the
|
|
579 time spent updating the fancy cache would likely become dominant when
|
|
580 making buffer modifications in smaller buffers.
|
428
|
581
|
771
|
582 Note also that we have to multiply or divide by the char width in order
|
|
583 to convert the positions. We do some tricks to avoid ever actually
|
|
584 having to do a multiply or divide, because that is typically an
|
|
585 expensive operation (esp. divide). Multiplying or dividing by 1, 2, or
|
|
586 4 can be implemented simply as a shift left or shift right, and we keep
|
|
587 track of a shifter value (0, 1, or 2) indicating how much to shift.
|
|
588 Multiplying by 3 can be implemented by doubling and then adding the
|
|
589 original value. Dividing by 3, alas, cannot be implemented in any
|
|
590 simple shift/subtract method, as far as I know; so we just do a table
|
|
591 lookup. For simplicity, we use a table of size 128K, which indexes the
|
|
592 "divide-by-3" values for the first 64K non-negative numbers. (Note that
|
|
593 we can increase the size up to 384K, i.e. indexing the first 192K
|
|
594 non-negative numbers, while still using shorts in the array.) This also
|
|
595 means that the size of the known region can be at most 64K for
|
|
596 width-three characters.
|
|
597
|
|
598 !!#### We should investigate the algorithm in GNU Emacs. I think it
|
|
599 does something similar, but it may differ in some details, and it's
|
|
600 worth seeing if anything can be gleaned.
|
428
|
601 */
|
|
602
|
826
|
603 Bytebpos charbpos_to_bytebpos_func (struct buffer *buf, Charbpos x);
|
|
604 Charbpos bytebpos_to_charbpos_func (struct buffer *buf, Bytebpos x);
|
428
|
605 extern short three_to_one_table[];
|
|
606
|
826
|
607 #endif /* MULE */
|
|
608
|
|
609 /* Given a Charbpos, return the equivalent Bytebpos. */
|
|
610
|
|
611 DECLARE_INLINE_HEADER (
|
|
612 Bytebpos
|
2333
|
613 charbpos_to_bytebpos (struct buffer *USED_IF_MULE_OR_CHECK_TEXT (buf),
|
|
614 Charbpos x)
|
826
|
615 )
|
428
|
616 {
|
826
|
617 Bytebpos retval;
|
|
618 ASSERT_VALID_CHARBPOS_UNSAFE (buf, x);
|
|
619 #ifdef MULE
|
|
620 if (buf->text->entirely_one_byte_p)
|
|
621 retval = (Bytebpos) x;
|
|
622 else if (BUF_FORMAT (buf) == FORMAT_16_BIT_FIXED)
|
|
623 retval = (Bytebpos) (x << 1);
|
|
624 else if (BUF_FORMAT (buf) == FORMAT_32_BIT_FIXED)
|
|
625 retval = (Bytebpos) (x << 2);
|
|
626 else if (x >= buf->text->mule_bufmin && x <= buf->text->mule_bufmax)
|
|
627 retval = (buf->text->mule_bytmin +
|
428
|
628 ((x - buf->text->mule_bufmin) << buf->text->mule_shifter) +
|
814
|
629 (buf->text->mule_three_p ? (x - buf->text->mule_bufmin) :
|
|
630 (Bytebpos) 0));
|
428
|
631 else
|
826
|
632 retval = charbpos_to_bytebpos_func (buf, x);
|
|
633 #else
|
|
634 retval = (Bytebpos) x;
|
|
635 #endif
|
|
636 ASSERT_VALID_BYTEBPOS_UNSAFE (buf, retval);
|
|
637 return retval;
|
|
638 }
|
|
639
|
|
640 /* Given a Bytebpos, return the equivalent Charbpos. */
|
|
641
|
|
642 DECLARE_INLINE_HEADER (
|
|
643 Charbpos
|
2333
|
644 bytebpos_to_charbpos (struct buffer *USED_IF_MULE_OR_CHECK_TEXT (buf),
|
|
645 Bytebpos x)
|
826
|
646 )
|
|
647 {
|
|
648 Charbpos retval;
|
|
649 ASSERT_VALID_BYTEBPOS_UNSAFE (buf, x);
|
|
650 #ifdef MULE
|
|
651 if (buf->text->entirely_one_byte_p)
|
|
652 retval = (Charbpos) x;
|
|
653 else if (BUF_FORMAT (buf) == FORMAT_16_BIT_FIXED)
|
|
654 retval = (Charbpos) (x >> 1);
|
|
655 else if (BUF_FORMAT (buf) == FORMAT_32_BIT_FIXED)
|
|
656 retval = (Charbpos) (x >> 2);
|
|
657 else if (x >= buf->text->mule_bytmin && x <= buf->text->mule_bytmax)
|
|
658 retval = (buf->text->mule_bufmin +
|
|
659 ((buf->text->mule_three_p
|
|
660 ? three_to_one_table[x - buf->text->mule_bytmin]
|
|
661 : (x - buf->text->mule_bytmin) >> buf->text->mule_shifter)));
|
|
662 else
|
|
663 retval = bytebpos_to_charbpos_func (buf, x);
|
|
664 #else
|
|
665 retval = (Charbpos) x;
|
|
666 #endif
|
|
667 ASSERT_VALID_CHARBPOS_UNSAFE (buf, retval);
|
|
668 return retval;
|
|
669 }
|
|
670
|
|
671 /* Given a Bytebpos, return the equivalent Charbpos as a Lisp Object. */
|
|
672
|
|
673 #define make_charbpos(buf, ind) make_int (bytebpos_to_charbpos (buf, ind))
|
|
674
|
|
675 /*----------------------------------------------------------------------*/
|
|
676 /* Converting between byte and memory positions */
|
|
677 /*----------------------------------------------------------------------*/
|
|
678
|
|
679 DECLARE_INLINE_HEADER (
|
|
680 int
|
|
681 valid_membpos_p (struct buffer *buf, Membpos x)
|
|
682 )
|
|
683 {
|
|
684 return ((x >= 1 && x <= (Membpos) buf->text->gpt) ||
|
|
685 (x > (Membpos) (buf->text->gpt + buf->text->gap_size) &&
|
|
686 x <= (Membpos) (buf->text->z + buf->text->gap_size)));
|
428
|
687 }
|
|
688
|
826
|
689 DECLARE_INLINE_HEADER (
|
|
690 Membpos
|
|
691 bytebpos_to_membpos (struct buffer *buf, Bytebpos x)
|
|
692 )
|
|
693 {
|
|
694 ASSERT_VALID_BYTEBPOS_UNSAFE (buf, x);
|
|
695 return (Membpos) ((x > buf->text->gpt) ? (x + buf->text->gap_size) : x);
|
|
696 }
|
|
697
|
|
698
|
|
699 DECLARE_INLINE_HEADER (
|
|
700 Bytebpos
|
|
701 membpos_to_bytebpos (struct buffer *buf, Membpos x)
|
|
702 )
|
|
703 {
|
|
704 Bytebpos retval;
|
|
705 text_checking_assert (valid_membpos_p (buf, x));
|
|
706 retval = (Bytebpos) ((x > (Membpos) buf->text->gpt) ?
|
|
707 x - buf->text->gap_size :
|
|
708 x);
|
|
709 ASSERT_VALID_BYTEBPOS_UNSAFE (buf, retval);
|
|
710 return retval;
|
|
711 }
|
|
712
|
|
713 DECLARE_INLINE_HEADER (
|
|
714 Charbpos
|
|
715 membpos_to_charbpos (struct buffer *buf, Membpos x)
|
|
716 )
|
428
|
717 {
|
826
|
718 return bytebpos_to_charbpos (buf, membpos_to_bytebpos (buf, x));
|
|
719 }
|
|
720
|
|
721 DECLARE_INLINE_HEADER (
|
|
722 Membpos
|
|
723 charbpos_to_membpos (struct buffer *buf, Charbpos x)
|
|
724 )
|
|
725 {
|
|
726 return bytebpos_to_membpos (buf, charbpos_to_bytebpos (buf, x));
|
|
727 }
|
|
728
|
|
729 /*----------------------------------------------------------------------*/
|
|
730 /* Generalized buffer/string position convertors */
|
|
731 /*----------------------------------------------------------------------*/
|
|
732
|
|
733 /* These macros generalize many standard buffer-position functions to
|
|
734 either a buffer or a string. */
|
|
735
|
|
736 /* Converting between Memxpos's and Bytexpos's, for a buffer-or-string.
|
|
737 For strings, this is a no-op. For buffers, this resolves
|
|
738 to the standard membpos<->bytebpos converters. */
|
|
739
|
|
740 DECLARE_INLINE_HEADER (
|
|
741 Memxpos buffer_or_string_bytexpos_to_memxpos (Lisp_Object obj, Bytexpos pos)
|
|
742 )
|
|
743 {
|
|
744 return (BUFFERP (obj) ? bytebpos_to_membpos (XBUFFER (obj), pos) :
|
|
745 (Memxpos) pos);
|
428
|
746 }
|
|
747
|
826
|
748 DECLARE_INLINE_HEADER (
|
|
749 Bytexpos buffer_or_string_memxpos_to_bytexpos (Lisp_Object obj, Memxpos pos)
|
|
750 )
|
|
751 {
|
|
752 return (BUFFERP (obj) ? membpos_to_bytebpos (XBUFFER (obj), pos) :
|
|
753 (Bytexpos) pos);
|
|
754 }
|
|
755
|
|
756 /* Converting between Charxpos's and Bytexpos's, for a buffer-or-string.
|
|
757 For strings, this maps to the bytecount<->charcount converters. */
|
|
758
|
|
759 DECLARE_INLINE_HEADER (
|
|
760 Bytexpos buffer_or_string_charxpos_to_bytexpos (Lisp_Object obj, Charxpos pos)
|
|
761 )
|
|
762 {
|
|
763 return (BUFFERP (obj) ? charbpos_to_bytebpos (XBUFFER (obj), pos) :
|
|
764 (Bytexpos) string_index_char_to_byte (obj, pos));
|
|
765 }
|
|
766
|
|
767 DECLARE_INLINE_HEADER (
|
|
768 Charxpos buffer_or_string_bytexpos_to_charxpos (Lisp_Object obj, Bytexpos pos)
|
|
769 )
|
|
770 {
|
|
771 return (BUFFERP (obj) ? bytebpos_to_charbpos (XBUFFER (obj), pos) :
|
|
772 (Charxpos) string_index_byte_to_char (obj, pos));
|
|
773 }
|
428
|
774
|
826
|
775 /* Similar for Charxpos's and Memxpos's. */
|
|
776
|
|
777 DECLARE_INLINE_HEADER (
|
|
778 Memxpos buffer_or_string_charxpos_to_memxpos (Lisp_Object obj, Charxpos pos)
|
|
779 )
|
|
780 {
|
|
781 return (BUFFERP (obj) ? charbpos_to_membpos (XBUFFER (obj), pos) :
|
|
782 (Memxpos) string_index_char_to_byte (obj, pos));
|
|
783 }
|
428
|
784
|
826
|
785 DECLARE_INLINE_HEADER (
|
|
786 Charxpos buffer_or_string_memxpos_to_charxpos (Lisp_Object obj, Memxpos pos)
|
|
787 )
|
|
788 {
|
|
789 return (BUFFERP (obj) ? membpos_to_charbpos (XBUFFER (obj), pos) :
|
|
790 (Charxpos) string_index_byte_to_char (obj, pos));
|
|
791 }
|
428
|
792
|
826
|
793 DECLARE_INLINE_HEADER (
|
|
794 Internal_Format buffer_or_other_internal_format (Lisp_Object obj)
|
|
795 )
|
|
796 {
|
|
797 return BUFFERP (obj) ? BUF_FORMAT (XBUFFER (obj)) : FORMAT_DEFAULT;
|
|
798 }
|
|
799
|
|
800 /* Return the index to the character before the one at X,
|
|
801 in a buffer or string. */
|
428
|
802
|
826
|
803 DECLARE_INLINE_HEADER (
|
|
804 Bytebpos
|
|
805 prev_bytexpos (Lisp_Object obj, Bytebpos x)
|
|
806 )
|
|
807 {
|
|
808 return BUFFERP (obj) ? prev_bytebpos (XBUFFER (obj), x) :
|
|
809 prev_string_index (obj, x);
|
|
810 }
|
|
811
|
|
812 /* Return the index to the character after the one at X,
|
|
813 in a buffer or string. */
|
428
|
814
|
826
|
815 DECLARE_INLINE_HEADER (
|
|
816 Bytebpos
|
|
817 next_bytexpos (Lisp_Object obj, Bytebpos x)
|
|
818 )
|
|
819 {
|
|
820 return BUFFERP (obj) ? next_bytebpos (XBUFFER (obj), x) :
|
|
821 next_string_index (obj, x);
|
|
822 }
|
|
823
|
|
824 /*----------------------------------------------------------------------*/
|
|
825 /* Converting between positions and addresses */
|
|
826 /*----------------------------------------------------------------------*/
|
428
|
827
|
826
|
828 /* Convert the address of a byte in the buffer into a position. */
|
|
829 DECLARE_INLINE_HEADER (
|
|
830 Bytebpos
|
867
|
831 BYTE_BUF_PTR_BYTE_POS (struct buffer *buf, Ibyte *ptr)
|
826
|
832 )
|
|
833 {
|
|
834 Bytebpos retval = (ptr - buf->text->beg + 1
|
|
835 - ((ptr - buf->text->beg + 1) > buf->text->gpt
|
|
836 ? buf->text->gap_size : (Bytebpos) 0));
|
|
837 ASSERT_VALID_BYTEBPOS_UNSAFE (buf, retval);
|
|
838 return retval;
|
|
839 }
|
|
840
|
|
841 #define BUF_PTR_BYTE_POS(buf, ptr) \
|
|
842 bytebpos_to_charbpos (buf, BYTE_BUF_PTR_BYTE_POS (buf, ptr))
|
428
|
843
|
826
|
844 /* Address of byte at position POS in buffer. */
|
|
845 DECLARE_INLINE_HEADER (
|
867
|
846 Ibyte *
|
826
|
847 BYTE_BUF_BYTE_ADDRESS (struct buffer *buf, Bytebpos pos)
|
|
848 )
|
|
849 {
|
|
850 ASSERT_VALID_BYTEBPOS_UNSAFE (buf, pos);
|
|
851 return BYTE_BUF_BYTE_ADDRESS_NO_VERIFY (buf, pos);
|
|
852 }
|
|
853
|
|
854 #define BUF_BYTE_ADDRESS(buf, pos) \
|
|
855 BYTE_BUF_BYTE_ADDRESS (buf, charbpos_to_bytebpos (buf, pos))
|
428
|
856
|
826
|
857 /* Address of byte before position POS in buffer. */
|
|
858 DECLARE_INLINE_HEADER (
|
867
|
859 Ibyte *
|
826
|
860 BYTE_BUF_BYTE_ADDRESS_BEFORE (struct buffer *buf, Bytebpos pos)
|
|
861 )
|
|
862 {
|
|
863 ASSERT_VALID_BYTEBPOS_UNSAFE (buf, pos);
|
|
864 return (buf->text->beg +
|
|
865 ((pos > buf->text->gpt ? (pos + buf->text->gap_size) : pos)
|
|
866 - 2));
|
|
867 }
|
|
868
|
|
869 #define BUF_BYTE_ADDRESS_BEFORE(buf, pos) \
|
|
870 BYTE_BUF_BYTE_ADDRESS_BEFORE (buf, charbpos_to_bytebpos (buf, pos))
|
428
|
871
|
|
872 /*----------------------------------------------------------------------*/
|
|
873 /* Converting between buffer bytes and Emacs characters */
|
|
874 /*----------------------------------------------------------------------*/
|
|
875
|
|
876 /* The character at position POS in buffer. */
|
826
|
877
|
|
878 #define BYTE_BUF_FETCH_CHAR(buf, pos) \
|
867
|
879 itext_ichar_fmt (BYTE_BUF_BYTE_ADDRESS (buf, pos), BUF_FORMAT (buf), \
|
826
|
880 wrap_buffer (buf))
|
428
|
881 #define BUF_FETCH_CHAR(buf, pos) \
|
826
|
882 BYTE_BUF_FETCH_CHAR (buf, charbpos_to_bytebpos (buf, pos))
|
|
883
|
|
884 /* The "raw value" of the character at position POS in buffer.
|
867
|
885 See ichar_to_raw(). */
|
826
|
886
|
|
887 #define BYTE_BUF_FETCH_CHAR_RAW(buf, pos) \
|
867
|
888 itext_ichar_raw_fmt (BYTE_BUF_BYTE_ADDRESS (buf, pos), BUF_FORMAT (buf))
|
826
|
889 #define BUF_FETCH_CHAR_RAW(buf, pos) \
|
|
890 BYTE_BUF_FETCH_CHAR_RAW (buf, charbpos_to_bytebpos (buf, pos))
|
428
|
891
|
|
892 /* The character at position POS in buffer, as a string. This is
|
867
|
893 equivalent to set_itext_ichar (str, BUF_FETCH_CHAR (buf, pos))
|
428
|
894 but is faster for Mule. */
|
|
895
|
867
|
896 # define BYTE_BUF_ITEXT_COPY_ICHAR(buf, pos, str) \
|
826
|
897 (BUF_FORMAT (buf) == FORMAT_DEFAULT ? \
|
867
|
898 itext_copy_ichar (BYTE_BUF_BYTE_ADDRESS (buf, pos), str) : \
|
|
899 set_itext_ichar (str, BYTE_BUF_FETCH_CHAR (buf, pos)))
|
|
900 #define BUF_ITEXT_COPY_ICHAR(buf, pos, str) \
|
|
901 BYTE_BUF_ITEXT_COPY_ICHAR (buf, charbpos_to_bytebpos (buf, pos), str)
|
428
|
902
|
|
903
|
|
904 /************************************************************************/
|
440
|
905 /* */
|
428
|
906 /* higher-level buffer-position functions */
|
|
907 /* */
|
|
908 /************************************************************************/
|
|
909
|
|
910 /*----------------------------------------------------------------------*/
|
|
911 /* Settor macros for important positions in a buffer */
|
|
912 /*----------------------------------------------------------------------*/
|
|
913
|
|
914 /* Set beginning of accessible range of buffer. */
|
826
|
915 #define SET_BOTH_BUF_BEGV(buf, val, bpval) \
|
428
|
916 do \
|
|
917 { \
|
826
|
918 (buf)->begv = (bpval); \
|
428
|
919 (buf)->bufbegv = (val); \
|
|
920 } while (0)
|
|
921
|
|
922 /* Set end of accessible range of buffer. */
|
826
|
923 #define SET_BOTH_BUF_ZV(buf, val, bpval) \
|
428
|
924 do \
|
|
925 { \
|
826
|
926 (buf)->zv = (bpval); \
|
428
|
927 (buf)->bufzv = (val); \
|
|
928 } while (0)
|
|
929
|
|
930 /* Set point. */
|
|
931 /* Since BEGV and ZV are almost never set, it's reasonable to enforce
|
665
|
932 the restriction that the Charbpos and Bytebpos values must both be
|
428
|
933 specified. However, point is set in lots and lots of places. So
|
|
934 we provide the ability to specify both (for efficiency) or just
|
|
935 one. */
|
826
|
936 #define BOTH_BUF_SET_PT(buf, val, bpval) set_buffer_point (buf, val, bpval)
|
|
937 #define BYTE_BUF_SET_PT(buf, bpval) \
|
|
938 do \
|
|
939 { \
|
|
940 Bytebpos __bpbsp_bpval = (bpval); \
|
|
941 BOTH_BUF_SET_PT (buf, bytebpos_to_charbpos (buf, __bpbsp_bpval), \
|
|
942 __bpbsp_bpval); \
|
|
943 } while (0)
|
|
944 #define BUF_SET_PT(buf, value) \
|
|
945 do \
|
|
946 { \
|
|
947 Bytebpos __bsp_val = (value); \
|
|
948 BOTH_BUF_SET_PT (buf, __bsp_val, charbpos_to_bytebpos (buf, __bsp_val)); \
|
|
949 } while (0)
|
428
|
950
|
|
951
|
|
952 #if 0 /* FSFmacs */
|
|
953 /* These macros exist in FSFmacs because SET_PT() in FSFmacs incorrectly
|
|
954 does too much stuff, such as moving out of invisible extents. */
|
|
955 #define TEMP_SET_PT(position) (temp_set_point ((position), current_buffer))
|
|
956 #define SET_BUF_PT(buf, value) ((buf)->pt = (value))
|
|
957 #endif /* FSFmacs */
|
|
958
|
|
959 /*----------------------------------------------------------------------*/
|
|
960 /* Miscellaneous buffer values */
|
|
961 /*----------------------------------------------------------------------*/
|
|
962
|
|
963 /* Number of characters in buffer */
|
|
964 #define BUF_SIZE(buf) (BUF_Z (buf) - BUF_BEG (buf))
|
|
965
|
|
966 /* Is this buffer narrowed? */
|
|
967 #define BUF_NARROWED(buf) \
|
826
|
968 ((BYTE_BUF_BEGV (buf) != BYTE_BUF_BEG (buf)) || \
|
|
969 (BYTE_BUF_ZV (buf) != BYTE_BUF_Z (buf)))
|
428
|
970
|
826
|
971 /* Modification count */
|
428
|
972 #define BUF_MODIFF(buf) ((buf)->text->modiff)
|
|
973
|
826
|
974 /* Saved modification count */
|
428
|
975 #define BUF_SAVE_MODIFF(buf) ((buf)->text->save_modiff)
|
|
976
|
|
977 /* Face changed. */
|
|
978 #define BUF_FACECHANGE(buf) ((buf)->face_change)
|
|
979
|
826
|
980 DECLARE_INLINE_HEADER (
|
|
981 int
|
|
982 POINT_MARKER_P (Lisp_Object marker)
|
|
983 )
|
|
984 {
|
|
985 return (XMARKER (marker)->buffer != 0 &&
|
|
986 EQ (marker, XMARKER (marker)->buffer->point_marker));
|
|
987 }
|
428
|
988
|
|
989 #define BUF_MARKERS(buf) ((buf)->markers)
|
|
990
|
826
|
991 #ifdef MULE
|
|
992
|
|
993 DECLARE_INLINE_HEADER (
|
|
994 Lisp_Object
|
|
995 BUFFER_CATEGORY_TABLE (struct buffer *buf)
|
|
996 )
|
|
997 {
|
|
998 return buf ? buf->category_table : Vstandard_category_table;
|
|
999 }
|
|
1000
|
|
1001 #endif /* MULE */
|
|
1002
|
|
1003 DECLARE_INLINE_HEADER (
|
|
1004 Lisp_Object
|
|
1005 BUFFER_SYNTAX_TABLE (struct buffer *buf)
|
|
1006 )
|
|
1007 {
|
|
1008 return buf ? buf->syntax_table : Vstandard_syntax_table;
|
|
1009 }
|
|
1010
|
|
1011 DECLARE_INLINE_HEADER (
|
|
1012 Lisp_Object
|
|
1013 BUFFER_MIRROR_SYNTAX_TABLE (struct buffer *buf)
|
|
1014 )
|
|
1015 {
|
|
1016 return buf ? buf->mirror_syntax_table :
|
|
1017 XCHAR_TABLE (Vstandard_syntax_table)->mirror_table;
|
|
1018 }
|
|
1019
|
428
|
1020 /* WARNING:
|
|
1021
|
|
1022 The new definitions of CEILING_OF() and FLOOR_OF() differ semantically
|
|
1023 from the old ones (in FSF Emacs and XEmacs 19.11 and before).
|
|
1024 Conversion is as follows:
|
|
1025
|
826
|
1026 OLD_BYTE_CEILING_OF(n) = NEW_BYTE_CEILING_OF(n) - 1
|
|
1027 OLD_BYTE_FLOOR_OF(n) = NEW_BYTE_FLOOR_OF(n + 1)
|
428
|
1028
|
|
1029 The definitions were changed because the new definitions are more
|
771
|
1030 consistent with the way everything else works in XEmacs.
|
428
|
1031 */
|
|
1032
|
826
|
1033 /* Properties of CEILING_OF and FLOOR_OF (also apply to BYTE_ variants):
|
428
|
1034
|
|
1035 1) FLOOR_OF (CEILING_OF (n)) = n
|
|
1036 CEILING_OF (FLOOR_OF (n)) = n
|
|
1037
|
|
1038 2) CEILING_OF (n) = n if and only if n = ZV
|
|
1039 FLOOR_OF (n) = n if and only if n = BEGV
|
|
1040
|
|
1041 3) CEILING_OF (CEILING_OF (n)) = ZV
|
|
1042 FLOOR_OF (FLOOR_OF (n)) = BEGV
|
|
1043
|
|
1044 4) The bytes in the regions
|
|
1045
|
|
1046 [BYTE_ADDRESS (n), BYTE_ADDRESS_BEFORE (CEILING_OF (n))]
|
|
1047
|
|
1048 and
|
|
1049
|
|
1050 [BYTE_ADDRESS (FLOOR_OF (n)), BYTE_ADDRESS_BEFORE (n)]
|
|
1051
|
|
1052 are contiguous.
|
771
|
1053
|
|
1054 A typical loop using CEILING_OF to process contiguous ranges of text
|
|
1055 between [from, to) looks like this:
|
|
1056
|
|
1057 {
|
|
1058 Bytebpos pos = from;
|
|
1059
|
|
1060 while (pos < to)
|
|
1061 {
|
826
|
1062 Bytebpos ceil = BYTE_BUF_CEILING_OF (buf, pos);
|
771
|
1063 ceil = min (to, ceil);
|
867
|
1064 process_ibyte_string (BYTE_BUF_BYTE_ADDRESS (buf, pos), ceil - pos);
|
771
|
1065 pos = ceil;
|
|
1066 }
|
|
1067 }
|
|
1068
|
|
1069 Currently there will be at most two iterations in the loop, but it is
|
|
1070 written in such a way that it will still work if the buffer
|
|
1071 representation is changed to have multiple gaps in it.
|
|
1072 */
|
428
|
1073
|
|
1074
|
826
|
1075 /* Return the maximum position in the buffer it is safe to scan forwards
|
428
|
1076 past N to. This is used to prevent buffer scans from running into
|
|
1077 the gap (e.g. search.c). All characters between N and CEILING_OF(N)
|
|
1078 are located contiguous in memory. Note that the character *at*
|
|
1079 CEILING_OF(N) is not contiguous in memory. */
|
826
|
1080 #define BYTE_BUF_CEILING_OF(b, n) \
|
|
1081 ((n) < (b)->text->gpt && (b)->text->gpt < BYTE_BUF_ZV (b) ? \
|
|
1082 (b)->text->gpt : BYTE_BUF_ZV (b))
|
428
|
1083 #define BUF_CEILING_OF(b, n) \
|
826
|
1084 bytebpos_to_charbpos (b, BYTE_BUF_CEILING_OF (b, charbpos_to_bytebpos (b, n)))
|
428
|
1085
|
826
|
1086 /* Return the minimum position in the buffer it is safe to scan backwards
|
428
|
1087 past N to. All characters between FLOOR_OF(N) and N are located
|
|
1088 contiguous in memory. Note that the character *at* N may not be
|
|
1089 contiguous in memory. */
|
826
|
1090 #define BYTE_BUF_FLOOR_OF(b, n) \
|
|
1091 (BYTE_BUF_BEGV (b) < (b)->text->gpt && (b)->text->gpt < (n) ? \
|
|
1092 (b)->text->gpt : BYTE_BUF_BEGV (b))
|
428
|
1093 #define BUF_FLOOR_OF(b, n) \
|
826
|
1094 bytebpos_to_charbpos (b, BYTE_BUF_FLOOR_OF (b, charbpos_to_bytebpos (b, n)))
|
428
|
1095
|
826
|
1096 #define BYTE_BUF_CEILING_OF_IGNORE_ACCESSIBLE(b, n) \
|
|
1097 ((n) < (b)->text->gpt && (b)->text->gpt < BYTE_BUF_Z (b) ? \
|
|
1098 (b)->text->gpt : BYTE_BUF_Z (b))
|
428
|
1099 #define BUF_CEILING_OF_IGNORE_ACCESSIBLE(b, n) \
|
665
|
1100 bytebpos_to_charbpos \
|
826
|
1101 (b, BYTE_BUF_CEILING_OF_IGNORE_ACCESSIBLE (b, charbpos_to_bytebpos (b, n)))
|
428
|
1102
|
826
|
1103 #define BYTE_BUF_FLOOR_OF_IGNORE_ACCESSIBLE(b, n) \
|
|
1104 (BYTE_BUF_BEG (b) < (b)->text->gpt && (b)->text->gpt < (n) ? \
|
|
1105 (b)->text->gpt : BYTE_BUF_BEG (b))
|
428
|
1106 #define BUF_FLOOR_OF_IGNORE_ACCESSIBLE(b, n) \
|
665
|
1107 bytebpos_to_charbpos \
|
826
|
1108 (b, BYTE_BUF_FLOOR_OF_IGNORE_ACCESSIBLE (b, charbpos_to_bytebpos (b, n)))
|
|
1109
|
|
1110 /* Iterate over contiguous chunks of text in buffer BUF, starting at POS,
|
|
1111 of length LEN. Evaluates POS and LEN only once, but BUF multiply. In
|
|
1112 each iteration, store the current chunk into RUNPTR/RUNLEN, which will
|
|
1113 be automatically declared (don't declare them yourself). This does not
|
|
1114 respect the limits of accessibility (BUF_BEGV/BUF_ZV); if you want these
|
|
1115 limits respected, you need to impose them yourself.
|
|
1116
|
|
1117 NOTE: This must be surrounded with braces! */
|
|
1118
|
|
1119 #define BUFFER_TEXT_LOOP(buf, pos, len, runptr, runlen) \
|
867
|
1120 Ibyte *runptr; \
|
826
|
1121 Bytecount runlen; \
|
|
1122 Bytebpos BTL_pos = (pos); \
|
|
1123 Bytebpos BTL_len = (len); \
|
|
1124 for (runptr = BYTE_BUF_BYTE_ADDRESS (buf, BTL_pos), \
|
|
1125 runlen = BYTE_BUF_CEILING_OF_IGNORE_ACCESSIBLE (buf, BTL_pos) - BTL_pos, \
|
|
1126 runlen = min (BTL_len, runlen); \
|
|
1127 BTL_len > 0; \
|
|
1128 BTL_pos += runlen, \
|
|
1129 BTL_len -= runlen, \
|
|
1130 runptr = BYTE_BUF_BYTE_ADDRESS (buf, BTL_pos), \
|
|
1131 runlen = BYTE_BUF_CEILING_OF_IGNORE_ACCESSIBLE (buf, BTL_pos) - BTL_pos, \
|
|
1132 runlen = min (BTL_len, runlen))
|
428
|
1133
|
|
1134 /* This structure marks which slots in a buffer have corresponding
|
|
1135 default values in Vbuffer_defaults.
|
|
1136 Each such slot has a nonzero value in this structure.
|
|
1137 The value has only one nonzero bit.
|
|
1138
|
|
1139 When a buffer has its own local value for a slot,
|
|
1140 the bit for that slot (found in the same slot in this structure)
|
|
1141 is turned on in the buffer's local_var_flags slot.
|
|
1142
|
|
1143 If a slot in this structure is zero, then even though there may
|
|
1144 be a DEFVAR_BUFFER_LOCAL for the slot, there is no default value for it;
|
|
1145 and the corresponding slot in Vbuffer_defaults is not used. */
|
|
1146
|
|
1147 extern struct buffer buffer_local_flags;
|
|
1148
|
|
1149
|
|
1150 /* Allocation of buffer data. */
|
|
1151
|
|
1152 #ifdef REL_ALLOC
|
|
1153
|
440
|
1154 char *r_alloc (unsigned char **, size_t);
|
|
1155 char *r_re_alloc (unsigned char **, size_t);
|
428
|
1156 void r_alloc_free (unsigned char **);
|
|
1157
|
|
1158 #define BUFFER_ALLOC(data, size) \
|
867
|
1159 ((Ibyte *) r_alloc ((unsigned char **) &data, (size) * sizeof(Ibyte)))
|
428
|
1160 #define BUFFER_REALLOC(data, size) \
|
867
|
1161 ((Ibyte *) r_re_alloc ((unsigned char **) &data, (size) * sizeof(Ibyte)))
|
428
|
1162 #define BUFFER_FREE(data) r_alloc_free ((unsigned char **) &(data))
|
|
1163 #define R_ALLOC_DECLARE(var,data) r_alloc_declare (&(var), data)
|
|
1164
|
|
1165 #else /* !REL_ALLOC */
|
|
1166
|
|
1167 #define BUFFER_ALLOC(data,size)\
|
867
|
1168 (data = xnew_array (Ibyte, size))
|
428
|
1169 #define BUFFER_REALLOC(data,size)\
|
867
|
1170 ((Ibyte *) xrealloc (data, (size) * sizeof(Ibyte)))
|
428
|
1171 /* Avoid excess parentheses, or syntax errors may rear their heads. */
|
1726
|
1172 #define BUFFER_FREE(data) xfree (data, Ibyte *)
|
428
|
1173 #define R_ALLOC_DECLARE(var,data)
|
|
1174
|
|
1175 #endif /* !REL_ALLOC */
|
|
1176
|
|
1177
|
|
1178 /************************************************************************/
|
|
1179 /* Case conversion */
|
|
1180 /************************************************************************/
|
|
1181
|
|
1182 /* A "trt" table is a mapping from characters to other characters,
|
826
|
1183 typically used to convert between uppercase and lowercase.
|
428
|
1184 */
|
|
1185
|
|
1186 /* The _1 macros are named as such because they assume that you have
|
|
1187 already guaranteed that the character values are all in the range
|
|
1188 0 - 255. Bad lossage will happen otherwise. */
|
|
1189
|
446
|
1190 #define MAKE_TRT_TABLE() Fmake_char_table (Qgeneric)
|
826
|
1191 DECLARE_INLINE_HEADER (
|
867
|
1192 Ichar
|
|
1193 TRT_TABLE_OF (Lisp_Object table, Ichar ch)
|
826
|
1194 )
|
446
|
1195 {
|
|
1196 Lisp_Object TRT_char;
|
826
|
1197 TRT_char = get_char_table (ch, table);
|
446
|
1198 if (NILP (TRT_char))
|
|
1199 return ch;
|
|
1200 else
|
|
1201 return XCHAR (TRT_char);
|
|
1202 }
|
826
|
1203 #define SET_TRT_TABLE_OF(table, ch1, ch2) \
|
|
1204 Fput_char_table (make_char (ch1), make_char (ch2), table)
|
428
|
1205
|
826
|
1206 DECLARE_INLINE_HEADER (
|
|
1207 Lisp_Object
|
771
|
1208 BUFFER_CASE_TABLE (struct buffer *buf)
|
826
|
1209 )
|
771
|
1210 {
|
|
1211 return buf ? buf->case_table : Vstandard_case_table;
|
|
1212 }
|
|
1213
|
428
|
1214 /* Macros used below. */
|
446
|
1215 #define DOWNCASE_TABLE_OF(buf, c) \
|
771
|
1216 TRT_TABLE_OF (XCASE_TABLE_DOWNCASE (BUFFER_CASE_TABLE (buf)), c)
|
446
|
1217 #define UPCASE_TABLE_OF(buf, c) \
|
771
|
1218 TRT_TABLE_OF (XCASE_TABLE_UPCASE (BUFFER_CASE_TABLE (buf)), c)
|
428
|
1219
|
|
1220 /* 1 if CH is upper case. */
|
|
1221
|
826
|
1222 DECLARE_INLINE_HEADER (
|
|
1223 int
|
867
|
1224 UPPERCASEP (struct buffer *buf, Ichar ch)
|
826
|
1225 )
|
428
|
1226 {
|
|
1227 return DOWNCASE_TABLE_OF (buf, ch) != ch;
|
|
1228 }
|
|
1229
|
|
1230 /* 1 if CH is lower case. */
|
|
1231
|
826
|
1232 DECLARE_INLINE_HEADER (
|
|
1233 int
|
867
|
1234 LOWERCASEP (struct buffer *buf, Ichar ch)
|
826
|
1235 )
|
428
|
1236 {
|
|
1237 return (UPCASE_TABLE_OF (buf, ch) != ch &&
|
|
1238 DOWNCASE_TABLE_OF (buf, ch) == ch);
|
|
1239 }
|
|
1240
|
|
1241 /* 1 if CH is neither upper nor lower case. */
|
|
1242
|
826
|
1243 DECLARE_INLINE_HEADER (
|
|
1244 int
|
867
|
1245 NOCASEP (struct buffer *buf, Ichar ch)
|
826
|
1246 )
|
428
|
1247 {
|
|
1248 return UPCASE_TABLE_OF (buf, ch) == ch;
|
|
1249 }
|
|
1250
|
|
1251 /* Upcase a character, or make no change if that cannot be done. */
|
|
1252
|
826
|
1253 DECLARE_INLINE_HEADER (
|
867
|
1254 Ichar
|
|
1255 UPCASE (struct buffer *buf, Ichar ch)
|
826
|
1256 )
|
428
|
1257 {
|
|
1258 return (DOWNCASE_TABLE_OF (buf, ch) == ch) ? UPCASE_TABLE_OF (buf, ch) : ch;
|
|
1259 }
|
|
1260
|
|
1261 /* Upcase a character known to be not upper case. Unused. */
|
|
1262
|
|
1263 #define UPCASE1(buf, ch) UPCASE_TABLE_OF (buf, ch)
|
|
1264
|
|
1265 /* Downcase a character, or make no change if that cannot be done. */
|
|
1266
|
|
1267 #define DOWNCASE(buf, ch) DOWNCASE_TABLE_OF (buf, ch)
|
|
1268
|
440
|
1269 #endif /* INCLUDED_buffer_h_ */
|