428
|
1 /* Header file for the buffer manipulation primitives.
|
|
2 Copyright (C) 1985, 1986, 1992, 1993, 1994, 1995
|
|
3 Free Software Foundation, Inc.
|
|
4 Copyright (C) 1995 Sun Microsystems, Inc.
|
|
5
|
|
6 This file is part of XEmacs.
|
|
7
|
|
8 XEmacs is free software; you can redistribute it and/or modify it
|
|
9 under the terms of the GNU General Public License as published by the
|
|
10 Free Software Foundation; either version 2, or (at your option) any
|
|
11 later version.
|
|
12
|
|
13 XEmacs is distributed in the hope that it will be useful, but WITHOUT
|
|
14 ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
|
15 FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
|
16 for more details.
|
|
17
|
|
18 You should have received a copy of the GNU General Public License
|
|
19 along with XEmacs; see the file COPYING. If not, write to
|
|
20 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
21 Boston, MA 02111-1307, USA. */
|
|
22
|
|
23 /* Synched up with: FSF 19.30. */
|
|
24
|
|
25 /* Authorship:
|
|
26
|
|
27 FSF: long ago.
|
|
28 JWZ: separated out bufslots.h, early in Lemacs.
|
|
29 Ben Wing: almost completely rewritten for Mule, 19.12.
|
|
30 */
|
|
31
|
440
|
32 #ifndef INCLUDED_buffer_h_
|
|
33 #define INCLUDED_buffer_h_
|
428
|
34
|
|
35 #ifdef MULE
|
|
36 #include "mule-charset.h"
|
|
37 #endif
|
|
38
|
446
|
39 #include "casetab.h"
|
|
40 #include "chartab.h"
|
|
41
|
428
|
42 /************************************************************************/
|
|
43 /* */
|
|
44 /* definition of Lisp buffer object */
|
|
45 /* */
|
|
46 /************************************************************************/
|
|
47
|
665
|
48 /* Note: we keep both Bytebpos and Charbpos versions of some of the
|
428
|
49 important buffer positions because they are accessed so much.
|
|
50 If we didn't do this, we would constantly be invalidating the
|
665
|
51 charbpos<->bytebpos cache under Mule.
|
428
|
52
|
|
53 Note that under non-Mule, both versions will always be the
|
|
54 same so we don't really need to keep track of them. But it
|
|
55 simplifies the logic to go ahead and do so all the time and
|
|
56 the memory loss is insignificant. */
|
|
57
|
|
58 /* Formerly, it didn't much matter what went inside the struct buffer_text
|
|
59 and what went outside it. Now it does, with the advent of "indirect
|
|
60 buffers" that share text with another buffer. An indirect buffer
|
|
61 shares the same *text* as another buffer, but has its own buffer-local
|
|
62 variables, its own accessible region, and its own markers and extents.
|
|
63 (Due to the nature of markers, it doesn't actually matter much whether
|
|
64 we stick them inside or out of the struct buffer_text -- the user won't
|
|
65 notice any difference -- but we go ahead and put them outside for
|
|
66 consistency and overall saneness of algorithm.)
|
|
67
|
|
68 FSFmacs gets away with not maintaining any "children" pointers from
|
|
69 a buffer to the indirect buffers that refer to it by putting the
|
|
70 markers inside of the struct buffer_text, using markers to keep track
|
|
71 of BEGV and ZV in indirect buffers, and relying on the fact that
|
|
72 all intervals (text properties and overlays) use markers for their
|
|
73 start and end points. We don't do this for extents (markers are
|
|
74 inefficient anyway and take up space), so we have to maintain
|
|
75 children pointers. This is not terribly hard, though, and the
|
|
76 code to maintain this is just like the code already present in
|
|
77 extent-parent and extent-children.
|
|
78 */
|
|
79
|
|
80 struct buffer_text
|
|
81 {
|
665
|
82 Intbyte *beg; /* Actual address of buffer contents. */
|
|
83 Bytebpos gpt; /* Index of gap in buffer. */
|
|
84 Bytebpos z; /* Index of end of buffer. */
|
|
85 Charbpos bufz; /* Equivalent as a Charbpos. */
|
|
86 Bytecount gap_size;/* Size of buffer's gap */
|
|
87 Bytecount end_gap_size;/* Size of buffer's end gap */
|
428
|
88 long modiff; /* This counts buffer-modification events
|
|
89 for this buffer. It is incremented for
|
|
90 each such event, and never otherwise
|
|
91 changed. */
|
|
92 long save_modiff; /* Previous value of modiff, as of last
|
|
93 time buffer visited or saved a file. */
|
|
94
|
|
95 #ifdef MULE
|
|
96 /* We keep track of a "known" region for very fast access.
|
|
97 This information is text-only so it goes here. */
|
665
|
98 Charbpos mule_bufmin, mule_bufmax;
|
|
99 Bytebpos mule_bytmin, mule_bytmax;
|
428
|
100 int mule_shifter, mule_three_p;
|
|
101
|
|
102 /* And we also cache 16 positions for fairly fast access near those
|
|
103 positions. */
|
665
|
104 Charbpos mule_charbpos_cache[16];
|
|
105 Bytebpos mule_bytebpos_cache[16];
|
428
|
106 #endif
|
|
107
|
|
108 /* Similar to the above, we keep track of positions for which line
|
|
109 number has last been calculated. See line-number.c. */
|
|
110 Lisp_Object line_number_cache;
|
|
111
|
|
112 /* Change data that goes with the text. */
|
|
113 struct buffer_text_change_data *changes;
|
|
114
|
|
115 };
|
|
116
|
|
117 struct buffer
|
|
118 {
|
|
119 struct lcrecord_header header;
|
|
120
|
|
121 /* This structure holds the coordinates of the buffer contents
|
|
122 in ordinary buffers. In indirect buffers, this is not used. */
|
|
123 struct buffer_text own_text;
|
|
124
|
|
125 /* This points to the `struct buffer_text' that is used for this buffer.
|
|
126 In an ordinary buffer, this is the own_text field above.
|
|
127 In an indirect buffer, this is the own_text field of another buffer. */
|
|
128 struct buffer_text *text;
|
|
129
|
665
|
130 Bytebpos pt; /* Position of point in buffer. */
|
|
131 Charbpos bufpt; /* Equivalent as a Charbpos. */
|
|
132 Bytebpos begv; /* Index of beginning of accessible range. */
|
|
133 Charbpos bufbegv; /* Equivalent as a Charbpos. */
|
|
134 Bytebpos zv; /* Index of end of accessible range. */
|
|
135 Charbpos bufzv; /* Equivalent as a Charbpos. */
|
428
|
136
|
|
137 int face_change; /* This is set when a change in how the text should
|
|
138 be displayed (e.g., font, color) is made. */
|
|
139
|
448
|
140 /* Whether buffer specific face is specified. */
|
|
141 int buffer_local_face_property;
|
|
142
|
428
|
143 /* change data indicating what portion of the text has changed
|
|
144 since the last time this was reset. Used by redisplay.
|
|
145 Logically we should keep this with the text structure, but
|
|
146 redisplay resets it for each buffer individually and we don't
|
|
147 want interference between an indirect buffer and its base
|
|
148 buffer. */
|
|
149 struct each_buffer_change_data *changes;
|
|
150
|
|
151 #ifdef REGION_CACHE_NEEDS_WORK
|
|
152 /* If the long line scan cache is enabled (i.e. the buffer-local
|
|
153 variable cache-long-line-scans is non-nil), newline_cache
|
|
154 points to the newline cache, and width_run_cache points to the
|
|
155 width run cache.
|
|
156
|
|
157 The newline cache records which stretches of the buffer are
|
|
158 known *not* to contain newlines, so that they can be skipped
|
|
159 quickly when we search for newlines.
|
|
160
|
|
161 The width run cache records which stretches of the buffer are
|
|
162 known to contain characters whose widths are all the same. If
|
|
163 the width run cache maps a character to a value > 0, that value
|
|
164 is the character's width; if it maps a character to zero, we
|
|
165 don't know what its width is. This allows compute_motion to
|
|
166 process such regions very quickly, using algebra instead of
|
|
167 inspecting each character. See also width_table, below. */
|
|
168 struct region_cache *newline_cache;
|
|
169 struct region_cache *width_run_cache;
|
|
170 #endif /* REGION_CACHE_NEEDS_WORK */
|
|
171
|
|
172 /* The markers that refer to this buffer. This is actually a single
|
|
173 marker -- successive elements in its marker `chain' are the other
|
|
174 markers referring to this buffer */
|
440
|
175 Lisp_Marker *markers;
|
428
|
176
|
|
177 /* The buffer's extent info. This is its own type, an extent-info
|
|
178 object (done this way for ease in marking / finalizing). */
|
|
179 Lisp_Object extent_info;
|
|
180
|
|
181 /* ----------------------------------------------------------------- */
|
|
182 /* All the stuff above this line is the responsibility of insdel.c,
|
|
183 with some help from marker.c and extents.c.
|
|
184 All the stuff below this line is the responsibility of buffer.c. */
|
|
185
|
|
186 /* In an indirect buffer, this points to the base buffer.
|
|
187 In an ordinary buffer, it is 0.
|
|
188 We DO mark through this slot. */
|
|
189 struct buffer *base_buffer;
|
|
190
|
|
191 /* List of indirect buffers whose base is this buffer.
|
|
192 If we are an indirect buffer, this will be nil.
|
|
193 Do NOT mark through this. */
|
|
194 Lisp_Object indirect_children;
|
|
195
|
|
196 /* Flags saying which DEFVAR_PER_BUFFER variables
|
|
197 are local to this buffer. */
|
|
198 int local_var_flags;
|
|
199
|
|
200 /* Set to the modtime of the visited file when read or written.
|
|
201 -1 means visited file was nonexistent.
|
|
202 0 means visited file modtime unknown; in no case complain
|
|
203 about any mismatch on next save attempt. */
|
|
204 int modtime;
|
|
205
|
|
206 /* the value of text->modiff at the last auto-save. */
|
442
|
207 long auto_save_modified;
|
428
|
208
|
|
209 /* The time at which we detected a failure to auto-save,
|
|
210 Or -1 if we didn't have a failure. */
|
|
211 int auto_save_failure_time;
|
|
212
|
|
213 /* Position in buffer at which display started
|
|
214 the last time this buffer was displayed. */
|
|
215 int last_window_start;
|
|
216
|
|
217 /* Everything from here down must be a Lisp_Object */
|
|
218
|
|
219 #define MARKED_SLOT(x) Lisp_Object x
|
|
220 #include "bufslots.h"
|
|
221 #undef MARKED_SLOT
|
|
222 };
|
|
223
|
|
224 DECLARE_LRECORD (buffer, struct buffer);
|
|
225 #define XBUFFER(x) XRECORD (x, buffer, struct buffer)
|
|
226 #define XSETBUFFER(x, p) XSETRECORD (x, p, buffer)
|
617
|
227 #define wrap_buffer(p) wrap_record (p, buffer)
|
428
|
228 #define BUFFERP(x) RECORDP (x, buffer)
|
|
229 #define CHECK_BUFFER(x) CHECK_RECORD (x, buffer)
|
|
230 #define CONCHECK_BUFFER(x) CONCHECK_RECORD (x, buffer)
|
|
231
|
|
232 #define BUFFER_LIVE_P(b) (!NILP ((b)->name))
|
|
233
|
|
234 #define CHECK_LIVE_BUFFER(x) do { \
|
|
235 CHECK_BUFFER (x); \
|
|
236 if (!BUFFER_LIVE_P (XBUFFER (x))) \
|
|
237 dead_wrong_type_argument (Qbuffer_live_p, (x)); \
|
|
238 } while (0)
|
|
239
|
|
240 #define CONCHECK_LIVE_BUFFER(x) do { \
|
|
241 CONCHECK_BUFFER (x); \
|
|
242 if (!BUFFER_LIVE_P (XBUFFER (x))) \
|
|
243 x = wrong_type_argument (Qbuffer_live_p, (x)); \
|
|
244 } while (0)
|
|
245
|
|
246
|
|
247 #define BUFFER_BASE_BUFFER(b) ((b)->base_buffer ? (b)->base_buffer : (b))
|
|
248
|
|
249 /* Map over buffers sharing the same text as MPS_BUF. MPS_BUFVAR is a
|
|
250 variable that gets the buffer values (beginning with the base
|
|
251 buffer, then the children), and MPS_BUFCONS should be a temporary
|
|
252 Lisp_Object variable. */
|
647
|
253 #define MAP_INDIRECT_BUFFERS(mps_buf, mps_bufvar, mps_bufcons) \
|
|
254 for (mps_bufcons = Qunbound, \
|
|
255 mps_bufvar = BUFFER_BASE_BUFFER (mps_buf); \
|
|
256 UNBOUNDP (mps_bufcons) ? \
|
|
257 (mps_bufcons = mps_bufvar->indirect_children, \
|
|
258 1) \
|
|
259 : (!NILP (mps_bufcons) \
|
|
260 && (mps_bufvar = XBUFFER (XCAR (mps_bufcons)), 1) \
|
|
261 && (mps_bufcons = XCDR (mps_bufcons), 1)); \
|
428
|
262 )
|
|
263
|
|
264
|
|
265
|
|
266 /************************************************************************/
|
|
267 /* */
|
|
268 /* working with raw internal-format data */
|
|
269 /* */
|
|
270 /************************************************************************/
|
|
271
|
|
272 /* NOTE: In all the following macros, we follow these rules concerning
|
|
273 multiple evaluation of the arguments:
|
|
274
|
|
275 1) Anything that's an lvalue can be evaluated more than once.
|
|
276 2) Anything that's a Lisp Object can be evaluated more than once.
|
|
277 This should probably be changed, but this follows the way
|
|
278 that all the macros in lisp.h do things.
|
|
279 3) 'struct buffer *' arguments can be evaluated more than once.
|
|
280 4) Nothing else can be evaluated more than once. Use inline
|
|
281 functions, if necessary, to prevent multiple evaluation.
|
|
282 5) An exception to (4) is that there are some macros below that
|
|
283 may evaluate their arguments more than once. They are all
|
|
284 denoted with the word "unsafe" in their name and are generally
|
|
285 meant to be called only by other macros that have already
|
|
286 stored the calling values in temporary variables.
|
|
287
|
|
288
|
|
289 Use the following functions/macros on contiguous strings of data.
|
|
290 If the text you're operating on is known to come from a buffer, use
|
|
291 the buffer-level functions below -- they know about the gap and may
|
|
292 be more efficient.
|
|
293
|
|
294
|
|
295 (A) For working with charptr's (pointers to internally-formatted text):
|
|
296 -----------------------------------------------------------------------
|
|
297
|
|
298 VALID_CHARPTR_P (ptr):
|
|
299 Given a charptr, does it point to the beginning of a character?
|
|
300
|
|
301 ASSERT_VALID_CHARPTR (ptr):
|
|
302 If error-checking is enabled, assert that the given charptr
|
|
303 points to the beginning of a character. Otherwise, do nothing.
|
|
304
|
|
305 INC_CHARPTR (ptr):
|
|
306 Given a charptr (assumed to point at the beginning of a character),
|
|
307 modify that pointer so it points to the beginning of the next
|
|
308 character.
|
|
309
|
|
310 DEC_CHARPTR (ptr):
|
|
311 Given a charptr (assumed to point at the beginning of a
|
|
312 character or at the very end of the text), modify that pointer
|
|
313 so it points to the beginning of the previous character.
|
|
314
|
|
315 VALIDATE_CHARPTR_BACKWARD (ptr):
|
|
316 Make sure that PTR is pointing to the beginning of a character.
|
|
317 If not, back up until this is the case. Note that there are not
|
|
318 too many places where it is legitimate to do this sort of thing.
|
|
319 It's an error if you're passed an "invalid" char * pointer.
|
|
320 NOTE: PTR *must* be pointing to a valid part of the string (i.e.
|
|
321 not the very end, unless the string is zero-terminated or
|
|
322 something) in order for this function to not cause crashes.
|
|
323
|
|
324 VALIDATE_CHARPTR_FORWARD (ptr):
|
|
325 Make sure that PTR is pointing to the beginning of a character.
|
|
326 If not, move forward until this is the case. Note that there
|
|
327 are not too many places where it is legitimate to do this sort
|
|
328 of thing. It's an error if you're passed an "invalid" char *
|
|
329 pointer.
|
|
330
|
|
331
|
|
332 (B) For working with the length (in bytes and characters) of a
|
|
333 section of internally-formatted text:
|
|
334 --------------------------------------------------------------
|
|
335
|
|
336 bytecount_to_charcount (ptr, nbi):
|
|
337 Given a pointer to a text string and a length in bytes,
|
|
338 return the equivalent length in characters.
|
|
339
|
|
340 charcount_to_bytecount (ptr, nch):
|
|
341 Given a pointer to a text string and a length in characters,
|
|
342 return the equivalent length in bytes.
|
|
343
|
|
344 charptr_n_addr (ptr, n):
|
|
345 Return a pointer to the beginning of the character offset N
|
|
346 (in characters) from PTR.
|
|
347
|
|
348
|
|
349 (C) For retrieving or changing the character pointed to by a charptr:
|
|
350 ---------------------------------------------------------------------
|
|
351
|
|
352 charptr_emchar (ptr):
|
|
353 Retrieve the character pointed to by PTR as an Emchar.
|
|
354
|
|
355 charptr_emchar_n (ptr, n):
|
|
356 Retrieve the character at offset N (in characters) from PTR,
|
|
357 as an Emchar.
|
|
358
|
|
359 set_charptr_emchar (ptr, ch):
|
|
360 Store the character CH (an Emchar) as internally-formatted
|
|
361 text starting at PTR. Return the number of bytes stored.
|
|
362
|
|
363 charptr_copy_char (ptr, ptr2):
|
|
364 Retrieve the character pointed to by PTR and store it as
|
|
365 internally-formatted text in PTR2.
|
|
366
|
|
367
|
|
368 (D) For working with Emchars:
|
|
369 -----------------------------
|
|
370
|
|
371 [Note that there are other functions/macros for working with Emchars
|
|
372 in mule-charset.h, for retrieving the charset of an Emchar
|
|
373 and such. These are only valid when MULE is defined.]
|
|
374
|
|
375 valid_char_p (ch):
|
|
376 Return whether the given Emchar is valid.
|
|
377
|
|
378 CHARP (ch):
|
|
379 Return whether the given Lisp_Object is a character.
|
|
380
|
|
381 CHECK_CHAR_COERCE_INT (ch):
|
|
382 Signal an error if CH is not a valid character or integer Lisp_Object.
|
|
383 If CH is an integer Lisp_Object, convert it to a character Lisp_Object,
|
|
384 but merely by repackaging, without performing tests for char validity.
|
|
385
|
|
386 MAX_EMCHAR_LEN:
|
|
387 Maximum number of buffer bytes per Emacs character.
|
|
388
|
|
389 */
|
|
390
|
|
391
|
|
392 /* ---------------------------------------------------------------------- */
|
|
393 /* (A) For working with charptr's (pointers to internally-formatted text) */
|
|
394 /* ---------------------------------------------------------------------- */
|
|
395
|
|
396 #ifdef MULE
|
665
|
397 # define VALID_CHARPTR_P(ptr) INTBYTE_FIRST_BYTE_P (* (unsigned char *) ptr)
|
428
|
398 #else
|
|
399 # define VALID_CHARPTR_P(ptr) 1
|
|
400 #endif
|
|
401
|
665
|
402 #ifdef ERROR_CHECK_CHARBPOS
|
428
|
403 # define ASSERT_VALID_CHARPTR(ptr) assert (VALID_CHARPTR_P (ptr))
|
|
404 #else
|
|
405 # define ASSERT_VALID_CHARPTR(ptr)
|
|
406 #endif
|
|
407
|
|
408 /* Note that INC_CHARPTR() and DEC_CHARPTR() have to be written in
|
|
409 completely separate ways. INC_CHARPTR() cannot use the DEC_CHARPTR()
|
|
410 trick of looking for a valid first byte because it might run off
|
|
411 the end of the string. DEC_CHARPTR() can't use the INC_CHARPTR()
|
|
412 method because it doesn't have easy access to the first byte of
|
|
413 the character it's moving over. */
|
|
414
|
|
415 #define REAL_INC_CHARPTR(ptr) \
|
|
416 ((void) ((ptr) += REP_BYTES_BY_FIRST_BYTE (* (unsigned char *) (ptr))))
|
|
417
|
665
|
418 #define REAL_INC_CHARBYTEBPOS(ptr, pos) \
|
428
|
419 (pos += REP_BYTES_BY_FIRST_BYTE (* (unsigned char *) (ptr)))
|
|
420
|
|
421 #define REAL_DEC_CHARPTR(ptr) do { \
|
|
422 (ptr)--; \
|
|
423 } while (!VALID_CHARPTR_P (ptr))
|
|
424
|
665
|
425 #ifdef ERROR_CHECK_CHARBPOS
|
428
|
426 #define INC_CHARPTR(ptr) do { \
|
|
427 ASSERT_VALID_CHARPTR (ptr); \
|
|
428 REAL_INC_CHARPTR (ptr); \
|
|
429 } while (0)
|
|
430
|
665
|
431 #define INC_CHARBYTEBPOS(ptr, pos) do { \
|
444
|
432 ASSERT_VALID_CHARPTR (ptr); \
|
665
|
433 REAL_INC_CHARBYTEBPOS (ptr, pos); \
|
428
|
434 } while (0)
|
|
435
|
|
436 #define DEC_CHARPTR(ptr) do { \
|
665
|
437 const Intbyte *dc_ptr1 = (ptr); \
|
|
438 const Intbyte *dc_ptr2 = dc_ptr1; \
|
428
|
439 REAL_DEC_CHARPTR (dc_ptr2); \
|
|
440 assert (dc_ptr1 - dc_ptr2 == \
|
|
441 REP_BYTES_BY_FIRST_BYTE (*dc_ptr2)); \
|
665
|
442 (ptr) = (Intbyte *) dc_ptr2; \
|
428
|
443 } while (0)
|
|
444
|
665
|
445 #else /* ! ERROR_CHECK_CHARBPOS */
|
|
446 #define INC_CHARBYTEBPOS(ptr, pos) REAL_INC_CHARBYTEBPOS (ptr, pos)
|
428
|
447 #define INC_CHARPTR(ptr) REAL_INC_CHARPTR (ptr)
|
|
448 #define DEC_CHARPTR(ptr) REAL_DEC_CHARPTR (ptr)
|
665
|
449 #endif /* ! ERROR_CHECK_CHARBPOS */
|
428
|
450
|
|
451 #ifdef MULE
|
|
452
|
|
453 #define VALIDATE_CHARPTR_BACKWARD(ptr) do { \
|
|
454 while (!VALID_CHARPTR_P (ptr)) ptr--; \
|
|
455 } while (0)
|
|
456
|
|
457 /* This needs to be trickier to avoid the possibility of running off
|
|
458 the end of the string. */
|
|
459
|
|
460 #define VALIDATE_CHARPTR_FORWARD(ptr) do { \
|
665
|
461 Intbyte *vcf_ptr = (ptr); \
|
428
|
462 VALIDATE_CHARPTR_BACKWARD (vcf_ptr); \
|
|
463 if (vcf_ptr != (ptr)) \
|
|
464 { \
|
|
465 (ptr) = vcf_ptr; \
|
|
466 INC_CHARPTR (ptr); \
|
|
467 } \
|
|
468 } while (0)
|
|
469
|
|
470 #else /* not MULE */
|
|
471 #define VALIDATE_CHARPTR_BACKWARD(ptr)
|
|
472 #define VALIDATE_CHARPTR_FORWARD(ptr)
|
|
473 #endif /* not MULE */
|
|
474
|
|
475 /* -------------------------------------------------------------- */
|
|
476 /* (B) For working with the length (in bytes and characters) of a */
|
|
477 /* section of internally-formatted text */
|
|
478 /* -------------------------------------------------------------- */
|
|
479
|
665
|
480 INLINE_HEADER const Intbyte *
|
|
481 charptr_n_addr (const Intbyte *ptr, Charcount offset);
|
|
482 INLINE_HEADER const Intbyte *
|
|
483 charptr_n_addr (const Intbyte *ptr, Charcount offset)
|
428
|
484 {
|
|
485 return ptr + charcount_to_bytecount (ptr, offset);
|
|
486 }
|
|
487
|
|
488 /* -------------------------------------------------------------------- */
|
|
489 /* (C) For retrieving or changing the character pointed to by a charptr */
|
|
490 /* -------------------------------------------------------------------- */
|
|
491
|
|
492 #define simple_charptr_emchar(ptr) ((Emchar) (ptr)[0])
|
665
|
493 #define simple_set_charptr_emchar(ptr, x) ((ptr)[0] = (Intbyte) (x), 1)
|
428
|
494 #define simple_charptr_copy_char(ptr, ptr2) ((ptr2)[0] = *(ptr), 1)
|
|
495
|
|
496 #ifdef MULE
|
|
497
|
665
|
498 Emchar non_ascii_charptr_emchar (const Intbyte *ptr);
|
|
499 Bytecount non_ascii_set_charptr_emchar (Intbyte *ptr, Emchar c);
|
|
500 Bytecount non_ascii_charptr_copy_char (const Intbyte *src, Intbyte *dst);
|
428
|
501
|
665
|
502 INLINE_HEADER Emchar charptr_emchar (const Intbyte *ptr);
|
442
|
503 INLINE_HEADER Emchar
|
665
|
504 charptr_emchar (const Intbyte *ptr)
|
428
|
505 {
|
|
506 return BYTE_ASCII_P (*ptr) ?
|
|
507 simple_charptr_emchar (ptr) :
|
|
508 non_ascii_charptr_emchar (ptr);
|
|
509 }
|
|
510
|
665
|
511 INLINE_HEADER Bytecount set_charptr_emchar (Intbyte *ptr, Emchar x);
|
442
|
512 INLINE_HEADER Bytecount
|
665
|
513 set_charptr_emchar (Intbyte *ptr, Emchar x)
|
428
|
514 {
|
|
515 return !CHAR_MULTIBYTE_P (x) ?
|
|
516 simple_set_charptr_emchar (ptr, x) :
|
|
517 non_ascii_set_charptr_emchar (ptr, x);
|
|
518 }
|
|
519
|
444
|
520 /* Copy the character pointed to by SRC into DST.
|
|
521 Return the number of bytes copied. */
|
442
|
522 INLINE_HEADER Bytecount
|
665
|
523 charptr_copy_char (const Intbyte *src, Intbyte *dst);
|
442
|
524 INLINE_HEADER Bytecount
|
665
|
525 charptr_copy_char (const Intbyte *src, Intbyte *dst)
|
428
|
526 {
|
444
|
527 return BYTE_ASCII_P (*src) ?
|
|
528 simple_charptr_copy_char (src, dst) :
|
|
529 non_ascii_charptr_copy_char (src, dst);
|
428
|
530 }
|
|
531
|
|
532 #else /* not MULE */
|
|
533
|
|
534 # define charptr_emchar(ptr) simple_charptr_emchar (ptr)
|
|
535 # define set_charptr_emchar(ptr, x) simple_set_charptr_emchar (ptr, x)
|
|
536 # define charptr_copy_char(ptr, ptr2) simple_charptr_copy_char (ptr, ptr2)
|
|
537
|
|
538 #endif /* not MULE */
|
|
539
|
|
540 #define charptr_emchar_n(ptr, offset) \
|
|
541 charptr_emchar (charptr_n_addr (ptr, offset))
|
|
542
|
|
543
|
|
544 /* ---------------------------- */
|
|
545 /* (D) For working with Emchars */
|
|
546 /* ---------------------------- */
|
|
547
|
|
548 #ifdef MULE
|
|
549
|
|
550 int non_ascii_valid_char_p (Emchar ch);
|
|
551
|
442
|
552 INLINE_HEADER int valid_char_p (Emchar ch);
|
|
553 INLINE_HEADER int
|
428
|
554 valid_char_p (Emchar ch)
|
|
555 {
|
650
|
556 return (! (ch & ~0xFF)) || non_ascii_valid_char_p (ch);
|
428
|
557 }
|
|
558
|
|
559 #else /* not MULE */
|
|
560
|
650
|
561 #define valid_char_p(ch) (! (ch & ~0xFF))
|
428
|
562
|
|
563 #endif /* not MULE */
|
|
564
|
|
565 #define CHAR_INTP(x) (INTP (x) && valid_char_p (XINT (x)))
|
|
566
|
|
567 #define CHAR_OR_CHAR_INTP(x) (CHARP (x) || CHAR_INTP (x))
|
|
568
|
442
|
569 INLINE_HEADER Emchar XCHAR_OR_CHAR_INT (Lisp_Object obj);
|
|
570 INLINE_HEADER Emchar
|
428
|
571 XCHAR_OR_CHAR_INT (Lisp_Object obj)
|
|
572 {
|
|
573 return CHARP (obj) ? XCHAR (obj) : XINT (obj);
|
|
574 }
|
|
575
|
|
576 #define CHECK_CHAR_COERCE_INT(x) do { \
|
|
577 if (CHARP (x)) \
|
|
578 ; \
|
|
579 else if (CHAR_INTP (x)) \
|
|
580 x = make_char (XINT (x)); \
|
|
581 else \
|
|
582 x = wrong_type_argument (Qcharacterp, x); \
|
|
583 } while (0)
|
|
584
|
|
585 #ifdef MULE
|
|
586 # define MAX_EMCHAR_LEN 4
|
|
587 #else
|
|
588 # define MAX_EMCHAR_LEN 1
|
|
589 #endif
|
|
590
|
|
591
|
|
592 /*----------------------------------------------------------------------*/
|
|
593 /* Accessor macros for important positions in a buffer */
|
|
594 /*----------------------------------------------------------------------*/
|
|
595
|
|
596 /* We put them here because some stuff below wants them before the
|
|
597 place where we would normally put them. */
|
|
598
|
|
599 /* None of these are lvalues. Use the settor macros below to change
|
|
600 the positions. */
|
|
601
|
|
602 /* Beginning of buffer. */
|
665
|
603 #define BI_BUF_BEG(buf) ((Bytebpos) 1)
|
|
604 #define BUF_BEG(buf) ((Charbpos) 1)
|
428
|
605
|
|
606 /* Beginning of accessible range of buffer. */
|
|
607 #define BI_BUF_BEGV(buf) ((buf)->begv + 0)
|
|
608 #define BUF_BEGV(buf) ((buf)->bufbegv + 0)
|
|
609
|
|
610 /* End of accessible range of buffer. */
|
|
611 #define BI_BUF_ZV(buf) ((buf)->zv + 0)
|
|
612 #define BUF_ZV(buf) ((buf)->bufzv + 0)
|
|
613
|
|
614 /* End of buffer. */
|
|
615 #define BI_BUF_Z(buf) ((buf)->text->z + 0)
|
|
616 #define BUF_Z(buf) ((buf)->text->bufz + 0)
|
|
617
|
|
618 /* Point. */
|
|
619 #define BI_BUF_PT(buf) ((buf)->pt + 0)
|
|
620 #define BUF_PT(buf) ((buf)->bufpt + 0)
|
|
621
|
|
622 /*----------------------------------------------------------------------*/
|
|
623 /* Converting between positions and addresses */
|
|
624 /*----------------------------------------------------------------------*/
|
|
625
|
|
626 /* Convert the address of a byte in the buffer into a position. */
|
665
|
627 INLINE_HEADER Bytebpos BI_BUF_PTR_BYTE_POS (struct buffer *buf, Intbyte *ptr);
|
|
628 INLINE_HEADER Bytebpos
|
|
629 BI_BUF_PTR_BYTE_POS (struct buffer *buf, Intbyte *ptr)
|
428
|
630 {
|
|
631 return (ptr - buf->text->beg + 1
|
|
632 - ((ptr - buf->text->beg + 1) > buf->text->gpt
|
|
633 ? buf->text->gap_size : 0));
|
|
634 }
|
|
635
|
|
636 #define BUF_PTR_BYTE_POS(buf, ptr) \
|
665
|
637 bytebpos_to_charbpos (buf, BI_BUF_PTR_BYTE_POS (buf, ptr))
|
428
|
638
|
|
639 /* Address of byte at position POS in buffer. */
|
665
|
640 INLINE_HEADER Intbyte * BI_BUF_BYTE_ADDRESS (struct buffer *buf, Bytebpos pos);
|
|
641 INLINE_HEADER Intbyte *
|
|
642 BI_BUF_BYTE_ADDRESS (struct buffer *buf, Bytebpos pos)
|
428
|
643 {
|
|
644 return (buf->text->beg +
|
|
645 ((pos >= buf->text->gpt ? (pos + buf->text->gap_size) : pos)
|
|
646 - 1));
|
|
647 }
|
|
648
|
|
649 #define BUF_BYTE_ADDRESS(buf, pos) \
|
665
|
650 BI_BUF_BYTE_ADDRESS (buf, charbpos_to_bytebpos (buf, pos))
|
428
|
651
|
|
652 /* Address of byte before position POS in buffer. */
|
665
|
653 INLINE_HEADER Intbyte * BI_BUF_BYTE_ADDRESS_BEFORE (struct buffer *buf, Bytebpos pos);
|
|
654 INLINE_HEADER Intbyte *
|
|
655 BI_BUF_BYTE_ADDRESS_BEFORE (struct buffer *buf, Bytebpos pos)
|
428
|
656 {
|
|
657 return (buf->text->beg +
|
|
658 ((pos > buf->text->gpt ? (pos + buf->text->gap_size) : pos)
|
|
659 - 2));
|
|
660 }
|
|
661
|
|
662 #define BUF_BYTE_ADDRESS_BEFORE(buf, pos) \
|
665
|
663 BI_BUF_BYTE_ADDRESS_BEFORE (buf, charbpos_to_bytebpos (buf, pos))
|
428
|
664
|
|
665 /*----------------------------------------------------------------------*/
|
|
666 /* Converting between byte indices and memory indices */
|
|
667 /*----------------------------------------------------------------------*/
|
|
668
|
665
|
669 INLINE_HEADER int valid_membpos_p (struct buffer *buf, Membpos x);
|
442
|
670 INLINE_HEADER int
|
665
|
671 valid_membpos_p (struct buffer *buf, Membpos x)
|
428
|
672 {
|
665
|
673 return ((x >= 1 && x <= (Membpos) buf->text->gpt) ||
|
|
674 (x > (Membpos) (buf->text->gpt + buf->text->gap_size) &&
|
|
675 x <= (Membpos) (buf->text->z + buf->text->gap_size)));
|
428
|
676 }
|
|
677
|
665
|
678 INLINE_HEADER Membpos bytebpos_to_membpos (struct buffer *buf, Bytebpos x);
|
|
679 INLINE_HEADER Membpos
|
|
680 bytebpos_to_membpos (struct buffer *buf, Bytebpos x)
|
428
|
681 {
|
665
|
682 return (Membpos) ((x > buf->text->gpt) ? (x + buf->text->gap_size) : x);
|
428
|
683 }
|
|
684
|
|
685
|
665
|
686 INLINE_HEADER Bytebpos membpos_to_bytebpos (struct buffer *buf, Membpos x);
|
|
687 INLINE_HEADER Bytebpos
|
|
688 membpos_to_bytebpos (struct buffer *buf, Membpos x)
|
428
|
689 {
|
665
|
690 #ifdef ERROR_CHECK_CHARBPOS
|
|
691 assert (valid_membpos_p (buf, x));
|
428
|
692 #endif
|
665
|
693 return (Bytebpos) ((x > (Membpos) buf->text->gpt) ?
|
428
|
694 x - buf->text->gap_size :
|
|
695 x);
|
|
696 }
|
|
697
|
665
|
698 #define membpos_to_charbpos(buf, x) \
|
|
699 bytebpos_to_charbpos (buf, membpos_to_bytebpos (buf, x))
|
|
700 #define charbpos_to_membpos(buf, x) \
|
|
701 bytebpos_to_membpos (buf, charbpos_to_bytebpos (buf, x))
|
428
|
702
|
|
703 /* These macros generalize many standard buffer-position functions to
|
|
704 either a buffer or a string. */
|
|
705
|
665
|
706 /* Converting between Membposs and Bytebposs, for a buffer-or-string.
|
428
|
707 For strings, this is a no-op. For buffers, this resolves
|
665
|
708 to the standard membpos<->bytebpos converters. */
|
428
|
709
|
665
|
710 #define buffer_or_string_bytebpos_to_membpos(obj, ind) \
|
|
711 (BUFFERP (obj) ? bytebpos_to_membpos (XBUFFER (obj), ind) : (Membpos) ind)
|
428
|
712
|
665
|
713 #define buffer_or_string_membpos_to_bytebpos(obj, ind) \
|
|
714 (BUFFERP (obj) ? membpos_to_bytebpos (XBUFFER (obj), ind) : (Bytebpos) ind)
|
428
|
715
|
665
|
716 /* Converting between Charbpos's and Bytebposs, for a buffer-or-string.
|
428
|
717 For strings, this maps to the bytecount<->charcount converters. */
|
|
718
|
665
|
719 #define buffer_or_string_charbpos_to_bytebpos(obj, pos) \
|
|
720 (BUFFERP (obj) ? charbpos_to_bytebpos (XBUFFER (obj), pos) : \
|
|
721 (Bytebpos) charcount_to_bytecount (XSTRING_DATA (obj), pos))
|
428
|
722
|
665
|
723 #define buffer_or_string_bytebpos_to_charbpos(obj, ind) \
|
|
724 (BUFFERP (obj) ? bytebpos_to_charbpos (XBUFFER (obj), ind) : \
|
|
725 (Charbpos) bytecount_to_charcount (XSTRING_DATA (obj), ind))
|
428
|
726
|
665
|
727 /* Similar for Charbpos's and Membposs. */
|
428
|
728
|
665
|
729 #define buffer_or_string_charbpos_to_membpos(obj, pos) \
|
|
730 (BUFFERP (obj) ? charbpos_to_membpos (XBUFFER (obj), pos) : \
|
|
731 (Membpos) charcount_to_bytecount (XSTRING_DATA (obj), pos))
|
428
|
732
|
665
|
733 #define buffer_or_string_membpos_to_charbpos(obj, ind) \
|
|
734 (BUFFERP (obj) ? membpos_to_charbpos (XBUFFER (obj), ind) : \
|
|
735 (Charbpos) bytecount_to_charcount (XSTRING_DATA (obj), ind))
|
428
|
736
|
|
737 /************************************************************************/
|
|
738 /* */
|
|
739 /* working with buffer-level data */
|
|
740 /* */
|
|
741 /************************************************************************/
|
|
742
|
|
743 /*
|
|
744
|
|
745 (A) Working with byte indices:
|
|
746 ------------------------------
|
|
747
|
665
|
748 VALID_BYTEBPOS_P(buf, bi):
|
428
|
749 Given a byte index, does it point to the beginning of a character?
|
|
750
|
665
|
751 ASSERT_VALID_BYTEBPOS_UNSAFE(buf, bi):
|
428
|
752 If error-checking is enabled, assert that the given byte index
|
|
753 is within range and points to the beginning of a character
|
|
754 or to the end of the buffer. Otherwise, do nothing.
|
|
755
|
665
|
756 ASSERT_VALID_BYTEBPOS_BACKWARD_UNSAFE(buf, bi):
|
428
|
757 If error-checking is enabled, assert that the given byte index
|
665
|
758 is within range and satisfies ASSERT_VALID_BYTEBPOS() and also
|
428
|
759 does not refer to the beginning of the buffer. (i.e. movement
|
|
760 backwards is OK.) Otherwise, do nothing.
|
|
761
|
665
|
762 ASSERT_VALID_BYTEBPOS_FORWARD_UNSAFE(buf, bi):
|
428
|
763 If error-checking is enabled, assert that the given byte index
|
665
|
764 is within range and satisfies ASSERT_VALID_BYTEBPOS() and also
|
428
|
765 does not refer to the end of the buffer. (i.e. movement
|
|
766 forwards is OK.) Otherwise, do nothing.
|
|
767
|
665
|
768 VALIDATE_BYTEBPOS_BACKWARD(buf, bi):
|
428
|
769 Make sure that the given byte index is pointing to the beginning
|
|
770 of a character. If not, back up until this is the case. Note
|
|
771 that there are not too many places where it is legitimate to do
|
|
772 this sort of thing. It's an error if you're passed an "invalid"
|
|
773 byte index.
|
|
774
|
665
|
775 VALIDATE_BYTEBPOS_FORWARD(buf, bi):
|
428
|
776 Make sure that the given byte index is pointing to the beginning
|
|
777 of a character. If not, move forward until this is the case.
|
|
778 Note that there are not too many places where it is legitimate
|
|
779 to do this sort of thing. It's an error if you're passed an
|
|
780 "invalid" byte index.
|
|
781
|
665
|
782 INC_BYTEBPOS(buf, bi):
|
428
|
783 Given a byte index (assumed to point at the beginning of a
|
|
784 character), modify that value so it points to the beginning
|
|
785 of the next character.
|
|
786
|
665
|
787 DEC_BYTEBPOS(buf, bi):
|
428
|
788 Given a byte index (assumed to point at the beginning of a
|
|
789 character), modify that value so it points to the beginning
|
|
790 of the previous character. Unlike for DEC_CHARPTR(), we can
|
|
791 do all the assert()s because there are sentinels at the
|
|
792 beginning of the gap and the end of the buffer.
|
|
793
|
665
|
794 BYTEBPOS_INVALID:
|
|
795 A constant representing an invalid Bytebpos. Valid Bytebposs
|
428
|
796 can never have this value.
|
|
797
|
|
798
|
665
|
799 (B) Converting between Charbpos's and Bytebposs:
|
428
|
800 --------------------------------------------
|
|
801
|
665
|
802 charbpos_to_bytebpos(buf, bu):
|
|
803 Given a Charbpos, return the equivalent Bytebpos.
|
428
|
804
|
665
|
805 bytebpos_to_charbpos(buf, bi):
|
|
806 Given a Bytebpos, return the equivalent Charbpos.
|
428
|
807
|
665
|
808 make_charbpos(buf, bi):
|
|
809 Given a Bytebpos, return the equivalent Charbpos as a Lisp Object.
|
428
|
810 */
|
|
811
|
|
812
|
|
813 /*----------------------------------------------------------------------*/
|
|
814 /* working with byte indices */
|
|
815 /*----------------------------------------------------------------------*/
|
|
816
|
|
817 #ifdef MULE
|
665
|
818 # define VALID_BYTEBPOS_P(buf, x) \
|
|
819 INTBYTE_FIRST_BYTE_P (*BI_BUF_BYTE_ADDRESS (buf, x))
|
428
|
820 #else
|
665
|
821 # define VALID_BYTEBPOS_P(buf, x) 1
|
428
|
822 #endif
|
|
823
|
665
|
824 #ifdef ERROR_CHECK_CHARBPOS
|
428
|
825
|
665
|
826 # define ASSERT_VALID_BYTEBPOS_UNSAFE(buf, x) do { \
|
428
|
827 assert (BUFFER_LIVE_P (buf)); \
|
|
828 assert ((x) >= BI_BUF_BEG (buf) && x <= BI_BUF_Z (buf)); \
|
665
|
829 assert (VALID_BYTEBPOS_P (buf, x)); \
|
428
|
830 } while (0)
|
665
|
831 # define ASSERT_VALID_BYTEBPOS_BACKWARD_UNSAFE(buf, x) do { \
|
428
|
832 assert (BUFFER_LIVE_P (buf)); \
|
|
833 assert ((x) > BI_BUF_BEG (buf) && x <= BI_BUF_Z (buf)); \
|
665
|
834 assert (VALID_BYTEBPOS_P (buf, x)); \
|
428
|
835 } while (0)
|
665
|
836 # define ASSERT_VALID_BYTEBPOS_FORWARD_UNSAFE(buf, x) do { \
|
428
|
837 assert (BUFFER_LIVE_P (buf)); \
|
|
838 assert ((x) >= BI_BUF_BEG (buf) && x < BI_BUF_Z (buf)); \
|
665
|
839 assert (VALID_BYTEBPOS_P (buf, x)); \
|
428
|
840 } while (0)
|
|
841
|
665
|
842 #else /* not ERROR_CHECK_CHARBPOS */
|
|
843 # define ASSERT_VALID_BYTEBPOS_UNSAFE(buf, x)
|
|
844 # define ASSERT_VALID_BYTEBPOS_BACKWARD_UNSAFE(buf, x)
|
|
845 # define ASSERT_VALID_BYTEBPOS_FORWARD_UNSAFE(buf, x)
|
428
|
846
|
665
|
847 #endif /* not ERROR_CHECK_CHARBPOS */
|
428
|
848
|
|
849 /* Note that, although the Mule version will work fine for non-Mule
|
|
850 as well (it should reduce down to nothing), we provide a separate
|
|
851 version to avoid compilation warnings and possible non-optimal
|
|
852 results with stupid compilers. */
|
|
853
|
|
854 #ifdef MULE
|
665
|
855 # define VALIDATE_BYTEBPOS_BACKWARD(buf, x) do { \
|
|
856 Intbyte *VBB_ptr = BI_BUF_BYTE_ADDRESS (buf, x); \
|
|
857 while (!INTBYTE_FIRST_BYTE_P (*VBB_ptr)) \
|
428
|
858 VBB_ptr--, (x)--; \
|
|
859 } while (0)
|
|
860 #else
|
665
|
861 # define VALIDATE_BYTEBPOS_BACKWARD(buf, x)
|
428
|
862 #endif
|
|
863
|
|
864 /* Note that, although the Mule version will work fine for non-Mule
|
|
865 as well (it should reduce down to nothing), we provide a separate
|
|
866 version to avoid compilation warnings and possible non-optimal
|
|
867 results with stupid compilers. */
|
|
868
|
|
869 #ifdef MULE
|
665
|
870 # define VALIDATE_BYTEBPOS_FORWARD(buf, x) do { \
|
|
871 Intbyte *VBF_ptr = BI_BUF_BYTE_ADDRESS (buf, x); \
|
|
872 while (!INTBYTE_FIRST_BYTE_P (*VBF_ptr)) \
|
428
|
873 VBF_ptr++, (x)++; \
|
|
874 } while (0)
|
|
875 #else
|
665
|
876 # define VALIDATE_BYTEBPOS_FORWARD(buf, x)
|
428
|
877 #endif
|
|
878
|
665
|
879 /* Note that in the simplest case (no MULE, no ERROR_CHECK_CHARBPOS),
|
428
|
880 this crap reduces down to simply (x)++. */
|
|
881
|
665
|
882 #define INC_BYTEBPOS(buf, x) do \
|
428
|
883 { \
|
665
|
884 ASSERT_VALID_BYTEBPOS_FORWARD_UNSAFE (buf, x); \
|
428
|
885 /* Note that we do the increment first to \
|
|
886 make sure that the pointer in \
|
665
|
887 VALIDATE_BYTEBPOS_FORWARD() ends up on \
|
428
|
888 the correct side of the gap */ \
|
|
889 (x)++; \
|
665
|
890 VALIDATE_BYTEBPOS_FORWARD (buf, x); \
|
428
|
891 } while (0)
|
|
892
|
665
|
893 /* Note that in the simplest case (no MULE, no ERROR_CHECK_CHARBPOS),
|
428
|
894 this crap reduces down to simply (x)--. */
|
|
895
|
665
|
896 #define DEC_BYTEBPOS(buf, x) do \
|
428
|
897 { \
|
665
|
898 ASSERT_VALID_BYTEBPOS_BACKWARD_UNSAFE (buf, x); \
|
428
|
899 /* Note that we do the decrement first to \
|
|
900 make sure that the pointer in \
|
665
|
901 VALIDATE_BYTEBPOS_BACKWARD() ends up on \
|
428
|
902 the correct side of the gap */ \
|
|
903 (x)--; \
|
665
|
904 VALIDATE_BYTEBPOS_BACKWARD (buf, x); \
|
428
|
905 } while (0)
|
|
906
|
665
|
907 INLINE_HEADER Bytebpos prev_bytebpos (struct buffer *buf, Bytebpos x);
|
|
908 INLINE_HEADER Bytebpos
|
|
909 prev_bytebpos (struct buffer *buf, Bytebpos x)
|
428
|
910 {
|
665
|
911 DEC_BYTEBPOS (buf, x);
|
428
|
912 return x;
|
|
913 }
|
|
914
|
665
|
915 INLINE_HEADER Bytebpos next_bytebpos (struct buffer *buf, Bytebpos x);
|
|
916 INLINE_HEADER Bytebpos
|
|
917 next_bytebpos (struct buffer *buf, Bytebpos x)
|
428
|
918 {
|
665
|
919 INC_BYTEBPOS (buf, x);
|
428
|
920 return x;
|
|
921 }
|
|
922
|
665
|
923 #define BYTEBPOS_INVALID ((Bytebpos) -1)
|
428
|
924
|
|
925 /*----------------------------------------------------------------------*/
|
|
926 /* Converting between buffer positions and byte indices */
|
|
927 /*----------------------------------------------------------------------*/
|
|
928
|
|
929 #ifdef MULE
|
|
930
|
665
|
931 Bytebpos charbpos_to_bytebpos_func (struct buffer *buf, Charbpos x);
|
|
932 Charbpos bytebpos_to_charbpos_func (struct buffer *buf, Bytebpos x);
|
428
|
933
|
|
934 /* The basic algorithm we use is to keep track of a known region of
|
|
935 characters in each buffer, all of which are of the same width. We
|
665
|
936 keep track of the boundaries of the region in both Charbpos and
|
|
937 Bytebpos coordinates and also keep track of the char width, which
|
428
|
938 is 1 - 4 bytes. If the position we're translating is not in
|
|
939 the known region, then we invoke a function to update the known
|
|
940 region to surround the position in question. This assumes
|
|
941 locality of reference, which is usually the case.
|
|
942
|
|
943 Note that the function to update the known region can be simple
|
|
944 or complicated depending on how much information we cache.
|
|
945 For the moment, we don't cache any information, and just move
|
|
946 linearly forward or back from the known region, with a few
|
|
947 shortcuts to catch all-ASCII buffers. (Note that this will
|
|
948 thrash with bad locality of reference.) A smarter method would
|
|
949 be to keep some sort of pseudo-extent layer over the buffer;
|
665
|
950 maybe keep track of the charbpos/bytebpos correspondence at the
|
428
|
951 beginning of each line, which would allow us to do a binary
|
|
952 search over the pseudo-extents to narrow things down to the
|
|
953 correct line, at which point you could use a linear movement
|
|
954 method. This would also mesh well with efficiently
|
|
955 implementing a line-numbering scheme.
|
|
956
|
|
957 Note also that we have to multiply or divide by the char width
|
|
958 in order to convert the positions. We do some tricks to avoid
|
|
959 ever actually having to do a multiply or divide, because that
|
|
960 is typically an expensive operation (esp. divide). Multiplying
|
|
961 or dividing by 1, 2, or 4 can be implemented simply as a
|
|
962 shift left or shift right, and we keep track of a shifter value
|
|
963 (0, 1, or 2) indicating how much to shift. Multiplying by 3
|
|
964 can be implemented by doubling and then adding the original
|
|
965 value. Dividing by 3, alas, cannot be implemented in any
|
|
966 simple shift/subtract method, as far as I know; so we just
|
|
967 do a table lookup. For simplicity, we use a table of size
|
|
968 128K, which indexes the "divide-by-3" values for the first
|
|
969 64K non-negative numbers. (Note that we can increase the
|
|
970 size up to 384K, i.e. indexing the first 192K non-negative
|
|
971 numbers, while still using shorts in the array.) This also
|
|
972 means that the size of the known region can be at most
|
|
973 64K for width-three characters.
|
|
974 */
|
|
975
|
|
976 extern short three_to_one_table[];
|
|
977
|
665
|
978 INLINE_HEADER int real_charbpos_to_bytebpos (struct buffer *buf, Charbpos x);
|
442
|
979 INLINE_HEADER int
|
665
|
980 real_charbpos_to_bytebpos (struct buffer *buf, Charbpos x)
|
428
|
981 {
|
|
982 if (x >= buf->text->mule_bufmin && x <= buf->text->mule_bufmax)
|
|
983 return (buf->text->mule_bytmin +
|
|
984 ((x - buf->text->mule_bufmin) << buf->text->mule_shifter) +
|
|
985 (buf->text->mule_three_p ? (x - buf->text->mule_bufmin) : 0));
|
|
986 else
|
665
|
987 return charbpos_to_bytebpos_func (buf, x);
|
428
|
988 }
|
|
989
|
665
|
990 INLINE_HEADER int real_bytebpos_to_charbpos (struct buffer *buf, Bytebpos x);
|
442
|
991 INLINE_HEADER int
|
665
|
992 real_bytebpos_to_charbpos (struct buffer *buf, Bytebpos x)
|
428
|
993 {
|
|
994 if (x >= buf->text->mule_bytmin && x <= buf->text->mule_bytmax)
|
|
995 return (buf->text->mule_bufmin +
|
|
996 ((buf->text->mule_three_p
|
|
997 ? three_to_one_table[x - buf->text->mule_bytmin]
|
|
998 : (x - buf->text->mule_bytmin) >> buf->text->mule_shifter)));
|
|
999 else
|
665
|
1000 return bytebpos_to_charbpos_func (buf, x);
|
428
|
1001 }
|
|
1002
|
|
1003 #else /* not MULE */
|
|
1004
|
665
|
1005 # define real_charbpos_to_bytebpos(buf, x) ((Bytebpos) x)
|
|
1006 # define real_bytebpos_to_charbpos(buf, x) ((Charbpos) x)
|
428
|
1007
|
|
1008 #endif /* not MULE */
|
|
1009
|
665
|
1010 #ifdef ERROR_CHECK_CHARBPOS
|
428
|
1011
|
665
|
1012 Bytebpos charbpos_to_bytebpos (struct buffer *buf, Charbpos x);
|
|
1013 Charbpos bytebpos_to_charbpos (struct buffer *buf, Bytebpos x);
|
428
|
1014
|
665
|
1015 #else /* not ERROR_CHECK_CHARBPOS */
|
428
|
1016
|
665
|
1017 #define charbpos_to_bytebpos real_charbpos_to_bytebpos
|
|
1018 #define bytebpos_to_charbpos real_bytebpos_to_charbpos
|
428
|
1019
|
665
|
1020 #endif /* not ERROR_CHECK_CHARBPOS */
|
428
|
1021
|
665
|
1022 #define make_charbpos(buf, ind) make_int (bytebpos_to_charbpos (buf, ind))
|
428
|
1023
|
|
1024 /*----------------------------------------------------------------------*/
|
|
1025 /* Converting between buffer bytes and Emacs characters */
|
|
1026 /*----------------------------------------------------------------------*/
|
|
1027
|
|
1028 /* The character at position POS in buffer. */
|
|
1029 #define BI_BUF_FETCH_CHAR(buf, pos) \
|
|
1030 charptr_emchar (BI_BUF_BYTE_ADDRESS (buf, pos))
|
|
1031 #define BUF_FETCH_CHAR(buf, pos) \
|
665
|
1032 BI_BUF_FETCH_CHAR (buf, charbpos_to_bytebpos (buf, pos))
|
428
|
1033
|
|
1034 /* The character at position POS in buffer, as a string. This is
|
|
1035 equivalent to set_charptr_emchar (str, BUF_FETCH_CHAR (buf, pos))
|
|
1036 but is faster for Mule. */
|
|
1037
|
|
1038 # define BI_BUF_CHARPTR_COPY_CHAR(buf, pos, str) \
|
|
1039 charptr_copy_char (BI_BUF_BYTE_ADDRESS (buf, pos), str)
|
|
1040 #define BUF_CHARPTR_COPY_CHAR(buf, pos, str) \
|
665
|
1041 BI_BUF_CHARPTR_COPY_CHAR (buf, charbpos_to_bytebpos (buf, pos), str)
|
428
|
1042
|
|
1043
|
|
1044 /************************************************************************/
|
440
|
1045 /* */
|
|
1046 /* Converting between internal and external format */
|
|
1047 /* */
|
428
|
1048 /************************************************************************/
|
440
|
1049 /*
|
|
1050 All client code should use only the two macros
|
428
|
1051
|
440
|
1052 TO_EXTERNAL_FORMAT (source_type, source, sink_type, sink, coding_system)
|
|
1053 TO_INTERNAL_FORMAT (source_type, source, sink_type, sink, coding_system)
|
|
1054
|
|
1055 Typical use is
|
428
|
1056
|
440
|
1057 TO_EXTERNAL_FORMAT (DATA, (ptr, len),
|
|
1058 LISP_BUFFER, buffer,
|
|
1059 Qfile_name);
|
428
|
1060
|
440
|
1061 The source or sink can be specified in one of these ways:
|
428
|
1062
|
440
|
1063 DATA, (ptr, len), // input data is a fixed buffer of size len
|
|
1064 ALLOCA, (ptr, len), // output data is in a alloca()ed buffer of size len
|
|
1065 MALLOC, (ptr, len), // output data is in a malloc()ed buffer of size len
|
444
|
1066 C_STRING_ALLOCA, ptr, // equivalent to ALLOCA (ptr, len_ignored) on output
|
|
1067 C_STRING_MALLOC, ptr, // equivalent to MALLOC (ptr, len_ignored) on output
|
440
|
1068 C_STRING, ptr, // equivalent to DATA, (ptr, strlen (ptr) + 1) on input
|
|
1069 LISP_STRING, string, // input or output is a Lisp_Object of type string
|
|
1070 LISP_BUFFER, buffer, // output is written to (point) in lisp buffer
|
|
1071 LISP_LSTREAM, lstream, // input or output is a Lisp_Object of type lstream
|
|
1072 LISP_OPAQUE, object, // input or output is a Lisp_Object of type opaque
|
428
|
1073
|
440
|
1074 When specifying the sink, use lvalues, since the macro will assign to them,
|
|
1075 except when the sink is an lstream or a lisp buffer.
|
428
|
1076
|
440
|
1077 The macros accept the kinds of sources and sinks appropriate for
|
|
1078 internal and external data representation. See the type_checking_assert
|
|
1079 macros below for the actual allowed types.
|
428
|
1080
|
440
|
1081 Since some sources and sinks use one argument (a Lisp_Object) to
|
|
1082 specify them, while others take a (pointer, length) pair, we use
|
|
1083 some C preprocessor trickery to allow pair arguments to be specified
|
|
1084 by parenthesizing them, as in the examples above.
|
428
|
1085
|
440
|
1086 Anything prefixed by dfc_ (`data format conversion') is private.
|
|
1087 They are only used to implement these macros.
|
428
|
1088
|
440
|
1089 Using C_STRING* is appropriate for using with external APIs that take
|
|
1090 null-terminated strings. For internal data, we should try to be
|
|
1091 '\0'-clean - i.e. allow arbitrary data to contain embedded '\0'.
|
428
|
1092
|
440
|
1093 Sometime in the future we might allow output to C_STRING_ALLOCA or
|
|
1094 C_STRING_MALLOC _only_ with TO_EXTERNAL_FORMAT(), not
|
|
1095 TO_INTERNAL_FORMAT(). */
|
428
|
1096
|
440
|
1097 #define TO_EXTERNAL_FORMAT(source_type, source, sink_type, sink, coding_system) \
|
|
1098 do { \
|
|
1099 dfc_conversion_type dfc_simplified_source_type; \
|
|
1100 dfc_conversion_type dfc_simplified_sink_type; \
|
|
1101 dfc_conversion_data dfc_source; \
|
|
1102 dfc_conversion_data dfc_sink; \
|
|
1103 \
|
|
1104 type_checking_assert \
|
|
1105 ((DFC_TYPE_##source_type == DFC_TYPE_DATA || \
|
|
1106 DFC_TYPE_##source_type == DFC_TYPE_C_STRING || \
|
|
1107 DFC_TYPE_##source_type == DFC_TYPE_LISP_STRING || \
|
|
1108 DFC_TYPE_##source_type == DFC_TYPE_LISP_OPAQUE || \
|
|
1109 DFC_TYPE_##source_type == DFC_TYPE_LISP_LSTREAM) \
|
|
1110 && \
|
|
1111 (DFC_TYPE_##sink_type == DFC_TYPE_ALLOCA || \
|
|
1112 DFC_TYPE_##sink_type == DFC_TYPE_MALLOC || \
|
|
1113 DFC_TYPE_##sink_type == DFC_TYPE_C_STRING_ALLOCA || \
|
|
1114 DFC_TYPE_##sink_type == DFC_TYPE_C_STRING_MALLOC || \
|
|
1115 DFC_TYPE_##sink_type == DFC_TYPE_LISP_LSTREAM || \
|
|
1116 DFC_TYPE_##sink_type == DFC_TYPE_LISP_OPAQUE)); \
|
|
1117 \
|
|
1118 DFC_SOURCE_##source_type##_TO_ARGS (source); \
|
|
1119 DFC_SINK_##sink_type##_TO_ARGS (sink); \
|
|
1120 \
|
|
1121 DFC_CONVERT_TO_EXTERNAL_FORMAT (dfc_simplified_source_type, &dfc_source, \
|
|
1122 coding_system, \
|
|
1123 dfc_simplified_sink_type, &dfc_sink); \
|
|
1124 \
|
|
1125 DFC_##sink_type##_USE_CONVERTED_DATA (sink); \
|
428
|
1126 } while (0)
|
|
1127
|
440
|
1128 #define TO_INTERNAL_FORMAT(source_type, source, sink_type, sink, coding_system) \
|
|
1129 do { \
|
|
1130 dfc_conversion_type dfc_simplified_source_type; \
|
|
1131 dfc_conversion_type dfc_simplified_sink_type; \
|
|
1132 dfc_conversion_data dfc_source; \
|
|
1133 dfc_conversion_data dfc_sink; \
|
|
1134 \
|
|
1135 type_checking_assert \
|
|
1136 ((DFC_TYPE_##source_type == DFC_TYPE_DATA || \
|
|
1137 DFC_TYPE_##source_type == DFC_TYPE_C_STRING || \
|
|
1138 DFC_TYPE_##source_type == DFC_TYPE_LISP_OPAQUE || \
|
|
1139 DFC_TYPE_##source_type == DFC_TYPE_LISP_LSTREAM) \
|
|
1140 && \
|
|
1141 (DFC_TYPE_##sink_type == DFC_TYPE_ALLOCA || \
|
|
1142 DFC_TYPE_##sink_type == DFC_TYPE_MALLOC || \
|
|
1143 DFC_TYPE_##sink_type == DFC_TYPE_C_STRING_ALLOCA || \
|
|
1144 DFC_TYPE_##sink_type == DFC_TYPE_C_STRING_MALLOC || \
|
|
1145 DFC_TYPE_##sink_type == DFC_TYPE_LISP_STRING || \
|
|
1146 DFC_TYPE_##sink_type == DFC_TYPE_LISP_LSTREAM || \
|
|
1147 DFC_TYPE_##sink_type == DFC_TYPE_LISP_BUFFER)); \
|
|
1148 \
|
|
1149 DFC_SOURCE_##source_type##_TO_ARGS (source); \
|
|
1150 DFC_SINK_##sink_type##_TO_ARGS (sink); \
|
|
1151 \
|
|
1152 DFC_CONVERT_TO_INTERNAL_FORMAT (dfc_simplified_source_type, &dfc_source, \
|
|
1153 coding_system, \
|
|
1154 dfc_simplified_sink_type, &dfc_sink); \
|
|
1155 \
|
|
1156 DFC_##sink_type##_USE_CONVERTED_DATA (sink); \
|
428
|
1157 } while (0)
|
|
1158
|
440
|
1159 #ifdef FILE_CODING
|
|
1160 #define DFC_CONVERT_TO_EXTERNAL_FORMAT dfc_convert_to_external_format
|
|
1161 #define DFC_CONVERT_TO_INTERNAL_FORMAT dfc_convert_to_internal_format
|
|
1162 #else
|
|
1163 /* ignore coding_system argument */
|
|
1164 #define DFC_CONVERT_TO_EXTERNAL_FORMAT(a, b, coding_system, c, d) \
|
|
1165 dfc_convert_to_external_format (a, b, c, d)
|
|
1166 #define DFC_CONVERT_TO_INTERNAL_FORMAT(a, b, coding_system, c, d) \
|
|
1167 dfc_convert_to_internal_format (a, b, c, d)
|
|
1168 #endif
|
428
|
1169
|
440
|
1170 typedef union
|
|
1171 {
|
665
|
1172 struct { const void *ptr; Bytecount len; } data;
|
440
|
1173 Lisp_Object lisp_object;
|
|
1174 } dfc_conversion_data;
|
428
|
1175
|
440
|
1176 enum dfc_conversion_type
|
|
1177 {
|
|
1178 DFC_TYPE_DATA,
|
|
1179 DFC_TYPE_ALLOCA,
|
|
1180 DFC_TYPE_MALLOC,
|
|
1181 DFC_TYPE_C_STRING,
|
|
1182 DFC_TYPE_C_STRING_ALLOCA,
|
|
1183 DFC_TYPE_C_STRING_MALLOC,
|
|
1184 DFC_TYPE_LISP_STRING,
|
|
1185 DFC_TYPE_LISP_LSTREAM,
|
|
1186 DFC_TYPE_LISP_OPAQUE,
|
|
1187 DFC_TYPE_LISP_BUFFER
|
|
1188 };
|
|
1189 typedef enum dfc_conversion_type dfc_conversion_type;
|
428
|
1190
|
440
|
1191 /* WARNING: These use a static buffer. This can lead to disaster if
|
|
1192 these functions are not used *very* carefully. Another reason to only use
|
442
|
1193 TO_EXTERNAL_FORMAT() and TO_INTERNAL_FORMAT(). */
|
440
|
1194 void
|
|
1195 dfc_convert_to_external_format (dfc_conversion_type source_type,
|
|
1196 dfc_conversion_data *source,
|
|
1197 #ifdef FILE_CODING
|
|
1198 Lisp_Object coding_system,
|
|
1199 #endif
|
|
1200 dfc_conversion_type sink_type,
|
|
1201 dfc_conversion_data *sink);
|
|
1202 void
|
|
1203 dfc_convert_to_internal_format (dfc_conversion_type source_type,
|
|
1204 dfc_conversion_data *source,
|
|
1205 #ifdef FILE_CODING
|
|
1206 Lisp_Object coding_system,
|
|
1207 #endif
|
|
1208 dfc_conversion_type sink_type,
|
|
1209 dfc_conversion_data *sink);
|
|
1210 /* CPP Trickery */
|
|
1211 #define DFC_CPP_CAR(x,y) (x)
|
|
1212 #define DFC_CPP_CDR(x,y) (y)
|
|
1213
|
|
1214 /* Convert `source' to args for dfc_convert_to_*_format() */
|
|
1215 #define DFC_SOURCE_DATA_TO_ARGS(val) do { \
|
|
1216 dfc_source.data.ptr = DFC_CPP_CAR val; \
|
|
1217 dfc_source.data.len = DFC_CPP_CDR val; \
|
|
1218 dfc_simplified_source_type = DFC_TYPE_DATA; \
|
428
|
1219 } while (0)
|
440
|
1220 #define DFC_SOURCE_C_STRING_TO_ARGS(val) do { \
|
|
1221 dfc_source.data.len = \
|
|
1222 strlen ((char *) (dfc_source.data.ptr = (val))); \
|
|
1223 dfc_simplified_source_type = DFC_TYPE_DATA; \
|
|
1224 } while (0)
|
|
1225 #define DFC_SOURCE_LISP_STRING_TO_ARGS(val) do { \
|
|
1226 Lisp_Object dfc_slsta = (val); \
|
|
1227 type_checking_assert (STRINGP (dfc_slsta)); \
|
|
1228 dfc_source.lisp_object = dfc_slsta; \
|
|
1229 dfc_simplified_source_type = DFC_TYPE_LISP_STRING; \
|
|
1230 } while (0)
|
|
1231 #define DFC_SOURCE_LISP_LSTREAM_TO_ARGS(val) do { \
|
|
1232 Lisp_Object dfc_sllta = (val); \
|
|
1233 type_checking_assert (LSTREAMP (dfc_sllta)); \
|
|
1234 dfc_source.lisp_object = dfc_sllta; \
|
|
1235 dfc_simplified_source_type = DFC_TYPE_LISP_LSTREAM; \
|
|
1236 } while (0)
|
|
1237 #define DFC_SOURCE_LISP_OPAQUE_TO_ARGS(val) do { \
|
|
1238 Lisp_Opaque *dfc_slota = XOPAQUE (val); \
|
|
1239 dfc_source.data.ptr = OPAQUE_DATA (dfc_slota); \
|
|
1240 dfc_source.data.len = OPAQUE_SIZE (dfc_slota); \
|
|
1241 dfc_simplified_source_type = DFC_TYPE_DATA; \
|
428
|
1242 } while (0)
|
|
1243
|
440
|
1244 /* Convert `sink' to args for dfc_convert_to_*_format() */
|
|
1245 #define DFC_SINK_ALLOCA_TO_ARGS(val) \
|
|
1246 dfc_simplified_sink_type = DFC_TYPE_DATA
|
|
1247 #define DFC_SINK_C_STRING_ALLOCA_TO_ARGS(val) \
|
|
1248 dfc_simplified_sink_type = DFC_TYPE_DATA
|
|
1249 #define DFC_SINK_MALLOC_TO_ARGS(val) \
|
|
1250 dfc_simplified_sink_type = DFC_TYPE_DATA
|
|
1251 #define DFC_SINK_C_STRING_MALLOC_TO_ARGS(val) \
|
|
1252 dfc_simplified_sink_type = DFC_TYPE_DATA
|
|
1253 #define DFC_SINK_LISP_STRING_TO_ARGS(val) \
|
|
1254 dfc_simplified_sink_type = DFC_TYPE_DATA
|
|
1255 #define DFC_SINK_LISP_OPAQUE_TO_ARGS(val) \
|
|
1256 dfc_simplified_sink_type = DFC_TYPE_DATA
|
|
1257 #define DFC_SINK_LISP_LSTREAM_TO_ARGS(val) do { \
|
|
1258 Lisp_Object dfc_sllta = (val); \
|
|
1259 type_checking_assert (LSTREAMP (dfc_sllta)); \
|
|
1260 dfc_sink.lisp_object = dfc_sllta; \
|
|
1261 dfc_simplified_sink_type = DFC_TYPE_LISP_LSTREAM; \
|
|
1262 } while (0)
|
|
1263 #define DFC_SINK_LISP_BUFFER_TO_ARGS(val) do { \
|
|
1264 struct buffer *dfc_slbta = XBUFFER (val); \
|
|
1265 dfc_sink.lisp_object = \
|
|
1266 make_lisp_buffer_output_stream \
|
|
1267 (dfc_slbta, BUF_PT (dfc_slbta), 0); \
|
|
1268 dfc_simplified_sink_type = DFC_TYPE_LISP_LSTREAM; \
|
428
|
1269 } while (0)
|
|
1270
|
440
|
1271 /* Assign to the `sink' lvalue(s) using the converted data. */
|
442
|
1272 typedef union { char c; void *p; } *dfc_aliasing_voidpp;
|
440
|
1273 #define DFC_ALLOCA_USE_CONVERTED_DATA(sink) do { \
|
|
1274 void * dfc_sink_ret = alloca (dfc_sink.data.len + 1); \
|
|
1275 memcpy (dfc_sink_ret, dfc_sink.data.ptr, dfc_sink.data.len + 1); \
|
442
|
1276 ((dfc_aliasing_voidpp) &(DFC_CPP_CAR sink))->p = dfc_sink_ret; \
|
440
|
1277 (DFC_CPP_CDR sink) = dfc_sink.data.len; \
|
|
1278 } while (0)
|
|
1279 #define DFC_MALLOC_USE_CONVERTED_DATA(sink) do { \
|
|
1280 void * dfc_sink_ret = xmalloc (dfc_sink.data.len + 1); \
|
|
1281 memcpy (dfc_sink_ret, dfc_sink.data.ptr, dfc_sink.data.len + 1); \
|
442
|
1282 ((dfc_aliasing_voidpp) &(DFC_CPP_CAR sink))->p = dfc_sink_ret; \
|
440
|
1283 (DFC_CPP_CDR sink) = dfc_sink.data.len; \
|
|
1284 } while (0)
|
|
1285 #define DFC_C_STRING_ALLOCA_USE_CONVERTED_DATA(sink) do { \
|
|
1286 void * dfc_sink_ret = alloca (dfc_sink.data.len + 1); \
|
|
1287 memcpy (dfc_sink_ret, dfc_sink.data.ptr, dfc_sink.data.len + 1); \
|
617
|
1288 ((dfc_aliasing_voidpp) &(sink))->p = dfc_sink_ret; \
|
440
|
1289 } while (0)
|
|
1290 #define DFC_C_STRING_MALLOC_USE_CONVERTED_DATA(sink) do { \
|
|
1291 void * dfc_sink_ret = xmalloc (dfc_sink.data.len + 1); \
|
|
1292 memcpy (dfc_sink_ret, dfc_sink.data.ptr, dfc_sink.data.len + 1); \
|
617
|
1293 ((dfc_aliasing_voidpp) &(sink))->p = dfc_sink_ret; \
|
440
|
1294 } while (0)
|
|
1295 #define DFC_LISP_STRING_USE_CONVERTED_DATA(sink) \
|
665
|
1296 sink = make_string ((Intbyte *) dfc_sink.data.ptr, dfc_sink.data.len)
|
440
|
1297 #define DFC_LISP_OPAQUE_USE_CONVERTED_DATA(sink) \
|
|
1298 sink = make_opaque (dfc_sink.data.ptr, dfc_sink.data.len)
|
|
1299 #define DFC_LISP_LSTREAM_USE_CONVERTED_DATA(sink) /* data already used */
|
|
1300 #define DFC_LISP_BUFFER_USE_CONVERTED_DATA(sink) \
|
|
1301 Lstream_delete (XLSTREAM (dfc_sink.lisp_object))
|
428
|
1302
|
440
|
1303 /* Someday we might want to distinguish between Qnative and Qfile_name
|
|
1304 by using coding-system aliases, but for now it suffices to have
|
|
1305 these be identical. Qnative can be used as the coding_system
|
|
1306 argument to TO_EXTERNAL_FORMAT() and TO_INTERNAL_FORMAT(). */
|
|
1307 #define Qnative Qfile_name
|
428
|
1308
|
442
|
1309 #if defined (WIN32_NATIVE) || defined (CYGWIN)
|
|
1310 /* #### kludge!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
|
|
1311 Remove this as soon as my Mule code is integrated. */
|
|
1312 #define Qmswindows_tstr Qnative
|
|
1313 #endif
|
|
1314
|
|
1315 /* More stand-ins */
|
|
1316 #define Qcommand_argument_encoding Qnative
|
|
1317 #define Qenvironment_variable_encoding Qnative
|
|
1318
|
|
1319 /* Convenience macros for extremely common invocations */
|
|
1320 #define C_STRING_TO_EXTERNAL(in, out, coding_system) \
|
|
1321 TO_EXTERNAL_FORMAT (C_STRING, in, C_STRING_ALLOCA, out, coding_system)
|
|
1322 #define C_STRING_TO_EXTERNAL_MALLOC(in, out, coding_system) \
|
|
1323 TO_EXTERNAL_FORMAT (C_STRING, in, C_STRING_MALLOC, out, coding_system)
|
|
1324 #define EXTERNAL_TO_C_STRING(in, out, coding_system) \
|
|
1325 TO_INTERNAL_FORMAT (C_STRING, in, C_STRING_ALLOCA, out, coding_system)
|
|
1326 #define EXTERNAL_TO_C_STRING_MALLOC(in, out, coding_system) \
|
|
1327 TO_INTERNAL_FORMAT (C_STRING, in, C_STRING_MALLOC, out, coding_system)
|
|
1328 #define LISP_STRING_TO_EXTERNAL(in, out, coding_system) \
|
|
1329 TO_EXTERNAL_FORMAT (LISP_STRING, in, C_STRING_ALLOCA, out, coding_system)
|
|
1330 #define LISP_STRING_TO_EXTERNAL_MALLOC(in, out, coding_system) \
|
|
1331 TO_EXTERNAL_FORMAT (LISP_STRING, in, C_STRING_MALLOC, out, coding_system)
|
|
1332
|
428
|
1333
|
|
1334 /************************************************************************/
|
|
1335 /* */
|
|
1336 /* fake charset functions */
|
|
1337 /* */
|
|
1338 /************************************************************************/
|
|
1339
|
|
1340 /* used when MULE is not defined, so that Charset-type stuff can still
|
|
1341 be done */
|
|
1342
|
|
1343 #ifndef MULE
|
|
1344
|
|
1345 #define Vcharset_ascii Qnil
|
|
1346
|
|
1347 #define CHAR_CHARSET(ch) Vcharset_ascii
|
|
1348 #define CHAR_LEADING_BYTE(ch) LEADING_BYTE_ASCII
|
|
1349 #define LEADING_BYTE_ASCII 0x80
|
|
1350 #define NUM_LEADING_BYTES 1
|
|
1351 #define MIN_LEADING_BYTE 0x80
|
|
1352 #define CHARSETP(cs) 1
|
|
1353 #define CHARSET_BY_LEADING_BYTE(lb) Vcharset_ascii
|
|
1354 #define XCHARSET_LEADING_BYTE(cs) LEADING_BYTE_ASCII
|
|
1355 #define XCHARSET_GRAPHIC(cs) -1
|
|
1356 #define XCHARSET_COLUMNS(cs) 1
|
|
1357 #define XCHARSET_DIMENSION(cs) 1
|
|
1358 #define REP_BYTES_BY_FIRST_BYTE(fb) 1
|
|
1359 #define BREAKUP_CHAR(ch, charset, byte1, byte2) do { \
|
|
1360 (charset) = Vcharset_ascii; \
|
|
1361 (byte1) = (ch); \
|
|
1362 (byte2) = 0; \
|
|
1363 } while (0)
|
|
1364 #define BYTE_ASCII_P(byte) 1
|
|
1365
|
|
1366 #endif /* ! MULE */
|
|
1367
|
|
1368 /************************************************************************/
|
|
1369 /* */
|
|
1370 /* higher-level buffer-position functions */
|
|
1371 /* */
|
|
1372 /************************************************************************/
|
|
1373
|
|
1374 /*----------------------------------------------------------------------*/
|
|
1375 /* Settor macros for important positions in a buffer */
|
|
1376 /*----------------------------------------------------------------------*/
|
|
1377
|
|
1378 /* Set beginning of accessible range of buffer. */
|
|
1379 #define SET_BOTH_BUF_BEGV(buf, val, bival) \
|
|
1380 do \
|
|
1381 { \
|
|
1382 (buf)->begv = (bival); \
|
|
1383 (buf)->bufbegv = (val); \
|
|
1384 } while (0)
|
|
1385
|
|
1386 /* Set end of accessible range of buffer. */
|
|
1387 #define SET_BOTH_BUF_ZV(buf, val, bival) \
|
|
1388 do \
|
|
1389 { \
|
|
1390 (buf)->zv = (bival); \
|
|
1391 (buf)->bufzv = (val); \
|
|
1392 } while (0)
|
|
1393
|
|
1394 /* Set point. */
|
|
1395 /* Since BEGV and ZV are almost never set, it's reasonable to enforce
|
665
|
1396 the restriction that the Charbpos and Bytebpos values must both be
|
428
|
1397 specified. However, point is set in lots and lots of places. So
|
|
1398 we provide the ability to specify both (for efficiency) or just
|
|
1399 one. */
|
|
1400 #define BOTH_BUF_SET_PT(buf, val, bival) set_buffer_point (buf, val, bival)
|
|
1401 #define BI_BUF_SET_PT(buf, bival) \
|
665
|
1402 BOTH_BUF_SET_PT (buf, bytebpos_to_charbpos (buf, bival), bival)
|
428
|
1403 #define BUF_SET_PT(buf, value) \
|
665
|
1404 BOTH_BUF_SET_PT (buf, value, charbpos_to_bytebpos (buf, value))
|
428
|
1405
|
|
1406
|
|
1407 #if 0 /* FSFmacs */
|
|
1408 /* These macros exist in FSFmacs because SET_PT() in FSFmacs incorrectly
|
|
1409 does too much stuff, such as moving out of invisible extents. */
|
|
1410 #define TEMP_SET_PT(position) (temp_set_point ((position), current_buffer))
|
|
1411 #define SET_BUF_PT(buf, value) ((buf)->pt = (value))
|
|
1412 #endif /* FSFmacs */
|
|
1413
|
|
1414 /*----------------------------------------------------------------------*/
|
|
1415 /* Miscellaneous buffer values */
|
|
1416 /*----------------------------------------------------------------------*/
|
|
1417
|
|
1418 /* Number of characters in buffer */
|
|
1419 #define BUF_SIZE(buf) (BUF_Z (buf) - BUF_BEG (buf))
|
|
1420
|
|
1421 /* Is this buffer narrowed? */
|
|
1422 #define BUF_NARROWED(buf) \
|
|
1423 ((BI_BUF_BEGV (buf) != BI_BUF_BEG (buf)) || \
|
|
1424 (BI_BUF_ZV (buf) != BI_BUF_Z (buf)))
|
|
1425
|
|
1426 /* Modification count. */
|
|
1427 #define BUF_MODIFF(buf) ((buf)->text->modiff)
|
|
1428
|
|
1429 /* Saved modification count. */
|
|
1430 #define BUF_SAVE_MODIFF(buf) ((buf)->text->save_modiff)
|
|
1431
|
|
1432 /* Face changed. */
|
|
1433 #define BUF_FACECHANGE(buf) ((buf)->face_change)
|
|
1434
|
|
1435 #define POINT_MARKER_P(marker) \
|
|
1436 (XMARKER (marker)->buffer != 0 && \
|
434
|
1437 EQ (marker, XMARKER (marker)->buffer->point_marker))
|
428
|
1438
|
|
1439 #define BUF_MARKERS(buf) ((buf)->markers)
|
|
1440
|
|
1441 /* WARNING:
|
|
1442
|
|
1443 The new definitions of CEILING_OF() and FLOOR_OF() differ semantically
|
|
1444 from the old ones (in FSF Emacs and XEmacs 19.11 and before).
|
|
1445 Conversion is as follows:
|
|
1446
|
|
1447 OLD_BI_CEILING_OF(n) = NEW_BI_CEILING_OF(n) - 1
|
|
1448 OLD_BI_FLOOR_OF(n) = NEW_BI_FLOOR_OF(n + 1)
|
|
1449
|
|
1450 The definitions were changed because the new definitions are more
|
|
1451 consistent with the way everything else works in Emacs.
|
|
1452 */
|
|
1453
|
|
1454 /* Properties of CEILING_OF and FLOOR_OF (also apply to BI_ variants):
|
|
1455
|
|
1456 1) FLOOR_OF (CEILING_OF (n)) = n
|
|
1457 CEILING_OF (FLOOR_OF (n)) = n
|
|
1458
|
|
1459 2) CEILING_OF (n) = n if and only if n = ZV
|
|
1460 FLOOR_OF (n) = n if and only if n = BEGV
|
|
1461
|
|
1462 3) CEILING_OF (CEILING_OF (n)) = ZV
|
|
1463 FLOOR_OF (FLOOR_OF (n)) = BEGV
|
|
1464
|
|
1465 4) The bytes in the regions
|
|
1466
|
|
1467 [BYTE_ADDRESS (n), BYTE_ADDRESS_BEFORE (CEILING_OF (n))]
|
|
1468
|
|
1469 and
|
|
1470
|
|
1471 [BYTE_ADDRESS (FLOOR_OF (n)), BYTE_ADDRESS_BEFORE (n)]
|
|
1472
|
|
1473 are contiguous.
|
|
1474 */
|
|
1475
|
|
1476
|
|
1477 /* Return the maximum index in the buffer it is safe to scan forwards
|
|
1478 past N to. This is used to prevent buffer scans from running into
|
|
1479 the gap (e.g. search.c). All characters between N and CEILING_OF(N)
|
|
1480 are located contiguous in memory. Note that the character *at*
|
|
1481 CEILING_OF(N) is not contiguous in memory. */
|
|
1482 #define BI_BUF_CEILING_OF(b, n) \
|
|
1483 ((n) < (b)->text->gpt && (b)->text->gpt < BI_BUF_ZV (b) ? \
|
|
1484 (b)->text->gpt : BI_BUF_ZV (b))
|
|
1485 #define BUF_CEILING_OF(b, n) \
|
665
|
1486 bytebpos_to_charbpos (b, BI_BUF_CEILING_OF (b, charbpos_to_bytebpos (b, n)))
|
428
|
1487
|
|
1488 /* Return the minimum index in the buffer it is safe to scan backwards
|
|
1489 past N to. All characters between FLOOR_OF(N) and N are located
|
|
1490 contiguous in memory. Note that the character *at* N may not be
|
|
1491 contiguous in memory. */
|
|
1492 #define BI_BUF_FLOOR_OF(b, n) \
|
|
1493 (BI_BUF_BEGV (b) < (b)->text->gpt && (b)->text->gpt < (n) ? \
|
|
1494 (b)->text->gpt : BI_BUF_BEGV (b))
|
|
1495 #define BUF_FLOOR_OF(b, n) \
|
665
|
1496 bytebpos_to_charbpos (b, BI_BUF_FLOOR_OF (b, charbpos_to_bytebpos (b, n)))
|
428
|
1497
|
|
1498 #define BI_BUF_CEILING_OF_IGNORE_ACCESSIBLE(b, n) \
|
|
1499 ((n) < (b)->text->gpt && (b)->text->gpt < BI_BUF_Z (b) ? \
|
|
1500 (b)->text->gpt : BI_BUF_Z (b))
|
|
1501 #define BUF_CEILING_OF_IGNORE_ACCESSIBLE(b, n) \
|
665
|
1502 bytebpos_to_charbpos \
|
|
1503 (b, BI_BUF_CEILING_OF_IGNORE_ACCESSIBLE (b, charbpos_to_bytebpos (b, n)))
|
428
|
1504
|
|
1505 #define BI_BUF_FLOOR_OF_IGNORE_ACCESSIBLE(b, n) \
|
|
1506 (BI_BUF_BEG (b) < (b)->text->gpt && (b)->text->gpt < (n) ? \
|
|
1507 (b)->text->gpt : BI_BUF_BEG (b))
|
|
1508 #define BUF_FLOOR_OF_IGNORE_ACCESSIBLE(b, n) \
|
665
|
1509 bytebpos_to_charbpos \
|
|
1510 (b, BI_BUF_FLOOR_OF_IGNORE_ACCESSIBLE (b, charbpos_to_bytebpos (b, n)))
|
428
|
1511
|
|
1512
|
|
1513 extern struct buffer *current_buffer;
|
|
1514
|
|
1515 /* This is the initial (startup) directory, as used for the *scratch* buffer.
|
|
1516 We're making this a global to make others aware of the startup directory.
|
|
1517 `initial_directory' is stored in external format.
|
|
1518 */
|
|
1519 extern char initial_directory[];
|
|
1520 extern void init_initial_directory (void); /* initialize initial_directory */
|
|
1521
|
|
1522 EXFUN (Fbuffer_disable_undo, 1);
|
|
1523 EXFUN (Fbuffer_modified_p, 1);
|
|
1524 EXFUN (Fbuffer_name, 1);
|
|
1525 EXFUN (Fcurrent_buffer, 0);
|
|
1526 EXFUN (Ferase_buffer, 1);
|
|
1527 EXFUN (Fget_buffer, 1);
|
|
1528 EXFUN (Fget_buffer_create, 1);
|
|
1529 EXFUN (Fget_file_buffer, 1);
|
|
1530 EXFUN (Fkill_buffer, 1);
|
|
1531 EXFUN (Fother_buffer, 3);
|
|
1532 EXFUN (Frecord_buffer, 1);
|
|
1533 EXFUN (Fset_buffer, 1);
|
|
1534 EXFUN (Fset_buffer_modified_p, 2);
|
|
1535
|
|
1536 extern Lisp_Object QSscratch, Qafter_change_function, Qafter_change_functions;
|
|
1537 extern Lisp_Object Qbefore_change_function, Qbefore_change_functions;
|
|
1538 extern Lisp_Object Qbuffer_or_string_p, Qdefault_directory, Qfirst_change_hook;
|
|
1539 extern Lisp_Object Qpermanent_local, Vafter_change_function;
|
|
1540 extern Lisp_Object Vafter_change_functions, Vbefore_change_function;
|
|
1541 extern Lisp_Object Vbefore_change_functions, Vbuffer_alist, Vbuffer_defaults;
|
|
1542 extern Lisp_Object Vinhibit_read_only, Vtransient_mark_mode;
|
|
1543
|
|
1544 /* This structure marks which slots in a buffer have corresponding
|
|
1545 default values in Vbuffer_defaults.
|
|
1546 Each such slot has a nonzero value in this structure.
|
|
1547 The value has only one nonzero bit.
|
|
1548
|
|
1549 When a buffer has its own local value for a slot,
|
|
1550 the bit for that slot (found in the same slot in this structure)
|
|
1551 is turned on in the buffer's local_var_flags slot.
|
|
1552
|
|
1553 If a slot in this structure is zero, then even though there may
|
|
1554 be a DEFVAR_BUFFER_LOCAL for the slot, there is no default value for it;
|
|
1555 and the corresponding slot in Vbuffer_defaults is not used. */
|
|
1556
|
|
1557 extern struct buffer buffer_local_flags;
|
|
1558
|
|
1559
|
|
1560 /* Allocation of buffer data. */
|
|
1561
|
|
1562 #ifdef REL_ALLOC
|
|
1563
|
440
|
1564 char *r_alloc (unsigned char **, size_t);
|
|
1565 char *r_re_alloc (unsigned char **, size_t);
|
428
|
1566 void r_alloc_free (unsigned char **);
|
|
1567
|
|
1568 #define BUFFER_ALLOC(data, size) \
|
665
|
1569 ((Intbyte *) r_alloc ((unsigned char **) &data, (size) * sizeof(Intbyte)))
|
428
|
1570 #define BUFFER_REALLOC(data, size) \
|
665
|
1571 ((Intbyte *) r_re_alloc ((unsigned char **) &data, (size) * sizeof(Intbyte)))
|
428
|
1572 #define BUFFER_FREE(data) r_alloc_free ((unsigned char **) &(data))
|
|
1573 #define R_ALLOC_DECLARE(var,data) r_alloc_declare (&(var), data)
|
|
1574
|
|
1575 #else /* !REL_ALLOC */
|
|
1576
|
|
1577 #define BUFFER_ALLOC(data,size)\
|
665
|
1578 (data = xnew_array (Intbyte, size))
|
428
|
1579 #define BUFFER_REALLOC(data,size)\
|
665
|
1580 ((Intbyte *) xrealloc (data, (size) * sizeof(Intbyte)))
|
428
|
1581 /* Avoid excess parentheses, or syntax errors may rear their heads. */
|
|
1582 #define BUFFER_FREE(data) xfree (data)
|
|
1583 #define R_ALLOC_DECLARE(var,data)
|
|
1584
|
|
1585 #endif /* !REL_ALLOC */
|
|
1586
|
|
1587 extern Lisp_Object Vbuffer_alist;
|
|
1588 void set_buffer_internal (struct buffer *b);
|
|
1589 struct buffer *decode_buffer (Lisp_Object buffer, int allow_string);
|
|
1590
|
|
1591 /* from editfns.c */
|
|
1592 void widen_buffer (struct buffer *b, int no_clip);
|
665
|
1593 int beginning_of_line_p (struct buffer *b, Charbpos pt);
|
428
|
1594
|
|
1595 /* from insdel.c */
|
665
|
1596 void set_buffer_point (struct buffer *buf, Charbpos pos, Bytebpos bipos);
|
|
1597 void find_charsets_in_intbyte_string (unsigned char *charsets,
|
|
1598 const Intbyte *str,
|
428
|
1599 Bytecount len);
|
|
1600 void find_charsets_in_emchar_string (unsigned char *charsets,
|
442
|
1601 const Emchar *str,
|
428
|
1602 Charcount len);
|
665
|
1603 int intbyte_string_displayed_columns (const Intbyte *str, Bytecount len);
|
442
|
1604 int emchar_string_displayed_columns (const Emchar *str, Charcount len);
|
665
|
1605 void convert_intbyte_string_into_emchar_dynarr (const Intbyte *str,
|
428
|
1606 Bytecount len,
|
|
1607 Emchar_dynarr *dyn);
|
665
|
1608 Charcount convert_intbyte_string_into_emchar_string (const Intbyte *str,
|
428
|
1609 Bytecount len,
|
|
1610 Emchar *arr);
|
665
|
1611 void convert_emchar_string_into_intbyte_dynarr (Emchar *arr, int nels,
|
|
1612 Intbyte_dynarr *dyn);
|
|
1613 Intbyte *convert_emchar_string_into_malloced_string (Emchar *arr, int nels,
|
428
|
1614 Bytecount *len_out);
|
|
1615 /* from marker.c */
|
|
1616 void init_buffer_markers (struct buffer *b);
|
|
1617 void uninit_buffer_markers (struct buffer *b);
|
|
1618
|
|
1619 /* flags for get_buffer_pos_char(), get_buffer_range_char(), etc. */
|
|
1620 /* At most one of GB_COERCE_RANGE and GB_NO_ERROR_IF_BAD should be
|
|
1621 specified. At most one of GB_NEGATIVE_FROM_END and GB_NO_ERROR_IF_BAD
|
|
1622 should be specified. */
|
|
1623
|
|
1624 #define GB_ALLOW_PAST_ACCESSIBLE (1 << 0)
|
|
1625 #define GB_ALLOW_NIL (1 << 1)
|
|
1626 #define GB_CHECK_ORDER (1 << 2)
|
|
1627 #define GB_COERCE_RANGE (1 << 3)
|
|
1628 #define GB_NO_ERROR_IF_BAD (1 << 4)
|
|
1629 #define GB_NEGATIVE_FROM_END (1 << 5)
|
|
1630 #define GB_HISTORICAL_STRING_BEHAVIOR (GB_NEGATIVE_FROM_END | GB_ALLOW_NIL)
|
|
1631
|
665
|
1632 Charbpos get_buffer_pos_char (struct buffer *b, Lisp_Object pos,
|
428
|
1633 unsigned int flags);
|
665
|
1634 Bytebpos get_buffer_pos_byte (struct buffer *b, Lisp_Object pos,
|
428
|
1635 unsigned int flags);
|
|
1636 void get_buffer_range_char (struct buffer *b, Lisp_Object from, Lisp_Object to,
|
665
|
1637 Charbpos *from_out, Charbpos *to_out,
|
428
|
1638 unsigned int flags);
|
|
1639 void get_buffer_range_byte (struct buffer *b, Lisp_Object from, Lisp_Object to,
|
665
|
1640 Bytebpos *from_out, Bytebpos *to_out,
|
428
|
1641 unsigned int flags);
|
|
1642 Charcount get_string_pos_char (Lisp_Object string, Lisp_Object pos,
|
|
1643 unsigned int flags);
|
|
1644 Bytecount get_string_pos_byte (Lisp_Object string, Lisp_Object pos,
|
|
1645 unsigned int flags);
|
|
1646 void get_string_range_char (Lisp_Object string, Lisp_Object from,
|
|
1647 Lisp_Object to, Charcount *from_out,
|
|
1648 Charcount *to_out, unsigned int flags);
|
|
1649 void get_string_range_byte (Lisp_Object string, Lisp_Object from,
|
|
1650 Lisp_Object to, Bytecount *from_out,
|
|
1651 Bytecount *to_out, unsigned int flags);
|
665
|
1652 Charbpos get_buffer_or_string_pos_char (Lisp_Object object, Lisp_Object pos,
|
428
|
1653 unsigned int flags);
|
665
|
1654 Bytebpos get_buffer_or_string_pos_byte (Lisp_Object object, Lisp_Object pos,
|
428
|
1655 unsigned int flags);
|
|
1656 void get_buffer_or_string_range_char (Lisp_Object object, Lisp_Object from,
|
665
|
1657 Lisp_Object to, Charbpos *from_out,
|
|
1658 Charbpos *to_out, unsigned int flags);
|
428
|
1659 void get_buffer_or_string_range_byte (Lisp_Object object, Lisp_Object from,
|
665
|
1660 Lisp_Object to, Bytebpos *from_out,
|
|
1661 Bytebpos *to_out, unsigned int flags);
|
|
1662 Charbpos buffer_or_string_accessible_begin_char (Lisp_Object object);
|
|
1663 Charbpos buffer_or_string_accessible_end_char (Lisp_Object object);
|
|
1664 Bytebpos buffer_or_string_accessible_begin_byte (Lisp_Object object);
|
|
1665 Bytebpos buffer_or_string_accessible_end_byte (Lisp_Object object);
|
|
1666 Charbpos buffer_or_string_absolute_begin_char (Lisp_Object object);
|
|
1667 Charbpos buffer_or_string_absolute_end_char (Lisp_Object object);
|
|
1668 Bytebpos buffer_or_string_absolute_begin_byte (Lisp_Object object);
|
|
1669 Bytebpos buffer_or_string_absolute_end_byte (Lisp_Object object);
|
428
|
1670 void record_buffer (Lisp_Object buf);
|
|
1671 Lisp_Object get_buffer (Lisp_Object name,
|
|
1672 int error_if_deleted_or_does_not_exist);
|
|
1673 int map_over_sharing_buffers (struct buffer *buf,
|
|
1674 int (*mapfun) (struct buffer *buf,
|
|
1675 void *closure),
|
|
1676 void *closure);
|
|
1677
|
|
1678
|
|
1679 /************************************************************************/
|
|
1680 /* Case conversion */
|
|
1681 /************************************************************************/
|
|
1682
|
|
1683 /* A "trt" table is a mapping from characters to other characters,
|
|
1684 typically used to convert between uppercase and lowercase. For
|
|
1685 compatibility reasons, trt tables are currently in the form of
|
|
1686 a Lisp string of 256 characters, specifying the conversion for each
|
|
1687 of the first 256 Emacs characters (i.e. the 256 Latin-1 characters).
|
|
1688 This should be generalized at some point to support conversions for
|
|
1689 all of the allowable Mule characters.
|
|
1690 */
|
|
1691
|
|
1692 /* The _1 macros are named as such because they assume that you have
|
|
1693 already guaranteed that the character values are all in the range
|
|
1694 0 - 255. Bad lossage will happen otherwise. */
|
|
1695
|
446
|
1696 #define MAKE_TRT_TABLE() Fmake_char_table (Qgeneric)
|
|
1697 INLINE_HEADER Emchar TRT_TABLE_CHAR_1 (Lisp_Object table, Emchar c);
|
|
1698 INLINE_HEADER Emchar
|
|
1699 TRT_TABLE_CHAR_1 (Lisp_Object table, Emchar ch)
|
|
1700 {
|
|
1701 Lisp_Object TRT_char;
|
|
1702 TRT_char = get_char_table (ch, XCHAR_TABLE (table));
|
|
1703 if (NILP (TRT_char))
|
|
1704 return ch;
|
|
1705 else
|
|
1706 return XCHAR (TRT_char);
|
|
1707 }
|
|
1708 #define SET_TRT_TABLE_CHAR_1(table, ch1, ch2) \
|
|
1709 Fput_char_table (make_char (ch1), make_char (ch2), table);
|
428
|
1710
|
442
|
1711 INLINE_HEADER Emchar TRT_TABLE_OF (Lisp_Object trt, Emchar c);
|
|
1712 INLINE_HEADER Emchar
|
428
|
1713 TRT_TABLE_OF (Lisp_Object trt, Emchar c)
|
|
1714 {
|
446
|
1715 return TRT_TABLE_CHAR_1 (trt, c);
|
428
|
1716 }
|
|
1717
|
|
1718 /* Macros used below. */
|
446
|
1719 #define DOWNCASE_TABLE_OF(buf, c) \
|
|
1720 TRT_TABLE_OF (XCASE_TABLE_DOWNCASE (buf->case_table), c)
|
|
1721 #define UPCASE_TABLE_OF(buf, c) \
|
|
1722 TRT_TABLE_OF (XCASE_TABLE_UPCASE (buf->case_table), c)
|
428
|
1723
|
|
1724 /* 1 if CH is upper case. */
|
|
1725
|
442
|
1726 INLINE_HEADER int UPPERCASEP (struct buffer *buf, Emchar ch);
|
|
1727 INLINE_HEADER int
|
428
|
1728 UPPERCASEP (struct buffer *buf, Emchar ch)
|
|
1729 {
|
|
1730 return DOWNCASE_TABLE_OF (buf, ch) != ch;
|
|
1731 }
|
|
1732
|
|
1733 /* 1 if CH is lower case. */
|
|
1734
|
442
|
1735 INLINE_HEADER int LOWERCASEP (struct buffer *buf, Emchar ch);
|
|
1736 INLINE_HEADER int
|
428
|
1737 LOWERCASEP (struct buffer *buf, Emchar ch)
|
|
1738 {
|
|
1739 return (UPCASE_TABLE_OF (buf, ch) != ch &&
|
|
1740 DOWNCASE_TABLE_OF (buf, ch) == ch);
|
|
1741 }
|
|
1742
|
|
1743 /* 1 if CH is neither upper nor lower case. */
|
|
1744
|
442
|
1745 INLINE_HEADER int NOCASEP (struct buffer *buf, Emchar ch);
|
|
1746 INLINE_HEADER int
|
428
|
1747 NOCASEP (struct buffer *buf, Emchar ch)
|
|
1748 {
|
|
1749 return UPCASE_TABLE_OF (buf, ch) == ch;
|
|
1750 }
|
|
1751
|
|
1752 /* Upcase a character, or make no change if that cannot be done. */
|
|
1753
|
442
|
1754 INLINE_HEADER Emchar UPCASE (struct buffer *buf, Emchar ch);
|
|
1755 INLINE_HEADER Emchar
|
428
|
1756 UPCASE (struct buffer *buf, Emchar ch)
|
|
1757 {
|
|
1758 return (DOWNCASE_TABLE_OF (buf, ch) == ch) ? UPCASE_TABLE_OF (buf, ch) : ch;
|
|
1759 }
|
|
1760
|
|
1761 /* Upcase a character known to be not upper case. Unused. */
|
|
1762
|
|
1763 #define UPCASE1(buf, ch) UPCASE_TABLE_OF (buf, ch)
|
|
1764
|
|
1765 /* Downcase a character, or make no change if that cannot be done. */
|
|
1766
|
|
1767 #define DOWNCASE(buf, ch) DOWNCASE_TABLE_OF (buf, ch)
|
|
1768
|
444
|
1769 /************************************************************************/
|
|
1770 /* Lisp string representation convenience functions */
|
|
1771 /************************************************************************/
|
|
1772 /* Because the representation of internally formatted data is subject to change,
|
|
1773 It's bad style to do something like strcmp (XSTRING_DATA (s), "foo")
|
665
|
1774 Instead, use the portable: intbyte_strcmp (XSTRING_DATA (s), "foo")
|
|
1775 or intbyte_memcmp (XSTRING_DATA (s), "foo", 3) */
|
444
|
1776
|
|
1777 /* Like strcmp, except first arg points at internally formatted data,
|
|
1778 while the second points at a string of only ASCII chars. */
|
|
1779 INLINE_HEADER int
|
665
|
1780 intbyte_strcmp (const Intbyte *bp, const char *ascii_string);
|
444
|
1781 INLINE_HEADER int
|
665
|
1782 intbyte_strcmp (const Intbyte *bp, const char *ascii_string)
|
444
|
1783 {
|
|
1784 #ifdef MULE
|
|
1785 while (1)
|
|
1786 {
|
|
1787 int diff;
|
|
1788 type_checking_assert (BYTE_ASCII_P (*ascii_string));
|
665
|
1789 if ((diff = charptr_emchar (bp) - *(Intbyte *) ascii_string) != 0)
|
444
|
1790 return diff;
|
|
1791 if (*ascii_string == '\0')
|
|
1792 return 0;
|
|
1793 ascii_string++;
|
|
1794 INC_CHARPTR (bp);
|
|
1795 }
|
|
1796 #else
|
|
1797 return strcmp ((char *)bp, ascii_string);
|
|
1798 #endif
|
|
1799 }
|
|
1800
|
|
1801
|
|
1802 /* Like memcmp, except first arg points at internally formatted data,
|
|
1803 while the second points at a string of only ASCII chars. */
|
|
1804 INLINE_HEADER int
|
665
|
1805 intbyte_memcmp (const Intbyte *bp, const char *ascii_string, Bytecount len);
|
444
|
1806 INLINE_HEADER int
|
665
|
1807 intbyte_memcmp (const Intbyte *bp, const char *ascii_string, Bytecount len)
|
444
|
1808 {
|
|
1809 #ifdef MULE
|
|
1810 while (len--)
|
|
1811 {
|
665
|
1812 int diff = charptr_emchar (bp) - *(Intbyte *) ascii_string;
|
444
|
1813 type_checking_assert (BYTE_ASCII_P (*ascii_string));
|
|
1814 if (diff != 0)
|
|
1815 return diff;
|
|
1816 ascii_string++;
|
|
1817 INC_CHARPTR (bp);
|
|
1818 }
|
|
1819 return 0;
|
|
1820 #else
|
|
1821 return memcmp (bp, ascii_string, len);
|
|
1822 #endif
|
|
1823 }
|
|
1824
|
440
|
1825 #endif /* INCLUDED_buffer_h_ */
|