502
|
1 ;;; mule-charset.el --- Charset functions for Mule. -*- coding: iso-2022-7bit; -*-
|
428
|
2
|
788
|
3 ;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN.
|
|
4 ;; Copyright (C) 1992, 2001 Free Software Foundation, Inc.
|
|
5 ;; Licensed to the Free Software Foundation.
|
428
|
6 ;; Copyright (C) 1995 Amdahl Corporation.
|
|
7 ;; Copyright (C) 1996 Sun Microsystems.
|
777
|
8 ;; Copyright (C) 2002 Ben Wing.
|
428
|
9
|
|
10 ;; Author: Unknown
|
|
11 ;; Keywords: i18n, mule, internal
|
|
12
|
|
13 ;; This file is part of XEmacs.
|
|
14
|
|
15 ;; XEmacs is free software; you can redistribute it and/or modify it
|
|
16 ;; under the terms of the GNU General Public License as published by
|
|
17 ;; the Free Software Foundation; either version 2, or (at your option)
|
|
18 ;; any later version.
|
|
19
|
|
20 ;; XEmacs is distributed in the hope that it will be useful, but
|
|
21 ;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
22 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
23 ;; General Public License for more details.
|
|
24
|
|
25 ;; You should have received a copy of the GNU General Public License
|
|
26 ;; along with XEmacs; see the file COPYING. If not, write to the
|
|
27 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
28 ;; Boston, MA 02111-1307, USA.
|
|
29
|
|
30 ;;; Synched up with: Not synched. API at source level synched with FSF 20.3.9.
|
|
31
|
|
32 ;;; Commentary:
|
|
33
|
|
34 ;; These functions are not compatible at the bytecode level with Emacs/Mule,
|
|
35 ;; and they never will be. -sb [1999-05-26]
|
|
36
|
|
37 ;;; Code:
|
|
38
|
|
39 ;;;; Classifying text according to charsets
|
|
40
|
1309
|
41 ;; the old version was broken in a couple of ways
|
|
42 ;; this is one of several versions, I tried a hash as well as the
|
|
43 ;; `prev-charset' cache used in the old version, but this was definitely
|
|
44 ;; faster than the hash version and marginally faster than the prev-charset
|
|
45 ;; version
|
|
46 ;; #### this really needs to be moved into C
|
428
|
(defun charsets-in-region (start end &optional buffer)
  "Return a list of the charsets found between START and END.
The text is examined in BUFFER, or in the current buffer when BUFFER is
omitted or nil.  Each charset appears once in the result; the charset
discovered last comes first."
  (let ((found nil))
    (save-excursion
      (when buffer
        (set-buffer buffer))
      (save-restriction
        (narrow-to-region start end)
        (goto-char (point-min))
        (while (not (eobp))
          ;; Newly seen charsets are consed onto the front of FOUND, so
          ;; the membership test usually hits on the first element.  The
          ;; charset is deliberately computed twice rather than
          ;; let-bound, as in the original code.
          (unless (memq (char-charset (char-after (point))) found)
            (setq found (cons (char-charset (char-after (point))) found)))
          (forward-char))))
    found))
|
|
64
|
|
(defun charsets-in-string (string)
  "Return a list of the charsets of the characters in STRING.
Each charset appears once in the result; the charset discovered last
comes first."
  (let ((found nil))
    (mapc (function
           (lambda (char)
             ;; The membership test usually hits on the first element of
             ;; FOUND, so the charset is computed twice on a miss rather
             ;; than let-bound.
             (unless (memq (char-charset char) found)
               (setq found (cons (char-charset char) found)))))
          string)
    found))
|
|
75
|
771
|
;; Alternative names for the two charset-classification functions.
(defalias 'find-charset-string 'charsets-in-string)
(defalias 'find-charset-region 'charsets-in-region)
|
818
|
78
|
428
|
79
|
|
80 ;;;; Charset accessors
|
|
81
|
|
(defun charset-iso-graphic-plane (charset)
  "Return the value of the `graphic' property of CHARSET.
The property is described under `make-charset'."
  (charset-property charset (quote graphic)))
|
|
86
|
|
(defun charset-iso-final-char (charset)
  "Return the `final' property of CHARSET.
This is the final byte of the ISO 2022 escape sequence that designates
CHARSET."
  (charset-property charset (quote final)))
|
|
90
|
|
(defun charset-chars (charset)
  "Return the `chars' property of CHARSET.
This is the number of characters per dimension of CHARSET."
  (charset-property charset (quote chars)))
|
|
94
|
|
(defun charset-width (charset)
  "Return the `columns' property of CHARSET.
This is the number of display columns each character of CHARSET
occupies.  It only matters in TTY mode; under X the actual display
width can be determined automatically."
  (charset-property charset (quote columns)))
|
|
100
|
|
101 ;; #### FSFmacs returns 0
|
|
(defun charset-direction (charset)
  "Return the display direction of CHARSET as a number.
The value is 0 when the `direction' property of CHARSET is `l2r', and 1
for any other value (normally `r2l').
Only left-to-right is currently implemented."
  (cond ((eq (charset-property charset 'direction) 'l2r) 0)
        (t 1)))
|
|
108
|
3659
|
109 ;; Not in GNU Emacs/Mule
|
428
|
(defun charset-registry (charset)
  "Return the first registry of CHARSET, or nil if CHARSET has none.
This function is obsolete; use `charset-registries' instead.  Every
call issues a warning to that effect.

The value is element 0 of the `registries' property of CHARSET."
  (lwarn 'xintl 'warning
    "charset-registry is obsolete--use charset-registries instead. ")
  (let ((registries (charset-property charset 'registries)))
    ;; An empty vector is non-nil, so test the length rather than the
    ;; value itself; otherwise `elt' would signal an error for a charset
    ;; with no registries.
    (when (> (length registries) 0)
      (elt registries 0))))
|
|
118
|
|
(defun charset-registries (charset)
  "Return the value of the `registries' property of CHARSET."
  (charset-property charset (quote registries)))
|
|
122
|
|
(defun set-charset-registry (charset registry)
  "Obsolete; use `set-charset-registries' instead.
Put the string REGISTRY at the front of the registries of CHARSET.
A warning is issued if REGISTRY contains characters that
`regexp-quote' would escape; REGISTRY is used as a literal string
either way."
  (check-argument-type 'stringp registry)
  (check-argument-type 'charsetp (find-charset charset))
  (if (not (equal registry (regexp-quote registry)))
      (lwarn 'xintl 'warning
        "Regexps no longer allowed for charset-registry. Treating %s%s"
        registry " as a string."))
  ;; Build a new vector: REGISTRY first, then the existing registries.
  (let ((existing (append (charset-registries charset) nil)))
    (set-charset-registries charset
                            (apply 'vector registry existing))))
|
428
|
134
|
|
(defun charset-ccl-program (charset)
  "Return the value of the `ccl-program' property of CHARSET.
The property is described under `make-charset'."
  (charset-property charset (quote ccl-program)))
|
|
139
|
|
(defun charset-bytes (charset)
  "Return 1, whatever CHARSET is.
This function is useless in XEmacs; CHARSET is ignored."
  1)
|
|
143
|
|
;; Obsolete names for charset accessors.  Each alias carried the marker
;; 19990409 in the original source (presumably the date it was made
;; obsolete).
(define-obsolete-function-alias 'charset-columns
  'charset-width)                       ; 19990409
(define-obsolete-function-alias 'charset-final
  'charset-iso-final-char)              ; 19990409
(define-obsolete-function-alias 'charset-graphic
  'charset-iso-graphic-plane)           ; 19990409
(define-obsolete-function-alias 'charset-doc-string
  'charset-description)                 ; 19990409
|
|
148
|
|
149 ;;;; Define setf methods for all settable Charset properties
|
|
150
|
|
;; Allow `setf' on these accessors by naming the setter function that
;; stores the new value.
(defsetf charset-registry
  set-charset-registry)
(defsetf charset-ccl-program
  set-charset-ccl-program)
|
|
153
|
|
154 ;;; FSF compatibility functions
|
|
(defun charset-after (&optional pos)
  "Return charset of a character in current buffer at position POS.
If POS is nil, it defaults to the current point.
If POS is out of range, or no character follows POS (as at the end of
the accessible portion of the buffer), the value is nil."
  (when (null pos)
    (setq pos (point)))
  (check-argument-type 'integerp pos)
  (unless (or (< pos (point-min))
              (> pos (point-max)))
    ;; POS may still equal (point-max), where `char-after' returns nil.
    ;; Never hand that nil to `char-charset'.
    (let ((ch (char-after pos)))
      (and ch (char-charset ch)))))
|
|
165
|
|
166 ;; Yuck!
|
771
|
167 ;; We're not going to support these.
|
|
168 ;(defun charset-info (charset) [incredibly broken function with random vectors]
|
|
169 ;(defun define-charset (...) [incredibly broken function with random vectors]
|
428
|
170
|
|
171 ;;; Charset property
|
|
172
|
|
;; Charset-flavoured names for the generic property-list functions.
(defalias 'get-charset-property
  'get)
(defalias 'put-charset-property
  'put)
(defalias 'charset-plist
  'object-plist)
(defalias 'set-charset-plist
  'setplist)
|
|
177
|
771
|
178
|
788
|
179 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
180 ; translation tables ;
|
|
181 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
182
|
|
;; A translation table object.  The constructor is given an internal
;; name so that `make-translation-table' can be an ordinary function.
(defstruct (translation-table
            (:constructor internal-make-translation-table))
  ;; `make-translation-table' stores a generic char table here.
  forward
  ;; Not set anywhere in the code visible in this part of the file.
  reverse)
|
|
186
|
|
(defun make-translation-table (&rest args)
  "Make a translation table from arguments.
A translation table is intended for character translation in CCL
programs.  The value returned is a `translation-table' object whose
`forward' slot holds the char table built from ARGS.

Each argument is a list of elements of the form (FROM . TO), where FROM
is a character to be translated to TO.

FROM can be a generic character (see `make-char').  In this case, TO is
a generic character containing the same number of characters, or an
ordinary character.  If FROM and TO are both generic characters, all
characters belonging to FROM are translated to characters belonging to TO
without changing their position code(s).

The arguments and forms in each argument are processed in the given
order, and if a previous form already translates TO to some other
character, say TO-ALT, FROM is also translated to TO-ALT."
  (let* ((table (internal-make-translation-table
                 :forward (make-char-table 'generic)))
         ;; All char-table operations below work on the char table held
         ;; in the struct, not on the struct itself.
         (forward (translation-table-forward table))
         ;; Alist of (TO FROM1 FROM2 ...): the characters so far
         ;; translated to each TO.
         revlist)
    (while args
      (let ((elts (car args)))
        (while elts
          (let* ((from (car (car elts)))
                 (from-i 0)             ; degree of freedom of FROM
                 (from-rev (nreverse (split-char from)))
                 (to (cdr (car elts)))
                 (to-i 0)               ; degree of freedom of TO
                 (to-rev (nreverse (split-char to))))
            ;; Check numbers of heading 0s in FROM-REV and TO-REV.
            (while (eq (car from-rev) 0)
              (setq from-i (1+ from-i) from-rev (cdr from-rev)))
            (while (eq (car to-rev) 0)
              (setq to-i (1+ to-i) to-rev (cdr to-rev)))
            (if (and (/= from-i to-i) (/= to-i 0))
                (error "Invalid character pair (%d . %d)" from to))
            ;; If we have already translated TO to TO-ALT, FROM should
            ;; also be translated to TO-ALT.  But, this is only if TO
            ;; is a generic character or TO-ALT is not a generic
            ;; character.
            (let ((to-alt (get-char-table to forward)))
              (if (and to-alt
                       (or (> to-i 0) (not (find-charset to-alt))))
                  (setq to to-alt)))
            (if (> from-i 0)
                (set-char-table-default forward from to)
              (put-char-table from to forward))
            ;; If we have already translated some chars to FROM, they
            ;; should also be translated to TO.
            (let ((l (assq from revlist)))
              (if l
                  (progn
                    ;; Re-key the entry: its characters now map to TO.
                    (setcar l to)
                    (setq l (cdr l))
                    (while l
                      ;; Redirect each earlier source character, not
                      ;; FROM itself (which was stored just above).
                      (put-char-table (car l) to forward)
                      (setq l (cdr l))))))
            ;; Now update REVLIST.
            (let ((l (assq to revlist)))
              (if l
                  (setcdr l (cons from (cdr l)))
                (setq revlist (cons (list to from) revlist)))))
          (setq elts (cdr elts))))
      (setq args (cdr args)))
    ;; Return TABLE just created.
    table))
|
|
253
|
|
254 ;; Do we really need this?
|
|
255 ; (defun make-translation-table-from-vector (vec)
|
|
256 ; "Make translation table from decoding vector VEC.
|
|
257 ; VEC is an array of 256 elements to map unibyte codes to multibyte characters.
|
|
258 ; See also the variable `nonascii-translation-table'."
|
|
259 ; (let ((table (make-char-table 'translation-table))
|
|
260 ; (rev-table (make-char-table 'translation-table))
|
|
261 ; (i 0)
|
|
262 ; ch)
|
|
263 ; (while (< i 256)
|
|
264 ; (setq ch (aref vec i))
|
|
265 ; (aset table i ch)
|
|
266 ; (if (>= ch 256)
|
|
267 ; (aset rev-table ch i))
|
|
268 ; (setq i (1+ i)))
|
|
269 ; (set-char-table-extra-slot table 0 rev-table)
|
|
270 ; table))
|
|
271
|
|
(defvar named-translation-table-hash-table (make-hash-table)
  "Hash table mapping symbols to the translation tables they name.
Entries are added by `define-translation-table' and looked up by
`find-translation-table'.")
|
|
273
|
|
(defun define-translation-table (symbol &rest args)
  "Define SYMBOL as the name of the translation table made from ARGS.
This records the table so that it can be used for translations in a
CCL program.

If the first element of ARGS is a translation table, SYMBOL simply
names that table.  (Note that this function does not bind SYMBOL.)

Otherwise ARGS are passed to `make-translation-table' (which see) and
SYMBOL names the table it returns.

Look up a named translation table using `find-translation-table' or
`get-translation-table'."
  (puthash symbol
           (if (translation-table-p (car args))
               (car args)
             (apply 'make-translation-table args))
           named-translation-table-hash-table))
|
|
291
|
|
(defun find-translation-table (table-or-name)
  "Return the translation table designated by TABLE-OR-NAME.
A translation table object is returned unchanged.  Otherwise
TABLE-OR-NAME must be a symbol, and the value is the translation table
registered under that name, or nil if there is none."
  (cond ((translation-table-p table-or-name)
         table-or-name)
        (t
         (check-argument-type 'symbolp table-or-name)
         (gethash table-or-name named-translation-table-hash-table))))
|
|
302
|
|
(defun get-translation-table (table-or-name)
  "Return the translation table designated by TABLE-OR-NAME.
This is like `find-translation-table', except that an
`invalid-argument' error is signalled when no such translation table
exists, instead of nil being returned."
  (let ((table (find-translation-table table-or-name)))
    (if table
        table
      (error 'invalid-argument "No such translation table" table-or-name))))
|
|
309
|
|
310
|
442
|
311 ;; Setup auto-fill-chars for charsets that should invoke auto-filling.
|
777
|
312 ;; SPACE and NEWLINE are already set.
|
442
|
;; Mark every character of each listed charset in `auto-fill-chars'.
(mapc (function
       (lambda (charset)
         (put-char-table charset t auto-fill-chars)))
      '(katakana-jisx0201
        japanese-jisx0208 japanese-jisx0212
        chinese-gb2312 chinese-big5-1 chinese-big5-2))
|
|
319
|
778
|
320
|
|
321 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
322 ; charsets ;
|
|
323 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
|
|
324
|
|
325 ;; Synched up with: FSF 21.1.
|
|
326
|
|
327 ;; All FSF charset definitions are in mule-conf.el. I copied the relevant
|
|
328 ;; part of that file below, then converted all charset definitions using
|
|
329 ;; the macro below, then globally replaced 'direction 0' with 'direction
|
|
330 ;; l2r' and 'direction 1' with 'direction r2l', then commented everything
|
|
331 ;; out. Copy the definitions as necessary to individual files.
|
|
332
|
|
333 ;; Kbd macro to convert from FSF-style define-charset to our make-charset.
|
|
334
|
|
335 ; (setq last-kbd-macro (read-kbd-macro
|
|
336 ; "<right> M-d make <M-right> M-d <home> <down> TAB '[dimension DEL SPC <M-right> RET TAB chars SPC <M-right> RET TAB columns SPC <M-right> RET TAB direction SPC <M-right> RET TAB final SPC <M-right> RET TAB graphic SPC <M-right> RET TAB short- name SPC <M-right> RET TAB long- name SPC <M-right> RET TAB <S-M-right> <f2> DEL TAB <end> ] <M-left> <end> SPC <f4> 3*<M-left> <left> <M-right> RET <down>"))
|
|
337
|
|
338 ;; Kbd macro to take one registry entry from the list of registry entries,
|
|
339 ;; find the appropriate make-charset call, and add the appropriate registry
|
|
340 ;; property.
|
|
341
|
|
342 ; (setq last-kbd-macro (read-kbd-macro
|
|
343 ; "3*<right> <S-M-right> C-x x 1 <right> <S-M-right> C-x x 2 <home> C-x r m foo RET <M-down> M-x sear TAB for TAB RET C-x g 1 RET C-s dimen RET <end> RET TAB 3*<backspace> registry SPC C-x g 2 C-x r b RET <down>"))
|
|
344
|
|
345 ;; List from FSF international/fontset.el of registries for charsets.
|
|
346
|
|
347 ;; latin-iso8859-1 "ISO8859-1"
|
|
348 ;; latin-iso8859-2 "ISO8859-2"
|
|
349 ;; latin-iso8859-3 "ISO8859-3"
|
|
350 ;; latin-iso8859-4 "ISO8859-4"
|
|
351 ;; thai-tis620 "TIS620"
|
|
352 ;; greek-iso8859-7 "ISO8859-7"
|
|
353 ;; arabic-iso8859-6 "ISO8859-6"
|
|
354 ;; hebrew-iso8859-8 "ISO8859-8"
|
|
355 ;; katakana-jisx0201 "JISX0201"
|
|
356 ;; latin-jisx0201 "JISX0201"
|
|
357 ;; cyrillic-iso8859-5 "ISO8859-5"
|
|
358 ;; latin-iso8859-9 "ISO8859-9"
|
|
359 ;; japanese-jisx0208-1978 "JISX0208.1978"
|
|
360 ;; chinese-gb2312 "GB2312.1980"
|
|
361 ;; japanese-jisx0208 "JISX0208.1990"
|
|
362 ;; korean-ksc5601 "KSC5601.1989"
|
|
363 ;; japanese-jisx0212 "JISX0212"
|
|
364 ;; chinese-cns11643-1 "CNS11643.1992-1"
|
|
365 ;; chinese-cns11643-2 "CNS11643.1992-2"
|
|
366 ;; chinese-cns11643-3 "CNS11643.1992-3"
|
|
367 ;; chinese-cns11643-4 "CNS11643.1992-4"
|
|
368 ;; chinese-cns11643-5 "CNS11643.1992-5"
|
|
369 ;; chinese-cns11643-6 "CNS11643.1992-6"
|
|
370 ;; chinese-cns11643-7 "CNS11643.1992-7"
|
|
371 ;; chinese-big5-1 "Big5"
|
|
372 ;; chinese-big5-2 "Big5"
|
|
373 ;; chinese-sisheng "sisheng_cwnn"
|
|
374 ;; vietnamese-viscii-lower "VISCII1.1"
|
|
375 ;; vietnamese-viscii-upper "VISCII1.1"
|
|
376 ;; arabic-digit "MuleArabic-0"
|
|
377 ;; arabic-1-column "MuleArabic-1"
|
|
378 ;; arabic-2-column "MuleArabic-2"
|
|
379 ;; ipa "MuleIPA"
|
|
380 ;; ethiopic "Ethiopic-Unicode"
|
|
381 ;; ascii-right-to-left "ISO8859-1"
|
|
382 ;; indian-is13194 "IS13194-Devanagari"
|
|
383 ;; indian-2-column "MuleIndian-2"
|
|
384 ;; indian-1-column "MuleIndian-1"
|
|
385 ;; lao "MuleLao-1"
|
|
386 ;; tibetan "MuleTibetan-2"
|
|
387 ;; tibetan-1-column "MuleTibetan-1"
|
|
388 ;; latin-iso8859-14 "ISO8859-14"
|
|
389 ;; latin-iso8859-15 "ISO8859-15"
|
|
390 ;; mule-unicode-0100-24ff "ISO10646-1"
|
|
391 ;; mule-unicode-2500-33ff "ISO10646-1"
|
|
392 ;; mule-unicode-e000-ffff "ISO10646-1"
|
|
393 ;; japanese-jisx0213-1 "JISX0213.2000-1"
|
|
394 ;; japanese-jisx0213-2 "JISX0213.2000-2"
|
|
395
|
|
396 ;;; Begin stuff from international/mule-conf.el.
|
|
397
|
|
398 ; ;;; Definitions of character sets.
|
|
399
|
|
400 ; ;; Basic (official) character sets. These character sets are treated
|
|
401 ; ;; efficiently with respect to buffer memory.
|
|
402
|
|
403 ; ;; Syntax:
|
|
404 ; ;; (define-charset CHARSET-ID CHARSET
|
|
405 ; ;; [ DIMENSION CHARS WIDTH DIRECTION ISO-FINAL-CHAR ISO-GRAPHIC-PLANE
|
|
406 ; ;; SHORT-NAME LONG-NAME DESCRIPTION ])
|
|
407 ; ;; ASCII charset is defined in src/charset.c as below.
|
|
408 ; ;; (define-charset 0 ascii
|
|
409 ; ;; [1 94 1 0 ?B 0 "ASCII" "ASCII" "ASCII (ISO646 IRV)"])
|
|
410
|
|
411 ; ;; 1-byte charsets. Valid range of CHARSET-ID is 128..143.
|
|
412
|
|
413 ; ;; CHARSET-ID 128 is not used.
|
|
414
|
|
415 ; ; An extra level of commenting means an official (done in C) charset.
|
|
416 ; ; (make-charset 'latin-iso8859-1
|
|
417 ; ; "Right-Hand Part of Latin Alphabet 1 (ISO/IEC 8859-1): ISO-IR-100"
|
|
418 ; ; '(dimension
|
|
419 ; ; 1
|
|
420 ; ; registry "ISO8859-1"
|
|
421 ; ; chars 96
|
|
422 ; ; columns 1
|
|
423 ; ; direction l2r
|
|
424 ; ; final ?A
|
|
425 ; ; graphic 1
|
|
426 ; ; short-name "RHP of Latin-1"
|
|
427 ; ; long-name "RHP of Latin-1 (ISO 8859-1): ISO-IR-100"
|
|
428 ; ; ))
|
|
429
|
|
430 ; ; (make-charset 'latin-iso8859-2
|
|
431 ; ; "Right-Hand Part of Latin Alphabet 2 (ISO/IEC 8859-2): ISO-IR-101"
|
|
432 ; ; '(dimension
|
|
433 ; ; 1
|
|
434 ; ; registry "ISO8859-2"
|
|
435 ; ; chars 96
|
|
436 ; ; columns 1
|
|
437 ; ; direction l2r
|
|
438 ; ; final ?B
|
|
439 ; ; graphic 1
|
|
440 ; ; short-name "RHP of Latin-2"
|
|
441 ; ; long-name "RHP of Latin-2 (ISO 8859-2): ISO-IR-101"
|
|
442 ; ; ))
|
|
443
|
|
444 ; ; (make-charset 'latin-iso8859-3
|
|
445 ; ; "Right-Hand Part of Latin Alphabet 3 (ISO/IEC 8859-3): ISO-IR-109"
|
|
446 ; ; '(dimension
|
|
447 ; ; 1
|
|
448 ; ; registry "ISO8859-3"
|
|
449 ; ; chars 96
|
|
450 ; ; columns 1
|
|
451 ; ; direction l2r
|
|
452 ; ; final ?C
|
|
453 ; ; graphic 1
|
|
454 ; ; short-name "RHP of Latin-3"
|
|
455 ; ; long-name "RHP of Latin-3 (ISO 8859-3): ISO-IR-109"
|
|
456 ; ; ))
|
|
457
|
|
458 ; ; (make-charset 'latin-iso8859-4
|
|
459 ; ; "Right-Hand Part of Latin Alphabet 4 (ISO/IEC 8859-4): ISO-IR-110"
|
|
460 ; ; '(dimension
|
|
461 ; ; 1
|
|
462 ; ; registry "ISO8859-4"
|
|
463 ; ; chars 96
|
|
464 ; ; columns 1
|
|
465 ; ; direction l2r
|
|
466 ; ; final ?D
|
|
467 ; ; graphic 1
|
|
468 ; ; short-name "RHP of Latin-4"
|
|
469 ; ; long-name "RHP of Latin-4 (ISO 8859-4): ISO-IR-110"
|
|
470 ; ; ))
|
|
471
|
|
472 ; ; (make-charset 'thai-tis620
|
|
473 ; ; "Right-Hand Part of TIS620.2533 (Thai): ISO-IR-166"
|
|
474 ; ; '(dimension
|
|
475 ; ; 1
|
|
476 ; ; registry "TIS620"
|
|
477 ; ; chars 96
|
|
478 ; ; columns 1
|
|
479 ; ; direction l2r
|
|
480 ; ; final ?T
|
|
481 ; ; graphic 1
|
|
482 ; ; short-name "RHP of TIS620"
|
|
483 ; ; long-name "RHP of Thai (TIS620): ISO-IR-166"
|
|
484 ; ; ))
|
|
485
|
|
486 ; ; (make-charset 'greek-iso8859-7
|
|
487 ; ; "Right-Hand Part of Latin/Greek Alphabet (ISO/IEC 8859-7): ISO-IR-126"
|
|
488 ; ; '(dimension
|
|
489 ; ; 1
|
|
490 ; ; registry "ISO8859-7"
|
|
491 ; ; chars 96
|
|
492 ; ; columns 1
|
|
493 ; ; direction l2r
|
|
494 ; ; final ?F
|
|
495 ; ; graphic 1
|
|
496 ; ; short-name "RHP of ISO8859/7"
|
|
497 ; ; long-name "RHP of Greek (ISO 8859-7): ISO-IR-126"
|
|
498 ; ; ))
|
|
499
|
|
500 ; ; (make-charset 'arabic-iso8859-6
|
|
501 ; ; "Right-Hand Part of Latin/Arabic Alphabet (ISO/IEC 8859-6): ISO-IR-127"
|
|
502 ; ; '(dimension
|
|
503 ; ; 1
|
|
504 ; ; registry "ISO8859-6"
|
|
505 ; ; chars 96
|
|
506 ; ; columns 1
|
|
507 ; ; direction r2l
|
|
508 ; ; final ?G
|
|
509 ; ; graphic 1
|
|
510 ; ; short-name "RHP of ISO8859/6"
|
|
511 ; ; long-name "RHP of Arabic (ISO 8859-6): ISO-IR-127"
|
|
512 ; ; ))
|
|
513
|
|
514 ; ; (make-charset 'hebrew-iso8859-8
|
|
515 ; ; "Right-Hand Part of Latin/Hebrew Alphabet (ISO/IEC 8859-8): ISO-IR-138"
|
|
516 ; ; '(dimension
|
|
517 ; ; 1
|
|
518 ; ; registry "ISO8859-8"
|
|
519 ; ; chars 96
|
|
520 ; ; columns 1
|
|
521 ; ; direction r2l
|
|
522 ; ; final ?H
|
|
523 ; ; graphic 1
|
|
524 ; ; short-name "RHP of ISO8859/8"
|
|
525 ; ; long-name "RHP of Hebrew (ISO 8859-8): ISO-IR-138"
|
|
526 ; ; ))
|
|
527
|
|
528 ; ; (make-charset 'katakana-jisx0201
|
|
529 ; ; "Katakana Part of JISX0201.1976"
|
|
530 ; ; '(dimension
|
|
531 ; ; 1
|
|
532 ; ; registry "JISX0201"
|
|
533 ; ; chars 94
|
|
534 ; ; columns 1
|
|
535 ; ; direction l2r
|
|
536 ; ; final ?I
|
|
537 ; ; graphic 1
|
|
538 ; ; short-name "JISX0201 Katakana"
|
|
539 ; ; long-name "Japanese Katakana (JISX0201.1976)"
|
|
540 ; ; ))
|
|
541
|
|
542 ; ; (make-charset 'latin-jisx0201
|
|
543 ; ; "Roman Part of JISX0201.1976"
|
|
544 ; ; '(dimension
|
|
545 ; ; 1
|
|
546 ; ; registry "JISX0201"
|
|
547 ; ; chars 94
|
|
548 ; ; columns 1
|
|
549 ; ; direction l2r
|
|
550 ; ; final ?J
|
|
551 ; ; graphic 0
|
|
552 ; ; short-name "JISX0201 Roman"
|
|
553 ; ; long-name "Japanese Roman (JISX0201.1976)"
|
|
554 ; ; ))
|
|
555
|
|
556
|
|
557 ; ;; CHARSET-ID 139 is not used.
|
|
558
|
|
559 ; ; (make-charset 'cyrillic-iso8859-5
|
|
560 ; ; "Right-Hand Part of Latin/Cyrillic Alphabet (ISO/IEC 8859-5): ISO-IR-144"
|
|
561 ; ; '(dimension
|
|
562 ; ; 1
|
|
563 ; ; registry "ISO8859-5"
|
|
564 ; ; chars 96
|
|
565 ; ; columns 1
|
|
566 ; ; direction l2r
|
|
567 ; ; final ?L
|
|
568 ; ; graphic 1
|
|
569 ; ; short-name "RHP of ISO8859/5"
|
|
570 ; ; long-name "RHP of Cyrillic (ISO 8859-5): ISO-IR-144"
|
|
571 ; ; ))
|
|
572
|
|
573 ; ; (make-charset 'latin-iso8859-9
|
|
574 ; ; "Right-Hand Part of Latin Alphabet 5 (ISO/IEC 8859-9): ISO-IR-148"
|
|
575 ; ; '(dimension
|
|
576 ; ; 1
|
|
577 ; ; registry "ISO8859-9"
|
|
578 ; ; chars 96
|
|
579 ; ; columns 1
|
|
580 ; ; direction l2r
|
|
581 ; ; final ?M
|
|
582 ; ; graphic 1
|
|
583 ; ; short-name "RHP of Latin-5"
|
|
584 ; ; long-name "RHP of Latin-5 (ISO 8859-9): ISO-IR-148"
|
|
585 ; ; ))
|
|
586
|
|
587 ; ; (make-charset 'latin-iso8859-15
|
|
588 ; ; "Right-Hand Part of Latin Alphabet 9 (ISO/IEC 8859-15): ISO-IR-203"
|
|
589 ; ; '(dimension
|
|
590 ; ; 1
|
|
591 ; ; registry "ISO8859-15"
|
|
592 ; ; chars 96
|
|
593 ; ; columns 1
|
|
594 ; ; direction l2r
|
|
595 ; ; final ?b
|
|
596 ; ; graphic 1
|
|
597 ; ; short-name "RHP of Latin-9"
|
|
598 ; ; long-name "RHP of Latin-9 (ISO 8859-15): ISO-IR-203"
|
|
599 ; ; ))
|
|
600
|
|
601 ; (make-charset 'latin-iso8859-14
|
|
602 ; "Right-Hand Part of Latin Alphabet 8 (ISO/IEC 8859-14)"
|
|
603 ; '(dimension
|
|
604 ; 1
|
|
605 ; registry "ISO8859-14"
|
|
606 ; chars 96
|
|
607 ; columns 1
|
|
608 ; direction l2r
|
|
609 ; final ?_
|
|
610 ; graphic 1
|
|
611 ; short-name "RHP of Latin-8"
|
|
612 ; long-name "RHP of Latin-8 (ISO 8859-14)"
|
|
613 ; ))
|
|
614
|
|
615
|
|
616 ; ;; 2-byte charsets. Valid range of CHARSET-ID is 144..153.
|
|
617
|
|
618 ; ; (make-charset 'japanese-jisx0208-1978
|
|
619 ; ; "JISX0208.1978 Japanese Kanji (so called \"old JIS\"): ISO-IR-42"
|
|
620 ; ; '(dimension
|
|
621 ; ; 2
|
|
622 ; ; registry "JISX0208.1990"
|
|
623 ; ; registry "JISX0208.1978"
|
|
624 ; ; chars 94
|
|
625 ; ; columns 2
|
|
626 ; ; direction l2r
|
|
627 ; ; final ?@
|
|
628 ; ; graphic 0
|
|
629 ; ; short-name "JISX0208.1978"
|
|
630 ; ; long-name "JISX0208.1978 (Japanese): ISO-IR-42"
|
|
631 ; ; ))
|
|
632
|
|
633 ; ; (make-charset 'chinese-gb2312
|
|
634 ; ; "GB2312 Chinese simplified: ISO-IR-58"
|
|
635 ; ; '(dimension
|
|
636 ; ; 2
|
|
637 ; ; registry "GB2312.1980"
|
|
638 ; ; chars 94
|
|
639 ; ; columns 2
|
|
640 ; ; direction l2r
|
|
641 ; ; final ?A
|
|
642 ; ; graphic 0
|
|
643 ; ; short-name "GB2312"
|
|
644 ; ; long-name "GB2312: ISO-IR-58"
|
|
645 ; ; ))
|
|
646
|
|
647 ; ; (make-charset 'japanese-jisx0208
|
|
648 ; ; "JISX0208.1983/1990 Japanese Kanji: ISO-IR-87"
|
|
649 ; ; '(dimension
|
|
650 ; ; 2
|
|
651 ; ; chars 94
|
|
652 ; ; columns 2
|
|
653 ; ; direction l2r
|
|
654 ; ; final ?B
|
|
655 ; ; graphic 0
|
|
656 ; ; short-name "JISX0208"
|
|
657 ; ; long-name "JISX0208.1983/1990 (Japanese): ISO-IR-87"
|
|
658 ; ; ))
|
|
659
|
|
660 ; ; (make-charset 'korean-ksc5601
|
|
661 ; ; "KSC5601 Korean Hangul and Hanja: ISO-IR-149"
|
|
662 ; ; '(dimension
|
|
663 ; ; 2
|
|
664 ; ; registry "KSC5601.1989"
|
|
665 ; ; chars 94
|
|
666 ; ; columns 2
|
|
667 ; ; direction l2r
|
|
668 ; ; final ?C
|
|
669 ; ; graphic 0
|
|
670 ; ; short-name "KSC5601"
|
|
671 ; ; long-name "KSC5601 (Korean): ISO-IR-149"
|
|
672 ; ; ))
|
|
673
|
|
674 ; ; (make-charset 'japanese-jisx0212
|
|
675 ; ; "JISX0212 Japanese supplement: ISO-IR-159"
|
|
676 ; ; '(dimension
|
|
677 ; ; 2
|
|
678 ; ; registry "JISX0212"
|
|
679 ; ; chars 94
|
|
680 ; ; columns 2
|
|
681 ; ; direction l2r
|
|
682 ; ; final ?D
|
|
683 ; ; graphic 0
|
|
684 ; ; short-name "JISX0212"
|
|
685 ; ; long-name "JISX0212 (Japanese): ISO-IR-159"
|
|
686 ; ; ))
|
|
687
|
|
688 ; ; (make-charset 'chinese-cns11643-1
|
|
689 ; ; "CNS11643 Plane 1 Chinese traditional: ISO-IR-171"
|
|
690 ; ; '(dimension
|
|
691 ; ; 2
|
|
692 ; ; registry "CNS11643.1992-1"
|
|
693 ; ; chars 94
|
|
694 ; ; columns 2
|
|
695 ; ; direction l2r
|
|
696 ; ; final ?G
|
|
697 ; ; graphic 0
|
|
698 ; ; short-name "CNS11643-1"
|
|
699 ; ; long-name "CNS11643-1 (Chinese traditional): ISO-IR-171"
|
|
700 ; ; ))
|
|
701
|
|
702 ; ; (make-charset 'chinese-cns11643-2
|
|
703 ; ; "CNS11643 Plane 2 Chinese traditional: ISO-IR-172"
|
|
704 ; ; '(dimension
|
|
705 ; ; 2
|
|
706 ; ; registry "CNS11643.1992-2"
|
|
707 ; ; chars 94
|
|
708 ; ; columns 2
|
|
709 ; ; direction l2r
|
|
710 ; ; final ?H
|
|
711 ; ; graphic 0
|
|
712 ; ; short-name "CNS11643-2"
|
|
713 ; ; long-name "CNS11643-2 (Chinese traditional): ISO-IR-172"
|
|
714 ; ; ))
|
|
715
|
|
716 ; (make-charset 'japanese-jisx0213-1 "JISX0213 Plane 1 (Japanese)"
|
|
717 ; '(dimension
|
|
718 ; 2
|
|
719 ; registry "JISX0213.2000-1"
|
|
720 ; chars 94
|
|
721 ; columns 2
|
|
722 ; direction l2r
|
|
723 ; final ?O
|
|
724 ; graphic 0
|
|
725 ; short-name "JISX0213-1"
|
|
726 ; long-name "JISX0213-1"
|
|
727 ; ))
|
|
728
|
|
729 ; ; (make-charset 'chinese-big5-1
|
|
730 ; ; "Frequently used part (A141-C67F) of Big5 (Chinese traditional)"
|
|
731 ; ; '(dimension
|
|
732 ; ; 2
|
|
733 ; ; registry "Big5"
|
|
734 ; ; chars 94
|
|
735 ; ; columns 2
|
|
736 ; ; direction l2r
|
|
737 ; ; final ?0
|
|
738 ; ; graphic 0
|
|
739 ; ; short-name "Big5 (Level-1)"
|
|
740 ; ; long-name "Big5 (Level-1) A141-C67F"
|
|
741 ; ; ))
|
|
742
|
|
743 ; ; (make-charset 'chinese-big5-2
|
|
744 ; ; "Less frequently used part (C940-FEFE) of Big5 (Chinese traditional)"
|
|
745 ; ; '(dimension
|
|
746 ; ; 2
|
|
747 ; ; registry "Big5"
|
|
748 ; ; chars 94
|
|
749 ; ; columns 2
|
|
750 ; ; direction l2r
|
|
751 ; ; final ?1
|
|
752 ; ; graphic 0
|
|
753 ; ; short-name "Big5 (Level-2)"
|
|
754 ; ; long-name "Big5 (Level-2) C940-FEFE"
|
|
755 ; ; ))
|
|
756
|
|
757
|
|
758 ; ;; Additional (private) character sets. These character sets are
|
|
759 ; ;; treated less space-efficiently in the buffer.
|
|
760
|
|
761 ; ;; Syntax:
|
|
762 ; ;; (define-charset CHARSET-ID CHARSET
|
|
763 ; ;; [ DIMENSION CHARS WIDTH DIRECTION ISO-FINAL-CHAR ISO-GRAPHIC-PLANE
|
|
764 ; ;; SHORT-NAME LONG-NAME DESCRIPTION ])
|
|
765
|
|
766 ; ;; ISO-2022 allows a use of character sets not registered in ISO with
|
|
767 ; ;; final characters `0' (0x30) through `?' (0x3F). Among them, Emacs
|
|
768 ; ;; reserves `0' through `9' to support several private character sets.
|
|
769 ; ;; The remaining final characters `:' through `?' are for users.
|
|
770
|
|
771 ; ;; 1-byte 1-column charsets. Valid range of CHARSET-ID is 160..223.
|
|
772
|
|
773 ; (make-charset 'chinese-sisheng
|
|
774 ; "SiSheng characters for PinYin/ZhuYin"
|
|
775 ; '(dimension
|
|
776 ; 1
|
|
777 ; registry "sisheng_cwnn"
|
|
778 ; chars 94
|
|
779 ; columns 1
|
|
780 ; direction l2r
|
|
781 ; final ?0
|
|
782 ; graphic 0
|
|
783 ; short-name "SiSheng"
|
|
784 ; long-name "SiSheng (PinYin/ZhuYin)"
|
|
785 ; ))
|
|
786
|
|
787
|
|
788 ; ;; IPA characters for phonetic symbols.
|
|
789 ; (make-charset 'ipa "IPA (International Phonetic Association)"
|
|
790 ; '(dimension
|
|
791 ; 1
|
|
792 ; registry "MuleIPA"
|
|
793 ; chars 96
|
|
794 ; columns 1
|
|
795 ; direction l2r
|
|
796 ; final ?0
|
|
797 ; graphic 1
|
|
798 ; short-name "IPA"
|
|
799 ; long-name "IPA"
|
|
800 ; ))
|
|
801
|
|
802
|
|
803 ; ;; Vietnamese VISCII. VISCII is 1-byte character set which contains
|
|
804 ; ;; more than 96 characters. Since Emacs can't handle it as one
|
|
805 ; ;; character set, it is divided into two: lower case letters and upper
|
|
806 ; ;; case letters.
|
|
807 ; (make-charset 'vietnamese-viscii-lower "VISCII1.1 lower-case"
|
|
808 ; '(dimension
|
|
809 ; 1
|
|
810 ; registry "VISCII1.1"
|
|
811 ; chars 96
|
|
812 ; columns 1
|
|
813 ; direction l2r
|
|
814 ; final ?1
|
|
815 ; graphic 1
|
|
816 ; short-name "VISCII lower"
|
|
817 ; long-name "VISCII lower-case"
|
|
818 ; ))
|
|
819
|
|
820 ; (make-charset 'vietnamese-viscii-upper "VISCII1.1 upper-case"
|
|
821 ; '(dimension
|
|
822 ; 1
|
|
823 ; registry "VISCII1.1"
|
|
824 ; chars 96
|
|
825 ; columns 1
|
|
826 ; direction l2r
|
|
827 ; final ?2
|
|
828 ; graphic 1
|
|
829 ; short-name "VISCII upper"
|
|
830 ; long-name "VISCII upper-case"
|
|
831 ; ))
|
|
832
|
|
833
|
|
834 ; ;; For Arabic, we need three different types of character sets.
|
|
835 ; ;; Digits are of direction left-to-right and of width 1-column.
|
|
836 ; ;; Others are of direction right-to-left and of width 1-column or
|
|
837 ; ;; 2-column.
|
|
838 ; (make-charset 'arabic-digit "Arabic digit"
|
|
839 ; '(dimension
|
|
840 ; 1
|
|
841 ; registry "MuleArabic-0"
|
|
842 ; chars 94
|
|
843 ; columns 1
|
|
844 ; direction l2r
|
|
845 ; final ?2
|
|
846 ; graphic 0
|
|
847 ; short-name "Arabic digit"
|
|
848 ; long-name "Arabic digit"
|
|
849 ; ))
|
|
850
|
|
851 ; (make-charset 'arabic-1-column "Arabic 1-column"
|
|
852 ; '(dimension
|
|
853 ; 1
|
|
854 ; registry "MuleArabic-1"
|
|
855 ; chars 94
|
|
856 ; columns 1
|
|
857 ; direction r2l
|
|
858 ; final ?3
|
|
859 ; graphic 0
|
|
860 ; short-name "Arabic 1-col"
|
|
861 ; long-name "Arabic 1-column"
|
|
862 ; ))
|
|
863
|
|
864
|
|
865 ; ;; ASCII with right-to-left direction.
|
|
866 ; (make-charset 'ascii-right-to-left
|
|
867 ; "ASCII (left half of ISO 8859-1) with right-to-left direction"
|
|
868 ; '(dimension
|
|
869 ; 1
|
|
870 ; registry "ISO8859-1"
|
|
871 ; chars 94
|
|
872 ; columns 1
|
|
873 ; direction r2l
|
|
874 ; final ?B
|
|
875 ; graphic 0
|
|
876 ; short-name "rev ASCII"
|
|
877 ; long-name "ASCII with right-to-left direction"
|
|
878 ; ))
|
|
879
|
|
880
|
|
881 ; ;; Lao script.
|
|
882 ; ;; ISO10646's 0x0E80..0x0EDF are mapped to 0x20..0x7F.
|
|
883 ; (make-charset 'lao "Lao characters (ISO10646 0E80..0EDF)"
|
|
884 ; '(dimension
|
|
885 ; 1
|
|
886 ; registry "MuleLao-1"
|
|
887 ; chars 94
|
|
888 ; columns 1
|
|
889 ; direction l2r
|
|
890 ; final ?1
|
|
891 ; graphic 0
|
|
892 ; short-name "Lao"
|
|
893 ; long-name "Lao"
|
|
894 ; ))
|
|
895
|
|
896
|
|
897 ; ;; CHARSET-IDs 168..223 are not used.
|
|
898
|
|
899 ; ;; 1-byte 2-column charsets. Valid range of CHARSET-ID is 224..239.
|
|
900
|
|
901 ; (make-charset 'arabic-2-column "Arabic 2-column"
|
|
902 ; '(dimension
|
|
903 ; 1
|
|
904 ; registry "MuleArabic-2"
|
|
905 ; chars 94
|
|
906 ; columns 2
|
|
907 ; direction r2l
|
|
908 ; final ?4
|
|
909 ; graphic 0
|
|
910 ; short-name "Arabic 2-col"
|
|
911 ; long-name "Arabic 2-column"
|
|
912 ; ))
|
|
913
|
|
914
|
|
915 ; ;; Indian scripts. Symbolic charset for data exchange. Glyphs are
|
|
916 ; ;; not assigned. They are automatically converted to each Indian
|
|
917 ; ;; script which IS-13194 supports.
|
|
918
|
|
919 ; (make-charset 'indian-is13194
|
|
920 ; "Generic Indian charset for data exchange with IS 13194"
|
|
921 ; '(dimension
|
|
922 ; 1
|
|
923 ; registry "IS13194-Devanagari"
|
|
924 ; chars 94
|
|
925 ; columns 2
|
|
926 ; direction l2r
|
|
927 ; final ?5
|
|
928 ; graphic 1
|
|
929 ; short-name "IS 13194"
|
|
930 ; long-name "Indian IS 13194"
|
|
931 ; ))
|
|
932
|
|
933
|
|
934 ; ;; CHARSET-IDs 226..239 are not used.
|
|
935
|
|
936 ; ;; 2-byte 1-column charsets. Valid range of CHARSET-ID is 240..244.
|
|
937
|
|
938 ; ;; Actual Glyph for 1-column width.
|
|
939 ; (make-charset 'indian-1-column
|
|
940 ; "Indian charset for 1-column width glyphs"
|
|
941 ; '(dimension
|
|
942 ; 2
|
|
943 ; registry "MuleIndian-1"
|
|
944 ; chars 94
|
|
945 ; columns 1
|
|
946 ; direction l2r
|
|
947 ; final ?6
|
|
948 ; graphic 0
|
|
949 ; short-name "Indian 1-col"
|
|
950 ; long-name "Indian 1 Column"
|
|
951 ; ))
|
|
952
|
|
953
|
|
954 ; (make-charset 'tibetan-1-column "Tibetan 1 column glyph"
|
|
955 ; '(dimension
|
|
956 ; 2
|
|
957 ; registry "MuleTibetan-1"
|
|
958 ; chars 94
|
|
959 ; columns 1
|
|
960 ; direction l2r
|
|
961 ; final ?8
|
|
962 ; graphic 0
|
|
963 ; short-name "Tibetan 1-col"
|
|
964 ; long-name "Tibetan 1 column"
|
|
965 ; ))
|
|
966
|
|
967
|
|
968 ; ;; Subsets of Unicode.
|
|
969
|
|
970 ; (make-charset 'mule-unicode-2500-33ff
|
|
971 ; "Unicode characters of the range U+2500..U+33FF."
|
|
972 ; '(dimension
|
|
973 ; 2
|
|
974 ; registry "ISO10646-1"
|
|
975 ; chars 96
|
|
976 ; columns 1
|
|
977 ; direction l2r
|
|
978 ; final ?2
|
|
979 ; graphic 0
|
|
980 ; short-name "Unicode subset 2"
|
|
981 ; long-name "Unicode subset (U+2500..U+33FF)"
|
|
982 ; ))
|
|
983
|
|
984
|
|
985 ; (make-charset 'mule-unicode-e000-ffff
|
|
986 ; "Unicode characters of the range U+E000..U+FFFF."
|
|
987 ; '(dimension
|
|
988 ; 2
|
|
989 ; registry "ISO10646-1"
|
|
990 ; chars 96
|
|
991 ; columns 1
|
|
992 ; direction l2r
|
|
993 ; final ?3
|
|
994 ; graphic 0
|
|
995 ; short-name "Unicode subset 3"
|
|
996 ; long-name "Unicode subset (U+E000..U+FFFF)"
|
|
997 ; ))
|
|
998
|
|
999
|
|
1000 ; (make-charset 'mule-unicode-0100-24ff
|
|
1001 ; "Unicode characters of the range U+0100..U+24FF."
|
|
1002 ; '(dimension
|
|
1003 ; 2
|
|
1004 ; registry "ISO10646-1"
|
|
1005 ; chars 96
|
|
1006 ; columns 1
|
|
1007 ; direction l2r
|
|
1008 ; final ?1
|
|
1009 ; graphic 0
|
|
1010 ; short-name "Unicode subset"
|
|
1011 ; long-name "Unicode subset (U+0100..U+24FF)"
|
|
1012 ; ))
|
|
1013
|
|
1014
|
|
1015 ; ;; 2-byte 2-column charsets. Valid range of CHARSET-ID is 245..254.
|
|
1016
|
|
1017 ; ;; Ethiopic characters (Amharic and Tigrigna).
|
|
1018 ; (make-charset 'ethiopic "Ethiopic characters"
|
|
1019 ; '(dimension
|
|
1020 ; 2
|
|
1021 ; registry "Ethiopic-Unicode"
|
|
1022 ; chars 94
|
|
1023 ; columns 2
|
|
1024 ; direction l2r
|
|
1025 ; final ?3
|
|
1026 ; graphic 0
|
|
1027 ; short-name "Ethiopic"
|
|
1028 ; long-name "Ethiopic characters"
|
|
1029 ; ))
|
|
1030
|
|
1031
|
|
1032 ; ;; Chinese CNS11643 Plane3 thru Plane7. Although these are official
|
|
1033 ; ;; character sets, their use is rare and they don't have to be treated
|
|
1034 ; ;; space-efficiently in the buffer.
|
|
1035 ; (make-charset 'chinese-cns11643-3
|
|
1036 ; "CNS11643 Plane 3 Chinese Traditional: ISO-IR-183"
|
|
1037 ; '(dimension
|
|
1038 ; 2
|
|
1039 ; registry "CNS11643.1992-3"
|
|
1040 ; chars 94
|
|
1041 ; columns 2
|
|
1042 ; direction l2r
|
|
1043 ; final ?I
|
|
1044 ; graphic 0
|
|
1045 ; short-name "CNS11643-3"
|
|
1046 ; long-name "CNS11643-3 (Chinese traditional): ISO-IR-183"
|
|
1047 ; ))
|
|
1048
|
|
1049 ; (make-charset 'chinese-cns11643-4
|
|
1050 ; "CNS11643 Plane 4 Chinese Traditional: ISO-IR-184"
|
|
1051 ; '(dimension
|
|
1052 ; 2
|
|
1053 ; registry "CNS11643.1992-4"
|
|
1054 ; chars 94
|
|
1055 ; columns 2
|
|
1056 ; direction l2r
|
|
1057 ; final ?J
|
|
1058 ; graphic 0
|
|
1059 ; short-name "CNS11643-4"
|
|
1060 ; long-name "CNS11643-4 (Chinese traditional): ISO-IR-184"
|
|
1061 ; ))
|
|
1062
|
|
1063 ; (make-charset 'chinese-cns11643-5
|
|
1064 ; "CNS11643 Plane 5 Chinese Traditional: ISO-IR-185"
|
|
1065 ; '(dimension
|
|
1066 ; 2
|
|
1067 ; registry "CNS11643.1992-5"
|
|
1068 ; chars 94
|
|
1069 ; columns 2
|
|
1070 ; direction l2r
|
|
1071 ; final ?K
|
|
1072 ; graphic 0
|
|
1073 ; short-name "CNS11643-5"
|
|
1074 ; long-name "CNS11643-5 (Chinese traditional): ISO-IR-185"
|
|
1075 ; ))
|
|
1076
|
|
1077 ; (make-charset 'chinese-cns11643-6
|
|
1078 ; "CNS11643 Plane 6 Chinese Traditional: ISO-IR-186"
|
|
1079 ; '(dimension
|
|
1080 ; 2
|
|
1081 ; registry "CNS11643.1992-6"
|
|
1082 ; chars 94
|
|
1083 ; columns 2
|
|
1084 ; direction l2r
|
|
1085 ; final ?L
|
|
1086 ; graphic 0
|
|
1087 ; short-name "CNS11643-6"
|
|
1088 ; long-name "CNS11643-6 (Chinese traditional): ISO-IR-186"
|
|
1089 ; ))
|
|
1090
|
|
1091 ; (make-charset 'chinese-cns11643-7
|
|
1092 ; "CNS11643 Plane 7 Chinese Traditional: ISO-IR-187"
|
|
1093 ; '(dimension
|
|
1094 ; 2
|
|
1095 ; registry "CNS11643.1992-7"
|
|
1096 ; chars 94
|
|
1097 ; columns 2
|
|
1098 ; direction l2r
|
|
1099 ; final ?M
|
|
1100 ; graphic 0
|
|
1101 ; short-name "CNS11643-7"
|
|
1102 ; long-name "CNS11643-7 (Chinese traditional): ISO-IR-187"
|
|
1103 ; ))
|
|
1104
|
|
1105
|
|
1106 ; ;; Actual Glyph for 2-column width.
|
|
1107 ; (make-charset 'indian-2-column
|
|
1108 ; "Indian charset for 2-column width glyphs"
|
|
1109 ; '(dimension
|
|
1110 ; 2
|
|
1111 ; registry "MuleIndian-2"
|
|
1112 ; chars 94
|
|
1113 ; columns 2
|
|
1114 ; direction l2r
|
|
1115 ; final ?5
|
|
1116 ; graphic 0
|
|
1117 ; short-name "Indian 2-col"
|
|
1118 ; long-name "Indian 2 Column"
|
|
1119 ; ))
|
|
1120
|
|
1121
|
|
1122 ; ;; Tibetan script.
|
|
1123 ; (make-charset 'tibetan "Tibetan characters"
|
|
1124 ; '(dimension
|
|
1125 ; 2
|
|
1126 ; registry "MuleTibetan-2"
|
|
1127 ; chars 94
|
|
1128 ; columns 2
|
|
1129 ; direction l2r
|
|
1130 ; final ?7
|
|
1131 ; graphic 0
|
|
1132 ; short-name "Tibetan 2-col"
|
|
1133 ; long-name "Tibetan 2 column"
|
|
1134 ; ))
|
|
1135
|
|
1136
|
|
1137 ; ;; CHARSET-ID 253 is not used.
|
|
1138
|
|
1139 ; ;; JISX0213 Plane 2
|
|
1140 ; (make-charset 'japanese-jisx0213-2 "JISX0213 Plane 2 (Japanese)"
|
|
1141 ; '(dimension
|
|
1142 ; 2
|
|
1143 ; registry "JISX0213.2000-2"
|
|
1144 ; chars 94
|
|
1145 ; columns 2
|
|
1146 ; direction l2r
|
|
1147 ; final ?P
|
|
1148 ; graphic 0
|
|
1149 ; short-name "JISX0213-2"
|
|
1150 ; long-name "JISX0213-2"
|
|
1151 ; ))
|
|
1152
|
428
|
1153 ;;; mule-charset.el ends here
|
778
|
1154
|