xemacs-beta: lisp/unicode.el comparison

comparison lisp/unicode.el @ 2297:13a418960a88

[xemacs-hg @ 2004-09-22 02:05:42 by stephent] various doc patches <87isa7awrh.fsf@tleepslib.sk.tsukuba.ac.jp>

author	stephent
date	Wed, 22 Sep 2004 02:06:52 +0000
parents	b531bf8658e9
children	ecf1ebac70d8

comparison

equal deleted inserted replaced

-:a58ea4d0d0cd
+:13a418960a88
 ;;; Code:
 ; ;; Subsets of Unicode.
+; #### what is this bogosity ... "chars 96, final ?2" !!?!
 ; (make-charset 'mule-unicode-2500-33ff
 ; 	      "Unicode characters of the range U+2500..U+33FF."
 ; 	      '(dimension
 ; 		2
 ; 		registry "ISO10646-1"
 	    ;; "CP936.TXT"
 	    ;; "CP949.TXT"
 	    ;; "CP950.TXT"
 	    ;; "GB12345.TXT"
 	    ("GB2312.TXT" chinese-gb2312)
 	    ;; "HANGUL.TXT"
+	    ;; #### shouldn't JIS X 0201's upper limit be 7f?
 	    ("JIS0201.TXT" latin-jisx0201 #x21 #x80)
 	    ("JIS0201.TXT" katakana-jisx0201 #xA0 #xFF #x-80)
 	    ("JIS0208.TXT" japanese-jisx0208 nil nil nil ignore-first-column)
 	    ("JIS0212.TXT" japanese-jisx0212)
 	    ;; "JOHAB.TXT"
 	    ("KSX1001.TXT" korean-ksc5601)
 	    ;; "OLD5601.TXT"
 	    ;; "SHIFTJIS.TXT"
 	    )
 	   ("unicode/mule-ucs"
+	    ;; #### we don't support surrogates?!??
 	    ;; use these instead of the above ones once we support surrogates
 	    ;;("chinese-cns11643-1.txt" chinese-cns11643-1)
 	    ;;("chinese-cns11643-2.txt" chinese-cns11643-2)
 	    ;;("chinese-cns11643-3.txt" chinese-cns11643-3)
 	    ;;("chinese-cns11643-4.txt" chinese-cns11643-4)
 ;; Define the coding system named `ucs-4-little-endian'.  The call passes
 ;; `unicode' as its second argument and the short label "UCS-4 Little Endian"
 ;; as its third; the quoted property list that follows supplies the
 ;; mnemonic "UCS4-LE", the documentation string, `type ucs-4', and
 ;; `little-endian t'.
 (make-coding-system
 'ucs-4-little-endian 'unicode
 "UCS-4 Little Endian"
 '(mnemonic "UCS4-LE"
 documentation
+;; #### I don't think this is permitted by ISO 10646, only Unicode.
+;; Call it UTF-32 instead?
 "Little-endian version of UCS-4 Unicode encoding.  See `ucs-4' coding system."
 type ucs-4
 little-endian t))
 (make-coding-system
 'utf-8 'unicode
 "UTF-8"
 '(mnemonic "UTF8"
 documentation
 "UTF-8 Unicode encoding -- ASCII-compatible 8-bit variable-width encoding
-with the same principles as the Mule-internal encoding:
+sharing the following principles with the Mule-internal encoding:
 -- All ASCII characters (codepoints 0 through 127) are represented
 by themselves (i.e. using one byte, with the same value as the
 ASCII codepoint), and these bytes are disjoint from bytes
 representing non-ASCII characters.

Mercurial > hg > xemacs-beta

comparison lisp/unicode.el @ 2297:13a418960a88