xemacs-beta: lisp/unicode.el comparison

comparison lisp/unicode.el @ 4268:75d0292c1bff

[xemacs-hg @ 2007-11-14 19:41:04 by aidan] Correct the dumped information for the Unicode JIT infrastructure.

author	aidan
date	Wed, 14 Nov 2007 19:41:09 +0000
parents	38ef5a6da799
children	15d36164ebd7

comparison

equal deleted inserted replaced

-:66e2714696bd
+:75d0292c1bff
 (modify-syntax-entry decoded
 (string
 (char-syntax ascii-or-latin-1))
 syntax-table))
-;; Create all the Unicode error sequences, normally as jit-ucs-charset-0
+;; *Sigh*, declarations need to be at the start of the line to be picked up
-;; characters starting at U+200000 (which isn't a valid Unicode code
+;; by make-docfile. Not so much an issue with ccl-encode-to-ucs-2, which we
-;; point). Make them available to user code.
+;; don't necessarily want to advertise, but the following are important.
-(defvar unicode-error-default-translation-table
-(loop
+;; Create all the Unicode error sequences, normally as jit-ucs-charset-0
-with char-table = (make-char-table 'char)
+;; characters starting at U+200000 (which isn't a valid Unicode code
-for i from ?\x00 to ?\xFF
+;; point). Make them available to user code.
-do
+(defvar unicode-error-default-translation-table
-(put-char-table (aref
+(loop
-		       ;; #xd800 is the first leading surrogate;
+with char-table = (make-char-table 'char)
-		       ;; trailing surrogates must be in the range
+for i from ?\x00 to ?\xFF
-		       ;; #xdc00-#xdfff. These examples are not, so we
+do
-		       ;; intentionally provoke an error sequence.
+(put-char-table (aref
-		       (decode-coding-string (format "\xd8\x00\x00%c" i)
+;; #xd800 is the first leading surrogate;
-					     'utf-16-be)
+;; trailing surrogates must be in the range
-		       3)
+;; #xdc00-#xdfff. These examples are not, so we
-		      i
+;; intentionally provoke an error sequence.
-char-table)
+(decode-coding-string (format "\xd8\x00\x00%c" i)
-finally return char-table)
+'utf-16-be)
-"Translation table mapping Unicode error sequences to Latin-1 chars.
+3)
+i
+char-table)
+finally return char-table)
+"Translation table mapping Unicode error sequences to Latin-1 chars.
 To transform XEmacs Unicode error sequences to the Latin-1 characters that
 correspond to the octets on disk, you can use this variable.  ")
 (defvar unicode-error-sequence-regexp-range
 (format "%c%c-%c"
 (aref (decode-coding-string "\xd8\x00\x00\x00" 'utf-16-be) 0)
 (aref (decode-coding-string "\xd8\x00\x00\x00" 'utf-16-be) 3)
 (aref (decode-coding-string "\xd8\x00\x00\xFF" 'utf-16-be) 3))
 "Regular expression range to match Unicode error sequences in XEmacs.
 Invalid Unicode sequences on input are represented as XEmacs
 characters with values stored as the keys in
 `unicode-error-default-translation-table', one character for each
 invalid octet.  You can use this variable (with `re-search-forward' or
 		;			 unicode-error-sequence-regexp-range
 		;			 "]"))
 	      nil
 	      (format "Could not find char ?\\x%x in buffer" i))))
 (defun frob-unicode-errors-region (frob-function begin end &optional buffer)
 "Call FROB-FUNCTION on the Unicode error sequences between BEGIN and END.
 Optional argument BUFFER specifies the buffer that should be examined for
 such sequences.  "
 (check-argument-type #'functionp frob-function)
 (check-argument-range begin (point-min buffer) (point-max buffer))
 (check-argument-range end (point-min buffer) (point-max buffer))
 (save-excursion
 (save-restriction
 	(if buffer (set-buffer buffer))
 	(narrow-to-region begin end)
 	(goto-char (point-min))

Mercurial > hg > xemacs-beta

comparison lisp/unicode.el @ 4268:75d0292c1bff