diff lisp/mule/cyrillic.el @ 428:3ecd8885ac67 r21-2-22

Import from CVS: tag r21-2-22
author cvs
date Mon, 13 Aug 2007 11:28:15 +0200
parents
children 576fb035e263
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/lisp/mule/cyrillic.el	Mon Aug 13 11:28:15 2007 +0200
@@ -0,0 +1,292 @@
+;;; cyrillic.el --- Support for Cyrillic -*- coding: iso-2022-7bit; -*-
+
+;; Copyright (C) 1995,1999 Electrotechnical Laboratory, JAPAN.
+;; Licensed to the Free Software Foundation.
+;; Copyright (C) 1997 MORIOKA Tomohiko
+
+;; Keywords: multilingual, Cyrillic
+
+;; This file is part of XEmacs.
+
+;; XEmacs is free software; you can redistribute it and/or modify it
+;; under the terms of the GNU General Public License as published by
+;; the Free Software Foundation; either version 2, or (at your option)
+;; any later version.
+
+;; XEmacs is distributed in the hope that it will be useful, but
+;; WITHOUT ANY WARRANTY; without even the implied warranty of
+;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+;; General Public License for more details.
+
+;; You should have received a copy of the GNU General Public License
+;; along with XEmacs; see the file COPYING.  If not, write to the Free
+;; Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
+;; 02111-1307, USA.
+
+;;; Commentary:
+
+;; The character set ISO8859-5 is supported.  KOI-8 and ALTERNATIVNYJ
+;; are converted to ISO8859-5 internally.
+
+;;; Code:
+
+;; For syntax of Cyrillic
+(modify-syntax-entry 'cyrillic-iso8859-5 "w")
+(modify-syntax-entry ?,L-(B ".")
+(modify-syntax-entry ?,Lp(B ".")
+(modify-syntax-entry ?,L}(B ".")
+
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+;;; CYRILLIC
+;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
+
+;; ISO-8859-5 staff
+
+;; (make-coding-system
+;;  'cyrillic-iso-8bit 2 ?5
+;;  "ISO 2022 based 8-bit encoding for Cyrillic script (MIME:ISO-8859-5)"
+;;  '(ascii cyrillic-iso8859-5  nil nil
+;;    nil nil nil nil nil nil nil)
+;;  '((safe-charsets ascii cyrillic-iso8859-5)
+;;    (mime-charset . iso-8859-5)))
+
+;; (define-coding-system-alias 'iso-8859-5 'cyrillic-iso-8bit)
+
+(make-coding-system
+ 'iso-8859-5 'iso2022
+ "MIME ISO-8859-5"
+ '(charset-g0 ascii
+   charset-g1 cyrillic-iso8859-5
+   charset-g2 t
+   charset-g3 t
+   mnemonic "ISO8/Cyr"
+   ))
+
+(set-language-info-alist
+ "Cyrillic-ISO" '((charset cyrillic-iso8859-5)
+		  (tutorial . "TUTORIAL.ru")
+		  (coding-system iso-8859-5)
+		  (coding-priority iso-8859-5)
+		  (input-method . "cyrillic-yawerty")
+		  (features cyril-util)
+		  (sample-text . "Russian (,L@caaZXY(B)	,L7T`PRabRcYbU(B!")
+		  (documentation . "Support for Cyrillic ISO-8859-5."))
+ '("Cyrillic"))
+
+;; KOI-8 staff
+
+(eval-and-compile
+
+(defvar cyrillic-koi8-r-decode-table
+  [
+   0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
+   16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31
+   32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
+   48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63
+   64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79
+   80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95
+   96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111
+   112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127
+   ?$B(!(B ?$B("(B ?$B(#(B ?$B($(B ?$B(&(B ?$B(%(B ?$B('(B ?$B()(B ?$B(((B ?$B(*(B ?$B(+(B 32  ?$(G#'(B ?$(G#+(B ?$(G#/(B 32
+   32  ?$(C"F(B 32  32  ?$B"#(B 32  ?$B"e(B ?$A!V(B ?$A!\(B ?$A!](B ?,L (B  32  ?,A0(B  ?,A2(B  ?,A7(B  ?,Aw(B
+   ?$(G#D(B 32  32  ?,Lq(B  32  32  32  32  32  32  32  32  32  32  32  ?$(G#E(B
+   32  32  ?$(G#G(B ?,L!(B  32  32  32  32  32  32  32  32  ?$(G#F(B 32  32  ?,A)(B
+   ?,Ln(B  ?,LP(B  ?,LQ(B  ?,Lf(B  ?,LT(B  ?,LU(B  ?,Ld(B  ?,LS(B  ?,Le(B  ?,LX(B  ?,LY(B  ?,LZ(B  ?,L[(B  ?,L\(B  ?,L](B  ?,L^(B 
+   ?,L_(B  ?,Lo(B  ?,L`(B  ?,La(B  ?,Lb(B  ?,Lc(B  ?,LV(B  ?,LR(B  ?,Ll(B  ?,Lk(B  ?,LW(B  ?,Lh(B  ?,Lm(B  ?,Li(B  ?,Lg(B  ?,Lj(B 
+   ?,LN(B  ?,L0(B  ?,L1(B  ?,LF(B  ?,L4(B  ?,L5(B  ?,LD(B  ?,L3(B  ?,LE(B  ?,L8(B  ?,L9(B  ?,L:(B  ?,L;(B  ?,L<(B  ?,L=(B  ?,L>(B 
+   ?,L?(B  ?,LO(B  ?,L@(B  ?,LA(B  ?,LB(B  ?,LC(B  ?,L6(B  ?,L2(B  ?,LL(B  ?,LK(B  ?,L7(B  ?,LH(B  ?,LM(B  ?,LI(B  ?,LG(B  ?,LJ(B ]
+  "Cyrillic KOI8-R decoding table.")
+
+(defvar cyrillic-koi8-r-encode-table
+  (let ((table (make-vector 256 32))
+	(i 0))
+    (while (< i 256)
+      (let* ((ch (aref cyrillic-koi8-r-decode-table i))
+	     (split (split-char ch)))
+	(cond ((eq (car split) 'cyrillic-iso8859-5)
+	       (aset table (logior (nth 1 split) 128) i)
+	       )
+	      ((eq ch 32))
+	      ((eq (car split) 'ascii)
+	       (aset table ch i)
+	       )))
+      (setq i (1+ i)))
+    table)
+  "Cyrillic KOI8-R encoding table.")
+
+)
+
+(define-ccl-program ccl-decode-koi8
+  `(3
+    ((read r0)
+     (loop
+      (write-read-repeat r0 ,cyrillic-koi8-r-decode-table))))
+  "CCL program to decode KOI8.")
+
+(define-ccl-program ccl-encode-koi8
+  `(1
+    ((read r0)
+     (loop
+      (if (r0 != ,(charset-id 'cyrillic-iso8859-5))
+	  (write-read-repeat r0)
+	((read r0)
+	 (write-read-repeat r0 , cyrillic-koi8-r-encode-table))))))
+  "CCL program to encode KOI8.")
+
+;; (make-coding-system
+;;  'cyrillic-koi8 4
+;;  ;; We used to use ?K.  It is true that ?K is more strictly correct,
+;;  ;; but it is also used for Korean.
+;;  ;; So people who use koi8 for languages other than Russian
+;;  ;; will have to forgive us.
+;;  ?R "KOI8 8-bit encoding for Cyrillic (MIME: KOI8-R)"
+;;  '(ccl-decode-koi8 . ccl-encode-koi8)
+;;  '((safe-charsets ascii cyrillic-iso8859-5)
+;;    (mime-charset . koi8-r)
+;;    (valid-codes (0 . 127) 163 179 (192 . 255))
+;;    (charset-origin-alist (cyrillic-iso8859-5 "KOI8-R"
+;;                                              cyrillic-encode-koi8-r-char))))
+
+;; (define-coding-system-alias 'koi8-r 'cyrillic-koi8)
+;; (define-coding-system-alias 'koi8 'cyrillic-koi8)
+
+(make-coding-system
+ 'koi8-r 'ccl
+ "Coding-system used for KOI8-R."
+ `(decode ,ccl-decode-koi8
+   encode ,ccl-encode-koi8
+   mnemonic "KOI8"))
+
+;; it is not correct, but XEmacs doesn't have `ccl' category...
+(coding-system-put 'koi8-r 'category 'iso-8-1)
+
+;; (define-ccl-program ccl-encode-koi8-font
+;;   `(0
+;;     ((r1 |= 128)
+;;      (r1 = r1 ,cyrillic-koi8-r-encode-table)))
+;;   "CCL program to encode Cyrillic chars to KOI font.")
+
+;; (setq font-ccl-encoder-alist
+;;       (cons (cons "koi8" ccl-encode-koi8-font) font-ccl-encoder-alist))
+
+;; (defvar cyrillic-koi8-r-nonascii-translation-table
+;;   (make-translation-table-from-vector cyrillic-koi8-r-decode-table)
+;;   "Value of `nonascii-translation-table' in Cyrillic-KOI8 language environment..")
+
+(set-language-info-alist
+ "Cyrillic-KOI8" '((charset cyrillic-iso8859-5)
+		   (coding-system koi8-r)
+		   (coding-priority koi8-r)
+		   (input-method . "cyrillic-yawerty")
+		   (features cyril-util)
+		   (tutorial . "TUTORIAL.ru")
+		   (sample-text . "Russian (,L@caaZXY(B)	,L7T`PRabRcYbU(B!")
+		   (documentation . "Support for Cyrillic KOI8-R."))
+ '("Cyrillic"))
+
+;;; ALTERNATIVNYJ staff
+
+(eval-and-compile
+
+(defvar cyrillic-alternativnyj-decode-table
+  [
+   0   1   2   3   4   5   6   7   8   9  10  11  12  13  14  15
+   16  17  18  19  20  21  22  23  24  25  26  27  28  29  30  31
+   32  33  34  35  36  37  38  39  40  41  42  43  44  45  46  47
+   48  49  50  51  52  53  54  55  56  57  58  59  60  61  62  63
+   64  65  66  67  68  69  70  71  72  73  74  75  76  77  78  79
+   80  81  82  83  84  85  86  87  88  89  90  91  92  93  94  95
+   96  97  98  99 100 101 102 103 104 105 106 107 108 109 110 111
+   112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127
+   ?,L0(B  ?,L1(B  ?,L2(B  ?,L3(B  ?,L4(B  ?,L5(B  ?,L6(B  ?,L7(B  ?,L8(B  ?,L9(B  ?,L:(B  ?,L;(B  ?,L<(B  ?,L=(B  ?,L>(B  ?,L?(B
+   ?,L@(B  ?,LA(B  ?,LB(B  ?,LC(B  ?,LD(B  ?,LE(B  ?,LF(B  ?,LG(B  ?,LH(B  ?,LI(B  ?,LJ(B  ?,LK(B  ?,LL(B  ?,LM(B  ?,LN(B  ?,LO(B
+   ?,LP(B  ?,LQ(B  ?,LR(B  ?,LS(B  ?,LT(B  ?,LU(B  ?,LV(B  ?,LW(B  ?,LX(B  ?,LY(B  ?,LZ(B  ?,L[(B  ?,L\(B  ?,L](B  ?,L^(B  ?,L_(B
+   32  32  32  32  32  32  32  32  32  32  32  32  32  32  32  32
+   32  32  32  32  32  32  32  32  32  32  32  32  32  32  32  32
+   32  32  32  32  32  32  32  32  32  32  32  32  32  32  32  32
+   ?,L`(B  ?,La(B  ?,Lb(B  ?,Lc(B  ?,Ld(B  ?,Le(B  ?,Lf(B  ?,Lg(B  ?,Lh(B  ?,Li(B  ?,Lj(B  ?,Lk(B  ?,Ll(B  ?,Lm(B  ?,Ln(B  ?,Lo(B
+   ?,L!(B  ?,Lq(B   32  32  32  32  32  32  32  32  32  32  32  32  32 ?,Lp(B]
+  "Cyrillic ALTERNATIVNYJ decoding table.")
+
+(defvar cyrillic-alternativnyj-encode-table
+  (let ((table (make-vector 256 32))
+	(i 0))
+    (while (< i 256)
+      (let* ((ch (aref cyrillic-alternativnyj-decode-table i))
+	     (split (split-char ch)))
+	(if (eq (car split) 'cyrillic-iso8859-5)
+	    (aset table (logior (nth 1 split) 128) i)
+	  (if (/= ch 32)
+	      (aset table ch i))))
+      (setq i (1+ i)))
+    table)
+  "Cyrillic ALTERNATIVNYJ encoding table.")
+  
+)
+
+
+(define-ccl-program ccl-decode-alternativnyj
+  `(3
+    ((read r0)
+     (loop
+      (write-read-repeat r0 ,cyrillic-alternativnyj-decode-table))))
+  "CCL program to decode Alternativnyj.")
+
+(define-ccl-program ccl-encode-alternativnyj
+  `(1
+    ((read r0)
+     (loop
+      (if (r0 != ,(charset-id 'cyrillic-iso8859-5))
+	  (write-read-repeat r0)
+	((read r0)
+	 (write-read-repeat r0 ,cyrillic-alternativnyj-encode-table))))))
+  "CCL program to encode Alternativnyj.")
+
+;; (make-coding-system
+;;  'cyrillic-alternativnyj 4 ?A
+;;  "ALTERNATIVNYJ 8-bit encoding for Cyrillic"
+;;  '(ccl-decode-alternativnyj . ccl-encode-alternativnyj)
+;;  '((safe-charsets ascii cyrillic-iso8859-5)
+;;    (valid-codes (0 . 175) (224 . 241) 255)
+;;    (charset-origin-alist (cyrillic-iso8859-5 "ALTERNATIVNYJ"
+;;                                              cyrillic-encode-koi8-r-char))))
+
+
+;; (define-coding-system-alias 'alternativnyj 'cyrillic-alternativnyj)
+
+(make-coding-system
+ 'alternativnyj 'ccl
+ "Coding-system used for Alternativnyj"
+ `(decode ,ccl-decode-alternativnyj
+   encode ,ccl-encode-alternativnyj
+   mnemonic "Cy.Alt"))
+
+;; it is not correct, but XEmacs doesn't have `ccl' category...
+(coding-system-put 'alternativnyj 'category 'iso-8-1)
+
+;; (define-ccl-program ccl-encode-alternativnyj-font
+;;   '(0
+;;     ((r1 |= 128)
+;;      (r1 = r1 ,cyrillic-alternativnyj-encode-table)))
+;;   "CCL program to encode Cyrillic chars to Alternativnyj font.")
+
+;; (setq font-ccl-encoder-alist
+;;       (cons (cons "alternativnyj" ccl-encode-alternativnyj-font)
+;;             font-ccl-encoder-alist))
+
+;; (defvar cyrillic-alternativnyj-nonascii-translation-table
+;;   (make-translation-table-from-vector cyrillic-alternativnyj-decode-table)
+;;   "Value of `nonascii-translation-table' in Cyrillic-ALT language environment.")
+
+(set-language-info-alist
+ "Cyrillic-ALT" '((charset cyrillic-iso8859-5)
+		  (coding-system alternativnyj)
+		  (coding-priority alternativnyj)
+		  (input-method . "cyrillic-yawerty")
+		  (features cyril-util)
+		  (tutorial . "TUTORIAL.ru")
+		  (sample-text . "Russian (,L@caaZXY(B)	,L7T`PRabRcYbU(B!")
+		  (documentation . "Support for Cyrillic ALTERNATIVNYJ."))
+ '("Cyrillic"))
+
+;;; cyrillic.el ends here