Mercurial > hg > xemacs-beta
diff lisp/language/chinese.el @ 159:3bb7ccffb0c0 r20-3b6
Import from CVS: tag r20-3b6
author | cvs |
---|---|
date | Mon, 13 Aug 2007 09:41:43 +0200 |
parents | |
children | 85ec50267440 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/lisp/language/chinese.el Mon Aug 13 09:41:43 2007 +0200 @@ -0,0 +1,426 @@ +;;; chinese.el --- Support for Chinese + +;; Copyright (C) 1995 Free Software Foundation, Inc. +;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN. +;; Copyright (C) 1997 MORIOKA Tomohiko + +;; Keywords: multilingual, Chinese + +;; This file is part of XEmacs. + +;; XEmacs is free software; you can redistribute it and/or modify it +;; under the terms of the GNU General Public License as published by +;; the Free Software Foundation; either version 2, or (at your option) +;; any later version. + +;; XEmacs is distributed in the hope that it will be useful, but +;; WITHOUT ANY WARRANTY; without even the implied warranty of +;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU +;; General Public License for more details. + +;; You should have received a copy of the GNU General Public License +;; along with XEmacs; see the file COPYING. If not, write to the Free +;; Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA +;; 02111-1307, USA. + +;;; Commentary: + +;; For Chinese, three character sets GB2312, BIG5, and CNS11643 are +;; supported. + +;;; Code: + +;; Syntax of Chinese characters. +(modify-syntax-entry 'chinese-gb2312 "w") +(loop for row in '(33 34 41) + do (modify-syntax-entry `[chinese-gb2312 ,row] ".")) +;;(loop for row from 35 to 40 +;; do (modify-syntax-entry `[chinese-gb2312 ,row] "w")) +;;(loop for row from 42 to 126 +;; do (modify-syntax-entry `[chinese-gb2312 ,row] "w")) + +(modify-syntax-entry 'chinese-cns11643-1 "w") +(modify-syntax-entry 'chinese-cns11643-2 "w") +(modify-syntax-entry 'chinese-big5-1 "w") +(modify-syntax-entry 'chinese-big5-2 "w") + +;; CNS11643 Plane3 thru Plane7 +;; These represent more and more obscure Chinese characters. +;; By the time you get to Plane 7, we're talking about characters +;; that appear once in some ancient manuscript and whose meaning +;; is unknown. + +(flet + ((make-chinese-cns11643-charset + (name plane final) + (make-charset + name (concat "Chinese CNS Plane " plane) + `(registry + ,(concat "CNS11643[.-]\\(.*[.-]\\)?" plane "$") + dimension 2 + chars 94 + final ,final + graphic 0)) + (modify-syntax-entry name "w") + (modify-category-entry name ?t) + )) + (make-chinese-cns11643-charset 'chinese-cns11643-3 "3" ?I) + (make-chinese-cns11643-charset 'chinese-cns11643-4 "4" ?J) + (make-chinese-cns11643-charset 'chinese-cns11643-5 "5" ?K) + (make-chinese-cns11643-charset 'chinese-cns11643-6 "6" ?L) + (make-chinese-cns11643-charset 'chinese-cns11643-7 "7" ?M) + ) + +;; PinYin-ZhuYin +(make-charset 'sisheng "PinYin-ZhuYin" + '(registry "sisheng_cwnn\\|OMRON_UDC_ZH" + dimension 1 + chars 94 + final ?0 + graphic 0 + )) + +;; If you prefer QUAIL to EGG, please modify below as you wish. +;;(when (and (featurep 'egg) (featurep 'wnn)) +;; (setq wnn-server-type 'cserver) +;; (load "its/pinyin") +;; (setq its:*standard-modes* +;; (cons (its:get-mode-map "PinYin") its:*standard-modes*))) + +;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; +;;; Chinese (general) +;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; + +;; (make-coding-system +;; 'iso-2022-cn 2 ?C +;; "Coding system ISO-2022-CN for Chinese (GB and CNS character sets)." +;; '(ascii +;; (nil chinese-gb2312 chinese-cns11643-1) +;; (nil chinese-cns11643-2) +;; (nil chinese-cns11643-3 chinese-cns11643-4 chinese-cns11643-5 +;; chinese-cns11643-6 chinese-cns11643-7) +;; nil ascii-eol ascii-cntl seven locking-shift single-shift nil nil nil +;; init-bol)) + +;; (define-coding-system-alias 'iso-2022-cn 'iso-2022-cn-ext) + +(defun describe-chinese-support () + "Describe how Emacs supports Chinese." + (interactive) + (with-output-to-temp-buffer "*Help*" + (princ (get-language-info "Chinese" 'documentation)) + (princ "\n"))) + +(set-language-info-alist + "Chinese" '((describe-function . describe-chinese-support) + (documentation . "\ +Emacs provides the following three kinds of Chinese support: + Chinese-GB: for users of the charset GB2312 + Chinese-BIG5: for users of the charset Big5 + Chinese-CNS: for users of the charset CNS11643 family +Please specify one of them to get more information.") + )) + +;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; +;;; Chinese GB2312 (simplified) +;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; + +;; (make-coding-system +;; 'cn-gb-2312 2 ?C +;; "Coding-system of Chinese EUC (so called GB Encoding)." +;; '((ascii t) chinese-gb2312 chinese-sisheng nil +;; nil ascii-eol ascii-cntl nil nil single-shift nil)) + +(make-coding-system + 'cn-gb-2312 'iso2022 + "Coding-system of Chinese EUC (Extended Unix Code)." + '(charset-g0 ascii + charset-g1 chinese-gb2312 + charset-g2 sisheng + charset-g3 t + mnemonic "Zh-GB/EUC" + )) + +;;(define-coding-system-alias 'cn-gb-2312 'euc-china) + +(copy-coding-system 'cn-gb-2312 'gb2312) +(copy-coding-system 'cn-gb-2312 'chinese-euc) + +;; (make-coding-system +;; 'hz-gb-2312 0 ?z +;; "Codins-system of Hz/ZW used for Chinese (GB)." +;; nil) +;; (put 'hz-gb-2312 'post-read-conversion 'post-read-decode-hz) +;; (put 'hz-gb-2312 'pre-write-conversion 'pre-write-encode-hz) + +(make-coding-system + 'hz-gb-2312 'no-conversion + "Coding-system of Hz/ZW used for Chinese." + '(mnemonic "Zh-GB/Hz" + eol-type lf + post-read-conversion post-read-decode-hz + pre-write-conversion pre-write-encode-hz)) + +;; (define-coding-system-alias 'hz-gb-2312 'hz) + +(copy-coding-system 'hz-gb-2312 'hz) +(copy-coding-system 'hz-gb-2312 'chinese-hz) + +(defun post-read-decode-hz (len) + (let ((pos (point))) + (decode-hz-region pos (+ pos len)))) + +(defun pre-write-encode-hz (from to) + (let ((buf (current-buffer)) + (work (get-buffer-create " *pre-write-encoding-work*"))) + (set-buffer work) + (erase-buffer) + (if (stringp from) + (insert from) + (insert-buffer-substring buf from to)) + (encode-hz-region 1 (point-max)) + nil)) + +(register-input-method + "Chinese-GB" '("quail-ccdospy" quail-use-package "quail/ccdospy")) +(register-input-method + "Chinese-GB" '("quail-ctlau" quail-use-package "quail/ctlau")) +(register-input-method + "Chinese-GB" '("quail-punct" quail-use-package "quail/punct")) +(register-input-method + "Chinese-GB" '("quail-qj" quail-use-package "quail/qj")) +(register-input-method + "Chinese-GB" '("quail-sw" quail-use-package "quail/sw")) +(register-input-method + "Chinese-GB" '("quail-ziranma" quail-use-package "quail/ziranma")) +(register-input-method + "Chinese-GB" '("quail-tonepy" quail-use-package "quail/tonepy")) +(register-input-method + "Chinese-GB" '("quail-py" quail-use-package "quail/py")) + +(defun setup-chinese-gb-environment () + "Setup multilingual environment (MULE) for Chinese GB2312 users." + (interactive) + (setq primary-language "Chinese-GB") + + (setq coding-category-iso-8-2 'cn-gb-2312) + (setq coding-category-iso-else 'iso-2022-cn) + (setq coding-category-big5 'cn-big5) + + (set-coding-priority + '(coding-category-iso-7 + coding-category-iso-else + coding-category-iso-8-2 + coding-category-big5 + coding-category-iso-8-1 + coding-category-internal + )) + + (setq-default buffer-file-coding-system 'cn-gb-2312) + (set-terminal-coding-system 'cn-gb-2312) + (set-keyboard-coding-system 'cn-gb-2312) + + (setq default-input-method '("Chinese-GB" . "quail-py")) + ) + +(defun describe-chinese-gb-support () + "Describe how Emacs supports Chinese for GB2312 users." + (interactive) + (describe-language-support-internal "Chinese-GB")) + +(set-language-info-alist + "Chinese-GB" '((setup-function . setup-chinese-gb-environment) + (describe-function . describe-chinese-gb-support) + (charset . (chinese-gb2312 chinese-sisheng)) + (coding-system . (cn-gb-2312 hz-gb-2312 iso-2022-cn)) + (sample-text . "Chinese ($AVPND(B,$AFUM(;0(B,$A::So(B) $ADc:C(B") + (documentation . nil))) + +;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; +;; Chinese BIG5 (traditional) +;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; + +;; (make-coding-system +;; 'big5 3 ?B +;; "Coding-system of BIG5.") + +;;(define-coding-system-alias 'big5 'cn-big5) + +(make-coding-system + 'big5 'big5 + "Coding-system of BIG5." + '(mnemonic "Zh/Big5")) + +(copy-coding-system 'big5 'cn-big5) +(copy-coding-system 'big5 'chinese-big5) + +;; Big5 font requires special encoding. +;; (define-ccl-program ccl-encode-big5-font +;; `(0 +;; ;; In: R0:chinese-big5-1 or chinese-big5-2 +;; ;; R1:position code 1 +;; ;; R2:position code 2 +;; ;; Out: R1:font code point 1 +;; ;; R2:font code point 2 +;; ((r2 = ((((r1 - ?\x21) * 94) + r2) - ?\x21)) +;; (if (r0 == ,(charset-id 'chinese-big5-2)) (r2 += 6280)) +;; (r1 = ((r2 / 157) + ?\xA1)) +;; (r2 %= 157) +;; (if (r2 < ?\x3F) (r2 += ?\x40) (r2 += ?\x62)))) +;; "CCL program to encode a Big5 code to code point of Big5 font.") + +;; (setq font-ccl-encoder-alist +;; (cons (cons "big5" ccl-encode-big5-font) font-ccl-encoder-alist)) + +(define-ccl-program ccl-encode-big5-1-font + '(((r1 = ((((r0 - #x21) * 94) + r1) - #x21)) + (r0 = ((r1 / 157) + #xA1)) + (r1 %= 157) + (if (r1 < #x3F) (r1 += #x40) (r1 += #x62)))) + "CCL program to encode a Big5 code (level1) to code point of Big5 font.") + +;; 6280 is the number of characters that got shoved into `chinese-big5-1'. +(define-ccl-program ccl-encode-big5-2-font + '(((r1 = (((((r0 - #x21) * 94) + r1) - #x21) + 6280)) + (r0 = ((r1 / 157) + #xA1)) + (r1 %= 157) + (if (r1 < #x3F) (r1 += #x40) (r1 += #x62)))) + "CCL program to encode a Big5 code (level2) to code point of Big5 font.") + +(set-charset-ccl-program 'chinese-big5-1 ccl-encode-big5-1-font) +(set-charset-ccl-program 'chinese-big5-2 ccl-encode-big5-2-font) + +(register-input-method + "Chinese-BIG5" '("quail-qj-b5" quail-use-package "quail/qj-b5")) +(register-input-method + "Chinese-BIG5" '("quail-zozy" quail-use-package "quail/zozy")) +(register-input-method + "Chinese-BIG5" '("quail-tsangchi-b5" quail-use-package "quail/tsangchi-b5")) +(register-input-method + "Chinese-BIG5" '("quail-py-b5" quail-use-package "quail/py-b5")) +(register-input-method + "Chinese-BIG5" '("quail-quick-b5" quail-use-package "quail/quick-bt")) +(register-input-method + "Chinese-BIG5" '("quail-etzy" quail-use-package "quail/etzy")) +(register-input-method + "Chinese-BIG5" '("quail-ecdict" quail-use-package "quail/ecdict")) +(register-input-method + "Chinese-BIG5" '("quail-ctlaub" quail-use-package "quail/ctlaub")) +(register-input-method + "Chinese-BIG5" '("quail-array30" quail-use-package "quail/array30")) +(register-input-method + "Chinese-BIG5" '("quail-4corner" quail-use-package "quail/4corner")) + +(defun setup-chinese-big5-environment () + "Setup multilingual environment (MULE) for Chinese Big5 users." + (interactive) + (setq primary-language "Chinese-BIG5") + + (setq coding-category-big5 'cn-big5) + (setq coding-category-iso-else 'iso-2022-cn) + (setq coding-category-iso-8-2 'cn-gb-2312) + + (set-coding-priority + '(coding-category-iso-7 + coding-category-iso-else + coding-category-big5 + coding-category-iso-8-2)) + + (setq-default buffer-file-coding-system 'cn-big5) + (set-terminal-coding-system 'cn-big5) + (set-keyboard-coding-system 'cn-big5) + + (setq default-input-method '("Chinese-BIG5" . "quail-py-b5")) + ) + +(defun describe-chinese-big5-support () + "Describe how Emacs supports Chinese for Big5 users." + (interactive) + (describe-language-support-internal "Chinese-BIG5")) + +(set-language-info-alist + "Chinese-BIG5" '((setup-function . setup-chinese-big5-environment) + (describe-function . describe-chinese-big5-support) + (charset . (chinese-big5-1 chinese-big5-2)) + (coding-system . (cn-big5 iso-2022-cn)) + (sample-text . "Cantonese ($(0GnM$(B,$(0N]0*Hd(B) $(0*/=((B, $(0+$)p(B") + (documentation . nil))) + +;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; +;; Chinese CNS11643 (traditional) +;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; + +(register-input-method + "Chinese-CNS" '("quail-quick-cns" quail-use-package "quail/quick-cns")) +(register-input-method + "Chinese-CNS" '("quail-tsangchi-cns" quail-use-package "quail/tsangchi-cns")) + +(defun setup-chinese-cns-environment () + "Setup multilingual environment (MULE) for Chinese CNS11643 family users." + (interactive) + (setq primary-language "Chinese-CNS") + + (setq coding-category-iso-else 'iso-2022-cn) + (setq coding-category-big5 'cn-big5) + (setq coding-category-iso-8-2 'cn-gb-2312) + + (set-coding-priority + '(coding-category-iso-7 + coding-category-iso-else + coding-category-iso-8-2 + coding-category-big5)) + + (setq-default buffer-file-coding-system 'iso-2022-cn) + (set-terminal-coding-system 'iso-2022-cn) + (set-keyboard-coding-system 'iso-2022-cn) + + (setq default-input-method '("Chinese-CNS" . "quail-py-cns")) + ) + +(defun describe-chinese-cns-support () + "Describe how Emacs supports Chinese for CNS11643 family users." + (interactive) + (describe-language-support-internal "Chinese-CNS")) + +(set-language-info-alist + "Chinese-CNS" '((setup-function . setup-chinese-cns-environment) + (describe-function . describe-chinese-cns-support) + (charset . (chinese-cns11643-1 chinese-cns11643-2 + chinese-cns11643-3 chinese-cns11643-4 + chinese-cns11643-5 chinese-cns11643-6 + chinese-cns11643-7)) + (coding-system . (iso-2022-cn)) + (documentation . nil))) + + +;;; for XEmacs (will be obsoleted) + +(define-language-environment 'chinese + "Chinese (includes GB, Big5, and CNS)" + (lambda () + (require 'chinese) + (set-coding-category-system 'iso-8-2 'cn-gb-2312) + (set-coding-priority-list '(iso-8-2 big5 iso-8-designate)) + (set-pathname-coding-system 'cn-gb-2312) + (set-default-buffer-file-coding-system 'cn-gb-2312) ; GB encoding + (setq terminal-coding-system 'cn-gb-2312) + (setq keyboard-coding-system 'cn-gb-2312) + (add-hook 'comint-exec-hook + (lambda () + (let ((proc (get-buffer-process (current-buffer)))) + (set-process-input-coding-system proc 'cn-gb-2312) + (set-process-output-coding-system proc 'cn-gb-2312)))) + (set-buffer-file-coding-system-for-read 'automatic-conversion) + (set-default-buffer-file-coding-system 'cn-gb-2312) + (setq keyboard-coding-system 'cn-gb-2312) + (setq terminal-coding-system 'cn-gb-2312) + (when (eq 'x (device-type (selected-device))) + (x-use-halfwidth-roman-font 'chinese-gb2312 "gb1988")))) +;; (when (featurep 'egg) +;; (setq-default its:*current-map* (its:get-mode-map "PinYin"))) +;; (setq-default quail-current-package (assoc "py" quail-package-alist)))) +;; )) + +(set-coding-category-system 'big5 'big5) + +;;; chinese.el ends here