Mercurial > hg > xemacs-beta
annotate lisp/mule/mule-cmds.el @ 4468:a78d697ccd2c
Import and extend GNU's descr-text.el, supporting prefix argument for C-x =
2008-05-25 Aidan Kehoe <kehoea@parhasard.net>
* descr-text.el: New.
Taken from GNU's GPLV2 version of 2007-02-14, with modifications
for XEmacs support and extensions for Unihan.txt support and
db/dbm caches.
* simple.el (what-cursor-position):
Support an optional prefix argument, as does GNU, calling
#'describe-char to give more detail on the character at point,
notably from UnicodeData and (in our case, optionally) Unihan.txt.
* syntax.el (syntax-after):
Make this available for the sake of #'describe-char.
* mule/mule-cmds.el (iso-2022-control-alist):
Make this available, for the sake of #'encoded-string-description
and #'describe-char.
* mule/mule-cmds.el (encoded-string-description):
Make this available, for the sake of #'describe-char.
* unicode.el (unicode-error-default-translation-table):
Make this a char table of type generic, not of type char. Makes it
possible to have the relevant logic in #'describe-char reasonably
clear; also, and this is undocumented, makes it much easier to
implement #'frob-unicode-errors-region. I should document this,
and revise #'frob-unicode-errors-region.
author | Aidan Kehoe <kehoea@parhasard.net> |
---|---|
date | Sun, 25 May 2008 21:11:35 +0200 |
parents | 0194a744d2d3 |
children | b75b075a9041 |
rev | line source |
---|---|
502 | 1 ;;; mule-cmds.el --- Commands for multilingual environment -*- coding: iso-2022-7bit; -*- |
428 | 2 |
3 ;; Copyright (C) 1995,1999 Electrotechnical Laboratory, JAPAN. | |
4 ;; Licensed to the Free Software Foundation. | |
5 ;; Copyright (C) 1997 MORIOKA Tomohiko | |
1318 | 6 ;; Copyright (C) 2000, 2001, 2002, 2003 Ben Wing. |
428 | 7 |
8 ;; Keywords: mule, multilingual | |
9 | |
10 ;; This file is part of XEmacs. | |
11 | |
12 ;; XEmacs is free software; you can redistribute it and/or modify it | |
13 ;; under the terms of the GNU General Public License as published by | |
14 ;; the Free Software Foundation; either version 2, or (at your option) | |
15 ;; any later version. | |
16 | |
17 ;; XEmacs is distributed in the hope that it will be useful, but | |
18 ;; WITHOUT ANY WARRANTY; without even the implied warranty of | |
19 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
20 ;; General Public License for more details. | |
21 | |
22 ;; You should have received a copy of the GNU General Public License | |
23 ;; along with XEmacs; see the file COPYING. If not, write to the Free | |
24 ;; Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA | |
25 ;; 02111-1307, USA. | |
26 | |
444 | 27 ;; Note: Some of the code here is now in code-cmds.el |
28 | |
428 | 29 ;;; Code: |
30 | |
31 ;;; MULE related key bindings and menus. | |
32 | |
444 | 33 ;; Preserve the old name |
34 (defvaralias 'mule-keymap 'coding-keymap) | |
35 | |
428 | 36 (define-key mule-keymap "x" 'set-selection-coding-system) |
37 (define-key mule-keymap "X" 'set-next-selection-coding-system) | |
38 (define-key mule-keymap "\C-\\" 'set-input-method) | |
39 ;;(define-key mule-keymap "c" 'list-coding-system-briefly) ; XEmacs | |
40 (define-key mule-keymap "C" 'describe-coding-system) ; XEmacs | |
41 (define-key mule-keymap "r" 'toggle-display-direction) ; XEmacs | |
42 (define-key mule-keymap "l" 'set-language-environment) | |
43 | |
44 (define-key help-map "L" 'describe-language-environment) | |
45 (define-key help-map "\C-\\" 'describe-input-method) | |
46 (define-key help-map "I" 'describe-input-method) | |
47 (define-key help-map "h" 'view-hello-file) | |
48 | |
49 ;; Menus for XEmacs were moved to menubar-items.el. | |
50 | |
51 | |
52 ;; This should be a single character key binding because users use it | |
53 ;; very frequently while editing multilingual text. Now we can use | |
54 ;; only two such keys: "\C-\\" and "\C-^", but the latter is not | |
55 ;; convenient because it requires shifting on most keyboards. An | |
56 ;; alternative is "\C-\]" which is now bound to `abort-recursive-edit' | |
57 ;; but it won't be used that frequently. | |
58 (define-key global-map "\C-\\" 'toggle-input-method) | |
59 | |
771 | 60 ;; Original mapping will be altered by set-keyboard-coding-system. |
61 (define-key global-map [(meta \#)] 'ispell-word) ;originally "$" | |
62 ;; (define-key global-map [(meta {)] 'insert-parentheses) ;originally "(" | |
63 | |
428 | 64 ;;; This is no good because people often type Shift-SPC |
65 ;;; meaning to type SPC. -- rms. | |
66 ;;; ;; Here's an alternative key binding for X users (Shift-SPACE). | |
771 | 67 ;;; (define-key global-map '(shift space) 'toggle-input-method) |
428 | 68 |
(defun view-hello-file ()
  "Display the HELLO file, which lists many languages and characters.
The file is looked up in `data-directory' and visited read-only."
  (interactive)
  ;; Force the decoding so that the file reads correctly in any
  ;; language environment.
  (let ((hello-path (expand-file-name "HELLO" data-directory))
        (coding-system-for-read 'iso-2022-7bit))
    (find-file-read-only hello-path)))
75 | |
3999 | 76 (defvar system-type-file-name-coding |
77 '((darwin . utf-8)) | |
78 "A map from values of `system-type' to invariant file name coding systems. | |
79 Used if a given system type does not vary in the coding system it uses for | |
80 file names; otherwise, `language-info-alist' is consulted for this | |
81 information. This affects the `file-name' coding system alias, but not the | |
82 `file-name-coding-system' variable, which in practice is mostly ignored.") | |
83 | |
428 | 84 |
771 | 85 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; |
86 ;;; Language Support Functions ;;; | |
87 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; | |
428 | 88 (defvar language-info-alist nil |
89 "Alist of language environment definitions. | |
90 Each element looks like: | |
771 | 91 (LANGUAGE-NAME . ((PROP . VALUE) ...)) |
428 | 92 where LANGUAGE-NAME is a string, the name of the language environment, |
771 | 93 PROP is a symbol denoting a property, and VALUE is the data associated |
94 with PROP. | |
95 See `set-language-info' for documentation on PROP and VALUE.") | |
428 | 96 |
(defun get-language-info (lang-env prop)
  "Return information listed under PROP for language environment LANG-ENV.
LANG-ENV is a string or a symbol naming a language environment; it is
looked up in `language-info-alist' ignoring case.
PROP is a symbol denoting a property.
Return nil if LANG-ENV is not defined or has no entry for PROP.
For a list of useful values for PROP and their meanings,
see `set-language-info'."
  (let* ((name (if (symbolp lang-env) (symbol-name lang-env) lang-env))
         (entry (assoc-ignore-case name language-info-alist)))
    (and entry
         (cdr (assq prop (cdr entry))))))
428 | 107 |
(defun set-language-info (lang-env prop value)
  "Modify part of the definition of language environment LANG-ENV.
Specifically, this stores the information VALUE under PROP
in the definition of this language environment.
LANG-ENV is a string or a symbol naming the language environment.  An
existing definition is found ignoring case, exactly as
`get-language-info' does; if there is none, a new definition is added
to `language-info-alist'.
PROP is a symbol denoting a property, and VALUE is the value of that property.
Return VALUE.

Meaningful values for PROP include

  documentation         VALUE is documentation of what this language environment
                        is meant for, and how to use it.

  charset               VALUE is a list of the character sets used by this
                        language environment.

  sample-text           VALUE is one line of text,
                        written using those character sets,
                        appropriate for this language environment.

  setup-function        VALUE is a function to call to switch to this
                        language environment.

  exit-function         VALUE is a function to call to leave this
                        language environment.

  coding-system         VALUE is a list of coding systems that are good
                        for saving text written in this language environment.
                        This list serves as suggestions to the user;
                        in effect, as a kind of documentation.

  coding-priority       VALUE is a list of coding systems for this language
                        environment, in order of decreasing priority.
                        This is used to set up the coding system priority
                        list when you switch to this language environment.

  input-method          VALUE is a default input method for this language
                        environment.

  features              VALUE is a list of features requested in this
                        language environment.

  tutorial              VALUE is a tutorial file name written in the language.

  locale                VALUE is a list of locale expressions, which serve
                        two purposes: (1) Determining the language
                        environment from the current system locale at
                        startup, and (2) determining how to set the system
                        locale when the language environment is changed.
                        Each expression will be tried in turn, and should
                        be a string (for case (1), the string is matched
                        against the current locale using the regular
                        expression \"^STRING[^A-Za-z0-9]\"; for case (2),
                        the string is passed directly to
                        `set-current-locale' until a non-nil result is
                        returned), or a function of one argument.  For
                        case (1), this argument will be a locale, and the
                        function should return t or nil to indicate
                        whether this locale matches the language
                        environment; for case (2), the argument will be
                        nil, and the function should call
                        `set-current-locale' itself and return the set
                        locale string if the locale was successfully set,
                        and nil otherwise.

                        NOTE: This property is *NOT* used under MS Windows;
                        instead, the `mswindows-locale' property is used.

  cygwin-locale         VALUE specifies a general Unix-style C library
                        locale that will be used to initialize the LANG
                        environment variable under MS Windows native, when the
                        system cannot test out the locales specified in the
                        `locale' property.  This is so that Cygwin programs
                        can be run from an MS Windows native XEmacs.  If not
                        specified, the last entry in `locale' will be used.

  native-coding-system  VALUE is a single coding-system expression, or a
                        list of such expressions.  These expressions are
                        used to compute the operating system's native
                        coding system, i.e. the coding system to be used
                        as the alias for `native' and `file-name'.  This
                        specifies the coding system used for text
                        exchanged with the operating system, such as file
                        names, environment variables, subprocess
                        arguments, etc.  Each expression should be either
                        a symbol naming a coding system or a function
                        (anything that is `functionp') of one argument,
                        which is passed the current locale corresponding
                        to this language environment and should return a
                        coding system or nil.  Each expression is tried in
                        turn until a coding system is obtained.  If there
                        is no non-nil result, or no value is specified for
                        this property, the first coding system listed
                        under the `coding-system' property is used.

                        NOTE: This is *NOT* used under MS Windows.
                        Instead, `mswindows-multibyte-system-default'
                        is always used, since the system default code
                        page is what the Win32 API routines make use
                        of, and this cannot be changed.  (We get around
                        this by using the Unicode versions whenever
                        possible -- i.e. on Windows NT/2000, and on
                        Windows 9x with the few API's that support
                        Unicode.)

  mswindows-locale      VALUE is an element of the form MSWINDOWS-LOCALE, or
                        a list of such elements.  Each element is an MS
                        Windows locale, of the form that can be passed to
                        `mswindows-set-current-locale'.  This property is used
                        both to determine the current language environment at
                        startup (by matching MSWINDOWS-LOCALE against the
                        value returned by `mswindows-user-default-locale') and
                        to set the values of `set-current-locale' and
                        `mswindows-set-current-locale' when the current
                        language environment is changed.  (The correct CLIB
                        locale can always be generated by passing in the
                        SUBLANG, with dashes in place of underscores, or the
                        LANG if there's no SUBLANG.  The return value will be
                        the canonicalized locale, in proper CLIB form.)

                        If there is no value for this property, the MS Windows
                        locale is assumed to have the same name as the
                        language environment."
  (if (symbolp lang-env)
      (setq lang-env (symbol-name lang-env)))
  ;; Look the environment up ignoring case, as `get-language-info' does.
  ;; A case-sensitive lookup here would add a second slot for e.g.
  ;; "english" in front of "English", and that slot would then shadow
  ;; the original for every later case-insensitive lookup.
  (let ((lang-slot (assoc-ignore-case lang-env language-info-alist))
        prop-slot)
    (unless lang-slot                   ; If no slot for the language, add it.
      (setq lang-slot (list lang-env)
            language-info-alist (cons lang-slot language-info-alist)))
    ;; The properties live in the cdr of the slot; the car is the name.
    (setq prop-slot (assq prop (cdr lang-slot)))
    (unless prop-slot                   ; If no slot for the prop, add it.
      (setq prop-slot (list prop))
      (setcdr lang-slot (cons prop-slot (cdr lang-slot))))
    (setcdr prop-slot value)))
428 | 242 |
(defun set-language-info-alist (lang-env alist &optional parents)
  "Store ALIST as the definition of language environment LANG-ENV.
ALIST is an alist of properties and values.  See the documentation of
`set-language-info' for the allowed properties.
LANG-ENV may be a string or a symbol.  PARENTS is accepted but is not
used by this function.
Return the name of the language environment as a string."
  (let ((name (if (symbolp lang-env) (symbol-name lang-env) lang-env))
        (remaining alist)
        entry)
    ;; FSF has 30 lines of unbelievably ugly code to set up the menus
    ;; appropriately.  We just use a filter.
    (while remaining
      (setq entry (car remaining)
            remaining (cdr remaining))
      (set-language-info name (car entry) (cdr entry)))
    name))
428 | 255 |
(defun read-language-name (key prompt &optional default)
  "Read a language environment name which has information for KEY.
If KEY is nil, read any language environment.
Prompt with PROMPT.  DEFAULT is the default choice of language environment.
This returns a language environment name as a string, or nil if the
input is empty or the chosen environment has no information for KEY."
  (let* ((completion-ignore-case t)
         ;; Only offer environments that define KEY, when KEY is given.
         (predicate (and key
                         #'(lambda (elm) (assq key elm))))
         (name (completing-read prompt language-info-alist predicate
                                t nil nil default)))
    (and (> (length name) 0)
         (or (null key)
             (get-language-info name key))
         name)))
271 | |
272 ;;; Multilingual input methods. | |
273 | |
274 (defconst leim-list-file-name "leim-list.el" | |
275 "Name of LEIM list file. | |
276 This file contains a list of libraries of Emacs input methods (LEIM) | |
277 in the format of Lisp expression for registering each input method. | |
278 Emacs loads this file at startup time.") | |
279 | |
280 (defvar leim-list-header (format | |
281 ";;; %s -- list of LEIM (Library of Emacs Input Method) | |
282 ;; | |
283 ;; This file contains a list of LEIM (Library of Emacs Input Method) | |
284 ;; in the same directory as this file. Loading this file registers | |
285 ;; the whole input methods in Emacs. | |
286 ;; | |
287 ;; Each entry has the form: | |
288 ;; (register-input-method | |
289 ;; INPUT-METHOD LANGUAGE-NAME ACTIVATE-FUNC | |
290 ;; TITLE DESCRIPTION | |
291 ;; ARG ...) | |
292 ;; See the function `register-input-method' for the meanings of arguments. | |
293 ;; | |
294 ;; If this directory is included in load-path, Emacs automatically | |
295 ;; loads this file at startup time. | |
296 | |
297 " | |
298 leim-list-file-name) | |
299 "Header to be inserted in LEIM list file.") | |
300 | |
301 (defvar leim-list-entry-regexp "^(register-input-method" | |
302 "Regexp matching head of each entry in LEIM list file. | |
303 See also the variable `leim-list-header'.") | |
304 | |
305 (defvar update-leim-list-functions | |
306 '(quail-update-leim-list-file) | |
307 "List of functions to call to update LEIM list file. | |
308 Each function is called with the LEIM directory names given to | |
`update-leim-list-file' as its arguments.") | |
309 | |
(defun update-leim-list-file (&rest dirs)
  "Update LEIM list file in directories DIRS.
Call each function in `update-leim-list-functions' in order, passing
the elements of DIRS as its arguments."
  (let ((pending update-leim-list-functions))
    (while pending
      (apply (car pending) dirs)
      (setq pending (cdr pending)))))
316 | |
317 (defvar current-input-method nil | |
318 "The current input method for multilingual text. | |
319 If nil, that means no input method is activated now.") | |
320 (make-variable-buffer-local 'current-input-method) | |
321 (put 'current-input-method 'permanent-local t) | |
322 | |
323 (defvar current-input-method-title nil | |
324 "Title string of the current input method shown in mode line.") | |
325 (make-variable-buffer-local 'current-input-method-title) | |
326 (put 'current-input-method-title 'permanent-local t) | |
327 | |
328 (defcustom default-input-method nil | |
329 "*Default input method for multilingual text (a string). | |
330 This is the input method activated automatically by the command | |
331 `toggle-input-method' (\\[toggle-input-method])." | |
332 :group 'mule | |
333 :type '(choice (const nil) string)) | |
334 | |
335 (put 'input-method-function 'permanent-local t) | |
336 | |
337 (defvar input-method-history nil | |
338 "History list for some commands that read input methods.") | |
339 (make-variable-buffer-local 'input-method-history) | |
340 (put 'input-method-history 'permanent-local t) | |
341 | |
342 (defvar inactivate-current-input-method-function nil | |
343 "Function to call for inactivating the current input method. | |
344 Every input method should set this to an appropriate value when activated. | |
345 This function is called with no argument. | |
346 | |
347 This function should never change the value of `current-input-method'. | |
348 That variable is set to nil by the function `inactivate-input-method'.") | |
349 (make-variable-buffer-local 'inactivate-current-input-method-function) | |
350 (put 'inactivate-current-input-method-function 'permanent-local t) | |
351 | |
352 (defvar describe-current-input-method-function nil | |
353 "Function to call for describing the current input method. | |
354 This function is called with no argument.") | |
355 (make-variable-buffer-local 'describe-current-input-method-function) | |
356 (put 'describe-current-input-method-function 'permanent-local t) | |
357 | |
358 (defvar input-method-alist nil | |
2970 | 359 "Alist mapping input method names to information used by the LEIM API. |
360 Elements have the form (METHOD LANGUAGE ACTIVATOR TITLE DESCRIPTION ARGS...). | |
361 Use `register-input-method' to add input methods to the database. See its | |
362 documentation for the meanings of the elements.") | |
428 | 363 |
(defun register-input-method (method language
                              ;; #### shouldn't be optional, but need to
                              ;; audit callers
                              &optional activator title description
                              &rest args)
  "Register METHOD as an input method for language environment LANGUAGE.

METHOD and LANGUAGE may be symbols or strings; symbols are converted to
their names.
ACTIVATOR is the function called to activate this method.  METHOD (the
invocation name) and ARGS are passed to the function on activation.
TITLE is a string to show in the mode line when this method is active.
DESCRIPTION is a string describing this method and what it is good for.
Optional ARGS, if any, are stored and passed as arguments to ACTIVATOR.

When registering a new Quail input method, the input method title should be
the one given in the third parameter of `quail-define-package' (if the values
are different, the string specified in this function takes precedence).

The information provided is registered in `input-method-alist'; an entry
already present for METHOD is overwritten in place.  The commands
`describe-input-method' and `list-input-methods' use this database to show
information about input methods without loading them."
  (let* ((lang-name (if (symbolp language) (symbol-name language) language))
         (method-name (if (symbolp method) (symbol-name method) method))
         (info (cons lang-name
                     (cons activator
                           (cons title
                                 (cons description args)))))
         (existing (assoc method-name input-method-alist)))
    (if existing
        ;; Re-registration: replace the data of the existing entry.
        (setcdr existing info)
      (setq input-method-alist
            (cons (cons method-name info) input-method-alist)))))
395 | |
(defun read-input-method-name (prompt &optional default inhibit-null)
  "Read a name of input method from a minibuffer prompting with PROMPT.
If DEFAULT is non-nil, use that as the default,
and substitute it into PROMPT at the first `%s'.
If INHIBIT-NULL is non-nil, null input signals an error;
otherwise null input returns nil.

The return value is a string."
  (let* ((completion-ignore-case t)
         (full-prompt (if default (format prompt default) prompt))
         ;; Completion is over the registered methods, a match is
         ;; required, and `input-method-history' is used as the
         ;; minibuffer history.
         (choice (completing-read full-prompt input-method-alist
                                  nil t nil 'input-method-history
                                  default)))
    (and choice
         (symbolp choice)
         (setq choice (symbol-name choice)))
    (cond ((> (length choice) 0)
           choice)
          (inhibit-null
           (error "No valid input method is specified")))))
417 | |
(defun activate-input-method (input-method)
  "Switch to input method INPUT-METHOD for the current buffer.
If some other input method is already active, turn it off first.
If INPUT-METHOD is nil, deactivate any current input method.
INPUT-METHOD may be a string or a symbol.  Signal an error if it is not
registered in `input-method-alist' or its activator is unusable."
  (and input-method
       (symbolp input-method)
       (setq input-method (symbol-name input-method)))
  ;; Leave the currently active method if it differs from the request.
  (and current-input-method
       (not (string= current-input-method input-method))
       (inactivate-input-method))
  (when (and (null current-input-method) input-method)
    (let* ((entry (assoc input-method input-method-alist))
           (activator (nth 2 entry))
           (extra-args (nthcdr 5 entry)))
      (cond ((null entry)
             (error "Can't activate input method `%s'" input-method))
            ((functionp activator)
             (apply activator input-method extra-args))
            ;; An activator of the form (FUNCTION . FEATURE): load
            ;; FEATURE, then call FUNCTION.
            ((and (consp activator)
                  (symbolp (car activator))
                  (symbolp (cdr activator)))
             (require (cdr activator))
             (apply (car activator) input-method extra-args))
            (t
             (error "Can't activate input method `%s'" input-method)))
      (setq current-input-method input-method
            current-input-method-title (nth 3 entry))
      ;; Refresh the mode line even if a hook function signals.
      (unwind-protect
          (run-hooks 'input-method-activate-hook)
        (force-mode-line-update)))))
444 | |
(defun inactivate-input-method ()
  "Turn off the current input method.
The method being turned off is moved to the front of
`input-method-history'.  `current-input-method' and
`current-input-method-title' are reset to nil even if the inactivation
function or a function on `input-method-inactivate-hook' signals an error."
  (when current-input-method
    (cond ((null input-method-history)
           (setq input-method-history (list current-input-method)))
          ((not (string= current-input-method (car input-method-history)))
           (setq input-method-history
                 (cons current-input-method
                       (delete current-input-method input-method-history)))))
    (unwind-protect
        (funcall inactivate-current-input-method-function)
      (unwind-protect
          ;; The hook runs while `current-input-method' still names the
          ;; method being turned off.
          (run-hooks 'input-method-inactivate-hook)
        (setq current-input-method nil
              current-input-method-title nil)
        (force-mode-line-update)))))
461 | |
(defun set-input-method (input-method)
  "Select and activate input method INPUT-METHOD for the current buffer.
This also sets the default input method to the one you specify.
Interactively, read the name from the minibuffer, offering the most
recently used input method, or else `default-input-method', as default."
  (interactive
   (let ((fallback (or (car input-method-history) default-input-method)))
     (list (read-input-method-name
            (if fallback
                "Select input method (default %s): "
              "Select input method: ")
            fallback
            t))))
  (activate-input-method input-method)
  (setq default-input-method input-method))
472 | |
(defun toggle-input-method (&optional arg)
  "Turn on or off a multilingual text input method for the current buffer.

With no prefix argument, if an input method is currently activated,
turn it off.  Otherwise, activate an input method -- the one most
recently used, or the one specified in `default-input-method', or
the one read from the minibuffer.

With a prefix argument, read an input method from the minibuffer and
turn it on.

The default is to use the most recent input method specified
\(not including the currently active input method, if any)."
  (interactive "P")
  (cond
   ((and current-input-method (not arg))
    (inactivate-input-method))
   (t
    (let ((candidate (or (car input-method-history) default-input-method)))
      ;; With a prefix argument, do not offer the method that is already
      ;; active; fall back to the second most recent one.
      (when (and arg
                 candidate
                 (equal current-input-method candidate)
                 (> (length input-method-history) 1))
        (setq candidate (nth 1 input-method-history)))
      (activate-input-method
       (if (and candidate (not arg))
           candidate
         (read-input-method-name
          (if candidate "Input method (default %s): " "Input method: ")
          candidate t)))
      ;; Remember the first method ever activated as the default.
      (or default-input-method
          (setq default-input-method current-input-method))))))
502 | |
(defun describe-input-method (input-method)
  "Describe input method INPUT-METHOD.
INPUT-METHOD may be a string or a symbol.  If it is nil, describe the
input method currently in use instead.  Otherwise show the title,
language and description registered in `input-method-alist' in the
\"*Help*\" buffer."
  (interactive
   (list (read-input-method-name
          "Describe input method (default, current choice): ")))
  (and input-method
       (symbolp input-method)
       (setq input-method (symbol-name input-method)))
  (if input-method
      (with-output-to-temp-buffer "*Help*"
        (let ((entry (assoc input-method input-method-alist)))
          (princ (format "Input method: %s (`%s' in mode line) for %s\n %s\n"
                         input-method
                         (nth 3 entry) (nth 1 entry) (nth 4 entry)))))
    (describe-current-input-method)))
516 | |
(defun describe-current-input-method ()
  "Describe the input method currently in use.
Call `describe-current-input-method-function' if it is a symbol with a
function definition; otherwise report that no description is available.
Signal an error if no input method is active."
  (cond
   ((null current-input-method)
    (error "No input method is activated now"))
   ((and (symbolp describe-current-input-method-function)
         (fboundp describe-current-input-method-function))
    (funcall describe-current-input-method-function))
   (t
    (message "No way to describe the current input method `%s'"
             current-input-method)
    (ding))))
527 | |
(defun read-multilingual-string (prompt &optional initial-input input-method)
  "Read a multilingual string from minibuffer, prompting with string PROMPT.
The input method selected last time is activated in minibuffer.
If optional second arg INITIAL-INPUT is non-nil, insert it in the minibuffer
initially.
Optional 3rd argument INPUT-METHOD specifies the input method
to be activated instead of the one selected last time.  It is a symbol
or a string.
The input method that was active before the call is restored afterwards,
even if reading is aborted."
  (unless input-method
    (setq input-method
          (or current-input-method
              default-input-method
              (read-input-method-name "Input method: " nil t))))
  (and input-method
       (symbolp input-method)
       (setq input-method (symbol-name input-method)))
  (let ((saved-method current-input-method))
    (unwind-protect
        (progn
          (activate-input-method input-method)
          ;; FSF Emacs
          ;; (read-string prompt initial-input nil nil t)
          (read-string prompt initial-input nil))
      (activate-input-method saved-method))))
551 | |
552 ;; Variables to control behavior of input methods. All input methods | |
553 ;; should react to these variables. | |
554 | |
555 (defcustom input-method-verbose-flag 'default | |
556 "*A flag to control extra guidance given by input methods. | |
557 The value should be nil, t, `complex-only', or `default'. | |
558 | |
559 The extra guidance is done by showing list of available keys in echo | |
560 area. When you use the input method in the minibuffer, the guidance | |
561 is shown at the bottom short window (split from the existing window). | |
562 | |
563 If the value is t, extra guidance is always given, if the value is | |
564 nil, extra guidance is always suppressed. | |
565 | |
566 If the value is `complex-only', only complex input methods such as | |
567 `chinese-py' and `japanese' give extra guidance. | |
568 | |
569 If the value is `default', complex input methods always give extra | |
570 guidance, but simple input methods give it only when you are not in | |
571 the minibuffer. | |
572 | |
573 See also the variable `input-method-highlight-flag'." | |
574 :type '(choice (const t) (const nil) (const complex-only) (const default)) | |
575 :group 'mule) | |
576 | |
577 (defcustom input-method-highlight-flag t | |
578 "*If this flag is non-nil, input methods highlight partially-entered text. | |
579 For instance, while you are in the middle of a Quail input method sequence, | |
580 the text inserted so far is temporarily underlined. | |
581 The underlining goes away when you finish or abort the input method sequence. | |
582 See also the variable `input-method-verbose-flag'." | |
583 :type 'boolean | |
584 :group 'mule) | |
585 | |
586 (defvar input-method-activate-hook nil | |
587 "Normal hook run just after an input method is activated. | |
588 | |
589 The variable `current-input-method' keeps the input method name | |
590 just activated.") | |
591 | |
592 (defvar input-method-inactivate-hook nil | |
593 "Normal hook run just after an input method is inactivated. | |
594 | |
595 The variable `current-input-method' still keeps the input method name | |
596 just inactivated.") | |
597 | |
598 (defvar input-method-after-insert-chunk-hook nil | |
599 "Normal hook run just after an input method inserts some chunk of text.") | |
600 | |
601 (defvar input-method-exit-on-first-char nil | |
602 "This flag controls the timing of when an input method returns. | |
603 Usually, the input method does not return while there's a possibility | |
604 that it may find a different translation if a user types another key. | |
605 But, if this flag is non-nil, the input method returns as soon as | |
606 the current key sequence gets long enough to have some valid translation.") | |
607 | |
608 (defvar input-method-use-echo-area nil | |
609 "This flag controls how an input method shows an intermediate key sequence. | |
610 Usually, the input method inserts the intermediate key sequence, | |
611 or candidate translations corresponding to the sequence, | |
612 at point in the current buffer. | |
613 But, if this flag is non-nil, it displays them in echo area instead.") | |
614 | |
615 (defvar input-method-exit-on-invalid-key nil | |
442 | 616 "This flag controls the behavior of an input method on invalid key input. |
428 | 617 Usually, when a user types a key which doesn't start any character |
618 handled by the input method, the key is handled by turning off the | |
619 input method temporarily. After that key, the input method is re-enabled. | |
620 But, if this flag is non-nil, the input method is never back on.") | |
621 | |
622 | |
623 (defvar set-language-environment-hook nil | |
624 "Normal hook run after some language environment is set. | |
625 | |
626 When you set some hook function here, that effect usually should not | |
627 be inherited to another language environment. So, you had better set | |
628 another function in `exit-language-environment-hook' (which see) to | |
629 cancel the effect.") | |
630 | |
631 (defvar exit-language-environment-hook nil | |
632 "Normal hook run after exiting from some language environment. | |
633 When this hook is run, the variable `current-language-environment' | |
634 is still bound to the language environment being exited. | |
635 | |
636 This hook is mainly used for canceling the effect of | |
637 `set-language-environment-hook' (which see).") | |
638 | |
771 | 639 ;; bogus FSF function setup-specified-language-support. |
428 | 640 |
(defcustom current-language-environment "English"
  "The last language environment specified with `set-language-environment'.
This variable should be set only with \\[customize], which is equivalent
to using the function `set-language-environment'."
  :link '(custom-manual "(emacs)Language Environments")
  ;; Setting the option through Custom switches the language environment.
  :set (lambda (symbol value) (set-language-environment value))
  ;; Report the name as it is spelled in `language-info-alist' (the lookup
  ;; ignores case), falling back to "English" for an unknown environment.
  :get (lambda (x)
	 (or (car-safe (assoc-ignore-case
			(if (symbolp current-language-environment)
			    (symbol-name current-language-environment)
			  current-language-environment)
			language-info-alist))
	     "English"))
  ;; This form used to carry two `:type' entries: a `choice' built from
  ;; `language-info-alist' at load time, followed by `string'.  Keyword
  ;; arguments are processed in order, so the later `string' was the one
  ;; in effect and the `choice' list was dead code.  Only the effective
  ;; type is kept.
  :type 'string
  ;; Do not run the :set function (and thus `set-language-environment')
  ;; merely because this file is being loaded.
  :initialize 'custom-initialize-default
  :group 'mule)
660 | |
(defun set-language-environment (language-name)
  "Set up multi-lingual environment for using LANGUAGE-NAME.
This sets the coding system autodetection priority, the default buffer
coding system, the default input method, the system locale, and other
relevant language properties.  LANGUAGE-NAME should be a string, the
name of a language environment.  For example, \"Latin-1\" specifies
the language environment for the major languages of Western Europe.

A nil LANGUAGE-NAME means \"English\"; a symbol is converted to its name."
  (interactive (list (read-language-name
		      nil
		      "Set language environment (default, English): ")))
  ;; Normalize the argument to a string.
  (cond ((null language-name)
	 (setq language-name "English"))
	((symbolp language-name)
	 (setq language-name (symbol-name language-name))))
  (unless (assoc-ignore-case language-name language-info-alist)
    (error 'invalid-argument "Language environment not defined"
	   language-name))
  ;; Leave the environment that is current right now: first the generic
  ;; hook, then the environment's own exit function, if it has one.
  (when current-language-environment
    (let ((exit-fn (get-language-info current-language-environment
				      'exit-function)))
      (run-hooks 'exit-language-environment-hook)
      (when (functionp exit-fn)
	(funcall exit-fn))))
  (setq current-language-environment language-name)
  ;; The EOL type is read before the coding categories are reset and is
  ;; handed on to `set-language-environment-coding-systems'.  The binding
  ;; keeps its original name because bindings here are dynamic.
  (let ((default-eol-type (coding-system-eol-type
			   default-buffer-file-coding-system)))
    (reset-coding-categories-to-default)
    (set-locale-for-language-environment language-name)
    (set-language-environment-coding-systems language-name default-eol-type))

  (finish-set-language-environment language-name))
428 | 691 |
(defun finish-set-language-environment (language-name)
  ;; Internal function.  Only what's here is called at startup, once the
  ;; first language environment is determined.  The rest of what
  ;; `set-language-environment' does was already taken care of very early
  ;; in the startup sequence, in a special fashion.

  ;; Make the environment's input method the default one and move it to
  ;; the front of the history, but only if a history already exists.
  (let ((method (get-language-info language-name 'input-method)))
    (when method
      (setq default-input-method method)
      (when input-method-history
	(setq input-method-history
	      (cons method
		    (delete method input-method-history))))))
  ;; (let ((nonascii (get-language-info language-name 'nonascii-translation))
  ;;       (dos-table
  ;;        (if (eq window-system 'pc)
  ;;            (intern
  ;;             (concat "cp" dos-codepage "-nonascii-translation-table")))))
  ;;   (cond
  ;;    ((char-table-p nonascii)
  ;;     (setq nonascii-translation-table nonascii))
  ;;    ((and (eq window-system 'pc) (boundp dos-table))
  ;;     ;; DOS terminals' default is to use a special non-ASCII translation
  ;;     ;; table as appropriate for the installed codepage.
  ;;     (setq nonascii-translation-table (symbol-value dos-table)))
  ;;    ((charsetp nonascii)
  ;;     (setq nonascii-insert-offset (- (make-char nonascii) 128)))))

  ;; (setq charset-origin-alist
  ;;       (get-language-info language-name 'charset-origin-alist))

  ;; Unibyte setups if necessary.
  ;; (unless default-enable-multibyte-characters
  ;;   ;; Syntax and case table.
  ;;   (let ((syntax (get-language-info language-name 'unibyte-syntax)))
  ;;     (if syntax
  ;;         (let ((set-case-syntax-set-multibyte nil))
  ;;           (load syntax nil t))
  ;;       ;; No information for syntax and case.  Reset to the defaults.
  ;;       (let ((syntax-table (standard-syntax-table))
  ;;             (case-table (standard-case-table))
  ;;             (ch (if (eq window-system 'pc) 128 160)))
  ;;         (while (< ch 256)
  ;;           (modify-syntax-entry ch " " syntax-table)
  ;;           (aset case-table ch ch)
  ;;           (setq ch (1+ ch)))
  ;;         (set-char-table-extra-slot case-table 0 nil)
  ;;         (set-char-table-extra-slot case-table 1 nil)
  ;;         (set-char-table-extra-slot case-table 2 nil))
  ;;       (set-standard-case-table (standard-case-table))
  ;;       (let ((list (buffer-list)))
  ;;         (while list
  ;;           (with-current-buffer (car list)
  ;;             (set-case-table (standard-case-table)))
  ;;           (setq list (cdr list))))))
  ;;   ;; Display table and coding system for terminal.
  ;;   (let ((coding (get-language-info language-name 'unibyte-display)))
  ;;     (if coding
  ;;         (standard-display-european-internal)
  ;;       (standard-display-default (if (eq window-system 'pc) 128 160) 255)
  ;;       (aset standard-display-table 146 nil))
  ;;     (or (eq window-system 'pc)
  ;;         (set-terminal-coding-system coding))))

  ;; Load every feature the language environment declares it needs.
  (dolist (feature (get-language-info language-name 'features))
    (require feature))
  ;; Run the environment's own setup function, if it has one.
  (let ((setup-fn (get-language-info language-name 'setup-function)))
    (when (functionp setup-fn)
      (funcall setup-fn)))

  ;; Fit the charsets preferences in unicode conversions for the
  ;; language environment.
  (set-language-unicode-precedence-list
   (get-language-info language-name 'charset))

  (run-hooks 'set-language-environment-hook)
  (force-mode-line-update t))
770 | |
771 ;; (defun standard-display-european-internal () | |
772 ;; ;; Actually set up direct output of non-ASCII characters. | |
773 ;; (standard-display-8bit (if (eq window-system 'pc) 128 160) 255) | |
774 ;; ;; Unibyte Emacs on MS-DOS wants to display all 8-bit characters with | |
775 ;; ;; the native font, and codes 160 and 146 stand for something very | |
776 ;; ;; different there. | |
777 ;; (or (and (eq window-system 'pc) (not default-enable-multibyte-characters)) | |
778 ;; (progn | |
779 ;; ;; Make non-line-break space display as a plain space. | |
780 ;; ;; Most X fonts do the wrong thing for code 160. | |
781 ;; (aset standard-display-table 160 [32]) | |
782 ;; ;; Most Windows programs send out apostrophe's as \222. Most X fonts | |
783 ;; ;; don't contain a character at that position. Map it to the ASCII | |
784 ;; ;; apostrophe. | |
785 ;; (aset standard-display-table 146 [39])))) | |
786 | |
771 | 787 ;; bogus FSF function describe-specified-language-support. |
428 | 788 |
(defun describe-language-environment (language-name)
  "Describe how Emacs supports language environment LANGUAGE-NAME.
A nil LANGUAGE-NAME means the current language environment.  The
description is shown in the \"*Help*\" buffer and lists the environment's
documentation, sample text, input methods, character sets and coding
systems.  Signals an error if the environment has no documentation."
  (interactive
   (list (read-language-name
	  'documentation
	  "Describe language environment (default, current choice): ")))
  (unless language-name
    (setq language-name current-language-environment))
  (when (or (null language-name)
	    (null (get-language-info language-name 'documentation)))
    (error "No documentation for the specified language"))
  (when (symbolp language-name)
    (setq language-name (symbol-name language-name)))
  (let ((doc (get-language-info language-name 'documentation)))
    ;; `princ-list' prints each of its arguments, followed by a newline.
    (flet ((princ-list (&rest args)
	     (dolist (arg args)
	       (princ arg))
	     (princ "\n")))
      (with-output-to-temp-buffer "*Help*"
	(princ-list language-name " language environment" "\n")
	(when (stringp doc)
	  (princ-list doc)
	  (terpri))
	(let ((sample (get-language-info language-name 'sample-text)))
	  (when (stringp sample)
	    (princ "Sample text:\n")
	    (princ-list " " sample)
	    (terpri)))
	;; Input methods: the environment's default method is moved to the
	;; front of the list so that it is printed first.
	(let ((default-method (get-language-info language-name 'input-method))
	      (methods (copy-sequence input-method-alist)))
	  (princ "Input methods")
	  (when default-method
	    (princ (format " (default, %s)" default-method))
	    (setq default-method (assoc default-method input-method-alist))
	    (setq methods (cons default-method
				(delete default-method methods))))
	  (princ ":\n")
	  (dolist (method methods)
	    (when (string= language-name (nth 1 method))
	      (princ-list " " (car method)
			  (format " (`%s' in mode line)" (nth 3 method))))))
	(terpri)
	(princ "Character sets:\n")
	(let ((charsets (get-language-info language-name 'charset)))
	  (if (null charsets)
	      (princ-list " nothing specific to " language-name)
	    (dolist (charset charsets)
	      (princ-list " " charset ": "
			  (charset-description charset)))))
	(terpri)
	(princ "Coding systems:\n")
	(let ((coding-systems (get-language-info language-name
						 'coding-system)))
	  (if (null coding-systems)
	      (princ-list " nothing specific to " language-name)
	    (dolist (coding coding-systems)
	      ;; FSF format: " %s (`%c' in mode line):\n\t%s\n"
	      ;; In XEmacs, `coding-system-mnemonic' returns string.
	      (princ
	       (format " %s (`%s' in English, `%s' in mode line):\n\t%s\n"
		       coding
		       (coding-system-description coding)
		       (coding-system-mnemonic coding)
		       (or (coding-system-documentation coding)
			   "Not documented.")))
	      ;; (let ((aliases (coding-system-get coding 'alias-coding-systems)))
	      ;;   (when aliases
	      ;;     (princ "\t")
	      ;;     (princ (cons 'alias: (cdr aliases)))
	      ;;     (terpri)))
	      )))))))
428 | 860 |
861 ;;; Charset property | |
862 | |
863 ;; (defsubst get-charset-property (charset propname) | |
864 ;; "Return the value of CHARSET's PROPNAME property. | |
865 ;; This is the last value stored with | |
866 ;; `(put-charset-property CHARSET PROPNAME VALUE)'." | |
867 ;; (plist-get (charset-plist charset) propname)) | |
868 | |
869 ;; (defsubst put-charset-property (charset propname value) | |
870 ;; "Store CHARSETS's PROPNAME property with value VALUE. | |
871 ;; It can be retrieved with `(get-charset-property CHARSET PROPNAME)'." | |
872 ;; (set-charset-plist charset | |
873 ;; (plist-put (charset-plist charset) propname value))) | |
874 | |
(defvar char-code-property-table
  (make-char-table 'generic)
  "Char-table holding a property list for each character code.

See also the documentation of `get-char-code-property' and
`put-char-code-property'.")
881 ;; (let ((plist (aref char-code-property-table char))) | |
(defun get-char-code-property (char propname)
  "Return the value of CHAR's PROPNAME property in `char-code-property-table'.
Return nil if CHAR has no PROPNAME property, or if the table entry for
CHAR is not a list."
  (let ((plist (get-char-table char char-code-property-table)))
    ;; Only a list can be a property list; anything else yields nil.
    (if (listp plist)
	;; `plist-get' looks at property positions only.  Searching with
	;; `memq' could also hit a VALUE that happens to be `eq' to
	;; PROPNAME and then return the element after it.
	(plist-get plist propname))))
887 | |
(defun put-char-code-property (char propname value)
  "Store CHAR's PROPNAME property with VALUE in `char-code-property-table'.
It can be retrieved with `(get-char-code-property CHAR PROPNAME)'."
  ;; `plist-put' updates the slot for PROPNAME in place, or appends a new
  ;; PROPNAME/VALUE pair, and returns the resulting list (a fresh one when
  ;; CHAR had no properties yet).  It compares property positions only; a
  ;; `memq' search could match a VALUE that is `eq' to PROPNAME and then
  ;; overwrite the wrong element.
  (put-char-table char
		  (plist-put (get-char-table char char-code-property-table)
			     propname value)
		  char-code-property-table))
899 | |
900 | |
901 ;; Pretty description of encoded string | |
902 | |
903 ;; Alist of ISO 2022 control code vs the corresponding mnemonic string. | |
4468
a78d697ccd2c
Import and extend GNU's descr-text.el, supporting prefix argument for C-x =
Aidan Kehoe <kehoea@parhasard.net>
parents:
4292
diff
changeset
|
(defvar iso-2022-control-alist
  '((?\x1b . "ESC")
    (?\x0e . "SO")
    (?\x0f . "SI")
    (?\x8e . "SS2")
    (?\x8f . "SS3")
    (?\x9b . "CSI"))
  "Alist of ISO 2022 control codes vs. the corresponding mnemonic strings.
Each element has the form (CODE . MNEMONIC).")
428 | 911 |
4468
a78d697ccd2c
Import and extend GNU's descr-text.el, supporting prefix argument for C-x =
Aidan Kehoe <kehoea@parhasard.net>
parents:
4292
diff
changeset
|
(defun encoded-string-description (str coding-system)
  "Return a pretty description of STR that is encoded by CODING-SYSTEM.
The result is a string with one item per element of STR, separated by
spaces.  Each item has the form \"#xNN\"; if CODING-SYSTEM is of type
`iso2022', elements listed in `iso-2022-control-alist' are shown by their
mnemonic instead."
  ;; (setq str (string-as-unibyte str))
  (let ((iso2022-p (and coding-system
			(eq (coding-system-type coding-system) 'iso2022))))
    (mapconcat
     (function
      (lambda (x)
	(or
	 ;; Try to get a pretty description for ISO 2022 escape sequences.
	 (and iso2022-p (cdr (assq x iso-2022-control-alist)))
	 (format "#x%02X" x))))
     str " ")))
428 | 922 |
923 ;; (defun encode-coding-char (char coding-system) | |
924 ;; "Encode CHAR by CODING-SYSTEM and return the resulting string. | |
925 ;; If CODING-SYSTEM can't safely encode CHAR, return nil." | |
926 ;; (if (cmpcharp char) | |
927 ;; (setq char (car (decompose-composite-char char 'list)))) | |
928 ;; (let ((str1 (char-to-string char)) | |
929 ;; (str2 (make-string 2 char)) | |
930 ;; (safe-charsets (and coding-system | |
931 ;; (coding-system-get coding-system 'safe-charsets))) | |
932 ;; enc1 enc2 i1 i2) | |
933 ;; (when (or (eq safe-charsets t) | |
934 ;; (memq (char-charset char) safe-charsets)) | |
935 ;; ;; We must find the encoded string of CHAR. But, just encoding | |
936 ;; ;; CHAR will put extra control sequences (usually to designate | |
440 | 937 ;; ;; ASCII charset) at the tail if type of CODING is ISO 2022. |
428 | 938 ;; ;; To exclude such tailing bytes, we at first encode one-char |
939 ;; ;; string and two-char string, then check how many bytes at the | |
940 ;; ;; tail of both encoded strings are the same. | |
941 ;; | |
942 ;; (setq enc1 (string-as-unibyte (encode-coding-string str1 coding-system)) | |
943 ;; i1 (length enc1) | |
944 ;; enc2 (string-as-unibyte (encode-coding-string str2 coding-system)) | |
945 ;; i2 (length enc2)) | |
946 ;; (while (and (> i1 0) (= (aref enc1 (1- i1)) (aref enc2 (1- i2)))) | |
947 ;; (setq i1 (1- i1) i2 (1- i2))) | |
948 ;; | |
949 ;; ;; Now (substring enc1 i1) and (substring enc2 i2) are the same, | |
950 ;; ;; and they are the extra control sequences at the tail to | |
951 ;; ;; exclude. | |
952 ;; (substring enc2 0 i2)))) | |
953 | |
771 | 954 |
955 ;; #### The following section is utter junk from mule-misc.el. | |
956 ;; I've deleted everything that's not referenced in mule-packages and | |
957 ;; not in FSF 20.6; there's no point in keeping old namespace-polluting | |
958 ;; Mule 2.3 crap around. --ben | |
959 | |
(defvar self-insert-after-hook nil
  "Hook to run when an extended self insertion command exits.
It should take two arguments, START and END, corresponding to character
positions.")

;; Every buffer gets its own value of the hook.
(make-variable-buffer-local 'self-insert-after-hook)
965 | |
(defun delete-text-in-column (from to)
  "Delete the text between columns FROM and TO (exclusive) of the current line.
A nil FROM or TO means the current column.

If a character straddles either border, that character is first replaced
with the same width of spaces, and the deletion is done afterwards."
  (save-excursion
    (let (start end reached)
      (when from
	(setq reached (move-to-column from))
	(when (> reached from)
	  ;; Point went past FROM, so the character just before point
	  ;; straddles the border: swap it for spaces of the same width and
	  ;; step back to column FROM.
	  (delete-char -1)
	  (insert-char ?\  (- reached (current-column)))
	  (forward-char (- from reached))))
      (setq start (point))
      (when to
	(setq reached (move-to-column to))
	(when (> reached to)
	  ;; Same treatment for a character straddling column TO.
	  (delete-char -1)
	  (insert-char ?\  (- reached (current-column)))
	  (forward-char (- to reached))))
      (setq end (point))
      (delete-region start end))))
993 | |
(defun cancel-undo-boundary ()
  "Cancel undo boundary.
If the first element of `buffer-undo-list' is nil, remove it from the
list; otherwise do nothing."
  (when (and (consp buffer-undo-list)
	     (null (car buffer-undo-list)))
    (setq buffer-undo-list (cdr buffer-undo-list))))
999 | |
(defun define-egg-environment (env-sym doc-string enable-function)
  "Define a new language environment for egg, named by ENV-SYM.
DOC-STRING should be a string describing the environment.
ENABLE-FUNCTION should be a function of no arguments that will be called
when the language environment is made current.

Both values are recorded as properties of the symbol ENV-SYM:
DOC-STRING as `egg-environ-doc-string' and ENABLE-FUNCTION as
`set-egg-environ'."
  (put env-sym 'egg-environ-doc-string doc-string)
  (put env-sym 'set-egg-environ enable-function))
1007 | |
1008 | |
1009 ;; Init code. | |
1010 | |
1011 ;; auto-language-alist deleted. We have a more sophisticated system, | |
1012 ;; with the locales stored in the language data. | |
1013 | |
4145 | 1014 ;; Initialised in mule/general-late.el, which is compiled after all the |
1015 ;; language support--and, thus, minority Chinese coding systems and so | |
1016 ;; on--has been loaded. | |
(defvar posix-charset-to-coding-system-hash nil
  "A map from POSIX locale charset names to the actual coding system names.
The keys are the POSIX locale charset versions of the defined coding
systems' names with all non-alphanumeric characters removed, which is
how `get-language-environment-from-locale' forms its lookup key.  Used at
startup when working out which coding system should be the default for
the locale.")
1022 | |
(defun parse-posix-locale-string (locale-string)
  "Return values \(LANGUAGE REGION CHARSET MODIFIERS\) given LOCALE-STRING.

LOCALE-STRING should be a POSIX locale.  If it cannot be parsed as such, this
function returns nil.

LOCALE-STRING is downcased before parsing.  Three forms are recognized:
a two-character language optionally followed by \"_REGION\", \".CHARSET\"
and \"@MODIFIERS\"; the bare name of a language environment; and a
language environment name followed by \".CHARSET\".  When no charset is
given, the modifier \"euro\" implies charset \"iso-8859-15\" and the
modifier \"cyrillic\" implies \"windows-1251\"."
  (let (language region charset modifiers locinfo)
    (setq locale-string (downcase locale-string))
    (cond ((string-match
	    #r"^\([a-z0-9]\{2,2\}\)\(_[a-z0-9]\{2,2\}\)?\(\.[^@]*\)?\(@.*\)?$"
	    locale-string)
	   ;; All four groups are read before `replace-in-string' is called,
	   ;; so the match data is still that of the regexp above.
	   (setq language (match-string 1 locale-string)
		 region (match-string 2 locale-string)
		 charset (match-string 3 locale-string)
		 modifiers (match-string 4 locale-string)
		 region (and region (replace-in-string region "^_" ""))
		 charset (and charset (replace-in-string charset #r"^\." ""))
		 modifiers (and modifiers
				(replace-in-string modifiers "^@" "")))
	   (when (and modifiers (equal modifiers "euro") (null charset))
	     ;; Not ideal for Latvian, say, but I don't have any locales
	     ;; where the @euro modifier doesn't mean ISO-8859-15 in the 956
	     ;; I have.
	     (setq charset "iso-8859-15"))
	   (when (and modifiers (equal modifiers "cyrillic") (null charset))
	     ;; Feedback wanted!
	     (setq charset "windows-1251"))
	   (values language region charset modifiers))
	  ((and (string-match "^[a-z0-9]+$" locale-string)
		(assoc-ignore-case locale-string language-info-alist))
	   ;; A bare language environment name: use its (first) locale.
	   (setq language (get-language-info locale-string 'locale)
		 language (if (listp language) (car language) language))
	   (values language region charset modifiers))
	  ((string-match #r"^\([a-z0-9]+\)\.\([a-z0-9]+\)$" locale-string)
	   ;; Read both groups straight away.  The lookups below are ordinary
	   ;; function calls, and reading group 2 only after them would make
	   ;; the result depend on their leaving the match data untouched.
	   (setq locinfo (match-string 1 locale-string)
		 charset (match-string 2 locale-string))
	   (when (assoc-ignore-case locinfo language-info-alist)
	     (setq language (get-language-info locinfo 'locale)
		   language (if (listp language) (car language) language)))
	   (values language region charset modifiers)))))
1063 | |
(defun create-variant-language-environment (langenv coding-system)
  "Create a variant of LANGENV with CODING-SYSTEM as its coding systems.

The coding systems in question are those described in the
`set-language-info' docstring with the property names of
`native-coding-system' and `coding-system'.  The name of the new language
environment is the name of the old language environment, followed by
CODING-SYSTEM in parentheses.  Returns the name of the new language
environment.

This function also modifies the `coding-priority' of a language
environment.

LANGENV may be a string or a symbol; an error is signalled if it does not
name a known language environment.  CODING-SYSTEM is validated with
`check-coding-system'."
  (check-coding-system coding-system)
  (if (symbolp langenv) (setq langenv (symbol-name langenv)))
  (unless (setq langenv
		(assoc-ignore-case langenv language-info-alist))
    (error 'wrong-type-argument "Not a known language environment"))
  (let* ((name (car langenv))
	 (props (cdr langenv))
	 ;; Upcased coding system name, used as the parenthesized suffix.
	 (suffix (upcase (symbol-name (coding-system-name coding-system))))
	 (tutorial (cdr-safe (assq 'tutorial-coding-system props))))
    (set-language-info-alist
     ;; If NAME already ends in a parenthesized suffix (it is itself a
     ;; variant), replace that suffix instead of appending another one.
     (if (string-match " ([^)]+)$" name)
	 (replace-match (format " (%s)" suffix) nil nil name)
       (format "%s (%s)" name suffix))
     (destructive-plist-to-alist
      (plist-put
       (plist-put
	(plist-put
	 (plist-put (alist-to-plist props) 'native-coding-system
		    coding-system)
	 'coding-system (cons coding-system
			      (cdr (assq 'coding-system props))))
	'coding-priority (cons coding-system
			       (cdr (assq 'coding-priority props))))
       ;; The tutorial coding system is important; otherwise the tutorial file
       ;; gets loaded in the variant coding system.
       'tutorial-coding-system
       (or
	;; Accept the stored value whether it is a list (use its first
	;; element) or a bare coding system.  Taking `car-safe' of it
	;; unconditionally, as this code used to, yields nil for a bare
	;; coding system and so silently drops an existing setting.
	(if (consp tutorial) (car tutorial) tutorial)
	(car-safe (cdr-safe (assq 'coding-system props)))))))))
801 | 1104 |
(defun get-language-environment-from-locale (locale)
  "Convert LOCALE into a language environment.
LOCALE is a C library locale string, as returned by `current-locale'.
Uses the `locale' property of the language environment.

Returns the name of the first matching language environment, or nil if
none matches.  If LOCALE names a charset whose coding system is not the
matching environment's `native-coding-system', a variant environment is
created with `create-variant-language-environment' and its result is
returned instead."
  (block langenv
    (multiple-value-bind (language ignored-arg charset ignored-arg)
	(parse-posix-locale-string locale)
      (let ((case-fold-search t)
	    ;; Coding system requested by the locale's charset part, if any.
	    (wanted-coding-system
	     (and charset (gethash (replace-in-string charset "[^a-z0-9]" "")
				   posix-charset-to-coding-system-hash)))
	    native-coding-system)
	(dolist (entry language-info-alist)
	  (let* ((lang (car entry))
		 (locs (get-language-info lang 'locale)))
	    (dolist (loc (if (listp locs) locs (list locs)))
	      (cond
	       ;; A function entry decides for itself whether LOCALE matches.
	       ((functionp loc)
		(when (funcall loc locale)
		  (return-from langenv lang)))
	       ;; A string entry matches the parsed language exactly, or
	       ;; LOCALE as a prefix ending at a non-alphanumeric character.
	       ((and (stringp loc)
		     (or (equal loc language)
			 (string-match
			  (format "^%s\\([^A-Za-z0-9]\\|$\\)" loc)
			  locale)))
		(return-from langenv
		  (if (or (null wanted-coding-system)
			  (eq wanted-coding-system
			      (setq native-coding-system
				    (get-language-info
				     lang
				     'native-coding-system)))
			  (and (listp native-coding-system)
			       (memq wanted-coding-system
				     native-coding-system)))
		      ;; No particular coding system wanted, or the
		      ;; environment already provides the wanted one.
		      lang
		    (create-variant-language-environment
		     lang wanted-coding-system))))))))))))
771 | 1143 |
(defun mswindows-get-language-environment-from-locale (ms-locale)
  "Convert MS-LOCALE (an MS Windows locale) into a language environment.
MS-LOCALE is in the format recognized by `set-mswindows-current-locale' --
i.e. a language string or a cons (LANG . SUBLANG).  Note: This is NOT the
same as the C library locale format (see `set-current-locale')!

This looks up the `mswindows-locale' property of all language environments;
if nothing matching is found, it looks for a language environment with the
same name (modulo case differences) as the LANG part of the locale."
  ;; A bare language string stands for (LANG . "DEFAULT").
  (unless (consp ms-locale)
    (setq ms-locale (cons ms-locale "DEFAULT")))
  (or
   ;; First pass: compare against each environment's `mswindows-locale'.
   (block langenv
     (dolist (entry language-info-alist)
       (let* ((lang (car entry))
	      (raw (get-language-info lang 'mswindows-locale))
	      ;; The property is either one locale or a list of locales;
	      ;; a single (LANG . SUBLANG) pair is wrapped in a list.
	      (candidates (if (and (consp raw)
				   (listp (cdr raw)))
			      raw
			    (list raw))))
	 (dolist (candidate candidates)
	   (when (equalp (if (consp candidate)
			     candidate
			   (cons candidate "DEFAULT"))
			 ms-locale)
	     (return-from langenv lang))))))
   ;; Second pass: fall back to an environment whose name matches LANG.
   (dolist (entry language-info-alist)
     (when (equalp (car entry) (car ms-locale))
       (return (car entry))))))
1169 | |
(defun get-native-coding-system-from-language-environment (langenv locale)
  "Return the native coding system appropriate for LANGENV.
LANGENV is a string naming a language environment.  May use the LOCALE
\(which should be the C library LOCALE corresponding to LANGENV) to
determine the correct coding system. (For example, in the Japanese language
environment, there are multiple encodings in use: euc-jp, shift-jis, jis7,
jis8, iso-2022-jp, etc.  The LOCALE may tell which one is correct.)

Specifically: Under X, the returned value is determined from these two.
Under MS Windows, the native coding system must be set from the default
system locale and is not influenced by LOCALE. (In other words, a program
can't set the text encoding used to communicate with the OS.  To get around
this, we use Unicode whenever available, i.e. on Windows NT always and on
Windows 9x whenever a Unicode version of a system call is available.)"
  (if (eq system-type 'windows-nt)
      ;; should not apply to Cygwin, I don't think
      'mswindows-multibyte-system-default
    (let ((candidates (get-language-info langenv 'native-coding-system)))
      ;; The property may be a single entry or a list of entries.
      (when (or (functionp candidates) (not (listp candidates)))
	(setq candidates (list candidates)))
      (or
       ;; The first entry that yields a non-nil result wins.  A function
       ;; entry is called with LOCALE; any other entry is used as it is.
       (dolist (candidate candidates)
	 (let ((resolved (if (functionp candidate)
			     (funcall candidate locale)
			   candidate)))
	   (when resolved
	     (return resolved))))
       ;; Otherwise fall back to the environment's first coding system ...
       (car (get-language-info langenv 'coding-system))
       ;; ... and finally to `raw-text'.
       'raw-text))))
1199 | |
(defun get-coding-system-from-locale (locale)
  "Return the coding system corresponding to a locale string.
LOCALE is first mapped to a language environment with
`get-language-environment-from-locale'; the result is the native coding
system of that environment for LOCALE."
  (let ((environment (get-language-environment-from-locale locale)))
    (get-native-coding-system-from-language-environment environment locale)))
1204 | |
;; Language environments are named by strings, so the table has to compare
;; keys with `equal'.  Under the default `eql' test a lookup only succeeds
;; for the very same string object that was stored, so a freshly typed
;; environment name would never be found.
(defvar mswindows-langenv-to-locale-table (make-hash-table :test 'equal)
  "Table mapping language environments to associated MS Windows locales.
There may be more than one MS Windows locale that maps to a given language
environment, so once we've made the mapping, we record it here when we need
to make the reverse mapping.  For example, all MS Windows locales with
language ENGLISH will map to language environment English, and when the
user starts up in such a locale, switches to another language environment
and then back to English, we want the same locale again.")
1213 | |
1214 (defun set-locale-for-language-environment (langenv) | |
1215 "Sets the current system locale as appropriate for LANGENV. | |
1216 LANGENV is a language environment. The locale is determined by looking at | |
1217 the 'locale (or maybe 'mswindows-locale) property of LANGENV, and then | |
1218 setting it using `set-current-locale' and maybe also | |
1219 `mswindows-set-current-locale'. Also sets the LANG environment variable. | |
1220 Returns non-nil if successfully set the locale(s)." | |
1221 (flet ((mswindows-get-and-set-locale-from-langenv (langenv) | |
1222 ;; find the mswindows locale for the langenv, make it current, | |
1223 ;; and return it. first we check the langenv-to-locale table | |
1224 ;; ... | |
1225 (let ((ms-locale | |
1226 (gethash langenv mswindows-langenv-to-locale-table))) | |
1227 (if ms-locale (progn | |
778 | 1228 (declare-fboundp (mswindows-set-current-locale |
1229 ms-locale)) | |
771 | 1230 ms-locale) |
1231 ;; ... if not, see if the langenv specifies any locale(s). | |
1232 ;; if not, construct one from the langenv name. | |
1233 (let* ((mslocs (get-language-info langenv 'mswindows-locale)) | |
1234 (mslocs (or mslocs (cons (upcase langenv) "DEFAULT"))) | |
1235 (mslocs (if (and (consp mslocs) | |
1236 (listp (cdr mslocs))) | |
1237 mslocs (list mslocs)))) | |
1238 (dolist (msloc mslocs) | |
1239 ;; Sometimes a language with DEFAULT is different from | |
1240 ;; with SYS_DEFAULT, and on my system | |
1241 ;; (set-current-locale "chinese") is NOT the same as | |
1242 ;; (set-current-locale "chinese-default")! The latter | |
1243 ;; gives Taiwan (DEFAULT), the former PRC (SYS_DEFAULT). | |
1244 ;; In the interests of consistency, we always use DEFAULT. | |
1245 (or (consp msloc) (setq msloc (cons msloc "DEFAULT"))) | |
1246 (when (condition-case nil | |
1247 (progn | |
778 | 1248 (declare-fboundp (mswindows-set-current-locale |
1249 msloc)) | |
771 | 1250 t) |
1251 (error nil)) | |
1252 (return msloc)))))))) | |
1253 (if (eq system-type 'windows-nt) | |
1254 (let ((ms-locale (mswindows-get-and-set-locale-from-langenv langenv))) | |
1255 (when ms-locale | |
1256 ;; also need to set the clib locale. | |
1257 (or (set-current-locale | |
1258 ;; if the locale is '("DUTCH" . "DUTCH_BELGIAN"), | |
1259 ;; try "DUTCH-BELGIAN". (Case is insignificant; | |
1260 ;; "dutch-belgian" works just as well.) This type | |
1261 ;; of transformation should always work, and you | |
1262 ;; get back the canonicalized version -- in this | |
1263 ;; case "Dutch_Belgium.1252". Note the futility of | |
1264 ;; trying to construct "Belgium" directly from | |
1265 ;; "BELGIAN". | |
1266 ;; | |
1267 ;; BUT ... We actually have to be trickier. | |
1268 ;; ("SPANISH" . "SPANISH_DOMINICAN_REPUBLIC") needs | |
1269 ;; to end up as "SPANISH-DOMINICAN REPUBLIC"; any | |
1270 ;; other punctuation makes it fail (you either get | |
1271 ;; Spain for the country, or nil). | |
1272 ;; | |
1273 ;; assume it's DEFAULT or NEUTRAL (or something else | |
1274 ;; without the language in it?) and prepend the | |
1275 ;; language. | |
1276 (if (string-match "_" (cdr ms-locale)) | |
1277 (replace-in-string | |
1278 (replace-match "-" nil nil (cdr ms-locale)) "_" " ") | |
1279 (format "%s-%s" (car ms-locale) (cdr ms-locale)))) | |
1280 ;; ???? huh ???? if failure, just try the language | |
1281 ;; name. | |
1282 (set-current-locale (car ms-locale)))) | |
1283 ;; also set LANG, for the benefit of Cygwin subprocesses. | |
1284 (let* ((cygloc (or (get-language-info langenv 'cygwin-locale) | |
1285 (get-language-info langenv 'locale))) | |
1286 (cygloc (if (listp cygloc) (car (last cygloc)) cygloc))) | |
1287 (if (and cygloc (stringp cygloc)) (setenv "LANG" cygloc))) | |
1288 (not (null ms-locale))) | |
1289 | |
1290 ;; not MS Windows native. | |
1291 | |
1292 ;; Cygwin is as usual an unholy mixture -- C library locales | |
1293 ;; that follow Unix conventions, but also MS Windows locales. | |
1294 ;; So set the MS Windows locale, and then try to find a Unix | |
1295 ;; locale. | |
1296 (when (eq system-type 'cygwin32) | |
1297 (mswindows-get-and-set-locale-from-langenv langenv)) | |
1298 (let ((locs (get-language-info langenv 'locale))) | |
1299 (dolist (loc (if (listp locs) locs (list locs))) | |
1300 (let ((retval | |
1301 (cond ((functionp loc) (funcall loc nil)) | |
1302 ((stringp loc) (set-current-locale loc)) | |
1303 (t nil)))) | |
1304 (when retval | |
1305 (setenv "LANG" retval) | |
1306 (return t)))))))) | |
1307 | |
(defun set-language-environment-coding-systems (language-name
                                                &optional eol-type)
  "Do various coding system setups for language environment LANGUAGE-NAME.
This function assumes that the locale for LANGUAGE-NAME has been set using
`set-current-locale'.

The optional arg EOL-TYPE specifies the eol-type of the default value
of buffer-file-coding-system set by this function."

  ;; Historical note: the doc string used to carry a third paragraph (kept
  ;; below).  It is not in FSF 21.1, and it is not true either, because
  ;; reset-coding-categories-to-default is called before this function.
  ;; #### Should we rethink this?

  ; Note that `coding-priority-list' is not reset first; thus changing language
  ; environment allows recognition of coding systems from previously set language
  ; environments.  (This will not work if the desired coding systems are from the
  ; same category.  E.g., starting with a Hebrew language environment, ISO 8859-8
  ; will be recognized.  If you shift to Russian, ISO 8859-8 will be shadowed by
  ; ISO 8859-5, and cannot be automatically recognized without resetting the
  ; language environment to Hebrew.  However, if you shift from Japanese to
  ; Russian, ISO-2022-JP will continue to be automatically recognized, since
  ; ISO-8859-5 and ISO-2022-JP are different coding categories.)

  (flet ((apply-eol-type (codesys eol)
           ;; When EOL names one specific line-ending convention, return
           ;; the variant of CODESYS with that convention; for any other
           ;; value hand CODESYS back untouched.
           (if (memq eol '(lf crlf cr unix dos mac))
               (coding-system-change-eol-conversion codesys eol)
             codesys)))

    ;; Part 1: category mappings, priority list, default file coding system.
    (let* ((priority (get-language-info language-name 'coding-priority))
           (default-coding (car priority)))
      (when priority
        ;; All categories are computed up front; CODESYS-TAIL then walks
        ;; PRIORITY in step with the category list.  Only the first coding
        ;; system seen for each category is installed.
        (let ((codesys-tail priority)
              seen-categories)
          (dolist (category (mapcar 'coding-system-category priority))
            (unless (memq category seen-categories)
              (set-coding-category-system category (car codesys-tail))
              (push category seen-categories))
            (setq codesys-tail (cdr codesys-tail)))
          ;; SEEN-CATEGORIES was built back to front.
          (set-coding-priority-list (nreverse seen-categories))))

      ;; Under Unix, the default buffer coding system is the first entry of
      ;; the `coding-priority' property.  Under Windows it should stay at
      ;; `mswindows-multibyte', which will reference the current code
      ;; page.  ([Does it really make sense to set the Unix default that
      ;; way?  NOTE also that it's not the same as the native coding system
      ;; for the locale, which is correct -- the form we choose for text
      ;; files should not necessarily have any relevance to whether we're
      ;; in a Shift-JIS, EUC-JP, JIS, or other Japanese locale.])
      ;;
      ;; On Unix--with the exception of Mac OS X--there is no way to know
      ;; for certain what coding system to use for file names, and the
      ;; environment is the best guess.  If a particular user's preferences
      ;; differ from this, then that particular user needs to edit
      ;; ~/.xemacs/init.el.  Aidan Kehoe, Sun Nov 26 18:11:31 CET 2006.
      ;; OS X uses an almost-normal-form version of UTF-8.
      (unless (memq system-type '(windows-nt cygwin32))
        (set-default-buffer-file-coding-system
         (apply-eol-type default-coding eol-type))))
    ;; (setq default-sendmail-coding-system default-coding)

    ;; Part 2: the native coding system and everything derived from it.
    (let ((native (get-native-coding-system-from-language-environment
                   language-name (current-locale))))

      ;; A failure to define the `native' alias is reported as a warning
      ;; and the remaining setup still runs.
      (condition-case nil
          (define-coding-system-alias 'native
            (apply-eol-type native eol-type))
        (error
         (warn "Invalid native-coding-system %s in language environment %s"
               native language-name)))

      ;; `file-name' uses the per-system-type entry of
      ;; `system-type-file-name-coding' when there is one, else `native'.
      (define-coding-system-alias 'file-name
        (or (cdr (assq system-type system-type-file-name-coding))
            'native))

      ;; Keyboard and terminal default to the native coding system of the
      ;; language environment.
      (setq keyboard-coding-system native
            terminal-coding-system native)

      ;; Same for every console whose first device is a TTY.  (Calling
      ;; set-input-mode at the same time would be a sane thing to do here.
      ;; I would prefer to default to accepting eight bit input and not
      ;; using the top bit for Meta.)
      (dolist (con (console-list))
        (when (eq (device-type (car (console-device-list con))) 'tty)
          (set-console-tty-coding-system con native)))

      ;; Process output should not have EOL conversion.  Under MS Windows
      ;; and Cygwin, this screws things up (`cmd' is fine with just LF and
      ;; `bash' chokes on CR-LF).  Hence NATIVE is used here as is, without
      ;; EOL-TYPE applied.
      (setq default-process-coding-system
            (cons (car default-process-coding-system) native)))))
771 | 1410 |
(defun init-locale-at-early-startup ()
  "Don't call this."
  ;; Invoked straight from the C code in intl.c, very early in the startup
  ;; sequence -- do not call it yourself!  Its job is to get things into a
  ;; state where non-ASCII strings of all kinds (file names, command-line
  ;; arguments, environment variables, ...) can be processed correctly
  ;; for the rest of startup.  Consequently this is almost certainly the
  ;; FIRST Lisp code run in a dumped XEmacs, and it runs before ANY of the
  ;; external environment is initialized.  It therefore must not interact
  ;; with the outside world, make system calls, etc.  (The one exception
  ;; is `set-current-locale'.)
  ;;
  ;; NOTE: these are the basic settings involved when the language
  ;; environment changes:
  ;;
  ;; -- current C library locale
  ;; -- under MS Windows, current MS Windows locale
  ;; -- LANG environment variable
  ;; -- native/file-name coding systems
  ;; -- subprocess write coding system (cdr of default-process-coding-system)
  ;; -- coding categories (for detection)

  (let (langenv)
    (cond
     ;; MS Windows of any flavor (native or Cygwin).
     ((memq system-type '(windows-nt cygwin32))
      (let ((userdef (declare-fboundp (mswindows-user-default-locale)))
            (sysdef (declare-fboundp (mswindows-system-default-locale))))
        ;; (1) The current langenv is derived from the user-default locale.
        (setq langenv
              (mswindows-get-language-environment-from-locale userdef))
        ;; (2) Seed the langenv-to-locale table.  The system default goes
        ;; in first ...
        (puthash (mswindows-get-language-environment-from-locale sysdef)
                 sysdef mswindows-langenv-to-locale-table)
        ;; ... and the user default second, so that it overrides the
        ;; system default when the two differ yet map to the same
        ;; language environment.
        (puthash langenv userdef mswindows-langenv-to-locale-table)
        ;; (3) Set up the C lib locale, MS Windows locale and LANG
        ;; environment variable.  Note that under Cygwin the passed-in
        ;; LANG environment variable is ignored for the moment -- it's
        ;; usually wrong anyway and just says "C".  #### Perhaps we should
        ;; reconsider.
        (when langenv
          (set-locale-for-language-environment langenv))
        ;; (4) Override the current MS Windows locale with the
        ;; user-default locale.  This is done unconditionally, even when
        ;; the langenv doesn't correspond: we might not be able to find a
        ;; langenv for the user-default locale, but we should still use
        ;; the right code page, etc.
        (declare-fboundp (mswindows-set-current-locale userdef))))

     ;; Unix.
     (t
      ;; Initialize the POSIX locale from the environment -- this calls
      ;; the C library's setlocale(3).
      (set-current-locale "")
      ;; The value of (set-current-locale "") is deliberately not used as
      ;; the locale string, since it can be more detailed than we know
      ;; how to handle; ask `current-locale' instead.
      (let ((locstring (current-locale)))
        ;; Assume the C lib locale and LANG env var are set correctly and
        ;; use them to find the langenv.
        (setq langenv
              (and locstring
                   (get-language-environment-from-locale locstring))))))

    ;; All systems: fall back to "English" when nothing was found.
    (setq langenv (or langenv "English")
          current-language-environment langenv)

    ;; Set up the various coding systems and categories.  The EOL type of
    ;; the default buffer-file coding system is read before
    ;; `reset-language-environment' runs and is then passed on.
    (let ((default-eol-type (coding-system-eol-type
                             default-buffer-file-coding-system)))
      (reset-language-environment)
      (set-language-environment-coding-systems langenv default-eol-type))))
1482 | |
(defun init-mule-at-startup ()
  "Initialize MULE environment at startup. Don't call this."

  ;; The Unicode tables are loaded now unless that already happened at
  ;; dump time.
  (unless load-unicode-tables-at-dump-time
    (load-unicode-tables))

  ;; This is called (currently; might be moved earlier) from startup.el,
  ;; after the basic GUI systems have been initialized, and just before the
  ;; init file gets read in.  It needs to finish up initializing the
  ;; current language environment.  Very early in the startup procedure we
  ;; determined the default language environment from the locale, and
  ;; bootstrapped the native, file-name and process I/O coding systems.
  ;; Now we need to do it over `the right way'.
  (finish-set-language-environment current-language-environment)

  ;; Load a (localizable) locale-specific init file, if it exists.
  ;; We now use the language environment name, NOT the locale,
  ;; whose name varies from system to system.
  ;;
  ;; Only attempt the load when the "start-files" data directory was
  ;; actually located.  Otherwise the nil result would be formatted into
  ;; the bogus relative name "nil<LANGENV>/locale-start" and searched for
  ;; along `load-path'.
  (let ((start-files-dir (locate-data-directory "start-files")))
    (when start-files-dir
      (load (format "%s%s/locale-start"
                    start-files-dir
                    current-language-environment)
            t t)))

  ;; #### the rest is junk that should be deleted.

  (when current-language-environment
    ;; rman seems to be incompatible with encoded text
    (setq Manual-use-rosetta-man nil))

  ;; Register available input methods by loading LEIM list file.
  (load "leim-list.el" 'noerror 'nomessage 'nosuffix)
  )
1515 | |
1516 ;; Code deleted: init-mule-tm (Enable the tm package by default) | |
428 | 1517 |
1518 ;;; mule-cmds.el ends here |