771
|
1 ;;; code-init.el --- Handle coding system default values
|
|
2
|
1318
|
3 ;; Copyright (C) 2001, 2002, 2003 Ben Wing.
|
771
|
4
|
|
5 ;; This file is part of XEmacs.
|
|
6
|
|
7 ;; XEmacs is free software; you can redistribute it and/or modify it
|
|
8 ;; under the terms of the GNU General Public License as published by
|
|
9 ;; the Free Software Foundation; either version 2, or (at your option)
|
|
10 ;; any later version.
|
|
11
|
|
12 ;; XEmacs is distributed in the hope that it will be useful, but
|
|
13 ;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
14 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
15 ;; General Public License for more details.
|
|
16
|
|
17 ;; You should have received a copy of the GNU General Public License
|
|
18 ;; along with XEmacs; see the file COPYING. If not, write to the
|
|
19 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
20 ;; Boston, MA 02111-1307, USA.
|
|
21
|
|
22 ;;; Commentary:
|
|
23
|
|
24 ;; Placed in a separate file so it can be loaded after the various
|
|
25 ;; coding systems have been created, because we'll be using them at
|
|
26 ;; load time.
|
|
27
|
2297
|
28 ;; #### Issues (this discussion probably belongs elsewhere)
|
|
29 ;; 1. "Big" characters are unrepresentable. Should give error, warning,
|
|
30 ;; not just substitute "~".
|
|
31 ;; 2. 21.4 compatibility?
|
|
32 ;; 3. make-char: non-mule barfs on non-iso8859-1.
|
|
33
|
771
|
34 ;;; Code:
|
|
35
|
|
36 (defcustom eol-detection-enabled-p (or (featurep 'mule)
|
|
37 (memq system-type '(windows-nt
|
|
38 cygwin32))
|
|
39 (featurep 'unix-default-eol-detection))
|
|
40 "True if XEmacs automatically detects the EOL type when reading files.
|
|
41 Normally, this is always the case on Windows or when international (Mule)
|
|
42 support is compiled into this XEmacs. Otherwise, it is currently off by
|
|
43 default, but this may change. Don't set this; nothing will happen. Instead,
|
|
44 use the Options menu or `set-eol-detection'."
|
|
45 :group 'encoding
|
|
46 :type 'boolean
|
|
47 ;; upon initialization, we don't want the whole business of
|
|
48 ;; set-eol-detection to be called. We will init everything appropriately
|
|
49 ;; later in the same file, when reset-language-environment is called.
|
|
50 :initialize #'(lambda (var val)
|
1698
|
51 (setq eol-detection-enabled-p (eval val)))
|
771
|
52 :set #'(lambda (var val)
|
|
53 (set-eol-detection val)
|
|
54 (setq eol-detection-enabled-p val)))
|
|
55
|
|
56 (defun set-eol-detection (flag)
|
|
57 "Enable (if FLAG is non-nil) or disable automatic EOL detection of files.
|
|
58 EOL detection is enabled by default on Windows or when international (Mule)
|
|
59 support is compiled into this XEmacs. Otherwise, it is currently off by
|
|
60 default, but this may change. NOTE: You *REALLY* should not turn off EOL
|
|
61 detection on Windows! Your files will have lots of annoying ^M's in them
|
|
62 if you do this."
|
|
63 (dolist (x '(buffer-file-coding-system-for-read
|
|
64 keyboard
|
2071
|
65 default-process-coding-system-read))
|
771
|
66 (set-coding-system-variable
|
|
67 x (coding-system-change-eol-conversion (get-coding-system-variable x)
|
2071
|
68 (if flag nil 'lf))))
|
|
69 (set-coding-category-system
|
|
70 'no-conversion
|
|
71 (coding-system-change-eol-conversion (coding-category-system 'no-conversion)
|
|
72 (if flag nil 'lf))))
|
771
|
73
|
|
74 (defun coding-system-current-system-configuration ()
|
|
75 (cond ((memq system-type '(windows-nt cygwin32))
|
|
76 (if (featurep 'mule) 'windows-mule 'windows-no-mule))
|
|
77 ((featurep 'mule) 'unix-mule)
|
|
78 (eol-detection-enabled-p 'unix-no-mule-eol-detection)
|
|
79 (t 'unix-no-mule-no-eol-detection)))
|
|
80
|
1318
|
81 ;; NOTE NOTE NOTE: These values may get overridden when the language
|
|
82 ;; environment is initialized (set-language-environment-coding-systems).
|
771
|
83 (defvar coding-system-variable-default-value-table
|
1318
|
84 '((buffer-file-coding-system-for-read
|
|
85 binary raw-text undecided raw-text undecided)
|
|
86 (default-buffer-file-coding-system
|
2297
|
87 ;; #### iso-2022-8 with no eol specified? can that be OK?
|
1318
|
88 binary binary iso-2022-8 raw-text-dos mswindows-multibyte-dos)
|
|
89 (native
|
|
90 binary binary binary raw-text-dos mswindows-multibyte-system-default-dos)
|
|
91 (keyboard
|
1471
|
92 binary raw-text undecided-unix raw-text undecided-unix)
|
771
|
93 ;; the `terminal' coding system is used for output to stderr. such
|
|
94 ;; streams do automatic lf->crlf encoding in the C library, so we need
|
|
95 ;; to not do the same translations ourselves.
|
1318
|
96 (terminal
|
|
97 binary binary binary binary mswindows-multibyte-unix)
|
|
98 (default-process-coding-system-read
|
|
99 binary raw-text undecided raw-text undecided)
|
|
100 (default-process-coding-system-write
|
|
101 binary binary binary raw-text mswindows-multibyte-system-default)
|
|
102 (no-conversion-coding-system-mapping
|
|
103 binary raw-text raw-text raw-text mswindows-multibyte)
|
771
|
104 ))
|
|
105
|
|
106 (defvar coding-system-default-configuration-list
|
|
107 '(unix-no-mule-no-eol-detection
|
|
108 unix-no-mule-eol-detection
|
|
109 unix-mule
|
|
110 windows-no-mule
|
|
111 windows-mule))
|
|
112
|
|
113 (defvar coding-system-default-variable-list
|
|
114 '(buffer-file-coding-system-for-read
|
|
115 default-buffer-file-coding-system
|
|
116 native
|
|
117 keyboard
|
|
118 terminal
|
|
119 default-process-coding-system-read
|
|
120 default-process-coding-system-write))
|
|
121
|
|
122 (defun get-coding-system-variable (var)
|
|
123 "Return the value of a basic coding system variable.
|
|
124 This is intended as a uniform interface onto the coding system settings that
|
|
125 control how encoding detection and conversion works. See
|
|
126 `coding-system-variable-default-value' for a list of the possible values of
|
|
127 VAR."
|
|
128 (case var
|
|
129 (buffer-file-coding-system-for-read buffer-file-coding-system-for-read)
|
|
130 (default-buffer-file-coding-system
|
|
131 (default-value 'buffer-file-coding-system))
|
|
132 (native (coding-system-aliasee 'native))
|
|
133 (keyboard (coding-system-aliasee 'keyboard))
|
|
134 (terminal (coding-system-aliasee 'terminal))
|
|
135 (default-process-coding-system-read (car default-process-coding-system))
|
|
136 (default-process-coding-system-write (cdr default-process-coding-system))
|
|
137 (t (error 'invalid-constant "Invalid coding system variable" var))))
|
|
138
|
|
139 (defun set-coding-system-variable (var value)
|
|
140 "Set a basic coding system variable to VALUE.
|
|
141 This is intended as a uniform interface onto the coding system settings that
|
|
142 control how encoding detection and conversion works. See
|
|
143 `coding-system-variable-default-value' for a list of the possible values of
|
|
144 VAR."
|
|
145 (case var
|
|
146 (buffer-file-coding-system-for-read
|
|
147 (set-buffer-file-coding-system-for-read value))
|
|
148 (default-buffer-file-coding-system
|
|
149 (set-default-buffer-file-coding-system value))
|
|
150 (native (define-coding-system-alias 'native value))
|
|
151 (keyboard (set-keyboard-coding-system value))
|
|
152 (terminal (set-terminal-coding-system value))
|
|
153 (default-process-coding-system-read
|
|
154 (setq default-process-coding-system
|
|
155 (cons value (cdr default-process-coding-system))))
|
|
156 (default-process-coding-system-write
|
|
157 (setq default-process-coding-system
|
|
158 (cons (car default-process-coding-system) value)))
|
|
159 (t (error 'invalid-constant "Invalid coding system variable" var))))
|
|
160
|
|
161 (defun coding-system-variable-default-value (var &optional config)
|
|
162 "Return the appropriate default value for a coding system variable.
|
|
163
|
|
164 VAR specifies the variable, and CONFIG the configuration, defaulting
|
|
165 to the current system configuration (as returned by
|
|
166 `coding-system-current-system-configuration').
|
|
167
|
|
168 The table of default values looks like this: (see below for abbreviations)
|
|
169
|
|
170
|
1471
|
171 Unix Unix+EOL Unix+Mule MSW MSW+Mule
|
|
172 -----------------------------------------------------------------------------
|
|
173 bfcs-for-read binary raw-text undecided raw-text undecided
|
|
174 default bfcs binary binary iso-2022-8 raw-text-dos MSW-MB-dos
|
|
175 native binary binary binary raw-text-dos MSW-MB-SD-dos
|
|
176 keyboard binary raw-text undecided-unix raw-text undecided-unix
|
|
177 terminal binary binary binary binary MSW-MB-unix
|
|
178 process-read binary raw-text undecided raw-text undecided
|
|
179 process-write binary binary binary raw-text MSW-MB-SD
|
|
180 no-conv-cs binary raw-text raw-text raw-text MSW-MB
|
771
|
181
|
|
182
|
|
183 VAR can be one of: (abbreviations in parens)
|
|
184
|
|
185 `buffer-file-coding-system-for-read' (bfcs-for-read)
|
|
186
|
|
187 Lisp variable of the same name; the default coding system used when
|
|
188 reading in a file, in the absence of more specific settings. (See
|
|
189 `insert-file-contents' for a description of exactly how a file's
|
|
190 coding system is determined when it's read in.)
|
|
191
|
|
192 `default-buffer-file-coding-system' (default bfcs)
|
|
193
|
|
194 Default value of `buffer-file-coding-system', the buffer-local
|
|
195 variable specifying a file's coding system to be used when it is
|
|
196 written out. Set using `set-default-buffer-file-coding-system' (or
|
|
197 the primitive `setq-default'). When a file is read in,
|
|
198 `buffer-file-coding-system' for that file is set from the coding
|
|
199 system used to read the file in; the default value applies to newly
|
|
200 created files.
|
|
201
|
|
202 `native' (native)
|
|
203
|
|
204 The coding system named `native'. Changed using
|
|
205 `define-coding-system-alias'. Used internally when passing
|
1318
|
206 text to or from system API's, unless the particular
|
771
|
207 API specifies another coding system.
|
|
208
|
|
209 `keyboard' (keyboard)
|
|
210
|
|
211 #### fill in
|
|
212
|
|
213 `terminal' (terminal)
|
|
214
|
|
215 #### fill in
|
|
216
|
|
217 `default-process-coding-system-read' (process-read)
|
|
218
|
|
219 #### fill in
|
|
220
|
|
221 `default-process-coding-system-write' (process-write)
|
|
222
|
|
223 #### fill in
|
|
224
|
|
225 `no-conversion-coding-system-mapping' (no-conv-cs)
|
|
226
|
|
227 Coding system used when category `no-conversion' is detected.
|
|
228
|
|
229
|
|
230 CONFIG is one of: (abbreviations in parens)
|
|
231
|
|
232 `unix-no-mule-no-eol-detection' (Unix)
|
|
233
|
|
234 Unix, no Mule support, no automatic EOL detection. (Controlled by
|
|
235 `eol-detection-enabled-p', which is set by the command-line flag
|
|
236 -enable-eol-detection or the configure flag --with-default-eol-detection.)
|
|
237
|
|
238 `unix-no-mule-eol-detection' (Unix+EOL)
|
|
239
|
|
240 Unix, no Mule support, automatic EOL detection.
|
|
241
|
|
242 `unix-mule' (Unix+Mule)
|
|
243
|
|
244 Unix, Mule support.
|
|
245
|
|
246 `windows-no-mule' (MSW)
|
|
247
|
|
248 MS Windows or Cygwin, no Mule support.
|
|
249
|
|
250 `windows-mule'. (MSW+Mule)
|
|
251
|
|
252 MS Windows or Cygwin, Mule support.
|
|
253
|
|
254
|
|
255 The following coding system abbreviations are also used in the table:
|
|
256
|
|
257 MSW-MB = mswindows-multibyte
|
|
258 MSW-MB = mswindows-multibyte-system-default
|
|
259 "
|
|
260 (setq config (or config (coding-system-current-system-configuration)))
|
|
261 (let ((defs (cdr (assq var coding-system-variable-default-value-table))))
|
|
262 (or defs (error 'invalid-constant "Invalid coding system variable" var))
|
|
263 (let ((pos (position config coding-system-default-configuration-list)))
|
|
264 (or pos (error 'invalid-constant "Invalid coding system configuration"
|
|
265 config))
|
|
266 (nth pos defs))))
|
|
267
|
|
268 (defun reset-coding-system-defaults (&optional config)
|
|
269 "Reset all basic coding system variables are set to their default values.
|
|
270 See `coding-system-variable-default-value'."
|
|
271 (setq config (or config (coding-system-current-system-configuration)))
|
|
272 (mapcar #'(lambda (var)
|
|
273 (set-coding-system-variable
|
|
274 var (coding-system-variable-default-value var config)))
|
|
275 coding-system-default-variable-list))
|
|
276
|
|
277 (defun reset-coding-categories-to-default ()
|
|
278 "Reset all coding categories (used for automatic detection) to their defaults.
|
|
279
|
|
280 The order of priorities of coding categories and the coding system
|
|
281 bound to each category are as follows:
|
|
282
|
|
283 coding category coding system
|
|
284 --------------------------------------------------
|
|
285 utf-16-little-endian-bom utf-16-little-endian
|
|
286 utf-16-bom utf-16-bom
|
985
|
287 utf-8-bom utf-8-bom
|
771
|
288 iso-7 iso-2022-7bit
|
|
289 no-conversion raw-text
|
|
290 utf-8 utf-8
|
|
291 iso-8-1 iso-8859-1
|
|
292 iso-8-2 ctext (iso-8859-1 alias)
|
|
293 iso-8-designate ctext (iso-8859-1 alias)
|
|
294 iso-lock-shift iso-2022-lock
|
|
295 shift-jis shift-jis
|
|
296 big5 big5
|
|
297 utf-16-little-endian utf-16-little-endian
|
|
298 utf-16 utf-16
|
|
299 ucs-4 ucs-4
|
|
300 "
|
|
301 ;; #### What a mess! This needs to be overhauled.
|
|
302
|
|
303 ;; The old table (from FSF synch?) was not what we use (cf mule-coding.el),
|
|
304 ;; and as documented iso-8-designate is inconsistent with iso-2022-8bit-ss2.
|
|
305 ;; The order of priorities of coding categories and the coding system
|
|
306 ;; bound to each category are as follows:
|
|
307 ;;
|
|
308 ;; coding category coding system
|
|
309 ;; --------------------------------------------------
|
|
310 ;; iso-8-2 iso-8859-1
|
|
311 ;; iso-8-1 iso-8859-1
|
|
312 ;; iso-7 iso-2022-7bit
|
|
313 ;; iso-lock-shift iso-2022-lock
|
|
314 ;; iso-8-designate iso-2022-8bit-ss2
|
|
315 ;; no-conversion raw-text
|
|
316 ;; shift-jis shift_jis
|
|
317 ;; big5 big5
|
|
318 ;; ucs-4 ----
|
|
319 ;; utf-8 ----
|
|
320 (when (featurep 'mule)
|
|
321 (set-coding-category-system 'iso-7 'iso-2022-7)
|
|
322 (set-coding-category-system 'iso-8-1 'iso-8859-1)
|
|
323 (set-coding-category-system 'iso-8-2 'ctext)
|
|
324 (set-coding-category-system 'iso-lock-shift 'iso-2022-lock)
|
|
325 (set-coding-category-system 'iso-8-designate 'ctext)
|
|
326 (if (find-coding-system 'shift-jis)
|
|
327 (set-coding-category-system 'shift-jis 'shift-jis))
|
|
328 (if (find-coding-system 'big5)
|
|
329 (set-coding-category-system 'big5 'big5))
|
|
330 )
|
|
331 (set-coding-category-system
|
|
332 'no-conversion
|
|
333 (coding-system-variable-default-value 'no-conversion-coding-system-mapping))
|
|
334 (set-coding-category-system 'ucs-4 'ucs-4)
|
|
335 (set-coding-category-system 'utf-8 'utf-8)
|
985
|
336 (set-coding-category-system 'utf-8-bom 'utf-8-bom)
|
771
|
337 (set-coding-category-system 'utf-16-little-endian 'utf-16-little-endian)
|
|
338 (set-coding-category-system 'utf-16 'utf-16)
|
|
339 (set-coding-category-system 'utf-16-little-endian-bom
|
|
340 'utf-16-little-endian-bom)
|
|
341 (set-coding-category-system 'utf-16-bom 'utf-16-bom)
|
|
342 (set-coding-priority-list
|
|
343 (if (featurep 'mule)
|
|
344 '(utf-16-little-endian-bom
|
|
345 utf-16-bom
|
985
|
346 utf-8-bom
|
771
|
347 iso-7
|
|
348 no-conversion
|
|
349 utf-8
|
|
350 iso-8-1
|
|
351 iso-8-2
|
|
352 iso-8-designate
|
|
353 iso-lock-shift
|
|
354 shift-jis
|
|
355 big5
|
|
356 utf-16-little-endian
|
|
357 utf-16
|
|
358 ucs-4)
|
|
359 '(utf-16-little-endian-bom
|
|
360 utf-16-bom
|
985
|
361 utf-8-bom
|
771
|
362 no-conversion
|
|
363 utf-8
|
|
364 utf-16-little-endian
|
|
365 utf-16
|
|
366 ucs-4))))
|
|
367
|
|
368 (defun reset-language-environment ()
|
|
369 "Reset coding system environment of XEmacs to the default status.
|
|
370 All basic coding system variables are set to their default values, as
|
|
371 are the coding categories used for automatic detection and their
|
|
372 priority.
|
|
373
|
|
374 BE VERY CERTAIN YOU WANT TO DO THIS BEFORE DOING IT!
|
|
375
|
|
376 For more information, see `reset-coding-system-defaults' and
|
|
377 `reset-coding-categories-to-default'."
|
|
378 (reset-coding-system-defaults)
|
|
379 (reset-coding-categories-to-default))
|
|
380
|
|
381 ;; Initialize everything so that the remaining Lisp files can contain
|
|
382 ;; extended characters. (They will be in ISO-7 format)
|
|
383
|
|
384 ;; !!####!! The Lisp files should all be in UTF-8!!! That way, all
|
|
385 ;; special characters appear as high bits and there's no problem with
|
|
386 ;; the Lisp parser trying to read a Mule file and getting all screwed
|
|
387 ;; up. The only other thing then would be characters; we just need to
|
|
388 ;; modify the Lisp parser to read the stuff directly after a ? as
|
|
389 ;; UTF-8 and return a 30-bit value directly, and modify the character
|
|
390 ;; routines a bit to allow such a beast to exist. MAKE IT A POINT TO
|
|
391 ;; IMPLEMENT THIS AS ONE OF MY FUTURE PROJECTS. --ben
|
|
392
|
|
393 (reset-language-environment)
|
|
394
|
|
395 ;;; code-init.el ends here
|