xemacs-beta: src/file-coding.c comparison

comparison src/file-coding.c @ 3025:facf3239ba30

[xemacs-hg @ 2005-10-25 11:16:19 by ben] rename new->new_, convert 'foo to `foo' EmacsFrame.c, ExternalClient.c, ExternalShell.c, chartab.c, cmdloop.c, compiler.h, console.c, database.c, device-msw.c, device-x.c, device.c, doc.c, dragdrop.c, eval.c, event-msw.c, event-stream.c, events.c, extents.c, file-coding.c, fns.c, frame-tty.c, frame.c, gpmevent.c, gutter.c, hash.c, imgproc.c, indent.c, keymap.c, lisp-union.h, macros.c, malloc.c, marker.c, menubar-x.c, menubar.c, mule-charset.c, number.c, process.c, profile.h, ralloc.c, redisplay.c, select-common.h, select.c, syntax.c, sysfile.h, sysproc.h, systime.h, syswindows.h, toolbar.c, tooltalk.c, tparam.c, unexaix.c, unexalpha.c, unexconvex.c, unexec.c, unexhp9k800.c, unexmips.c, unicode.c, window.c: new -> new_. 'foo -> `foo'. lwlib-internal.h: redo assert macros to follow lisp.h and not trigger warnings. lwlib.c, xlwtabs.c: new -> new_.

author	ben
date	Tue, 25 Oct 2005 11:16:49 +0000
parents	b7f26b2f78bd
children	77f5a5135b3a 3742ea8250b5

comparison

equal deleted inserted replaced

-:b7f26b2f78bd
+:facf3239ba30
 /* Text encoding conversion functions; coding-system object.
 #### rename me to coding-system.c or coding.c
 Copyright (C) 1991, 1995 Free Software Foundation, Inc.
 Copyright (C) 1995 Sun Microsystems, Inc.
-Copyright (C) 2000, 2001, 2002, 2003 Ben Wing.
+Copyright (C) 2000, 2001, 2002, 2003, 2005 Ben Wing.
 This file is part of XEmacs.
 XEmacs is free software; you can redistribute it and/or modify it
 under the terms of the GNU General Public License as published by the
 }
 DEFUN ("valid-coding-system-type-p", Fvalid_coding_system_type_p, 1, 1, 0, /*
 Given a CODING-SYSTEM-TYPE, return non-nil if it is valid.
 Valid types depend on how XEmacs was compiled but may include
-'undecided, 'chain, 'integer, 'ccl, 'iso2022, 'big5, 'shift-jis,
+`undecided', `chain', `integer', `ccl', `iso2022', `big5', `shift-jis',
-'utf-16, 'ucs-4, 'utf-8, etc.
+`utf-16', `ucs-4', `utf-8', etc.
 */
 (coding_system_type))
 {
 return valid_coding_system_type_p (coding_system_type) ? Qt : Qnil;
 }
 DEFUN ("make-coding-system", Fmake_coding_system, 2, 4, 0, /*
 Register symbol NAME as a coding system.
 TYPE describes the conversion method used and should be one of
-nil or 'undecided
+nil or `undecided'
 Automatic conversion.  XEmacs attempts to detect the coding system
 used in the file.
-'chain
+`chain'
 Chain two or more coding systems together to make a combination coding
 system.
-'no-conversion
+`no-conversion'
 No conversion.  Use this for binary files and such.  On output,
 graphic characters that are not in ASCII or Latin-1 will be
 replaced by a ?. (For a no-conversion-encoded buffer, these
 characters will only be present if you explicitly insert them.)
-'convert-eol
+`convert-eol'
 Convert CRLF sequences or CR to LF.
-'shift-jis
+`shift-jis'
 Shift-JIS (a Japanese encoding commonly used in PC operating systems).
-'unicode
+`unicode'
 Any Unicode encoding (UCS-4, UTF-8, UTF-16, etc.).
-'mswindows-unicode-to-multibyte
+`mswindows-unicode-to-multibyte'
 (MS Windows only) Converts from Windows Unicode to Windows Multibyte
 (any code page encoding) upon encoding, and the other way upon decoding.
-'mswindows-multibyte
+`mswindows-multibyte'
 Converts to or from Windows Multibyte (any code page encoding).
 This is resolved into a chain of `mswindows-unicode' and
 `mswindows-unicode-to-multibyte'.
-'iso2022
+`iso2022'
 Any ISO2022-compliant encoding.  Among other things, this includes
 JIS (the Japanese encoding commonly used for e-mail), EUC (the
 standard Unix encoding for Japanese and other languages), and
 Compound Text (the encoding used in X11).  You can specify more
 specific information about the conversion with the PROPS argument.
-'big5
+`big5'
 Big5 (the encoding commonly used for Mandarin Chinese in Taiwan).
-'ccl
+`ccl'
 The conversion is performed using a user-written pseudo-code
 program.  CCL (Code Conversion Language) is the name of this
 pseudo-code.
-'gzip
+`gzip'
 GZIP compression format.
-'internal
+`internal'
 Write out or read in the raw contents of the memory representing
 the buffer's text.  This is primarily useful for debugging
 purposes, and is only enabled when XEmacs has been compiled with
 DEBUG_XEMACS defined (via the --debug configure option).
-WARNING: Reading in a file using 'internal conversion can result
+WARNING: Reading in a file using `internal' conversion can result
 in an internal inconsistency in the memory representing a
 buffer's text, which will produce unpredictable results and may
 cause XEmacs to crash.  Under normal circumstances you should
-never use 'internal conversion.
+never use `internal' conversion.
 DESCRIPTION is a short English phrase describing the coding system,
 suitable for use as a menu item. (See also the `documentation' property
 below.)
 PROPS is a property list, describing the specific nature of the
 character set.  Recognized properties are:
-'mnemonic
+`mnemonic'
 String to be displayed in the modeline when this coding system is
 active.
-'documentation
+`documentation'
 Detailed documentation on the coding system.
-'eol-type
+`eol-type'
 End-of-line conversion to be used.  It should be one of
 	nil
 		Automatically detect the end-of-line type (LF, CRLF,
 		or CR).  Also generate subsidiary coding systems named
 		`NAME-unix', `NAME-dos', and `NAME-mac', that are
 		identical to this coding system but have an EOL-TYPE
-		value of 'lf, 'crlf, and 'cr, respectively.
+		value of `lf', `crlf', and `cr', respectively.
-	'lf
+	`lf'
 		The end of a line is marked externally using ASCII LF.
 		Since this is also the way that XEmacs represents an
 		end-of-line internally, specifying this option results
 		in no end-of-line conversion.  This is the standard
 		format for Unix text files.
-	'crlf
+	`crlf'
 		The end of a line is marked externally using ASCII
 		CRLF.  This is the standard format for MS-DOS text
 		files.
-	'cr
+	`cr'
 		The end of a line is marked externally using ASCII CR.
 		This is the standard format for Macintosh text files.
 	t
 		Automatically detect the end-of-line type but do not
 		generate subsidiary coding systems.  (This value is
 		converted to nil when stored internally, and
 		`coding-system-property' will return nil.)
-'post-read-conversion
+`post-read-conversion'
 The value is a function to call after some text is inserted and
 decoded by the coding system itself and before any functions in
 `after-change-functions' are called. (#### Not actually true in
 XEmacs. `after-change-functions' will be called twice if
 `post-read-conversion' changes something.) The argument of this
 function is the same as for a function in
 `after-insert-file-functions', i.e. LENGTH of the text inserted,
 with point at the head of the text to be decoded.
-'pre-write-conversion
+`pre-write-conversion'
 The value is a function to call after all functions in
 `write-region-annotate-functions' and `buffer-file-format' are
 called, and before the text is encoded by the coding system itself.
 The arguments to this function are the same as those of a function
 in `write-region-annotate-functions', i.e. FROM and TO, specifying
 The following properties are allowed for FSF compatibility but currently
 ignored:
-'translation-table-for-decode
+`translation-table-for-decode'
 The value is a translation table to be applied on decoding.  See
 the function `make-translation-table' for the format of translation
 table.  This is not applicable to CCL-based coding systems.
-'translation-table-for-encode
+`translation-table-for-encode'
 The value is a translation table to be applied on encoding.  This is
 not applicable to CCL-based coding systems.
-'safe-chars
+`safe-chars'
 The value is a char table.  If a character has non-nil value in it,
 the character is safely supported by the coding system.  This
 overrides the specification of safe-charsets.
-'safe-charsets
+`safe-charsets'
 The value is a list of charsets safely supported by the coding
 system.  The value t means that all charsets Emacs handles are
 supported.  Even if some charset is not in this list, it doesn't
 mean that the charset can't be encoded in the coding system;
 it just means that some other receiver of text encoded
 in the coding system won't be able to handle that charset.
-'mime-charset
+`mime-charset'
 The value is a symbol whose name is the `MIME-charset' parameter of
 the coding system.
-'valid-codes (meaningful only for a coding system based on CCL)
+`valid-codes' (meaningful only for a coding system based on CCL)
 The value is a list to indicate valid byte ranges of the encoded
 file.  Each element of the list is an integer or a cons of integers.
 In the former case, the integer value is a valid byte code.  In the
 latter case, the integers specify the range of valid byte codes.
-The following additional property is recognized if TYPE is 'convert-eol:
+The following additional property is recognized if TYPE is `convert-eol':
-'subtype
+`subtype'
 One of `lf', `crlf', `cr' or nil (for autodetection).  When decoding,
 the corresponding sequence will be converted to LF.  When encoding,
 the opposite happens.  This coding system converts characters to
 characters.
-The following additional properties are recognized if TYPE is 'iso2022:
+The following additional properties are recognized if TYPE is `iso2022':
-'charset-g0
+`charset-g0'
-'charset-g1
+`charset-g1'
-'charset-g2
+`charset-g2'
-'charset-g3
+`charset-g3'
 The character set initially designated to the G0 - G3 registers.
 The value should be one of
 -- A charset object (designate that character set)
 	  -- nil (do not ever use this register)
 	  -- t (no character set is initially designated to
 		the register, but may be later on; this automatically
 		sets the corresponding `force-g*-on-output' property)
-'force-g0-on-output
+`force-g0-on-output'
-'force-g1-on-output
+`force-g1-on-output'
-'force-g2-on-output
+`force-g2-on-output'
-'force-g2-on-output
+`force-g3-on-output'
 If non-nil, send an explicit designation sequence on output before
 using the specified register.
-'short
+`short'
 If non-nil, use the short forms "ESC $ @", "ESC $ A", and
 "ESC $ B" on output in place of the full designation sequences
 "ESC $ ( @", "ESC $ ( A", and "ESC $ ( B".
-'no-ascii-eol
+`no-ascii-eol'
 If non-nil, don't designate ASCII to G0 at each end of line on output.
 Setting this to non-nil also suppresses other state-resetting that
 normally happens at the end of a line.
-'no-ascii-cntl
+`no-ascii-cntl'
 If non-nil, don't designate ASCII to G0 before control chars on output.
-'seven
+`seven'
 If non-nil, use 7-bit environment on output.  Otherwise, use 8-bit
 environment.
-'lock-shift
+`lock-shift'
 If non-nil, use locking-shift (SO/SI) instead of single-shift
 or designation by escape sequence.
-'no-iso6429
+`no-iso6429'
 If non-nil, don't use ISO6429's direction specification.
-'escape-quoted
+`escape-quoted'
 If non-nil, literal control characters that are the same as
 the beginning of a recognized ISO2022 or ISO6429 escape sequence
 (in particular, ESC (0x1B), SO (0x0E), SI (0x0F), SS2 (0x8E),
 SS3 (0x8F), and CSI (0x9B)) are "quoted" with an escape character
 so that they can be properly distinguished from an escape sequence.
 is a good choice for a quoting character because there are no
 escape sequences whose second byte is a character from the Control-0
 or Control-1 character sets; this is explicitly disallowed by the
 ISO2022 standard.
-'input-charset-conversion
+`input-charset-conversion'
 A list of conversion specifications, specifying conversion of
 characters in one charset to another when decoding is performed.
 Each specification is a list of two elements: the source charset,
 and the destination charset.
-'output-charset-conversion
+`output-charset-conversion'
 A list of conversion specifications, specifying conversion of
 characters in one charset to another when encoding is performed.
 The form of each specification is the same as for
-'input-charset-conversion.
+`input-charset-conversion'.
 The following additional properties are recognized (and required)
-if TYPE is 'ccl:
+if TYPE is `ccl':
-'decode
+`decode'
 CCL program used for decoding (converting to internal format).
-'encode
+`encode'
 CCL program used for encoding (converting to external format).
-The following additional properties are recognized if TYPE is 'chain:
+The following additional properties are recognized if TYPE is `chain':
-'chain
+`chain'
 List of coding systems to be chained together, in decoding order.
-'canonicalize-after-coding
+`canonicalize-after-coding'
 Coding system to be returned by the detector routines in place of
 this coding system.
-The following additional properties are recognized if TYPE is 'unicode:
+The following additional properties are recognized if TYPE is `unicode':
-'type
+`type'
 One of `utf-16', `utf-8', `ucs-4', or `utf-7' (the latter is not
 yet implemented).  `utf-16' is the basic two-byte encoding;
 `ucs-4' is the four-byte encoding; `utf-8' is an ASCII-compatible
 variable-width 8-bit encoding; `utf-7' is a 7-bit encoding using
 only characters that will safely pass through all mail gateways.
 [[ This should be \"transformation format\".  There should also be
 `ucs-2' (or `bmp' -- no surrogates) and `utf-32' (range checked). ]]
-'little-endian
+`little-endian'
 If non-nil, `utf-16' and `ucs-4' will write out the groups of two
 or four bytes little-endian instead of big-endian.  This is required,
 for example, under Windows.
-'need-bom
+`need-bom'
 If non-nil, a byte order mark (BOM, or Unicode FEFF) should be
 written out at the beginning of the data.  This serves both to
 identify the endianness of the following data and to mark the
 data as Unicode (at least, this is how Windows uses it).
 [[ The correct term is \"signature\", since this technique may also
 be used with UTF-8.  That is the term used in the standard. ]]
 The following additional properties are recognized if TYPE is
-'mswindows-multibyte:
+`mswindows-multibyte':
-'code-page
+`code-page'
 Either a number (specifying a particular code page) or one of the
 symbols `ansi', `oem', `mac', or `ebcdic', specifying the ANSI,
 OEM, Macintosh, or EBCDIC code page associated with a particular
 locale (given by the `locale' property).  NOTE: EBCDIC code pages
 only exist in Windows 2000 and later.
-'locale
+`locale'
 If `code-page' is a symbol, this specifies the locale whose code
 page of the corresponding type should be used.  This should be
 one of the following: A cons of two strings, (LANGUAGE
 . SUBLANGUAGE) (see `mswindows-set-current-locale'); a string (a
 language; SUBLANG_DEFAULT, i.e. the default sublanguage, is
 `mswindows-current-locale', `mswindows-user-default-locale', or
 `mswindows-system-default-locale', respectively.
-The following additional properties are recognized if TYPE is 'undecided:
+The following additional properties are recognized if TYPE is `undecided':
 [[ Doesn't GNU use \"detect-*\" for the following two? ]]
-'do-eol
+`do-eol'
 Do EOL detection.
-'do-coding
+`do-coding'
 Do encoding detection.
-'coding-system
+`coding-system'
 If encoding detection is not done, use the specified coding system
 to do decoding.  This is used internally when implementing coding
 systems with an EOL type that specifies autodetection (the default),
 so that the detector routines return the proper subsidiary.
-The following additional property is recognized if TYPE is 'gzip:
+The following additional property is recognized if TYPE is `gzip':
-'level
+`level'
 Compression level: 0 through 9, or `default' (currently 6).
 */
 (name, type, description, props))
 {
 }
 DEFUN ("detect-coding-region", Fdetect_coding_region, 2, 3, 0, /*
 Detect coding system of the text in the region between START and END.
 Return a list of possible coding systems ordered by priority.
-If only ASCII characters are found, return 'undecided or one of
+If only ASCII characters are found, return `undecided' or one of
 its subsidiary coding systems according to a detected end-of-line
 type.  Optional arg BUFFER defaults to the current buffer.
 */
 (start, end, buffer))
 {

Mercurial > hg > xemacs-beta

comparison src/file-coding.c @ 3025:facf3239ba30