diff lisp/code-init.el @ 985:7f62a956b825

[xemacs-hg @ 2002-09-01 06:41:40 by youngs] 2002-08-31 Seiichi Ikiuo <ikiuo@polyphony.co.jp> * code-init.el (reset-coding-categories-to-default): Add new coding category 'utf-8-bom'. * coding.el (coding-system-category): Add check for 'utf-8-bom'. * unicode.el: Add new coding system 'utf-8-bom'. 2002-08-31 Seiichi Ikiuo <ikiuo@polyphony.co.jp> * file-coding.h (detection_result): Fix DET_LOWEST. * mule-coding.c (big5_detector): Add member 'seen_euc_char'. (big5_detect): Changed so that it no longer causes trouble for EUC detection. (iso2022_detector): Add member 'longest_even_high_byte'. (iso2022_detect): Fix checking for even/odd_high_byte_group. Change how EUC is judged. * unicode.c: Add DETECTOR_CATEGORY utf_8_bom. (utf_8_detector): Add members byteno, first_byte and second_byte. (utf_8_detect): Add the judgment of UTF-8-BOM.
author youngs
date Sun, 01 Sep 2002 06:41:45 +0000
parents 2b6fa2618f76
children b531bf8658e9
line wrap: on
line diff
--- a/lisp/code-init.el	Sat Aug 31 11:04:01 2002 +0000
+++ b/lisp/code-init.el	Sun Sep 01 06:41:45 2002 +0000
@@ -276,6 +276,7 @@
 	--------------------------------------------------
         utf-16-little-endian-bom  utf-16-little-endian
 	utf-16-bom		  utf-16-bom
+	utf-8-bom		  utf-8-bom
 	iso-7			  iso-2022-7bit
 	no-conversion		  raw-text
 	utf-8			  utf-8
@@ -324,6 +325,7 @@
    (coding-system-variable-default-value 'no-conversion-coding-system-mapping))
   (set-coding-category-system 'ucs-4 'ucs-4)
   (set-coding-category-system 'utf-8 'utf-8)
+  (set-coding-category-system 'utf-8-bom 'utf-8-bom)
   (set-coding-category-system 'utf-16-little-endian 'utf-16-little-endian)
   (set-coding-category-system 'utf-16 'utf-16)
   (set-coding-category-system 'utf-16-little-endian-bom
@@ -333,6 +335,7 @@
    (if (featurep 'mule)
        '(utf-16-little-endian-bom
 	 utf-16-bom
+	 utf-8-bom
 	 iso-7
 	 no-conversion
 	 utf-8
@@ -347,6 +350,7 @@
 	 ucs-4)
      '(utf-16-little-endian-bom
        utf-16-bom
+       utf-8-bom
        no-conversion
        utf-8
        utf-16-little-endian