diff lisp/unicode.el @ 985:7f62a956b825

[xemacs-hg @ 2002-09-01 06:41:40 by youngs] 2002-08-31 Seiichi Ikiuo <ikiuo@polyphony.co.jp> * code-init.el (reset-coding-categories-to-default): Add new coding category 'utf-8-bom'. * coding.el (coding-system-category): Add check for 'utf-8-bom'. * unicode.el: Add new coding system 'utf-8-bom'. 2002-08-31 Seiichi Ikiuo <ikiuo@polyphony.co.jp> * file-coding.h (detection_result): fix DET_LOWEST. * mule-coding.c (big5_detector): Add member 'seen_euc_char'. (big5_detect): It was made not to become the trouble of EUC. (iso2022_detector): Add member 'longest_even_high_byte'. (iso2022_detect): Fix checking for even/odd_high_byte_group. The judgment of EUC is changed. * unicode.c: Add DETECTOR_CATEGORY utf_8_bom. (utf_8_detector): Add member byteno, first_byte and second_byte. (utf_8_detect): The judgment of UTF-8-BOM is added.
author youngs
date Sun, 01 Sep 2002 06:41:45 +0000
parents e54d47b2d736
children b531bf8658e9
line wrap: on
line diff
--- a/lisp/unicode.el	Sat Aug 31 11:04:01 2002 +0000
+++ b/lisp/unicode.el	Sun Sep 01 06:41:45 2002 +0000
@@ -281,6 +281,17 @@
 "
    type utf-8))
 
+(make-coding-system                    ; registers the new `utf-8-bom' coding system added by this change
+ 'utf-8-bom 'unicode                   ; presumably the NAME and TYPE arguments -- confirm against `make-coding-system'
+ "UTF-8 w/BOM"                         ; short human-readable description
+ '(mnemonic "MSW-UTF8"                 ; quoted property list: alternating property names and values
+   documentation
+   "UTF-8 Unicode encoding, with byte order mark.
+Standard encoding for representing UTF-8 under MS Windows."
+   type utf-8                          ; same `type' value as the definition immediately above this one
+   little-endian t                     ; NOTE(review): UTF-8 has no byte order; presumably ignored for this type -- confirm in unicode.c
+   need-bom t))                        ; presumably the flag that distinguishes this BOM variant -- confirm in unicode.c
+
 ;; #### UTF-7 is not yet implemented, and it's tricky to do.  There's
 ;; an implementation in appendix A.1 of the Unicode Standard, Version
 ;; 2.0, but I don't know its licensing characteristics.