changeset 4084:49c847ce8aa6

[xemacs-hg @ 2007-07-28 08:25:40 by aidan] Don't map any BIG5 characters to U+FFFD.
author aidan
date Sat, 28 Jul 2007 08:25:44 +0000
parents a3f8bb07ab38
children 023ebc75c06e
files etc/ChangeLog etc/unicode/unicode-consortium/BIG5.TXT
diffstat 2 files changed, 19 insertions(+), 7 deletions(-) [+]
line wrap: on
line diff
--- a/etc/ChangeLog	Sat Jul 28 08:02:16 2007 +0000
+++ b/etc/ChangeLog	Sat Jul 28 08:25:44 2007 +0000
@@ -1,3 +1,10 @@
+2007-07-28  Aidan Kehoe  <kehoea@parhasard.net>
+
+	* unicode/unicode-consortium/BIG5.TXT:
+	Don't map any characters to U+FFFD; for round trip compatibility,
+	map those that were mapped to U+FFFD to the Unicode private use
+	area.
+
 2007-05-21  Stephen J. Turnbull  <stephen@xemacs.org>
 
 	* XEmacs 21.5.28 "fuki" is released.
--- a/etc/unicode/unicode-consortium/BIG5.TXT	Sat Jul 28 08:02:16 2007 +0000
+++ b/etc/unicode/unicode-consortium/BIG5.TXT	Sat Jul 28 08:25:44 2007 +0000
@@ -58,6 +58,11 @@
 #	We currently map all of these characters to U+FFFD REPLACEMENT CHARACTER.
 #		It is also possible to map these characters to their duplicates, or to
 #		the user zone.  
+#
+#       XEmacs change: instead of U+FFFD, we map each of them to the private
+#       use code point U+F0000 + its BIG5 code (0xA15A => U+FA15A, and so on),
+#       so that they round-trip. See
+#       http://mid.gmane.org/s3tsl7j7zg9.fsf@magellan.suse.de and discussion.
 #	
 #	Notes:
 #
@@ -118,7 +123,7 @@
 0xA157	0xFE31	# PRESENTATION FORM FOR VERTICAL EM DASH
 0xA158	0x2014	# EM DASH
 0xA159	0xFE33	# PRESENTATION FORM FOR VERTICAL LOW LINE
-0xA15A	0xFFFD	# *** NO MAPPING ***
+0xA15A	0xFA15A	# #### PRIVATE USE
 0xA15B	0xFE34	# PRESENTATION FORM FOR VERTICAL WAVY LOW LINE
 0xA15C	0xFE4F	# WAVY LOW LINE
 0xA15D	0xFF08	# FULLWIDTH LEFT PARENTHESIS
@@ -189,9 +194,9 @@
 0xA1C0	0x32A3	# CIRCLED IDEOGRAPH CORRECT
 0xA1C1	0x2105	# CARE OF
 0xA1C2	0x203E	# OVERLINE
-0xA1C3	0xFFFD	# *** NO MAPPING ***
+0xA1C3	0xFA1C3	# #### PRIVATE USE
 0xA1C4	0xFF3F	# FULLWIDTH LOW LINE
-0xA1C5	0xFFFD	# *** NO MAPPING ***
+0xA1C5	0xFA1C5	# #### PRIVATE USE
 0xA1C6	0xFE49	# DASHED OVERLINE
 0xA1C7	0xFE4A	# CENTRELINE OVERLINE
 0xA1C8	0xFE4D	# DASHED LOW LINE
@@ -248,8 +253,8 @@
 0xA1FB	0x2198	# SOUTH EAST ARROW
 0xA1FC	0x2225	# PARALLEL TO
 0xA1FD	0x2223	# DIVIDES
-0xA1FE	0xFFFD	# *** NO MAPPING ***
-0xA240	0xFFFD	# *** NO MAPPING ***
+0xA1FE	0xFA1FE	# #### PRIVATE USE
+0xA240	0xFA240	# #### PRIVATE USE
 0xA241	0xFF0F	# FULLWIDTH SOLIDUS
 0xA242	0xFF3C	# FULLWIDTH REVERSE SOLIDUS
 0xA243	0xFF04	# FULLWIDTH DOLLAR SIGN
@@ -355,9 +360,9 @@
 0xA2C9	0x3027	# HANGZHOU NUMERAL SEVEN
 0xA2CA	0x3028	# HANGZHOU NUMERAL EIGHT
 0xA2CB	0x3029	# HANGZHOU NUMERAL NINE
-0xA2CC	0xFFFD	# *** NO MAPPING ***
+0xA2CC	0xFA2CC	# #### PRIVATE USE
 0xA2CD	0x5344	# <CJK>
-0xA2CE	0xFFFD	# *** NO MAPPING ***
+0xA2CE	0xFA2CE	# #### PRIVATE USE
 0xA2CF	0xFF21	# FULLWIDTH LATIN CAPITAL LETTER A
 0xA2D0	0xFF22	# FULLWIDTH LATIN CAPITAL LETTER B
 0xA2D1	0xFF23	# FULLWIDTH LATIN CAPITAL LETTER C