From 7e6eccb5f611973038ad78c870ffcdd6af72c228 Mon Sep 17 00:00:00 2001 From: Carlos O'Donell Date: Wed, 24 Feb 2016 14:31:35 -0500 Subject: GB 18030-2005: Document non-roundtrip and PUA mappings (bug 19575). --- ChangeLog | 6 ++++++ localedata/charmaps/GB18030 | 25 +++++++++++++++++++++++++ 2 files changed, 31 insertions(+) diff --git a/ChangeLog b/ChangeLog index ce9e24ee76..d83bf39870 100644 --- a/ChangeLog +++ b/ChangeLog @@ -1,3 +1,9 @@ +2016-02-24 Carlos O'Donell + + [BZ #19575] + * localedata/charmaps/GB18030: Update comments regarding PUA to + non-PUA mappings. + 2016-02-24 Joseph Myers * sysdeps/unix/sysv/linux/configure.ac (linux/fanotify.h): Do not diff --git a/localedata/charmaps/GB18030 b/localedata/charmaps/GB18030 index 863a123440..ad6728c5bd 100644 --- a/localedata/charmaps/GB18030 +++ b/localedata/charmaps/GB18030 @@ -57234,6 +57234,22 @@ CHARMAP /xa6/xbe /xa6/xbf /xa6/xc0 +% The newest GB 18030-2005 standard still uses some private use area +% code points. Any implementation which has Unicode 4.1 or newer +% support should not use these PUA code points, and instead should +% map these entries to their equivalent non-PUA code points. There +% are 24 ideograms in GB 18030-2005 which have non-PUA equivalents. +% In glibc we only support roundtrip code points, and so must choose +% between supporting the old PUA code points, or using the newer +% non-PUA code points. We choose to use the non-PUA code points to +% be compatible with ICU's similar choice. In choosing the non-PUA +% code points we can no longer convert the old PUA code points back +% to GB 18030-2005 (technically only fixable if we added support +% for non-roundtrip code points e.g. ICU's "fallback mapping"). +% The recommendation to use the non-PUA code points, where available, +% is based on "CJKV Information Processing" 2nd Ed. by Dr. Ken Lunde. +% +% These 10 PUA mappings use equivalents from U+FE10 to U+FE19. 
% /xa6/xd9 % /xa6/xda % /xa6/xdb @@ -57371,6 +57387,7 @@ CHARMAP /xd7/xfd /xd7/xfe /x83/x36/xc9/x34 +% These 3 PUA mappings use equivalents U+20087, U+20089 and U+200CC. % /xfe/x51 % /xfe/x52 % /xfe/x53 @@ -57379,6 +57396,7 @@ CHARMAP /x83/x36/xc9/x37 /x83/x36/xc9/x38 /x83/x36/xc9/x39 +% This 1 PUA mapping uses the equivalent U+9FB4. % /xfe/x59 /x83/x36/xca/x30 /x83/x36/xca/x31 @@ -57387,17 +57405,20 @@ CHARMAP /x83/x36/xca/x34 /x83/x36/xca/x35 /x83/x36/xca/x36 +% This 1 PUA mapping uses the equivalent U+9FB5. % /xfe/x61 /x83/x36/xca/x37 /x83/x36/xca/x38 /x83/x36/xca/x39 /x83/x36/xcb/x30 +% These 2 PUA mappings use the equivalents U+9FB6 and U+9FB7. % /xfe/x66 % /xfe/x67 /x83/x36/xcb/x31 /x83/x36/xcb/x32 /x83/x36/xcb/x33 /x83/x36/xcb/x34 +% These 2 PUA mappings use the equivalents U+215D7 and U+9FB8. % /xfe/x6c % /xfe/x6d /x83/x36/xcb/x35 @@ -57408,6 +57429,7 @@ CHARMAP /x83/x36/xcc/x30 /x83/x36/xcc/x31 /x83/x36/xcc/x32 +% This 1 PUA mapping uses the equivalent U+2298F. % /xfe/x76 /x83/x36/xcc/x33 /x83/x36/xcc/x34 @@ -57416,6 +57438,7 @@ CHARMAP /x83/x36/xcc/x37 /x83/x36/xcc/x38 /x83/x36/xcc/x39 +% This 1 PUA mapping uses the equivalent U+9FB9. % /xfe/x7e /x83/x36/xcd/x30 /x83/x36/xcd/x31 @@ -57433,6 +57456,7 @@ CHARMAP /x83/x36/xce/x33 /x83/x36/xce/x34 /x83/x36/xce/x35 +% These 2 PUA mappings use the equivalents U+9FBA and U+241FE. % /xfe/x90 % /xfe/x91 /x83/x36/xce/x36 @@ -57449,6 +57473,7 @@ CHARMAP /x83/x36/xcf/x37 /x83/x36/xcf/x38 /x83/x36/xcf/x39 +% This 1 PUA mapping uses the equivalent U+9FBB. % /xfe/xa0 /x83/x36/xd0/x30 /x83/x36/xd0/x31 -- cgit 1.4.1