Reclassify U+200B ZERO WIDTH SPACE as a space separator.

This patch changes the general category of U+200B from Cf to Zs in
UnicodeData.txt, removes it from the BN / Join_Type=T / Control / Format
lists, adds it to Grapheme_Base and Sentence_Break=Sp, adjusts the affected
"Total code points" counters, and updates the matching expectation in
test/cintltst/cucdtst.c.

Retired data-file entries are kept as '#' comments, the only comment syntax
the UCD text files define.

NOTE(review): column padding and indentation inside the hunks appear to have
been collapsed to single spaces in the copy this was rebuilt from; confirm
against the pristine files (or regenerate with diff -ur) before applying
with strict whitespace matching.
NOTE(review): UnicodeData.txt still lists bidi class BN for U+200B while
DerivedBidiClass.txt drops it from BN -- confirm which is intended.

diff -ur original_source/data/unidata/DerivedBidiClass.txt source/data/unidata/DerivedBidiClass.txt
--- original_source/data/unidata/DerivedBidiClass.txt	2006-06-14 06:14:36.000000000 +0700
+++ source/data/unidata/DerivedBidiClass.txt	2008-05-17 11:28:02.015625000 +0700
@@ -1176,7 +1176,8 @@
 0086..009F ; BN # Cc [26] <control-0086>..<control-009F>
 00AD ; BN # Cf SOFT HYPHEN
 070F ; BN # Cf SYRIAC ABBREVIATION MARK
-200B..200D ; BN # Cf [3] ZERO WIDTH SPACE..ZERO WIDTH JOINER
+# 200B..200D ; BN # Cf [3] ZERO WIDTH SPACE..ZERO WIDTH JOINER
+200C..200D ; BN # Cf [2] ZERO WIDTH NON-JOINER..ZERO WIDTH JOINER
 2060..2063 ; BN # Cf [4] WORD JOINER..INVISIBLE SEPARATOR
 2064..2069 ; BN # Cn [6] <reserved-2064>..<reserved-2069>
 206A..206F ; BN # Cf [6] INHIBIT SYMMETRIC SWAPPING..NOMINAL DIGIT SHAPES
diff -ur original_source/data/unidata/DerivedCoreProperties.txt source/data/unidata/DerivedCoreProperties.txt
--- original_source/data/unidata/DerivedCoreProperties.txt	2006-03-04 03:55:12.000000000 +0700
+++ source/data/unidata/DerivedCoreProperties.txt	2008-05-17 11:28:49.406250000 +0700
@@ -4560,7 +4560,8 @@
 1FF2..1FF4 ; Grapheme_Base
 1FF6..1FFC ; Grapheme_Base
 1FFD..1FFE ; Grapheme_Base
-2000..200A ; Grapheme_Base
+# 2000..200A ; Grapheme_Base
+2000..200B ; Grapheme_Base
 2010..2015 ; Grapheme_Base
 2016..2017 ; Grapheme_Base
 2018 ; Grapheme_Base
diff -ur original_source/data/unidata/DerivedJoiningType.txt source/data/unidata/DerivedJoiningType.txt
--- original_source/data/unidata/DerivedJoiningType.txt	2006-06-14 06:14:38.000000000 +0700
+++ source/data/unidata/DerivedJoiningType.txt	2008-05-17 11:31:47.968750000 +0700
@@ -208,7 +208,7 @@
 1B6B..1B73 ; T # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG
 1DC0..1DCA ; T # Mn [11] COMBINING DOTTED GRAVE ACCENT..COMBINING LATIN SMALL LETTER R BELOW
 1DFE..1DFF ; T # Mn [2] COMBINING LEFT ARROWHEAD ABOVE..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW
-200B ; T # Cf ZERO WIDTH SPACE
+# 200B ; T # Cf ZERO WIDTH SPACE ---> BACK TO BE A WORD SEPARATOR CHARACTER
 200E..200F ; T # Cf [2] LEFT-TO-RIGHT MARK..RIGHT-TO-LEFT MARK
 202A..202E ; T # Cf [5] LEFT-TO-RIGHT EMBEDDING..RIGHT-TO-LEFT OVERRIDE
 2060..2063 ; T # Cf [4] WORD JOINER..INVISIBLE SEPARATOR
diff -ur original_source/data/unidata/GraphemeBreakProperty.txt source/data/unidata/GraphemeBreakProperty.txt
--- original_source/data/unidata/GraphemeBreakProperty.txt	2006-06-14 06:14:38.000000000 +0700
+++ source/data/unidata/GraphemeBreakProperty.txt	2008-05-17 11:29:44.875000000 +0700
@@ -38,7 +38,7 @@
 06DD ; Control
 070F ; Control
 17B4..17B5 ; Control
-200B ; Control
+# 200B ; Control --> ZWSP is a word separation character
 200E..200F ; Control
 2028 ; Control
 2029 ; Control
@@ -51,7 +51,7 @@
 E0001 ; Control
 E0020..E007F ; Control
 
-# Total code points: 201
+# Total code points: 200
 
 # ================================================
 
diff -ur original_source/data/unidata/SentenceBreakProperty.txt source/data/unidata/SentenceBreakProperty.txt
--- original_source/data/unidata/SentenceBreakProperty.txt	2006-06-14 06:14:38.000000000 +0700
+++ source/data/unidata/SentenceBreakProperty.txt	2008-05-17 11:31:05.000000000 +0700
@@ -32,7 +32,7 @@
 06DD ; Format
 070F ; Format
 17B4..17B5 ; Format
-200B ; Format
+# 200B ; Format --> ZWSP is a word separation character.
 200E..200F ; Format
 202A..202E ; Format
 2060..2063 ; Format
@@ -43,7 +43,7 @@
 E0001 ; Format
 E0020..E007F ; Format
 
-# Total code points: 136
+# Total code points: 135
 
 # ================================================
 
@@ -52,12 +52,13 @@
 0020 ; Sp
 1680 ; Sp
 180E ; Sp
-2000..200A ; Sp
+# 2000..200A ; Sp
+2000..200B ; Sp
 202F ; Sp
 205F ; Sp
 3000 ; Sp
 
-# Total code points: 20
+# Total code points: 21
 
 # ================================================
 
diff -ur original_source/data/unidata/UnicodeData.txt source/data/unidata/UnicodeData.txt
--- original_source/data/unidata/UnicodeData.txt	2006-06-14 06:14:38.000000000 +0700
+++ source/data/unidata/UnicodeData.txt	2008-05-17 09:56:05.375000000 +0700
@@ -6105,7 +6105,7 @@
 2008;PUNCTUATION SPACE;Zs;0;WS;<compat> 0020;;;;N;;;;;
 2009;THIN SPACE;Zs;0;WS;<compat> 0020;;;;N;;;;;
 200A;HAIR SPACE;Zs;0;WS;<compat> 0020;;;;N;;;;;
-200B;ZERO WIDTH SPACE;Cf;0;BN;;;;;N;;;;;
+200B;ZERO WIDTH SPACE;Zs;0;BN;;;;;N;;;;;
 200C;ZERO WIDTH NON-JOINER;Cf;0;BN;;;;;N;;;;;
 200D;ZERO WIDTH JOINER;Cf;0;BN;;;;;N;;;;;
 200E;LEFT-TO-RIGHT MARK;Cf;0;L;;;;;N;;;;;
diff -ur original_source/data/unidata/WordBreakProperty.txt source/data/unidata/WordBreakProperty.txt
--- original_source/data/unidata/WordBreakProperty.txt	2006-06-14 06:14:38.000000000 +0700
+++ source/data/unidata/WordBreakProperty.txt	2008-05-17 11:31:22.609375000 +0700
@@ -22,7 +22,7 @@
 06DD ; Format
 070F ; Format
 17B4..17B5 ; Format
-200B ; Format
+# 200B ; Format ==> ZERO WIDTH SPACE IS A WORD SEPARATION CHARACTER
 200E..200F ; Format
 202A..202E ; Format
 2060..2063 ; Format
@@ -33,7 +33,7 @@
 E0001 ; Format
 E0020..E007F ; Format
 
-# Total code points: 136
+# Total code points: 135
 
 # ================================================
 
diff -ur original_source/test/cintltst/cucdtst.c source/test/cintltst/cucdtst.c
--- original_source/test/cintltst/cucdtst.c	2006-08-20 12:08:34.000000000 +0700
+++ source/test/cintltst/cucdtst.c	2008-05-17 15:01:14.921875000 +0700
@@ -801,8 +801,8 @@
  { 0x2002, ISPR|ISSP|ISBL }, /* en space */
  { 0x2007, ISPR|ISSP|ISBL }, /* figure space */
  { 0x2009, ISPR|ISSP|ISBL }, /* thin space */
- { 0x200b, ISCN }, /* ZWSP */
- /*{ 0x200b, ISPR|ISSP },*/ /* ZWSP */ /* ZWSP became a control char in 4.0.1*/
+ /* { 0x200b, ISCN }, */ /* ZWSP was turned into a control character in 4.0.1 and is now back to a space */
+ { 0x200b, ISPR|ISSP }, /* ZWSP */
  { 0x200e, ISCN }, /* LRM */
  { 0x2028, ISPR|ISSP| ISCN }, /* LS */
  { 0x2029, ISPR|ISSP| ISCN }, /* PS */