Fix for ab9fb5a8ad9a - private use area (PUA) characters were not handled correctly in non-UTF-8 locales.
The repertoire is all assigned Unicode characters (excluding noncharacters, surrogates, and private use characters).
To reduce locale object size, private use area (PUA) characters are not included in the collation tables for UTF-8 locales.
To generate correct ctype information for these characters, we have to add them to the POSIX_LCCtype repertoire.
diff -ruN cldr_tools.orig//tools/java/org/unicode/cldr/posix/POSIXLocale.java cldr_tools/tools/java/org/unicode/cldr/posix/POSIXLocale.java
--- cldr_tools.orig//tools/java/org/unicode/cldr/posix/POSIXLocale.java 2011-04-15 15:33:44.072439117 +0200
+++ cldr_tools/tools/java/org/unicode/cldr/posix/POSIXLocale.java 2011-04-15 15:37:17.712439014 +0200
@@ -100,6 +100,7 @@
}
repertoire.add(0x0000,0x007f); // Always add the ASCII set
+ repertoire.addAll(new UnicodeSet("[^[:Noncharacter_Code_Point:][:Cn:][:Cs:][:Co:]]"));
}
else if ( ! codeset.equals("UTF-8") )
{
@@ -152,6 +153,9 @@
}
}
+ if (codeset.equals("UTF-8"))
+ repertoire.addAll(new UnicodeSet("[:Co:]"));
+
lc_ctype = new POSIX_LCCtype ( doc, repertoire );
lc_numeric = new POSIX_LCNumeric( doc );
lc_monetary = new POSIX_LCMonetary( doc , supp , variant );