author | jenda |
Thu, 16 Jun 2011 15:52:21 +0200 | |
changeset 141 | 23b21efdeb7e |
parent 140 | 494b657b5f1d |
permissions | -rw-r--r-- |
134
455f05a692fc
7040301 Uncomplete LC_CTYPE information after migration to CLDR 1.9 & Unicode 6.0
jenda
parents:
130
diff
changeset
|
1 |
The repertoire is all assigned Unicode characters (excluding surrogate and private-use code points). |
455f05a692fc
7040301 Uncomplete LC_CTYPE information after migration to CLDR 1.9 & Unicode 6.0
jenda
parents:
130
diff
changeset
|
2 |
|
140
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
3 |
To reduce locale object size, Private Use Area (PUA) characters are not included in collation tables for UTF-8 locales. |
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
4 |
To generate correct ctype information for the PUA characters, we have to add them to the POSIX_LCCtype repertoire. |
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
5 |
|
130 | 6 |
diff -ruN cldr_tools.orig//tools/java/org/unicode/cldr/posix/POSIXLocale.java cldr_tools/tools/java/org/unicode/cldr/posix/POSIXLocale.java |
7 |
--- cldr_tools.orig//tools/java/org/unicode/cldr/posix/POSIXLocale.java 2011-04-15 15:33:44.072439117 +0200 |
|
8 |
+++ cldr_tools/tools/java/org/unicode/cldr/posix/POSIXLocale.java 2011-04-15 15:37:17.712439014 +0200 |
|
134
455f05a692fc
7040301 Uncomplete LC_CTYPE information after migration to CLDR 1.9 & Unicode 6.0
jenda
parents:
130
diff
changeset
|
9 |
@@ -100,6 +100,7 @@ |
130 | 10 |
} |
11 |
||
12 |
repertoire.add(0x0000,0x007f); // Always add the ASCII set |
|
139
ab9fb5a8ad9a
7047526 fix - do not generate collation tables for private area characters
jenda
parents:
134
diff
changeset
|
13 |
+ repertoire.addAll(new UnicodeSet("[^[:Noncharacter_Code_Point:][:Cn:][:Cs:][:Co:]]")); |
130 | 14 |
|
15 |
} |
|
16 |
else if ( ! codeset.equals("UTF-8") ) |
|
141
23b21efdeb7e
7052998 PUA Unicode characters have defined wrong LC_CTYPE properties
jenda
parents:
140
diff
changeset
|
17 |
@@ -152,6 +153,8 @@ |
140
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
18 |
} |
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
19 |
} |
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
20 |
|
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
21 |
+ if (codeset.equals("UTF-8")) |
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
22 |
+ repertoire.addAll(new UnicodeSet("[:Co:]")); |
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
23 |
lc_ctype = new POSIX_LCCtype ( doc, repertoire ); |
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
24 |
lc_numeric = new POSIX_LCNumeric( doc ); |
494b657b5f1d
fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents:
139
diff
changeset
|
25 |
lc_monetary = new POSIX_LCMonetary( doc , supp , variant ); |