misc/patches/cldr_tools/21_default_repertire.patch
author jenda
Thu, 16 Jun 2011 15:52:21 +0200
changeset 141 23b21efdeb7e
parent 140 494b657b5f1d
permissions -rw-r--r--
7052998 PUA Unicode characters have defined wrong LC_CTYPE properties
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
134
455f05a692fc 7040301 Uncomplete LC_CTYPE information after migration to CLDR 1.9 & Unicode 6.0
jenda
parents: 130
diff changeset
     1
The repertoire is all assigned Unicode characters.
455f05a692fc 7040301 Uncomplete LC_CTYPE information after migration to CLDR 1.9 & Unicode 6.0
jenda
parents: 130
diff changeset
     2
140
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
     3
To reduce locale object size, PUA characters are not included in collation tables for UTF-8 locales.
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
     4
To generate correct ctype information for these characters, we have to add them to the POSIX_LCCtype repertoire.
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
     5
130
66e398a2332f 7011510 CLDR 1.9 locale data integration
jenda
parents:
diff changeset
     6
diff -ruN cldr_tools.orig//tools/java/org/unicode/cldr/posix/POSIXLocale.java cldr_tools/tools/java/org/unicode/cldr/posix/POSIXLocale.java
66e398a2332f 7011510 CLDR 1.9 locale data integration
jenda
parents:
diff changeset
     7
--- cldr_tools.orig//tools/java/org/unicode/cldr/posix/POSIXLocale.java	2011-04-15 15:33:44.072439117 +0200
66e398a2332f 7011510 CLDR 1.9 locale data integration
jenda
parents:
diff changeset
     8
+++ cldr_tools/tools/java/org/unicode/cldr/posix/POSIXLocale.java	2011-04-15 15:37:17.712439014 +0200
134
455f05a692fc 7040301 Uncomplete LC_CTYPE information after migration to CLDR 1.9 & Unicode 6.0
jenda
parents: 130
diff changeset
     9
@@ -100,6 +100,7 @@
130
66e398a2332f 7011510 CLDR 1.9 locale data integration
jenda
parents:
diff changeset
    10
         }
66e398a2332f 7011510 CLDR 1.9 locale data integration
jenda
parents:
diff changeset
    11
  
66e398a2332f 7011510 CLDR 1.9 locale data integration
jenda
parents:
diff changeset
    12
         repertoire.add(0x0000,0x007f);        // Always add the ASCII set
139
ab9fb5a8ad9a 7047526 fix - do not generate collation tables for private area characters
jenda
parents: 134
diff changeset
    13
+	repertoire.addAll(new UnicodeSet("[^[:Noncharacter_Code_Point:][:Cn:][:Cs:][:Co:]]"));
130
66e398a2332f 7011510 CLDR 1.9 locale data integration
jenda
parents:
diff changeset
    14
         
66e398a2332f 7011510 CLDR 1.9 locale data integration
jenda
parents:
diff changeset
    15
      }
66e398a2332f 7011510 CLDR 1.9 locale data integration
jenda
parents:
diff changeset
    16
      else if ( ! codeset.equals("UTF-8") )
141
23b21efdeb7e 7052998 PUA Unicode characters have defined wrong LC_CTYPE properties
jenda
parents: 140
diff changeset
    17
@@ -152,6 +153,8 @@
140
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
    18
          }
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
    19
        }
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
    20
       
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
    21
+      if (codeset.equals("UTF-8"))
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
    22
+         repertoire.addAll(new UnicodeSet("[:Co:]"));
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
    23
       lc_ctype = new POSIX_LCCtype ( doc, repertoire );
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
    24
       lc_numeric = new POSIX_LCNumeric( doc );
494b657b5f1d fix ab9fb5a8ad9a - private area characters were not handled correctly in non-UTF-8 locales
jenda
parents: 139
diff changeset
    25
       lc_monetary = new POSIX_LCMonetary( doc , supp , variant );