last changes (I hope) for Unicode 3.2

X-SVN-Rev: 8209
This commit is contained in:
Mark Davis 2002-03-22 22:08:53 +00:00
parent 9a6483bf77
commit 6e84854a03
3 changed files with 29 additions and 15 deletions

View file

@ -27,15 +27,16 @@
# C: common case folding, common mappings shared by both simple and full mappings.
# F: full case folding, mappings that cause strings to grow in length. Multiple characters are separated by spaces.
# S: simple case folding, mappings to single characters where different from F.
# I: special case for dotted uppercase I and dotless lowercase i
# - If this mapping is included, the result is case-insensitive, but dotless and dotted I's are not distinguished.
# - If this mapping is excluded, the result is not fully case-insensitive, but dotless and dotted I's are distinguished.
# T: special case for uppercase I and dotted uppercase I
# - For non-Turkic languages, this mapping is normally not used.
# - For Turkic languages (tr, az), this mapping can be used instead of the normal mapping for these characters.
#
# Usage:
# A. To do a simple case folding, use the mappings with status C + S + I.
# B. To do a full case folding, use the mappings with status C + F + I.
# The mappings with status I can be omitted depending on the desired case-folding
# behavior. (The default option is to retain them.)
# A. To do a simple case folding, use the mappings with status C + S.
# B. To do a full case folding, use the mappings with status C + F.
#
# The mappings with status T can be used or omitted depending on the desired case-folding
# behavior. (The default option is to exclude them.)
#
# =================================================================

View file

@ -5,8 +5,8 @@
*******************************************************************************
*
* $Source: /xsrl/Nsvn/icu/unicodetools/com/ibm/text/UCD/GenerateCaseFolding.java,v $
* $Date: 2002/03/20 00:21:43 $
* $Revision: 1.7 $
* $Date: 2002/03/22 22:08:53 $
* $Revision: 1.8 $
*
*******************************************************************************
*/
@ -85,11 +85,15 @@ public class GenerateCaseFolding implements UCD_Types {
if (rFull != null && rFull.equals(rSimple)
|| (PICK_SHORT && UTF16.countCodePoint(rFull) == 1)) {
String type = "C";
if (ch == 0x130) {
if (ch == 0x49) {
drawLine(out, ch, "C", "i");
drawLine(out, ch, "T", "\u0131");
} else if (ch == 0x130) {
drawLine(out, ch, "F", "i\u0307");
drawLine(out, ch, "I", "\u0130");
drawLine(out, ch, "T", "i");
} else if (ch == 0x131) {
drawLine(out, ch, "I", "i");
// do nothing
//drawLine(out, ch, "I", "i");
} else {
drawLine(out, ch, type, rFull);
}
@ -106,6 +110,15 @@ public class GenerateCaseFolding implements UCD_Types {
log.close();
Utility.renameIdentical(mostRecent, Utility.getOutputName(newFile));
}
/* Goal is following (with no entries for 0131 or 0069)
0049; C; 0069; # LATIN CAPITAL LETTER I
0049; T; 0131; # LATIN CAPITAL LETTER I
0130; F; 0069 0307; # LATIN CAPITAL LETTER I WITH DOT ABOVE
0130; T; 0069; # LATIN CAPITAL LETTER I WITH DOT ABOVE
*/
static void drawLine(PrintWriter out, int ch, String type, String result) {
String comment = "";

View file

@ -5,8 +5,8 @@
*******************************************************************************
*
* $Source: /xsrl/Nsvn/icu/unicodetools/com/ibm/text/UCD/UCD_Types.java,v $
* $Date: 2002/03/20 00:21:42 $
* $Revision: 1.10 $
* $Date: 2002/03/22 22:08:53 $
* $Revision: 1.11 $
*
*******************************************************************************
*/
@ -15,7 +15,7 @@ package com.ibm.text.UCD;
public interface UCD_Types {
public static final int dVersion = 8; // change to fix the generated file D version. If less than zero, no "d"
public static final int dVersion = 9; // change to fix the generated file D version. If less than zero, no "d"
public static final String BASE_DIR = "C:\\DATA\\";
public static final String UCD_DIR = BASE_DIR + "UCD\\";