From e0e7b8f937a1daed3179e2bdcc931c00a0778d53 Mon Sep 17 00:00:00 2001 From: Andy Heninger Date: Fri, 30 May 2003 16:07:39 +0000 Subject: [PATCH] ICU-2093 clean up comments in break rule files. X-SVN-Rev: 12197 --- icu4c/source/data/brkitr/char.txt | 9 ++++++--- icu4c/source/data/brkitr/line.txt | 4 +--- icu4c/source/data/brkitr/sent.txt | 2 +- icu4c/source/data/brkitr/title.txt | 2 +- 4 files changed, 9 insertions(+), 8 deletions(-) diff --git a/icu4c/source/data/brkitr/char.txt b/icu4c/source/data/brkitr/char.txt index 6c004649b2b..ff6969fd437 100644 --- a/icu4c/source/data/brkitr/char.txt +++ b/icu4c/source/data/brkitr/char.txt @@ -1,12 +1,12 @@ # -# Copyright (C) 2002, International Business Machines Corporation and others. +# Copyright (C) 2002-2003, International Business Machines Corporation and others. # All Rights Reserved. # # file: char.txt # # ICU Character Break Rules, also known as Grapheme Cluster Boundaries -# See Unicode Technical Report #29. -# These rules are based on the proposed draft dated 2002-08-06 +# See Unicode Standard Annex #29. +# These rules are based on TR29 Version 4.0.0 # # @@ -31,6 +31,9 @@ $LVT = [:Hangul_Syllable_Type = LVT:]; $HangulSyllable = $L+ | ($L* ($LV? $V+ | $LV | $LVT) $T*) | $T+; +# +# Forward Break Rules +# $CR $LF; ([^$Control] | $HangulSyllable) $Extend*; .; diff --git a/icu4c/source/data/brkitr/line.txt b/icu4c/source/data/brkitr/line.txt index 7d3f74a4fb9..128d36980f0 100644 --- a/icu4c/source/data/brkitr/line.txt +++ b/icu4c/source/data/brkitr/line.txt @@ -1,4 +1,4 @@ -# Copyright (c) 2002, 2003 International Business Machines Corporation and +# Copyright (c) 2002-2003 International Business Machines Corporation and # others. All Rights Reserved. # # file: line.txt @@ -58,8 +58,6 @@ $ALPlus = $AL | $AI | $SA; # # Combining Marks. X $CM* behaves as if it were X. Rule LB6. -# TODO: This is going to produce some odd results, because of the non-combining -# chars that are included in $CM. Use $Extend instead, where possible. # $ALcm = $ALPlus $CM*; $IDcm = ($ID $CM* | $SP $CM+); diff --git a/icu4c/source/data/brkitr/sent.txt b/icu4c/source/data/brkitr/sent.txt index a91964e85ee..e849829429b 100644 --- a/icu4c/source/data/brkitr/sent.txt +++ b/icu4c/source/data/brkitr/sent.txt @@ -6,7 +6,7 @@ # # ICU Sentence Break Rules # See Unicode Standard Annex #29. -# These rules are based on the draft dated 2003-03-31 +# These rules are based on TR 29 version 4.0.0 # diff --git a/icu4c/source/data/brkitr/title.txt b/icu4c/source/data/brkitr/title.txt index 95a3d09510d..d12517f6d2e 100644 --- a/icu4c/source/data/brkitr/title.txt +++ b/icu4c/source/data/brkitr/title.txt @@ -1,4 +1,4 @@ -# Copyright (c) 2002, International Business Machines Corporation and +# Copyright (c) 2002-2003, International Business Machines Corporation and # others. All Rights Reserved. # # Title Casing Break Rules