From 1a37348f3b79e7fab6ff4b76524dcecfb4b7c1dd Mon Sep 17 00:00:00 2001 From: Markus Scherer Date: Tue, 21 Jun 2005 15:14:27 +0000 Subject: [PATCH] ICU-4416 add test cases for ucnv_getUnicodeSet() for Unicode charsets X-SVN-Rev: 17954 --- icu4c/source/test/testdata/conversion.txt | 70 +++++++++++++++++++++++ 1 file changed, 70 insertions(+) diff --git a/icu4c/source/test/testdata/conversion.txt b/icu4c/source/test/testdata/conversion.txt index 0ae0b8c3989..773e5e4e08e 100644 --- a/icu4c/source/test/testdata/conversion.txt +++ b/icu4c/source/test/testdata/conversion.txt @@ -982,6 +982,76 @@ conversion { // which - numeric UConverterUnicodeSet value Headers { "charset", "map", "mapnot", "which" } Cases { + // Unicode charsets that do not map surrogate code points + { + "UTF-8", + "[\x00-\ud7ff\ue000-\U0010ffff]", + "[\ud800-\udfff]", + :int{0} + } + { + "UTF-16", + "[\x00-\ud7ff\ue000-\U0010ffff]", + "[\ud800-\udfff]", + :int{0} + } + { + "UTF-16BE", + "[\x00-\ud7ff\ue000-\U0010ffff]", + "[\ud800-\udfff]", + :int{0} + } + { + "UTF-16LE", + "[\x00-\ud7ff\ue000-\U0010ffff]", + "[\ud800-\udfff]", + :int{0} + } + { + "UTF-32", + "[\x00-\ud7ff\ue000-\U0010ffff]", + "[\ud800-\udfff]", + :int{0} + } + { + "UTF-32BE", + "[\x00-\ud7ff\ue000-\U0010ffff]", + "[\ud800-\udfff]", + :int{0} + } + { + "UTF-32LE", + "[\x00-\ud7ff\ue000-\U0010ffff]", + "[\ud800-\udfff]", + :int{0} + } + + // Unicode charsets that do map surrogate code points + { + "UTF-7", + "[\x00-\U0010ffff]", + "[]", + :int{0} + } + { + "SCSU", + "[\x00-\U0010ffff]", + "[]", + :int{0} + } + { + "BOCU-1", + "[\x00-\U0010ffff]", + "[]", + :int{0} + } + { + "CESU-8", + "[\x00-\U0010ffff]", + "[]", + :int{0} + } + // versions of ISO-2022-KR { "ISO-2022-KR",