1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
base / i18n / case_conversion_unittest.cc [blame]
// Copyright 2011 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "base/i18n/case_conversion.h"
#include "base/i18n/rtl.h"
#include "base/strings/utf_string_conversions.h"
#include "base/test/icu_test_util.h"
#include "testing/gtest/include/gtest/gtest.h"
#include "third_party/icu/source/i18n/unicode/usearch.h"
namespace base {
namespace i18n {
namespace {
const char16_t kNonASCIIMixed[] =
u"\xC4\xD6\xE4\xF6\x20\xCF\xEF\x20\xF7\x25"
u"\xA4\x23\x2A\x5E\x60\x40\xA3\x24\x2030\x201A\x7E\x20\x1F07\x1F0F"
u"\x20\x1E00\x1E01";
const char16_t kNonASCIILower[] =
u"\xE4\xF6\xE4\xF6\x20\xEF\xEF"
u"\x20\xF7\x25\xA4\x23\x2A\x5E\x60\x40\xA3\x24\x2030\x201A\x7E\x20\x1F07"
u"\x1F07\x20\x1E01\x1E01";
const char16_t kNonASCIIUpper[] =
u"\xC4\xD6\xC4\xD6\x20\xCF\xCF"
u"\x20\xF7\x25\xA4\x23\x2A\x5E\x60\x40\xA3\x24\x2030\x201A\x7E\x20\x1F0F"
u"\x1F0F\x20\x1E00\x1E00";
} // namespace
// Test upper and lower case string conversion.
TEST(CaseConversionTest, UpperLower) {
const std::u16string mixed(u"Text with UPPer & lowER casE.");
const std::u16string expected_lower(u"text with upper & lower case.");
const std::u16string expected_upper(u"TEXT WITH UPPER & LOWER CASE.");
std::u16string result = ToLower(mixed);
EXPECT_EQ(expected_lower, result);
result = ToUpper(mixed);
EXPECT_EQ(expected_upper, result);
}
TEST(CaseConversionTest, NonASCII) {
const std::u16string mixed(kNonASCIIMixed);
const std::u16string expected_lower(kNonASCIILower);
const std::u16string expected_upper(kNonASCIIUpper);
std::u16string result = ToLower(mixed);
EXPECT_EQ(expected_lower, result);
result = ToUpper(mixed);
EXPECT_EQ(expected_upper, result);
}
TEST(CaseConversionTest, TurkishLocaleConversion) {
const std::u16string mixed(u"\x49\x131");
const std::u16string expected_lower(u"\x69\x131");
const std::u16string expected_upper(u"\x49\x49");
test::ScopedRestoreICUDefaultLocale restore_locale;
i18n::SetICUDefaultLocale("en_US");
std::u16string result = ToLower(mixed);
EXPECT_EQ(expected_lower, result);
result = ToUpper(mixed);
EXPECT_EQ(expected_upper, result);
i18n::SetICUDefaultLocale("tr");
const std::u16string expected_lower_turkish(u"\x131\x131");
const std::u16string expected_upper_turkish(u"\x49\x49");
result = ToLower(mixed);
EXPECT_EQ(expected_lower_turkish, result);
result = ToUpper(mixed);
EXPECT_EQ(expected_upper_turkish, result);
}
TEST(CaseConversionTest, FoldCase) {
// Simple ASCII, should lower-case.
EXPECT_EQ(u"hello, world", FoldCase(u"Hello, World"));
// Non-ASCII cases from above. They should all fold to the same result.
EXPECT_EQ(FoldCase(kNonASCIIMixed), FoldCase(kNonASCIILower));
EXPECT_EQ(FoldCase(kNonASCIIMixed), FoldCase(kNonASCIIUpper));
// Turkish cases from above. This is the lower-case expected result from the
// US locale. It should be the same even when the current locale is Turkish.
const std::u16string turkish(u"\x49\x131");
const std::u16string turkish_expected(u"\x69\x131");
test::ScopedRestoreICUDefaultLocale restore_locale;
i18n::SetICUDefaultLocale("en_US");
EXPECT_EQ(turkish_expected, FoldCase(turkish));
i18n::SetICUDefaultLocale("tr");
EXPECT_EQ(turkish_expected, FoldCase(turkish));
// Test a case that gets bigger when processed.
// U+130 = LATIN CAPITAL LETTER I WITH DOT ABOVE gets folded to a lower case
// "i" followed by U+307 COMBINING DOT ABOVE.
EXPECT_EQ(u"i\u0307j", FoldCase(u"\u0130j"));
// U+00DF (SHARP S) and U+1E9E (CAPIRAL SHARP S) are both folded to "ss".
EXPECT_EQ(u"ssss", FoldCase(u"\u00DF\u1E9E"));
}
} // namespace i18n
} // namespace base