Backed out changeset 3877f1fa62f5 (bug 1927706) Backed out changeset 233c6ebf84a2 (bug 1927706) Backed out changeset 07e5871d5fa3 (bug 1927706) Backed out changeset 84ef75087931 (bug 1927706) Backed out changeset f89b916619e1 (bug 1927706) Backed out changeset b82d9d622315 (bug 1927706) Backed out changeset b0d2c5711865 (bug 1927706) Backed out changeset 9529dda25bd9 (bug 1927706) Backed out changeset 40b7907d7fc8 (bug 1927706) Backed out changeset c549655dbd73 (bug 1927706) Backed out changeset c5cc289771b3 (bug 1927706) Backed out changeset 8ef66f7822c4 (bug 1927706) Backed out changeset dff6d37fb2fe (bug 1927706) Backed out changeset 083a0b3da643 (bug 1927706) Backed out changeset 06649ac72a19 (bug 1927706) Backed out changeset 019f7533abbc (bug 1927706) Backed out changeset f1539604c459 (bug 1927706) Backed out changeset 578667f1f0d4 (bug 1927706) Backed out changeset 8ed1e7e7d4ab (bug 1927706)
63 lines
2.4 KiB
C++
63 lines
2.4 KiB
C++
/* This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
|
|
#include "gtest/gtest.h"
|
|
|
|
#include "mozilla/intl/UnicodeProperties.h"
|
|
#include "mozilla/intl/UnicodeScriptCodes.h"
|
|
|
|
namespace mozilla::intl {
|
|
TEST(IntlScript, GetExtensions)
|
|
{
|
|
UnicodeProperties::ScriptExtensionVector extensions;
|
|
|
|
// 0x0000..0x0040 are Common.
|
|
for (char32_t ch = 0; ch < 0x0041; ch++) {
|
|
ASSERT_TRUE(UnicodeProperties::GetExtensions(ch, extensions).isOk());
|
|
ASSERT_EQ(extensions.length(), 1u);
|
|
ASSERT_EQ(Script(extensions[0]), Script::COMMON);
|
|
}
|
|
|
|
// 0x0300..0x0341 are Inherited.
|
|
for (char32_t ch = 0x300; ch < 0x0341; ch++) {
|
|
ASSERT_TRUE(UnicodeProperties::GetExtensions(ch, extensions).isOk());
|
|
ASSERT_EQ(extensions.length(), 1u);
|
|
ASSERT_EQ(Script(extensions[0]), Script::INHERITED);
|
|
}
|
|
|
|
// 0x1cf7's script code is Common, but its script extension is Beng.
|
|
ASSERT_TRUE(UnicodeProperties::GetExtensions(0x1cf7, extensions).isOk());
|
|
ASSERT_EQ(extensions.length(), 1u);
|
|
ASSERT_EQ(Script(extensions[0]), Script::BENGALI);
|
|
|
|
// ؿ
|
|
// https://unicode-table.com/en/063F/
|
|
// This character doesn't have any script extension, so the script code is
|
|
// returned.
|
|
ASSERT_TRUE(UnicodeProperties::GetExtensions(0x063f, extensions).isOk());
|
|
ASSERT_EQ(extensions.length(), 1u);
|
|
ASSERT_EQ(Script(extensions[0]), Script::ARABIC);
|
|
|
|
// 0xff65 is the unicode character '・', see https://unicode-table.com/en/FF65/
|
|
// Halfwidth Katakana Middle Dot.
|
|
ASSERT_TRUE(UnicodeProperties::GetExtensions(0xff65, extensions).isOk());
|
|
|
|
// 0xff65 should have the following script extensions:
|
|
// Bopo Hang Hani Hira Kana Yiii.
|
|
ASSERT_EQ(extensions.length(), 6u);
|
|
|
|
ASSERT_EQ(Script(extensions[0]), Script::BOPOMOFO);
|
|
ASSERT_EQ(Script(extensions[1]), Script::HAN);
|
|
ASSERT_EQ(Script(extensions[2]), Script::HANGUL);
|
|
ASSERT_EQ(Script(extensions[3]), Script::HIRAGANA);
|
|
ASSERT_EQ(Script(extensions[4]), Script::KATAKANA);
|
|
ASSERT_EQ(Script(extensions[5]), Script::YI);
|
|
|
|
// The max code point is 0x10ffff, so 0x110000 should be invalid.
|
|
// Script::UNKNOWN should be returned for an invalid code point.
|
|
ASSERT_TRUE(UnicodeProperties::GetExtensions(0x110000, extensions).isOk());
|
|
ASSERT_EQ(extensions.length(), 1u);
|
|
ASSERT_EQ(Script(extensions[0]), Script::UNKNOWN);
|
|
}
|
|
} // namespace mozilla::intl
|