// Copyright (c) 2006-2008 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "base/i18n/rtl.h" #include "base/file_path.h" #include "base/string_util.h" #include "base/utf_string_conversions.h" #include "testing/gtest/include/gtest/gtest.h" #include "testing/platform_test.h" namespace { base::i18n::TextDirection GetTextDirection(const char* locale_name) { return base::i18n::GetTextDirectionForLocale(locale_name); } } class RTLTest : public PlatformTest { }; TEST_F(RTLTest, GetFirstStrongCharacterDirection) { // Test pure LTR string. std::wstring string(L"foo bar"); EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test bidi string in which the first character with strong directionality // is a character with type L. string.assign(L"foo \x05d0 bar"); EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test bidi string in which the first character with strong directionality // is a character with type R. string.assign(L"\x05d0 foo bar"); EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test bidi string which starts with a character with weak directionality // and in which the first character with strong directionality is a character // with type L. string.assign(L"!foo \x05d0 bar"); EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test bidi string which starts with a character with weak directionality // and in which the first character with strong directionality is a character // with type R. string.assign(L",\x05d0 foo bar"); EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test bidi string in which the first character with strong directionality // is a character with type LRE. string.assign(L"\x202a \x05d0 foo bar"); EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test bidi string in which the first character with strong directionality // is a character with type LRO. string.assign(L"\x202d \x05d0 foo bar"); EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test bidi string in which the first character with strong directionality // is a character with type RLE. string.assign(L"\x202b foo \x05d0 bar"); EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test bidi string in which the first character with strong directionality // is a character with type RLO. string.assign(L"\x202e foo \x05d0 bar"); EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test bidi string in which the first character with strong directionality // is a character with type AL. string.assign(L"\x0622 foo \x05d0 bar"); EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test a string without strong directionality characters. string.assign(L",!.{}"); EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test empty string. string.assign(L""); EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, base::i18n::GetFirstStrongCharacterDirection(string)); // Test characters in non-BMP (e.g. Phoenician letters. Please refer to // http://demo.icu-project.org/icu-bin/ubrowse?scr=151&b=10910 for more // information). #if defined(WCHAR_T_IS_UTF32) string.assign(L" ! \x10910" L"abc 123"); #elif defined(WCHAR_T_IS_UTF16) string.assign(L" ! \xd802\xdd10" L"abc 123"); #else #error wchar_t should be either UTF-16 or UTF-32 #endif EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, base::i18n::GetFirstStrongCharacterDirection(string)); #if defined(WCHAR_T_IS_UTF32) string.assign(L" ! \x10401" L"abc 123"); #elif defined(WCHAR_T_IS_UTF16) string.assign(L" ! \xd801\xdc01" L"abc 123"); #else #error wchar_t should be either UTF-16 or UTF-32 #endif EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, base::i18n::GetFirstStrongCharacterDirection(string)); } typedef struct { std::wstring path; std::wstring wrapped_path; } PathAndWrappedPath; TEST_F(RTLTest, WrapPathWithLTRFormatting) { std::wstring kSeparator; kSeparator.push_back(static_cast(FilePath::kSeparators[0])); const PathAndWrappedPath test_data[] = { // Test common path, such as "c:\foo\bar". { L"c:" + kSeparator + L"foo" + kSeparator + L"bar", L"\x202a"L"c:" + kSeparator + L"foo" + kSeparator + L"bar\x202c" }, // Test path with file name, such as "c:\foo\bar\test.jpg". { L"c:" + kSeparator + L"foo" + kSeparator + L"bar" + kSeparator + L"test.jpg", L"\x202a"L"c:" + kSeparator + L"foo" + kSeparator + L"bar" + kSeparator + L"test.jpg\x202c" }, // Test path ending with punctuation, such as "c:\(foo)\bar.". { L"c:" + kSeparator + L"(foo)" + kSeparator + L"bar.", L"\x202a"L"c:" + kSeparator + L"(foo)" + kSeparator + L"bar.\x202c" }, // Test path ending with separator, such as "c:\foo\bar\". { L"c:" + kSeparator + L"foo" + kSeparator + L"bar" + kSeparator, L"\x202a"L"c:" + kSeparator + L"foo" + kSeparator + L"bar" + kSeparator + L"\x202c", }, // Test path with RTL character. { L"c:" + kSeparator + L"\x05d0", L"\x202a"L"c:" + kSeparator + L"\x05d0\x202c", }, // Test path with 2 level RTL directory names. { L"c:" + kSeparator + L"\x05d0" + kSeparator + L"\x0622", L"\x202a"L"c:" + kSeparator + L"\x05d0" + kSeparator + L"\x0622\x202c", }, // Test path with mixed RTL/LTR directory names and ending with punctuation. { L"c:" + kSeparator + L"\x05d0" + kSeparator + L"\x0622" + kSeparator + L"(foo)" + kSeparator + L"b.a.r.", L"\x202a"L"c:" + kSeparator + L"\x05d0" + kSeparator + L"\x0622" + kSeparator + L"(foo)" + kSeparator + L"b.a.r.\x202c", }, // Test path without driver name, such as "/foo/bar/test/jpg". { kSeparator + L"foo" + kSeparator + L"bar" + kSeparator + L"test.jpg", L"\x202a" + kSeparator + L"foo" + kSeparator + L"bar" + kSeparator + L"test.jpg" + L"\x202c" }, // Test path start with current directory, such as "./foo". { L"." + kSeparator + L"foo", L"\x202a"L"." + kSeparator + L"foo" + L"\x202c" }, // Test path start with parent directory, such as "../foo/bar.jpg". { L".." + kSeparator + L"foo" + kSeparator + L"bar.jpg", L"\x202a"L".." + kSeparator + L"foo" + kSeparator + L"bar.jpg" + L"\x202c" }, // Test absolute path, such as "//foo/bar.jpg". { kSeparator + kSeparator + L"foo" + kSeparator + L"bar.jpg", L"\x202a" + kSeparator + kSeparator + L"foo" + kSeparator + L"bar.jpg" + L"\x202c" }, // Test path with mixed RTL/LTR directory names. { L"c:" + kSeparator + L"foo" + kSeparator + L"\x05d0" + kSeparator + L"\x0622" + kSeparator + L"\x05d1.jpg", L"\x202a"L"c:" + kSeparator + L"foo" + kSeparator + L"\x05d0" + kSeparator + L"\x0622" + kSeparator + L"\x05d1.jpg" + L"\x202c", }, // Test empty path. { L"", L"\x202a\x202c" } }; for (unsigned int i = 0; i < arraysize(test_data); ++i) { string16 localized_file_path_string; FilePath path = FilePath::FromWStringHack(test_data[i].path); base::i18n::WrapPathWithLTRFormatting(path, &localized_file_path_string); std::wstring wrapped_path = UTF16ToWide(localized_file_path_string); EXPECT_EQ(wrapped_path, test_data[i].wrapped_path); } } typedef struct { std::wstring raw_filename; std::wstring display_string; } StringAndLTRString; TEST_F(RTLTest, GetDisplayStringInLTRDirectionality) { const StringAndLTRString test_data[] = { { L"test", L"\x202atest\x202c" }, { L"test.html", L"\x202atest.html\x202c" }, { L"\x05d0\x05d1\x05d2", L"\x202a\x05d0\x05d1\x05d2\x202c" }, { L"\x05d0\x05d1\x05d2.txt", L"\x202a\x05d0\x05d1\x05d2.txt\x202c" }, { L"\x05d0"L"abc", L"\x202a\x05d0"L"abc\x202c" }, { L"\x05d0"L"abc.txt", L"\x202a\x05d0"L"abc.txt\x202c" }, { L"abc\x05d0\x05d1", L"\x202a"L"abc\x05d0\x05d1\x202c" }, { L"abc\x05d0\x05d1.jpg", L"\x202a"L"abc\x05d0\x05d1.jpg\x202c" }, }; for (unsigned int i = 0; i < arraysize(test_data); ++i) { string16 input = WideToUTF16(test_data[i].raw_filename); string16 expected = base::i18n::GetDisplayStringInLTRDirectionality(input); if (base::i18n::IsRTL()) EXPECT_EQ(expected, WideToUTF16(test_data[i].display_string)); else EXPECT_EQ(expected, input); } } TEST_F(RTLTest, GetTextDirection) { EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, GetTextDirection("ar")); EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, GetTextDirection("ar_EG")); EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, GetTextDirection("he")); EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, GetTextDirection("he_IL")); // iw is an obsolete code for Hebrew. EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, GetTextDirection("iw")); // Although we're not yet localized to Farsi and Urdu, we // do have the text layout direction information for them. EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, GetTextDirection("fa")); EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, GetTextDirection("ur")); #if 0 // Enable these when we include the minimal locale data for Azerbaijani // written in Arabic and Dhivehi. At the moment, our copy of // ICU data does not have entries for them. EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, GetTextDirection("az_Arab")); // Dhivehi that uses Thaana script. EXPECT_EQ(base::i18n::RIGHT_TO_LEFT, GetTextDirection("dv")); #endif EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, GetTextDirection("en")); // Chinese in China with '-'. EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, GetTextDirection("zh-CN")); // Filipino : 3-letter code EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, GetTextDirection("fil")); // Russian EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, GetTextDirection("ru")); // Japanese that uses multiple scripts EXPECT_EQ(base::i18n::LEFT_TO_RIGHT, GetTextDirection("ja")); }