summaryrefslogtreecommitdiffstats
path: root/chrome/renderer/translate_helper_unittest.cc
blob: a7565d4249a7cd9e4349beb240fdb62de040da3c (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
// Copyright (c) 2013 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "chrome/renderer/translate_helper.h"

#include "base/utf_string_conversions.h"
#include "chrome/common/chrome_constants.h"
#include "testing/gtest/include/gtest/gtest.h"

// The tests in this file only call static TranslateHelper functions and keep
// no per-test state, so the fixture name is just an alias for the plain gtest
// base class.
typedef testing::Test TranslateHelperTest;

// Verifies that CorrectLanguageCodeTypo() repairs well-known mistakes found in
// language codes.
TEST_F(TranslateHelperTest, LanguageCodeTypoCorrection) {
  // Only the first code of a comma-separated list is kept.
  std::string comma_separated("ja,en");
  TranslateHelper::CorrectLanguageCodeTypo(&comma_separated);
  EXPECT_EQ("ja", comma_separated);

  // An underscore used as the separator is turned into a hyphen.
  std::string underscored("ja_JP");
  TranslateHelper::CorrectLanguageCodeTypo(&underscored);
  EXPECT_EQ("ja-JP", underscored);

  // Letter case is normalized: "JA-jp" is expected to come back as "ja-JP".
  std::string wrong_case("JA-jp");
  TranslateHelper::CorrectLanguageCodeTypo(&wrong_case);
  EXPECT_EQ("ja-JP", wrong_case);
}

// Verifies that ConvertLanguageCodeSynonym() rewrites a synonym language code
// to the code used in the supported-language list.
TEST_F(TranslateHelperTest, LanguageCodeSynonyms) {
  // Each entry pairs a synonym with the code it is expected to become.
  static const struct {
    const char* synonym;
    const char* expected;
  } kCases[] = {
    { "nb", "no" },
    { "he", "iw" },
    { "jv", "jw" },
    { "fil", "tl" },
  };
  const size_t kCaseCount = sizeof(kCases) / sizeof(kCases[0]);

  for (size_t i = 0; i < kCaseCount; ++i) {
    std::string language(kCases[i].synonym);
    TranslateHelper::ConvertLanguageCodeSynonym(&language);
    EXPECT_EQ(kCases[i].expected, language);
  }
}

// Verifies that ResetInvalidLanguageCode() leaves acceptable codes untouched
// and clears the ones it rejects.
TEST_F(TranslateHelperTest, ResetInvalidLanguageCode) {
  // A bare two-letter code is kept as is.
  std::string two_letter_code("ja");
  TranslateHelper::ResetInvalidLanguageCode(&two_letter_code);
  EXPECT_EQ("ja", two_letter_code);

  // A two-letter code followed by a hyphen and two more letters is kept too.
  std::string code_with_suffix("ja-JP");
  TranslateHelper::ResetInvalidLanguageCode(&code_with_suffix);
  EXPECT_EQ("ja-JP", code_with_suffix);

  // Rejected: three characters precede the hyphen.
  std::string long_prefix("utf-8");
  TranslateHelper::ResetInvalidLanguageCode(&long_prefix);
  EXPECT_TRUE(long_prefix.empty());

  // Rejected: six characters follow the hyphen.
  std::string long_suffix("ja-YUKARI");
  TranslateHelper::ResetInvalidLanguageCode(&long_suffix);
  EXPECT_TRUE(long_suffix.empty());

  // Rejected: three characters and no hyphen.
  std::string three_letter_code("YMO");
  TranslateHelper::ResetInvalidLanguageCode(&three_letter_code);
  EXPECT_TRUE(three_letter_code.empty());
}

// Verifies that a Content-Language meta tag which contradicts CLD is not
// trusted: when the two disagree, the page language is reported as unknown.
TEST_F(TranslateHelperTest, CLDDisagreeWithWrongLanguageCode) {
  // The meta tag claims Japanese although the body text is English.
  const std::string meta_language("ja");
  string16 page_contents = ASCIIToUTF16(
      "<html><head><meta http-equiv='Content-Language' content='ja'></head>"
      "<body>This is a page apparently written in English. Even though "
      "content-language is provided, the value will be ignored if the value "
      "is suspicious.</body></html>");

  const std::string detected_language =
      TranslateHelper::DeterminePageLanguage(meta_language, page_contents);
  EXPECT_EQ(chrome::kUnknownLanguageCode, detected_language);
}

// Verifies that an invalid Content-Language meta tag value is discarded and
// the language detected by CLD is reported instead.
TEST_F(TranslateHelperTest, InvalidLanguageMetaTagProviding) {
  // "utf-8" is not a valid language code; the body text is English.
  const std::string meta_language("utf-8");
  string16 page_contents = ASCIIToUTF16(
      "<html><head><meta http-equiv='Content-Language' content='utf-8'></head>"
      "<body>This is a page apparently written in English. Even though "
      "content-language is provided, the value will be ignored and CLD's"
      " language will be adopted if the value is invalid.</body></html>");

  const std::string detected_language =
      TranslateHelper::DeterminePageLanguage(meta_language, page_contents);
  EXPECT_EQ("en", detected_language);
}