summary | refs | log | tree | commit | diff | stats
path: root/net
diff options
context:
space:
mode:
author: mrossetti@chromium.org <mrossetti@chromium.org@0039d316-1c4b-4281-b951-d872f2087c98> 2011-04-13 01:11:50 +0000
committer: mrossetti@chromium.org <mrossetti@chromium.org@0039d316-1c4b-4281-b951-d872f2087c98> 2011-04-13 01:11:50 +0000
commit: f7b09de5cca6923a03f20be3616830a0d3fafa88 (patch)
tree: 8fbfe4c736468da5a4b5a7203414a32add49f9a1 /net
parent: 4069944681ad77bcc80b5299aff0820a667b447e (diff)
download: chromium_src-f7b09de5cca6923a03f20be3616830a0d3fafa88.zip
          chromium_src-f7b09de5cca6923a03f20be3616830a0d3fafa88.tar.gz
          chromium_src-f7b09de5cca6923a03f20be3616830a0d3fafa88.tar.bz2
Revert 81343 - Add multiple-offset versions of the various URL reformatting functions. Fixed a couple of erroneous unit tests of offsets into username/password.

Note: This does not complete the work required for 78153 -- tis but the first 2/3rds.

BUG=78153
TEST=Many unit tests updated and added.
Review URL: http://codereview.chromium.org/6822038

TBR=mrossetti@chromium.org
Review URL: http://codereview.chromium.org/6833011

git-svn-id: svn://svn.chromium.org/chrome/trunk/src@81348 0039d316-1c4b-4281-b951-d872f2087c98
Diffstat (limited to 'net')
-rw-r--r--  net/base/escape.cc             117
-rw-r--r--  net/base/escape.h               31
-rw-r--r--  net/base/escape_unittest.cc     39
-rw-r--r--  net/base/net_util.cc           426
-rw-r--r--  net/base/net_util.h             59
-rw-r--r--  net/base/net_util_unittest.cc  166
6 files changed, 202 insertions, 636 deletions
diff --git a/net/base/escape.cc b/net/base/escape.cc
index 61c3e81..64bd107 100644
--- a/net/base/escape.cc
+++ b/net/base/escape.cc
@@ -2,12 +2,11 @@
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
-#include "net/base/escape.h"
-
#include <algorithm>
+#include "net/base/escape.h"
+
#include "base/logging.h"
-#include "base/scoped_ptr.h"
#include "base/string_piece.h"
#include "base/string_util.h"
#include "base/utf_string_conversions.h"
@@ -99,14 +98,15 @@ const char kUrlUnescape[128] = {
};
template<typename STR>
-STR UnescapeURLWithOffsetsImpl(const STR& escaped_text,
- UnescapeRule::Type rules,
- std::vector<size_t>* offsets_for_adjustment) {
- if (offsets_for_adjustment) {
- std::for_each(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- LimitOffset<std::wstring>(escaped_text.length()));
- }
+STR UnescapeURLImpl(const STR& escaped_text,
+ UnescapeRule::Type rules,
+ size_t* offset_for_adjustment) {
+ size_t offset_temp = string16::npos;
+ if (!offset_for_adjustment)
+ offset_for_adjustment = &offset_temp;
+ else if (*offset_for_adjustment >= escaped_text.length())
+ *offset_for_adjustment = string16::npos;
+
// Do not unescape anything, return the |escaped_text| text.
if (rules == UnescapeRule::NONE)
return escaped_text;
@@ -117,7 +117,6 @@ STR UnescapeURLWithOffsetsImpl(const STR& escaped_text,
STR result;
result.reserve(escaped_text.length());
- AdjustEncodingOffset::Adjustments adjustments; // Locations of adjusted text.
for (size_t i = 0, max = escaped_text.size(); i < max; ++i) {
if (static_cast<unsigned char>(escaped_text[i]) >= 128) {
// Non ASCII character, append as is.
@@ -145,9 +144,17 @@ STR UnescapeURLWithOffsetsImpl(const STR& escaped_text,
// Additionally allow control characters if requested.
(value < ' ' && (rules & UnescapeRule::CONTROL_CHARS)))) {
// Use the unescaped version of the character.
- adjustments.push_back(i);
+ size_t length_before_append = result.length();
result.push_back(value);
i += 2;
+
+ // Adjust offset to match length change.
+ if (*offset_for_adjustment != std::string::npos) {
+ if (*offset_for_adjustment > (length_before_append + 2))
+ *offset_for_adjustment -= 2;
+ else if (*offset_for_adjustment > length_before_append)
+ *offset_for_adjustment = std::string::npos;
+ }
} else {
// Keep escaped. Append a percent and we'll get the following two
// digits on the next loops through.
@@ -167,26 +174,6 @@ STR UnescapeURLWithOffsetsImpl(const STR& escaped_text,
}
}
- // Make offset adjustment.
- if (offsets_for_adjustment && !adjustments.empty()) {
- std::for_each(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- AdjustEncodingOffset(adjustments));
- }
-
- return result;
-}
-
-template<typename STR>
-STR UnescapeURLImpl(const STR& escaped_text,
- UnescapeRule::Type rules,
- size_t* offset_for_adjustment) {
- std::vector<size_t> offsets;
- if (offset_for_adjustment)
- offsets.push_back(*offset_for_adjustment);
- STR result = UnescapeURLWithOffsetsImpl(escaped_text, rules, &offsets);
- if (offset_for_adjustment)
- *offset_for_adjustment = offsets[0];
return result;
}
@@ -247,49 +234,33 @@ std::string EscapeExternalHandlerValue(const std::string& text) {
return Escape(text, kExternalHandlerCharmap, false);
}
-string16 UnescapeAndDecodeUTF8URLComponentWithOffsets(
- const std::string& text,
- UnescapeRule::Type rules,
- std::vector<size_t>* offsets_for_adjustment) {
+string16 UnescapeAndDecodeUTF8URLComponent(const std::string& text,
+ UnescapeRule::Type rules,
+ size_t* offset_for_adjustment) {
std::wstring result;
- std::vector<size_t> original_offsets;
- if (offsets_for_adjustment)
- original_offsets = *offsets_for_adjustment;
+ size_t original_offset = offset_for_adjustment ? *offset_for_adjustment : 0;
std::string unescaped_url(
- UnescapeURLWithOffsetsImpl(text, rules, offsets_for_adjustment));
- if (UTF8ToWideAndAdjustOffsets(unescaped_url.data(), unescaped_url.length(),
- &result, offsets_for_adjustment))
+ UnescapeURLImpl(text, rules, offset_for_adjustment));
+ if (UTF8ToWideAndAdjustOffset(unescaped_url.data(), unescaped_url.length(),
+ &result, offset_for_adjustment))
return WideToUTF16Hack(result); // Character set looks like it's valid.
// Not valid. Return the escaped version. Undo our changes to
// |offset_for_adjustment| since we haven't changed the string after all.
- if (offsets_for_adjustment)
- *offsets_for_adjustment = original_offsets;
- return WideToUTF16Hack(UTF8ToWideAndAdjustOffsets(
- text, offsets_for_adjustment));
-}
-
-string16 UnescapeAndDecodeUTF8URLComponent(const std::string& text,
- UnescapeRule::Type rules,
- size_t* offset_for_adjustment) {
- std::vector<size_t> offsets;
- if (offset_for_adjustment)
- offsets.push_back(*offset_for_adjustment);
- string16 result =
- UnescapeAndDecodeUTF8URLComponentWithOffsets(text, rules, &offsets);
if (offset_for_adjustment)
- *offset_for_adjustment = offsets[0];
- return result;
+ *offset_for_adjustment = original_offset;
+ return WideToUTF16Hack(UTF8ToWideAndAdjustOffset(text,
+ offset_for_adjustment));
}
std::string UnescapeURLComponent(const std::string& escaped_text,
UnescapeRule::Type rules) {
- return UnescapeURLWithOffsetsImpl<std::string>(escaped_text, rules, NULL);
+ return UnescapeURLImpl(escaped_text, rules, NULL);
}
string16 UnescapeURLComponent(const string16& escaped_text,
UnescapeRule::Type rules) {
- return UnescapeURLWithOffsetsImpl<string16>(escaped_text, rules, NULL);
+ return UnescapeURLImpl(escaped_text, rules, NULL);
}
@@ -379,27 +350,3 @@ string16 UnescapeForHTML(const string16& input) {
}
return text;
}
-
-AdjustEncodingOffset::AdjustEncodingOffset(const Adjustments& adjustments)
- : adjustments(adjustments) {}
-
-void AdjustEncodingOffset::operator()(size_t& offset) {
- // For each encoded character occurring before an offset subtract 2.
- if (offset == string16::npos)
- return;
- size_t adjusted_offset = offset;
- for (Adjustments::const_iterator i = adjustments.begin();
- i != adjustments.end(); ++i) {
- size_t location = *i;
- if (offset <= location) {
- offset = adjusted_offset;
- return;
- }
- if (offset <= (location + 2)) {
- offset = string16::npos;
- return;
- }
- adjusted_offset -= 2;
- }
- offset = adjusted_offset;
-}
diff --git a/net/base/escape.h b/net/base/escape.h
index f4c99a3..faa7bd3 100644
--- a/net/base/escape.h
+++ b/net/base/escape.h
@@ -7,7 +7,6 @@
#pragma once
#include <string>
-#include <vector>
#include "base/basictypes.h"
#include "base/string16.h"
@@ -100,20 +99,15 @@ string16 UnescapeURLComponent(const string16& escaped_text,
// Unescapes the given substring as a URL, and then tries to interpret the
// result as being encoded as UTF-8. If the result is convertable into UTF-8, it
// will be returned as converted. If it is not, the original escaped string will
-// be converted into a string16 and returned. (|offset[s]_for_adjustment|)
-// specifies one or more offsets into the source strings; each offset will be
-// adjusted to point at the same logical place in the result strings during
-// decoding. If this isn't possible because an offset points past the end of
-// the source strings or into the middle of a multibyte sequence, the offending
-// offset will be set to std::wstring::npos. |offset[s]_for_adjustment| may be
-// NULL.
+// be converted into a string16 and returned.
+//
+// |offset_for_adjustment| may be NULL; if not, it is an offset into |text| that
+// will be adjusted to point at the same logical place in the result string. If
+// this isn't possible because it points into the middle of an escape sequence
+// or past the end of the string, it will be set to string16::npos.
string16 UnescapeAndDecodeUTF8URLComponent(const std::string& text,
UnescapeRule::Type rules,
size_t* offset_for_adjustment);
-string16 UnescapeAndDecodeUTF8URLComponentWithOffsets(
- const std::string& text,
- UnescapeRule::Type rules,
- std::vector<size_t>* offsets_for_adjustment);
// Unescape the following ampersand character codes from |text|:
// &lt; &gt; &amp; &quot; &#39;
@@ -135,17 +129,4 @@ bool EscapeQueryParamValue(const string16& text, const char* codepage,
// assumes the codepage is UTF8. This is provided as a convenience.
string16 EscapeQueryParamValueUTF8(const string16& text, bool use_plus);
-// Private Functions (Exposed for Unit Testing) --------------------------------
-
-// A function called by std::for_each that will adjust any offset which occurs
-// after one or more encoded characters.
-struct AdjustEncodingOffset {
- typedef std::vector<size_t> Adjustments;
-
- explicit AdjustEncodingOffset(const Adjustments& adjustments);
- void operator()(size_t& offset);
-
- const Adjustments& adjustments;
-};
-
#endif // NET_BASE_ESCAPE_H_
diff --git a/net/base/escape_unittest.cc b/net/base/escape_unittest.cc
index 3a8d895..60d4ae3 100644
--- a/net/base/escape_unittest.cc
+++ b/net/base/escape_unittest.cc
@@ -2,7 +2,6 @@
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
-#include <algorithm>
#include <string>
#include "net/base/escape.h"
@@ -16,8 +15,6 @@
namespace {
-static const size_t kNpos = string16::npos;
-
struct EscapeCase {
const wchar_t* input;
const wchar_t* output;
@@ -399,39 +396,3 @@ TEST(EscapeTest, UnescapeForHTML) {
EXPECT_EQ(ASCIIToUTF16(tests[i].expected_output), result);
}
}
-
-TEST(EscapeTest, AdjustEncodingOffset) {
- // Imagine we have strings as shown in the following cases where the
- // %XX's represent encoded characters
-
- // 1: abc%ECdef ==> abcXdef
- std::vector<size_t> offsets;
- for (size_t t = 0; t < 9; ++t)
- offsets.push_back(t);
- AdjustEncodingOffset::Adjustments adjustments;
- adjustments.push_back(3);
- std::for_each(offsets.begin(), offsets.end(),
- AdjustEncodingOffset(adjustments));
- size_t expected_1[] = {0, 1, 2, 3, kNpos, kNpos, 4, 5, 6};
- EXPECT_EQ(offsets.size(), arraysize(expected_1));
- for (size_t i = 0; i < arraysize(expected_1); ++i)
- EXPECT_EQ(expected_1[i], offsets[i]);
-
-
- // 2: %ECabc%EC%ECdef%EC ==> XabcXXdefX
- offsets.clear();
- for (size_t t = 0; t < 18; ++t)
- offsets.push_back(t);
- adjustments.clear();
- adjustments.push_back(0);
- adjustments.push_back(6);
- adjustments.push_back(9);
- adjustments.push_back(15);
- std::for_each(offsets.begin(), offsets.end(),
- AdjustEncodingOffset(adjustments));
- size_t expected_2[] = {0, kNpos, kNpos, 1, 2, 3, 4, kNpos, kNpos, 5, kNpos,
- kNpos, 6, 7, 8, 9, kNpos, kNpos};
- EXPECT_EQ(offsets.size(), arraysize(expected_2));
- for (size_t i = 0; i < arraysize(expected_2); ++i)
- EXPECT_EQ(expected_2[i], offsets[i]);
-}
diff --git a/net/base/net_util.cc b/net/base/net_util.cc
index 378ac7b..1aaa98b 100644
--- a/net/base/net_util.cc
+++ b/net/base/net_util.cc
@@ -67,6 +67,7 @@
#endif
#include "unicode/datefmt.h"
+
using base::Time;
namespace net {
@@ -733,80 +734,6 @@ bool IDNToUnicodeOneComponent(const char16* comp,
return false;
}
-struct SubtractFromOffset {
- explicit SubtractFromOffset(size_t amount)
- : amount(amount) {}
- void operator()(size_t& offset) {
- if (offset != std::wstring::npos)
- if (offset >= amount)
- offset -= amount;
- else
- offset = std::wstring::npos;
- }
-
- size_t amount;
-};
-
-struct AddToOffset {
- explicit AddToOffset(size_t amount)
- : amount(amount) {}
- void operator()(size_t& offset) {
- if (offset != std::wstring::npos)
- offset += amount;
- }
-
- size_t amount;
-};
-
-std::vector<size_t> OffsetsIntoSection(
- std::vector<size_t>* offsets_for_adjustment,
- size_t section_begin) {
- std::vector<size_t> offsets_into_section;
- if (offsets_for_adjustment) {
- std::transform(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- std::back_inserter(offsets_into_section),
- ClampComponentOffset(section_begin));
- std::for_each(offsets_into_section.begin(), offsets_into_section.end(),
- SubtractFromOffset(section_begin));
- }
- return offsets_into_section;
-}
-
-void ApplySectionAdjustments(const std::vector<size_t>& offsets_into_section,
- std::vector<size_t>* offsets_for_adjustment,
- size_t old_section_len,
- size_t new_section_len,
- size_t section_begin) {
- if (offsets_for_adjustment) {
- DCHECK_EQ(offsets_for_adjustment->size(), offsets_into_section.size());
- std::vector<size_t>::const_iterator host_offsets_iter =
- offsets_into_section.begin();
- for (std::vector<size_t>::iterator offsets_iter =
- offsets_for_adjustment->begin();
- offsets_iter != offsets_for_adjustment->end();
- ++offsets_iter, ++host_offsets_iter) {
- size_t offset = *offsets_iter;
- if (offset == std::wstring::npos || offset < section_begin) {
- // The offset is before the host section so leave it as is.
- continue;
- }
- if (offset >= section_begin + old_section_len) {
- // The offset is after the host section so adjust by host length delta.
- offset += new_section_len - old_section_len;
- } else if (*host_offsets_iter != std::wstring::npos) {
- // The offset is within the host and valid so adjust by the host
- // reformatting offsets results.
- offset = section_begin + *host_offsets_iter;
- } else {
- // The offset is invalid.
- offset = std::wstring::npos;
- }
- *offsets_iter = offset;
- }
- }
-}
-
// If |component| is valid, its begin is incremented by |delta|.
void AdjustComponent(int delta, url_parse::Component* component) {
if (!component->is_valid())
@@ -833,7 +760,7 @@ std::wstring FormatUrlInternal(const GURL& url,
UnescapeRule::Type unescape_rules,
url_parse::Parsed* new_parsed,
size_t* prefix_end,
- std::vector<size_t>* offsets_for_adjustment);
+ size_t* offset_for_adjustment);
// Helper for FormatUrl()/FormatUrlInternal().
std::wstring FormatViewSourceUrl(const GURL& url,
@@ -842,20 +769,18 @@ std::wstring FormatViewSourceUrl(const GURL& url,
UnescapeRule::Type unescape_rules,
url_parse::Parsed* new_parsed,
size_t* prefix_end,
- std::vector<size_t>* offsets_for_adjustment) {
+ size_t* offset_for_adjustment) {
DCHECK(new_parsed);
- DCHECK(offsets_for_adjustment);
const wchar_t* const kWideViewSource = L"view-source:";
const size_t kViewSourceLengthPlus1 = 12;
- std::vector<size_t> saved_offsets(*offsets_for_adjustment);
GURL real_url(url.possibly_invalid_spec().substr(kViewSourceLengthPlus1));
- // Clamp the offsets to the source area.
- std::for_each(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- SubtractFromOffset(kViewSourceLengthPlus1));
+ size_t temp_offset = (*offset_for_adjustment == std::wstring::npos) ?
+ std::wstring::npos : (*offset_for_adjustment - kViewSourceLengthPlus1);
+ size_t* temp_offset_ptr = (*offset_for_adjustment < kViewSourceLengthPlus1) ?
+ NULL : &temp_offset;
std::wstring result = FormatUrlInternal(real_url, languages, format_types,
- unescape_rules, new_parsed, prefix_end, offsets_for_adjustment);
+ unescape_rules, new_parsed, prefix_end, temp_offset_ptr);
result.insert(0, kWideViewSource);
// Adjust position values.
@@ -869,61 +794,57 @@ std::wstring FormatViewSourceUrl(const GURL& url,
AdjustComponents(kViewSourceLengthPlus1, new_parsed);
if (prefix_end)
*prefix_end += kViewSourceLengthPlus1;
- std::for_each(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- AddToOffset(kViewSourceLengthPlus1));
- // Restore all offsets which were not affected by FormatUrlInternal.
- DCHECK_EQ(saved_offsets.size(), offsets_for_adjustment->size());
- for (size_t i = 0; i < saved_offsets.size(); ++i) {
- if (saved_offsets[i] < kViewSourceLengthPlus1)
- (*offsets_for_adjustment)[i] = saved_offsets[i];
+ if (temp_offset_ptr) {
+ *offset_for_adjustment = (temp_offset == std::wstring::npos) ?
+ std::wstring::npos : (temp_offset + kViewSourceLengthPlus1);
}
return result;
}
// Appends the substring |in_component| inside of the URL |spec| to |output|,
// and the resulting range will be filled into |out_component|. |unescape_rules|
-// defines how to clean the URL for human readability. |offsets_for_adjustment|
-// is an array of offsets into |output| each of which will be adjusted based on
-// how it maps to the component being converted; if it is less than
-// output->length(), it will be untouched, and if it is greater than
-// output->length() + in_component.len it will be adjusted by the difference in
-// lengths between the input and output components. Otherwise it points into
-// the component being converted, and is adjusted to point to the same logical
-// place in |output|. |offsets_for_adjustment| may not be NULL.
+// defines how to clean the URL for human readability. |offset_for_adjustment|
+// is an offset into |output| which will be adjusted based on how it maps to the
+// component being converted; if it is less than output->length(), it will be
+// untouched, and if it is greater than output->length() + in_component.len it
+// will be shortened by the difference in lengths between the input and output
+// components. Otherwise it points into the component being converted, and is
+// adjusted to point to the same logical place in |output|.
+// |offset_for_adjustment| may not be NULL.
void AppendFormattedComponent(const std::string& spec,
const url_parse::Component& in_component,
UnescapeRule::Type unescape_rules,
std::wstring* output,
url_parse::Component* out_component,
- std::vector<size_t>* offsets_for_adjustment) {
+ size_t* offset_for_adjustment) {
DCHECK(output);
- DCHECK(offsets_for_adjustment);
+ DCHECK(offset_for_adjustment);
if (in_component.is_nonempty()) {
- size_t component_begin = output->length();
- out_component->begin = static_cast<int>(component_begin);
-
- // Compose a list of offsets within the component area.
- std::vector<size_t> offsets_into_component =
- OffsetsIntoSection(offsets_for_adjustment, component_begin);
-
+ out_component->begin = static_cast<int>(output->length());
+ size_t offset_past_current_output =
+ ((*offset_for_adjustment == std::wstring::npos) ||
+ (*offset_for_adjustment < output->length())) ?
+ std::wstring::npos : (*offset_for_adjustment - output->length());
+ size_t* offset_into_component =
+ (offset_past_current_output >= static_cast<size_t>(in_component.len)) ?
+ NULL : &offset_past_current_output;
if (unescape_rules == UnescapeRule::NONE) {
- output->append(UTF8ToWideAndAdjustOffsets(
+ output->append(UTF8ToWideAndAdjustOffset(
spec.substr(in_component.begin, in_component.len),
- &offsets_into_component));
+ offset_into_component));
} else {
- output->append(UTF16ToWideHack(
- UnescapeAndDecodeUTF8URLComponentWithOffsets(
- spec.substr(in_component.begin, in_component.len), unescape_rules,
- &offsets_into_component)));
+ output->append(UTF16ToWideHack(UnescapeAndDecodeUTF8URLComponent(
+ spec.substr(in_component.begin, in_component.len), unescape_rules,
+ offset_into_component)));
+ }
+ out_component->len =
+ static_cast<int>(output->length()) - out_component->begin;
+ if (offset_into_component) {
+ *offset_for_adjustment = (*offset_into_component == std::wstring::npos) ?
+ std::wstring::npos : (out_component->begin + *offset_into_component);
+ } else if (offset_past_current_output != std::wstring::npos) {
+ *offset_for_adjustment += out_component->len - in_component.len;
}
- size_t new_component_len = output->length() - component_begin;
- out_component->len = static_cast<int>(new_component_len);
-
- // Apply offset adjustments.
- size_t old_component_len = static_cast<size_t>(in_component.len);
- ApplySectionAdjustments(offsets_into_component, offsets_for_adjustment,
- old_component_len, new_component_len, component_begin);
} else {
out_component->reset();
}
@@ -937,16 +858,15 @@ std::wstring FormatUrlInternal(const GURL& url,
UnescapeRule::Type unescape_rules,
url_parse::Parsed* new_parsed,
size_t* prefix_end,
- std::vector<size_t>* offsets_for_adjustment) {
+ size_t* offset_for_adjustment) {
url_parse::Parsed parsed_temp;
if (!new_parsed)
new_parsed = &parsed_temp;
else
*new_parsed = url_parse::Parsed();
-
- std::vector<size_t> offsets_temp;
- if (!offsets_for_adjustment)
- offsets_for_adjustment = &offsets_temp;
+ size_t offset_temp = std::wstring::npos;
+ if (!offset_for_adjustment)
+ offset_for_adjustment = &offset_temp;
std::wstring url_string;
@@ -954,9 +874,7 @@ std::wstring FormatUrlInternal(const GURL& url,
if (url.is_empty()) {
if (prefix_end)
*prefix_end = 0;
- std::for_each(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- LimitOffset<std::wstring>(0));
+ *offset_for_adjustment = std::wstring::npos;
return url_string;
}
@@ -968,17 +886,15 @@ std::wstring FormatUrlInternal(const GURL& url,
if (url.SchemeIs(kViewSource) &&
!StartsWithASCII(url.possibly_invalid_spec(), kViewSourceTwice, false)) {
return FormatViewSourceUrl(url, languages, format_types,
- unescape_rules, new_parsed, prefix_end, offsets_for_adjustment);
+ unescape_rules, new_parsed, prefix_end, offset_for_adjustment);
}
// We handle both valid and invalid URLs (this will give us the spec
// regardless of validity).
const std::string& spec = url.possibly_invalid_spec();
const url_parse::Parsed& parsed = url.parsed_for_possibly_invalid_spec();
- size_t spec_length = spec.length();
- std::for_each(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- LimitOffset<std::wstring>(spec_length));
+ if (*offset_for_adjustment >= spec.length())
+ *offset_for_adjustment = std::wstring::npos;
// Copy everything before the username (the scheme and the separators.)
// These are ASCII.
@@ -1006,47 +922,48 @@ std::wstring FormatUrlInternal(const GURL& url,
// e.g. "http://google.com:search@evil.ru/"
new_parsed->username.reset();
new_parsed->password.reset();
- // Update the offsets based on removed username and/or password.
- if (!offsets_for_adjustment->empty() &&
+ if ((*offset_for_adjustment != std::wstring::npos) &&
(parsed.username.is_nonempty() || parsed.password.is_nonempty())) {
- AdjustOffset::Adjustments adjustments;
if (parsed.username.is_nonempty() && parsed.password.is_nonempty()) {
// The seeming off-by-one and off-by-two in these first two lines are to
// account for the ':' after the username and '@' after the password.
- adjustments.push_back(AdjustOffset::Adjustment(
- static_cast<size_t>(parsed.username.begin),
- static_cast<size_t>(parsed.username.len + parsed.password.len +
- 2), 0));
+ if (*offset_for_adjustment >
+ static_cast<size_t>(parsed.password.end())) {
+ *offset_for_adjustment -=
+ (parsed.username.len + parsed.password.len + 2);
+ } else if (*offset_for_adjustment >
+ static_cast<size_t>(parsed.username.begin)) {
+ *offset_for_adjustment = std::wstring::npos;
+ }
} else {
const url_parse::Component* nonempty_component =
parsed.username.is_nonempty() ? &parsed.username : &parsed.password;
- // The seeming off-by-one in below is to account for the '@' after the
- // username/password.
- adjustments.push_back(AdjustOffset::Adjustment(
- static_cast<size_t>(nonempty_component->begin),
- static_cast<size_t>(nonempty_component->len + 1), 0));
+ // The seeming off-by-one in these first two lines is to account for the
+ // '@' after the username/password.
+ if (*offset_for_adjustment >
+ static_cast<size_t>(nonempty_component->end())) {
+ *offset_for_adjustment -= (nonempty_component->len + 1);
+ } else if (*offset_for_adjustment >
+ static_cast<size_t>(nonempty_component->begin)) {
+ *offset_for_adjustment = std::wstring::npos;
+ }
}
-
- // Make offset adjustment.
- std::for_each(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- AdjustOffset(adjustments));
}
} else {
AppendFormattedComponent(spec, parsed.username, unescape_rules, &url_string,
- &new_parsed->username, offsets_for_adjustment);
+ &new_parsed->username, offset_for_adjustment);
if (parsed.password.is_valid())
url_string.push_back(':');
AppendFormattedComponent(spec, parsed.password, unescape_rules, &url_string,
- &new_parsed->password, offsets_for_adjustment);
+ &new_parsed->password, offset_for_adjustment);
if (parsed.username.is_valid() || parsed.password.is_valid())
url_string.push_back('@');
}
if (prefix_end)
*prefix_end = static_cast<size_t>(url_string.length());
- AppendFormattedHostWithOffsets(url, languages, &url_string, new_parsed,
- offsets_for_adjustment);
+ AppendFormattedHost(url, languages, &url_string, new_parsed,
+ offset_for_adjustment);
// Port.
if (parsed.port.is_nonempty()) {
@@ -1064,35 +981,41 @@ std::wstring FormatUrlInternal(const GURL& url,
if (!(format_types & kFormatUrlOmitTrailingSlashOnBareHostname) ||
!CanStripTrailingSlash(url)) {
AppendFormattedComponent(spec, parsed.path, unescape_rules, &url_string,
- &new_parsed->path, offsets_for_adjustment);
+ &new_parsed->path, offset_for_adjustment);
}
if (parsed.query.is_valid())
url_string.push_back('?');
AppendFormattedComponent(spec, parsed.query, unescape_rules, &url_string,
- &new_parsed->query, offsets_for_adjustment);
+ &new_parsed->query, offset_for_adjustment);
// Reference is stored in valid, unescaped UTF-8, so we can just convert.
if (parsed.ref.is_valid()) {
url_string.push_back('#');
- size_t ref_begin = url_string.length();
- new_parsed->ref.begin = static_cast<int>(ref_begin);
-
- // Compose a list of offsets within the section.
- std::vector<size_t> offsets_into_ref =
- OffsetsIntoSection(offsets_for_adjustment, ref_begin);
-
+ new_parsed->ref.begin = url_string.length();
+ size_t offset_past_current_output =
+ ((*offset_for_adjustment == std::wstring::npos) ||
+ (*offset_for_adjustment < url_string.length())) ?
+ std::wstring::npos : (*offset_for_adjustment - url_string.length());
+ size_t* offset_into_ref =
+ (offset_past_current_output >= static_cast<size_t>(parsed.ref.len)) ?
+ NULL : &offset_past_current_output;
if (parsed.ref.len > 0) {
- url_string.append(UTF8ToWideAndAdjustOffsets(spec.substr(parsed.ref.begin,
- parsed.ref.len),
- &offsets_into_ref));
+ url_string.append(UTF8ToWideAndAdjustOffset(spec.substr(parsed.ref.begin,
+ parsed.ref.len),
+ offset_into_ref));
+ }
+ new_parsed->ref.len = url_string.length() - new_parsed->ref.begin;
+ if (offset_into_ref) {
+ *offset_for_adjustment = (*offset_into_ref == std::wstring::npos) ?
+ std::wstring::npos : (new_parsed->ref.begin + *offset_into_ref);
+ } else if (offset_past_current_output != std::wstring::npos) {
+ // We clamped the offset near the beginning of this function to ensure it
+ // was within the input URL. If we reach here, the input was something
+ // invalid and non-parseable such that the offset was past any component
+ // we could figure out. In this case it won't be represented in the
+ // output string, so reset it.
+ *offset_for_adjustment = std::wstring::npos;
}
- size_t old_ref_len = static_cast<size_t>(parsed.ref.len);
- size_t new_ref_len = url_string.length() - new_parsed->ref.begin;
- new_parsed->ref.len = static_cast<int>(new_ref_len);
-
- // Apply offset adjustments.
- ApplySectionAdjustments(offsets_into_ref, offsets_for_adjustment,
- old_ref_len, new_ref_len, ref_begin);
}
// If we need to strip out http do it after the fact. This way we don't need
@@ -1100,11 +1023,12 @@ std::wstring FormatUrlInternal(const GURL& url,
const size_t kHTTPSize = arraysize(kHTTP) - 1;
if (omit_http && !url_string.compare(0, kHTTPSize, kHTTP)) {
url_string = url_string.substr(kHTTPSize);
- AdjustOffset::Adjustments adjustments;
- adjustments.push_back(AdjustOffset::Adjustment(0, kHTTPSize, 0));
- std::for_each(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- AdjustOffset(adjustments));
+ if (*offset_for_adjustment != std::wstring::npos) {
+ if (*offset_for_adjustment < kHTTPSize)
+ *offset_for_adjustment = std::wstring::npos;
+ else
+ *offset_for_adjustment -= kHTTPSize;
+ }
if (prefix_end)
*prefix_end -= kHTTPSize;
@@ -1262,20 +1186,21 @@ std::string GetHeaderParamValue(const std::string& field,
//
// We may want to skip this step in the case of file URLs to allow unicode
// UNC hostnames regardless of encodings.
-std::wstring IDNToUnicodeWithOffsets(
- const char* host,
- size_t host_len,
- const std::wstring& languages,
- std::vector<size_t>* offsets_for_adjustment) {
+std::wstring IDNToUnicode(const char* host,
+ size_t host_len,
+ const std::wstring& languages,
+ size_t* offset_for_adjustment) {
// Convert the ASCII input to a wide string for ICU.
string16 input16;
input16.reserve(host_len);
input16.insert(input16.end(), host, host + host_len);
+ string16 out16;
+ size_t output_offset = offset_for_adjustment ?
+ *offset_for_adjustment : std::wstring::npos;
+
// Do each component of the host separately, since we enforce script matching
// on a per-component basis.
- AdjustOffset::Adjustments adjustments;
- string16 out16;
for (size_t component_start = 0, component_end;
component_start < input16.length();
component_start = component_end + 1) {
@@ -1284,18 +1209,22 @@ std::wstring IDNToUnicodeWithOffsets(
if (component_end == string16::npos)
component_end = input16.length(); // For getting the last component.
size_t component_length = component_end - component_start;
- size_t new_component_start = out16.length();
+
+ size_t output_component_start = out16.length();
bool converted_idn = false;
if (component_end > component_start) {
// Add the substring that we just found.
converted_idn = IDNToUnicodeOneComponent(input16.data() + component_start,
component_length, languages, &out16);
}
- size_t new_component_length = out16.length() - new_component_start;
+ size_t output_component_length = out16.length() - output_component_start;
- if (converted_idn && offsets_for_adjustment) {
- adjustments.push_back(AdjustOffset::Adjustment(
- component_start, component_length, new_component_length));
+ if ((output_offset != std::wstring::npos) &&
+ (*offset_for_adjustment > component_start)) {
+ if ((*offset_for_adjustment < component_end) && converted_idn)
+ output_offset = std::wstring::npos;
+ else
+ output_offset += output_component_length - component_length;
}
// Need to add the dot we just found (if we found one).
@@ -1303,28 +1232,10 @@ std::wstring IDNToUnicodeWithOffsets(
out16.push_back('.');
}
- // Make offset adjustment.
- if (offsets_for_adjustment && !adjustments.empty()) {
- std::for_each(offsets_for_adjustment->begin(),
- offsets_for_adjustment->end(),
- AdjustOffset(adjustments));
- }
-
- return UTF16ToWideAndAdjustOffsets(out16, offsets_for_adjustment);
-}
-
-std::wstring IDNToUnicode(const char* host,
- size_t host_len,
- const std::wstring& languages,
- size_t* offset_for_adjustment) {
- std::vector<size_t> offsets;
- if (offset_for_adjustment)
- offsets.push_back(*offset_for_adjustment);
- std::wstring result =
- IDNToUnicodeWithOffsets(host, host_len, languages, &offsets);
if (offset_for_adjustment)
- *offset_for_adjustment = offsets[0];
- return result;
+ *offset_for_adjustment = output_offset;
+
+ return UTF16ToWideAndAdjustOffset(out16, offset_for_adjustment);
}
std::string CanonicalizeHost(const std::string& host,
@@ -1737,73 +1648,51 @@ std::string GetHostOrSpecFromURL(const GURL& url) {
return url.has_host() ? TrimEndingDot(url.host()) : url.spec();
}
-void AppendFormattedHostWithOffsets(
- const GURL& url,
- const std::wstring& languages,
- std::wstring* output,
- url_parse::Parsed* new_parsed,
- std::vector<size_t>* offsets_for_adjustment) {
+void AppendFormattedHost(const GURL& url,
+ const std::wstring& languages,
+ std::wstring* output,
+ url_parse::Parsed* new_parsed,
+ size_t* offset_for_adjustment) {
DCHECK(output);
const url_parse::Component& host =
url.parsed_for_possibly_invalid_spec().host;
if (host.is_nonempty()) {
// Handle possible IDN in the host name.
- size_t host_begin = output->length();
+ int new_host_begin = static_cast<int>(output->length());
if (new_parsed)
- new_parsed->host.begin = static_cast<int>(host_begin);
- size_t old_host_len = static_cast<size_t>(host.len);
-
- // Compose a list of offsets within the host area.
- std::vector<size_t> offsets_into_host =
- OffsetsIntoSection(offsets_for_adjustment, host_begin);
+ new_parsed->host.begin = new_host_begin;
+ size_t offset_past_current_output =
+ (!offset_for_adjustment ||
+ (*offset_for_adjustment == std::wstring::npos) ||
+ (*offset_for_adjustment < output->length())) ?
+ std::wstring::npos : (*offset_for_adjustment - output->length());
+ size_t* offset_into_host =
+ (offset_past_current_output >= static_cast<size_t>(host.len)) ?
+ NULL : &offset_past_current_output;
const std::string& spec = url.possibly_invalid_spec();
DCHECK(host.begin >= 0 &&
((spec.length() == 0 && host.begin == 0) ||
host.begin < static_cast<int>(spec.length())));
- output->append(IDNToUnicodeWithOffsets(&spec[host.begin], old_host_len,
- languages, &offsets_into_host));
+ output->append(IDNToUnicode(&spec[host.begin],
+ static_cast<size_t>(host.len), languages, offset_into_host));
- size_t new_host_len = output->length() - host_begin;
+ int new_host_len = static_cast<int>(output->length()) - new_host_begin;
if (new_parsed)
- new_parsed->host.len = static_cast<int>(new_host_len);
-
- // Apply offset adjustments.
- ApplySectionAdjustments(offsets_into_host, offsets_for_adjustment,
- old_host_len, new_host_len, host_begin);
+ new_parsed->host.len = new_host_len;
+ if (offset_into_host) {
+ *offset_for_adjustment = (*offset_into_host == std::wstring::npos) ?
+ std::wstring::npos : (new_host_begin + *offset_into_host);
+ } else if (offset_past_current_output != std::wstring::npos) {
+ *offset_for_adjustment += new_host_len - host.len;
+ }
} else if (new_parsed) {
new_parsed->host.reset();
}
}
-void AppendFormattedHost(const GURL& url,
- const std::wstring& languages,
- std::wstring* output,
- url_parse::Parsed* new_parsed,
- size_t* offset_for_adjustment) {
- std::vector<size_t> offsets;
- if (offset_for_adjustment)
- offsets.push_back(*offset_for_adjustment);
- AppendFormattedHostWithOffsets(url, languages, output, new_parsed, &offsets);
- if (offset_for_adjustment)
- *offset_for_adjustment = offsets[0];
-}
-
// TODO(viettrungluu): convert the wstring |FormatUrlInternal()|.
-string16 FormatUrlWithOffsets(const GURL& url,
- const std::string& languages,
- FormatUrlTypes format_types,
- UnescapeRule::Type unescape_rules,
- url_parse::Parsed* new_parsed,
- size_t* prefix_end,
- std::vector<size_t>* offsets_for_adjustment) {
- return WideToUTF16Hack(
- FormatUrlInternal(url, ASCIIToWide(languages), format_types,
- unescape_rules, new_parsed, prefix_end,
- offsets_for_adjustment));
-}
-
string16 FormatUrl(const GURL& url,
const std::string& languages,
FormatUrlTypes format_types,
@@ -1811,15 +1700,10 @@ string16 FormatUrl(const GURL& url,
url_parse::Parsed* new_parsed,
size_t* prefix_end,
size_t* offset_for_adjustment) {
- std::vector<size_t> offsets;
- if (offset_for_adjustment)
- offsets.push_back(*offset_for_adjustment);
- string16 result = WideToUTF16Hack(
+ return WideToUTF16Hack(
FormatUrlInternal(url, ASCIIToWide(languages), format_types,
- unescape_rules, new_parsed, prefix_end, &offsets));
- if (offset_for_adjustment)
- *offset_for_adjustment = offsets[0];
- return result;
+ unescape_rules, new_parsed, prefix_end,
+ offset_for_adjustment));
}
bool CanStripTrailingSlash(const GURL& url) {
@@ -2272,12 +2156,4 @@ NetworkInterface::NetworkInterface(const std::string& name,
NetworkInterface::~NetworkInterface() {
}
-ClampComponentOffset::ClampComponentOffset(size_t component_start)
- : component_start(component_start) {}
-
-size_t ClampComponentOffset::operator()(size_t offset) {
- return (offset >= component_start) ?
- offset : std::wstring::npos;
-}
-
} // namespace net
diff --git a/net/base/net_util.h b/net/base/net_util.h
index 0ff3369..bae27c3 100644
--- a/net/base/net_util.h
+++ b/net/base/net_util.h
@@ -198,21 +198,15 @@ std::string GetFileNameFromCD(const std::string& header,
// script-language pairs (currently Han, Kana and Hangul for zh,ja and ko).
// When |languages| is empty, even that mixing is not allowed.
//
-// (|offset[s]_for_adjustment|) specifies one or more offsets into the original
-// |url|'s spec(); each offset will be adjusted to point at the same logical
-// place in the result strings during decoding. If this isn't possible because
-// an offset points past the end of |host| or into the middle of a punycode
-// sequence, the offending offset will be set to std::wstring::npos.
-// |offset[s]_for_adjustment| may be NULL.
+// |offset_for_adjustment| is an offset into |host|, which will be adjusted to
+// point at the same logical place in the output string. If this isn't possible
+// because it points past the end of |host| or into the middle of a punycode
+// sequence, it will be set to std::wstring::npos. |offset_for_adjustment| may
+// be NULL.
std::wstring IDNToUnicode(const char* host,
size_t host_len,
const std::wstring& languages,
size_t* offset_for_adjustment);
-std::wstring IDNToUnicodeWithOffsets(
- const char* host,
- size_t host_len,
- const std::wstring& languages,
- std::vector<size_t>* offsets_for_adjustment);
// Canonicalizes |host| and returns it. Also fills |host_info| with
// IP address information. |host_info| must not be NULL.
@@ -298,24 +292,11 @@ int SetNonBlocking(int fd);
// the user. The given parsed structure will be updated. The host name formatter
// also takes the same accept languages component as ElideURL. |new_parsed| may
// be null.
-//
-// (|offset[s]_for_adjustment|) specifies one or more offsets into the original
-// |url|'s spec(); each offset will be adjusted to point at the same logical
-// place in the result strings after reformatting of the host. If this isn't
-// possible because an offset points past the end of the host or into the middle
-// of a multi-character sequence, the offending offset will be set to
-// std::wstring::npos. |offset[s]_for_adjustment| may be NULL.
void AppendFormattedHost(const GURL& url,
const std::wstring& languages,
std::wstring* output,
url_parse::Parsed* new_parsed,
size_t* offset_for_adjustment);
-void AppendFormattedHostWithOffsets(
- const GURL& url,
- const std::wstring& languages,
- std::wstring* output,
- url_parse::Parsed* new_parsed,
- std::vector<size_t>* offsets_for_adjustment);
// Creates a string representation of |url|. The IDN host name may be in Unicode
// if |languages| accepts the Unicode representation. |format_type| is a bitmask
@@ -328,13 +309,12 @@ void AppendFormattedHostWithOffsets(
// The last three parameters may be NULL.
// |new_parsed| will be set to the parsing parameters of the resultant URL.
// |prefix_end| will be the length before the hostname of the resultant URL.
-//
-// (|offset[s]_for_adjustment|) specifies one or more offsets into the original
-// |url|'s spec(); each offset will be modified to reflect changes this function
-// makes to the output string. For example, if |url| is "http://a:b@c.com/",
-// |omit_username_password| is true, and an offset is 12 (the offset of '.'),
-// then on return the output string will be "http://c.com/" and the offset will
-// be 8. If an offset cannot be successfully adjusted (e.g. because it points
+// |offset_for_adjustment| is an offset into the original |url|'s spec(), which
+// will be modified to reflect changes this function makes to the output string;
+// for example, if |url| is "http://a:b@c.com/", |omit_username_password| is
+// true, and |offset_for_adjustment| is 12 (the offset of '.'), then on return
+// the output string will be "http://c.com/" and |offset_for_adjustment| will be
+// 8. If the offset cannot be successfully adjusted (e.g. because it points
// into the middle of a component that was entirely removed, past the end of the
// string, or into the middle of an encoding sequence), it will be set to
// string16::npos.
@@ -345,13 +325,6 @@ string16 FormatUrl(const GURL& url,
url_parse::Parsed* new_parsed,
size_t* prefix_end,
size_t* offset_for_adjustment);
-string16 FormatUrlWithOffsets(const GURL& url,
- const std::string& languages,
- FormatUrlTypes format_types,
- UnescapeRule::Type unescape_rules,
- url_parse::Parsed* new_parsed,
- size_t* prefix_end,
- std::vector<size_t>* offsets_for_adjustment);
// This is a convenience function for FormatUrl() with
// format_types = kFormatUrlOmitAll and unescape = SPACES. This is the typical
@@ -481,16 +454,6 @@ typedef std::list<NetworkInterface> NetworkInterfaceList;
// Can be called only on a thread that allows IO.
bool GetNetworkList(NetworkInterfaceList* networks);
-// Private adjustment function called by std::transform which sets the offset
-// to npos if the offset occurs at or before |component_start|, otherwise don't
-// alter the offset. Exposed here for unit testing.
-struct ClampComponentOffset {
- explicit ClampComponentOffset(size_t component_start);
- size_t operator()(size_t offset);
-
- const size_t component_start;
-};
-
} // namespace net
#endif // NET_BASE_NET_UTIL_H_
diff --git a/net/base/net_util_unittest.cc b/net/base/net_util_unittest.cc
index 4265866..b547f83 100644
--- a/net/base/net_util_unittest.cc
+++ b/net/base/net_util_unittest.cc
@@ -4,8 +4,6 @@
#include "net/base/net_util.h"
-#include <algorithm>
-
#include "base/file_path.h"
#include "base/format_macros.h"
#include "base/string_number_conversions.h"
@@ -23,8 +21,6 @@ namespace net {
namespace {
-static const size_t kNpos = string16::npos;
-
struct FileCase {
const wchar_t* file;
const char* url;
@@ -992,20 +988,6 @@ TEST(NetUtilTest, IDNToUnicodeAdjustOffset) {
&offset);
EXPECT_EQ(adjust_cases[i].output_offset, offset);
}
-
- std::vector<size_t> offsets;
- for (size_t i = 0; i < 40; ++i)
- offsets.push_back(i);
- IDNToUnicodeWithOffsets("test.xn--cy2a840a.xn--1lq90ic7f1rc.test", 39,
- L"zh-CN", &offsets);
- size_t expected[] = {0, 1, 2, 3, 4, 5, kNpos, kNpos, kNpos, kNpos, kNpos,
- kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, 7, 8, kNpos,
- kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, kNpos,
- kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, 12, 13, 14, 15,
- 16, kNpos};
- ASSERT_EQ(40U, arraysize(expected));
- for (size_t i = 0; i < 40; ++i)
- EXPECT_EQ(expected[i], offsets[i]);
}
TEST(NetUtilTest, CompliantHost) {
@@ -1817,24 +1799,13 @@ TEST(NetUtilTest, FormatUrlAdjustOffset) {
EXPECT_EQ(basic_cases[i].output_offset, offset);
}
- size_t url_size = 26;
- std::vector<size_t> offsets;
- for (size_t i = 0; i < url_size + 1; ++i)
- offsets.push_back(i);
- FormatUrlWithOffsets(GURL("http://www.google.com/foo/"), "en",
- kFormatUrlOmitUsernamePassword, UnescapeRule::NORMAL,
- NULL, NULL, &offsets);
- for (size_t i = 0; i < url_size; ++i)
- EXPECT_EQ(i, offsets[i]);
- EXPECT_EQ(kNpos, offsets[url_size]);
-
const struct {
const char* input_url;
size_t input_offset;
size_t output_offset;
} omit_auth_cases[] = {
{"http://foo:bar@www.google.com/", 6, 6},
- {"http://foo:bar@www.google.com/", 7, string16::npos},
+ {"http://foo:bar@www.google.com/", 7, 7},
{"http://foo:bar@www.google.com/", 8, string16::npos},
{"http://foo:bar@www.google.com/", 10, string16::npos},
{"http://foo:bar@www.google.com/", 11, string16::npos},
@@ -1852,28 +1823,13 @@ TEST(NetUtilTest, FormatUrlAdjustOffset) {
EXPECT_EQ(omit_auth_cases[i].output_offset, offset);
}
- url_size = 30;
- offsets.clear();
- for (size_t i = 0; i < url_size; ++i)
- offsets.push_back(i);
- FormatUrlWithOffsets(GURL("http://foo:bar@www.google.com/"), "en",
- kFormatUrlOmitUsernamePassword, UnescapeRule::NORMAL,
- NULL, NULL, &offsets);
- for (size_t i = 0; i < 7; ++i)
- EXPECT_EQ(i, offsets[i]);
- for (size_t i = 7; i < 15; ++i)
- EXPECT_EQ(kNpos, offsets[i]);
- for (size_t i = 16; i < url_size; ++i)
- EXPECT_EQ(i - 8 , offsets[i]);
-
const AdjustOffsetCase view_source_cases[] = {
{0, 0},
{3, 3},
{11, 11},
{12, 12},
{13, 13},
- {18, 18},
- {19, string16::npos},
+ {19, 19},
{20, string16::npos},
{23, 19},
{26, 22},
@@ -1887,20 +1843,6 @@ TEST(NetUtilTest, FormatUrlAdjustOffset) {
EXPECT_EQ(view_source_cases[i].output_offset, offset);
}
- url_size = 38;
- offsets.clear();
- for (size_t i = 0; i < url_size; ++i)
- offsets.push_back(i);
- FormatUrlWithOffsets(GURL("view-source:http://foo@www.google.com/"), "en",
- kFormatUrlOmitUsernamePassword, UnescapeRule::NORMAL,
- NULL, NULL, &offsets);
- size_t expected[] = {0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16,
- 17, 18, kNpos, kNpos, kNpos, kNpos, 19, 20, 21, 22, 23,
- 24, 25, 26, 27, 28, 29, 30, 31, 32, 33};
- ASSERT_EQ(url_size, arraysize(expected));
- for (size_t i = 0; i < url_size; ++i)
- EXPECT_EQ(expected[i], offsets[i]);
-
const AdjustOffsetCase idn_hostname_cases[] = {
{8, string16::npos},
{16, string16::npos},
@@ -1917,21 +1859,6 @@ TEST(NetUtilTest, FormatUrlAdjustOffset) {
EXPECT_EQ(idn_hostname_cases[i].output_offset, offset);
}
- url_size = 33;
- offsets.clear();
- for (size_t i = 0; i < url_size; ++i)
- offsets.push_back(i);
- FormatUrlWithOffsets(GURL("http://xn--l8jvb1ey91xtjb.jp/foo/"), "ja",
- kFormatUrlOmitUsernamePassword, UnescapeRule::NORMAL,
- NULL, NULL, &offsets);
- size_t expected_1[] = {0, 1, 2, 3, 4, 5, 6, 7, kNpos, kNpos, kNpos, kNpos,
- kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, kNpos,
- kNpos, kNpos, kNpos, kNpos, kNpos, 12, 13, 14, 15, 16,
- 17, 18, 19};
- ASSERT_EQ(url_size, arraysize(expected_1));
- for (size_t i = 0; i < url_size; ++i)
- EXPECT_EQ(expected_1[i], offsets[i]);
-
const AdjustOffsetCase unescape_cases[] = {
{25, 25},
{26, string16::npos},
@@ -1954,31 +1881,11 @@ TEST(NetUtilTest, FormatUrlAdjustOffset) {
EXPECT_EQ(unescape_cases[i].output_offset, offset);
}
- url_size = 68;
- offsets.clear();
- for (size_t i = 0; i < url_size; ++i)
- offsets.push_back(i);
- FormatUrlWithOffsets(GURL(
- "http://www.google.com/foo%20bar/%E3%82%B0%E3%83%BC%E3%82%B0%E3%83%AB"),
- "en", kFormatUrlOmitUsernamePassword, UnescapeRule::SPACES, NULL, NULL,
- &offsets);
- size_t expected_2[] = {0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15,
- 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, kNpos, kNpos,
- 26, 27, 28, 29, 30, kNpos, kNpos, kNpos, kNpos, kNpos,
- kNpos, kNpos, kNpos, 31, kNpos, kNpos, kNpos, kNpos,
- kNpos, kNpos, kNpos, kNpos, 32, kNpos, kNpos, kNpos,
- kNpos, kNpos, kNpos, kNpos, kNpos, 33, kNpos, kNpos,
- kNpos, kNpos, kNpos, kNpos, kNpos, kNpos};
- ASSERT_EQ(url_size, arraysize(expected_2));
- for (size_t i = 0; i < url_size; ++i)
- EXPECT_EQ(expected_2[i], offsets[i]);
-
const AdjustOffsetCase ref_cases[] = {
{30, 30},
{31, 31},
{32, string16::npos},
{34, 32},
- {35, string16::npos},
{37, 33},
{38, string16::npos},
};
@@ -1992,22 +1899,6 @@ TEST(NetUtilTest, FormatUrlAdjustOffset) {
EXPECT_EQ(ref_cases[i].output_offset, offset);
}
- url_size = 38;
- offsets.clear();
- for (size_t i = 0; i < url_size; ++i)
- offsets.push_back(i);
- // "http://www.google.com/foo.html#\x30B0\x30B0z"
- FormatUrlWithOffsets(GURL(
- "http://www.google.com/foo.html#\xE3\x82\xB0\xE3\x82\xB0z"), "en",
- kFormatUrlOmitUsernamePassword, UnescapeRule::NORMAL, NULL, NULL,
- &offsets);
- size_t expected_3[] = {0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15,
- 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29,
- 30, 31, kNpos, kNpos, 32, kNpos, kNpos, 33};
- ASSERT_EQ(url_size, arraysize(expected_3));
- for (size_t i = 0; i < url_size; ++i)
- EXPECT_EQ(expected_3[i], offsets[i]);
-
const AdjustOffsetCase omit_http_cases[] = {
{0, string16::npos},
{3, string16::npos},
@@ -2021,18 +1912,6 @@ TEST(NetUtilTest, FormatUrlAdjustOffset) {
EXPECT_EQ(omit_http_cases[i].output_offset, offset);
}
- url_size = 23;
- offsets.clear();
- for (size_t i = 0; i < url_size; ++i)
- offsets.push_back(i);
- FormatUrlWithOffsets(GURL("http://www.google.com"), "en",
- kFormatUrlOmitHTTP, UnescapeRule::NORMAL, NULL, NULL, &offsets);
- size_t expected_4[] = {kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, 0, 1,
- 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, kNpos};
- ASSERT_EQ(url_size, arraysize(expected_4));
- for (size_t i = 0; i < url_size; ++i)
- EXPECT_EQ(expected_4[i], offsets[i]);
-
const AdjustOffsetCase omit_http_start_with_ftp[] = {
{0, 0},
{3, 3},
@@ -2045,18 +1924,6 @@ TEST(NetUtilTest, FormatUrlAdjustOffset) {
EXPECT_EQ(omit_http_start_with_ftp[i].output_offset, offset);
}
- url_size = 23;
- offsets.clear();
- for (size_t i = 0; i < url_size; ++i)
- offsets.push_back(i);
- FormatUrlWithOffsets(GURL("http://ftp.google.com"), "en",
- kFormatUrlOmitHTTP, UnescapeRule::NORMAL, NULL, NULL, &offsets);
- size_t expected_5[] = {0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15,
- 16, 17, 18, 19, 20, 21, kNpos};
- ASSERT_EQ(url_size, arraysize(expected_5));
- for (size_t i = 0; i < url_size; ++i)
- EXPECT_EQ(expected_5[i], offsets[i]);
-
const AdjustOffsetCase omit_all_cases[] = {
{12, 0},
{13, 1},
@@ -2069,19 +1936,6 @@ TEST(NetUtilTest, FormatUrlAdjustOffset) {
UnescapeRule::NORMAL, NULL, NULL, &offset);
EXPECT_EQ(omit_all_cases[i].output_offset, offset);
}
-
- url_size = 21;
- offsets.clear();
- for (size_t i = 0; i < url_size; ++i)
- offsets.push_back(i);
- FormatUrlWithOffsets(GURL("http://user@foo.com/"), "en", kFormatUrlOmitAll,
- UnescapeRule::NORMAL, NULL, NULL, &offsets);
- size_t expected_6[] = {kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, kNpos, kNpos,
- kNpos, kNpos, kNpos, kNpos, 0, 1, 2, 3, 4, 5, 6, 7,
- kNpos};
- ASSERT_EQ(url_size, arraysize(expected_6));
- for (size_t i = 0; i < url_size; ++i)
- EXPECT_EQ(expected_6[i], offsets[i]);
}
TEST(NetUtilTest, SimplifyUrlForRequest) {
@@ -2367,20 +2221,4 @@ TEST(NetUtilTest, GetNetworkList) {
}
}
-TEST(NetUtilTest, AdjustComponentOffset) {
- std::vector<size_t> old_offsets;
- for (size_t i = 0; i < 10; ++i)
- old_offsets.push_back(i);
- std::vector<size_t> new_offsets;
- std::transform(old_offsets.begin(),
- old_offsets.end(),
- std::back_inserter(new_offsets),
- ClampComponentOffset(5));
- size_t expected_1[] = {kNpos, kNpos, kNpos, kNpos, kNpos, 5, 6, 7, 8, 9};
- EXPECT_EQ(new_offsets.size(), arraysize(expected_1));
- EXPECT_EQ(new_offsets.size(), old_offsets.size());
- for (size_t i = 0; i < arraysize(expected_1); ++i)
- EXPECT_EQ(expected_1[i], new_offsets[i]);
-}
-
} // namespace net