diff options
6 files changed, 361 insertions, 1 deletions
diff --git a/url/ b/url/
index db5a6ad..2beed04 100644
--- a/url/
+++ b/url/
@@ -24,6 +24,8 @@ component("url") {
+ "",
+ "origin.h",
@@ -97,6 +99,7 @@ if (!is_android) {
sources = [
+ "",
diff --git a/url/ b/url/
new file mode 100644
index 0000000..e80eb72
--- /dev/null
+++ b/url/
@@ -0,0 +1,69 @@
+// Copyright 2015 The Chromium Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style license that can be
+// found in the LICENSE file.
+#include "url/origin.h"
+#include <string.h>
+#include "base/logging.h"
+#include "base/strings/string_number_conversions.h"
+#include "url/gurl.h"
+#include "url/url_canon.h"
+#include "url/url_canon_stdstring.h"
+#include "url/url_constants.h"
+#include "url/url_util.h"
+namespace url {
+Origin::Origin() : unique_(true) {
+Origin::Origin(const GURL& url) : unique_(true) {
+ if (!url.is_valid() || (!url.IsStandard() && !url.SchemeIsBlob()))
+ return;
+ if (url.SchemeIsFileSystem()) {
+ tuple_ = SchemeHostPort(*url.inner_url());
+ } else if (url.SchemeIsBlob()) {
+ // TODO(mkwst): This relies on the fact that GURL pushes the unparseable
+ // bits and pieces of a non-standard scheme into the GURL's path. It seems
+ // fairly fragile, so it might be worth teaching GURL about blobs' data in
+ // the same way it's been taught about filesystems' inner URLs.
+ tuple_ = SchemeHostPort(GURL(url.path()));
+ } else {
+ tuple_ = SchemeHostPort(url);
+ }
+ unique_ = tuple_.IsInvalid();
+Origin::~Origin() {
+std::string Origin::Serialize() const {
+ if (unique())
+ return "null";
+ if (scheme() == kFileScheme)
+ return "file://";
+ return tuple_.Serialize();
+bool Origin::IsSameOriginWith(const Origin& other) const {
+ if (unique_ || other.unique_)
+ return false;
+ return tuple_.Equals(other.tuple_);
+bool Origin::operator<(const Origin& other) const {
+ return tuple_ < other.tuple_;
+std::ostream& operator<<(std::ostream& out, const url::Origin& origin) {
+ return out << origin.Serialize();
+} // namespace url
diff --git a/url/origin.h b/url/origin.h
new file mode 100644
index 0000000..15fe0ea
--- /dev/null
+++ b/url/origin.h
@@ -0,0 +1,125 @@
+// Copyright 2015 The Chromium Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style license that can be
+// found in the LICENSE file.
+#ifndef URL_ORIGIN_H_
+#define URL_ORIGIN_H_
+#include <string>
+#include "base/strings/string16.h"
+#include "url/scheme_host_port.h"
+#include "url/third_party/mozilla/url_parse.h"
+#include "url/url_canon.h"
+#include "url/url_constants.h"
+#include "url/url_export.h"
+class GURL;
+namespace url {
+// An Origin is a tuple of (scheme, host, port), as described in RFC 6454.
+// TL;DR: If you need to make a security-relevant decision, use 'url::Origin'.
+// If you only need to extract the bits of a URL which are relevant for a
+// network connection, use 'url::SchemeHostPort'.
+// STL;SDR: If you aren't making actual network connections, use 'url::Origin'.
+// 'Origin', like 'SchemeHostPort', is composed of a tuple of (scheme, host,
+// port), but contains a number of additional concepts which make it appropriate
+// for use as a security boundary and access control mechanism between contexts.
+// This class ought to be used when code needs to determine if two resources
+// are "same-origin", and when a canonical serialization of an origin is
+// required. Note that some origins are "unique", meaning that they are not
+// same-origin with any other origin (including themselves).
+// There are a few subtleties to note:
+// * Invalid and non-standard GURLs are parsed as unique origins. This includes
+// non-hierarchical URLs like 'data:text/html,...' and 'javascript:alert(1)'.
+// * GURLs with schemes of 'filesystem' or 'blob' parse the origin out of the
+// internals of the URL. That is, 'filesystem:https://example.com/temporary/f'
+// is parsed as ('https', 'example.com', 443).
+// * Unique origins all serialize to the string "null"; this means that the
+// serializations of two unique origins are identical to each other, though
+// the origins themselves are not "the same". This means that origins'
+// serializations must not be relied upon for security checks.
+// * GURLs with a 'file' scheme are tricky. They are parsed as ('file', '', 0),
+// but their behavior may differ from embedder to embedder.
+// * The host component of an IPv6 address includes brackets, just like the URL
+// representation.
+// Usage:
+// * Origins are generally constructed from an already-canonicalized GURL:
+// GURL url("https://example.com/");
+// url::Origin origin(url);
+// origin.scheme(); // "https"
+// origin.host(); // "example.com"
+// origin.port(); // 443
+// origin.unique(); // false
+// * To answer the question "Are |this| and |that| "same-origin" with each
+// other?", use |Origin::IsSameOriginWith|:
+// if (this.IsSameOriginWith(that)) {
+// // Amazingness goes here.
+// }
+class URL_EXPORT Origin {
+ public:
+ // Creates a unique Origin.
+ Origin();
+ // Creates an Origin from |url|, as described at
+ // https://url.spec.whatwg.org/#origin, with the following additions:
+ //
+ // 1. If |url| is invalid or non-standard, a unique Origin is constructed.
+ // 2. 'filesystem' URLs behave as 'blob' URLs (that is, the origin is parsed
+ // out of everything in the URL which follows the scheme).
+ // 3. 'file' URLs all parse as ("file", "", 0).
+ explicit Origin(const GURL& url);
+ ~Origin();
+ // For unique origins, these return ("", "", 0).
+ //
+ // TODO(mkwst): These should be 'const std::string&', along with their
+ // 'url::SchemeHostPort' analogs.
+ std::string scheme() const { return tuple_.scheme(); }
+ // Returns the host component of the underlying (scheme, host, port) tuple.
+ std::string host() const { return tuple_.host(); }
+ uint16 port() const { return tuple_.port(); }
+ bool unique() const { return unique_; }
+ // An ASCII serialization of the Origin as per Section 6.2 of RFC 6454, with
+ // the addition that all Origins with a 'file' scheme serialize to "file://".
+ std::string Serialize() const;
+ // Two Origins are "same-origin" if their schemes, hosts, and ports are exact
+ // matches; and neither is unique.
+ bool IsSameOriginWith(const Origin& other) const;
+ // Allows Origin to be used as a key in STL containers (for example, a
+ // std::set or std::map).
+ bool operator<(const Origin& other) const;
+ private:
+ SchemeHostPort tuple_;
+ bool unique_;
+URL_EXPORT std::ostream& operator<<(std::ostream& out,
+ const Origin& origin);
+} // namespace url
diff --git a/url/ b/url/
new file mode 100644
index 0000000..a774c62
--- /dev/null
+++ b/url/
@@ -0,0 +1,160 @@
+// Copyright 2015 The Chromium Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style license that can be
+// found in the LICENSE file.
+#include "url/origin.h"
+#include "testing/gtest/include/gtest/gtest.h"
+#include "url/gurl.h"
+namespace {
+TEST(OriginTest, UniqueOriginComparison) {
+ url::Origin unique_origin;
+ EXPECT_EQ("", unique_origin.scheme());
+ EXPECT_EQ("",;
+ EXPECT_EQ(0, unique_origin.port());
+ EXPECT_TRUE(unique_origin.unique());
+ EXPECT_FALSE(unique_origin.IsSameOriginWith(unique_origin));
+ const char* const urls[] = {"data:text/html,Hello!",
+ "javascript:alert(1)",
+ "file://",
+ "yay",
+ "http::///"};
+ for (const auto& test_url : urls) {
+ SCOPED_TRACE(test_url);
+ GURL url(test_url);
+ url::Origin origin(url);
+ EXPECT_EQ("", origin.scheme());
+ EXPECT_EQ("",;
+ EXPECT_EQ(0, origin.port());
+ EXPECT_TRUE(origin.unique());
+ EXPECT_FALSE(origin.IsSameOriginWith(origin));
+ EXPECT_FALSE(unique_origin.IsSameOriginWith(origin));
+ EXPECT_FALSE(origin.IsSameOriginWith(unique_origin));
+ }
+TEST(OriginTest, ConstructFromGURL) {
+ url::Origin different_origin(GURL("https://not-in-the-list.test/"));
+ struct TestCases {
+ const char* const url;
+ const char* const expected_scheme;
+ const char* const expected_host;
+ const uint16 expected_port;
+ } cases[] = {
+ // IP Addresses
+ {"", "http", "", 80},
+ {"http://[2001:db8::1]/", "http", "[2001:db8::1]", 80},
+ // Punycode
+ {"http://☃.net/", "http", "", 80},
+ {"blob:http://☃.net/", "http", "", 80},
+ // Generic URLs
+ {"", "http", "", 80},
+ {"", "http", "", 123},
+ {"", "https", "", 443},
+ {"", "https", "", 123},
+ {"", "http", "", 80},
+ {"", "http", "", 123},
+ {"", "https", "", 443},
+ {"", "https", "", 123},
+ // Registered URLs
+ {"", "ftp", "", 21},
+ {"gopher://", "gopher", "", 70},
+ {"ws://", "ws", "", 80},
+ {"wss://", "wss", "", 443},
+ // file: URLs
+ {"file:///etc/passwd", "file", "", 0},
+ {"file://", "file", "", 0},
+ // Filesystem:
+ {"filesystem:", "http", "", 80},
+ {"filesystem:", "http", "", 123},
+ {"filesystem:", "https", "", 443},
+ {"filesystem:", "https", "", 123},
+ // Blob:
+ {"blob:", "http", "", 80},
+ {"blob:", "http", "", 123},
+ {"blob:", "https", "", 443},
+ {"blob:", "http", "", 80},
+ };
+ for (const auto& test_case : cases) {
+ SCOPED_TRACE(test_case.url);
+ GURL url(test_case.url);
+ EXPECT_TRUE(url.is_valid());
+ url::Origin origin(url);
+ EXPECT_EQ(test_case.expected_scheme, origin.scheme());
+ EXPECT_EQ(test_case.expected_host,;
+ EXPECT_EQ(test_case.expected_port, origin.port());
+ EXPECT_FALSE(origin.unique());
+ EXPECT_TRUE(origin.IsSameOriginWith(origin));
+ EXPECT_FALSE(different_origin.IsSameOriginWith(origin));
+ EXPECT_FALSE(origin.IsSameOriginWith(different_origin));
+ }
+TEST(OriginTest, Serialization) {
+ struct TestCases {
+ const char* const url;
+ const char* const expected;
+ } cases[] = {
+ {"", ""},
+ {"http://[2001:db8::1]/", "http://[2001:db8::1]"},
+ {"http://☃.net/", ""},
+ {"", ""},
+ {"", ""},
+ {"", ""},
+ {"", ""},
+ {"file:///etc/passwd", "file://"},
+ {"file://", "file://"},
+ };
+ for (const auto& test_case : cases) {
+ SCOPED_TRACE(test_case.url);
+ GURL url(test_case.url);
+ EXPECT_TRUE(url.is_valid());
+ url::Origin origin(url);
+ EXPECT_EQ(test_case.expected, origin.Serialize());
+ // The '<<' operator should produce the same serialization as Serialize().
+ std::stringstream out;
+ out << origin;
+ EXPECT_EQ(test_case.expected, out.str());
+ }
+TEST(OriginTest, Comparison) {
+ // These URLs are arranged in increasing order:
+ const char* const urls[] = {
+ "data:uniqueness",
+ "http://a:80",
+ "http://b:80",
+ "https://a:80",
+ "https://b:80",
+ "http://a:81",
+ "http://b:81",
+ "https://a:81",
+ "https://b:81",
+ };
+ for (size_t i = 0; i < arraysize(urls); i++) {
+ GURL current_url(urls[i]);
+ url::Origin current(current_url);
+ for (size_t j = i; j < arraysize(urls); j++) {
+ GURL compare_url(urls[j]);
+ url::Origin to_compare(compare_url);
+ EXPECT_EQ(i < j, current < to_compare) << i << " < " << j;
+ EXPECT_EQ(j < i, to_compare < current) << j << " < " << i;
+ }
+ }
+} // namespace
diff --git a/url/url.gyp b/url/url.gyp
index 198d448..b8355a8 100644
--- a/url/url.gyp
+++ b/url/url.gyp
@@ -46,8 +46,9 @@
'sources': [
- '',
+ '',
+ '',
diff --git a/url/url_srcs.gypi b/url/url_srcs.gypi
index 525598b..21d2fe1 100644
--- a/url/url_srcs.gypi
+++ b/url/url_srcs.gypi
@@ -11,6 +11,8 @@
+ '',
+ 'origin.h',