// Copyright (c) 2012 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #include "chrome/common/content_settings_pattern_parser.h" #include "base/string_util.h" #include "chrome/common/url_constants.h" #include "extensions/common/constants.h" #include "googleurl/src/gurl.h" #include "googleurl/src/url_canon.h" #include "net/base/net_util.h" namespace { const char* kUrlPathSeparator = "/"; const char* kUrlPortSeparator = ":"; class Component { public: Component() : start(0), len(0) {} Component(size_t s, size_t l) : start(s), len(l) {} bool IsNonEmpty() { return len > 0; } size_t start; size_t len; }; } // namespace namespace content_settings { const char* PatternParser::kDomainWildcard = "[*.]"; const size_t PatternParser::kDomainWildcardLength = 4; const char* PatternParser::kSchemeWildcard = "*"; const char* PatternParser::kHostWildcard = "*"; const char* PatternParser::kPortWildcard = "*"; const char* PatternParser::kPathWildcard = "*"; // static void PatternParser::Parse(const std::string& pattern_spec, ContentSettingsPattern::BuilderInterface* builder) { if (pattern_spec == "*") { builder->WithSchemeWildcard(); builder->WithDomainWildcard(); builder->WithPortWildcard(); return; } // Initialize components for the individual patterns parts to empty // sub-strings. Component scheme_component; Component host_component; Component port_component; Component path_component; size_t start = 0; size_t current_pos = 0; if (pattern_spec.empty()) return; // Test if a scheme pattern is in the spec. current_pos = pattern_spec.find( std::string(content::kStandardSchemeSeparator), start); if (current_pos != std::string::npos) { scheme_component = Component(start, current_pos); start = current_pos + strlen(content::kStandardSchemeSeparator); current_pos = start; } else { current_pos = start; } if (start >= pattern_spec.size()) return; // Bad pattern spec. // Jump to the end of domain wildcards or an IPv6 addresses. IPv6 addresses // contain ':'. So first move to the end of an IPv6 address befor searching // for the ':' that separates the port form the host. if (pattern_spec[current_pos] == '[') current_pos = pattern_spec.find("]", start); if (current_pos == std::string::npos) return; // Bad pattern spec. current_pos = pattern_spec.find(std::string(kUrlPortSeparator), current_pos); if (current_pos == std::string::npos) { // No port spec found current_pos = pattern_spec.find(std::string(kUrlPathSeparator), start); if (current_pos == std::string::npos) { current_pos = pattern_spec.size(); host_component = Component(start, current_pos - start); } else { // Pattern has a path spec. host_component = Component(start, current_pos - start); } start = current_pos; } else { // Port spec found. host_component = Component(start, current_pos - start); start = current_pos + 1; if (start < pattern_spec.size()) { current_pos = pattern_spec.find(std::string(kUrlPathSeparator), start); if (current_pos == std::string::npos) { current_pos = pattern_spec.size(); } port_component = Component(start, current_pos - start); start = current_pos; } } current_pos = pattern_spec.size(); if (start < current_pos) { // Pattern has a path spec. path_component = Component(start, current_pos - start); } // Set pattern parts. std::string scheme; if (scheme_component.IsNonEmpty()) { scheme = pattern_spec.substr(scheme_component.start, scheme_component.len); if (scheme == kSchemeWildcard) { builder->WithSchemeWildcard(); } else { builder->WithScheme(scheme); } } else { builder->WithSchemeWildcard(); } if (host_component.IsNonEmpty()) { std::string host = pattern_spec.substr(host_component.start, host_component.len); if (host == kHostWildcard) { builder->WithDomainWildcard(); } else if (StartsWithASCII(host, kDomainWildcard, true)) { host = host.substr(kDomainWildcardLength); builder->WithDomainWildcard(); builder->WithHost(host); } else { // If the host contains a wildcard symbol then it is invalid. if (host.find(kHostWildcard) != std::string::npos) { builder->Invalid(); return; } builder->WithHost(host); } } if (port_component.IsNonEmpty()) { const std::string port = pattern_spec.substr(port_component.start, port_component.len); if (port == kPortWildcard) { builder->WithPortWildcard(); } else { // Check if the port string represents a valid port. for (size_t i = 0; i < port.size(); ++i) { if (!IsAsciiDigit(port[i])) { builder->Invalid(); return; } } // TODO(markusheintz): Check port range. builder->WithPort(port); } } else { if (scheme != std::string(extensions::kExtensionScheme) && scheme != std::string(chrome::kFileScheme)) builder->WithPortWildcard(); } if (path_component.IsNonEmpty()) { const std::string path = pattern_spec.substr(path_component.start, path_component.len); if (path.substr(1) == kPathWildcard) builder->WithPathWildcard(); else builder->WithPath(path); } } // static std::string PatternParser::ToString( const ContentSettingsPattern::PatternParts& parts) { // Return the most compact form to support legacy code and legacy pattern // strings. if (parts.is_scheme_wildcard && parts.has_domain_wildcard && parts.host.empty() && parts.is_port_wildcard) return "*"; std::string str; if (!parts.is_scheme_wildcard) str += parts.scheme + content::kStandardSchemeSeparator; if (parts.scheme == chrome::kFileScheme) { if (parts.is_path_wildcard) return str + kUrlPathSeparator + kPathWildcard; else return str + parts.path; } if (parts.has_domain_wildcard) { if (parts.host.empty()) str += kHostWildcard; else str += kDomainWildcard; } str += parts.host; if (parts.scheme == std::string(extensions::kExtensionScheme)) { str += parts.path.empty() ? std::string(kUrlPathSeparator) : parts.path; return str; } if (!parts.is_port_wildcard) { str += std::string(kUrlPortSeparator) + parts.port; } return str; } } // namespace content_settings