Add net to the repository.

git-svn-id: svn://svn.chromium.org/chrome/trunk/src@14 0039d316-1c4b-4281-b951-d872f2087c98
author: initial.commit <initial.commit@0039d316-1c4b-4281-b951-d872f2087c98> 2008-07-26 22:42:52 +0000
committer: initial.commit <initial.commit@0039d316-1c4b-4281-b951-d872f2087c98> 2008-07-26 22:42:52 +0000
commit: 586acc5fe142f498261f52c66862fa417c3d52d2 (patch)
tree: c98b3417a883f2477029c8cd5888f4078681e24e /net/http/http_util.cc
parent: a814a8d55429605fe6d7045045cd25b6bf624580 (diff)
download: chromium_src-586acc5fe142f498261f52c66862fa417c3d52d2.zip
chromium_src-586acc5fe142f498261f52c66862fa417c3d52d2.tar.gz
chromium_src-586acc5fe142f498261f52c66862fa417c3d52d2.tar.bz2
1 files changed, 358 insertions, 0 deletions
diff --git a/net/http/http_util.cc b/net/http/http_util.cc
new file mode 100644
index 0000000..a56a4db
--- /dev/null
+++ b/net/http/http_util.cc
@@ -0,0 +1,358 @@
+// Copyright 2008, Google Inc.
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are
+// met:
+//
+//    * Redistributions of source code must retain the above copyright
+// notice, this list of conditions and the following disclaimer.
+//    * Redistributions in binary form must reproduce the above
+// copyright notice, this list of conditions and the following disclaimer
+// in the documentation and/or other materials provided with the
+// distribution.
+//    * Neither the name of Google Inc. nor the names of its
+// contributors may be used to endorse or promote products derived from
+// this software without specific prior written permission.
+//
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+// The rules for parsing content-types were borrowed from Firefox:
+// http://lxr.mozilla.org/mozilla/source/netwerk/base/src/nsURLHelper.cpp#834
+
+#include "net/http/http_util.h"
+
+#include <algorithm>
+
+#include "base/logging.h"
+#include "base/string_util.h"
+
+using std::string;
+
+namespace net {
+
+//-----------------------------------------------------------------------------
+
+// Return the index of the closing quote of the string, if any.
+static size_t FindStringEnd(const string& line, size_t start, char delim) {
+  DCHECK(start < line.length() && line[start] == delim &&
+         (delim == '"' || delim == '\''));
+
+  const char set[] = { delim, '\\', '\0' };
+  for (;;) {
+    // start points to either the start quote or the last
+    // escaped char (the char following a '\\')
+
+    size_t end = line.find_first_of(set, start + 1);
+    if (end == string::npos)
+      return line.length();
+
+    if (line[end] == '\\') {
+      // Hit a backslash-escaped char.  Need to skip over it.
+      start = end + 1;
+      if (start == line.length())
+        return start;
+
+      // Go back to looking for the next escape or the string end
+      continue;
+    }
+
+    return end;
+  }
+
+  NOTREACHED();
+  return line.length();
+}
+
+//-----------------------------------------------------------------------------
+
+// static
+size_t HttpUtil::FindDelimiter(const string& line, size_t search_start,
+                               char delimiter) {
+  do {
+    // search_start points to the spot from which we should start looking
+    // for the delimiter.
+    const char delim_str[] = { delimiter, '"', '\'', '\0' };
+    size_t cur_delim_pos = line.find_first_of(delim_str, search_start);
+    if (cur_delim_pos == string::npos)
+      return line.length();
+
+    char ch = line[cur_delim_pos];
+    if (ch == delimiter) {
+      // Found delimiter
+      return cur_delim_pos;
+    }
+
+    // We hit the start of a quoted string.  Look for its end.
+    search_start = FindStringEnd(line, cur_delim_pos, ch);
+    if (search_start == line.length())
+      return search_start;
+
+    ++search_start;
+
+    // search_start now points to the first char after the end of the
+    // string, so just go back to the top of the loop and look for
+    // |delimiter| again.
+  } while (true);
+
+  NOTREACHED();
+  return line.length();
+}
+
+// static
+void HttpUtil::ParseContentType(const string& content_type_str,
+                                string* mime_type, string* charset,
+                                bool *had_charset) {
+  // Trim leading and trailing whitespace from type.  We include '(' in
+  // the trailing trim set to catch media-type comments, which are not at all
+  // standard, but may occur in rare cases.
+  size_t type_val = content_type_str.find_first_not_of(HTTP_LWS);
+  type_val = std::min(type_val, content_type_str.length());
+  size_t type_end = content_type_str.find_first_of(HTTP_LWS ";(", type_val);
+  if (string::npos == type_end)
+    type_end = content_type_str.length();
+
+  size_t charset_val = 0;
+  size_t charset_end = 0;
+
+  // Iterate over parameters
+  bool type_has_charset = false;
+  size_t param_start = content_type_str.find_first_of(';', type_end);
+  if (param_start != string::npos) {
+    // We have parameters.  Iterate over them.
+    size_t cur_param_start = param_start + 1;
+    do {
+      size_t cur_param_end =
+          FindDelimiter(content_type_str, cur_param_start, ';');
+
+      size_t param_name_start = content_type_str.find_first_not_of(HTTP_LWS,
+          cur_param_start);
+      param_name_start = std::min(param_name_start, cur_param_end);
+
+      static const char charset_str[] = "charset=";
+      size_t charset_end_offset = std::min(param_name_start +
+          sizeof(charset_str) - 1, cur_param_end);
+      if (LowerCaseEqualsASCII(content_type_str.begin() + param_name_start,
+          content_type_str.begin() + charset_end_offset, charset_str)) {
+        charset_val = param_name_start + sizeof(charset_str) - 1;
+        charset_end = cur_param_end;
+        type_has_charset = true;
+      }
+
+      cur_param_start = cur_param_end + 1;
+    } while (cur_param_start < content_type_str.length());
+  }
+
+  if (type_has_charset) {
+    // Trim leading and trailing whitespace from charset_val.  We include
+    // '(' in the trailing trim set to catch media-type comments, which are
+    // not at all standard, but may occur in rare cases.
+    charset_val = content_type_str.find_first_not_of(HTTP_LWS, charset_val);
+    charset_val = std::min(charset_val, charset_end);
+    char first_char = content_type_str[charset_val];
+    if (first_char == '"' || first_char == '\'') {
+      charset_end = FindStringEnd(content_type_str, charset_val, first_char);
+      ++charset_val;
+      DCHECK(charset_end >= charset_val);
+    } else {
+      charset_end = std::min(content_type_str.find_first_of(HTTP_LWS ";(",
+                                                            charset_val),
+                             charset_end);
+    }
+  }
+
+  // if the server sent "*/*", it is meaningless, so do not store it.
+  // also, if type_val is the same as mime_type, then just update the
+  // charset.  however, if charset is empty and mime_type hasn't
+  // changed, then don't wipe-out an existing charset.  We
+  // also want to reject a mime-type if it does not include a slash.
+  // some servers give junk after the charset parameter, which may
+  // include a comma, so this check makes us a bit more tolerant.
+  if (content_type_str.length() != 0 &&
+      content_type_str != "*/*" &&
+      content_type_str.find_first_of('/') != string::npos) {
+    // Common case here is that mime_type is empty
+    bool eq = !mime_type->empty() &&
+        LowerCaseEqualsASCII(content_type_str.begin() + type_val,
+                             content_type_str.begin() + type_end,
+                             mime_type->data());
+    if (!eq) {
+      mime_type->assign(content_type_str.begin() + type_val,
+                        content_type_str.begin() + type_end);
+      StringToLowerASCII(mime_type);
+    }
+    if ((!eq && *had_charset) || type_has_charset) {
+      *had_charset = true;
+      charset->assign(content_type_str.begin() + charset_val,
+                      content_type_str.begin() + charset_end);
+      StringToLowerASCII(charset);
+    }
+  }
+}
+
+// static
+bool HttpUtil::HasHeader(const std::string& headers, const char* name) {
+  size_t name_len = strlen(name);
+  string::const_iterator it =
+      std::search(headers.begin(),
+                  headers.end(),
+                  name,
+                  name + name_len,
+                  CaseInsensitiveCompareASCII<char>());
+  if (it == headers.end())
+    return false;
+
+  // ensure match is prefixed by newline
+  if (it != headers.begin() && it[-1] != '\n')
+    return false;
+
+  // ensure match is suffixed by colon
+  if (it + name_len >= headers.end() || it[name_len] != ':')
+    return false;
+
+  return true;
+}
+
+// static
+bool HttpUtil::IsNonCoalescingHeader(string::const_iterator name_begin,
+                                     string::const_iterator name_end) {
+  // NOTE: "set-cookie2" headers do not support expires attributes, so we don't
+  // have to list them here.
+  const char* kNonCoalescingHeaders[] = {
+    "date",
+    "expires",
+    "last-modified",
+    "location",  // See bug 1050541 for details
+    "retry-after",
+    "set-cookie"
+  };
+  for (size_t i = 0; i < arraysize(kNonCoalescingHeaders); ++i) {
+    if (LowerCaseEqualsASCII(name_begin, name_end, kNonCoalescingHeaders[i]))
+      return true;
+  }
+  return false;
+}
+
+void HttpUtil::TrimLWS(string::const_iterator* begin,
+                       string::const_iterator* end) {
+  // leading whitespace
+  while (*begin < *end && strchr(HTTP_LWS, (*begin)[0]))
+    ++(*begin);
+
+  // trailing whitespace
+  while (*begin < *end && strchr(HTTP_LWS, (*end)[-1]))
+    --(*end);
+}
+
+int HttpUtil::LocateEndOfHeaders(const char* buf, int buf_len) {
+  bool was_lf = false;
+  char last_c = '\0';
+  for (int i = 0; i < buf_len; ++i) {
+    char c = buf[i];
+    if (c == '\n') {
+      if (was_lf)
+        return i + 1;
+      was_lf = true;
+    } else if (c != '\r' || last_c != '\n') {
+      was_lf = false;
+    }
+    last_c = c;
+  }
+  return -1;
+}
+
+std::string HttpUtil::AssembleRawHeaders(const char* buf, int buf_len) {
+  std::string raw_headers;
+
+  // TODO(darin):
+  //   - Handle header line continuations.
+  //   - Be careful about CRs that appear spuriously mid header line.
+
+  int line_start = 0;
+  for (int i = 0; i < buf_len; ++i) {
+    char c = buf[i];
+    if (c == '\r' || c == '\n') {
+      if (line_start != i) {
+        // (line_start,i) is a header line.
+        raw_headers.append(buf + line_start, buf + i);
+        raw_headers.push_back('\0');
+      }
+      line_start = i + 1;
+    }
+  }
+  raw_headers.push_back('\0');
+
+  return raw_headers;
+}
+
+// BNF from section 4.2 of RFC 2616:
+//
+//   message-header = field-name ":" [ field-value ]
+//   field-name     = token
+//   field-value    = *( field-content | LWS )
+//   field-content  = <the OCTETs making up the field-value
+//                     and consisting of either *TEXT or combinations
+//                     of token, separators, and quoted-string>
+//
+
+HttpUtil::HeadersIterator::HeadersIterator(string::const_iterator headers_begin,
+                                           string::const_iterator headers_end,
+                                           const std::string& line_delimiter)
+    : lines_(headers_begin, headers_end, line_delimiter) {
+}
+
+bool HttpUtil::HeadersIterator::GetNext() {
+  while (lines_.GetNext()) {
+    name_begin_ = lines_.token_begin();
+    values_end_ = lines_.token_end();
+
+    string::const_iterator colon = find(name_begin_, values_end_, ':');
+    if (colon == values_end_)
+      continue;  // skip malformed header
+
+    name_end_ = colon;
+    TrimLWS(&name_begin_, &name_end_);
+    if (name_begin_ == name_end_)
+      continue;  // skip malformed header
+
+    values_begin_ = colon + 1;
+    TrimLWS(&values_begin_, &values_end_);
+
+    // if we got a header name, then we are done.
+    return true;
+  }
+  return false;
+}
+
+HttpUtil::ValuesIterator::ValuesIterator(
+    string::const_iterator values_begin,
+    string::const_iterator values_end,
+    char delimiter)
+    : values_(values_begin, values_end, string(1, delimiter)) {
+  values_.set_quote_chars("\'\"");
+}
+
+bool HttpUtil::ValuesIterator::GetNext() {
+  while (values_.GetNext()) {
+    value_begin_ = values_.token_begin();
+    value_end_ = values_.token_end();
+    TrimLWS(&value_begin_, &value_end_);
+
+    // bypass empty values.
+    if (value_begin_ != value_end_)
+      return true;
+  }
+  return false;
+}
+
+}  // namespace net
author	initial.commit <initial.commit@0039d316-1c4b-4281-b951-d872f2087c98>	2008-07-26 22:42:52 +0000
committer	initial.commit <initial.commit@0039d316-1c4b-4281-b951-d872f2087c98>	2008-07-26 22:42:52 +0000
commit	586acc5fe142f498261f52c66862fa417c3d52d2 (patch)
tree	c98b3417a883f2477029c8cd5888f4078681e24e /net/http/http_util.cc
parent	a814a8d55429605fe6d7045045cd25b6bf624580 (diff)
download	chromium_src-586acc5fe142f498261f52c66862fa417c3d52d2.zip chromium_src-586acc5fe142f498261f52c66862fa417c3d52d2.tar.gz chromium_src-586acc5fe142f498261f52c66862fa417c3d52d2.tar.bz2