// Copyright (c) 2010 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #ifndef BASE_STRING_SPLIT_H_ #define BASE_STRING_SPLIT_H_ #pragma once #include #include #include #include "base/string16.h" namespace base { // Splits |str| into a vector of strings delimited by |s|. Append the results // into |r| as they appear. If several instances of |s| are contiguous, or if // |str| begins with or ends with |s|, then an empty string is inserted. // // Every substring is trimmed of any leading or trailing white space. // Where wchar_t is char16 (i.e. Windows), |c| must be in BMP // (Basic Multilingual Plane). Elsewhere (Linux/Mac), wchar_t // should be a valid Unicode code point (32-bit). void SplitString(const std::wstring& str, wchar_t c, std::vector* r); // NOTE: |c| must be in BMP (Basic Multilingual Plane) void SplitString(const string16& str, char16 c, std::vector* r); // |str| should not be in a multi-byte encoding like Shift-JIS or GBK in which // the trailing byte of a multi-byte character can be in the ASCII range. // UTF-8, and other single/multi-byte ASCII-compatible encodings are OK. // Note: |c| must be in the ASCII range. void SplitString(const std::string& str, char c, std::vector* r); bool SplitStringIntoKeyValues( const std::string& line, char key_value_delimiter, std::string* key, std::vector* values); bool SplitStringIntoKeyValuePairs( const std::string& line, char key_value_delimiter, char key_value_pair_delimiter, std::vector >* kv_pairs); // The same as SplitString, but use a substring delimiter instead of a char. void SplitStringUsingSubstr(const string16& str, const string16& s, std::vector* r); void SplitStringUsingSubstr(const std::string& str, const std::string& s, std::vector* r); // The same as SplitString, but don't trim white space. // NOTE: |c| must be in BMP (Basic Multilingual Plane) void SplitStringDontTrim(const string16& str, char16 c, std::vector* r); // |str| should not be in a multi-byte encoding like Shift-JIS or GBK in which // the trailing byte of a multi-byte character can be in the ASCII range. // UTF-8, and other single/multi-byte ASCII-compatible encodings are OK. // Note: |c| must be in the ASCII range. void SplitStringDontTrim(const std::string& str, char c, std::vector* r); // WARNING: this uses whitespace as defined by the HTML5 spec. If you need // a function similar to this but want to trim all types of whitespace, then // factor this out into a function that takes a string containing the characters // that are treated as whitespace. // // Splits the string along whitespace (where whitespace is the five space // characters defined by HTML 5). Each contiguous block of non-whitespace // characters is added to result. void SplitStringAlongWhitespace(const std::wstring& str, std::vector* result); void SplitStringAlongWhitespace(const string16& str, std::vector* result); void SplitStringAlongWhitespace(const std::string& str, std::vector* result); } // namespace base #endif // BASE_STRING_SPLIT_H