// Copyright (c) 2012 The Chromium Authors. All rights reserved. // Use of this source code is governed by a BSD-style license that can be // found in the LICENSE file. #ifndef BASE_STRINGS_STRING_SPLIT_H_ #define BASE_STRINGS_STRING_SPLIT_H_ #include #include #include #include "base/base_export.h" #include "base/strings/string16.h" #include "base/strings/string_piece.h" namespace base { enum WhitespaceHandling { KEEP_WHITESPACE, TRIM_WHITESPACE, }; enum SplitResult { // Strictly return all results. // // If the input is ",," and the separator is ',' this will return a // vector of three empty strings. SPLIT_WANT_ALL, // Only nonempty results will be added to the results. Multiple separators // will be coalesced. Separators at the beginning and end of the input will // be ignored. With TRIM_WHITESPACE, whitespace-only results will be dropped. // // If the input is ",," and the separator is ',', this will return an empty // vector. SPLIT_WANT_NONEMPTY, }; // Split the given string on ANY of the given separators, returning copies of // the result. // // To split on either commas or semicolons, keeping all whitespace: // // std::vector tokens = base::SplitString( // input, ",;", base::KEEP_WHITESPACE, base::SPLIT_WANT_ALL); BASE_EXPORT std::vector SplitString( StringPiece input, StringPiece separators, WhitespaceHandling whitespace, SplitResult result_type); BASE_EXPORT std::vector SplitString( StringPiece16 input, StringPiece16 separators, WhitespaceHandling whitespace, SplitResult result_type); // Like SplitString above except it returns a vector of StringPieces which // reference the original buffer without copying. Although you have to be // careful to keep the original string unmodified, this provides an efficient // way to iterate through tokens in a string. // // To iterate through all whitespace-separated tokens in an input string: // // for (const auto& cur : // base::SplitStringPiece(input, base::kWhitespaceASCII, // base::KEEP_WHITESPACE, // base::SPLIT_WANT_NONEMPTY)) { // ... BASE_EXPORT std::vector SplitStringPiece( StringPiece input, StringPiece separators, WhitespaceHandling whitespace, SplitResult result_type); BASE_EXPORT std::vector SplitStringPiece( StringPiece16 input, StringPiece16 separators, WhitespaceHandling whitespace, SplitResult result_type); using StringPairs = std::vector>; // Splits |line| into key value pairs according to the given delimiters and // removes whitespace leading each key and trailing each value. Returns true // only if each pair has a non-empty key and value. |key_value_pairs| will // include ("","") pairs for entries without |key_value_delimiter|. BASE_EXPORT bool SplitStringIntoKeyValuePairs(StringPiece input, char key_value_delimiter, char key_value_pair_delimiter, StringPairs* key_value_pairs); // Similar to SplitString, but use a substring delimiter instead of a list of // characters that are all possible delimiters. // // TODO(brettw) this should probably be changed and expanded to provide a // mirror of the SplitString[Piece] API above, just with the different // delimiter handling. BASE_EXPORT void SplitStringUsingSubstr(StringPiece16 input, StringPiece16 delimiter, std::vector* result); BASE_EXPORT void SplitStringUsingSubstr(StringPiece input, StringPiece delimiter, std::vector* result); // Like SplitStringUsingSubstr above except it returns a vector of StringPieces // which reference the original buffer without copying. Although you have to be // careful to keep the original string unmodified, this provides an efficient // way to iterate through tokens in a string. // // To iterate through all newline-separated tokens in an input string: // // for (const auto& cur : // base::SplitStringUsingSubstr(input, "\r\n", // base::KEEP_WHITESPACE, // base::SPLIT_WANT_NONEMPTY)) { // ... BASE_EXPORT std::vector SplitStringPieceUsingSubstr( StringPiece16 input, StringPiece16 delimiter, WhitespaceHandling whitespace, SplitResult result_type); BASE_EXPORT std::vector SplitStringPieceUsingSubstr( StringPiece input, StringPiece delimiter, WhitespaceHandling whitespace, SplitResult result_type); } // namespace base #endif // BASE_STRINGS_STRING_SPLIT_H_