399 lines
13 KiB
C++
399 lines
13 KiB
C++
// Copyright (c) 2012 The Chromium Authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
// found in the LICENSE file.
|
|
|
|
#include "butil/strings/string_split.h"
|
|
|
|
#include "butil/strings/utf_string_conversions.h"
|
|
#include <gtest/gtest.h>
|
|
|
|
namespace butil {
|
|
|
|
namespace {
|
|
|
|
void AssertElements(std::vector<std::string>& result,
|
|
const char* const expected_data[],
|
|
size_t data_size) {
|
|
ASSERT_EQ(data_size, result.size());
|
|
for (size_t i = 0; i < data_size; ++i) {
|
|
ASSERT_STREQ(expected_data[i], result[i].c_str());
|
|
}
|
|
}
|
|
|
|
#if !defined(WCHAR_T_IS_UTF16)
|
|
// Overload SplitString with a wide-char version to make it easier to
|
|
// test the string16 version with wide character literals.
|
|
void SplitString(const std::wstring& str,
|
|
wchar_t c,
|
|
std::vector<std::wstring>* result) {
|
|
std::vector<string16> result16;
|
|
SplitString(WideToUTF16(str), c, &result16);
|
|
for (size_t i = 0; i < result16.size(); ++i)
|
|
result->push_back(UTF16ToWide(result16[i]));
|
|
}
|
|
#endif
|
|
|
|
} // anonymous namespace
|
|
|
|
class SplitStringIntoKeyValuePairsTest : public testing::Test {
|
|
protected:
|
|
std::vector<std::pair<std::string, std::string> > kv_pairs;
|
|
};
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, EmptyString) {
|
|
EXPECT_TRUE(SplitStringIntoKeyValuePairs(std::string(),
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
EXPECT_TRUE(kv_pairs.empty());
|
|
}
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, MissingKeyValueDelimiter) {
|
|
EXPECT_FALSE(SplitStringIntoKeyValuePairs("key1,key2:value2",
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(2U, kv_pairs.size());
|
|
EXPECT_TRUE(kv_pairs[0].first.empty());
|
|
EXPECT_TRUE(kv_pairs[0].second.empty());
|
|
EXPECT_EQ("key2", kv_pairs[1].first);
|
|
EXPECT_EQ("value2", kv_pairs[1].second);
|
|
}
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, EmptyKeyWithKeyValueDelimiter) {
|
|
EXPECT_TRUE(SplitStringIntoKeyValuePairs(":value1,key2:value2",
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(2U, kv_pairs.size());
|
|
EXPECT_TRUE(kv_pairs[0].first.empty());
|
|
EXPECT_EQ("value1", kv_pairs[0].second);
|
|
EXPECT_EQ("key2", kv_pairs[1].first);
|
|
EXPECT_EQ("value2", kv_pairs[1].second);
|
|
}
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, TrailingAndLeadingPairDelimiter) {
|
|
EXPECT_TRUE(SplitStringIntoKeyValuePairs(",key1:value1,key2:value2,",
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(2U, kv_pairs.size());
|
|
EXPECT_EQ("key1", kv_pairs[0].first);
|
|
EXPECT_EQ("value1", kv_pairs[0].second);
|
|
EXPECT_EQ("key2", kv_pairs[1].first);
|
|
EXPECT_EQ("value2", kv_pairs[1].second);
|
|
}
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, EmptyPair) {
|
|
EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:value1,,key3:value3",
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(2U, kv_pairs.size());
|
|
EXPECT_EQ("key1", kv_pairs[0].first);
|
|
EXPECT_EQ("value1", kv_pairs[0].second);
|
|
EXPECT_EQ("key3", kv_pairs[1].first);
|
|
EXPECT_EQ("value3", kv_pairs[1].second);
|
|
}
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, EmptyValue) {
|
|
EXPECT_FALSE(SplitStringIntoKeyValuePairs("key1:,key2:value2",
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(2U, kv_pairs.size());
|
|
EXPECT_EQ("key1", kv_pairs[0].first);
|
|
EXPECT_EQ("", kv_pairs[0].second);
|
|
EXPECT_EQ("key2", kv_pairs[1].first);
|
|
EXPECT_EQ("value2", kv_pairs[1].second);
|
|
}
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, UntrimmedWhitespace) {
|
|
EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1 : value1",
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(1U, kv_pairs.size());
|
|
EXPECT_EQ("key1 ", kv_pairs[0].first);
|
|
EXPECT_EQ(" value1", kv_pairs[0].second);
|
|
}
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, TrimmedWhitespace) {
|
|
EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:value1 , key2:value2",
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(2U, kv_pairs.size());
|
|
EXPECT_EQ("key1", kv_pairs[0].first);
|
|
EXPECT_EQ("value1", kv_pairs[0].second);
|
|
EXPECT_EQ("key2", kv_pairs[1].first);
|
|
EXPECT_EQ("value2", kv_pairs[1].second);
|
|
}
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, MultipleKeyValueDelimiters) {
|
|
EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:::value1,key2:value2",
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(2U, kv_pairs.size());
|
|
EXPECT_EQ("key1", kv_pairs[0].first);
|
|
EXPECT_EQ("value1", kv_pairs[0].second);
|
|
EXPECT_EQ("key2", kv_pairs[1].first);
|
|
EXPECT_EQ("value2", kv_pairs[1].second);
|
|
}
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, OnlySplitAtGivenSeparator) {
|
|
std::string a("a ?!@#$%^&*()_+:/{}\\\t\nb");
|
|
EXPECT_TRUE(SplitStringIntoKeyValuePairs(a + "X" + a + "Y" + a + "X" + a,
|
|
'X', // Key-value delimiter
|
|
'Y', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(2U, kv_pairs.size());
|
|
EXPECT_EQ(a, kv_pairs[0].first);
|
|
EXPECT_EQ(a, kv_pairs[0].second);
|
|
EXPECT_EQ(a, kv_pairs[1].first);
|
|
EXPECT_EQ(a, kv_pairs[1].second);
|
|
}
|
|
|
|
|
|
TEST_F(SplitStringIntoKeyValuePairsTest, DelimiterInValue) {
|
|
EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:va:ue1,key2:value2",
|
|
':', // Key-value delimiter
|
|
',', // Key-value pair delimiter
|
|
&kv_pairs));
|
|
ASSERT_EQ(2U, kv_pairs.size());
|
|
EXPECT_EQ("key1", kv_pairs[0].first);
|
|
EXPECT_EQ("va:ue1", kv_pairs[0].second);
|
|
EXPECT_EQ("key2", kv_pairs[1].first);
|
|
EXPECT_EQ("value2", kv_pairs[1].second);
|
|
}
|
|
|
|
TEST(SplitStringUsingSubstrTest, EmptyString) {
|
|
std::vector<std::string> results;
|
|
SplitStringUsingSubstr(std::string(), "DELIMITER", &results);
|
|
const char* const expected[] = { "" };
|
|
AssertElements(results, expected, arraysize(expected));
|
|
}
|
|
|
|
TEST(StringUtilTest, SplitString) {
|
|
std::vector<std::wstring> r;
|
|
|
|
SplitString(std::wstring(), L',', &r);
|
|
EXPECT_EQ(0U, r.size());
|
|
r.clear();
|
|
|
|
SplitString(L"a,b,c", L',', &r);
|
|
ASSERT_EQ(3U, r.size());
|
|
EXPECT_EQ(r[0], L"a");
|
|
EXPECT_EQ(r[1], L"b");
|
|
EXPECT_EQ(r[2], L"c");
|
|
r.clear();
|
|
|
|
SplitString(L"a, b, c", L',', &r);
|
|
ASSERT_EQ(3U, r.size());
|
|
EXPECT_EQ(r[0], L"a");
|
|
EXPECT_EQ(r[1], L"b");
|
|
EXPECT_EQ(r[2], L"c");
|
|
r.clear();
|
|
|
|
SplitString(L"a,,c", L',', &r);
|
|
ASSERT_EQ(3U, r.size());
|
|
EXPECT_EQ(r[0], L"a");
|
|
EXPECT_EQ(r[1], L"");
|
|
EXPECT_EQ(r[2], L"c");
|
|
r.clear();
|
|
|
|
SplitString(L" ", L'*', &r);
|
|
EXPECT_EQ(0U, r.size());
|
|
r.clear();
|
|
|
|
SplitString(L"foo", L'*', &r);
|
|
ASSERT_EQ(1U, r.size());
|
|
EXPECT_EQ(r[0], L"foo");
|
|
r.clear();
|
|
|
|
SplitString(L"foo ,", L',', &r);
|
|
ASSERT_EQ(2U, r.size());
|
|
EXPECT_EQ(r[0], L"foo");
|
|
EXPECT_EQ(r[1], L"");
|
|
r.clear();
|
|
|
|
SplitString(L",", L',', &r);
|
|
ASSERT_EQ(2U, r.size());
|
|
EXPECT_EQ(r[0], L"");
|
|
EXPECT_EQ(r[1], L"");
|
|
r.clear();
|
|
|
|
SplitString(L"\t\ta\t", L'\t', &r);
|
|
ASSERT_EQ(4U, r.size());
|
|
EXPECT_EQ(r[0], L"");
|
|
EXPECT_EQ(r[1], L"");
|
|
EXPECT_EQ(r[2], L"a");
|
|
EXPECT_EQ(r[3], L"");
|
|
r.clear();
|
|
|
|
SplitString(L"\ta\t\nb\tcc", L'\n', &r);
|
|
ASSERT_EQ(2U, r.size());
|
|
EXPECT_EQ(r[0], L"a");
|
|
EXPECT_EQ(r[1], L"b\tcc");
|
|
r.clear();
|
|
}
|
|
|
|
TEST(StringUtilTest, SplitStringStringPiece) {
|
|
std::vector<butil::StringPiece> r;
|
|
|
|
SplitString(butil::StringPiece(), ',', &r);
|
|
EXPECT_EQ(0U, r.size());
|
|
r.clear();
|
|
|
|
SplitString(butil::StringPiece("a,b,c"), ',', &r);
|
|
ASSERT_EQ(3U, r.size());
|
|
EXPECT_EQ(r[0], "a");
|
|
EXPECT_EQ(r[1], "b");
|
|
EXPECT_EQ(r[2], "c");
|
|
r.clear();
|
|
|
|
SplitString(butil::StringPiece("a, b, c"), ',', &r);
|
|
ASSERT_EQ(3U, r.size());
|
|
EXPECT_EQ(r[0], "a");
|
|
EXPECT_EQ(r[1], "b");
|
|
EXPECT_EQ(r[2], "c");
|
|
r.clear();
|
|
|
|
SplitString(butil::StringPiece("a,,c"), ',', &r);
|
|
ASSERT_EQ(3U, r.size());
|
|
EXPECT_EQ(r[0], "a");
|
|
EXPECT_EQ(r[1], "");
|
|
EXPECT_EQ(r[2], "c");
|
|
r.clear();
|
|
|
|
SplitString(butil::StringPiece(" "), '*', &r);
|
|
EXPECT_EQ(0U, r.size());
|
|
r.clear();
|
|
|
|
SplitString(butil::StringPiece("foo"), '*', &r);
|
|
ASSERT_EQ(1U, r.size());
|
|
EXPECT_EQ(r[0], "foo");
|
|
r.clear();
|
|
|
|
SplitString(butil::StringPiece("foo ,"), ',', &r);
|
|
ASSERT_EQ(2U, r.size());
|
|
EXPECT_EQ(r[0], "foo");
|
|
EXPECT_EQ(r[1], "");
|
|
r.clear();
|
|
|
|
SplitString(butil::StringPiece(","), ',', &r);
|
|
ASSERT_EQ(2U, r.size());
|
|
EXPECT_EQ(r[0], "");
|
|
EXPECT_EQ(r[1], "");
|
|
r.clear();
|
|
|
|
SplitString(butil::StringPiece("\t\ta\t"), '\t', &r);
|
|
ASSERT_EQ(4U, r.size());
|
|
EXPECT_EQ(r[0], "");
|
|
EXPECT_EQ(r[1], "");
|
|
EXPECT_EQ(r[2], "a");
|
|
EXPECT_EQ(r[3], "");
|
|
r.clear();
|
|
|
|
SplitString(butil::StringPiece("\ta\t\nb\tcc"), '\n', &r);
|
|
ASSERT_EQ(2U, r.size());
|
|
EXPECT_EQ(r[0], "a");
|
|
EXPECT_EQ(r[1], "b\tcc");
|
|
r.clear();
|
|
}
|
|
|
|
TEST(SplitStringUsingSubstrTest, StringWithNoDelimiter) {
|
|
std::vector<std::string> results;
|
|
SplitStringUsingSubstr("alongwordwithnodelimiter", "DELIMITER", &results);
|
|
const char* const expected[] = { "alongwordwithnodelimiter" };
|
|
AssertElements(results, expected, arraysize(expected));
|
|
}
|
|
|
|
TEST(SplitStringUsingSubstrTest, LeadingDelimitersSkipped) {
|
|
std::vector<std::string> results;
|
|
SplitStringUsingSubstr(
|
|
"DELIMITERDELIMITERDELIMITERoneDELIMITERtwoDELIMITERthree",
|
|
"DELIMITER",
|
|
&results);
|
|
const char* const expected[] = { "", "", "", "one", "two", "three" };
|
|
AssertElements(results, expected, arraysize(expected));
|
|
}
|
|
|
|
TEST(SplitStringUsingSubstrTest, ConsecutiveDelimitersSkipped) {
|
|
std::vector<std::string> results;
|
|
SplitStringUsingSubstr(
|
|
"unoDELIMITERDELIMITERDELIMITERdosDELIMITERtresDELIMITERDELIMITERcuatro",
|
|
"DELIMITER",
|
|
&results);
|
|
const char* const expected[] = { "uno", "", "", "dos", "tres", "", "cuatro" };
|
|
AssertElements(results, expected, arraysize(expected));
|
|
|
|
}
|
|
|
|
TEST(SplitStringUsingSubstrTest, TrailingDelimitersSkipped) {
|
|
std::vector<std::string> results;
|
|
SplitStringUsingSubstr(
|
|
"unDELIMITERdeuxDELIMITERtroisDELIMITERquatreDELIMITERDELIMITERDELIMITER",
|
|
"DELIMITER",
|
|
&results);
|
|
const char* const expected[] = { "un", "deux", "trois", "quatre", "", "", "" };
|
|
AssertElements(results, expected, arraysize(expected));
|
|
}
|
|
|
|
TEST(StringSplitTest, StringSplitDontTrim) {
|
|
std::vector<std::string> r;
|
|
|
|
SplitStringDontTrim(" ", '*', &r);
|
|
ASSERT_EQ(1U, r.size());
|
|
EXPECT_EQ(r[0], " ");
|
|
|
|
SplitStringDontTrim("\t \ta\t ", '\t', &r);
|
|
ASSERT_EQ(4U, r.size());
|
|
EXPECT_EQ(r[0], "");
|
|
EXPECT_EQ(r[1], " ");
|
|
EXPECT_EQ(r[2], "a");
|
|
EXPECT_EQ(r[3], " ");
|
|
|
|
SplitStringDontTrim("\ta\t\nb\tcc", '\n', &r);
|
|
ASSERT_EQ(2U, r.size());
|
|
EXPECT_EQ(r[0], "\ta\t");
|
|
EXPECT_EQ(r[1], "b\tcc");
|
|
}
|
|
|
|
TEST(StringSplitTest, SplitStringAlongWhitespace) {
|
|
struct TestData {
|
|
const char* input;
|
|
const size_t expected_result_count;
|
|
const char* output1;
|
|
const char* output2;
|
|
} data[] = {
|
|
{ "a", 1, "a", "" },
|
|
{ " ", 0, "", "" },
|
|
{ " a", 1, "a", "" },
|
|
{ " ab ", 1, "ab", "" },
|
|
{ " ab c", 2, "ab", "c" },
|
|
{ " ab c ", 2, "ab", "c" },
|
|
{ " ab cd", 2, "ab", "cd" },
|
|
{ " ab cd ", 2, "ab", "cd" },
|
|
{ " \ta\t", 1, "a", "" },
|
|
{ " b\ta\t", 2, "b", "a" },
|
|
{ " b\tat", 2, "b", "at" },
|
|
{ "b\tat", 2, "b", "at" },
|
|
{ "b\t at", 2, "b", "at" },
|
|
};
|
|
for (size_t i = 0; i < ARRAYSIZE_UNSAFE(data); ++i) {
|
|
std::vector<std::string> results;
|
|
SplitStringAlongWhitespace(data[i].input, &results);
|
|
ASSERT_EQ(data[i].expected_result_count, results.size());
|
|
if (data[i].expected_result_count > 0) {
|
|
ASSERT_EQ(data[i].output1, results[0]);
|
|
}
|
|
if (data[i].expected_result_count > 1) {
|
|
ASSERT_EQ(data[i].output2, results[1]);
|
|
}
|
|
}
|
|
}
|
|
|
|
} // namespace butil
|