123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398 |
- // Copyright (c) 2012 The Chromium Authors. All rights reserved.
- // Use of this source code is governed by a BSD-style license that can be
- // found in the LICENSE file.
- #include "butil/strings/string_split.h"
- #include "butil/strings/utf_string_conversions.h"
- #include <gtest/gtest.h>
- namespace butil {
- namespace {
- // Asserts that |result| holds exactly |data_size| strings and that the string
- // at each index equals the C string at the same index of |expected_data|.
- //
- // |result| is only read, so it is taken by const reference. The size is
- // checked first, which keeps every result[i] access below in range. Each
- // element check reports the offending index so a failure can be located
- // without a debugger.
- //
- // NOTE: the checks are fatal (ASSERT_*), which in GoogleTest returns from the
- // current function only, i.e. from this helper and not from the calling test.
- void AssertElements(const std::vector<std::string>& result,
-                     const char* const expected_data[],
-                     size_t data_size) {
-   ASSERT_EQ(data_size, result.size());
-   for (size_t i = 0; i < data_size; ++i) {
-     ASSERT_STREQ(expected_data[i], result[i].c_str())
-         << "mismatch at element index " << i;
-   }
- }
- #if !defined(WCHAR_T_IS_UTF16)
- // Test-only wide-character overload of SplitString, compiled only when
- // WCHAR_T_IS_UTF16 is not defined. It lets the tests drive the string16
- // splitter with ordinary L"..." literals: the input is converted to UTF-16,
- // split there, and every resulting piece is converted back to a wide string
- // and appended to |result|.
- //
- // Note that pieces are appended; this overload itself does not clear |result|.
- void SplitString(const std::wstring& str,
-                  wchar_t c,
-                  std::vector<std::wstring>* result) {
-   std::vector<string16> pieces16;
-   SplitString(WideToUTF16(str), c, &pieces16);
-   for (std::vector<string16>::const_iterator piece = pieces16.begin();
-        piece != pieces16.end(); ++piece) {
-     result->push_back(UTF16ToWide(*piece));
-   }
- }
- #endif
- } // anonymous namespace
- // Fixture for the SplitStringIntoKeyValuePairs tests. It only provides the
- // output container, |kv_pairs|, that every TEST_F below passes to the function
- // under test and then inspects.
- class SplitStringIntoKeyValuePairsTest : public testing::Test {
-  protected:
-   // One parsed entry: .first is the key, .second is the value.
-   typedef std::pair<std::string, std::string> KeyValuePair;
-
-   std::vector<KeyValuePair> kv_pairs;
- };
- // An empty input string is accepted and produces no pairs.
- TEST_F(SplitStringIntoKeyValuePairsTest, EmptyString) {
-   const std::string empty_input;
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(empty_input,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_TRUE(parsed);
-   EXPECT_TRUE(kv_pairs.empty());
- }
- // A pair without a key-value delimiter ("key1") makes the call report
- // failure. The malformed pair is still emitted, with an empty key and an
- // empty value, and the well-formed pair after it is parsed normally.
- TEST_F(SplitStringIntoKeyValuePairsTest, MissingKeyValueDelimiter) {
-   static const char kInput[] = "key1,key2:value2";
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(kInput,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_FALSE(parsed);
-   ASSERT_EQ(2U, kv_pairs.size());
-
-   const std::pair<std::string, std::string>& malformed = kv_pairs[0];
-   EXPECT_TRUE(malformed.first.empty());
-   EXPECT_TRUE(malformed.second.empty());
-
-   const std::pair<std::string, std::string>& well_formed = kv_pairs[1];
-   EXPECT_EQ("key2", well_formed.first);
-   EXPECT_EQ("value2", well_formed.second);
- }
- // A pair that starts with the key-value delimiter (":value1") is accepted:
- // its key is empty and its value is kept.
- TEST_F(SplitStringIntoKeyValuePairsTest, EmptyKeyWithKeyValueDelimiter) {
-   static const char kInput[] = ":value1,key2:value2";
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(kInput,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_TRUE(parsed);
-   ASSERT_EQ(2U, kv_pairs.size());
-
-   const std::pair<std::string, std::string>& keyless = kv_pairs[0];
-   EXPECT_TRUE(keyless.first.empty());
-   EXPECT_EQ("value1", keyless.second);
-
-   const std::pair<std::string, std::string>& regular = kv_pairs[1];
-   EXPECT_EQ("key2", regular.first);
-   EXPECT_EQ("value2", regular.second);
- }
- // Pair delimiters at the very start and very end of the input do not create
- // extra entries: only the two real pairs are returned.
- TEST_F(SplitStringIntoKeyValuePairsTest, TrailingAndLeadingPairDelimiter) {
-   static const char kInput[] = ",key1:value1,key2:value2,";
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(kInput,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_TRUE(parsed);
-   ASSERT_EQ(2U, kv_pairs.size());
-
-   const std::pair<std::string, std::string>& head = kv_pairs[0];
-   EXPECT_EQ("key1", head.first);
-   EXPECT_EQ("value1", head.second);
-
-   const std::pair<std::string, std::string>& tail = kv_pairs[1];
-   EXPECT_EQ("key2", tail.first);
-   EXPECT_EQ("value2", tail.second);
- }
- // Two consecutive pair delimiters (an empty pair in the middle of the input)
- // are skipped: the call succeeds and only the two non-empty pairs come back.
- TEST_F(SplitStringIntoKeyValuePairsTest, EmptyPair) {
-   static const char kInput[] = "key1:value1,,key3:value3";
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(kInput,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_TRUE(parsed);
-   ASSERT_EQ(2U, kv_pairs.size());
-
-   const std::pair<std::string, std::string>& before_gap = kv_pairs[0];
-   EXPECT_EQ("key1", before_gap.first);
-   EXPECT_EQ("value1", before_gap.second);
-
-   const std::pair<std::string, std::string>& after_gap = kv_pairs[1];
-   EXPECT_EQ("key3", after_gap.first);
-   EXPECT_EQ("value3", after_gap.second);
- }
- // A key followed by the delimiter but no value ("key1:") makes the call
- // report failure. The pair is still emitted with its key and an empty value,
- // and the following pair is parsed normally.
- TEST_F(SplitStringIntoKeyValuePairsTest, EmptyValue) {
-   static const char kInput[] = "key1:,key2:value2";
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(kInput,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_FALSE(parsed);
-   ASSERT_EQ(2U, kv_pairs.size());
-
-   const std::pair<std::string, std::string>& valueless = kv_pairs[0];
-   EXPECT_EQ("key1", valueless.first);
-   EXPECT_EQ("", valueless.second);
-
-   const std::pair<std::string, std::string>& complete = kv_pairs[1];
-   EXPECT_EQ("key2", complete.first);
-   EXPECT_EQ("value2", complete.second);
- }
- // Whitespace next to the key-value delimiter is preserved: it stays at the
- // end of the key and at the start of the value.
- TEST_F(SplitStringIntoKeyValuePairsTest, UntrimmedWhitespace) {
-   static const char kInput[] = "key1 : value1";
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(kInput,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_TRUE(parsed);
-   ASSERT_EQ(1U, kv_pairs.size());
-
-   const std::pair<std::string, std::string>& only_pair = kv_pairs[0];
-   EXPECT_EQ("key1 ", only_pair.first);
-   EXPECT_EQ(" value1", only_pair.second);
- }
- // Whitespace next to the pair delimiter is removed: neither the value before
- // the comma nor the key after it carries the surrounding spaces.
- TEST_F(SplitStringIntoKeyValuePairsTest, TrimmedWhitespace) {
-   static const char kInput[] = "key1:value1 , key2:value2";
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(kInput,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_TRUE(parsed);
-   ASSERT_EQ(2U, kv_pairs.size());
-
-   const std::pair<std::string, std::string>& left = kv_pairs[0];
-   EXPECT_EQ("key1", left.first);
-   EXPECT_EQ("value1", left.second);
-
-   const std::pair<std::string, std::string>& right = kv_pairs[1];
-   EXPECT_EQ("key2", right.first);
-   EXPECT_EQ("value2", right.second);
- }
- // A run of key-value delimiters between key and value ("key1:::value1") is
- // treated as a single separator: the value does not start with ':'.
- TEST_F(SplitStringIntoKeyValuePairsTest, MultipleKeyValueDelimiters) {
-   static const char kInput[] = "key1:::value1,key2:value2";
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(kInput,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_TRUE(parsed);
-   ASSERT_EQ(2U, kv_pairs.size());
-
-   const std::pair<std::string, std::string>& repeated = kv_pairs[0];
-   EXPECT_EQ("key1", repeated.first);
-   EXPECT_EQ("value1", repeated.second);
-
-   const std::pair<std::string, std::string>& plain = kv_pairs[1];
-   EXPECT_EQ("key2", plain.first);
-   EXPECT_EQ("value2", plain.second);
- }
- // Only the delimiters passed in ('X' and 'Y') split the input. The token used
- // for every key and value contains punctuation, ':' , a backslash, a tab and
- // a newline, and must come back unchanged in all four positions.
- TEST_F(SplitStringIntoKeyValuePairsTest, OnlySplitAtGivenSeparator) {
-   const std::string token("a ?!@#$%^&*()_+:/{}\\\t\nb");
-   const std::string input = token + "X" + token + "Y" + token + "X" + token;
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(input,
-                                    'X',  // Key-value delimiter
-                                    'Y',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_TRUE(parsed);
-   ASSERT_EQ(2U, kv_pairs.size());
-   for (size_t i = 0; i < kv_pairs.size(); ++i) {
-     EXPECT_EQ(token, kv_pairs[i].first);
-     EXPECT_EQ(token, kv_pairs[i].second);
-   }
- }
- // Only the first key-value delimiter in a pair separates key from value; a
- // later one ("va:ue1") remains part of the value.
- TEST_F(SplitStringIntoKeyValuePairsTest, DelimiterInValue) {
-   static const char kInput[] = "key1:va:ue1,key2:value2";
-   const bool parsed =
-       SplitStringIntoKeyValuePairs(kInput,
-                                    ':',  // Key-value delimiter
-                                    ',',  // Key-value pair delimiter
-                                    &kv_pairs);
-   EXPECT_TRUE(parsed);
-   ASSERT_EQ(2U, kv_pairs.size());
-
-   const std::pair<std::string, std::string>& with_delimiter = kv_pairs[0];
-   EXPECT_EQ("key1", with_delimiter.first);
-   EXPECT_EQ("va:ue1", with_delimiter.second);
-
-   const std::pair<std::string, std::string>& without_delimiter = kv_pairs[1];
-   EXPECT_EQ("key2", without_delimiter.first);
-   EXPECT_EQ("value2", without_delimiter.second);
- }
- // Splitting an empty string yields exactly one element, the empty string.
- TEST(SplitStringUsingSubstrTest, EmptyString) {
-   const char* const expected[] = { "" };
-
-   std::vector<std::string> pieces;
-   SplitStringUsingSubstr(std::string(), "DELIMITER", &pieces);
-
-   AssertElements(pieces, expected, arraysize(expected));
- }
- // Exercises SplitString on wide strings. Each case gets its own output
- // vector so no state is carried from one case to the next.
- TEST(StringUtilTest, SplitString) {
-   // Empty input: no pieces.
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(std::wstring(), L',', &pieces);
-     EXPECT_EQ(0U, pieces.size());
-   }
-
-   // Plain comma-separated list.
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(L"a,b,c", L',', &pieces);
-     ASSERT_EQ(3U, pieces.size());
-     EXPECT_EQ(pieces[0], L"a");
-     EXPECT_EQ(pieces[1], L"b");
-     EXPECT_EQ(pieces[2], L"c");
-   }
-
-   // Whitespace after the separator is stripped from each piece.
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(L"a, b, c", L',', &pieces);
-     ASSERT_EQ(3U, pieces.size());
-     EXPECT_EQ(pieces[0], L"a");
-     EXPECT_EQ(pieces[1], L"b");
-     EXPECT_EQ(pieces[2], L"c");
-   }
-
-   // Adjacent separators produce an empty piece between them.
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(L"a,,c", L',', &pieces);
-     ASSERT_EQ(3U, pieces.size());
-     EXPECT_EQ(pieces[0], L"a");
-     EXPECT_EQ(pieces[1], L"");
-     EXPECT_EQ(pieces[2], L"c");
-   }
-
-   // Whitespace-only input without any separator: no pieces.
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(L" ", L'*', &pieces);
-     EXPECT_EQ(0U, pieces.size());
-   }
-
-   // Input without the separator comes back as a single piece.
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(L"foo", L'*', &pieces);
-     ASSERT_EQ(1U, pieces.size());
-     EXPECT_EQ(pieces[0], L"foo");
-   }
-
-   // A trailing separator adds an empty final piece; the space before it is
-   // stripped from "foo".
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(L"foo ,", L',', &pieces);
-     ASSERT_EQ(2U, pieces.size());
-     EXPECT_EQ(pieces[0], L"foo");
-     EXPECT_EQ(pieces[1], L"");
-   }
-
-   // A lone separator gives two empty pieces.
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(L",", L',', &pieces);
-     ASSERT_EQ(2U, pieces.size());
-     EXPECT_EQ(pieces[0], L"");
-     EXPECT_EQ(pieces[1], L"");
-   }
-
-   // The separator may itself be a whitespace character (tab).
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(L"\t\ta\t", L'\t', &pieces);
-     ASSERT_EQ(4U, pieces.size());
-     EXPECT_EQ(pieces[0], L"");
-     EXPECT_EQ(pieces[1], L"");
-     EXPECT_EQ(pieces[2], L"a");
-     EXPECT_EQ(pieces[3], L"");
-   }
-
-   // Splitting on newline: tabs around a piece are stripped, the tab inside
-   // "b\tcc" is kept.
-   {
-     std::vector<std::wstring> pieces;
-     SplitString(L"\ta\t\nb\tcc", L'\n', &pieces);
-     ASSERT_EQ(2U, pieces.size());
-     EXPECT_EQ(pieces[0], L"a");
-     EXPECT_EQ(pieces[1], L"b\tcc");
-   }
- }
- // Exercises the butil::StringPiece flavour of SplitString with the same cases
- // as the wide-string test. Each case gets its own output vector so no state
- // is carried from one case to the next.
- TEST(StringUtilTest, SplitStringStringPiece) {
-   // Empty input: no pieces.
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece(), ',', &pieces);
-     EXPECT_EQ(0U, pieces.size());
-   }
-
-   // Plain comma-separated list.
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece("a,b,c"), ',', &pieces);
-     ASSERT_EQ(3U, pieces.size());
-     EXPECT_EQ(pieces[0], "a");
-     EXPECT_EQ(pieces[1], "b");
-     EXPECT_EQ(pieces[2], "c");
-   }
-
-   // Whitespace after the separator is stripped from each piece.
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece("a, b, c"), ',', &pieces);
-     ASSERT_EQ(3U, pieces.size());
-     EXPECT_EQ(pieces[0], "a");
-     EXPECT_EQ(pieces[1], "b");
-     EXPECT_EQ(pieces[2], "c");
-   }
-
-   // Adjacent separators produce an empty piece between them.
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece("a,,c"), ',', &pieces);
-     ASSERT_EQ(3U, pieces.size());
-     EXPECT_EQ(pieces[0], "a");
-     EXPECT_EQ(pieces[1], "");
-     EXPECT_EQ(pieces[2], "c");
-   }
-
-   // Whitespace-only input without any separator: no pieces.
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece(" "), '*', &pieces);
-     EXPECT_EQ(0U, pieces.size());
-   }
-
-   // Input without the separator comes back as a single piece.
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece("foo"), '*', &pieces);
-     ASSERT_EQ(1U, pieces.size());
-     EXPECT_EQ(pieces[0], "foo");
-   }
-
-   // A trailing separator adds an empty final piece; the space before it is
-   // stripped from "foo".
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece("foo ,"), ',', &pieces);
-     ASSERT_EQ(2U, pieces.size());
-     EXPECT_EQ(pieces[0], "foo");
-     EXPECT_EQ(pieces[1], "");
-   }
-
-   // A lone separator gives two empty pieces.
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece(","), ',', &pieces);
-     ASSERT_EQ(2U, pieces.size());
-     EXPECT_EQ(pieces[0], "");
-     EXPECT_EQ(pieces[1], "");
-   }
-
-   // The separator may itself be a whitespace character (tab).
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece("\t\ta\t"), '\t', &pieces);
-     ASSERT_EQ(4U, pieces.size());
-     EXPECT_EQ(pieces[0], "");
-     EXPECT_EQ(pieces[1], "");
-     EXPECT_EQ(pieces[2], "a");
-     EXPECT_EQ(pieces[3], "");
-   }
-
-   // Splitting on newline: tabs around a piece are stripped, the tab inside
-   // "b\tcc" is kept.
-   {
-     std::vector<butil::StringPiece> pieces;
-     SplitString(butil::StringPiece("\ta\t\nb\tcc"), '\n', &pieces);
-     ASSERT_EQ(2U, pieces.size());
-     EXPECT_EQ(pieces[0], "a");
-     EXPECT_EQ(pieces[1], "b\tcc");
-   }
- }
- // Input that does not contain the delimiter comes back as one element holding
- // the whole input.
- TEST(SplitStringUsingSubstrTest, StringWithNoDelimiter) {
-   const char* const expected[] = { "alongwordwithnodelimiter" };
-
-   std::vector<std::string> pieces;
-   SplitStringUsingSubstr("alongwordwithnodelimiter", "DELIMITER", &pieces);
-
-   AssertElements(pieces, expected, arraysize(expected));
- }
- // Three delimiters at the start of the input. Despite the test's name, the
- // expected output keeps one empty string per leading delimiter before the
- // three words.
- TEST(SplitStringUsingSubstrTest, LeadingDelimitersSkipped) {
-   const char* const expected[] = { "", "", "", "one", "two", "three" };
-
-   std::vector<std::string> pieces;
-   SplitStringUsingSubstr(
-       "DELIMITERDELIMITERDELIMITERoneDELIMITERtwoDELIMITERthree",
-       "DELIMITER",
-       &pieces);
-
-   AssertElements(pieces, expected, arraysize(expected));
- }
- // Runs of adjacent delimiters in the middle of the input. Despite the test's
- // name, the expected output contains an empty string for every gap between
- // two adjacent delimiters.
- TEST(SplitStringUsingSubstrTest, ConsecutiveDelimitersSkipped) {
-   const char* const expected[] = { "uno", "", "", "dos", "tres", "", "cuatro" };
-
-   std::vector<std::string> pieces;
-   SplitStringUsingSubstr(
-       "unoDELIMITERDELIMITERDELIMITERdosDELIMITERtresDELIMITERDELIMITERcuatro",
-       "DELIMITER",
-       &pieces);
-
-   AssertElements(pieces, expected, arraysize(expected));
- }
- // Three delimiters at the end of the input. Despite the test's name, the
- // expected output ends with one empty string per trailing delimiter.
- TEST(SplitStringUsingSubstrTest, TrailingDelimitersSkipped) {
-   const char* const expected[] = { "un", "deux", "trois", "quatre", "", "", "" };
-
-   std::vector<std::string> pieces;
-   SplitStringUsingSubstr(
-       "unDELIMITERdeuxDELIMITERtroisDELIMITERquatreDELIMITERDELIMITERDELIMITER",
-       "DELIMITER",
-       &pieces);
-
-   AssertElements(pieces, expected, arraysize(expected));
- }
- // SplitStringDontTrim keeps the whitespace inside every piece.
- //
- // The same output vector is reused for all three calls without being cleared
- // in between, so the size assertions (1, 4, 2) also require that each call
- // replaces the previous contents rather than appending to them.
- TEST(StringSplitTest, StringSplitDontTrim) {
-   std::vector<std::string> pieces;
-
-   // No separator present: the whitespace-only input is returned as is.
-   SplitStringDontTrim(" ", '*', &pieces);
-   ASSERT_EQ(1U, pieces.size());
-   EXPECT_EQ(pieces[0], " ");
-
-   // Splitting on tab: spaces inside the pieces survive.
-   SplitStringDontTrim("\t \ta\t ", '\t', &pieces);
-   ASSERT_EQ(4U, pieces.size());
-   EXPECT_EQ(pieces[0], "");
-   EXPECT_EQ(pieces[1], " ");
-   EXPECT_EQ(pieces[2], "a");
-   EXPECT_EQ(pieces[3], " ");
-
-   // Splitting on newline: the tabs around "a" survive.
-   SplitStringDontTrim("\ta\t\nb\tcc", '\n', &pieces);
-   ASSERT_EQ(2U, pieces.size());
-   EXPECT_EQ(pieces[0], "\ta\t");
-   EXPECT_EQ(pieces[1], "b\tcc");
- }
- // Table-driven test for SplitStringAlongWhitespace. Each row gives an input,
- // the number of pieces expected, and the expected first and second piece
- // (checked only when the expected count says they exist).
- //
- // Every iteration installs a SCOPED_TRACE naming the row index and its input,
- // so a failing assertion identifies the row that caused it instead of only
- // the line number shared by all rows.
- TEST(StringSplitTest, SplitStringAlongWhitespace) {
-   struct TestData {
-     const char* input;
-     const size_t expected_result_count;
-     const char* output1;
-     const char* output2;
-   } data[] = {
-     { "a", 1, "a", "" },
-     { " ", 0, "", "" },
-     { " a", 1, "a", "" },
-     { " ab ", 1, "ab", "" },
-     { " ab c", 2, "ab", "c" },
-     { " ab c ", 2, "ab", "c" },
-     { " ab cd", 2, "ab", "cd" },
-     { " ab cd ", 2, "ab", "cd" },
-     { " \ta\t", 1, "a", "" },
-     { " b\ta\t", 2, "b", "a" },
-     { " b\tat", 2, "b", "at" },
-     { "b\tat", 2, "b", "at" },
-     { "b\t at", 2, "b", "at" },
-   };
-   // ARRAYSIZE_UNSAFE is kept from the original because TestData is a local
-   // type.
-   for (size_t i = 0; i < ARRAYSIZE_UNSAFE(data); ++i) {
-     SCOPED_TRACE(testing::Message() << "row " << i << ", input: \""
-                                     << data[i].input << "\"");
-     std::vector<std::string> results;
-     SplitStringAlongWhitespace(data[i].input, &results);
-     ASSERT_EQ(data[i].expected_result_count, results.size());
-     if (data[i].expected_result_count > 0) {
-       ASSERT_EQ(data[i].output1, results[0]);
-     }
-     if (data[i].expected_result_count > 1) {
-       ASSERT_EQ(data[i].output2, results[1]);
-     }
-   }
- }
- } // namespace butil
|