1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style license that can be 3 // found in the LICENSE file. 4 5 #include "base/strings/string_split.h" 6 7 #include "base/strings/utf_string_conversions.h" 8 #include "testing/gmock/include/gmock/gmock.h" 9 #include "testing/gtest/include/gtest/gtest.h" 10 11 using ::testing::ElementsAre; 12 13 namespace base { 14 15 namespace { 16 17 #if !defined(WCHAR_T_IS_UTF16) 18 // Overload SplitString with a wide-char version to make it easier to 19 // test the string16 version with wide character literals. 20 void SplitString(const std::wstring& str, 21 wchar_t c, 22 std::vector<std::wstring>* result) { 23 std::vector<string16> result16; 24 SplitString(WideToUTF16(str), c, &result16); 25 for (size_t i = 0; i < result16.size(); ++i) 26 result->push_back(UTF16ToWide(result16[i])); 27 } 28 #endif 29 30 } // anonymous namespace 31 32 class SplitStringIntoKeyValuePairsTest : public testing::Test { 33 protected: 34 std::vector<std::pair<std::string, std::string> > kv_pairs; 35 }; 36 37 TEST_F(SplitStringIntoKeyValuePairsTest, EmptyString) { 38 EXPECT_TRUE(SplitStringIntoKeyValuePairs(std::string(), 39 ':', // Key-value delimiter 40 ',', // Key-value pair delimiter 41 &kv_pairs)); 42 EXPECT_TRUE(kv_pairs.empty()); 43 } 44 45 TEST_F(SplitStringIntoKeyValuePairsTest, MissingKeyValueDelimiter) { 46 EXPECT_FALSE(SplitStringIntoKeyValuePairs("key1,key2:value2", 47 ':', // Key-value delimiter 48 ',', // Key-value pair delimiter 49 &kv_pairs)); 50 ASSERT_EQ(2U, kv_pairs.size()); 51 EXPECT_TRUE(kv_pairs[0].first.empty()); 52 EXPECT_TRUE(kv_pairs[0].second.empty()); 53 EXPECT_EQ("key2", kv_pairs[1].first); 54 EXPECT_EQ("value2", kv_pairs[1].second); 55 } 56 57 TEST_F(SplitStringIntoKeyValuePairsTest, EmptyKeyWithKeyValueDelimiter) { 58 EXPECT_TRUE(SplitStringIntoKeyValuePairs(":value1,key2:value2", 59 ':', // Key-value delimiter 60 ',', // Key-value pair delimiter 61 &kv_pairs)); 62 ASSERT_EQ(2U, kv_pairs.size()); 63 EXPECT_TRUE(kv_pairs[0].first.empty()); 64 EXPECT_EQ("value1", kv_pairs[0].second); 65 EXPECT_EQ("key2", kv_pairs[1].first); 66 EXPECT_EQ("value2", kv_pairs[1].second); 67 } 68 69 TEST_F(SplitStringIntoKeyValuePairsTest, TrailingAndLeadingPairDelimiter) { 70 EXPECT_TRUE(SplitStringIntoKeyValuePairs(",key1:value1,key2:value2,", 71 ':', // Key-value delimiter 72 ',', // Key-value pair delimiter 73 &kv_pairs)); 74 ASSERT_EQ(2U, kv_pairs.size()); 75 EXPECT_EQ("key1", kv_pairs[0].first); 76 EXPECT_EQ("value1", kv_pairs[0].second); 77 EXPECT_EQ("key2", kv_pairs[1].first); 78 EXPECT_EQ("value2", kv_pairs[1].second); 79 } 80 81 TEST_F(SplitStringIntoKeyValuePairsTest, EmptyPair) { 82 EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:value1,,key3:value3", 83 ':', // Key-value delimiter 84 ',', // Key-value pair delimiter 85 &kv_pairs)); 86 ASSERT_EQ(2U, kv_pairs.size()); 87 EXPECT_EQ("key1", kv_pairs[0].first); 88 EXPECT_EQ("value1", kv_pairs[0].second); 89 EXPECT_EQ("key3", kv_pairs[1].first); 90 EXPECT_EQ("value3", kv_pairs[1].second); 91 } 92 93 TEST_F(SplitStringIntoKeyValuePairsTest, EmptyValue) { 94 EXPECT_FALSE(SplitStringIntoKeyValuePairs("key1:,key2:value2", 95 ':', // Key-value delimiter 96 ',', // Key-value pair delimiter 97 &kv_pairs)); 98 ASSERT_EQ(2U, kv_pairs.size()); 99 EXPECT_EQ("key1", kv_pairs[0].first); 100 EXPECT_EQ("", kv_pairs[0].second); 101 EXPECT_EQ("key2", kv_pairs[1].first); 102 EXPECT_EQ("value2", kv_pairs[1].second); 103 } 104 105 TEST_F(SplitStringIntoKeyValuePairsTest, UntrimmedWhitespace) { 106 EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1 : value1", 107 ':', // Key-value delimiter 108 ',', // Key-value pair delimiter 109 &kv_pairs)); 110 ASSERT_EQ(1U, kv_pairs.size()); 111 EXPECT_EQ("key1 ", kv_pairs[0].first); 112 EXPECT_EQ(" value1", kv_pairs[0].second); 113 } 114 115 TEST_F(SplitStringIntoKeyValuePairsTest, TrimmedWhitespace) { 116 EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:value1 , key2:value2", 117 ':', // Key-value delimiter 118 ',', // Key-value pair delimiter 119 &kv_pairs)); 120 ASSERT_EQ(2U, kv_pairs.size()); 121 EXPECT_EQ("key1", kv_pairs[0].first); 122 EXPECT_EQ("value1", kv_pairs[0].second); 123 EXPECT_EQ("key2", kv_pairs[1].first); 124 EXPECT_EQ("value2", kv_pairs[1].second); 125 } 126 127 TEST_F(SplitStringIntoKeyValuePairsTest, MultipleKeyValueDelimiters) { 128 EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:::value1,key2:value2", 129 ':', // Key-value delimiter 130 ',', // Key-value pair delimiter 131 &kv_pairs)); 132 ASSERT_EQ(2U, kv_pairs.size()); 133 EXPECT_EQ("key1", kv_pairs[0].first); 134 EXPECT_EQ("value1", kv_pairs[0].second); 135 EXPECT_EQ("key2", kv_pairs[1].first); 136 EXPECT_EQ("value2", kv_pairs[1].second); 137 } 138 139 TEST_F(SplitStringIntoKeyValuePairsTest, OnlySplitAtGivenSeparator) { 140 std::string a("a ?!@#$%^&*()_+:/{}\\\t\nb"); 141 EXPECT_TRUE(SplitStringIntoKeyValuePairs(a + "X" + a + "Y" + a + "X" + a, 142 'X', // Key-value delimiter 143 'Y', // Key-value pair delimiter 144 &kv_pairs)); 145 ASSERT_EQ(2U, kv_pairs.size()); 146 EXPECT_EQ(a, kv_pairs[0].first); 147 EXPECT_EQ(a, kv_pairs[0].second); 148 EXPECT_EQ(a, kv_pairs[1].first); 149 EXPECT_EQ(a, kv_pairs[1].second); 150 } 151 152 153 TEST_F(SplitStringIntoKeyValuePairsTest, DelimiterInValue) { 154 EXPECT_TRUE(SplitStringIntoKeyValuePairs("key1:va:ue1,key2:value2", 155 ':', // Key-value delimiter 156 ',', // Key-value pair delimiter 157 &kv_pairs)); 158 ASSERT_EQ(2U, kv_pairs.size()); 159 EXPECT_EQ("key1", kv_pairs[0].first); 160 EXPECT_EQ("va:ue1", kv_pairs[0].second); 161 EXPECT_EQ("key2", kv_pairs[1].first); 162 EXPECT_EQ("value2", kv_pairs[1].second); 163 } 164 165 TEST(SplitStringUsingSubstrTest, EmptyString) { 166 std::vector<std::string> results; 167 SplitStringUsingSubstr(std::string(), "DELIMITER", &results); 168 ASSERT_EQ(1u, results.size()); 169 EXPECT_THAT(results, ElementsAre("")); 170 } 171 172 TEST(StringUtilTest, SplitString) { 173 std::vector<std::wstring> r; 174 175 SplitString(std::wstring(), L',', &r); 176 EXPECT_EQ(0U, r.size()); 177 r.clear(); 178 179 SplitString(L"a,b,c", L',', &r); 180 ASSERT_EQ(3U, r.size()); 181 EXPECT_EQ(r[0], L"a"); 182 EXPECT_EQ(r[1], L"b"); 183 EXPECT_EQ(r[2], L"c"); 184 r.clear(); 185 186 SplitString(L"a, b, c", L',', &r); 187 ASSERT_EQ(3U, r.size()); 188 EXPECT_EQ(r[0], L"a"); 189 EXPECT_EQ(r[1], L"b"); 190 EXPECT_EQ(r[2], L"c"); 191 r.clear(); 192 193 SplitString(L"a,,c", L',', &r); 194 ASSERT_EQ(3U, r.size()); 195 EXPECT_EQ(r[0], L"a"); 196 EXPECT_EQ(r[1], L""); 197 EXPECT_EQ(r[2], L"c"); 198 r.clear(); 199 200 SplitString(L" ", L'*', &r); 201 EXPECT_EQ(0U, r.size()); 202 r.clear(); 203 204 SplitString(L"foo", L'*', &r); 205 ASSERT_EQ(1U, r.size()); 206 EXPECT_EQ(r[0], L"foo"); 207 r.clear(); 208 209 SplitString(L"foo ,", L',', &r); 210 ASSERT_EQ(2U, r.size()); 211 EXPECT_EQ(r[0], L"foo"); 212 EXPECT_EQ(r[1], L""); 213 r.clear(); 214 215 SplitString(L",", L',', &r); 216 ASSERT_EQ(2U, r.size()); 217 EXPECT_EQ(r[0], L""); 218 EXPECT_EQ(r[1], L""); 219 r.clear(); 220 221 SplitString(L"\t\ta\t", L'\t', &r); 222 ASSERT_EQ(4U, r.size()); 223 EXPECT_EQ(r[0], L""); 224 EXPECT_EQ(r[1], L""); 225 EXPECT_EQ(r[2], L"a"); 226 EXPECT_EQ(r[3], L""); 227 r.clear(); 228 229 SplitString(L"\ta\t\nb\tcc", L'\n', &r); 230 ASSERT_EQ(2U, r.size()); 231 EXPECT_EQ(r[0], L"a"); 232 EXPECT_EQ(r[1], L"b\tcc"); 233 r.clear(); 234 } 235 236 TEST(SplitStringUsingSubstrTest, StringWithNoDelimiter) { 237 std::vector<std::string> results; 238 SplitStringUsingSubstr("alongwordwithnodelimiter", "DELIMITER", &results); 239 ASSERT_EQ(1u, results.size()); 240 EXPECT_THAT(results, ElementsAre("alongwordwithnodelimiter")); 241 } 242 243 TEST(SplitStringUsingSubstrTest, LeadingDelimitersSkipped) { 244 std::vector<std::string> results; 245 SplitStringUsingSubstr( 246 "DELIMITERDELIMITERDELIMITERoneDELIMITERtwoDELIMITERthree", 247 "DELIMITER", 248 &results); 249 ASSERT_EQ(6u, results.size()); 250 EXPECT_THAT(results, ElementsAre("", "", "", "one", "two", "three")); 251 } 252 253 TEST(SplitStringUsingSubstrTest, ConsecutiveDelimitersSkipped) { 254 std::vector<std::string> results; 255 SplitStringUsingSubstr( 256 "unoDELIMITERDELIMITERDELIMITERdosDELIMITERtresDELIMITERDELIMITERcuatro", 257 "DELIMITER", 258 &results); 259 ASSERT_EQ(7u, results.size()); 260 EXPECT_THAT(results, ElementsAre("uno", "", "", "dos", "tres", "", "cuatro")); 261 } 262 263 TEST(SplitStringUsingSubstrTest, TrailingDelimitersSkipped) { 264 std::vector<std::string> results; 265 SplitStringUsingSubstr( 266 "unDELIMITERdeuxDELIMITERtroisDELIMITERquatreDELIMITERDELIMITERDELIMITER", 267 "DELIMITER", 268 &results); 269 ASSERT_EQ(7u, results.size()); 270 EXPECT_THAT( 271 results, ElementsAre("un", "deux", "trois", "quatre", "", "", "")); 272 } 273 274 TEST(StringSplitTest, StringSplitDontTrim) { 275 std::vector<std::string> r; 276 277 SplitStringDontTrim(" ", '*', &r); 278 ASSERT_EQ(1U, r.size()); 279 EXPECT_EQ(r[0], " "); 280 281 SplitStringDontTrim("\t \ta\t ", '\t', &r); 282 ASSERT_EQ(4U, r.size()); 283 EXPECT_EQ(r[0], ""); 284 EXPECT_EQ(r[1], " "); 285 EXPECT_EQ(r[2], "a"); 286 EXPECT_EQ(r[3], " "); 287 288 SplitStringDontTrim("\ta\t\nb\tcc", '\n', &r); 289 ASSERT_EQ(2U, r.size()); 290 EXPECT_EQ(r[0], "\ta\t"); 291 EXPECT_EQ(r[1], "b\tcc"); 292 } 293 294 TEST(StringSplitTest, SplitStringAlongWhitespace) { 295 struct TestData { 296 const char* input; 297 const size_t expected_result_count; 298 const char* output1; 299 const char* output2; 300 } data[] = { 301 { "a", 1, "a", "" }, 302 { " ", 0, "", "" }, 303 { " a", 1, "a", "" }, 304 { " ab ", 1, "ab", "" }, 305 { " ab c", 2, "ab", "c" }, 306 { " ab c ", 2, "ab", "c" }, 307 { " ab cd", 2, "ab", "cd" }, 308 { " ab cd ", 2, "ab", "cd" }, 309 { " \ta\t", 1, "a", "" }, 310 { " b\ta\t", 2, "b", "a" }, 311 { " b\tat", 2, "b", "at" }, 312 { "b\tat", 2, "b", "at" }, 313 { "b\t at", 2, "b", "at" }, 314 }; 315 for (size_t i = 0; i < ARRAYSIZE_UNSAFE(data); ++i) { 316 std::vector<std::string> results; 317 SplitStringAlongWhitespace(data[i].input, &results); 318 ASSERT_EQ(data[i].expected_result_count, results.size()); 319 if (data[i].expected_result_count > 0) 320 ASSERT_EQ(data[i].output1, results[0]); 321 if (data[i].expected_result_count > 1) 322 ASSERT_EQ(data[i].output2, results[1]); 323 } 324 } 325 326 } // namespace base 327