Primiano Tucci | 825e6de | 2018-03-13 05:43:15 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2018 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
Primiano Tucci | 2c5488f | 2019-06-01 03:27:28 +0100 | [diff] [blame] | 17 | #include "perfetto/ext/base/string_splitter.h" |
Primiano Tucci | 825e6de | 2018-03-13 05:43:15 +0000 | [diff] [blame] | 18 | |
| 19 | #include <vector> |
| 20 | |
Primiano Tucci | 919ca1e | 2019-08-21 20:26:58 +0200 | [diff] [blame] | 21 | #include "test/gtest_and_gmock.h" |
Primiano Tucci | 825e6de | 2018-03-13 05:43:15 +0000 | [diff] [blame] | 22 | |
| 23 | namespace perfetto { |
| 24 | namespace base { |
| 25 | namespace { |
| 26 | |
| 27 | using testing::ElementsAreArray; |
| 28 | |
| 29 | TEST(StringSplitterTest, StdString) { |
| 30 | { |
| 31 | StringSplitter ss("", 'x'); |
| 32 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 33 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 34 | EXPECT_FALSE(ss.Next()); |
| 35 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 36 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 37 | } |
| 38 | { |
| 39 | StringSplitter ss(std::string(), 'x'); |
| 40 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 41 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 42 | EXPECT_FALSE(ss.Next()); |
| 43 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 44 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 45 | } |
| 46 | { |
| 47 | StringSplitter ss("a", 'x'); |
| 48 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 49 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 50 | EXPECT_TRUE(ss.Next()); |
| 51 | EXPECT_STREQ("a", ss.cur_token()); |
| 52 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 53 | EXPECT_FALSE(ss.Next()); |
| 54 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 55 | } |
| 56 | { |
| 57 | StringSplitter ss("abc", 'x'); |
| 58 | EXPECT_TRUE(ss.Next()); |
| 59 | EXPECT_STREQ("abc", ss.cur_token()); |
| 60 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 61 | EXPECT_FALSE(ss.Next()); |
| 62 | } |
| 63 | { |
| 64 | StringSplitter ss("ab,", ','); |
| 65 | EXPECT_TRUE(ss.Next()); |
| 66 | EXPECT_STREQ("ab", ss.cur_token()); |
| 67 | EXPECT_EQ(2u, ss.cur_token_size()); |
| 68 | EXPECT_FALSE(ss.Next()); |
| 69 | } |
| 70 | { |
| 71 | StringSplitter ss(",ab,", ','); |
| 72 | EXPECT_TRUE(ss.Next()); |
| 73 | EXPECT_STREQ("ab", ss.cur_token()); |
| 74 | EXPECT_EQ(2u, ss.cur_token_size()); |
| 75 | EXPECT_FALSE(ss.Next()); |
| 76 | } |
| 77 | { |
| 78 | StringSplitter ss("a,b,c", ','); |
| 79 | EXPECT_TRUE(ss.Next()); |
| 80 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 81 | EXPECT_STREQ("a", ss.cur_token()); |
| 82 | |
| 83 | EXPECT_TRUE(ss.Next()); |
| 84 | EXPECT_STREQ("b", ss.cur_token()); |
| 85 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 86 | |
| 87 | EXPECT_TRUE(ss.Next()); |
| 88 | EXPECT_STREQ("c", ss.cur_token()); |
| 89 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 90 | |
| 91 | EXPECT_FALSE(ss.Next()); |
| 92 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 93 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 94 | } |
| 95 | { |
| 96 | StringSplitter ss("a,b,c,", ','); |
| 97 | EXPECT_TRUE(ss.Next()); |
| 98 | EXPECT_STREQ("a", ss.cur_token()); |
| 99 | |
| 100 | EXPECT_TRUE(ss.Next()); |
| 101 | EXPECT_STREQ("b", ss.cur_token()); |
| 102 | |
| 103 | EXPECT_TRUE(ss.Next()); |
| 104 | EXPECT_STREQ("c", ss.cur_token()); |
| 105 | |
| 106 | EXPECT_FALSE(ss.Next()); |
| 107 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 108 | } |
| 109 | { |
| 110 | StringSplitter ss(",,a,,b,,,,c,,,", ','); |
| 111 | EXPECT_TRUE(ss.Next()); |
| 112 | EXPECT_STREQ("a", ss.cur_token()); |
| 113 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 114 | |
| 115 | EXPECT_TRUE(ss.Next()); |
| 116 | EXPECT_STREQ("b", ss.cur_token()); |
| 117 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 118 | |
| 119 | EXPECT_TRUE(ss.Next()); |
| 120 | EXPECT_STREQ("c", ss.cur_token()); |
| 121 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 122 | |
| 123 | for (int i = 0; i < 3; i++) { |
| 124 | EXPECT_FALSE(ss.Next()); |
| 125 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 126 | } |
| 127 | } |
| 128 | { |
| 129 | StringSplitter ss(",,", ','); |
| 130 | for (int i = 0; i < 3; i++) { |
| 131 | EXPECT_FALSE(ss.Next()); |
| 132 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 133 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 134 | } |
| 135 | } |
| 136 | { |
| 137 | StringSplitter ss(",,foo", ','); |
| 138 | EXPECT_TRUE(ss.Next()); |
| 139 | EXPECT_STREQ("foo", ss.cur_token()); |
| 140 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 141 | EXPECT_FALSE(ss.Next()); |
| 142 | } |
| 143 | } |
| 144 | |
| 145 | TEST(StringSplitterTest, CString) { |
| 146 | { |
| 147 | char buf[] = "\0x\0"; |
| 148 | StringSplitter ss(buf, sizeof(buf), ','); |
| 149 | EXPECT_FALSE(ss.Next()); |
| 150 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 151 | } |
| 152 | { |
| 153 | char buf[] = "foo\nbar\n\nbaz\n"; |
| 154 | StringSplitter ss(buf, sizeof(buf), '\n'); |
| 155 | EXPECT_TRUE(ss.Next()); |
| 156 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 157 | EXPECT_STREQ("foo", ss.cur_token()); |
| 158 | |
| 159 | EXPECT_TRUE(ss.Next()); |
| 160 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 161 | EXPECT_STREQ("bar", ss.cur_token()); |
| 162 | |
| 163 | EXPECT_TRUE(ss.Next()); |
| 164 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 165 | EXPECT_STREQ("baz", ss.cur_token()); |
| 166 | |
| 167 | EXPECT_FALSE(ss.Next()); |
| 168 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 169 | } |
| 170 | { |
| 171 | char buf[] = ""; |
| 172 | StringSplitter ss(buf, 0, ','); |
| 173 | EXPECT_FALSE(ss.Next()); |
| 174 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 175 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 176 | } |
| 177 | { |
| 178 | char buf[] = "\0"; |
| 179 | StringSplitter ss(buf, 1, ','); |
| 180 | EXPECT_FALSE(ss.Next()); |
| 181 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 182 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 183 | } |
| 184 | { |
| 185 | char buf[] = ",,foo,bar\0,baz"; |
| 186 | StringSplitter ss(buf, sizeof(buf), ','); |
| 187 | |
| 188 | EXPECT_TRUE(ss.Next()); |
| 189 | EXPECT_STREQ("foo", ss.cur_token()); |
| 190 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 191 | |
| 192 | EXPECT_TRUE(ss.Next()); |
| 193 | EXPECT_STREQ("bar", ss.cur_token()); |
| 194 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 195 | |
| 196 | for (int i = 0; i < 3; i++) { |
| 197 | EXPECT_FALSE(ss.Next()); |
| 198 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 199 | } |
| 200 | } |
| 201 | { |
| 202 | char buf[] = ",,a\0,b,"; |
| 203 | StringSplitter ss(buf, sizeof(buf), ','); |
| 204 | EXPECT_TRUE(ss.Next()); |
| 205 | EXPECT_STREQ("a", ss.cur_token()); |
| 206 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 207 | for (int i = 0; i < 3; i++) { |
| 208 | EXPECT_FALSE(ss.Next()); |
| 209 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 210 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 211 | } |
| 212 | } |
| 213 | { |
| 214 | char buf[] = ",a,\0b"; |
| 215 | StringSplitter ss(buf, sizeof(buf), ','); |
| 216 | EXPECT_TRUE(ss.Next()); |
| 217 | EXPECT_STREQ("a", ss.cur_token()); |
| 218 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 219 | for (int i = 0; i < 3; i++) { |
| 220 | EXPECT_FALSE(ss.Next()); |
| 221 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 222 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 223 | } |
| 224 | } |
| 225 | { |
| 226 | char buf[] = ",a\0\0,x\0\0b"; |
| 227 | StringSplitter ss(buf, sizeof(buf), ','); |
| 228 | EXPECT_TRUE(ss.Next()); |
| 229 | EXPECT_STREQ("a", ss.cur_token()); |
| 230 | EXPECT_EQ(1u, ss.cur_token_size()); |
| 231 | for (int i = 0; i < 3; i++) { |
| 232 | EXPECT_FALSE(ss.Next()); |
| 233 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 234 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 235 | } |
| 236 | } |
| 237 | } |
| 238 | |
| 239 | TEST(StringSplitterTest, SplitOnNUL) { |
| 240 | { |
| 241 | StringSplitter ss(std::string(""), '\0'); |
| 242 | EXPECT_FALSE(ss.Next()); |
| 243 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 244 | } |
| 245 | { |
| 246 | std::string str; |
| 247 | str.resize(48); |
| 248 | memcpy(&str[0], "foo\0", 4); |
| 249 | memcpy(&str[4], "bar\0", 4); |
| 250 | memcpy(&str[20], "baz", 3); |
| 251 | StringSplitter ss(std::move(str), '\0'); |
| 252 | EXPECT_TRUE(ss.Next()); |
| 253 | EXPECT_STREQ("foo", ss.cur_token()); |
| 254 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 255 | |
| 256 | EXPECT_TRUE(ss.Next()); |
| 257 | EXPECT_STREQ("bar", ss.cur_token()); |
| 258 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 259 | |
| 260 | EXPECT_TRUE(ss.Next()); |
| 261 | EXPECT_STREQ("baz", ss.cur_token()); |
| 262 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 263 | |
| 264 | for (int i = 0; i < 3; i++) { |
| 265 | EXPECT_FALSE(ss.Next()); |
| 266 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 267 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 268 | } |
| 269 | } |
| 270 | { |
| 271 | char buf[] = "foo\0bar\0baz\0"; |
| 272 | StringSplitter ss(buf, sizeof(buf), '\0'); |
| 273 | EXPECT_TRUE(ss.Next()); |
| 274 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 275 | EXPECT_STREQ("foo", ss.cur_token()); |
| 276 | |
| 277 | EXPECT_TRUE(ss.Next()); |
| 278 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 279 | EXPECT_STREQ("bar", ss.cur_token()); |
| 280 | |
| 281 | EXPECT_TRUE(ss.Next()); |
| 282 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 283 | EXPECT_STREQ("baz", ss.cur_token()); |
| 284 | |
| 285 | for (int i = 0; i < 3; i++) { |
| 286 | EXPECT_FALSE(ss.Next()); |
| 287 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 288 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 289 | } |
| 290 | } |
| 291 | { |
| 292 | char buf[] = "\0\0foo\0\0\0\0bar\0baz\0\0"; |
| 293 | StringSplitter ss(buf, sizeof(buf), '\0'); |
| 294 | EXPECT_TRUE(ss.Next()); |
| 295 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 296 | EXPECT_STREQ("foo", ss.cur_token()); |
| 297 | |
| 298 | EXPECT_TRUE(ss.Next()); |
| 299 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 300 | EXPECT_STREQ("bar", ss.cur_token()); |
| 301 | |
| 302 | EXPECT_TRUE(ss.Next()); |
| 303 | EXPECT_EQ(3u, ss.cur_token_size()); |
| 304 | EXPECT_STREQ("baz", ss.cur_token()); |
| 305 | |
| 306 | for (int i = 0; i < 3; i++) { |
| 307 | EXPECT_FALSE(ss.Next()); |
| 308 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 309 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 310 | } |
| 311 | } |
| 312 | { |
| 313 | char buf[] = ""; |
| 314 | StringSplitter ss(buf, 0, '\0'); |
| 315 | for (int i = 0; i < 3; i++) { |
| 316 | EXPECT_FALSE(ss.Next()); |
| 317 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 318 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 319 | } |
| 320 | } |
| 321 | { |
| 322 | char buf[] = "\0"; |
| 323 | StringSplitter ss(buf, 1, '\0'); |
| 324 | for (int i = 0; i < 3; i++) { |
| 325 | EXPECT_FALSE(ss.Next()); |
| 326 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 327 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 328 | } |
| 329 | } |
| 330 | { |
| 331 | char buf[] = "\0\0"; |
| 332 | StringSplitter ss(buf, 2, '\0'); |
| 333 | for (int i = 0; i < 3; i++) { |
| 334 | EXPECT_FALSE(ss.Next()); |
| 335 | EXPECT_EQ(0u, ss.cur_token_size()); |
| 336 | EXPECT_EQ(nullptr, ss.cur_token()); |
| 337 | } |
| 338 | } |
| 339 | } |
| 340 | |
| 341 | TEST(StringSplitterTest, NestedUsage) { |
| 342 | char text[] = R"( |
| 343 | l1w1 l1w2 l1w3 |
| 344 | |
| 345 | ,l,2,w,1 l,2,,w,,2,, |
| 346 | )"; |
| 347 | std::vector<std::string> all_lines; |
| 348 | std::vector<std::string> all_words; |
| 349 | std::vector<std::string> all_tokens; |
| 350 | for (StringSplitter lines(text, sizeof(text), '\n'); lines.Next();) { |
| 351 | all_lines.push_back(lines.cur_token()); |
| 352 | for (StringSplitter words(&lines, ' '); words.Next();) { |
| 353 | all_words.push_back(words.cur_token()); |
| 354 | for (StringSplitter tokens(&words, ','); tokens.Next();) { |
| 355 | all_tokens.push_back(tokens.cur_token()); |
| 356 | } |
| 357 | } |
| 358 | } |
| 359 | EXPECT_THAT(all_lines, |
| 360 | ElementsAreArray({"l1w1 l1w2 l1w3", ",l,2,w,1 l,2,,w,,2,,"})); |
| 361 | EXPECT_THAT(all_words, ElementsAreArray({"l1w1", "l1w2", "l1w3", ",l,2,w,1", |
| 362 | "l,2,,w,,2,,"})); |
| 363 | EXPECT_THAT(all_tokens, ElementsAreArray({"l1w1", "l1w2", "l1w3", "l", "2", |
| 364 | "w", "1", "l", "2", "w", "2"})); |
| 365 | } // namespace |
| 366 | |
| 367 | } // namespace |
| 368 | } // namespace base |
| 369 | } // namespace perfetto |