2 * Copyright 2016 Facebook, Inc.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
17 #include <folly/String.h>
19 #include <boost/regex.hpp>
20 #include <gtest/gtest.h>
22 #include <folly/Array.h>
24 using namespace folly;
27 TEST(StringPrintf, BasicTest) {
28 EXPECT_EQ("abc", stringPrintf("%s", "abc"));
29 EXPECT_EQ("abc", stringPrintf("%sbc", "a"));
30 EXPECT_EQ("abc", stringPrintf("a%sc", "b"));
31 EXPECT_EQ("abc", stringPrintf("ab%s", "c"));
33 EXPECT_EQ("abc", stringPrintf("abc"));
36 TEST(StringPrintf, NumericFormats) {
37 EXPECT_EQ("12", stringPrintf("%d", 12));
38 EXPECT_EQ("2000000000", stringPrintf("%ld", 2000000000UL));
39 EXPECT_EQ("2000000000", stringPrintf("%ld", 2000000000L));
40 EXPECT_EQ("-2000000000", stringPrintf("%ld", -2000000000L));
41 EXPECT_EQ("5000000000", stringPrintf("%lld", 5000000000ULL));
42 EXPECT_EQ("5000000000", stringPrintf("%lld", 5000000000LL));
43 EXPECT_EQ("-5000000000", stringPrintf("%lld", -5000000000LL));
44 EXPECT_EQ("-1", stringPrintf("%d", 0xffffffff));
45 EXPECT_EQ("-1", stringPrintf("%" PRId64, 0xffffffffffffffff));
46 EXPECT_EQ("-1", stringPrintf("%" PRId64, 0xffffffffffffffffUL));
48 EXPECT_EQ("7.7", stringPrintf("%1.1f", 7.7));
49 EXPECT_EQ("7.7", stringPrintf("%1.1lf", 7.7));
50 EXPECT_EQ("7.70000000000000018",
51 stringPrintf("%.17f", 7.7));
52 EXPECT_EQ("7.70000000000000018",
53 stringPrintf("%.17lf", 7.7));
56 TEST(StringPrintf, Appending) {
58 stringAppendf(&s, "a%s", "b");
59 stringAppendf(&s, "%c", 'c');
61 stringAppendf(&s, " %d", 123);
62 EXPECT_EQ(s, "abc 123");
65 void vprintfCheck(const char* expected, const char* fmt, ...) {
67 va_start(apOrig, fmt);
77 // Check both APIs for calling stringVPrintf()
78 EXPECT_EQ(expected, stringVPrintf(fmt, ap));
83 stringVPrintf(&out, fmt, ap);
86 EXPECT_EQ(expected, out);
88 // Check stringVAppendf() as well
89 std::string prefix = "foobar";
91 EXPECT_EQ(prefix + expected, stringVAppendf(&out, fmt, ap));
96 void vprintfError(const char* fmt, ...) {
103 // OSX's sprintf family does not return a negative number on a bad format
104 // string, but Linux does. It's unclear to me which behavior is more
106 #ifdef HAVE_VSNPRINTF_ERRORS
107 EXPECT_THROW({stringVPrintf(fmt, ap);},
112 TEST(StringPrintf, VPrintf) {
113 vprintfCheck("foo", "%s", "foo");
114 vprintfCheck("long string requiring reallocation 1 2 3 0x12345678",
115 "%s %s %d %d %d %#x",
116 "long string", "requiring reallocation", 1, 2, 3, 0x12345678);
117 vprintfError("bogus%", "foo");
120 TEST(StringPrintf, VariousSizes) {
121 // Test a wide variety of output sizes, making sure to cross the
122 // vsnprintf buffer boundary implementation detail.
123 for (int i = 0; i < 4096; ++i) {
124 string expected(i + 1, 'a');
125 expected = "X" + expected + "X";
126 string result = stringPrintf("%s", expected.c_str());
127 EXPECT_EQ(expected.size(), result.size());
128 EXPECT_EQ(expected, result);
131 EXPECT_EQ("abc12345678910111213141516171819202122232425xyz",
132 stringPrintf("abc%d%d%d%d%d%d%d%d%d%d%d%d%d%d"
133 "%d%d%d%d%d%d%d%d%d%d%dxyz",
134 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16,
135 17, 18, 19, 20, 21, 22, 23, 24, 25));
138 TEST(StringPrintf, oldStringPrintfTests) {
139 EXPECT_EQ(string("a/b/c/d"),
140 stringPrintf("%s/%s/%s/%s", "a", "b", "c", "d"));
142 EXPECT_EQ(string(" 5 10"),
143 stringPrintf("%5d %5d", 5, 10));
145 // check printing w/ a big buffer
146 for (int size = (1 << 8); size <= (1 << 15); size <<= 1) {
148 string b = stringPrintf("%s", a.c_str());
149 EXPECT_EQ(a.size(), b.size());
153 TEST(StringPrintf, oldStringAppendf) {
155 stringAppendf(&s, "%s/%s/%s/%s", "a", "b", "c", "d");
156 EXPECT_EQ(string("helloa/b/c/d"), s);
159 TEST(Escape, cEscape) {
160 EXPECT_EQ("hello world", cEscape<std::string>("hello world"));
161 EXPECT_EQ("hello \\\\world\\\" goodbye",
162 cEscape<std::string>("hello \\world\" goodbye"));
163 EXPECT_EQ("hello\\nworld", cEscape<std::string>("hello\nworld"));
164 EXPECT_EQ("hello\\377\\376", cEscape<std::string>("hello\xff\xfe"));
167 TEST(Escape, cUnescape) {
168 EXPECT_EQ("hello world", cUnescape<std::string>("hello world"));
169 EXPECT_EQ("hello \\world\" goodbye",
170 cUnescape<std::string>("hello \\\\world\\\" goodbye"));
171 EXPECT_EQ("hello\nworld", cUnescape<std::string>("hello\\nworld"));
172 EXPECT_EQ("hello\nworld", cUnescape<std::string>("hello\\012world"));
173 EXPECT_EQ("hello\nworld", cUnescape<std::string>("hello\\x0aworld"));
174 EXPECT_EQ("hello\xff\xfe", cUnescape<std::string>("hello\\377\\376"));
175 EXPECT_EQ("hello\xff\xfe", cUnescape<std::string>("hello\\xff\\xfe"));
177 EXPECT_THROW({cUnescape<std::string>("hello\\");},
178 std::invalid_argument);
179 EXPECT_THROW({cUnescape<std::string>("hello\\x");},
180 std::invalid_argument);
181 EXPECT_THROW({cUnescape<std::string>("hello\\q");},
182 std::invalid_argument);
185 TEST(Escape, uriEscape) {
186 EXPECT_EQ("hello%2c%20%2fworld", uriEscape<std::string>("hello, /world"));
187 EXPECT_EQ("hello%2c%20/world", uriEscape<std::string>("hello, /world",
188 UriEscapeMode::PATH));
189 EXPECT_EQ("hello%2c+%2fworld", uriEscape<std::string>("hello, /world",
190 UriEscapeMode::QUERY));
192 "0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ-_.~",
193 uriEscape<std::string>(
194 "0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ-_.~")
198 TEST(Escape, uriUnescape) {
199 EXPECT_EQ("hello, /world", uriUnescape<std::string>("hello, /world"));
200 EXPECT_EQ("hello, /world", uriUnescape<std::string>("hello%2c%20%2fworld"));
201 EXPECT_EQ("hello,+/world", uriUnescape<std::string>("hello%2c+%2fworld"));
202 EXPECT_EQ("hello, /world", uriUnescape<std::string>("hello%2c+%2fworld",
203 UriEscapeMode::QUERY));
204 EXPECT_EQ("hello/", uriUnescape<std::string>("hello%2f"));
205 EXPECT_EQ("hello/", uriUnescape<std::string>("hello%2F"));
206 EXPECT_THROW({uriUnescape<std::string>("hello%");},
207 std::invalid_argument);
208 EXPECT_THROW({uriUnescape<std::string>("hello%2");},
209 std::invalid_argument);
210 EXPECT_THROW({uriUnescape<std::string>("hello%2g");},
211 std::invalid_argument);
215 void expectPrintable(StringPiece s) {
223 TEST(Escape, uriEscapeAllCombinations) {
226 StringPiece in(c, 2);
229 for (int i = 0; i < 256; ++i) {
231 for (int j = 0; j < 256; ++j) {
236 expectPrintable(tmp);
237 uriUnescape(tmp, out);
245 return ((v >= '0' && v <= '9') ||
246 (v >= 'A' && v <= 'F') ||
247 (v >= 'a' && v <= 'f'));
251 TEST(Escape, uriUnescapePercentDecoding) {
252 char c[4] = {'%', '\0', '\0', '\0'};
253 StringPiece in(c, 3);
255 unsigned int expected = 0;
256 for (int i = 0; i < 256; ++i) {
258 for (int j = 0; j < 256; ++j) {
260 if (isHex(i) && isHex(j)) {
262 uriUnescape(in, out);
263 EXPECT_EQ(1, out.size());
264 EXPECT_EQ(1, sscanf(c + 1, "%x", &expected));
265 unsigned char v = out[0];
266 EXPECT_EQ(expected, v);
268 EXPECT_THROW({uriUnescape(in, out);}, std::invalid_argument);
276 double pow2(int exponent) {
277 return double(int64_t(1) << exponent);
281 struct PrettyTestCase{
282 std::string prettyString;
284 PrettyType prettyType;
287 PrettyTestCase prettyTestCases[] =
289 {string("8.53e+07 s "), 85.3e6, PRETTY_TIME},
290 {string("8.53e+07 s "), 85.3e6, PRETTY_TIME},
291 {string("85.3 ms"), 85.3e-3, PRETTY_TIME},
292 {string("85.3 us"), 85.3e-6, PRETTY_TIME},
293 {string("85.3 ns"), 85.3e-9, PRETTY_TIME},
294 {string("85.3 ps"), 85.3e-12, PRETTY_TIME},
295 {string("8.53e-14 s "), 85.3e-15, PRETTY_TIME},
297 {string("0 s "), 0, PRETTY_TIME},
298 {string("1 s "), 1.0, PRETTY_TIME},
299 {string("1 ms"), 1.0e-3, PRETTY_TIME},
300 {string("1 us"), 1.0e-6, PRETTY_TIME},
301 {string("1 ns"), 1.0e-9, PRETTY_TIME},
302 {string("1 ps"), 1.0e-12, PRETTY_TIME},
304 // check bytes printing
305 {string("853 B "), 853., PRETTY_BYTES},
306 {string("833 kB"), 853.e3, PRETTY_BYTES},
307 {string("813.5 MB"), 853.e6, PRETTY_BYTES},
308 {string("7.944 GB"), 8.53e9, PRETTY_BYTES},
309 {string("794.4 GB"), 853.e9, PRETTY_BYTES},
310 {string("775.8 TB"), 853.e12, PRETTY_BYTES},
312 {string("0 B "), 0, PRETTY_BYTES},
313 {string("1 B "), pow2(0), PRETTY_BYTES},
314 {string("1 kB"), pow2(10), PRETTY_BYTES},
315 {string("1 MB"), pow2(20), PRETTY_BYTES},
316 {string("1 GB"), pow2(30), PRETTY_BYTES},
317 {string("1 TB"), pow2(40), PRETTY_BYTES},
319 {string("853 B "), 853., PRETTY_BYTES_IEC},
320 {string("833 KiB"), 853.e3, PRETTY_BYTES_IEC},
321 {string("813.5 MiB"), 853.e6, PRETTY_BYTES_IEC},
322 {string("7.944 GiB"), 8.53e9, PRETTY_BYTES_IEC},
323 {string("794.4 GiB"), 853.e9, PRETTY_BYTES_IEC},
324 {string("775.8 TiB"), 853.e12, PRETTY_BYTES_IEC},
326 {string("0 B "), 0, PRETTY_BYTES_IEC},
327 {string("1 B "), pow2(0), PRETTY_BYTES_IEC},
328 {string("1 KiB"), pow2(10), PRETTY_BYTES_IEC},
329 {string("1 MiB"), pow2(20), PRETTY_BYTES_IEC},
330 {string("1 GiB"), pow2(30), PRETTY_BYTES_IEC},
331 {string("1 TiB"), pow2(40), PRETTY_BYTES_IEC},
333 // check bytes metric printing
334 {string("853 B "), 853., PRETTY_BYTES_METRIC},
335 {string("853 kB"), 853.e3, PRETTY_BYTES_METRIC},
336 {string("853 MB"), 853.e6, PRETTY_BYTES_METRIC},
337 {string("8.53 GB"), 8.53e9, PRETTY_BYTES_METRIC},
338 {string("853 GB"), 853.e9, PRETTY_BYTES_METRIC},
339 {string("853 TB"), 853.e12, PRETTY_BYTES_METRIC},
341 {string("0 B "), 0, PRETTY_BYTES_METRIC},
342 {string("1 B "), 1.0, PRETTY_BYTES_METRIC},
343 {string("1 kB"), 1.0e+3, PRETTY_BYTES_METRIC},
344 {string("1 MB"), 1.0e+6, PRETTY_BYTES_METRIC},
346 {string("1 GB"), 1.0e+9, PRETTY_BYTES_METRIC},
347 {string("1 TB"), 1.0e+12, PRETTY_BYTES_METRIC},
349 // check metric-units (powers of 1000) printing
350 {string("853 "), 853., PRETTY_UNITS_METRIC},
351 {string("853 k"), 853.e3, PRETTY_UNITS_METRIC},
352 {string("853 M"), 853.e6, PRETTY_UNITS_METRIC},
353 {string("8.53 bil"), 8.53e9, PRETTY_UNITS_METRIC},
354 {string("853 bil"), 853.e9, PRETTY_UNITS_METRIC},
355 {string("853 tril"), 853.e12, PRETTY_UNITS_METRIC},
357 // check binary-units (powers of 1024) printing
358 {string("0 "), 0, PRETTY_UNITS_BINARY},
359 {string("1 "), pow2(0), PRETTY_UNITS_BINARY},
360 {string("1 k"), pow2(10), PRETTY_UNITS_BINARY},
361 {string("1 M"), pow2(20), PRETTY_UNITS_BINARY},
362 {string("1 G"), pow2(30), PRETTY_UNITS_BINARY},
363 {string("1 T"), pow2(40), PRETTY_UNITS_BINARY},
365 {string("1023 "), pow2(10) - 1, PRETTY_UNITS_BINARY},
366 {string("1024 k"), pow2(20) - 1, PRETTY_UNITS_BINARY},
367 {string("1024 M"), pow2(30) - 1, PRETTY_UNITS_BINARY},
368 {string("1024 G"), pow2(40) - 1, PRETTY_UNITS_BINARY},
370 {string("0 "), 0, PRETTY_UNITS_BINARY_IEC},
371 {string("1 "), pow2(0), PRETTY_UNITS_BINARY_IEC},
372 {string("1 Ki"), pow2(10), PRETTY_UNITS_BINARY_IEC},
373 {string("1 Mi"), pow2(20), PRETTY_UNITS_BINARY_IEC},
374 {string("1 Gi"), pow2(30), PRETTY_UNITS_BINARY_IEC},
375 {string("1 Ti"), pow2(40), PRETTY_UNITS_BINARY_IEC},
377 {string("1023 "), pow2(10) - 1, PRETTY_UNITS_BINARY_IEC},
378 {string("1024 Ki"), pow2(20) - 1, PRETTY_UNITS_BINARY_IEC},
379 {string("1024 Mi"), pow2(30) - 1, PRETTY_UNITS_BINARY_IEC},
380 {string("1024 Gi"), pow2(40) - 1, PRETTY_UNITS_BINARY_IEC},
382 //check border SI cases
384 {string("1 Y"), 1e24, PRETTY_SI},
385 {string("10 Y"), 1e25, PRETTY_SI},
386 {string("1 y"), 1e-24, PRETTY_SI},
387 {string("10 y"), 1e-23, PRETTY_SI},
389 // check that negative values work
390 {string("-85.3 s "), -85.3, PRETTY_TIME},
391 {string("-85.3 ms"), -85.3e-3, PRETTY_TIME},
392 {string("-85.3 us"), -85.3e-6, PRETTY_TIME},
393 {string("-85.3 ns"), -85.3e-9, PRETTY_TIME},
395 {string("endoftest"), 0, PRETTY_NUM_TYPES}
398 TEST(PrettyPrint, Basic) {
399 for (int i = 0; prettyTestCases[i].prettyType != PRETTY_NUM_TYPES; ++i){
400 const PrettyTestCase& prettyTest = prettyTestCases[i];
401 EXPECT_EQ(prettyTest.prettyString,
402 prettyPrint(prettyTest.realValue, prettyTest.prettyType));
406 TEST(PrettyToDouble, Basic) {
407 // check manually created tests
408 for (int i = 0; prettyTestCases[i].prettyType != PRETTY_NUM_TYPES; ++i){
409 PrettyTestCase testCase = prettyTestCases[i];
410 PrettyType formatType = testCase.prettyType;
411 double x = testCase.realValue;
412 std::string testString = testCase.prettyString;
413 double recoveredX = 0;
415 recoveredX = prettyToDouble(testString, formatType);
416 } catch (std::range_error &ex){
419 double relativeError = fabs(x) < 1e-5 ? (x-recoveredX) :
420 (x - recoveredX) / x;
421 EXPECT_NEAR(0, relativeError, 1e-3);
424 // checks for compatibility with prettyPrint over the whole parameter space
425 for (int i = 0 ; i < PRETTY_NUM_TYPES; ++i){
426 PrettyType formatType = static_cast<PrettyType>(i);
427 for (double x = 1e-18; x < 1e40; x *= 1.9){
428 bool addSpace = static_cast<PrettyType> (i) == PRETTY_SI;
429 for (int it = 0; it < 2; ++it, addSpace = true){
430 double recoveredX = 0;
432 recoveredX = prettyToDouble(prettyPrint(x, formatType, addSpace),
434 } catch (std::range_error &ex){
437 double relativeError = (x - recoveredX) / x;
438 EXPECT_NEAR(0, relativeError, 1e-3);
443 // check for incorrect values
444 EXPECT_THROW(prettyToDouble("10Mx", PRETTY_SI), std::range_error);
445 EXPECT_THROW(prettyToDouble("10 Mx", PRETTY_SI), std::range_error);
446 EXPECT_THROW(prettyToDouble("10 M x", PRETTY_SI), std::range_error);
448 StringPiece testString = "10Mx";
449 EXPECT_DOUBLE_EQ(prettyToDouble(&testString, PRETTY_UNITS_METRIC), 10e6);
450 EXPECT_EQ(testString, "x");
453 TEST(PrettyPrint, HexDump) {
454 std::string a("abc\x00\x02\xa0", 6); // embedded NUL
456 "00000000 61 62 63 00 02 a0 "
458 hexDump(a.data(), a.size()));
460 a = "abcdefghijklmnopqrstuvwxyz";
462 "00000000 61 62 63 64 65 66 67 68 69 6a 6b 6c 6d 6e 6f 70 "
463 "|abcdefghijklmnop|\n"
464 "00000010 71 72 73 74 75 76 77 78 79 7a "
466 hexDump(a.data(), a.size()));
469 TEST(System, errnoStr) {
471 EXPECT_EQ(EACCES, errno);
472 EXPECT_EQ(EACCES, errno); // twice to make sure EXPECT_EQ doesn't change it
474 fbstring expected = strerror(ENOENT);
477 EXPECT_EQ(expected, errnoStr(ENOENT));
478 // Ensure that errno isn't changed
479 EXPECT_EQ(EACCES, errno);
481 // Per POSIX, all errno values are positive, so -1 is invalid
484 // Ensure that errno isn't changed
485 EXPECT_EQ(EACCES, errno);
490 template<template<class,class> class VectorType>
492 VectorType<string,std::allocator<string> > parts;
494 folly::split(',', "a,b,c", parts);
495 EXPECT_EQ(parts.size(), 3);
496 EXPECT_EQ(parts[0], "a");
497 EXPECT_EQ(parts[1], "b");
498 EXPECT_EQ(parts[2], "c");
501 folly::split(',', StringPiece("a,b,c"), parts);
502 EXPECT_EQ(parts.size(), 3);
503 EXPECT_EQ(parts[0], "a");
504 EXPECT_EQ(parts[1], "b");
505 EXPECT_EQ(parts[2], "c");
508 folly::split(',', string("a,b,c"), parts);
509 EXPECT_EQ(parts.size(), 3);
510 EXPECT_EQ(parts[0], "a");
511 EXPECT_EQ(parts[1], "b");
512 EXPECT_EQ(parts[2], "c");
515 folly::split(',', "a,,c", parts);
516 EXPECT_EQ(parts.size(), 3);
517 EXPECT_EQ(parts[0], "a");
518 EXPECT_EQ(parts[1], "");
519 EXPECT_EQ(parts[2], "c");
522 folly::split(',', string("a,,c"), parts);
523 EXPECT_EQ(parts.size(), 3);
524 EXPECT_EQ(parts[0], "a");
525 EXPECT_EQ(parts[1], "");
526 EXPECT_EQ(parts[2], "c");
529 folly::split(',', "a,,c", parts, true);
530 EXPECT_EQ(parts.size(), 2);
531 EXPECT_EQ(parts[0], "a");
532 EXPECT_EQ(parts[1], "c");
535 folly::split(',', string("a,,c"), parts, true);
536 EXPECT_EQ(parts.size(), 2);
537 EXPECT_EQ(parts[0], "a");
538 EXPECT_EQ(parts[1], "c");
541 folly::split(',', string(",,a,,c,,,"), parts, true);
542 EXPECT_EQ(parts.size(), 2);
543 EXPECT_EQ(parts[0], "a");
544 EXPECT_EQ(parts[1], "c");
547 // test multiple split w/o clear
548 folly::split(',', ",,a,,c,,,", parts, true);
549 EXPECT_EQ(parts.size(), 2);
550 EXPECT_EQ(parts[0], "a");
551 EXPECT_EQ(parts[1], "c");
552 folly::split(',', ",,a,,c,,,", parts, true);
553 EXPECT_EQ(parts.size(), 4);
554 EXPECT_EQ(parts[2], "a");
555 EXPECT_EQ(parts[3], "c");
558 // test splits that with multi-line delimiter
559 folly::split("ab", "dabcabkdbkab", parts, true);
560 EXPECT_EQ(parts.size(), 3);
561 EXPECT_EQ(parts[0], "d");
562 EXPECT_EQ(parts[1], "c");
563 EXPECT_EQ(parts[2], "kdbk");
566 // test last part is shorter than the delimiter
567 folly::split("bc", "abcd", parts, true);
568 EXPECT_EQ(parts.size(), 2);
569 EXPECT_EQ(parts[0], "a");
570 EXPECT_EQ(parts[1], "d");
573 string orig = "ab2342asdfv~~!";
574 folly::split("", orig, parts, true);
575 EXPECT_EQ(parts.size(), 1);
576 EXPECT_EQ(parts[0], orig);
579 folly::split("452x;o38asfsajsdlfdf.j", "asfds", parts, true);
580 EXPECT_EQ(parts.size(), 1);
581 EXPECT_EQ(parts[0], "asfds");
584 folly::split("a", "", parts, true);
585 EXPECT_EQ(parts.size(), 0);
588 folly::split("a", "", parts);
589 EXPECT_EQ(parts.size(), 1);
590 EXPECT_EQ(parts[0], "");
593 folly::split("a", StringPiece(), parts, true);
594 EXPECT_EQ(parts.size(), 0);
597 folly::split("a", StringPiece(), parts);
598 EXPECT_EQ(parts.size(), 1);
599 EXPECT_EQ(parts[0], "");
602 folly::split("a", "abcdefg", parts, true);
603 EXPECT_EQ(parts.size(), 1);
604 EXPECT_EQ(parts[0], "bcdefg");
607 orig = "All, , your base, are , , belong to us";
608 folly::split(", ", orig, parts, true);
609 EXPECT_EQ(parts.size(), 4);
610 EXPECT_EQ(parts[0], "All");
611 EXPECT_EQ(parts[1], "your base");
612 EXPECT_EQ(parts[2], "are ");
613 EXPECT_EQ(parts[3], "belong to us");
615 folly::split(", ", orig, parts);
616 EXPECT_EQ(parts.size(), 6);
617 EXPECT_EQ(parts[0], "All");
618 EXPECT_EQ(parts[1], "");
619 EXPECT_EQ(parts[2], "your base");
620 EXPECT_EQ(parts[3], "are ");
621 EXPECT_EQ(parts[4], "");
622 EXPECT_EQ(parts[5], "belong to us");
625 orig = ", Facebook, rul,es!, ";
626 folly::split(", ", orig, parts, true);
627 EXPECT_EQ(parts.size(), 2);
628 EXPECT_EQ(parts[0], "Facebook");
629 EXPECT_EQ(parts[1], "rul,es!");
631 folly::split(", ", orig, parts);
632 EXPECT_EQ(parts.size(), 4);
633 EXPECT_EQ(parts[0], "");
634 EXPECT_EQ(parts[1], "Facebook");
635 EXPECT_EQ(parts[2], "rul,es!");
636 EXPECT_EQ(parts[3], "");
639 template<template<class,class> class VectorType>
641 VectorType<StringPiece,std::allocator<StringPiece> > pieces;
642 VectorType<StringPiece,std::allocator<StringPiece> > pieces2;
644 folly::split(',', "a,b,c", pieces);
645 EXPECT_EQ(pieces.size(), 3);
646 EXPECT_EQ(pieces[0], "a");
647 EXPECT_EQ(pieces[1], "b");
648 EXPECT_EQ(pieces[2], "c");
652 folly::split(',', "a,,c", pieces);
653 EXPECT_EQ(pieces.size(), 3);
654 EXPECT_EQ(pieces[0], "a");
655 EXPECT_EQ(pieces[1], "");
656 EXPECT_EQ(pieces[2], "c");
659 folly::split(',', "a,,c", pieces, true);
660 EXPECT_EQ(pieces.size(), 2);
661 EXPECT_EQ(pieces[0], "a");
662 EXPECT_EQ(pieces[1], "c");
665 folly::split(',', ",,a,,c,,,", pieces, true);
666 EXPECT_EQ(pieces.size(), 2);
667 EXPECT_EQ(pieces[0], "a");
668 EXPECT_EQ(pieces[1], "c");
671 // test multiple split w/o clear
672 folly::split(',', ",,a,,c,,,", pieces, true);
673 EXPECT_EQ(pieces.size(), 2);
674 EXPECT_EQ(pieces[0], "a");
675 EXPECT_EQ(pieces[1], "c");
676 folly::split(',', ",,a,,c,,,", pieces, true);
677 EXPECT_EQ(pieces.size(), 4);
678 EXPECT_EQ(pieces[2], "a");
679 EXPECT_EQ(pieces[3], "c");
682 // test multiple split rounds
683 folly::split(",", "a_b,c_d", pieces);
684 EXPECT_EQ(pieces.size(), 2);
685 EXPECT_EQ(pieces[0], "a_b");
686 EXPECT_EQ(pieces[1], "c_d");
687 folly::split("_", pieces[0], pieces2);
688 EXPECT_EQ(pieces2.size(), 2);
689 EXPECT_EQ(pieces2[0], "a");
690 EXPECT_EQ(pieces2[1], "b");
692 folly::split("_", pieces[1], pieces2);
693 EXPECT_EQ(pieces2.size(), 2);
694 EXPECT_EQ(pieces2[0], "c");
695 EXPECT_EQ(pieces2[1], "d");
699 // test splits that with multi-line delimiter
700 folly::split("ab", "dabcabkdbkab", pieces, true);
701 EXPECT_EQ(pieces.size(), 3);
702 EXPECT_EQ(pieces[0], "d");
703 EXPECT_EQ(pieces[1], "c");
704 EXPECT_EQ(pieces[2], "kdbk");
707 string orig = "ab2342asdfv~~!";
708 folly::split("", orig.c_str(), pieces, true);
709 EXPECT_EQ(pieces.size(), 1);
710 EXPECT_EQ(pieces[0], orig);
713 folly::split("452x;o38asfsajsdlfdf.j", "asfds", pieces, true);
714 EXPECT_EQ(pieces.size(), 1);
715 EXPECT_EQ(pieces[0], "asfds");
718 folly::split("a", "", pieces, true);
719 EXPECT_EQ(pieces.size(), 0);
722 folly::split("a", "", pieces);
723 EXPECT_EQ(pieces.size(), 1);
724 EXPECT_EQ(pieces[0], "");
727 folly::split("a", "abcdefg", pieces, true);
728 EXPECT_EQ(pieces.size(), 1);
729 EXPECT_EQ(pieces[0], "bcdefg");
732 orig = "All, , your base, are , , belong to us";
733 folly::split(", ", orig, pieces, true);
734 EXPECT_EQ(pieces.size(), 4);
735 EXPECT_EQ(pieces[0], "All");
736 EXPECT_EQ(pieces[1], "your base");
737 EXPECT_EQ(pieces[2], "are ");
738 EXPECT_EQ(pieces[3], "belong to us");
740 folly::split(", ", orig, pieces);
741 EXPECT_EQ(pieces.size(), 6);
742 EXPECT_EQ(pieces[0], "All");
743 EXPECT_EQ(pieces[1], "");
744 EXPECT_EQ(pieces[2], "your base");
745 EXPECT_EQ(pieces[3], "are ");
746 EXPECT_EQ(pieces[4], "");
747 EXPECT_EQ(pieces[5], "belong to us");
750 orig = ", Facebook, rul,es!, ";
751 folly::split(", ", orig, pieces, true);
752 EXPECT_EQ(pieces.size(), 2);
753 EXPECT_EQ(pieces[0], "Facebook");
754 EXPECT_EQ(pieces[1], "rul,es!");
756 folly::split(", ", orig, pieces);
757 EXPECT_EQ(pieces.size(), 4);
758 EXPECT_EQ(pieces[0], "");
759 EXPECT_EQ(pieces[1], "Facebook");
760 EXPECT_EQ(pieces[2], "rul,es!");
761 EXPECT_EQ(pieces[3], "");
764 const char* str = "a,b";
765 folly::split(',', StringPiece(str), pieces);
766 EXPECT_EQ(pieces.size(), 2);
767 EXPECT_EQ(pieces[0], "a");
768 EXPECT_EQ(pieces[1], "b");
769 EXPECT_EQ(pieces[0].start(), str);
770 EXPECT_EQ(pieces[1].start(), str + 2);
772 std::set<StringPiece> unique;
773 folly::splitTo<StringPiece>(":", "asd:bsd:asd:asd:bsd:csd::asd",
774 std::inserter(unique, unique.begin()), true);
775 EXPECT_EQ(unique.size(), 3);
776 if (unique.size() == 3) {
777 EXPECT_EQ(*unique.begin(), "asd");
778 EXPECT_EQ(*--unique.end(), "csd");
781 VectorType<fbstring,std::allocator<fbstring> > blah;
782 folly::split('-', "a-b-c-d-f-e", blah);
783 EXPECT_EQ(blah.size(), 6);
788 TEST(Split, split_vector) {
789 splitTest<std::vector>();
791 TEST(Split, split_fbvector) {
792 splitTest<folly::fbvector>();
794 TEST(Split, pieces_vector) {
795 piecesTest<std::vector>();
797 TEST(Split, pieces_fbvector) {
798 piecesTest<folly::fbvector>();
802 StringPiece a, b, c, d;
804 EXPECT_TRUE(folly::split<false>('.', "a.b.c.d", a, b, c, d));
805 EXPECT_TRUE(folly::split<false>('.', "a.b.c", a, b, c));
806 EXPECT_TRUE(folly::split<false>('.', "a.b", a, b));
807 EXPECT_TRUE(folly::split<false>('.', "a", a));
809 EXPECT_TRUE(folly::split('.', "a.b.c.d", a, b, c, d));
810 EXPECT_TRUE(folly::split('.', "a.b.c", a, b, c));
811 EXPECT_TRUE(folly::split('.', "a.b", a, b));
812 EXPECT_TRUE(folly::split('.', "a", a));
814 EXPECT_TRUE(folly::split<false>('.', "a.b.c", a, b, c));
818 EXPECT_FALSE(folly::split<false>('.', "a.b", a, b, c));
819 EXPECT_TRUE(folly::split<false>('.', "a.b.c", a, b));
823 EXPECT_TRUE(folly::split('.', "a.b.c", a, b, c));
827 EXPECT_FALSE(folly::split('.', "a.b.c", a, b));
828 EXPECT_FALSE(folly::split('.', "a.b", a, b, c));
830 EXPECT_TRUE(folly::split<false>('.', "a.b", a, b));
833 EXPECT_FALSE(folly::split<false>('.', "a", a, b));
834 EXPECT_TRUE(folly::split<false>('.', "a.b", a));
837 EXPECT_TRUE(folly::split('.', "a.b", a, b));
840 EXPECT_FALSE(folly::split('.', "a", a, b));
841 EXPECT_FALSE(folly::split('.', "a.b", a));
844 TEST(Split, std_string_fixed) {
845 std::string a, b, c, d;
847 EXPECT_TRUE(folly::split<false>('.', "a.b.c.d", a, b, c, d));
848 EXPECT_TRUE(folly::split<false>('.', "a.b.c", a, b, c));
849 EXPECT_TRUE(folly::split<false>('.', "a.b", a, b));
850 EXPECT_TRUE(folly::split<false>('.', "a", a));
852 EXPECT_TRUE(folly::split('.', "a.b.c.d", a, b, c, d));
853 EXPECT_TRUE(folly::split('.', "a.b.c", a, b, c));
854 EXPECT_TRUE(folly::split('.', "a.b", a, b));
855 EXPECT_TRUE(folly::split('.', "a", a));
857 EXPECT_TRUE(folly::split<false>('.', "a.b.c", a, b, c));
861 EXPECT_FALSE(folly::split<false>('.', "a.b", a, b, c));
862 EXPECT_TRUE(folly::split<false>('.', "a.b.c", a, b));
866 EXPECT_TRUE(folly::split('.', "a.b.c", a, b, c));
870 EXPECT_FALSE(folly::split('.', "a.b.c", a, b));
871 EXPECT_FALSE(folly::split('.', "a.b", a, b, c));
873 EXPECT_TRUE(folly::split<false>('.', "a.b", a, b));
876 EXPECT_FALSE(folly::split<false>('.', "a", a, b));
877 EXPECT_TRUE(folly::split<false>('.', "a.b", a));
880 EXPECT_TRUE(folly::split('.', "a.b", a, b));
883 EXPECT_FALSE(folly::split('.', "a", a, b));
884 EXPECT_FALSE(folly::split('.', "a.b", a));
887 TEST(Split, fixed_convert) {
892 EXPECT_TRUE(folly::split(':', "a:13:14.7:b", a, b, c, d));
895 EXPECT_NEAR(14.7, c, 1e-10);
898 EXPECT_TRUE(folly::split<false>(':', "b:14:15.3:c", a, b, c, d));
901 EXPECT_NEAR(15.3, c, 1e-10);
904 EXPECT_FALSE(folly::split(':', "a:13:14.7:b", a, b, d));
906 EXPECT_TRUE(folly::split<false>(':', "a:13:14.7:b", a, b, d));
909 EXPECT_EQ("14.7:b", d);
912 // Enable verifying that a line only contains one field
913 EXPECT_TRUE(folly::split(' ', "hello", a));
914 EXPECT_FALSE(folly::split(' ', "hello world", a));
924 void parseTo(folly::StringPiece in, Color& out) {
927 } else if (in == "B") {
930 throw runtime_error("");
935 TEST(Split, fixed_convert_custom) {
938 EXPECT_TRUE(folly::split(',', "R,B", c1, c2));
939 EXPECT_EQ(c1, my::Color::Red);
940 EXPECT_EQ(c2, my::Color::Blue);
946 std::vector<int> empty = { };
947 join(":", empty, output);
948 EXPECT_TRUE(output.empty());
950 std::vector<std::string> input1 = { "1", "23", "456", "" };
951 join(':', input1, output);
952 EXPECT_EQ(output, "1:23:456:");
953 output = join(':', input1);
954 EXPECT_EQ(output, "1:23:456:");
956 auto input2 = { 1, 23, 456 };
957 join("-*-", input2, output);
958 EXPECT_EQ(output, "1-*-23-*-456");
959 output = join("-*-", input2);
960 EXPECT_EQ(output, "1-*-23-*-456");
962 auto input3 = { 'f', 'a', 'c', 'e', 'b', 'o', 'o', 'k' };
963 join("", input3, output);
964 EXPECT_EQ(output, "facebook");
966 join("_", { "", "f", "a", "c", "e", "b", "o", "o", "k", "" }, output);
967 EXPECT_EQ(output, "_f_a_c_e_b_o_o_k_");
969 output = join("", input3.begin(), input3.end());
970 EXPECT_EQ(output, "facebook");
973 TEST(String, hexlify) {
974 string input1 = "0123";
976 EXPECT_TRUE(hexlify(input1, output1));
977 EXPECT_EQ("30313233", output1);
979 fbstring input2 = "abcdefg";
984 EXPECT_TRUE(hexlify(input2, output2));
985 EXPECT_EQ("610063ff65b667", output2);
987 EXPECT_EQ("666f6f626172", hexlify("foobar"));
988 auto bytes = folly::make_array<uint8_t>(1, 2, 3, 4);
989 EXPECT_EQ("01020304", hexlify(ByteRange{bytes.data(), bytes.size()}));
992 TEST(String, unhexlify) {
993 string input1 = "30313233";
995 EXPECT_TRUE(unhexlify(input1, output1));
996 EXPECT_EQ(output1, "0123");
998 fbstring input2 = "610063ff65b667";
1000 EXPECT_TRUE(unhexlify(input2, output2));
1001 EXPECT_EQ(output2.size(), 7);
1002 EXPECT_EQ(output2[0], 'a');
1003 EXPECT_EQ(output2[1], 0);
1004 EXPECT_EQ(output2[2], 'c');
1005 EXPECT_EQ(output2[3] & 0xff, 0xff);
1006 EXPECT_EQ(output2[4], 'e');
1007 EXPECT_EQ(output2[5] & 0xff, 0xb6);
1008 EXPECT_EQ(output2[6], 'g');
1010 string input3 = "x";
1012 EXPECT_FALSE(unhexlify(input3, output3));
1014 string input4 = "xy";
1016 EXPECT_FALSE(unhexlify(input4, output4));
1018 EXPECT_EQ("foobar", unhexlify("666f6f626172"));
1019 EXPECT_EQ(StringPiece("foo\0bar", 7), unhexlify("666f6f00626172"));
1020 EXPECT_THROW(unhexlify("666f6fzz626172"), std::domain_error);
1023 TEST(String, backslashify) {
1024 EXPECT_EQ("abc", string("abc"));
1025 EXPECT_EQ("abc", backslashify(string("abc")));
1026 EXPECT_EQ("abc\\r", backslashify(string("abc\r")));
1027 EXPECT_EQ("abc\\x0d", backslashify(string("abc\r"), true));
1028 EXPECT_EQ("\\0\\0", backslashify(string(2, '\0')));
1031 TEST(String, humanify) {
1032 // Simple cases; output is obvious.
1033 EXPECT_EQ("abc", humanify(string("abc")));
1034 EXPECT_EQ("abc\\\\r", humanify(string("abc\\r")));
1035 EXPECT_EQ("0xff", humanify(string("\xff")));
1036 EXPECT_EQ("abc\\xff", humanify(string("abc\xff")));
1037 EXPECT_EQ("abc\\b", humanify(string("abc\b")));
1038 EXPECT_EQ("0x00", humanify(string(1, '\0')));
1039 EXPECT_EQ("0x0000", humanify(string(2, '\0')));
1042 // Mostly printable, so backslash! 80, 60, and 40% printable, respectively
1043 EXPECT_EQ("aaaa\\xff", humanify(string("aaaa\xff")));
1044 EXPECT_EQ("aaa\\xff\\xff", humanify(string("aaa\xff\xff")));
1045 EXPECT_EQ("aa\\xff\\xff\\xff", humanify(string("aa\xff\xff\xff")));
1047 // 20% printable, and the printable portion isn't the prefix; hexify!
1048 EXPECT_EQ("0xff61ffffff", humanify(string("\xff" "a\xff\xff\xff")));
1050 // Same as previous, except swap first two chars; prefix is
1051 // printable and within the threshold, so backslashify.
1052 EXPECT_EQ("a\\xff\\xff\\xff\\xff", humanify(string("a\xff\xff\xff\xff")));
1054 // Just too much unprintable; hex, despite prefix.
1055 EXPECT_EQ("0x61ffffffffff", humanify(string("a\xff\xff\xff\xff\xff")));
1061 * Copy bytes from src to somewhere in the buffer referenced by dst. The
1062 * actual starting position of the copy will be the first address in the
1063 * destination buffer whose address mod 8 is equal to the src address mod 8.
1064 * The caller is responsible for ensuring that the destination buffer has
1065 * enough extra space to accommodate the shifted copy.
1067 char* copyWithSameAlignment(char* dst, const char* src, size_t length) {
1068 const char* originalDst = dst;
1069 size_t dstOffset = size_t(dst) & 0x7;
1070 size_t srcOffset = size_t(src) & 0x7;
1071 while (dstOffset != srcOffset) {
1076 CHECK(dst <= originalDst + 7);
1077 CHECK((size_t(dst) & 0x7) == (size_t(src) & 0x7));
1078 memcpy(dst, src, length);
1082 void testToLowerAscii(Range<const char*> src) {
1083 // Allocate extra space so we can make copies that start at the
1084 // same alignment (byte, word, quadword, etc) as the source buffer.
1085 char controlBuf[src.size() + 7];
1086 char* control = copyWithSameAlignment(controlBuf, src.begin(), src.size());
1088 char testBuf[src.size() + 7];
1089 char* test = copyWithSameAlignment(testBuf, src.begin(), src.size());
1091 for (size_t i = 0; i < src.size(); i++) {
1092 control[i] = tolower(control[i]);
1094 toLowerAscii(test, src.size());
1095 for (size_t i = 0; i < src.size(); i++) {
1096 EXPECT_EQ(control[i], test[i]);
1102 TEST(String, toLowerAsciiAligned) {
1103 static const size_t kSize = 256;
1105 for (size_t i = 0; i < kSize; i++) {
1106 input[i] = (char)(i & 0xff);
1108 testToLowerAscii(Range<const char*>(input, kSize));
1111 TEST(String, toLowerAsciiUnaligned) {
1112 static const size_t kSize = 256;
1114 for (size_t i = 0; i < kSize; i++) {
1115 input[i] = (char)(i & 0xff);
1117 // Test input buffers of several lengths to exercise all the
1118 // cases: buffer at the start/middle/end of an aligned block, plus
1119 // buffers that span multiple aligned blocks. The longest test input
1120 // is 3 unaligned bytes + 4 32-bit aligned bytes + 8 64-bit aligned
1121 // + 4 32-bit aligned + 3 unaligned = 22 bytes.
1122 for (size_t length = 1; length < 23; length++) {
1123 for (size_t offset = 0; offset + length <= kSize; offset++) {
1124 testToLowerAscii(Range<const char*>(input + offset, length));
1129 TEST(String, whitespace) {
1131 EXPECT_EQ("kavabanga",
1132 trimWhitespace("kavabanga"));
1133 EXPECT_EQ("kavabanga",
1134 trimWhitespace("kavabanga \t \n "));
1135 EXPECT_EQ("kavabanga",
1136 trimWhitespace(" \t \r \n \n kavabanga"));
1137 EXPECT_EQ("kavabanga",
1138 trimWhitespace("\t \r \n kavabanga \t \n "));
1139 EXPECT_EQ("kavabanga",
1140 trimWhitespace(" \t \r \n \n kavabanga"));
1141 EXPECT_EQ("kavabanga",
1142 trimWhitespace("\t \r \n kavabanga \t \n "));
1144 ltrimWhitespace(rtrimWhitespace("kavabanga")),
1145 rtrimWhitespace(ltrimWhitespace("kavabanga")));
1147 ltrimWhitespace(rtrimWhitespace("kavabanga \r\t\n")),
1148 rtrimWhitespace(ltrimWhitespace("kavabanga \r\t\n")));
1149 EXPECT_EQ("", trimWhitespace("\t \r \n \t \n "));
1150 EXPECT_EQ("", trimWhitespace(""));
1151 EXPECT_EQ("", trimWhitespace("\t"));
1152 EXPECT_EQ("", trimWhitespace("\r"));
1153 EXPECT_EQ("", trimWhitespace("\n"));
1154 EXPECT_EQ("", trimWhitespace("\t "));
1155 EXPECT_EQ("", trimWhitespace("\r "));
1156 EXPECT_EQ("", trimWhitespace("\n "));
1157 EXPECT_EQ("", trimWhitespace(" \t"));
1158 EXPECT_EQ("", trimWhitespace(" \r"));
1159 EXPECT_EQ("", trimWhitespace(" \n"));
1162 EXPECT_EQ("kavabanga", ltrimWhitespace("\t kavabanga"));
1163 EXPECT_EQ("kavabanga \r\n", ltrimWhitespace("\t kavabanga \r\n"));
1164 EXPECT_EQ("", ltrimWhitespace("\r "));
1165 EXPECT_EQ("", ltrimWhitespace("\n "));
1166 EXPECT_EQ("", ltrimWhitespace("\r "));
1169 EXPECT_EQ("\t kavabanga", rtrimWhitespace("\t kavabanga"));
1170 EXPECT_EQ("\t kavabanga", rtrimWhitespace("\t kavabanga \r\n"));
1171 EXPECT_EQ("", rtrimWhitespace("\r "));
1172 EXPECT_EQ("", rtrimWhitespace("\n "));
1173 EXPECT_EQ("", rtrimWhitespace("\r "));
1176 TEST(String, stripLeftMargin_really_empty) {
1179 EXPECT_EQ(expected, stripLeftMargin(input));
1182 TEST(String, stripLeftMargin_empty) {
1183 auto input = R"TEXT(
1186 EXPECT_EQ(expected, stripLeftMargin(input));
1189 TEST(String, stripLeftMargin_only_whitespace) {
1190 // using ~ as a marker
1191 string input = R"TEXT(
1194 input = boost::regex_replace(input, boost::regex("~"), "");
1195 EXPECT_EQ("\n \n ", input);
1196 auto expected = "\n";
1197 EXPECT_EQ(expected, stripLeftMargin(input));
1200 TEST(String, stripLeftMargin_only_uneven_whitespace) {
1201 // using ~ as a marker1
1202 string input = R"TEXT(
1206 input = boost::regex_replace(input, boost::regex("~"), "");
1207 EXPECT_EQ("\n \n \n ", input);
1208 auto expected = "\n\n";
1210 EXPECT_EQ(expected, stripLeftMargin(input));
1213 TEST(String, stripLeftMargin_one_line) {
1214 auto input = R"TEXT(
1217 auto expected = "hi there bob!\n";
1218 EXPECT_EQ(expected, stripLeftMargin(input));
1221 TEST(String, stripLeftMargin_two_lines) {
1222 auto input = R"TEXT(
1226 auto expected = "hi there bob!\nnice weather today!\n";
1227 EXPECT_EQ(expected, stripLeftMargin(input));
1230 TEST(String, stripLeftMargin_three_lines_uneven) {
1231 auto input = R"TEXT(
1236 auto expected = " hi there bob!\nnice weather today!\n so long!\n";
1237 EXPECT_EQ(expected, stripLeftMargin(input));
1240 TEST(String, stripLeftMargin_preceding_blank_lines) {
1241 auto input = R"TEXT(
1246 auto expected = "\n\nhi there bob!\n";
1247 EXPECT_EQ(expected, stripLeftMargin(input));
1250 TEST(String, stripLeftMargin_succeeding_blank_lines) {
1251 auto input = R"TEXT(
1256 auto expected = "hi there bob!\n\n\n";
1257 EXPECT_EQ(expected, stripLeftMargin(input));
1260 TEST(String, stripLeftMargin_interstitial_undented_whiteline) {
1261 // using ~ as a marker
1262 string input = R"TEXT(
1267 input = boost::regex_replace(input, boost::regex(" +~"), "");
1268 EXPECT_EQ("\n hi there bob!\n\n so long!\n ", input);
1269 auto expected = "hi there bob!\n\nso long!\n";
1270 EXPECT_EQ(expected, stripLeftMargin(input));
1273 TEST(String, stripLeftMargin_interstitial_dedented_whiteline) {
1274 // using ~ as a marker
1275 string input = R"TEXT(
1280 input = boost::regex_replace(input, boost::regex("~"), "");
1281 EXPECT_EQ("\n hi there bob!\n \n so long!\n ", input);
1282 auto expected = "hi there bob!\n\nso long!\n";
1283 EXPECT_EQ(expected, stripLeftMargin(input));
1286 TEST(String, stripLeftMargin_interstitial_equidented_whiteline) {
1287 // using ~ as a marker
1288 string input = R"TEXT(
1293 input = boost::regex_replace(input, boost::regex("~"), "");
1294 EXPECT_EQ("\n hi there bob!\n \n so long!\n ", input);
1295 auto expected = "hi there bob!\n\nso long!\n";
1296 EXPECT_EQ(expected, stripLeftMargin(input));
1299 TEST(String, stripLeftMargin_interstitial_indented_whiteline) {
1300 // using ~ as a marker
1301 string input = R"TEXT(
1306 input = boost::regex_replace(input, boost::regex("~"), "");
1307 EXPECT_EQ("\n hi there bob!\n \n so long!\n ", input);
1308 auto expected = "hi there bob!\n \nso long!\n";
1309 EXPECT_EQ(expected, stripLeftMargin(input));
1312 TEST(String, stripLeftMargin_no_pre_whitespace) {
1313 // using ~ as a marker
1314 string input = R"TEXT( hi there bob!
1318 input = boost::regex_replace(input, boost::regex("~"), "");
1319 EXPECT_EQ(" hi there bob!\n \n so long!\n ", input);
1320 auto expected = "hi there bob!\n \nso long!\n";
1321 EXPECT_EQ(expected, stripLeftMargin(input));
1324 TEST(String, stripLeftMargin_no_post_whitespace) {
1325 // using ~ as a marker
1326 string input = R"TEXT(
1330 input = boost::regex_replace(input, boost::regex("~"), "");
1331 EXPECT_EQ("\n hi there bob!\n \n so long! ", input);
1332 auto expected = "hi there bob!\n \nso long! ";
1333 EXPECT_EQ(expected, stripLeftMargin(input));
1336 const folly::StringPiece kTestUTF8 = u8"This is \U0001F602 stuff!";
1338 TEST(UTF8StringPiece, valid_utf8) {
1339 folly::StringPiece sp = kTestUTF8;
1340 UTF8StringPiece utf8 = sp;
1341 // utf8.size() not available since it's not a random-access range
1342 EXPECT_EQ(16, utf8.walk_size());
1345 TEST(UTF8StringPiece, valid_suffix) {
1346 UTF8StringPiece utf8 = kTestUTF8.subpiece(8);
1347 EXPECT_EQ(8, utf8.walk_size());
1350 TEST(UTF8StringPiece, empty_mid_codepoint) {
1351 UTF8StringPiece utf8 = kTestUTF8.subpiece(9, 0); // okay since it's empty
1352 EXPECT_EQ(0, utf8.walk_size());
1355 TEST(UTF8StringPiece, invalid_mid_codepoint) {
1356 EXPECT_THROW(UTF8StringPiece(kTestUTF8.subpiece(9, 1)), std::out_of_range);
1359 TEST(UTF8StringPiece, valid_implicit_conversion) {
1360 std::string input = u8"\U0001F602\U0001F602\U0001F602";
1361 auto checkImplicitCtor = [](UTF8StringPiece implicitCtor) {
1362 return implicitCtor.walk_size();
1364 EXPECT_EQ(3, checkImplicitCtor(input));