[ADT] Add a single-character version of the small vector split routine

author Chandler Carruth <chandlerc@gmail.com>

Thu, 10 Sep 2015 06:07:03 +0000 (06:07 +0000)

committer Chandler Carruth <chandlerc@gmail.com>

Thu, 10 Sep 2015 06:07:03 +0000 (06:07 +0000)
author Chandler Carruth <chandlerc@gmail.com>
Thu, 10 Sep 2015 06:07:03 +0000 (06:07 +0000)
committer Chandler Carruth <chandlerc@gmail.com>
Thu, 10 Sep 2015 06:07:03 +0000 (06:07 +0000)
diff --git a/include/llvm/ADT/StringRef.h b/include/llvm/ADT/StringRef.h

index 95660a49f1f1b2d9fd8ea752423ff2a676710e21..414fbe4a6756b5011ce4e5df55cec1d8ea09a427 100644 (file)
--- a/include/llvm/ADT/StringRef.h
+++ b/include/llvm/ADT/StringRef.h
@@ -489,6 +489,23 @@ namespace llvm {
                 StringRef Separator, int MaxSplit = -1,
                 bool KeepEmpty = true) const;
  
+    /// Split into substrings around the occurrences of a separator character.
+    ///
+    /// Each substring is stored in \p A. If \p MaxSplit is >= 0, at most
+    /// \p MaxSplit splits are done and consequently <= \p MaxSplit + 1
+    /// elements are added to A.
+    /// If \p KeepEmpty is false, empty strings are not added to \p A. They
+    /// still count when considering \p MaxSplit.
+    /// A useful invariant is that
+    /// Separator.join(A) == *this if MaxSplit == -1 and KeepEmpty == true
+    ///
+    /// \param A - Where to put the substrings.
+    /// \param Separator - The character to split on.
+    /// \param MaxSplit - The maximum number of times the string is split.
+    /// \param KeepEmpty - True if empty substrings should be added.
+    void split(SmallVectorImpl<StringRef> &A, char Separator, int MaxSplit = -1,
+               bool KeepEmpty = true) const;
+
      /// Split into two substrings around the last occurrence of a separator
      /// character.
      ///
diff --git a/lib/Support/StringRef.cpp b/lib/Support/StringRef.cpp

index ddece087a9e7114a1ab8fdaa01eadef9096ebc84..f2e587cb527759b7e8fbbc27291f7f16228a24cd 100644 (file)
--- a/lib/Support/StringRef.cpp
+++ b/lib/Support/StringRef.cpp
@@ -294,6 +294,26 @@ void StringRef::split(SmallVectorImpl<StringRef> &A,
      A.push_back(rest);
  }
  
+void StringRef::split(SmallVectorImpl<StringRef> &A, char Separator,
+                      int MaxSplit, bool KeepEmpty) const {
+  StringRef rest = *this;
+
+  // rest.data() is used to distinguish cases like "a," that splits into
+  // "a" + "" and "a" that splits into "a" + 0.
+  for (int splits = 0;
+       rest.data() != nullptr && (MaxSplit < 0 || splits < MaxSplit);
+       ++splits) {
+    std::pair<StringRef, StringRef> p = rest.split(Separator);
+
+    if (KeepEmpty || p.first.size() != 0)
+      A.push_back(p.first);
+    rest = p.second;
+  }
+  // If we have a tail left, add it.
+  if (rest.data() != nullptr && (rest.size() != 0 || KeepEmpty))
+    A.push_back(rest);
+}
+
  //===----------------------------------------------------------------------===//
  // Helpful Algorithms
  //===----------------------------------------------------------------------===//
diff --git a/lib/Support/Triple.cpp b/lib/Support/Triple.cpp

index c1e68cac2f5af3c23f8b89da77ac944ab112ad41..dfe719d1f113b100aa5959e201d8da5560a633a6 100644 (file)
--- a/lib/Support/Triple.cpp
+++ b/lib/Support/Triple.cpp
@@ -624,7 +624,7 @@ std::string Triple::normalize(StringRef Str) {
  
    // Parse into components.
    SmallVector<StringRef, 4> Components;
-  Str.split(Components, "-");
+  Str.split(Components, '-');
  
    // If the first component corresponds to a known architecture, preferentially
    // use it for the architecture.  If the second component corresponds to a
diff --git a/unittests/ADT/StringRefTest.cpp b/unittests/ADT/StringRefTest.cpp

index d80179bd78738e2b2aa869a253736f54eedf3570..8af07da24ea12d8706bb320f12063e277fa7ec07 100644 (file)
--- a/unittests/ADT/StringRefTest.cpp
+++ b/unittests/ADT/StringRefTest.cpp
@@ -225,6 +225,11 @@ TEST(StringRefTest, Split2) {
    expected.push_back("a"); expected.push_back("b"); expected.push_back("c");
    StringRef("a,,b,c").split(parts, ",", 3, false);
    EXPECT_TRUE(parts == expected);
+
+  expected.clear(); parts.clear();
+  expected.push_back("a"); expected.push_back("b"); expected.push_back("c");
+  StringRef("a,,b,c").split(parts, ',', 3, false);
+  EXPECT_TRUE(parts == expected);
  }
  
  TEST(StringRefTest, Trim) {
author	Chandler Carruth <chandlerc@gmail.com>
	Thu, 10 Sep 2015 06:07:03 +0000 (06:07 +0000)
committer	Chandler Carruth <chandlerc@gmail.com>
	Thu, 10 Sep 2015 06:07:03 +0000 (06:07 +0000)
include/llvm/ADT/StringRef.h		patch \| blob \| history
lib/Support/StringRef.cpp		patch \| blob \| history
lib/Support/Triple.cpp		patch \| blob \| history
unittests/ADT/StringRefTest.cpp		patch \| blob \| history