[llvm] [ADT] Teach StringRef to take basic features from std::string_view (NFC) (PR #113797)

Kazu Hirata via llvm-commits llvm-commits at lists.llvm.org
Sun Oct 27 08:26:08 PDT 2024


https://github.com/kazutakahirata updated https://github.com/llvm/llvm-project/pull/113797

>From 0916c4c1a995cf8d584a8c804f3bfef0031d81ac Mon Sep 17 00:00:00 2001
From: Kazu Hirata <kazu at google.com>
Date: Sat, 26 Oct 2024 20:00:30 -0700
Subject: [PATCH 1/3] [ADT] Teach StringRef to take basic features from
 std::string_view (NFC)

This patch teaches StringRef to take basic features from
std::string_view, including:

- npos
- iterator types
- empty, begin, end, rbegin, rend

I'm not replacing performance-sensitive functions like find and
operator== for now so that this patch will likely stick.
---
 llvm/include/llvm/ADT/StringRef.h | 43 ++++++++++++-------------------
 llvm/lib/Support/StringRef.cpp    |  6 ++---
 2 files changed, 19 insertions(+), 30 deletions(-)

diff --git a/llvm/include/llvm/ADT/StringRef.h b/llvm/include/llvm/ADT/StringRef.h
index f879bbf7164fd6..e59a3f10ee76df 100644
--- a/llvm/include/llvm/ADT/StringRef.h
+++ b/llvm/include/llvm/ADT/StringRef.h
@@ -50,14 +50,14 @@ namespace llvm {
   /// general safe to store a StringRef.
   class LLVM_GSL_POINTER StringRef {
   public:
-    static constexpr size_t npos = ~size_t(0);
+    static constexpr size_t npos = std::string_view::npos;
 
-    using iterator = const char *;
-    using const_iterator = const char *;
-    using size_type = size_t;
-    using value_type = char;
-    using reverse_iterator = std::reverse_iterator<iterator>;
-    using const_reverse_iterator = std::reverse_iterator<const_iterator>;
+    using iterator = std::string_view::iterator;
+    using const_iterator = std::string_view::const_iterator;
+    using size_type = std::string_view::size_type;
+    using value_type = std::string_view::value_type;
+    using reverse_iterator = std::string_view::reverse_iterator;
+    using const_reverse_iterator = std::string_view::const_reverse_iterator;
 
   private:
     std::string_view View;
@@ -106,17 +106,10 @@ namespace llvm {
     /// @name Iterators
     /// @{
 
-    iterator begin() const { return data(); }
-
-    iterator end() const { return data() + size(); }
-
-    reverse_iterator rbegin() const {
-      return std::make_reverse_iterator(end());
-    }
-
-    reverse_iterator rend() const {
-      return std::make_reverse_iterator(begin());
-    }
+    iterator begin() const { return View.begin(); }
+    iterator end() const { return View.end(); }
+    reverse_iterator rbegin() const { return View.rbegin(); }
+    reverse_iterator rend() const { return View.rend(); }
 
     const unsigned char *bytes_begin() const {
       return reinterpret_cast<const unsigned char *>(begin());
@@ -137,7 +130,7 @@ namespace llvm {
     [[nodiscard]] constexpr const char *data() const { return View.data(); }
 
     /// empty - Check if the string is empty.
-    [[nodiscard]] constexpr bool empty() const { return size() == 0; }
+    [[nodiscard]] constexpr bool empty() const { return View.empty(); }
 
     /// size - Get the string size.
     [[nodiscard]] constexpr size_t size() const { return View.size(); }
@@ -145,13 +138,13 @@ namespace llvm {
     /// front - Get the first character in the string.
     [[nodiscard]] char front() const {
       assert(!empty());
-      return data()[0];
+      return View.front();
     }
 
     /// back - Get the last character in the string.
     [[nodiscard]] char back() const {
       assert(!empty());
-      return data()[size() - 1];
+      return View.back();
     }
 
     // copy - Allocate copy in Allocator and return StringRef to it.
@@ -222,7 +215,7 @@ namespace llvm {
     [[nodiscard]] std::string str() const {
       if (!data())
         return std::string();
-      return std::string(data(), size());
+      return std::string(View);
     }
 
     /// @}
@@ -246,9 +239,7 @@ namespace llvm {
     /// @name Type Conversions
     /// @{
 
-    constexpr operator std::string_view() const {
-      return std::string_view(data(), size());
-    }
+    constexpr operator std::string_view() const { return View; }
 
     /// @}
     /// @name String Predicates
@@ -288,7 +279,7 @@ namespace llvm {
     /// \returns The index of the first occurrence of \p C, or npos if not
     /// found.
     [[nodiscard]] size_t find(char C, size_t From = 0) const {
-      return std::string_view(*this).find(C, From);
+      return View.find(C, From);
     }
 
     /// Search for the first character \p C in the string, ignoring case.
diff --git a/llvm/lib/Support/StringRef.cpp b/llvm/lib/Support/StringRef.cpp
index 4f5fcb4857e805..ba45a625c0a8db 100644
--- a/llvm/lib/Support/StringRef.cpp
+++ b/llvm/lib/Support/StringRef.cpp
@@ -216,9 +216,7 @@ size_t StringRef::rfind_insensitive(char C, size_t From) const {
 ///
 /// \return - The index of the last occurrence of \arg Str, or npos if not
 /// found.
-size_t StringRef::rfind(StringRef Str) const {
-  return std::string_view(*this).rfind(Str);
-}
+size_t StringRef::rfind(StringRef Str) const { return View.rfind(Str); }
 
 size_t StringRef::rfind_insensitive(StringRef Str) const {
   size_t N = Str.size();
@@ -251,7 +249,7 @@ StringRef::size_type StringRef::find_first_of(StringRef Chars,
 /// find_first_not_of - Find the first character in the string that is not
 /// \arg C or npos if not found.
 StringRef::size_type StringRef::find_first_not_of(char C, size_t From) const {
-  return std::string_view(*this).find_first_not_of(C, From);
+  return View.find_first_not_of(C, From);
 }
 
 /// find_first_not_of - Find the first character in the string that is not

>From d862eae402e5513a3c62745a2ae7b3d5133530bb Mon Sep 17 00:00:00 2001
From: Kazu Hirata <kazu at google.com>
Date: Sun, 27 Oct 2024 00:12:00 -0700
Subject: [PATCH 2/3] Fix errors on Windows.

---
 llvm/include/llvm/ADT/StringRef.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/llvm/include/llvm/ADT/StringRef.h b/llvm/include/llvm/ADT/StringRef.h
index e59a3f10ee76df..a8b14eb99ae312 100644
--- a/llvm/include/llvm/ADT/StringRef.h
+++ b/llvm/include/llvm/ADT/StringRef.h
@@ -112,10 +112,10 @@ namespace llvm {
     reverse_iterator rend() const { return View.rend(); }
 
     const unsigned char *bytes_begin() const {
-      return reinterpret_cast<const unsigned char *>(begin());
+      return reinterpret_cast<const unsigned char *>(&*begin());
     }
     const unsigned char *bytes_end() const {
-      return reinterpret_cast<const unsigned char *>(end());
+      return reinterpret_cast<const unsigned char *>(&*end());
     }
     iterator_range<const unsigned char *> bytes() const {
       return make_range(bytes_begin(), bytes_end());

>From 599c2a3c37f65a09ab393092be6d7f0234c648ff Mon Sep 17 00:00:00 2001
From: Kazu Hirata <kazu at google.com>
Date: Sun, 27 Oct 2024 08:25:36 -0700
Subject: [PATCH 3/3] Use data() + size() instead of end().

---
 llvm/include/llvm/ADT/StringRef.h | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/llvm/include/llvm/ADT/StringRef.h b/llvm/include/llvm/ADT/StringRef.h
index a8b14eb99ae312..f6727950b70feb 100644
--- a/llvm/include/llvm/ADT/StringRef.h
+++ b/llvm/include/llvm/ADT/StringRef.h
@@ -112,10 +112,10 @@ namespace llvm {
     reverse_iterator rend() const { return View.rend(); }
 
     const unsigned char *bytes_begin() const {
-      return reinterpret_cast<const unsigned char *>(&*begin());
+      return reinterpret_cast<const unsigned char *>(data());
     }
     const unsigned char *bytes_end() const {
-      return reinterpret_cast<const unsigned char *>(&*end());
+      return reinterpret_cast<const unsigned char *>(data() + size());
     }
     iterator_range<const unsigned char *> bytes() const {
       return make_range(bytes_begin(), bytes_end());
@@ -260,7 +260,7 @@ namespace llvm {
     /// Check if this string ends with the given \p Suffix.
     [[nodiscard]] bool ends_with(StringRef Suffix) const {
       return size() >= Suffix.size() &&
-             compareMemory(end() - Suffix.size(), Suffix.data(),
+             compareMemory(data() + size() - Suffix.size(), Suffix.data(),
                            Suffix.size()) == 0;
     }
     [[nodiscard]] bool ends_with(char Suffix) const {



More information about the llvm-commits mailing list