https://github.com/hjanuschka updated 
https://github.com/llvm/llvm-project/pull/120055

>From 8b2dc9adf4fae2065823e5beb3a1cd851686913c Mon Sep 17 00:00:00 2001
From: Helmut Januschka <hel...@januschka.com>
Date: Mon, 16 Dec 2024 08:24:14 +0100
Subject: [PATCH 1/4] [clang-tidy] Add readability-string-view-substr check

Add a new check that suggests using string_view::remove_prefix() and
remove_suffix() instead of substr() when the intent is to remove
characters from either end of a string_view.
---
 .../clang-tidy/readability/CMakeLists.txt     |   1 +
 .../readability/ReadabilityTidyModule.cpp     |   3 +
 .../readability/StringViewSubstrCheck.cpp     | 132 ++++++++++++++++++
 .../readability/StringViewSubstrCheck.h       |  39 ++++++
 clang-tools-extra/docs/ReleaseNotes.rst       |   7 +
 .../checks/readability/string-view-substr.rst |  16 +++
 .../readability/stringview_substr.cpp         |  55 ++++++++
 7 files changed, 253 insertions(+)
 create mode 100644 
clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp
 create mode 100644 
clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.h
 create mode 100644 
clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst
 create mode 100644 
clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp

diff --git a/clang-tools-extra/clang-tidy/readability/CMakeLists.txt 
b/clang-tools-extra/clang-tidy/readability/CMakeLists.txt
index 8f303c51e1b0da..8b44fc339441ac 100644
--- a/clang-tools-extra/clang-tidy/readability/CMakeLists.txt
+++ b/clang-tools-extra/clang-tidy/readability/CMakeLists.txt
@@ -53,6 +53,7 @@ add_clang_library(clangTidyReadabilityModule STATIC
   StaticAccessedThroughInstanceCheck.cpp
   StaticDefinitionInAnonymousNamespaceCheck.cpp
   StringCompareCheck.cpp
+  StringViewSubstrCheck.cpp
   SuspiciousCallArgumentCheck.cpp
   UniqueptrDeleteReleaseCheck.cpp
   UppercaseLiteralSuffixCheck.cpp
diff --git a/clang-tools-extra/clang-tidy/readability/ReadabilityTidyModule.cpp 
b/clang-tools-extra/clang-tidy/readability/ReadabilityTidyModule.cpp
index d61c0ba39658e5..f36ec8f95ede60 100644
--- a/clang-tools-extra/clang-tidy/readability/ReadabilityTidyModule.cpp
+++ b/clang-tools-extra/clang-tidy/readability/ReadabilityTidyModule.cpp
@@ -56,6 +56,7 @@
 #include "StaticAccessedThroughInstanceCheck.h"
 #include "StaticDefinitionInAnonymousNamespaceCheck.h"
 #include "StringCompareCheck.h"
+#include "StringViewSubstrCheck.h"
 #include "SuspiciousCallArgumentCheck.h"
 #include "UniqueptrDeleteReleaseCheck.h"
 #include "UppercaseLiteralSuffixCheck.h"
@@ -146,6 +147,8 @@ class ReadabilityModule : public ClangTidyModule {
         "readability-static-definition-in-anonymous-namespace");
     CheckFactories.registerCheck<StringCompareCheck>(
         "readability-string-compare");
+    CheckFactories.registerCheck<StringViewSubstrCheck>(
+        "readability-stringview-substr");
     CheckFactories.registerCheck<readability::NamedParameterCheck>(
         "readability-named-parameter");
     CheckFactories.registerCheck<NonConstParameterCheck>(
diff --git a/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp 
b/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp
new file mode 100644
index 00000000000000..e86a971695a835
--- /dev/null
+++ b/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp
@@ -0,0 +1,132 @@
+//===--- StringViewSubstrCheck.cpp - clang-tidy------------------*- C++ 
-*-===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM 
Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+
+#include "StringViewSubstrCheck.h"
+#include "clang/AST/ASTContext.h"
+#include "clang/ASTMatchers/ASTMatchFinder.h"
+#include "clang/Lex/Lexer.h"
+
+using namespace clang::ast_matchers;
+
+namespace clang::tidy::readability {
+
+void StringViewSubstrCheck::registerMatchers(MatchFinder *Finder) {
+  const auto HasStringViewType = 
hasType(hasUnqualifiedDesugaredType(recordType(
+      hasDeclaration(recordDecl(hasName("::std::basic_string_view"))))));
+
+  // Match assignment to string_view's substr
+  Finder->addMatcher(
+      cxxOperatorCallExpr(
+          hasOverloadedOperatorName("="),
+          hasArgument(0, expr(HasStringViewType).bind("target")),
+          hasArgument(
+              1, cxxMemberCallExpr(callee(memberExpr(hasDeclaration(
+                                       cxxMethodDecl(hasName("substr"))))),
+                                   on(expr(HasStringViewType).bind("source")))
+                     .bind("substr_call")))
+          .bind("assignment"),
+      this);
+}
+
+void StringViewSubstrCheck::check(const MatchFinder::MatchResult &Result) {
+  const auto *Assignment =
+      Result.Nodes.getNodeAs<CXXOperatorCallExpr>("assignment");
+  const auto *Target = Result.Nodes.getNodeAs<Expr>("target");
+  const auto *Source = Result.Nodes.getNodeAs<Expr>("source");
+  const auto *SubstrCall =
+      Result.Nodes.getNodeAs<CXXMemberCallExpr>("substr_call");
+
+  if (!Assignment || !Target || !Source || !SubstrCall) {
+    return;
+  }
+
+  // Get the DeclRefExpr for the target and source to compare variables
+  const auto *TargetDRE = dyn_cast<DeclRefExpr>(Target->IgnoreParenImpCasts());
+  const auto *SourceDRE = dyn_cast<DeclRefExpr>(Source->IgnoreParenImpCasts());
+
+  // Only handle self-assignment cases
+  if (!TargetDRE || !SourceDRE ||
+      TargetDRE->getDecl() != SourceDRE->getDecl()) {
+    return;
+  }
+
+  const Expr *StartArg = SubstrCall->getArg(0);
+  const Expr *LengthArg =
+      SubstrCall->getNumArgs() > 1 ? SubstrCall->getArg(1) : nullptr;
+
+  // Get source text of first argument
+  std::string StartText =
+      Lexer::getSourceText(
+          CharSourceRange::getTokenRange(StartArg->getSourceRange()),
+          *Result.SourceManager, Result.Context->getLangOpts())
+          .str();
+
+  // Case 1: Check for remove_prefix pattern - only when the second arg is
+  // missing (uses npos)
+  if (!LengthArg || isa<CXXDefaultArgExpr>(LengthArg)) {
+    std::string Replacement = TargetDRE->getNameInfo().getAsString() +
+                              ".remove_prefix(" + StartText + ")";
+    diag(Assignment->getBeginLoc(), "prefer 'remove_prefix' over 'substr' for "
+                                    "removing characters from the start")
+        << FixItHint::CreateReplacement(Assignment->getSourceRange(),
+                                        Replacement);
+    return;
+  }
+
+  // Case 2: Check for remove_suffix pattern
+  if (StartText == "0") {
+    if (const auto *BinOp = dyn_cast<BinaryOperator>(LengthArg)) {
+      if (BinOp->getOpcode() == BO_Sub) {
+        const Expr *LHS = BinOp->getLHS();
+        const Expr *RHS = BinOp->getRHS();
+
+        // Check if LHS is a length() call on the same string_view
+        if (const auto *LengthCall = dyn_cast<CXXMemberCallExpr>(LHS)) {
+          if (const auto *LengthMethod =
+                  dyn_cast<CXXMethodDecl>(LengthCall->getDirectCallee())) {
+            if (LengthMethod->getName() == "length") {
+              // Verify the length() call is on the same string_view
+              const Expr *LengthObject =
+                  LengthCall->getImplicitObjectArgument();
+              const auto *LengthDRE =
+                  dyn_cast<DeclRefExpr>(LengthObject->IgnoreParenImpCasts());
+
+              if (!LengthDRE || LengthDRE->getDecl() != TargetDRE->getDecl()) {
+                return;
+              }
+
+              // Must be a simple non-zero integer literal
+              const auto *IL =
+                  dyn_cast<IntegerLiteral>(RHS->IgnoreParenImpCasts());
+              if (!IL || IL->getValue() == 0) {
+                return;
+              }
+
+              std::string RHSText =
+                  Lexer::getSourceText(
+                      CharSourceRange::getTokenRange(RHS->getSourceRange()),
+                      *Result.SourceManager, Result.Context->getLangOpts())
+                      .str();
+
+              std::string Replacement = TargetDRE->getNameInfo().getAsString() 
+
+                                        ".remove_suffix(" + RHSText + ")";
+              diag(Assignment->getBeginLoc(),
+                   "prefer 'remove_suffix' over 'substr' for removing "
+                   "characters from the end")
+                  << FixItHint::CreateReplacement(Assignment->getSourceRange(),
+                                                  Replacement);
+              return;
+            }
+          }
+        }
+      }
+    }
+  }
+}
+
+} // namespace clang::tidy::readability
diff --git a/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.h 
b/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.h
new file mode 100644
index 00000000000000..1a2054da1ed9cc
--- /dev/null
+++ b/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.h
@@ -0,0 +1,39 @@
+//===--- StringViewSubstrCheck.h - clang-tidy---------------------*- C++
+//-*-===//
+//
+// Part of the LLVM Project, under the Apache License v2.0 with LLVM 
Exceptions.
+// See https://llvm.org/LICENSE.txt for license information.
+// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+//
+//===----------------------------------------------------------------------===//
+
+#ifndef LLVM_CLANG_TOOLS_EXTRA_CLANG_TIDY_READABILITY_STRINGVIEWSUBSTRCHECK_H
+#define LLVM_CLANG_TOOLS_EXTRA_CLANG_TIDY_READABILITY_STRINGVIEWSUBSTRCHECK_H
+
+#include "../ClangTidyCheck.h"
+
+namespace clang::tidy::readability {
+
+/// Finds string_view substr() calls that can be replaced with remove_prefix()
+/// or remove_suffix().
+///
+/// For the user-facing documentation see:
+/// 
https://clang.llvm.org/extra/clang-tidy/checks/readability/string-view-substr.html
+///
+/// The check matches two patterns:
+///   sv = sv.substr(N) -> sv.remove_prefix(N)
+///   sv = sv.substr(0, sv.length() - N) -> sv.remove_suffix(N)
+///
+/// These replacements make the intent clearer and are more efficient as they
+/// modify the string_view in place rather than creating a new one.
+class StringViewSubstrCheck : public ClangTidyCheck {
+public:
+  StringViewSubstrCheck(StringRef Name, ClangTidyContext *Context)
+      : ClangTidyCheck(Name, Context) {}
+  void registerMatchers(ast_matchers::MatchFinder *Finder) override;
+  void check(const ast_matchers::MatchFinder::MatchResult &Result) override;
+};
+
+} // namespace clang::tidy::readability
+
+#endif // LLVM_CLANG_TOOLS_EXTRA_CLANG_TIDY_READABILITY_STRINGVIEWSUBSTRCHECK_H
\ No newline at end of file
diff --git a/clang-tools-extra/docs/ReleaseNotes.rst 
b/clang-tools-extra/docs/ReleaseNotes.rst
index 453a91e3b504cd..4eb6c98bcf461b 100644
--- a/clang-tools-extra/docs/ReleaseNotes.rst
+++ b/clang-tools-extra/docs/ReleaseNotes.rst
@@ -136,6 +136,13 @@ New checks
   Gives warnings for tagged unions, where the number of tags is
   different from the number of data members inside the union.
 
+- New :doc:`readability-string-view-substr 
+  <clang-tidy/checks/readability/string-view-substr>` check.
+
+  Finds ``std::string_view::substr()`` calls that can be replaced with clearer 
+  alternatives using ``remove_prefix()`` or ``remove_suffix()``. This makes 
the 
+  intent clearer and is more efficient as it modifies the string_view in place.
+
 - New :doc:`portability-template-virtual-member-function
   <clang-tidy/checks/portability/template-virtual-member-function>` check.
 
diff --git 
a/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst 
b/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst
new file mode 100644
index 00000000000000..f29bcbacc0d7d1
--- /dev/null
+++ 
b/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst
@@ -0,0 +1,16 @@
+.. title:: clang-tidy - readability-string-view-substr
+
+readability-string-view-substr
+==============================
+
+Finds ``string_view substr()`` calls that can be replaced with clearer 
alternatives
+using ``remove_prefix()`` or ``remove_suffix()``.
+
+The check suggests the following transformations:
+
+===========================================  =======================
+Expression                                   Replacement
+===========================================  =======================
+``sv = sv.substr(n)``                        ``sv.remove_prefix(n)``
+``sv = sv.substr(0, sv.length()-n)``         ``sv.remove_suffix(n)``
+===========================================  =======================
diff --git 
a/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp 
b/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp
new file mode 100644
index 00000000000000..274c305b640803
--- /dev/null
+++ 
b/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp
@@ -0,0 +1,55 @@
+// RUN: %check_clang_tidy %s readability-stringview-substr %t
+
+namespace std {
+template <typename T>
+class basic_string_view {
+public:
+  using size_type = unsigned long;
+  static constexpr size_type npos = -1;
+
+  basic_string_view(const char*) {}
+  basic_string_view substr(size_type pos, size_type count = npos) const { 
return *this; }
+  void remove_prefix(size_type n) {}
+  void remove_suffix(size_type n) {}
+  size_type length() const { return 0; }
+
+  // Needed for assignment operator
+  basic_string_view& operator=(const basic_string_view&) { return *this; }
+};
+
+using string_view = basic_string_view<char>;
+}
+
+void test() {
+  std::string_view sv("test");
+  std::string_view sv1("test");
+  std::string_view sv2("other");
+
+  // Should match: Removing N characters from start
+  sv = sv.substr(5);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_prefix' over 
'substr' for removing characters from the start [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_prefix(5)
+
+  // Should match: Removing N characters from end
+  sv = sv.substr(0, sv.length() - 3);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_suffix(3)
+
+  // Should not match: Basic substring operations
+  sv = sv.substr(0, 3);  // No warning - taking first N characters
+  sv = sv.substr(1, 3);  // No warning - taking N characters from position 1
+  
+  // Should not match: Operations on different string_views
+  sv = sv2.substr(0, sv2.length() - 3);  // No warning - not self-assignment
+  sv = sv.substr(0, sv2.length() - 3);   // No warning - length() from 
different string_view
+  sv1 = sv1.substr(0, sv2.length() - 3); // No warning - length() from 
different string_view
+  sv = sv1.substr(0, sv1.length() - 3);  // No warning - not self-assignment
+
+  // Should not match: Not actually removing from end
+  sv = sv.substr(0, sv.length());       // No warning - keeping entire string
+  sv = sv.substr(0, sv.length() - 0);   // No warning - subtracting zero
+  
+  // Should not match: Complex expressions
+  sv = sv.substr(0, sv.length() - (3 + 2));  // No warning - complex arithmetic
+  sv = sv.substr(1 + 2, sv.length() - 3);    // No warning - complex start 
position
+}

>From 64931c696fe64cdb8a7571029eea0cc40592a663 Mon Sep 17 00:00:00 2001
From: Helmut Januschka <hel...@januschka.com>
Date: Mon, 16 Dec 2024 11:14:12 +0100
Subject: [PATCH 2/4] up

---
 .../readability/StringViewSubstrCheck.cpp     | 19 ++++++++-
 .../readability/stringview_substr.cpp         | 41 +++++++++++++++++++
 2 files changed, 59 insertions(+), 1 deletion(-)

diff --git a/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp 
b/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp
index e86a971695a835..01c3895f61f5c4 100644
--- a/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp
+++ b/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp
@@ -79,7 +79,24 @@ void StringViewSubstrCheck::check(const 
MatchFinder::MatchResult &Result) {
   }
 
   // Case 2: Check for remove_suffix pattern
-  if (StartText == "0") {
+  const Expr *Start = StartArg->IgnoreParenImpCasts();
+  bool IsZero = false;
+
+  if (const auto *IL = dyn_cast<IntegerLiteral>(Start)) {
+    IsZero = IL->getValue() == 0;
+  } else if (const auto *DRE = dyn_cast<DeclRefExpr>(Start)) {
+    // Check constants
+    if (const auto *VD = dyn_cast<VarDecl>(DRE->getDecl())) {
+      if (VD->hasInit()) {
+        if (const auto *Init = dyn_cast<IntegerLiteral>(
+                VD->getInit()->IgnoreParenImpCasts())) {
+          IsZero = Init->getValue() == 0;
+        }
+      }
+    }
+  }
+
+  if (IsZero) {
     if (const auto *BinOp = dyn_cast<BinaryOperator>(LengthArg)) {
       if (BinOp->getOpcode() == BO_Sub) {
         const Expr *LHS = BinOp->getLHS();
diff --git 
a/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp 
b/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp
index 274c305b640803..2c1d9df3711b1d 100644
--- 
a/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp
+++ 
b/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp
@@ -53,3 +53,44 @@ void test() {
   sv = sv.substr(0, sv.length() - (3 + 2));  // No warning - complex arithmetic
   sv = sv.substr(1 + 2, sv.length() - 3);    // No warning - complex start 
position
 }
+
+void test_zeros() {
+  std::string_view sv("test");
+  const int kZero = 0;
+  constexpr std::string_view::size_type Zero = 0;  // Fixed: using 
string_view::size_type
+  #define START_POS 0
+  
+  // All of these should match remove_suffix pattern and trigger warnings
+  sv = sv.substr(0, sv.length() - 3);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_suffix(3)
+
+  sv = sv.substr(kZero, sv.length() - 3);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_suffix(3)
+
+  sv = sv.substr(Zero, sv.length() - 3);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_suffix(3)
+
+  sv = sv.substr(START_POS, sv.length() - 3);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_suffix(3)
+
+  sv = sv.substr((0), sv.length() - 3);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_suffix(3)
+
+  sv = sv.substr(0u, sv.length() - 3);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_suffix(3)
+
+  sv = sv.substr(0UL, sv.length() - 3);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_suffix(3)
+
+  // These should NOT match the remove_suffix pattern
+  sv = sv.substr(1-1, sv.length() - 3);  // No warning - complex expression
+  sv = sv.substr(sv.length() - 3, sv.length() - 3);  // No warning - non-zero 
start
+}
+

>From 5b81a4d383f2e9751acedf9a895671828c2b683d Mon Sep 17 00:00:00 2001
From: Helmut Januschka <hel...@januschka.com>
Date: Mon, 16 Dec 2024 20:49:30 +0100
Subject: [PATCH 3/4] up

---
 .../readability/StringViewSubstrCheck.cpp     | 148 ++++++++++++------
 .../checks/readability/string-view-substr.rst |   2 +
 .../readability/stringview_substr.cpp         |  82 +++++-----
 3 files changed, 149 insertions(+), 83 deletions(-)

diff --git a/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp 
b/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp
index 01c3895f61f5c4..5c079e3203c989 100644
--- a/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp
+++ b/clang-tools-extra/clang-tidy/readability/StringViewSubstrCheck.cpp
@@ -45,13 +45,11 @@ void StringViewSubstrCheck::check(const 
MatchFinder::MatchResult &Result) {
     return;
   }
 
-  // Get the DeclRefExpr for the target and source to compare variables
+  // Get the DeclRefExpr for the target and source
   const auto *TargetDRE = dyn_cast<DeclRefExpr>(Target->IgnoreParenImpCasts());
   const auto *SourceDRE = dyn_cast<DeclRefExpr>(Source->IgnoreParenImpCasts());
 
-  // Only handle self-assignment cases
-  if (!TargetDRE || !SourceDRE ||
-      TargetDRE->getDecl() != SourceDRE->getDecl()) {
+  if (!TargetDRE || !SourceDRE) {
     return;
   }
 
@@ -59,89 +57,143 @@ void StringViewSubstrCheck::check(const 
MatchFinder::MatchResult &Result) {
   const Expr *LengthArg =
       SubstrCall->getNumArgs() > 1 ? SubstrCall->getArg(1) : nullptr;
 
-  // Get source text of first argument
   std::string StartText =
       Lexer::getSourceText(
           CharSourceRange::getTokenRange(StartArg->getSourceRange()),
           *Result.SourceManager, Result.Context->getLangOpts())
           .str();
 
-  // Case 1: Check for remove_prefix pattern - only when the second arg is
-  // missing (uses npos)
+  const bool IsSameVar = (TargetDRE->getDecl() == SourceDRE->getDecl());
+
+  // Case 1: Check for remove_prefix pattern
   if (!LengthArg || isa<CXXDefaultArgExpr>(LengthArg)) {
-    std::string Replacement = TargetDRE->getNameInfo().getAsString() +
-                              ".remove_prefix(" + StartText + ")";
-    diag(Assignment->getBeginLoc(), "prefer 'remove_prefix' over 'substr' for "
-                                    "removing characters from the start")
-        << FixItHint::CreateReplacement(Assignment->getSourceRange(),
-                                        Replacement);
+    if (IsSameVar) {
+      std::string Replacement = TargetDRE->getNameInfo().getAsString() +
+                                ".remove_prefix(" + StartText + ")";
+      diag(Assignment->getBeginLoc(), "prefer 'remove_prefix' over 'substr' "
+                                      "for removing characters from the start")
+          << FixItHint::CreateReplacement(Assignment->getSourceRange(),
+                                          Replacement);
+    }
     return;
   }
 
-  // Case 2: Check for remove_suffix pattern
-  const Expr *Start = StartArg->IgnoreParenImpCasts();
+  // Check if StartArg resolves to 0
   bool IsZero = false;
 
-  if (const auto *IL = dyn_cast<IntegerLiteral>(Start)) {
+  // Handle cases where StartArg is an integer literal
+  if (const auto *IL =
+          dyn_cast<IntegerLiteral>(StartArg->IgnoreParenImpCasts())) {
     IsZero = IL->getValue() == 0;
-  } else if (const auto *DRE = dyn_cast<DeclRefExpr>(Start)) {
-    // Check constants
-    if (const auto *VD = dyn_cast<VarDecl>(DRE->getDecl())) {
-      if (VD->hasInit()) {
-        if (const auto *Init = dyn_cast<IntegerLiteral>(
-                VD->getInit()->IgnoreParenImpCasts())) {
-          IsZero = Init->getValue() == 0;
-        }
-      }
-    }
   }
 
+  // Optional: Handle cases where StartArg evaluates to zero
+  if (!IsZero) {
+    // Add logic for other constant evaluation (e.g., constexpr evaluation)
+    const auto &EvalResult = StartArg->EvaluateKnownConstInt(*Result.Context);
+    IsZero = !EvalResult.isNegative() && EvalResult == 0;
+  }
+
+  // If StartArg resolves to 0, handle the case
   if (IsZero) {
+    bool isFullCopy = false;
+
+    // Check for length() or length() - expr pattern
     if (const auto *BinOp = dyn_cast<BinaryOperator>(LengthArg)) {
       if (BinOp->getOpcode() == BO_Sub) {
         const Expr *LHS = BinOp->getLHS();
         const Expr *RHS = BinOp->getRHS();
 
-        // Check if LHS is a length() call on the same string_view
+        // Check for length() call
         if (const auto *LengthCall = dyn_cast<CXXMemberCallExpr>(LHS)) {
           if (const auto *LengthMethod =
                   dyn_cast<CXXMethodDecl>(LengthCall->getDirectCallee())) {
             if (LengthMethod->getName() == "length") {
-              // Verify the length() call is on the same string_view
               const Expr *LengthObject =
                   LengthCall->getImplicitObjectArgument();
               const auto *LengthDRE =
                   dyn_cast<DeclRefExpr>(LengthObject->IgnoreParenImpCasts());
 
-              if (!LengthDRE || LengthDRE->getDecl() != TargetDRE->getDecl()) {
+              if (!LengthDRE || LengthDRE->getDecl() != SourceDRE->getDecl()) {
                 return;
               }
 
-              // Must be a simple non-zero integer literal
-              const auto *IL =
-                  dyn_cast<IntegerLiteral>(RHS->IgnoreParenImpCasts());
-              if (!IL || IL->getValue() == 0) {
-                return;
+              // Check if RHS is 0 or evaluates to 0
+              bool IsZero = false;
+              if (const auto *IL =
+                      dyn_cast<IntegerLiteral>(RHS->IgnoreParenImpCasts())) {
+                IsZero = IL->getValue() == 0;
               }
 
-              std::string RHSText =
-                  Lexer::getSourceText(
-                      CharSourceRange::getTokenRange(RHS->getSourceRange()),
-                      *Result.SourceManager, Result.Context->getLangOpts())
-                      .str();
-
-              std::string Replacement = TargetDRE->getNameInfo().getAsString() 
+
-                                        ".remove_suffix(" + RHSText + ")";
-              diag(Assignment->getBeginLoc(),
-                   "prefer 'remove_suffix' over 'substr' for removing "
-                   "characters from the end")
-                  << FixItHint::CreateReplacement(Assignment->getSourceRange(),
-                                                  Replacement);
-              return;
+              if (IsZero) {
+                isFullCopy = true;
+              } else if (IsSameVar) {
+                // remove_suffix case (only for self-assignment)
+                std::string RHSText =
+                    Lexer::getSourceText(
+                        CharSourceRange::getTokenRange(RHS->getSourceRange()),
+                        *Result.SourceManager, Result.Context->getLangOpts())
+                        .str();
+
+                std::string Replacement =
+                    TargetDRE->getNameInfo().getAsString() + ".remove_suffix(" 
+
+                    RHSText + ")";
+                diag(Assignment->getBeginLoc(),
+                     "prefer 'remove_suffix' over 'substr' for removing "
+                     "characters from the end")
+                    << FixItHint::CreateReplacement(
+                           Assignment->getSourceRange(), Replacement);
+                return;
+              }
             }
           }
         }
       }
+    } else if (const auto *LengthCall =
+                   dyn_cast<CXXMemberCallExpr>(LengthArg)) {
+      // Handle direct length() call
+      if (const auto *LengthMethod =
+              dyn_cast<CXXMethodDecl>(LengthCall->getDirectCallee())) {
+        if (LengthMethod->getName() == "length") {
+          const Expr *LengthObject = LengthCall->getImplicitObjectArgument();
+          const auto *LengthDRE =
+              dyn_cast<DeclRefExpr>(LengthObject->IgnoreParenImpCasts());
+
+          if (LengthDRE && LengthDRE->getDecl() == SourceDRE->getDecl()) {
+            isFullCopy = true;
+          }
+        }
+      }
+    }
+    if (isFullCopy) {
+      if (IsSameVar) {
+        // Remove redundant self-copy, including the semicolon
+        SourceLocation EndLoc = Assignment->getEndLoc();
+        while (EndLoc.isValid()) {
+          const char *endPtr = Result.SourceManager->getCharacterData(EndLoc);
+          if (*endPtr == ';')
+            break;
+          EndLoc = Lexer::getLocForEndOfToken(EndLoc, 0, *Result.SourceManager,
+                                              Result.Context->getLangOpts());
+        }
+        if (EndLoc.isValid()) {
+          diag(Assignment->getBeginLoc(), "redundant self-copy")
+              << FixItHint::CreateRemoval(CharSourceRange::getCharRange(
+                     Assignment->getBeginLoc(),
+                     EndLoc.getLocWithOffset(
+                         1))); // +1 to include the semicolon.
+        }
+      } else {
+        // Simplify copy between different variables
+        std::string Replacement = TargetDRE->getNameInfo().getAsString() +
+                                  " = " +
+                                  SourceDRE->getNameInfo().getAsString();
+        diag(Assignment->getBeginLoc(), "prefer direct copy over substr")
+            << FixItHint::CreateReplacement(Assignment->getSourceRange(),
+                                            Replacement);
+      }
+
+      return;
     }
   }
 }
diff --git 
a/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst 
b/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst
index f29bcbacc0d7d1..167d4f30cca8c3 100644
--- 
a/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst
+++ 
b/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst
@@ -13,4 +13,6 @@ Expression                                   Replacement
 ===========================================  =======================
 ``sv = sv.substr(n)``                        ``sv.remove_prefix(n)``
 ``sv = sv.substr(0, sv.length()-n)``         ``sv.remove_suffix(n)``
+``sv = sv.substr(0, sv.length())``           _Redundant self-copy_
+``sv1 = sv.substr(0, sv.length())``          ``sv1 = sv``
 ===========================================  =======================
diff --git 
a/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp 
b/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp
index 2c1d9df3711b1d..908c664e329b2f 100644
--- 
a/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp
+++ 
b/clang-tools-extra/test/clang-tidy/checkers/readability/stringview_substr.cpp
@@ -12,59 +12,62 @@ class basic_string_view {
   void remove_prefix(size_type n) {}
   void remove_suffix(size_type n) {}
   size_type length() const { return 0; }
-
-  // Needed for assignment operator
   basic_string_view& operator=(const basic_string_view&) { return *this; }
 };
 
 using string_view = basic_string_view<char>;
-}
+} // namespace std
 
-void test() {
+void test_basic() {
   std::string_view sv("test");
   std::string_view sv1("test");
-  std::string_view sv2("other");
+  std::string_view sv2("test");
 
-  // Should match: Removing N characters from start
+  // Should match: remove_prefix
   sv = sv.substr(5);
   // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_prefix' over 
'substr' for removing characters from the start [readability-stringview-substr]
   // CHECK-FIXES: sv.remove_prefix(5)
 
-  // Should match: Removing N characters from end
+  // Should match: remove_suffix
   sv = sv.substr(0, sv.length() - 3);
   // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
   // CHECK-FIXES: sv.remove_suffix(3)
 
-  // Should not match: Basic substring operations
-  sv = sv.substr(0, 3);  // No warning - taking first N characters
-  sv = sv.substr(1, 3);  // No warning - taking N characters from position 1
-  
-  // Should not match: Operations on different string_views
-  sv = sv2.substr(0, sv2.length() - 3);  // No warning - not self-assignment
-  sv = sv.substr(0, sv2.length() - 3);   // No warning - length() from 
different string_view
-  sv1 = sv1.substr(0, sv2.length() - 3); // No warning - length() from 
different string_view
-  sv = sv1.substr(0, sv1.length() - 3);  // No warning - not self-assignment
-
-  // Should not match: Not actually removing from end
-  sv = sv.substr(0, sv.length());       // No warning - keeping entire string
-  sv = sv.substr(0, sv.length() - 0);   // No warning - subtracting zero
-  
-  // Should not match: Complex expressions
-  sv = sv.substr(0, sv.length() - (3 + 2));  // No warning - complex arithmetic
-  sv = sv.substr(1 + 2, sv.length() - 3);    // No warning - complex start 
position
+  // Should match: remove_suffix with complex expression
+  sv = sv.substr(0, sv.length() - (3 + 2));
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
+  // CHECK-FIXES: sv.remove_suffix((3 + 2))
+}
+
+void test_copies() {
+  std::string_view sv("test");
+  std::string_view sv1("test");
+  std::string_view sv2("test");
+
+  // Should match: remove redundant self copies
+  sv = sv.substr(0, sv.length());
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: redundant self-copy 
[readability-stringview-substr]
+
+  sv = sv.substr(0, sv.length() - 0);
+    // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: redundant self-copy 
[readability-stringview-substr]
+
+  // Should match: simplify copies between different variables
+  sv1 = sv.substr(0, sv.length());
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer direct copy over substr 
[readability-stringview-substr]
+  // CHECK-FIXES: sv1 = sv
+
+  sv2 = sv.substr(0, sv.length() - 0);
+  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer direct copy over substr 
[readability-stringview-substr]
+  // CHECK-FIXES: sv2 = sv
 }
 
-void test_zeros() {
+void test_zero_forms() {
   std::string_view sv("test");
   const int kZero = 0;
-  constexpr std::string_view::size_type Zero = 0;  // Fixed: using 
string_view::size_type
+  constexpr std::string_view::size_type Zero = 0;
   #define START_POS 0
-  
-  // All of these should match remove_suffix pattern and trigger warnings
-  sv = sv.substr(0, sv.length() - 3);
-  // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
-  // CHECK-FIXES: sv.remove_suffix(3)
 
+  // Should match: various forms of zero in first argument
   sv = sv.substr(kZero, sv.length() - 3);
   // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
   // CHECK-FIXES: sv.remove_suffix(3)
@@ -88,9 +91,18 @@ void test_zeros() {
   sv = sv.substr(0UL, sv.length() - 3);
   // CHECK-MESSAGES: :[[@LINE-1]]:3: warning: prefer 'remove_suffix' over 
'substr' for removing characters from the end [readability-stringview-substr]
   // CHECK-FIXES: sv.remove_suffix(3)
-
-  // These should NOT match the remove_suffix pattern
-  sv = sv.substr(1-1, sv.length() - 3);  // No warning - complex expression
-  sv = sv.substr(sv.length() - 3, sv.length() - 3);  // No warning - non-zero 
start
 }
 
+void test_should_not_match() {
+  std::string_view sv("test");
+  std::string_view sv1("test");
+  std::string_view sv2("test");
+
+  // No match: substr used for prefix or mid-view
+  sv = sv.substr(1, sv.length() - 3); // No warning
+
+  // No match: Different string_views
+  sv = sv2.substr(0, sv2.length() - 3); // No warning
+
+  
+}

>From aa01bc040241a18de12d261bba60836f66b55839 Mon Sep 17 00:00:00 2001
From: Helmut Januschka <hel...@januschka.com>
Date: Mon, 16 Dec 2024 21:43:25 +0100
Subject: [PATCH 4/4] up

---
 .../docs/clang-tidy/checks/readability/string-view-substr.rst   | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git 
a/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst 
b/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst
index 167d4f30cca8c3..c4e25a1d621c8f 100644
--- 
a/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst
+++ 
b/clang-tools-extra/docs/clang-tidy/checks/readability/string-view-substr.rst
@@ -13,6 +13,6 @@ Expression                                   Replacement
 ===========================================  =======================
 ``sv = sv.substr(n)``                        ``sv.remove_prefix(n)``
 ``sv = sv.substr(0, sv.length()-n)``         ``sv.remove_suffix(n)``
-``sv = sv.substr(0, sv.length())``           _Redundant self-copy_
+``sv = sv.substr(0, sv.length())``           Redundant self-copy
 ``sv1 = sv.substr(0, sv.length())``          ``sv1 = sv``
 ===========================================  =======================

_______________________________________________
cfe-commits mailing list
cfe-commits@lists.llvm.org
https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits

Reply via email to