2018-08-22 21:58:25 +08:00
|
|
|
//===--- FasterStrsplitDelimiterCheck.cpp - clang-tidy---------------------===//
|
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2018-08-22 21:58:25 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "FasterStrsplitDelimiterCheck.h"
|
|
|
|
#include "clang/AST/ASTContext.h"
|
|
|
|
#include "clang/ASTMatchers/ASTMatchFinder.h"
|
2019-07-09 19:04:04 +08:00
|
|
|
#include "clang/Tooling/FixIt.h"
|
2018-08-22 21:58:25 +08:00
|
|
|
|
|
|
|
using namespace clang::ast_matchers;
|
|
|
|
|
|
|
|
namespace clang {
|
|
|
|
namespace tidy {
|
|
|
|
namespace abseil {
|
|
|
|
|
|
|
|
namespace {
|
|
|
|
|
|
|
|
AST_MATCHER(StringLiteral, lengthIsOne) { return Node.getLength() == 1; }
|
|
|
|
|
2019-07-09 19:04:04 +08:00
|
|
|
llvm::Optional<std::string> makeCharacterLiteral(const StringLiteral *Literal,
|
|
|
|
const ASTContext &Context) {
|
|
|
|
assert(Literal->getLength() == 1 &&
|
|
|
|
"Only single character string should be matched");
|
|
|
|
assert(Literal->getCharByteWidth() == 1 &&
|
|
|
|
"StrSplit doesn't support wide char");
|
|
|
|
std::string Result = clang::tooling::fixit::getText(*Literal, Context).str();
|
|
|
|
bool IsRawStringLiteral = StringRef(Result).startswith(R"(R")");
|
|
|
|
// Since raw string literal might contain unescaped non-printable characters,
|
|
|
|
// we normalize them using `StringLiteral::outputString`.
|
|
|
|
if (IsRawStringLiteral) {
|
|
|
|
Result.clear();
|
2018-08-22 21:58:25 +08:00
|
|
|
llvm::raw_string_ostream Stream(Result);
|
|
|
|
Literal->outputString(Stream);
|
|
|
|
}
|
|
|
|
// Special case: If the string contains a single quote, we just need to return
|
|
|
|
// a character of the single quote. This is a special case because we need to
|
|
|
|
// escape it in the character literal.
|
|
|
|
if (Result == R"("'")")
|
|
|
|
return std::string(R"('\'')");
|
|
|
|
|
|
|
|
// Now replace the " with '.
|
2019-07-09 19:04:04 +08:00
|
|
|
std::string::size_type Pos = Result.find_first_of('"');
|
2018-08-22 21:58:25 +08:00
|
|
|
if (Pos == Result.npos)
|
|
|
|
return llvm::None;
|
|
|
|
Result[Pos] = '\'';
|
|
|
|
Pos = Result.find_last_of('"');
|
|
|
|
if (Pos == Result.npos)
|
|
|
|
return llvm::None;
|
|
|
|
Result[Pos] = '\'';
|
|
|
|
return Result;
|
|
|
|
}
|
|
|
|
|
|
|
|
} // anonymous namespace
|
|
|
|
|
|
|
|
void FasterStrsplitDelimiterCheck::registerMatchers(MatchFinder *Finder) {
|
|
|
|
// Binds to one character string literals.
|
|
|
|
const auto SingleChar =
|
|
|
|
expr(ignoringParenCasts(stringLiteral(lengthIsOne()).bind("Literal")));
|
|
|
|
|
|
|
|
// Binds to a string_view (either absl or std) that was passed by value and
|
2020-01-04 23:28:41 +08:00
|
|
|
// constructed from string literal.
|
2019-06-13 23:16:44 +08:00
|
|
|
auto StringViewArg = ignoringElidableConstructorCall(ignoringImpCasts(
|
|
|
|
cxxConstructExpr(hasType(recordDecl(hasName("::absl::string_view"))),
|
|
|
|
hasArgument(0, ignoringParenImpCasts(SingleChar)))));
|
2018-08-22 21:58:25 +08:00
|
|
|
|
2019-06-13 23:16:44 +08:00
|
|
|
// Need to ignore the elidable constructor as otherwise there is no match for
|
|
|
|
// c++14 and earlier.
|
2018-08-22 21:58:25 +08:00
|
|
|
auto ByAnyCharArg =
|
2019-06-13 23:16:44 +08:00
|
|
|
expr(has(ignoringElidableConstructorCall(
|
|
|
|
ignoringParenCasts(cxxBindTemporaryExpr(has(cxxConstructExpr(
|
|
|
|
hasType(recordDecl(hasName("::absl::ByAnyChar"))),
|
|
|
|
hasArgument(0, StringViewArg))))))))
|
2018-08-22 21:58:25 +08:00
|
|
|
.bind("ByAnyChar");
|
|
|
|
|
|
|
|
// Find uses of absl::StrSplit(..., "x") and absl::StrSplit(...,
|
|
|
|
// absl::ByAnyChar("x")) to transform them into absl::StrSplit(..., 'x').
|
2019-11-12 23:15:56 +08:00
|
|
|
Finder->addMatcher(
|
2020-12-11 07:52:35 +08:00
|
|
|
traverse(TK_AsIs,
|
2019-11-12 23:15:56 +08:00
|
|
|
callExpr(callee(functionDecl(hasName("::absl::StrSplit"))),
|
|
|
|
hasArgument(1, anyOf(ByAnyCharArg, SingleChar)),
|
|
|
|
unless(isInTemplateInstantiation()))
|
|
|
|
.bind("StrSplit")),
|
|
|
|
this);
|
2018-08-22 21:58:25 +08:00
|
|
|
|
|
|
|
// Find uses of absl::MaxSplits("x", N) and
|
|
|
|
// absl::MaxSplits(absl::ByAnyChar("x"), N) to transform them into
|
|
|
|
// absl::MaxSplits('x', N).
|
|
|
|
Finder->addMatcher(
|
2020-12-11 07:52:35 +08:00
|
|
|
traverse(TK_AsIs,
|
2019-11-12 23:15:56 +08:00
|
|
|
callExpr(callee(functionDecl(hasName("::absl::MaxSplits"))),
|
|
|
|
hasArgument(0, anyOf(ByAnyCharArg,
|
|
|
|
ignoringParenCasts(SingleChar))),
|
|
|
|
unless(isInTemplateInstantiation()))),
|
2018-08-22 21:58:25 +08:00
|
|
|
this);
|
|
|
|
}
|
|
|
|
|
|
|
|
void FasterStrsplitDelimiterCheck::check(
|
|
|
|
const MatchFinder::MatchResult &Result) {
|
|
|
|
const auto *Literal = Result.Nodes.getNodeAs<StringLiteral>("Literal");
|
|
|
|
|
|
|
|
if (Literal->getBeginLoc().isMacroID() || Literal->getEndLoc().isMacroID())
|
|
|
|
return;
|
|
|
|
|
2019-07-09 19:04:04 +08:00
|
|
|
llvm::Optional<std::string> Replacement =
|
|
|
|
makeCharacterLiteral(Literal, *Result.Context);
|
2018-08-22 21:58:25 +08:00
|
|
|
if (!Replacement)
|
|
|
|
return;
|
|
|
|
SourceRange Range = Literal->getSourceRange();
|
|
|
|
|
|
|
|
if (const auto *ByAnyChar = Result.Nodes.getNodeAs<Expr>("ByAnyChar"))
|
|
|
|
Range = ByAnyChar->getSourceRange();
|
|
|
|
|
|
|
|
diag(
|
|
|
|
Literal->getBeginLoc(),
|
|
|
|
"%select{absl::StrSplit()|absl::MaxSplits()}0 called with a string "
|
|
|
|
"literal "
|
|
|
|
"consisting of a single character; consider using the character overload")
|
|
|
|
<< (Result.Nodes.getNodeAs<CallExpr>("StrSplit") ? 0 : 1)
|
|
|
|
<< FixItHint::CreateReplacement(CharSourceRange::getTokenRange(Range),
|
|
|
|
*Replacement);
|
|
|
|
}
|
|
|
|
|
|
|
|
} // namespace abseil
|
|
|
|
} // namespace tidy
|
|
|
|
} // namespace clang
|