2017-04-18 15:46:39 +08:00
|
|
|
//===--- InefficientVectorOperationCheck.cpp - clang-tidy------------------===//
|
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2017-04-18 15:46:39 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "InefficientVectorOperationCheck.h"
|
|
|
|
#include "clang/AST/ASTContext.h"
|
|
|
|
#include "clang/ASTMatchers/ASTMatchFinder.h"
|
|
|
|
#include "clang/Lex/Lexer.h"
|
|
|
|
#include "../utils/DeclRefExprUtils.h"
|
2017-04-27 02:13:05 +08:00
|
|
|
#include "../utils/OptionsUtils.h"
|
2017-04-18 15:46:39 +08:00
|
|
|
|
|
|
|
using namespace clang::ast_matchers;
|
|
|
|
|
|
|
|
namespace clang {
|
|
|
|
namespace tidy {
|
|
|
|
namespace performance {
|
|
|
|
|
|
|
|
namespace {
|
|
|
|
|
|
|
|
// Binding identifiers shared by registerMatchers() and check().
//
// As a running example, consider:
//
// \code
//   void f() {
//     vector<T> v;
//     for (int i = 0; i < 10 + 1; ++i) {
//       v.push_back(i);
//     }
//   }
// \endcode
//
// Each identifier below is bound to the following AST node:
//   - LoopCounterName: the whole counter-based for loop (a ForStmt).
//   - LoopParentName: the body of function f (a CompoundStmt).
//   - VectorVarDeclName: the variable 'v' (a VarDecl).
//   - VectorVarDeclStmtName: the whole 'vector<T> v;' statement (a DeclStmt).
//   - PushBackOrEmplaceBackCallName: 'v.push_back(i)' (a CXXMemberCallExpr).
//   - LoopInitVarName: the loop variable 'i' (a VarDecl).
//   - LoopEndExprName: the loop bound '10 + 1' (an Expr).
//   - RangeLoopName: the whole range-based for loop (a CXXForRangeStmt); it is
//     used instead of LoopCounterName when the loop is written as
//     'for (const auto &E : data)'.
constexpr char LoopCounterName[] = "for_loop_counter";
constexpr char LoopParentName[] = "loop_parent";
constexpr char VectorVarDeclName[] = "vector_var_decl";
constexpr char VectorVarDeclStmtName[] = "vector_var_decl_stmt";
constexpr char PushBackOrEmplaceBackCallName[] = "append_call";
constexpr char LoopInitVarName[] = "loop_init_var";
constexpr char LoopEndExprName[] = "loop_end_expr";
constexpr char RangeLoopName[] = "for_range_loop";
|
|
|
|
|
|
|
|
/// Returns a matcher for expressions whose type is one of the standard
/// containers listed below. registerMatchers() applies it to the range
/// expression of a range-based for loop.
ast_matchers::internal::Matcher<Expr> supportedContainerTypesMatcher() {
  const auto SupportedContainerDecl = cxxRecordDecl(
      hasAnyName("::std::vector", "::std::set", "::std::unordered_set",
                 "::std::map", "::std::unordered_map", "::std::array",
                 "::std::deque"));
  return hasType(SupportedContainerDecl);
}
|
|
|
|
|
2017-04-18 15:46:39 +08:00
|
|
|
} // namespace
|
|
|
|
|
2017-04-27 02:13:05 +08:00
|
|
|
/// Constructs the check and reads the "VectorLikeClasses" option, a string
/// list that defaults to "::std::vector". The parsed names are the classes
/// that registerMatchers() treats as vectors.
InefficientVectorOperationCheck::InefficientVectorOperationCheck(
    StringRef Name, ClangTidyContext *Context)
    : ClangTidyCheck(Name, Context),
      VectorLikeClasses(utils::options::parseStringList(
          Options.get("VectorLikeClasses", "::std::vector"))) {}
|
|
|
|
|
|
|
|
/// Writes the current "VectorLikeClasses" list back into \p Opts in its
/// serialized string form.
void InefficientVectorOperationCheck::storeOptions(
    ClangTidyOptions::OptionMap &Opts) {
  const std::string SerializedClasses =
      utils::options::serializeStringList(VectorLikeClasses);
  Options.store(Opts, "VectorLikeClasses", SerializedClasses);
}
|
|
|
|
|
2017-04-18 15:46:39 +08:00
|
|
|
/// Registers two matchers with \p Finder: one for counter-based for loops and
/// one for range-based for loops. Both require that the loop body consists of
/// a single push_back/emplace_back call on a default-constructed vector-like
/// variable, and that the variable's declaration statement is a direct child
/// of the compound statement that is the loop's parent.
void InefficientVectorOperationCheck::registerMatchers(MatchFinder *Finder) {
  // --- The vector variable and the append call on it. ---

  // Any class named in the "VectorLikeClasses" option.
  const auto VectorLikeRecord =
      cxxRecordDecl(hasAnyName(SmallVector<StringRef, 5>(
          VectorLikeClasses.begin(), VectorLikeClasses.end())));

  // A construction of such a class through its default constructor.
  const auto DefaultConstructedVector = cxxConstructExpr(
      hasType(VectorLikeRecord),
      hasDeclaration(cxxConstructorDecl(isDefaultConstructor())));

  // The variable initialized by that default construction.
  const auto TargetVectorVar =
      varDecl(hasInitializer(DefaultConstructedVector))
          .bind(VectorVarDeclName);

  // 'v.push_back(...)' / 'v.emplace_back(...)' where 'v' refers directly to
  // the variable above.
  const auto BoundAppendCall =
      cxxMemberCallExpr(
          callee(cxxMethodDecl(hasAnyName("push_back", "emplace_back"))),
          on(hasType(VectorLikeRecord)),
          onImplicitObjectArgument(declRefExpr(to(TargetVectorVar))))
          .bind(PushBackOrEmplaceBackCallName);
  const auto AppendStatement = expr(ignoringImplicit(BoundAppendCall));

  // The declaration statement that declares exactly the bound vector
  // variable. It relies on VectorVarDeclName already being bound, so it must
  // be evaluated after the loop-body matcher.
  const auto VectorDeclStatement =
      declStmt(hasSingleDecl(equalsBoundNode(VectorVarDeclName)))
          .bind(VectorVarDeclStmtName);

  // --- Pieces of the counter-based loop header. ---

  // 'T i = 0' as the only declaration of the init statement.
  const auto ZeroInitializedCounter =
      declStmt(hasSingleDecl(varDecl(hasInitializer(integerLiteral(equals(0))))
                                 .bind(LoopInitVarName)));

  // A reference to the loop counter, ignoring parentheses and implicit casts.
  const auto CounterRef = ignoringParenImpCasts(
      declRefExpr(to(varDecl(equalsBoundNode(LoopInitVarName)))));

  // 'i < End', where End does not mention the counter in any descendant.
  const auto CounterLessThanEnd = binaryOperator(
      hasOperatorName("<"), hasLHS(CounterRef),
      hasRHS(expr(unless(hasDescendant(expr(CounterRef))))
                 .bind(LoopEndExprName)));

  // '++i' or 'i++'.
  const auto CounterIncrement =
      unaryOperator(hasOperatorName("++"), hasUnaryOperand(CounterRef));

  // --- Constraints shared by both loop kinds. ---

  // The loop body is either the append call itself or a compound statement
  // holding exactly one statement, which is the append call.
  const auto BodyIsSingleAppend =
      hasBody(anyOf(compoundStmt(statementCountIs(1), has(AppendStatement)),
                    AppendStatement));

  // The loop's parent is a compound statement that has the vector's
  // declaration statement as a child.
  const auto ParentDeclaresVector =
      hasParent(compoundStmt(has(VectorDeclStatement)).bind(LoopParentName));

  // Counter-based for loops:
  //   for (int i = 0; i < n; ++i) { v.push_back(...); }
  //
  // FIXME: Support more types of counter-based loops like decrement loops.
  const auto CounterLoop =
      forStmt(hasLoopInit(ZeroInitializedCounter),
              hasCondition(CounterLessThanEnd),
              hasIncrement(CounterIncrement), BodyIsSingleAppend,
              ParentDeclaresVector)
          .bind(LoopCounterName);
  Finder->addMatcher(CounterLoop, this);

  // Range-based for loops:
  //   for (const auto& E : data) { v.push_back(...); }
  //
  // FIXME: Support more complex range-expressions.
  const auto RangeBasedLoop =
      cxxForRangeStmt(
          hasRangeInit(declRefExpr(supportedContainerTypesMatcher())),
          BodyIsSingleAppend, ParentDeclaresVector)
          .bind(RangeLoopName);
  Finder->addMatcher(RangeBasedLoop, this);
}
|
|
|
|
|
|
|
|
void InefficientVectorOperationCheck::check(
|
|
|
|
const MatchFinder::MatchResult &Result) {
|
2017-04-19 04:47:34 +08:00
|
|
|
auto* Context = Result.Context;
|
|
|
|
if (Context->getDiagnostics().hasUncompilableErrorOccurred())
|
2017-04-18 15:46:39 +08:00
|
|
|
return;
|
|
|
|
|
|
|
|
const SourceManager &SM = *Result.SourceManager;
|
2017-04-27 02:13:05 +08:00
|
|
|
const auto *VectorVarDecl =
|
|
|
|
Result.Nodes.getNodeAs<VarDecl>(VectorVarDeclName);
|
2017-04-18 15:46:39 +08:00
|
|
|
const auto *ForLoop = Result.Nodes.getNodeAs<ForStmt>(LoopCounterName);
|
2017-04-27 02:13:05 +08:00
|
|
|
const auto *RangeLoop =
|
|
|
|
Result.Nodes.getNodeAs<CXXForRangeStmt>(RangeLoopName);
|
2017-05-16 18:39:55 +08:00
|
|
|
const auto *VectorAppendCall =
|
|
|
|
Result.Nodes.getNodeAs<CXXMemberCallExpr>(PushBackOrEmplaceBackCallName);
|
2017-04-18 15:46:39 +08:00
|
|
|
const auto *LoopEndExpr = Result.Nodes.getNodeAs<Expr>(LoopEndExprName);
|
|
|
|
const auto *LoopParent = Result.Nodes.getNodeAs<CompoundStmt>(LoopParentName);
|
2017-04-27 02:13:05 +08:00
|
|
|
|
|
|
|
const Stmt *LoopStmt = ForLoop;
|
|
|
|
if (!LoopStmt)
|
|
|
|
LoopStmt = RangeLoop;
|
2017-04-18 15:46:39 +08:00
|
|
|
|
|
|
|
llvm::SmallPtrSet<const DeclRefExpr *, 16> AllVectorVarRefs =
|
|
|
|
utils::decl_ref_expr::allDeclRefExprs(*VectorVarDecl, *LoopParent,
|
2017-04-19 04:47:34 +08:00
|
|
|
*Context);
|
2017-04-18 15:46:39 +08:00
|
|
|
for (const auto *Ref : AllVectorVarRefs) {
|
|
|
|
// Skip cases where there are usages (defined as DeclRefExpr that refers to
|
|
|
|
// "v") of vector variable `v` before the for loop. We consider these usages
|
|
|
|
// are operations causing memory preallocation (e.g. "v.resize(n)",
|
|
|
|
// "v.reserve(n)").
|
|
|
|
//
|
|
|
|
// FIXME: make it more intelligent to identify the pre-allocating operations
|
|
|
|
// before the for loop.
|
|
|
|
if (SM.isBeforeInTranslationUnit(Ref->getLocation(),
|
2018-08-10 06:42:26 +08:00
|
|
|
LoopStmt->getBeginLoc())) {
|
2017-04-18 15:46:39 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-04-19 04:47:34 +08:00
|
|
|
llvm::StringRef VectorVarName = Lexer::getSourceText(
|
2017-04-18 15:46:39 +08:00
|
|
|
CharSourceRange::getTokenRange(
|
2017-05-16 18:39:55 +08:00
|
|
|
VectorAppendCall->getImplicitObjectArgument()->getSourceRange()),
|
2017-04-19 04:47:34 +08:00
|
|
|
SM, Context->getLangOpts());
|
2017-04-18 15:46:39 +08:00
|
|
|
|
2017-04-27 02:13:05 +08:00
|
|
|
std::string ReserveStmt;
|
|
|
|
// Handle for-range loop cases.
|
|
|
|
if (RangeLoop) {
|
|
|
|
// Get the range-expression in a for-range statement represented as
|
|
|
|
// `for (range-declarator: range-expression)`.
|
|
|
|
StringRef RangeInitExpName = Lexer::getSourceText(
|
|
|
|
CharSourceRange::getTokenRange(
|
|
|
|
RangeLoop->getRangeInit()->getSourceRange()),
|
|
|
|
SM, Context->getLangOpts());
|
|
|
|
|
|
|
|
ReserveStmt =
|
|
|
|
(VectorVarName + ".reserve(" + RangeInitExpName + ".size()" + ");\n")
|
|
|
|
.str();
|
|
|
|
} else if (ForLoop) {
|
|
|
|
// Handle counter-based loop cases.
|
|
|
|
StringRef LoopEndSource = Lexer::getSourceText(
|
|
|
|
CharSourceRange::getTokenRange(LoopEndExpr->getSourceRange()), SM,
|
|
|
|
Context->getLangOpts());
|
|
|
|
ReserveStmt = (VectorVarName + ".reserve(" + LoopEndSource + ");\n").str();
|
|
|
|
}
|
|
|
|
|
2017-05-16 18:39:55 +08:00
|
|
|
auto Diag =
|
2018-08-10 06:42:26 +08:00
|
|
|
diag(VectorAppendCall->getBeginLoc(),
|
2017-05-16 18:39:55 +08:00
|
|
|
"%0 is called inside a loop; "
|
|
|
|
"consider pre-allocating the vector capacity before the loop")
|
|
|
|
<< VectorAppendCall->getMethodDecl()->getDeclName();
|
2017-04-27 02:13:05 +08:00
|
|
|
|
|
|
|
if (!ReserveStmt.empty())
|
2018-08-10 06:42:26 +08:00
|
|
|
Diag << FixItHint::CreateInsertion(LoopStmt->getBeginLoc(), ReserveStmt);
|
2017-04-18 15:46:39 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
} // namespace performance
|
|
|
|
} // namespace tidy
|
|
|
|
} // namespace clang
|