2016-03-28 00:43:44 +08:00
|
|
|
//===--- RawStringLiteralCheck.cpp - clang-tidy----------------------------===//
|
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "RawStringLiteralCheck.h"
|
|
|
|
#include "clang/AST/ASTContext.h"
|
|
|
|
#include "clang/ASTMatchers/ASTMatchFinder.h"
|
|
|
|
#include "clang/Lex/Lexer.h"
|
|
|
|
|
|
|
|
using namespace clang::ast_matchers;
|
|
|
|
|
|
|
|
namespace clang {
|
|
|
|
namespace tidy {
|
|
|
|
namespace modernize {
|
|
|
|
|
|
|
|
namespace {
|
|
|
|
|
|
|
|
bool containsEscapes(StringRef HayStack, StringRef Escapes) {
|
|
|
|
size_t BackSlash = HayStack.find('\\');
|
|
|
|
if (BackSlash == StringRef::npos)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
while (BackSlash != StringRef::npos) {
|
|
|
|
if (Escapes.find(HayStack[BackSlash + 1]) == StringRef::npos)
|
|
|
|
return false;
|
|
|
|
BackSlash = HayStack.find('\\', BackSlash + 2);
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool isRawStringLiteral(StringRef Text) {
|
|
|
|
// Already a raw string literal if R comes before ".
|
|
|
|
const size_t QuotePos = Text.find('"');
|
|
|
|
assert(QuotePos != StringRef::npos);
|
|
|
|
return (QuotePos > 0) && (Text[QuotePos - 1] == 'R');
|
|
|
|
}
|
|
|
|
|
|
|
|
bool containsEscapedCharacters(const MatchFinder::MatchResult &Result,
|
|
|
|
const StringLiteral *Literal) {
|
|
|
|
// FIXME: Handle L"", u8"", u"" and U"" literals.
|
|
|
|
if (!Literal->isAscii())
|
|
|
|
return false;
|
|
|
|
|
|
|
|
StringRef Bytes = Literal->getBytes();
|
|
|
|
// Non-printing characters disqualify this literal:
|
|
|
|
// \007 = \a bell
|
|
|
|
// \010 = \b backspace
|
|
|
|
// \011 = \t horizontal tab
|
|
|
|
// \012 = \n new line
|
|
|
|
// \013 = \v vertical tab
|
|
|
|
// \014 = \f form feed
|
|
|
|
// \015 = \r carriage return
|
|
|
|
// \177 = delete
|
|
|
|
if (Bytes.find_first_of(StringRef("\000\001\002\003\004\005\006\a"
|
|
|
|
"\b\t\n\v\f\r\016\017"
|
|
|
|
"\020\021\022\023\024\025\026\027"
|
|
|
|
"\030\031\032\033\034\035\036\037"
|
|
|
|
"\177",
|
|
|
|
33)) != StringRef::npos)
|
|
|
|
return false;
|
|
|
|
|
|
|
|
CharSourceRange CharRange = Lexer::makeFileCharRange(
|
|
|
|
CharSourceRange::getTokenRange(Literal->getSourceRange()),
|
|
|
|
*Result.SourceManager, Result.Context->getLangOpts());
|
|
|
|
StringRef Text = Lexer::getSourceText(CharRange, *Result.SourceManager,
|
|
|
|
Result.Context->getLangOpts());
|
|
|
|
if (isRawStringLiteral(Text))
|
|
|
|
return false;
|
|
|
|
|
|
|
|
return containsEscapes(Text, R"('\"?x01)");
|
|
|
|
}
|
|
|
|
|
|
|
|
bool containsDelimiter(StringRef Bytes, const std::string &Delimiter) {
|
|
|
|
return Bytes.find(Delimiter.empty()
|
|
|
|
? std::string(R"lit()")lit")
|
|
|
|
: (")" + Delimiter + R"(")")) != StringRef::npos;
|
|
|
|
}
|
|
|
|
|
|
|
|
std::string asRawStringLiteral(const StringLiteral *Literal,
|
|
|
|
const std::string &DelimiterStem) {
|
|
|
|
const StringRef Bytes = Literal->getBytes();
|
|
|
|
std::string Delimiter;
|
|
|
|
for (int I = 0; containsDelimiter(Bytes, Delimiter); ++I) {
|
|
|
|
Delimiter = (I == 0) ? DelimiterStem : DelimiterStem + std::to_string(I);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Delimiter.empty())
|
|
|
|
return (R"(R"()" + Bytes + R"lit()")lit").str();
|
|
|
|
|
|
|
|
return (R"(R")" + Delimiter + "(" + Bytes + ")" + Delimiter + R"(")").str();
|
|
|
|
}
|
|
|
|
|
|
|
|
} // namespace
|
|
|
|
|
|
|
|
RawStringLiteralCheck::RawStringLiteralCheck(StringRef Name,
|
|
|
|
ClangTidyContext *Context)
|
|
|
|
: ClangTidyCheck(Name, Context),
|
|
|
|
DelimiterStem(Options.get("DelimiterStem", "lit")) {}
|
|
|
|
|
|
|
|
void RawStringLiteralCheck::storeOptions(ClangTidyOptions::OptionMap &Options) {
|
|
|
|
ClangTidyCheck::storeOptions(Options);
|
|
|
|
}
|
|
|
|
|
|
|
|
void RawStringLiteralCheck::registerMatchers(MatchFinder *Finder) {
|
2016-04-21 22:39:12 +08:00
|
|
|
Finder->addMatcher(
|
|
|
|
stringLiteral(unless(hasParent(predefinedExpr()))).bind("lit"), this);
|
2016-03-28 00:43:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void RawStringLiteralCheck::check(const MatchFinder::MatchResult &Result) {
|
|
|
|
// Raw string literals require C++11 or later.
|
|
|
|
if (!Result.Context->getLangOpts().CPlusPlus11)
|
|
|
|
return;
|
|
|
|
|
|
|
|
const auto *Literal = Result.Nodes.getNodeAs<StringLiteral>("lit");
|
|
|
|
if (Literal->getLocStart().isMacroID())
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (containsEscapedCharacters(Result, Literal))
|
|
|
|
replaceWithRawStringLiteral(Result, Literal);
|
|
|
|
}
|
|
|
|
|
|
|
|
void RawStringLiteralCheck::replaceWithRawStringLiteral(
|
|
|
|
const MatchFinder::MatchResult &Result, const StringLiteral *Literal) {
|
|
|
|
CharSourceRange CharRange = Lexer::makeFileCharRange(
|
|
|
|
CharSourceRange::getTokenRange(Literal->getSourceRange()),
|
|
|
|
*Result.SourceManager, Result.Context->getLangOpts());
|
|
|
|
diag(Literal->getLocStart(),
|
|
|
|
"escaped string literal can be written as a raw string literal")
|
|
|
|
<< FixItHint::CreateReplacement(
|
|
|
|
CharRange, asRawStringLiteral(Literal, DelimiterStem));
|
|
|
|
}
|
|
|
|
|
|
|
|
} // namespace modernize
|
|
|
|
} // namespace tidy
|
|
|
|
} // namespace clang
|