// Forked from OSchip/llvm-project (C++ source, 428 lines, 16 KiB).
//===-- IncludeFixer.cpp - Include inserter based on sema callbacks -------===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "IncludeFixer.h"
|
|
#include "clang/Format/Format.h"
|
|
#include "clang/Frontend/CompilerInstance.h"
|
|
#include "clang/Lex/HeaderSearch.h"
|
|
#include "clang/Lex/Preprocessor.h"
|
|
#include "clang/Parse/ParseAST.h"
|
|
#include "clang/Sema/ExternalSemaSource.h"
|
|
#include "clang/Sema/Sema.h"
|
|
#include "llvm/Support/Debug.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
|
|
#define DEBUG_TYPE "include-fixer"
|
|
|
|
using namespace clang;
|
|
|
|
namespace clang {
|
|
namespace include_fixer {
|
|
namespace {
|
|
|
|
class Action;
|
|
|
|
class PreprocessorHooks : public clang::PPCallbacks {
|
|
public:
|
|
explicit PreprocessorHooks(Action *EnclosingPass)
|
|
: EnclosingPass(EnclosingPass), TrackedFile(nullptr) {}
|
|
|
|
void FileChanged(clang::SourceLocation loc,
|
|
clang::PPCallbacks::FileChangeReason reason,
|
|
clang::SrcMgr::CharacteristicKind file_type,
|
|
clang::FileID prev_fid) override;
|
|
|
|
void InclusionDirective(clang::SourceLocation HashLocation,
|
|
const clang::Token &IncludeToken,
|
|
llvm::StringRef FileName, bool IsAngled,
|
|
clang::CharSourceRange FileNameRange,
|
|
const clang::FileEntry *IncludeFile,
|
|
llvm::StringRef SearchPath,
|
|
llvm::StringRef relative_path,
|
|
const clang::Module *imported) override;
|
|
|
|
private:
|
|
/// The current Action.
|
|
Action *EnclosingPass;
|
|
|
|
/// The current FileEntry.
|
|
const clang::FileEntry *TrackedFile;
|
|
};
|
|
|
|
/// Manages the parse, gathers include suggestions.
|
|
class Action : public clang::ASTFrontendAction,
|
|
public clang::ExternalSemaSource {
|
|
public:
|
|
explicit Action(SymbolIndexManager &SymbolIndexMgr, StringRef StyleName,
|
|
bool MinimizeIncludePaths)
|
|
: SymbolIndexMgr(SymbolIndexMgr), FallbackStyle(StyleName),
|
|
MinimizeIncludePaths(MinimizeIncludePaths) {}
|
|
|
|
std::unique_ptr<clang::ASTConsumer>
|
|
CreateASTConsumer(clang::CompilerInstance &Compiler,
|
|
StringRef InFile) override {
|
|
Filename = InFile;
|
|
Compiler.getPreprocessor().addPPCallbacks(
|
|
llvm::make_unique<PreprocessorHooks>(this));
|
|
return llvm::make_unique<clang::ASTConsumer>();
|
|
}
|
|
|
|
void ExecuteAction() override {
|
|
clang::CompilerInstance *Compiler = &getCompilerInstance();
|
|
assert(!Compiler->hasSema() && "CI already has Sema");
|
|
|
|
// Set up our hooks into sema and parse the AST.
|
|
if (hasCodeCompletionSupport() &&
|
|
!Compiler->getFrontendOpts().CodeCompletionAt.FileName.empty())
|
|
Compiler->createCodeCompletionConsumer();
|
|
|
|
clang::CodeCompleteConsumer *CompletionConsumer = nullptr;
|
|
if (Compiler->hasCodeCompletionConsumer())
|
|
CompletionConsumer = &Compiler->getCodeCompletionConsumer();
|
|
|
|
Compiler->createSema(getTranslationUnitKind(), CompletionConsumer);
|
|
Compiler->getSema().addExternalSource(this);
|
|
|
|
clang::ParseAST(Compiler->getSema(), Compiler->getFrontendOpts().ShowStats,
|
|
Compiler->getFrontendOpts().SkipFunctionBodies);
|
|
}
|
|
|
|
/// Callback for incomplete types. If we encounter a forward declaration we
|
|
/// have the fully qualified name ready. Just query that.
|
|
bool MaybeDiagnoseMissingCompleteType(clang::SourceLocation Loc,
|
|
clang::QualType T) override {
|
|
// Ignore spurious callbacks from SFINAE contexts.
|
|
if (getCompilerInstance().getSema().isSFINAEContext())
|
|
return false;
|
|
|
|
clang::ASTContext &context = getCompilerInstance().getASTContext();
|
|
query(T.getUnqualifiedType().getAsString(context.getPrintingPolicy()), Loc);
|
|
return false;
|
|
}
|
|
|
|
/// Callback for unknown identifiers. Try to piece together as much
|
|
/// qualification as we can get and do a query.
|
|
clang::TypoCorrection CorrectTypo(const DeclarationNameInfo &Typo,
|
|
int LookupKind, Scope *S, CXXScopeSpec *SS,
|
|
CorrectionCandidateCallback &CCC,
|
|
DeclContext *MemberContext,
|
|
bool EnteringContext,
|
|
const ObjCObjectPointerType *OPT) override {
|
|
// Ignore spurious callbacks from SFINAE contexts.
|
|
if (getCompilerInstance().getSema().isSFINAEContext())
|
|
return clang::TypoCorrection();
|
|
|
|
std::string TypoScopeString;
|
|
if (S) {
|
|
// FIXME: Currently we only use namespace contexts. Use other context
|
|
// types for query.
|
|
for (const auto *Context = S->getEntity(); Context;
|
|
Context = Context->getParent()) {
|
|
if (const auto *ND = dyn_cast<NamespaceDecl>(Context)) {
|
|
if (!ND->getName().empty())
|
|
TypoScopeString = ND->getNameAsString() + "::" + TypoScopeString;
|
|
}
|
|
}
|
|
}
|
|
|
|
auto ExtendNestedNameSpecifier = [this](CharSourceRange Range) {
|
|
StringRef Source =
|
|
Lexer::getSourceText(Range, getCompilerInstance().getSourceManager(),
|
|
getCompilerInstance().getLangOpts());
|
|
|
|
// Skip forward until we find a character that's neither identifier nor
|
|
// colon. This is a bit of a hack around the fact that we will only get a
|
|
// single callback for a long nested name if a part of the beginning is
|
|
// unknown. For example:
|
|
//
|
|
// llvm::sys::path::parent_path(...)
|
|
// ^~~~ ^~~
|
|
// known
|
|
// ^~~~
|
|
// unknown, last callback
|
|
// ^~~~~~~~~~~
|
|
// no callback
|
|
//
|
|
// With the extension we get the full nested name specifier including
|
|
// parent_path.
|
|
// FIXME: Don't rely on source text.
|
|
const char *End = Source.end();
|
|
while (isIdentifierBody(*End) || *End == ':')
|
|
++End;
|
|
|
|
return std::string(Source.begin(), End);
|
|
};
|
|
|
|
/// If we have a scope specification, use that to get more precise results.
|
|
std::string QueryString;
|
|
if (SS && SS->getRange().isValid()) {
|
|
auto Range = CharSourceRange::getTokenRange(SS->getRange().getBegin(),
|
|
Typo.getLoc());
|
|
|
|
QueryString = ExtendNestedNameSpecifier(Range);
|
|
} else if (Typo.getName().isIdentifier() && !Typo.getLoc().isMacroID()) {
|
|
auto Range =
|
|
CharSourceRange::getTokenRange(Typo.getBeginLoc(), Typo.getEndLoc());
|
|
|
|
QueryString = ExtendNestedNameSpecifier(Range);
|
|
} else {
|
|
QueryString = Typo.getAsString();
|
|
}
|
|
|
|
// Follow C++ Lookup rules. Firstly, lookup the identifier with scoped
|
|
// namespace contexts. If fails, falls back to identifier.
|
|
// For example:
|
|
//
|
|
// namespace a {
|
|
// b::foo f;
|
|
// }
|
|
//
|
|
// 1. lookup a::b::foo.
|
|
// 2. lookup b::foo.
|
|
if (!query(TypoScopeString + QueryString, Typo.getLoc()))
|
|
query(QueryString, Typo.getLoc());
|
|
|
|
// FIXME: We should just return the name we got as input here and prevent
|
|
// clang from trying to correct the typo by itself. That may change the
|
|
// identifier to something that's not wanted by the user.
|
|
return clang::TypoCorrection();
|
|
}
|
|
|
|
StringRef filename() const { return Filename; }
|
|
|
|
/// Called for each include file we discover is in the file.
|
|
/// \param SourceManager the active SourceManager
|
|
/// \param canonical_path the canonical path to the include file
|
|
/// \param uttered_path the path as it appeared in the program
|
|
/// \param IsAngled whether angle brackets were used
|
|
/// \param HashLocation the source location of the include's \#
|
|
/// \param EndLocation the source location following the include
|
|
void NextInclude(clang::SourceManager *SourceManager,
|
|
llvm::StringRef canonical_path, llvm::StringRef uttered_path,
|
|
bool IsAngled, clang::SourceLocation HashLocation,
|
|
clang::SourceLocation EndLocation) {
|
|
unsigned Offset = SourceManager->getFileOffset(HashLocation);
|
|
if (FirstIncludeOffset == -1U)
|
|
FirstIncludeOffset = Offset;
|
|
}
|
|
|
|
/// Get the minimal include for a given path.
|
|
std::string minimizeInclude(StringRef Include,
|
|
const clang::SourceManager &SourceManager,
|
|
clang::HeaderSearch &HeaderSearch) {
|
|
if (!MinimizeIncludePaths)
|
|
return Include;
|
|
|
|
// Get the FileEntry for the include.
|
|
StringRef StrippedInclude = Include.trim("\"<>");
|
|
const FileEntry *Entry =
|
|
SourceManager.getFileManager().getFile(StrippedInclude);
|
|
|
|
// If the file doesn't exist return the path from the database.
|
|
// FIXME: This should never happen.
|
|
if (!Entry)
|
|
return Include;
|
|
|
|
bool IsSystem;
|
|
std::string Suggestion =
|
|
HeaderSearch.suggestPathToFileForDiagnostics(Entry, &IsSystem);
|
|
|
|
return IsSystem ? '<' + Suggestion + '>' : '"' + Suggestion + '"';
|
|
}
|
|
|
|
/// Get the include fixer context for the queried symbol.
|
|
IncludeFixerContext
|
|
getIncludeFixerContext(const clang::SourceManager &SourceManager,
|
|
clang::HeaderSearch &HeaderSearch) {
|
|
IncludeFixerContext FixerContext;
|
|
if (SymbolQueryResults.empty())
|
|
return FixerContext;
|
|
|
|
FixerContext.SymbolIdentifer = QuerySymbol;
|
|
FixerContext.FirstIncludeOffset = FirstIncludeOffset;
|
|
for (const auto &Header : SymbolQueryResults)
|
|
FixerContext.Headers.push_back(
|
|
minimizeInclude(Header, SourceManager, HeaderSearch));
|
|
|
|
return FixerContext;
|
|
}
|
|
|
|
/// Sets the location at the very top of the file.
|
|
void setFileBegin(clang::SourceLocation Location) { FileBegin = Location; }
|
|
|
|
private:
|
|
/// Query the database for a given identifier.
|
|
bool query(StringRef Query, SourceLocation Loc) {
|
|
assert(!Query.empty() && "Empty query!");
|
|
|
|
// Skip other identifers once we have discovered an identfier successfully.
|
|
if (!SymbolQueryResults.empty())
|
|
return false;
|
|
|
|
DEBUG(llvm::dbgs() << "Looking up '" << Query << "' at ");
|
|
DEBUG(Loc.print(llvm::dbgs(), getCompilerInstance().getSourceManager()));
|
|
DEBUG(llvm::dbgs() << " ...");
|
|
|
|
QuerySymbol = Query.str();
|
|
SymbolQueryResults = SymbolIndexMgr.search(Query);
|
|
DEBUG(llvm::dbgs() << SymbolQueryResults.size() << " replies\n");
|
|
return !SymbolQueryResults.empty();
|
|
}
|
|
|
|
/// The client to use to find cross-references.
|
|
SymbolIndexManager &SymbolIndexMgr;
|
|
|
|
/// The absolute path to the file being processed.
|
|
std::string Filename;
|
|
|
|
/// The location of the beginning of the tracked file.
|
|
clang::SourceLocation FileBegin;
|
|
|
|
/// The offset of the last include in the original source file. This will
|
|
/// be used as the insertion point for new include directives.
|
|
unsigned FirstIncludeOffset = -1U;
|
|
|
|
/// The fallback format style for formatting after insertion if there is no
|
|
/// clang-format config file found.
|
|
std::string FallbackStyle;
|
|
|
|
/// The symbol being queried.
|
|
std::string QuerySymbol;
|
|
|
|
/// The query results of an identifier. We only include the first discovered
|
|
/// identifier to avoid getting caught in results from error recovery.
|
|
std::vector<std::string> SymbolQueryResults;
|
|
|
|
/// Whether we should use the smallest possible include path.
|
|
bool MinimizeIncludePaths = true;
|
|
};
|
|
|
|
/// Remembers where the processed file starts: when a file whose name equals
/// the enclosing Action's filename is entered, its location is passed to the
/// Action and its FileEntry becomes the tracked file.
void PreprocessorHooks::FileChanged(clang::SourceLocation Loc,
                                    clang::PPCallbacks::FileChangeReason Reason,
                                    clang::SrcMgr::CharacteristicKind FileType,
                                    clang::FileID PrevFID) {
  // Only the event of entering a file is of interest.
  if (Reason != clang::PPCallbacks::EnterFile)
    return;

  clang::SourceManager &SM =
      EnclosingPass->getCompilerInstance().getSourceManager();
  const clang::FileEntry *Entered = SM.getFileEntryForID(SM.getFileID(Loc));
  // Locations without a backing file entry cannot be the tracked file.
  if (!Entered)
    return;

  if (Entered->getName() == EnclosingPass->filename()) {
    EnclosingPass->setFileBegin(Loc);
    TrackedFile = Entered;
  }
}
|
|
|
|
/// Forwards every resolved include directive that is written in the tracked
/// file to the enclosing Action, which uses it to determine where new include
/// directives are inserted.
void PreprocessorHooks::InclusionDirective(
    clang::SourceLocation HashLocation, const clang::Token &IncludeToken,
    llvm::StringRef FileName, bool IsAngled,
    clang::CharSourceRange FileNameRange, const clang::FileEntry *IncludeFile,
    llvm::StringRef SearchPath, llvm::StringRef relative_path,
    const clang::Module *imported) {
  clang::SourceManager *SM =
      &EnclosingPass->getCompilerInstance().getSourceManager();

  // Determine which file the directive itself was written in.
  const auto HashPosition = SM->getDecomposedExpansionLoc(HashLocation);
  const FileEntry *DirectiveFile = SM->getFileEntryForID(HashPosition.first);

  // Includes without a file entry are skipped.
  if (!IncludeFile)
    return;
  // So are includes that appear in any file other than the tracked one.
  if (DirectiveFile != TrackedFile)
    return;

  EnclosingPass->NextInclude(SM, IncludeFile->getName(), FileName, IsAngled,
                             HashLocation, FileNameRange.getEnd());
}
|
|
|
|
} // namespace
|
|
|
|
/// Stores the collaborators that runInvocation() hands to each Action.
///
/// \param SymbolIndexMgr the symbol index used for lookups.
/// \param Context receives the result of each runInvocation() call.
/// \param StyleName the fallback format style name.
/// \param MinimizeIncludePaths whether suggested header paths are minimized.
IncludeFixerActionFactory::IncludeFixerActionFactory(
    SymbolIndexManager &SymbolIndexMgr, IncludeFixerContext &Context,
    StringRef StyleName, bool MinimizeIncludePaths)
    : SymbolIndexMgr(SymbolIndexMgr),
      Context(Context),
      MinimizeIncludePaths(MinimizeIncludePaths),
      FallbackStyle(StyleName) {}
|
|
|
|
/// Out-of-line definition of the defaulted destructor.
IncludeFixerActionFactory::~IncludeFixerActionFactory() = default;
|
|
|
|
/// Runs an include-fixer Action over the single input of \p Invocation and
/// stores the resulting IncludeFixerContext in Context.
///
/// All diagnostics are dropped; the \p Diagnostics consumer is not used.
///
/// \returns false only if a fatal error occurred while processing the input.
bool IncludeFixerActionFactory::runInvocation(
    clang::CompilerInvocation *Invocation, clang::FileManager *Files,
    std::shared_ptr<clang::PCHContainerOperations> PCHContainerOps,
    clang::DiagnosticConsumer *Diagnostics) {
  assert(Invocation->getFrontendOpts().Inputs.size() == 1);

  // Assemble the compiler instance from the pieces we were handed.
  clang::CompilerInstance Compiler(PCHContainerOps);
  Compiler.setInvocation(Invocation);
  Compiler.setFileManager(Files);

  // Give the instance its own diagnostics engine backed by a consumer that
  // discards everything, then create the source manager.
  Compiler.createDiagnostics(new clang::IgnoringDiagConsumer,
                             /*ShouldOwnClient=*/true);
  Compiler.createSourceManager(*Files);

  // A missing #include can cause thousands of errors. Fatal errors abort the
  // run, so lift the error limit to keep a large error count from becoming
  // fatal.
  auto &Diags = Compiler.getDiagnostics();
  Diags.setErrorLimit(0);

  // Parse the input and let the action gather the missing includes.
  auto FixerAction = llvm::make_unique<Action>(SymbolIndexMgr, FallbackStyle,
                                               MinimizeIncludePaths);
  Compiler.ExecuteAction(*FixerAction);

  Context = FixerAction->getIncludeFixerContext(
      Compiler.getSourceManager(),
      Compiler.getPreprocessor().getHeaderSearchInfo());

  // Strictly speaking success would require knowing that the file is
  // parseable, which we cannot tell. Report failure for fatal errors only.
  return !Diags.hasFatalErrorOccurred();
}
|
|
|
|
std::vector<clang::tooling::Replacement>
|
|
createInsertHeaderReplacements(StringRef Code, StringRef FilePath,
|
|
StringRef Header, unsigned FirstIncludeOffset,
|
|
const clang::format::FormatStyle &Style) {
|
|
if (Header.empty())
|
|
return {};
|
|
// Create replacements for new headers.
|
|
clang::tooling::Replacements Insertions;
|
|
if (FirstIncludeOffset == -1U) {
|
|
// FIXME: skip header guards.
|
|
FirstIncludeOffset = 0;
|
|
// If there is no existing #include, then insert an empty line after new
|
|
// header block.
|
|
if (Code.front() != '\n')
|
|
Insertions.insert(
|
|
clang::tooling::Replacement(FilePath, FirstIncludeOffset, 0, "\n"));
|
|
}
|
|
// Keep inserting new headers before the first header.
|
|
std::string Text = "#include " + Header.str() + "\n";
|
|
Insertions.insert(
|
|
clang::tooling::Replacement(FilePath, FirstIncludeOffset, 0, Text));
|
|
DEBUG({
|
|
llvm::dbgs() << "Header insertions:\n";
|
|
for (const auto &R : Insertions)
|
|
llvm::dbgs() << R.toString() << '\n';
|
|
});
|
|
|
|
clang::tooling::Replacements Replaces =
|
|
formatReplacements(Code, Insertions, Style);
|
|
// FIXME: remove this when `clang::tooling::Replacements` is implemented as
|
|
// `std::vector<clang::tooling::Replacement>`.
|
|
std::vector<clang::tooling::Replacement> Results;
|
|
std::copy(Replaces.begin(), Replaces.end(), std::back_inserter(Results));
|
|
return Results;
|
|
}
|
|
|
|
} // namespace include_fixer
|
|
} // namespace clang
|