Split line comments

Summary:
Split line comments that exceed column limit + fixed leading whitespace
handling when splitting block comments.

Reviewers: djasper, klimek

Reviewed By: djasper

CC: cfe-commits

Differential Revision: http://llvm-reviews.chandlerc.com/D577

llvm-svn: 178133
This commit is contained in:
Alexander Kornienko 2013-03-27 11:52:18 +00:00
parent 653d8839c8
commit ffd6d04a43
2 changed files with 111 additions and 38 deletions
clang
lib/Format
unittests/Format

View File

@ -23,6 +23,7 @@
#include "clang/Format/Format.h" #include "clang/Format/Format.h"
#include "clang/Frontend/TextDiagnosticPrinter.h" #include "clang/Frontend/TextDiagnosticPrinter.h"
#include "clang/Lex/Lexer.h" #include "clang/Lex/Lexer.h"
#include "llvm/ADT/STLExtras.h"
#include "llvm/Support/Allocator.h" #include "llvm/Support/Allocator.h"
#include "llvm/Support/Debug.h" #include "llvm/Support/Debug.h"
#include <queue> #include <queue>
@ -103,6 +104,12 @@ static unsigned getLengthToMatchingParen(const AnnotatedToken &Tok) {
return End->TotalLength - Tok.TotalLength + 1; return End->TotalLength - Tok.TotalLength + 1;
} }
static size_t
calculateColumnLimit(const FormatStyle &Style, bool InPPDirective) {
// In preprocessor directives reserve two chars for trailing " \"
return Style.ColumnLimit - (InPPDirective ? 2 : 0);
}
/// \brief Manages the whitespaces around tokens and their replacements. /// \brief Manages the whitespaces around tokens and their replacements.
/// ///
/// This includes special handling for certain constructs, e.g. the alignment of /// This includes special handling for certain constructs, e.g. the alignment of
@ -120,31 +127,32 @@ public:
if (NewLines >= 2) if (NewLines >= 2)
alignComments(); alignComments();
SourceLocation TokenLoc = Tok.FormatTok.Tok.getLocation();
bool LineExceedsColumnLimit = Spaces + WhitespaceStartColumn +
Tok.FormatTok.TokenLength > Style.ColumnLimit;
// Align line comments if they are trailing or if they continue other // Align line comments if they are trailing or if they continue other
// trailing comments. // trailing comments.
if (isTrailingComment(Tok)) { if (isTrailingComment(Tok)) {
// Remove the comment's trailing whitespace. // Remove the comment's trailing whitespace.
if (Tok.FormatTok.Tok.getLength() != Tok.FormatTok.TokenLength) if (Tok.FormatTok.Tok.getLength() != Tok.FormatTok.TokenLength)
Replaces.insert(tooling::Replacement( Replaces.insert(tooling::Replacement(
SourceMgr, Tok.FormatTok.Tok.getLocation().getLocWithOffset( SourceMgr, TokenLoc.getLocWithOffset(Tok.FormatTok.TokenLength),
Tok.FormatTok.TokenLength),
Tok.FormatTok.Tok.getLength() - Tok.FormatTok.TokenLength, "")); Tok.FormatTok.Tok.getLength() - Tok.FormatTok.TokenLength, ""));
// Align comment with other comments. // Align comment with other comments.
if (Tok.Parent != NULL || !Comments.empty()) { if ((Tok.Parent != NULL || !Comments.empty()) &&
if (Style.ColumnLimit >= !LineExceedsColumnLimit) {
Spaces + WhitespaceStartColumn + Tok.FormatTok.TokenLength) { StoredComment Comment;
StoredComment Comment; Comment.Tok = Tok.FormatTok;
Comment.Tok = Tok.FormatTok; Comment.Spaces = Spaces;
Comment.Spaces = Spaces; Comment.NewLines = NewLines;
Comment.NewLines = NewLines; Comment.MinColumn =
Comment.MinColumn = NewLines > 0 ? Spaces : WhitespaceStartColumn + Spaces;
NewLines > 0 ? Spaces : WhitespaceStartColumn + Spaces; Comment.MaxColumn = Style.ColumnLimit - Tok.FormatTok.TokenLength;
Comment.MaxColumn = Style.ColumnLimit - Tok.FormatTok.TokenLength; Comment.Untouchable = false;
Comment.Untouchable = false; Comments.push_back(Comment);
Comments.push_back(Comment); return;
return;
}
} }
} }
@ -152,8 +160,19 @@ public:
if (Tok.Children.empty() && !isTrailingComment(Tok)) if (Tok.Children.empty() && !isTrailingComment(Tok))
alignComments(); alignComments();
if (Tok.Type == TT_BlockComment) if (Tok.Type == TT_BlockComment) {
indentBlockComment(Tok, Spaces, WhitespaceStartColumn, NewLines, false); indentBlockComment(Tok, Spaces, WhitespaceStartColumn, NewLines, false);
} else if (Tok.Type == TT_LineComment && LineExceedsColumnLimit) {
StringRef Line(SourceMgr.getCharacterData(TokenLoc),
Tok.FormatTok.TokenLength);
int StartColumn = Spaces + (NewLines == 0 ? WhitespaceStartColumn : 0);
StringRef Prefix = getLineCommentPrefix(Line);
std::string NewPrefix = std::string(StartColumn, ' ') + Prefix.str();
splitLineInComment(Tok.FormatTok, Line.substr(Prefix.size()),
StartColumn + Prefix.size(), NewPrefix,
/*InPPDirective=*/ false,
/*CommentHasMoreLines=*/ false);
}
storeReplacement(Tok.FormatTok, getNewLineText(NewLines, Spaces)); storeReplacement(Tok.FormatTok, getNewLineText(NewLines, Spaces));
} }
@ -209,6 +228,14 @@ public:
} }
private: private:
static StringRef getLineCommentPrefix(StringRef Comment) {
const char *KnownPrefixes[] = { "/// ", "///", "// ", "//" };
for (size_t i = 0; i < llvm::array_lengthof(KnownPrefixes); ++i)
if (Comment.startswith(KnownPrefixes[i]))
return KnownPrefixes[i];
return "";
}
/// \brief Finds a common prefix of lines of a block comment to properly /// \brief Finds a common prefix of lines of a block comment to properly
/// indent (and possibly decorate with '*'s) added lines. /// indent (and possibly decorate with '*'s) added lines.
/// ///
@ -229,13 +256,38 @@ private:
return Prefix; return Prefix;
} }
/// \brief Splits one line in a line or block comment, if it doesn't fit to
/// provided column limit. Removes trailing whitespace in each line.
///
/// \param Line points to the line contents without leading // or /*.
///
/// \param StartColumn is the column where the first character of Line will be
/// located after formatting.
///
/// \param LinePrefix is inserted after each line break.
///
/// When \param InPPDirective is true, each line break will be preceded by a
/// backslash in the last column to make line breaks inside the comment
/// visually consistent with line breaks outside the comment. This only makes
/// sense for block comments.
///
/// When \param CommentHasMoreLines is false, no line breaks/trailing
/// backslashes will be inserted after it.
void splitLineInComment(const FormatToken &Tok, StringRef Line, void splitLineInComment(const FormatToken &Tok, StringRef Line,
size_t StartColumn, StringRef LinePrefix, size_t StartColumn, StringRef LinePrefix,
bool InPPDirective, bool CommentHasMoreLines, bool InPPDirective, bool CommentHasMoreLines,
const char *WhiteSpaceChars = " ") { const char *WhiteSpaceChars = " ") {
size_t ColumnLimit = Style.ColumnLimit - (InPPDirective ? 2 : 0); size_t ColumnLimit = calculateColumnLimit(Style, InPPDirective);
const char *TokenStart = SourceMgr.getCharacterData(Tok.Tok.getLocation()); const char *TokenStart = SourceMgr.getCharacterData(Tok.Tok.getLocation());
while (Line.rtrim().size() + StartColumn > ColumnLimit) {
StringRef TrimmedLine = Line.rtrim();
int TrailingSpaceLength = Line.size() - TrimmedLine.size();
// Don't touch leading whitespace.
Line = TrimmedLine.ltrim();
StartColumn += TrimmedLine.size() - Line.size();
while (Line.size() + StartColumn > ColumnLimit) {
// Try to break at the last whitespace before the column limit. // Try to break at the last whitespace before the column limit.
size_t SpacePos = size_t SpacePos =
Line.find_last_of(WhiteSpaceChars, ColumnLimit - StartColumn + 1); Line.find_last_of(WhiteSpaceChars, ColumnLimit - StartColumn + 1);
@ -258,24 +310,25 @@ private:
size_t ReplaceChars = Line.begin() - NextCut.end(); size_t ReplaceChars = Line.begin() - NextCut.end();
breakToken(Tok, NextCut.end() - TokenStart, ReplaceChars, "", LinePrefix, breakToken(Tok, NextCut.end() - TokenStart, ReplaceChars, "", LinePrefix,
InPPDirective, 0, InPPDirective, 0, NextCut.size() + StartColumn);
NextCut.size() + StartColumn);
StartColumn = LinePrefix.size(); StartColumn = LinePrefix.size();
} }
StringRef TrimmedLine = Line.rtrim(); if (TrailingSpaceLength > 0 || (InPPDirective && CommentHasMoreLines)) {
if (TrimmedLine != Line || (InPPDirective && CommentHasMoreLines)) { // Remove trailing whitespace/insert backslash. + 1 is for \n
// Remove trailing whitespace/insert backslash. breakToken(Tok, Line.end() - TokenStart, TrailingSpaceLength + 1, "", "",
breakToken(Tok, TrimmedLine.end() - TokenStart, InPPDirective, 0, Line.size() + StartColumn);
Line.size() - TrimmedLine.size() + 1, "", "", InPPDirective, 0,
TrimmedLine.size() + StartColumn);
} }
} }
/// \brief Changes indentation of all lines in a block comment by Indent,
/// removes trailing whitespace from each line, splits lines that end up
/// exceeding the column limit.
void indentBlockComment(const AnnotatedToken &Tok, int Indent, void indentBlockComment(const AnnotatedToken &Tok, int Indent,
int WhitespaceStartColumn, int NewLines, int WhitespaceStartColumn, int NewLines,
bool InPPDirective) { bool InPPDirective) {
int StartColumn = NewLines > 0 ? Indent : WhitespaceStartColumn + Indent; assert(Tok.Type == TT_BlockComment);
int StartColumn = Indent + (NewLines == 0 ? WhitespaceStartColumn : 0);
const SourceLocation TokenLoc = Tok.FormatTok.Tok.getLocation(); const SourceLocation TokenLoc = Tok.FormatTok.Tok.getLocation();
const int CurrentIndent = SourceMgr.getSpellingColumnNumber(TokenLoc) - 1; const int CurrentIndent = SourceMgr.getSpellingColumnNumber(TokenLoc) - 1;
const int IndentDelta = Indent - CurrentIndent; const int IndentDelta = Indent - CurrentIndent;
@ -308,17 +361,17 @@ private:
} }
// Split long lines in comments. // Split long lines in comments.
size_t PrefixSize = 0; size_t OldPrefixSize = 0;
std::string NewPrefix; std::string NewPrefix;
if (Lines.size() > 1) { if (Lines.size() > 1) {
StringRef CurrentPrefix = findCommentLinesPrefix(Lines); StringRef CurrentPrefix = findCommentLinesPrefix(Lines);
PrefixSize = CurrentPrefix.size(); OldPrefixSize = CurrentPrefix.size();
NewPrefix = (IndentDelta < 0) NewPrefix = (IndentDelta < 0)
? CurrentPrefix.substr(-IndentDelta).str() ? CurrentPrefix.substr(-IndentDelta).str()
: std::string(IndentDelta, ' ') + CurrentPrefix.str(); : std::string(IndentDelta, ' ') + CurrentPrefix.str();
if (CurrentPrefix.endswith("*")) { if (CurrentPrefix.endswith("*")) {
NewPrefix += " "; NewPrefix += " ";
++PrefixSize; ++OldPrefixSize;
} }
} else if (Tok.Parent == 0) { } else if (Tok.Parent == 0) {
NewPrefix = std::string(StartColumn, ' ') + " * "; NewPrefix = std::string(StartColumn, ' ') + " * ";
@ -326,7 +379,7 @@ private:
StartColumn += 2; StartColumn += 2;
for (size_t i = 0; i < Lines.size(); ++i) { for (size_t i = 0; i < Lines.size(); ++i) {
StringRef Line = Lines[i].substr(i == 0 ? 2 : PrefixSize); StringRef Line = Lines[i].substr(i == 0 ? 2 : OldPrefixSize);
splitLineInComment(Tok.FormatTok, Line, StartColumn, NewPrefix, splitLineInComment(Tok.FormatTok, Line, StartColumn, NewPrefix,
InPPDirective, i != Lines.size() - 1); InPPDirective, i != Lines.size() - 1);
StartColumn = NewPrefix.size(); StartColumn = NewPrefix.size();
@ -974,7 +1027,7 @@ private:
} }
unsigned getColumnLimit() { unsigned getColumnLimit() {
return Style.ColumnLimit - (Line.InPPDirective ? 2 : 0); return calculateColumnLimit(Style, Line.InPPDirective);
} }
/// \brief An edge in the solution space from \c Previous->State to \c State, /// \brief An edge in the solution space from \c Previous->State to \c State,

View File

@ -681,6 +681,26 @@ TEST_F(FormatTest, AlignsMultiLineComments) {
" */")); " */"));
} }
TEST_F(FormatTest, SplitsLongCxxComments) {
EXPECT_EQ("// A comment that\n"
"// doesn't fit on\n"
"// one line",
format("// A comment that doesn't fit on one line",
getLLVMStyleWithColumns(20)));
EXPECT_EQ("if (true) // A comment that\n"
" // doesn't fit on\n"
" // one line",
format("if (true) // A comment that doesn't fit on one line ",
getLLVMStyleWithColumns(30)));
EXPECT_EQ("// Don't_touch_leading_whitespace",
format("// Don't_touch_leading_whitespace",
getLLVMStyleWithColumns(20)));
EXPECT_EQ(
"//Don't add leading\n"
"//whitespace",
format("//Don't add leading whitespace", getLLVMStyleWithColumns(20)));
}
TEST_F(FormatTest, SplitsLongLinesInComments) { TEST_F(FormatTest, SplitsLongLinesInComments) {
EXPECT_EQ("/* This is a long\n" EXPECT_EQ("/* This is a long\n"
" * comment that\n" " * comment that\n"
@ -727,10 +747,10 @@ TEST_F(FormatTest, SplitsLongLinesInComments) {
" */", " */",
getLLVMStyleWithColumns(20))); getLLVMStyleWithColumns(20)));
EXPECT_EQ("/*\n" EXPECT_EQ("/*\n"
" * This_comment_can_not_be_broken_into_lines\n" " * This_comment_can_not_be_broken_into_lines\n"
" */", " */",
format("/*\n" format("/*\n"
" * This_comment_can_not_be_broken_into_lines\n" " * This_comment_can_not_be_broken_into_lines\n"
" */", " */",
getLLVMStyleWithColumns(20))); getLLVMStyleWithColumns(20)));
EXPECT_EQ("{\n" EXPECT_EQ("{\n"
@ -1166,13 +1186,13 @@ TEST_F(FormatTest, HandlePreprocessorDirectiveContext) {
"#define A( \\\n" "#define A( \\\n"
" A, B)\n" " A, B)\n"
"#include \"b.h\"\n" "#include \"b.h\"\n"
"// some comment\n", "// somecomment\n",
format(" // some comment\n" format(" // some comment\n"
" #include \"a.h\"\n" " #include \"a.h\"\n"
"#define A(A,\\\n" "#define A(A,\\\n"
" B)\n" " B)\n"
" #include \"b.h\"\n" " #include \"b.h\"\n"
" // some comment\n", " // somecomment\n",
getLLVMStyleWithColumns(13))); getLLVMStyleWithColumns(13)));
} }
@ -2442,7 +2462,7 @@ TEST_F(FormatTest, IncorrectCodeMissingSemicolon) {
TEST_F(FormatTest, IndentationWithinColumnLimitNotPossible) { TEST_F(FormatTest, IndentationWithinColumnLimitNotPossible) {
verifyFormat("int aaaaaaaa =\n" verifyFormat("int aaaaaaaa =\n"
" // Overly long comment\n" " // Overlylongcomment\n"
" b;", " b;",
getLLVMStyleWithColumns(20)); getLLVMStyleWithColumns(20));
verifyFormat("function(\n" verifyFormat("function(\n"