llvm-docs/clang_doxygen/NamespaceEndCommentsFixer_8cpp_source.html

 //===--- NamespaceEndCommentsFixer.cpp --------------------------*- C++ -*-===//

 //

 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

 // See https://llvm.org/LICENSE.txt for license information.

 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

 //

 //===----------------------------------------------------------------------===//

 ///

 /// \file

 /// This file implements NamespaceEndCommentsFixer, a TokenAnalyzer that

 /// fixes namespace end comments.

 ///

 //===----------------------------------------------------------------------===//


 #include "NamespaceEndCommentsFixer.h"

 #include "clang/Basic/TokenKinds.h"

 #include "llvm/Support/Debug.h"

 #include "llvm/Support/Regex.h"


 #define DEBUG_TYPE "namespace-end-comments-fixer"


 namespace clang {

 namespace format {


 namespace {

 // Walks a delimited token group. Tok is expected to be a StartTok; if it is
 // null or some other token, it is handed back untouched. Otherwise the walk
 // advances with getNextNonComment(), counting nested StartTok/EndTok pairs,
 // until the nesting count drops back to zero or the tokens run out. When Fn
 // is set it is called on every token visited, both delimiters included.
 // Returns the token after the closing EndTok (null if there is none).
 const FormatToken *
 processTokens(const FormatToken *Tok, tok::TokenKind StartTok,
               tok::TokenKind EndTok,
               llvm::function_ref<void(const FormatToken *)> Fn) {
   if (!Tok || Tok->isNot(StartTok))
     return Tok;
   int Depth = 0;
   for (;;) {
     if (Tok->is(StartTok))
       ++Depth;
     else if (Tok->is(EndTok))
       --Depth;
     if (Fn)
       Fn(Tok);
     Tok = Tok->getNextNonComment();
     // Stop once the group is closed or there is nothing left to visit.
     if (!Tok || Depth <= 0)
       break;
   }
   return Tok;
 }


 // Steps over an attribute starting at Tok, if any. For a token reporting
 // isAttribute(), the parenthesized group that follows it is consumed; for a
 // '[', the whole bracketed group is consumed. Any other token (or null) is
 // returned as is.
 const FormatToken *skipAttribute(const FormatToken *Tok) {
   if (!Tok)
     return nullptr;
   if (Tok->isAttribute()) {
     const FormatToken *AfterKeyword = Tok->getNextNonComment();
     return processTokens(AfterKeyword, tok::l_paren, tok::r_paren, nullptr);
   }
   if (Tok->is(tok::l_square))
     return processTokens(Tok, tok::l_square, tok::r_square, nullptr);
   return Tok;
 }


 // Computes the name of a namespace given the namespace token.

 // Returns "" for anonymous namespace.
 //
 // NamespaceTok must be the `namespace` keyword or a namespace macro token
 // (asserted). For a macro, the name is the concatenated text of the tokens
 // after '(' up to the first ',' or ')'. For the keyword form, the name is
 // assembled from the tokens between the keyword and '{', with attributes
 // stepped over through skipAttribute().

 std::string computeName(const FormatToken *NamespaceTok) {

   assert(NamespaceTok &&

          NamespaceTok->isOneOf(tok::kw_namespace, TT_NamespaceMacro) &&

          "expecting a namespace token");

   std::string name;

   const FormatToken *Tok = NamespaceTok->getNextNonComment();

   if (NamespaceTok->is(TT_NamespaceMacro)) {

     // Collects all the non-comment tokens between opening parenthesis

     // and closing parenthesis or comma.

     assert(Tok && Tok->is(tok::l_paren) && "expected an opening parenthesis");

     Tok = Tok->getNextNonComment();

     while (Tok && !Tok->isOneOf(tok::r_paren, tok::comma)) {

       name += Tok->TokenText;

       Tok = Tok->getNextNonComment();

     }

     return name;

   }

   Tok = skipAttribute(Tok);


   std::string FirstNSName;

   // For `namespace [[foo]] A::B::inline C {` or

   // `namespace MACRO1 MACRO2 A::B::inline C {`, returns "A::B::inline C".

   // Peek for the first '::' (or '{' or '(') and then return all tokens from

   // one token before that up until the '{'. A '(' might be a macro with

   // arguments.

   const FormatToken *FirstNSTok = nullptr;

   // FirstNSTok trails one token behind Tok, so FirstNSName receives the text
   // of every scanned token except the last one before the delimiter.
   while (Tok && !Tok->isOneOf(tok::l_brace, tok::coloncolon, tok::l_paren)) {

     if (FirstNSTok)

       FirstNSName += FirstNSTok->TokenText;

     FirstNSTok = Tok;

     Tok = Tok->getNextNonComment();

   }


   // Rewind to the last token seen before the delimiter; the loop below
   // re-reads the name starting from there.
   if (FirstNSTok)

     Tok = FirstNSTok;

   Tok = skipAttribute(Tok);


   FirstNSTok = nullptr;

   // Add everything from '(' to ')'.

   auto AddToken = [&name](const FormatToken *Tok) { name += Tok->TokenText; };

   bool IsPrevColoncolon = false;

   bool HasColoncolon = false;

   bool IsPrevInline = false;

   bool NameFinished = false;

   // If we found '::' in name, then it's the name. Otherwise, we can't tell

   // which one is name. For example, `namespace A B {`.

   // As above, FirstNSTok lags one token behind Tok; it is the token that gets
   // appended to `name` in the current iteration.
   while (Tok && Tok->isNot(tok::l_brace)) {

     if (FirstNSTok) {

       // After a '::' has been seen, a pending token that does not directly
       // follow '::' is either a parenthesized group (appended whole through
       // AddToken), another '::', or the end of the name.
       // NOTE(review): IsPrevInline is only ever set to true in this function
       // and never cleared, so this check stays disabled once `inline` has
       // been appended -- confirm that this is intended.
       if (!IsPrevInline && HasColoncolon && !IsPrevColoncolon) {

         if (FirstNSTok->is(tok::l_paren)) {

           FirstNSTok = Tok =

               processTokens(FirstNSTok, tok::l_paren, tok::r_paren, AddToken);

           continue;

         }

         if (FirstNSTok->isNot(tok::coloncolon)) {

           NameFinished = true;

           break;

         }

       }

       name += FirstNSTok->TokenText;

       IsPrevColoncolon = FirstNSTok->is(tok::coloncolon);

       HasColoncolon = HasColoncolon || IsPrevColoncolon;

       // `inline` is followed by a space so that it stays separated from the
       // next token in the resulting name.
       if (FirstNSTok->is(tok::kw_inline)) {

         name += " ";

         IsPrevInline = true;

       }

     }

     FirstNSTok = Tok;

     Tok = Tok->getNextNonComment();

     // If an attribute starts at the new Tok, move both cursors past it.
     const FormatToken *TokAfterAttr = skipAttribute(Tok);

     if (TokAfterAttr != Tok)

       FirstNSTok = Tok = TokAfterAttr;

   }

   // Append the still-pending token unless the loop already declared the name
   // complete.
   if (!NameFinished && FirstNSTok && FirstNSTok->isNot(tok::l_brace))

     name += FirstNSTok->TokenText;

   // With a '::' in the name (or nothing collected by the first scan), `name`
   // is returned alone; otherwise the first-scan tokens are put in front of it.
   if (FirstNSName.empty() || HasColoncolon)

     return name;

   return name.empty() ? FirstNSName : FirstNSName + " " + name;

 }


 // Builds the text of a namespace end comment: "//", SpacesToAdd spaces, the
 // text of NamespaceTok, and then the namespace name. A namespace macro gets
 // the name wrapped in parentheses; otherwise a non-empty name is separated by
 // a single space. A trailing newline is appended when AddNewline is set.
 std::string computeEndCommentText(StringRef NamespaceName, bool AddNewline,
                                   const FormatToken *NamespaceTok,
                                   unsigned SpacesToAdd) {
   const bool IsMacro = NamespaceTok->is(TT_NamespaceMacro);
   std::string Comment = "//";
   Comment.append(SpacesToAdd, ' ');
   Comment += NamespaceTok->TokenText;
   if (IsMacro) {
     Comment += "(";
     Comment += NamespaceName;
     Comment += ")";
   } else {
     if (!NamespaceName.empty())
       Comment += ' ';
     Comment += NamespaceName;
   }
   if (AddNewline)
     Comment += '\n';
   return Comment;
 }


 bool hasEndComment(const FormatToken *RBraceTok) {

   return RBraceTok->Next && RBraceTok->Next->is(tok::comment);

 }


 bool validEndComment(const FormatToken *RBraceTok, StringRef NamespaceName,

                      const FormatToken *NamespaceTok) {

   assert(hasEndComment(RBraceTok));

   const FormatToken *Comment = RBraceTok->Next;


   // Matches a valid namespace end comment.

   // Valid namespace end comments don't need to be edited.

   static const llvm::Regex NamespaceCommentPattern =

       llvm::Regex("^/[/*] *(end (of )?)? *(anonymous|unnamed)? *"

                   "namespace( +([a-zA-Z0-9:_ ]+))?\\.? *(\\*/)?$",

                   llvm::Regex::IgnoreCase);

   static const llvm::Regex NamespaceMacroCommentPattern =

       llvm::Regex("^/[/*] *(end (of )?)? *(anonymous|unnamed)? *"

                   "([a-zA-Z0-9_]+)\\(([a-zA-Z0-9:_]*|\".+\")\\)\\.? *(\\*/)?$",

                   llvm::Regex::IgnoreCase);


   SmallVector<StringRef, 8> Groups;

   if (NamespaceTok->is(TT_NamespaceMacro) &&

       NamespaceMacroCommentPattern.match(Comment->TokenText, &Groups)) {

     StringRef NamespaceTokenText = Groups.size() > 4 ? Groups[4] : "";

     // The name of the macro must be used.

     if (NamespaceTokenText != NamespaceTok->TokenText)

       return false;

   } else if (NamespaceTok->isNot(tok::kw_namespace) ||

              !NamespaceCommentPattern.match(Comment->TokenText, &Groups)) {

     // Comment does not match regex.

     return false;

   }

   StringRef NamespaceNameInComment = Groups.size() > 5 ? Groups[5].rtrim() : "";

   // Anonymous namespace comments must not mention a namespace name.

   if (NamespaceName.empty() && !NamespaceNameInComment.empty())

     return false;

   StringRef AnonymousInComment = Groups.size() > 3 ? Groups[3] : "";

   // Named namespace comments must not mention anonymous namespace.

   if (!NamespaceName.empty() && !AnonymousInComment.empty())

     return false;

   if (NamespaceNameInComment == NamespaceName)

     return true;


   // Has namespace comment flowed onto the next line.

   // } // namespace

   //   // verylongnamespacenamethatdidnotfitonthepreviouscommentline

   if (!(Comment->Next && Comment->Next->is(TT_LineComment)))

     return false;


   static const llvm::Regex CommentPattern = llvm::Regex(

       "^/[/*] *( +([a-zA-Z0-9:_]+))?\\.? *(\\*/)?$", llvm::Regex::IgnoreCase);


   // Pull out just the comment text.

   if (!CommentPattern.match(Comment->Next->TokenText, &Groups))

     return false;

   NamespaceNameInComment = Groups.size() > 2 ? Groups[2] : "";


   return NamespaceNameInComment == NamespaceName;

 }


 // Records a replacement that inserts EndCommentText at the end location of
 // RBraceTok (an empty range, so nothing is overwritten). If the replacement
 // cannot be added to Fixes, the error is reported on llvm::errs().
 void addEndComment(const FormatToken *RBraceTok, StringRef EndCommentText,
                    const SourceManager &SourceMgr,
                    tooling::Replacements *Fixes) {
   const auto InsertLoc = RBraceTok->Tok.getEndLoc();
   const auto InsertRange = CharSourceRange::getCharRange(InsertLoc, InsertLoc);
   if (auto Err = Fixes->add(
           tooling::Replacement(SourceMgr, InsertRange, EndCommentText))) {
     llvm::errs() << "Error while adding namespace end comment: "
                  << llvm::toString(std::move(Err)) << "\n";
   }
 }


 void updateEndComment(const FormatToken *RBraceTok, StringRef EndCommentText,

                       const SourceManager &SourceMgr,

                       tooling::Replacements *Fixes) {

   assert(hasEndComment(RBraceTok));

   const FormatToken *Comment = RBraceTok->Next;

   auto Range = CharSourceRange::getCharRange(Comment->getStartOfNonWhitespace(),

                                              Comment->Tok.getEndLoc());

   auto Err = Fixes->add(tooling::Replacement(SourceMgr, Range, EndCommentText));

   if (Err) {

     llvm::errs() << "Error while updating namespace end comment: "

                  << llvm::toString(std::move(Err)) << "\n";

   }

 }

 } // namespace


 // Given a line, finds the namespace token of the block that the line closes.
 // Returns null unless Line is affected, is outside a preprocessor directive,
 // starts with '}', and has a valid matching opening line. When the opening
 // line starts with '{', the line before it is consulted instead (unless that
 // line ends with ';', which yields null).
 const FormatToken *
 getNamespaceToken(const AnnotatedLine *Line,
                   const SmallVectorImpl<AnnotatedLine *> &AnnotatedLines) {
   if (!Line->Affected)
     return nullptr;
   if (Line->InPPDirective)
     return nullptr;
   if (!Line->startsWith(tok::r_brace))
     return nullptr;

   const size_t OpeningIndex = Line->MatchingOpeningBlockLineIndex;
   if (OpeningIndex == UnwrappedLine::kInvalidIndex)
     return nullptr;
   assert(OpeningIndex < AnnotatedLines.size());

   const FormatToken *Candidate = AnnotatedLines[OpeningIndex]->First;
   // "namespace" keyword can be on the line preceding '{', e.g. in styles
   // where BraceWrapping.AfterNamespace is true.
   if (Candidate->is(tok::l_brace) && OpeningIndex > 0) {
     AnnotatedLine *Previous = AnnotatedLines[OpeningIndex - 1];
     if (Previous->endsWith(tok::semi))
       return nullptr;
     Candidate = Previous->First;
   }

   return Candidate->getNamespaceToken();
 }


 // Returns the text of the namespace token for the block closed by Line, as
 // found by getNamespaceToken(), or an empty StringRef when there is none.
 StringRef
 getNamespaceTokenText(const AnnotatedLine *Line,
                       const SmallVectorImpl<AnnotatedLine *> &AnnotatedLines) {
   if (const FormatToken *NamespaceTok =
           getNamespaceToken(Line, AnnotatedLines)) {
     return NamespaceTok->TokenText;
   }
   return StringRef();
 }


 // Constructs the fixer. Env and Style are passed straight through to the
 // TokenAnalyzer base class; the constructor does nothing else.
 NamespaceEndCommentsFixer::NamespaceEndCommentsFixer(const Environment &Env,

                                                      const FormatStyle &Style)

     : TokenAnalyzer(Env, Style) {}


 // Scans AnnotatedLines and, for every line that getNamespaceToken() reports
 // as closing a namespace block, either adds a missing end comment or
 // rewrites one that validEndComment() rejects. Returns the collected
 // replacements paired with 0. Annotator and Tokens are not used in this body.
 std::pair<tooling::Replacements, unsigned> NamespaceEndCommentsFixer::analyze(

     TokenAnnotator &Annotator, SmallVectorImpl<AnnotatedLine *> &AnnotatedLines,

     FormatTokenLexer &Tokens) {

   const SourceManager &SourceMgr = Env.getSourceManager();

   AffectedRangeMgr.computeAffectedLines(AnnotatedLines);

   tooling::Replacements Fixes;


   // Spin through the lines and ensure we have balanced braces.

   int Braces = 0;

   for (AnnotatedLine *Line : AnnotatedLines) {

     FormatToken *Tok = Line->First;

     while (Tok) {

       Braces += Tok->is(tok::l_brace) ? 1 : Tok->is(tok::r_brace) ? -1 : 0;

       Tok = Tok->Next;

     }

   }

   // Don't attempt to comment unbalanced braces or this can

   // lead to comments being placed on the closing brace which isn't

   // the matching brace of the namespace. (occurs during incomplete editing).

   if (Braces != 0)

     return {Fixes, 0};


   // State carried across iterations, used when Style.CompactNamespaces is on:
   // AllNamespaceNames collects "::Name" pieces of closing braces whose
   // comments are merged into a later one, and CompactedNamespacesCount counts
   // how many braces have been merged so far. StartLineIndex uses SIZE_MAX as
   // its "not set" value.
   std::string AllNamespaceNames;

   size_t StartLineIndex = SIZE_MAX;

   StringRef NamespaceTokenText;

   unsigned int CompactedNamespacesCount = 0;

   for (size_t I = 0, E = AnnotatedLines.size(); I != E; ++I) {

     const AnnotatedLine *EndLine = AnnotatedLines[I];

     const FormatToken *NamespaceTok =

         getNamespaceToken(EndLine, AnnotatedLines);

     if (!NamespaceTok)

       continue;

     FormatToken *RBraceTok = EndLine->First;

     // A brace already marked Finalized is skipped; otherwise it is marked now.
     if (RBraceTok->Finalized)

       continue;

     RBraceTok->Finalized = true;

     const FormatToken *EndCommentPrevTok = RBraceTok;

     // Namespaces often end with '};'. In that case, attach namespace end

     // comments to the semicolon tokens.

     if (RBraceTok->Next && RBraceTok->Next->is(tok::semi))

       EndCommentPrevTok = RBraceTok->Next;

     // Remember the opening line of the first brace in a (possibly merged) run;
     // it is reset to SIZE_MAX once a comment has been emitted for the run.
     if (StartLineIndex == SIZE_MAX)

       StartLineIndex = EndLine->MatchingOpeningBlockLineIndex;

     std::string NamespaceName = computeName(NamespaceTok);

     if (Style.CompactNamespaces) {

       if (CompactedNamespacesCount == 0)

         NamespaceTokenText = NamespaceTok->TokenText;

       // Merge this brace into the next one when the next line also closes a
       // namespace introduced by the same token text, its opening line index
       // is StartLineIndex - CompactedNamespacesCount - 1, and its first token
       // has not been finalized yet.
       if ((I + 1 < E) &&

           NamespaceTokenText ==

               getNamespaceTokenText(AnnotatedLines[I + 1], AnnotatedLines) &&

           StartLineIndex - CompactedNamespacesCount - 1 ==

               AnnotatedLines[I + 1]->MatchingOpeningBlockLineIndex &&

           !AnnotatedLines[I + 1]->First->Finalized) {

         if (hasEndComment(EndCommentPrevTok)) {

           // remove end comment, it will be merged in next one

           updateEndComment(EndCommentPrevTok, std::string(), SourceMgr, &Fixes);

         }

         ++CompactedNamespacesCount;

         // Prepend so that names of later (outer) braces end up in front.
         if (!NamespaceName.empty())

           AllNamespaceNames = "::" + NamespaceName + AllNamespaceNames;

         continue;

       }

       // End of a merged run: append the collected names and reset the state.
       NamespaceName += AllNamespaceNames;

       CompactedNamespacesCount = 0;

       AllNamespaceNames = std::string();

     }

     // The next token in the token stream after the place where the end comment

     // token must be. This is either the next token on the current line or the

     // first token on the next line.

     const FormatToken *EndCommentNextTok = EndCommentPrevTok->Next;

     if (EndCommentNextTok && EndCommentNextTok->is(tok::comment))

       EndCommentNextTok = EndCommentNextTok->Next;

     if (!EndCommentNextTok && I + 1 < E)

       EndCommentNextTok = AnnotatedLines[I + 1]->First;

     // A newline is appended to the comment when a following non-eof token
     // exists with no newline before it.
     bool AddNewline = EndCommentNextTok &&

                       EndCommentNextTok->NewlinesBefore == 0 &&

                       EndCommentNextTok->isNot(tok::eof);

     const std::string EndCommentText =

         computeEndCommentText(NamespaceName, AddNewline, NamespaceTok,

                               Style.SpacesInLineCommentPrefix.Minimum);

     if (!hasEndComment(EndCommentPrevTok)) {

       // No comment yet: add one only if the lines strictly between the opening
       // line and this line sum (via size()) to more than ShortNamespaceLines.
       unsigned LineCount = 0;

       for (auto J = StartLineIndex + 1; J < I; ++J)

         LineCount += AnnotatedLines[J]->size();

       if (LineCount > Style.ShortNamespaceLines) {

         addEndComment(EndCommentPrevTok,

                       std::string(Style.SpacesBeforeTrailingComments, ' ') +

                           EndCommentText,

                       SourceMgr, &Fixes);

       }

     } else if (!validEndComment(EndCommentPrevTok, NamespaceName,

                                 NamespaceTok)) {

       // An existing comment that does not validate is replaced in place.
       updateEndComment(EndCommentPrevTok, EndCommentText, SourceMgr, &Fixes);

     }

     StartLineIndex = SIZE_MAX;

   }

   return {Fixes, 0};

 }


 } // namespace format

 } // namespace clang

Env
const Environment & Env
Definition: HTMLLogger.cpp:148

NamespaceEndCommentsFixer.h
This file declares NamespaceEndCommentsFixer, a TokenAnalyzer that fixes namespace end comments.

Range
SourceRange Range
Definition: SemaObjC.cpp:754

TokenKinds.h
Defines the clang::TokenKind enum and support functions.

clang::CharSourceRange::getCharRange
static CharSourceRange getCharRange(SourceRange R)
Definition: SourceLocation.h:268

clang::SourceManager
This class handles loading and caching of source files into memory.
Definition: SourceManager.h:663

clang::format::AffectedRangeManager::computeAffectedLines
bool computeAffectedLines(SmallVectorImpl< AnnotatedLine * > &Lines)
Definition: AffectedRangeManager.cpp:22

clang::format::AnnotatedLine
Definition: TokenAnnotator.h:45

clang::format::AnnotatedLine::InPPDirective
bool InPPDirective
Definition: TokenAnnotator.h:173

clang::format::AnnotatedLine::First
FormatToken * First
Definition: TokenAnnotator.h:163

clang::format::AnnotatedLine::Affected
bool Affected
True if this line should be formatted, i.e.
Definition: TokenAnnotator.h:185

clang::format::AnnotatedLine::startsWith
bool startsWith(Ts... Tokens) const
true if this line starts with the given tokens in order, ignoring comments.
Definition: TokenAnnotator.h:117

clang::format::AnnotatedLine::MatchingOpeningBlockLineIndex
size_t MatchingOpeningBlockLineIndex
Definition: TokenAnnotator.h:171

clang::format::Environment
Definition: TokenAnalyzer.h:26

clang::format::Environment::getSourceManager
SourceManager & getSourceManager() const
Definition: TokenAnalyzer.h:38

clang::format::FormatTokenLexer
Definition: FormatTokenLexer.h:35

clang::format::NamespaceEndCommentsFixer::NamespaceEndCommentsFixer
NamespaceEndCommentsFixer(const Environment &Env, const FormatStyle &Style)
Definition: NamespaceEndCommentsFixer.cpp:277

clang::format::NamespaceEndCommentsFixer::analyze
std::pair< tooling::Replacements, unsigned > analyze(TokenAnnotator &Annotator, SmallVectorImpl< AnnotatedLine * > &AnnotatedLines, FormatTokenLexer &Tokens) override
Definition: NamespaceEndCommentsFixer.cpp:281

clang::format::TokenAnalyzer
Definition: TokenAnalyzer.h:77

clang::format::TokenAnalyzer::Style
FormatStyle Style
Definition: TokenAnalyzer.h:94

clang::format::TokenAnalyzer::AffectedRangeMgr
AffectedRangeManager AffectedRangeMgr
Definition: TokenAnalyzer.h:99

clang::format::TokenAnalyzer::Env
const Environment & Env
Definition: TokenAnalyzer.h:97

clang::format::TokenAnnotator
Determines extra information about the tokens comprising an UnwrappedLine.
Definition: TokenAnnotator.h:211

clang::tooling::Replacements
Maintains a set of replacements that are conflict-free.
Definition: Replacement.h:212

llvm::SmallVectorImpl
Definition: Randstruct.h:18

clang::comments::tok::text
@ text
Definition: CommentLexer.h:35

clang::comments::tok::eof
@ eof
Definition: CommentLexer.h:33

clang::format::getNamespaceToken
const FormatToken * getNamespaceToken(const AnnotatedLine *Line, const SmallVectorImpl< AnnotatedLine * > &AnnotatedLines)
Definition: NamespaceEndCommentsFixer.cpp:248

clang::format::getNamespaceTokenText
StringRef getNamespaceTokenText(const AnnotatedLine *Line, const SmallVectorImpl< AnnotatedLine * > &AnnotatedLines)
Definition: NamespaceEndCommentsFixer.cpp:271

clang::threadSafety::sx::toString
std::string toString(const til::SExpr *E)
Definition: ThreadSafetyCommon.h:91

clang::tok::TokenKind
TokenKind
Provides a simple uniform namespace for tokens from all C languages.
Definition: TokenKinds.h:25

clang::transformer::name
RangeSelector name(std::string ID)
Given a node with a "name", (like NamedDecl, DeclRefExpr, CxxCtorInitializer, and TypeLoc) selects th...
Definition: RangeSelector.cpp:200

clang
The JSON file list parser is used to communicate input to InstallAPI.
Definition: CalledOnceCheck.h:17

clang::ComparisonCategoryType::First
@ First

clang::CXXNewInitializationStyle::Braces
@ Braces
New-expression has a C++11 list-initializer.

SIZE_MAX
#define SIZE_MAX
Definition: stdint.h:889

clang::format::FormatStyle::SpacesInLineComment::Minimum
unsigned Minimum
The minimum number of spaces at the start of the comment.
Definition: Format.h:4580

clang::format::FormatStyle
The FormatStyle is used to configure the formatting to follow specific guidelines.
Definition: Format.h:55

clang::format::FormatStyle::SpacesBeforeTrailingComments
unsigned SpacesBeforeTrailingComments
The number of spaces before trailing line comments (// - comments).
Definition: Format.h:4528

clang::format::FormatStyle::CompactNamespaces
bool CompactNamespaces
If true, consecutive namespace declarations will be on the same line.
Definition: Format.h:2415

clang::format::FormatStyle::SpacesInLineCommentPrefix
SpacesInLineComment SpacesInLineCommentPrefix
How many spaces are allowed at the start of a line comment.
Definition: Format.h:4617

clang::format::FormatStyle::ShortNamespaceLines
unsigned ShortNamespaceLines
The maximal number of unwrapped lines that a short namespace spans.
Definition: Format.h:4064

clang::format::FormatToken
A wrapper around a Token storing information about the whitespace characters preceding it.
Definition: FormatToken.h:290

clang::format::FormatToken::isNot
bool isNot(T Kind) const
Definition: FormatToken.h:621

clang::format::FormatToken::TokenText
StringRef TokenText
The raw text of the token.
Definition: FormatToken.h:310

clang::format::FormatToken::getNamespaceToken
const FormatToken * getNamespaceToken() const
Return the actual namespace token, if this token starts a namespace block.
Definition: FormatToken.h:847

clang::format::FormatToken::Finalized
unsigned Finalized
If true, this token has been fully formatted (indented and potentially re-formatted inside),...
Definition: FormatToken.h:369

clang::format::FormatToken::Next
FormatToken * Next
The next token in the unwrapped line.
Definition: FormatToken.h:562

clang::format::FormatToken::NewlinesBefore
unsigned NewlinesBefore
The number of newlines immediately before the Token.
Definition: FormatToken.h:459

clang::format::FormatToken::is
bool is(tok::TokenKind Kind) const
Definition: FormatToken.h:602

clang::format::UnwrappedLine::kInvalidIndex
static const size_t kInvalidIndex
Definition: UnwrappedLineParser.h:71