proxy/index.php

//===--- DefinitionBlockSeparator.cpp ---------------------------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

///

/// \file

/// This file implements DefinitionBlockSeparator, a TokenAnalyzer that inserts

/// or removes empty lines separating definition blocks like classes, structs,

/// functions, enums, and namespaces in between.

///

//===----------------------------------------------------------------------===//


#include "DefinitionBlockSeparator.h"
#include "llvm/Support/Error.h"
#include <utility>

#define DEBUG_TYPE "definition-block-separator"


namespace clang {

namespace format {

/// Analyzer entry point: collects the empty-line replacements for the
/// definition blocks found in \p AnnotatedLines.
///
/// Must not be invoked when the style is SDS_Leave (asserted). The lines are
/// first handed to AffectedRangeMgr.computeAffectedLines(); separateBlocks()
/// later skips every target line whose `Affected` flag is not set.
///
/// \param Annotator      Not used by this implementation.
/// \param AnnotatedLines Lines to inspect.
/// \param Tokens         Lexer, forwarded to separateBlocks() for its keyword
///                       table.
/// \returns The gathered replacements paired with an unsigned value that is
///          always 0 here.
std::pair<tooling::Replacements, unsigned> DefinitionBlockSeparator::analyze(
    TokenAnnotator &Annotator, SmallVectorImpl<AnnotatedLine *> &AnnotatedLines,
    FormatTokenLexer &Tokens) {
  assert(Style.SeparateDefinitionBlocks != FormatStyle::SDS_Leave);

  tooling::Replacements Replaces;

  AffectedRangeMgr.computeAffectedLines(AnnotatedLines);
  separateBlocks(AnnotatedLines, Replaces, Tokens);

  return {Replaces, 0};
}


/// Scans \p Lines for definition blocks and records, in \p Result, the
/// whitespace replacements that set the number of newlines before the first
/// token of the lines surrounding each block.
///
/// A line is treated as (likely) starting a definition when it might be a
/// function definition, starts with a namespace, or contains `class`,
/// `struct`, `union`, `enum` (or `function` for JavaScript) outside of any
/// bracket. Enum blocks are detected separately because no scope
/// opening/closing information is available for them.
///
/// With SDS_Always two newlines (one empty line) are requested, otherwise a
/// single newline. Lines inside preprocessor directives are skipped, and no
/// replacement is emitted for EOF tokens, access specifiers, or lines that
/// are not marked `Affected`.
///
/// \param Lines  Annotated lines to inspect.
/// \param Result Receives the generated replacements. Filling stops at the
///               first replacement that cannot be added.
/// \param Tokens Lexer used only for its additional keyword table.
void DefinitionBlockSeparator::separateBlocks(
    SmallVectorImpl<AnnotatedLine *> &Lines, tooling::Replacements &Result,
    FormatTokenLexer &Tokens) {
  const bool IsNeverStyle =
      Style.SeparateDefinitionBlocks == FormatStyle::SDS_Never;
  const AdditionalKeywords &ExtraKeywords = Tokens.getKeywords();
  // +1 for an opening brace/paren/square, -1 for a closing one, 0 otherwise.
  auto GetBracketLevelChange = [](const FormatToken *Tok) {
    if (Tok->isOneOf(tok::l_brace, tok::l_paren, tok::l_square))
      return 1;
    if (Tok->isOneOf(tok::r_brace, tok::r_paren, tok::r_square))
      return -1;
    return 0;
  };
  // Heuristic: does Line look like the start of a definition? Keywords are
  // only considered at bracket level 0, i.e. not nested inside (), [] or {}.
  // ExcludeEnum makes a bare `enum` keyword not count.
  auto LikelyDefinition = [&](const AnnotatedLine *Line,
                              bool ExcludeEnum = false) {
    if ((Line->MightBeFunctionDecl && Line->mightBeFunctionDefinition()) ||
        Line->startsWithNamespace()) {
      return true;
    }
    int BracketLevel = 0;
    for (const FormatToken *CurrentToken = Line->First; CurrentToken;
         CurrentToken = CurrentToken->Next) {
      if (BracketLevel == 0) {
        if (CurrentToken->isOneOf(tok::kw_class, tok::kw_struct,
                                  tok::kw_union) ||
            (Style.isJavaScript() &&
             CurrentToken->is(ExtraKeywords.kw_function))) {
          return true;
        }
        if (!ExcludeEnum && CurrentToken->is(tok::kw_enum))
          return true;
      }
      BracketLevel += GetBracketLevelChange(CurrentToken);
    }
    return false;
  };
  // SDS_Always: 2 newlines (one empty line); any other style: 1 newline.
  unsigned NewlineCount =
      (Style.SeparateDefinitionBlocks == FormatStyle::SDS_Always ? 1 : 0) + 1;
  // For LineEnding values greater than LE_CRLF, CRLF usage is inferred from
  // the input buffer (defaulting to CRLF only for LE_DeriveCRLF); otherwise
  // CRLF is used exactly when the style is LE_CRLF.
  WhitespaceManager Whitespaces(
      Env.getSourceManager(), Style,
      Style.LineEnding > FormatStyle::LE_CRLF
          ? WhitespaceManager::inputUsesCRLF(
                Env.getSourceManager().getBufferData(Env.getFileID()),
                Style.LineEnding == FormatStyle::LE_DeriveCRLF)
          : Style.LineEnding == FormatStyle::LE_CRLF);
  for (unsigned I = 0; I < Lines.size(); ++I) {
    const auto &CurrentLine = Lines[I];
    if (CurrentLine->InPPDirective)
      continue;
    // The lambdas below capture these by reference; they are (re)assigned
    // before every InsertReplacement() call.
    FormatToken *TargetToken = nullptr;
    // Initialized so that the assert in InsertReplacement reliably fires if a
    // code path ever forgets to set it.
    AnnotatedLine *TargetLine = nullptr;
    auto OpeningLineIndex = CurrentLine->MatchingOpeningBlockLineIndex;
    AnnotatedLine *OpeningLine = nullptr;
    const auto IsAccessSpecifierToken = [](const FormatToken *Token) {
      return Token->isAccessSpecifier() || Token->isObjCAccessSpecifier();
    };
    // Requests NewlineToInsert newlines before TargetToken, keeping its
    // original column, unless one of the exclusions below applies.
    const auto InsertReplacement = [&](const int NewlineToInsert) {
      assert(TargetLine);
      assert(TargetToken);

      // Do not handle EOF newlines.
      if (TargetToken->is(tok::eof))
        return;
      // Leave spacing alone at an access specifier or directly after one.
      if (IsAccessSpecifierToken(TargetToken) ||
          (OpeningLineIndex > 0 &&
           IsAccessSpecifierToken(Lines[OpeningLineIndex - 1]->First))) {
        return;
      }
      if (!TargetLine->Affected)
        return;
      Whitespaces.replaceWhitespace(*TargetToken, NewlineToInsert,
                                    TargetToken->OriginalColumn,
                                    TargetToken->OriginalColumn);
    };
    // True if the line is a `#if`-family / `#else` / `#elif*` / `#endif`
    // directive.
    const auto IsPPConditional = [&](const size_t LineIndex) {
      const auto &Line = Lines[LineIndex];
      return Line->First->is(tok::hash) && Line->First->Next &&
             Line->First->Next->isOneOf(tok::pp_if, tok::pp_ifdef, tok::pp_else,
                                        tok::pp_ifndef, tok::pp_elifndef,
                                        tok::pp_elifdef, tok::pp_elif,
                                        tok::pp_endif);
    };
    // True if the opening line is the first line, or the line before it ends
    // with a scope opener or is a preprocessor conditional.
    const auto FollowingOtherOpening = [&]() {
      return OpeningLineIndex == 0 ||
             Lines[OpeningLineIndex - 1]->Last->opensScope() ||
             IsPPConditional(OpeningLineIndex - 1);
    };
    // True if the current line has a top-level `enum` keyword followed by a
    // top-level `{`, either on this line or as the first token of the next.
    const auto HasEnumOnLine = [&]() {
      bool FoundEnumKeyword = false;
      int BracketLevel = 0;
      for (const FormatToken *CurrentToken = CurrentLine->First; CurrentToken;
           CurrentToken = CurrentToken->Next) {
        if (BracketLevel == 0) {
          if (CurrentToken->is(tok::kw_enum))
            FoundEnumKeyword = true;
          else if (FoundEnumKeyword && CurrentToken->is(tok::l_brace))
            return true;
        }
        BracketLevel += GetBracketLevelChange(CurrentToken);
      }
      return FoundEnumKeyword && I + 1 < Lines.size() &&
             Lines[I + 1]->First->is(tok::l_brace);
    };

    bool IsDefBlock = false;
    // Decides whether the line at OpeningLineIndex + Direction is something
    // that may sit directly in front of a definition (comment, free-standing
    // macro, C# attribute, ...) and therefore belongs to the block. Callers
    // guarantee OpeningLineIndex > 0 when Direction is -1.
    const auto MayPrecedeDefinition = [&](const int Direction = -1) {
      assert(Direction >= -1);
      assert(Direction <= 1);

      if (Lines[OpeningLineIndex]->First->is(TT_CSharpGenericTypeConstraint))
        return true;

      const size_t OperateIndex = OpeningLineIndex + Direction;
      assert(OperateIndex < Lines.size());
      const auto &OperateLine = Lines[OperateIndex];
      if (LikelyDefinition(OperateLine))
        return false;

      if (const auto *Tok = OperateLine->First;
          Tok->is(tok::comment) && !isClangFormatOn(Tok->TokenText)) {
        return true;
      }

      // A single line identifier that is not in the last line.
      if (OperateLine->First->is(tok::identifier) &&
          OperateLine->First == OperateLine->Last &&
          OperateIndex + 1 < Lines.size()) {
        // UnwrappedLineParser's recognition of free-standing macro like
        // Q_OBJECT may also recognize some uppercased type names that may be
        // used as return type as that kind of macros, which is a bit hard to
        // distinguish one from another purely from token patterns. Here, we
        // try not to add new lines below those identifiers.
        AnnotatedLine *NextLine = Lines[OperateIndex + 1];
        if (NextLine->MightBeFunctionDecl &&
            NextLine->mightBeFunctionDefinition() &&
            NextLine->First->NewlinesBefore == 1 &&
            OperateLine->First->is(TT_FunctionLikeOrFreestandingMacro)) {
          return true;
        }
      }

      if (Style.isCSharp() && OperateLine->First->is(TT_AttributeSquare))
        return true;
      return false;
    };

    if (HasEnumOnLine() &&
        !LikelyDefinition(CurrentLine, /*ExcludeEnum=*/true)) {
      // We have no scope opening/closing information for enum.
      IsDefBlock = true;
      OpeningLineIndex = I;
      // Extend the block upwards over lines that may precede the definition.
      while (OpeningLineIndex > 0 && MayPrecedeDefinition())
        --OpeningLineIndex;
      OpeningLine = Lines[OpeningLineIndex];
      TargetLine = OpeningLine;
      TargetToken = TargetLine->First;
      if (!FollowingOtherOpening())
        InsertReplacement(NewlineCount);
      else if (IsNeverStyle)
        InsertReplacement(OpeningLineIndex != 0);
      // Look for the closing brace on the current line; if it is not there,
      // advance I to the first following line that starts with `}`.
      TargetLine = CurrentLine;
      TargetToken = TargetLine->First;
      while (TargetToken && TargetToken->isNot(tok::r_brace))
        TargetToken = TargetToken->Next;
      if (!TargetToken)
        while (I < Lines.size() && Lines[I]->First->isNot(tok::r_brace))
          ++I;
    } else if (CurrentLine->First->closesScope()) {
      // No usable matching opening line. `>=` (not `>`) so that an index equal
      // to Lines.size() can never reach the Lines[OpeningLineIndex] accesses
      // below.
      if (OpeningLineIndex >= Lines.size())
        continue;
      // Handling the case that opening brace has its own line, with checking
      // whether the last line already had an opening brace to guard against
      // misrecognition.
      if (OpeningLineIndex > 0 &&
          Lines[OpeningLineIndex]->First->is(tok::l_brace) &&
          Lines[OpeningLineIndex - 1]->Last->isNot(tok::l_brace)) {
        --OpeningLineIndex;
      }
      OpeningLine = Lines[OpeningLineIndex];
      // Closing a function definition.
      if (LikelyDefinition(OpeningLine)) {
        IsDefBlock = true;
        while (OpeningLineIndex > 0 && MayPrecedeDefinition())
          --OpeningLineIndex;
        OpeningLine = Lines[OpeningLineIndex];
        TargetLine = OpeningLine;
        TargetToken = TargetLine->First;
        if (!FollowingOtherOpening()) {
          // Avoid duplicated replacement.
          if (TargetToken->isNot(tok::l_brace))
            InsertReplacement(NewlineCount);
        } else if (IsNeverStyle) {
          InsertReplacement(OpeningLineIndex != 0);
        }
      }
    }

    // Not the last token.
    if (IsDefBlock && I + 1 < Lines.size()) {
      OpeningLineIndex = I + 1;
      TargetLine = Lines[OpeningLineIndex];
      TargetToken = TargetLine->First;

      // No empty line for continuously closing scopes. The token will be
      // handled in another case if the line following is opening a
      // definition.
      if (!TargetToken->closesScope() && !IsPPConditional(OpeningLineIndex)) {
        // Check whether current line may precede a definition line.
        while (OpeningLineIndex + 1 < Lines.size() &&
               MayPrecedeDefinition(/*Direction=*/0)) {
          ++OpeningLineIndex;
        }
        TargetLine = Lines[OpeningLineIndex];
        // Only separate here when what follows is not itself a definition;
        // a following definition gets its separation when it is processed.
        if (!LikelyDefinition(TargetLine)) {
          OpeningLineIndex = I + 1;
          TargetLine = Lines[I + 1];
          TargetToken = TargetLine->First;
          InsertReplacement(NewlineCount);
        }
      } else if (IsNeverStyle) {
        InsertReplacement(/*NewlineToInsert=*/1);
      }
    }
  }
  for (const auto &R : Whitespaces.generateReplacements()) {
    // The add method returns an Error instance which simulates program exit
    // code through overloading boolean operator, thus false here indicates
    // success. A failure-state Error must be handled before it is destroyed,
    // so consume it explicitly instead of dropping it, then stop.
    if (llvm::Error Err = Result.add(R)) {
      llvm::consumeError(std::move(Err));
      return;
    }
  }
}

} // namespace format

} // namespace clang

DefinitionBlockSeparator.h
This file declares DefinitionBlockSeparator, a TokenAnalyzer that inserts or removes empty lines separating definition blocks like classes, structs, functions, enums, and namespaces in between.

clang::SourceManager::getBufferData
StringRef getBufferData(FileID FID, bool *Invalid=nullptr) const
Return a StringRef to the source buffer data for the specified FileID.
Definition: SourceManager.cpp:765

clang::format::AffectedRangeManager::computeAffectedLines
bool computeAffectedLines(SmallVectorImpl< AnnotatedLine * > &Lines)
Definition: AffectedRangeManager.cpp:22

clang::format::DefinitionBlockSeparator::analyze
std::pair< tooling::Replacements, unsigned > analyze(TokenAnnotator &Annotator, SmallVectorImpl< AnnotatedLine * > &AnnotatedLines, FormatTokenLexer &Tokens) override
Definition: DefinitionBlockSeparator.cpp:21

clang::format::Environment::getFileID
FileID getFileID() const
Definition: TokenAnalyzer.h:36

clang::format::Environment::getSourceManager
SourceManager & getSourceManager() const
Definition: TokenAnalyzer.h:38

clang::format::FormatTokenLexer
Definition: FormatTokenLexer.h:35

clang::format::TokenAnalyzer::Style
FormatStyle Style
Definition: TokenAnalyzer.h:94

clang::format::TokenAnalyzer::AffectedRangeMgr
AffectedRangeManager AffectedRangeMgr
Definition: TokenAnalyzer.h:99

clang::format::TokenAnalyzer::Env
const Environment & Env
Definition: TokenAnalyzer.h:97

clang::format::TokenAnnotator
Determines extra information about the tokens comprising an UnwrappedLine.
Definition: TokenAnnotator.h:223

clang::format::WhitespaceManager::inputUsesCRLF
static bool inputUsesCRLF(StringRef Text, bool DefaultToCRLF)
Infers whether the input is using CRLF.
Definition: WhitespaceManager.cpp:82

clang::tooling::Replacements
Maintains a set of replacements that are conflict-free.
Definition: Replacement.h:212

llvm::SmallVectorImpl
Definition: Randstruct.h:18

clang::format::isClangFormatOn
bool isClangFormatOn(StringRef Comment)
Definition: Format.cpp:4432

clang::lifetimes::internal::Direction
Direction
Definition: LifetimeSafety.cpp:580

clang
The JSON file list parser is used to communicate input to InstallAPI.
Definition: CalledOnceCheck.h:17

clang::ObjCSubstitutionContext::Result
@ Result
The result type of a method or function.

clang::ComparisonCategoryType::First
@ First

clang::SourceLocIdentKind::Line
@ Line

clang::format::AdditionalKeywords
Encapsulates keywords that are context sensitive or for languages not properly supported by Clang's lexer.
Definition: FormatToken.h:1026

clang::format::AdditionalKeywords::kw_function
IdentifierInfo * kw_function
Definition: FormatToken.h:1389

clang::format::FormatStyle::SDS_Never
@ SDS_Never
Remove any empty line between definition blocks.
Definition: Format.h:4294

clang::format::FormatStyle::SDS_Always
@ SDS_Always
Insert an empty line between definition blocks.
Definition: Format.h:4292

clang::format::FormatStyle::SDS_Leave
@ SDS_Leave
Leave definition blocks as they are.
Definition: Format.h:4290

clang::format::FormatStyle::LE_CRLF
@ LE_CRLF
Use \r\n.
Definition: Format.h:3407

clang::format::FormatStyle::LE_DeriveCRLF
@ LE_DeriveCRLF
Use \r\n unless the input has more lines ending in \n.
Definition: Format.h:3411

clang::format::FormatStyle::isCSharp
bool isCSharp() const
Definition: Format.h:3384

clang::format::FormatStyle::isJavaScript
bool isJavaScript() const
Definition: Format.h:3387

clang::format::FormatStyle::LineEnding
LineEndingStyle LineEnding
Line ending style (\n or \r\n) to use.
Definition: Format.h:3416

clang::format::FormatStyle::SeparateDefinitionBlocks
SeparateDefinitionStyle SeparateDefinitionBlocks
Specifies the use of empty lines to separate definition blocks, including classes, structs, enums, and functions.
Definition: Format.h:4343

clang::format::FormatToken
A wrapper around a Token storing information about the whitespace characters preceding it.
Definition: FormatToken.h:300