1 //===--- DefinitionBlockSeparator.cpp ---------------------------*- C++ -*-===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 /// 9 /// \file 10 /// This file implements DefinitionBlockSeparator, a TokenAnalyzer that inserts 11 /// or removes empty lines separating definition blocks like classes, structs, 12 /// functions, enums, and namespaces in between. 13 /// 14 //===----------------------------------------------------------------------===// 15 16 #include "DefinitionBlockSeparator.h" 17 #include "llvm/Support/Debug.h" 18 #define DEBUG_TYPE "definition-block-separator" 19 20 namespace clang { 21 namespace format { 22 std::pair<tooling::Replacements, unsigned> DefinitionBlockSeparator::analyze( 23 TokenAnnotator &Annotator, SmallVectorImpl<AnnotatedLine *> &AnnotatedLines, 24 FormatTokenLexer &Tokens) { 25 assert(Style.SeparateDefinitionBlocks != FormatStyle::SDS_Leave); 26 AffectedRangeMgr.computeAffectedLines(AnnotatedLines); 27 tooling::Replacements Result; 28 separateBlocks(AnnotatedLines, Result, Tokens); 29 return {Result, 0}; 30 } 31 32 void DefinitionBlockSeparator::separateBlocks( 33 SmallVectorImpl<AnnotatedLine *> &Lines, tooling::Replacements &Result, 34 FormatTokenLexer &Tokens) { 35 const bool IsNeverStyle = 36 Style.SeparateDefinitionBlocks == FormatStyle::SDS_Never; 37 const AdditionalKeywords &ExtraKeywords = Tokens.getKeywords(); 38 auto GetBracketLevelChange = [](const FormatToken *Tok) { 39 if (Tok->isOneOf(tok::l_brace, tok::l_paren, tok::l_square)) 40 return 1; 41 if (Tok->isOneOf(tok::r_brace, tok::r_paren, tok::r_square)) 42 return -1; 43 return 0; 44 }; 45 auto LikelyDefinition = [&](const AnnotatedLine *Line, 46 bool ExcludeEnum = false) { 47 if ((Line->MightBeFunctionDecl && Line->mightBeFunctionDefinition()) || 48 Line->startsWithNamespace()) { 49 return true; 50 } 51 int BracketLevel = 0; 52 for (const FormatToken *CurrentToken = Line->First; CurrentToken; 53 CurrentToken = CurrentToken->Next) { 54 if (BracketLevel == 0) { 55 if (CurrentToken->isOneOf(tok::kw_class, tok::kw_struct, 56 tok::kw_union) || 57 (Style.isJavaScript() && 58 CurrentToken->is(ExtraKeywords.kw_function))) { 59 return true; 60 } 61 if (!ExcludeEnum && CurrentToken->is(tok::kw_enum)) 62 return true; 63 } 64 BracketLevel += GetBracketLevelChange(CurrentToken); 65 } 66 return false; 67 }; 68 unsigned NewlineCount = 69 (Style.SeparateDefinitionBlocks == FormatStyle::SDS_Always ? 1 : 0) + 1; 70 WhitespaceManager Whitespaces( 71 Env.getSourceManager(), Style, 72 Style.LineEnding > FormatStyle::LE_CRLF 73 ? WhitespaceManager::inputUsesCRLF( 74 Env.getSourceManager().getBufferData(Env.getFileID()), 75 Style.LineEnding == FormatStyle::LE_DeriveCRLF) 76 : Style.LineEnding == FormatStyle::LE_CRLF); 77 for (unsigned I = 0; I < Lines.size(); ++I) { 78 const auto &CurrentLine = Lines[I]; 79 if (CurrentLine->InPPDirective) 80 continue; 81 FormatToken *TargetToken = nullptr; 82 AnnotatedLine *TargetLine; 83 auto OpeningLineIndex = CurrentLine->MatchingOpeningBlockLineIndex; 84 AnnotatedLine *OpeningLine = nullptr; 85 const auto IsAccessSpecifierToken = [](const FormatToken *Token) { 86 return Token->isAccessSpecifier() || Token->isObjCAccessSpecifier(); 87 }; 88 const auto InsertReplacement = [&](const int NewlineToInsert) { 89 assert(TargetLine); 90 assert(TargetToken); 91 92 // Do not handle EOF newlines. 93 if (TargetToken->is(tok::eof)) 94 return; 95 if (IsAccessSpecifierToken(TargetToken) || 96 (OpeningLineIndex > 0 && 97 IsAccessSpecifierToken(Lines[OpeningLineIndex - 1]->First))) { 98 return; 99 } 100 if (!TargetLine->Affected) 101 return; 102 Whitespaces.replaceWhitespace(*TargetToken, NewlineToInsert, 103 TargetToken->OriginalColumn, 104 TargetToken->OriginalColumn); 105 }; 106 const auto IsPPConditional = [&](const size_t LineIndex) { 107 const auto &Line = Lines[LineIndex]; 108 return Line->First->is(tok::hash) && Line->First->Next && 109 Line->First->Next->isOneOf(tok::pp_if, tok::pp_ifdef, tok::pp_else, 110 tok::pp_ifndef, tok::pp_elifndef, 111 tok::pp_elifdef, tok::pp_elif, 112 tok::pp_endif); 113 }; 114 const auto FollowingOtherOpening = [&]() { 115 return OpeningLineIndex == 0 || 116 Lines[OpeningLineIndex - 1]->Last->opensScope() || 117 IsPPConditional(OpeningLineIndex - 1); 118 }; 119 const auto HasEnumOnLine = [&]() { 120 bool FoundEnumKeyword = false; 121 int BracketLevel = 0; 122 for (const FormatToken *CurrentToken = CurrentLine->First; CurrentToken; 123 CurrentToken = CurrentToken->Next) { 124 if (BracketLevel == 0) { 125 if (CurrentToken->is(tok::kw_enum)) 126 FoundEnumKeyword = true; 127 else if (FoundEnumKeyword && CurrentToken->is(tok::l_brace)) 128 return true; 129 } 130 BracketLevel += GetBracketLevelChange(CurrentToken); 131 } 132 return FoundEnumKeyword && I + 1 < Lines.size() && 133 Lines[I + 1]->First->is(tok::l_brace); 134 }; 135 136 bool IsDefBlock = false; 137 const auto MayPrecedeDefinition = [&](const int Direction = -1) { 138 assert(Direction >= -1); 139 assert(Direction <= 1); 140 const size_t OperateIndex = OpeningLineIndex + Direction; 141 assert(OperateIndex < Lines.size()); 142 const auto &OperateLine = Lines[OperateIndex]; 143 if (LikelyDefinition(OperateLine)) 144 return false; 145 146 if (OperateLine->First->is(tok::comment)) 147 return true; 148 149 // A single line identifier that is not in the last line. 150 if (OperateLine->First->is(tok::identifier) && 151 OperateLine->First == OperateLine->Last && 152 OperateIndex + 1 < Lines.size()) { 153 // UnwrappedLineParser's recognition of free-standing macro like 154 // Q_OBJECT may also recognize some uppercased type names that may be 155 // used as return type as that kind of macros, which is a bit hard to 156 // distinguish one from another purely from token patterns. Here, we 157 // try not to add new lines below those identifiers. 158 AnnotatedLine *NextLine = Lines[OperateIndex + 1]; 159 if (NextLine->MightBeFunctionDecl && 160 NextLine->mightBeFunctionDefinition() && 161 NextLine->First->NewlinesBefore == 1 && 162 OperateLine->First->is(TT_FunctionLikeOrFreestandingMacro)) { 163 return true; 164 } 165 } 166 167 if (Style.isCSharp() && OperateLine->First->is(TT_AttributeSquare)) 168 return true; 169 return false; 170 }; 171 172 if (HasEnumOnLine() && 173 !LikelyDefinition(CurrentLine, /*ExcludeEnum=*/true)) { 174 // We have no scope opening/closing information for enum. 175 IsDefBlock = true; 176 OpeningLineIndex = I; 177 while (OpeningLineIndex > 0 && MayPrecedeDefinition()) 178 --OpeningLineIndex; 179 OpeningLine = Lines[OpeningLineIndex]; 180 TargetLine = OpeningLine; 181 TargetToken = TargetLine->First; 182 if (!FollowingOtherOpening()) 183 InsertReplacement(NewlineCount); 184 else if (IsNeverStyle) 185 InsertReplacement(OpeningLineIndex != 0); 186 TargetLine = CurrentLine; 187 TargetToken = TargetLine->First; 188 while (TargetToken && !TargetToken->is(tok::r_brace)) 189 TargetToken = TargetToken->Next; 190 if (!TargetToken) 191 while (I < Lines.size() && !Lines[I]->First->is(tok::r_brace)) 192 ++I; 193 } else if (CurrentLine->First->closesScope()) { 194 if (OpeningLineIndex > Lines.size()) 195 continue; 196 // Handling the case that opening brace has its own line, with checking 197 // whether the last line already had an opening brace to guard against 198 // misrecognition. 199 if (OpeningLineIndex > 0 && 200 Lines[OpeningLineIndex]->First->is(tok::l_brace) && 201 Lines[OpeningLineIndex - 1]->Last->isNot(tok::l_brace)) { 202 --OpeningLineIndex; 203 } 204 OpeningLine = Lines[OpeningLineIndex]; 205 // Closing a function definition. 206 if (LikelyDefinition(OpeningLine)) { 207 IsDefBlock = true; 208 while (OpeningLineIndex > 0 && MayPrecedeDefinition()) 209 --OpeningLineIndex; 210 OpeningLine = Lines[OpeningLineIndex]; 211 TargetLine = OpeningLine; 212 TargetToken = TargetLine->First; 213 if (!FollowingOtherOpening()) { 214 // Avoid duplicated replacement. 215 if (TargetToken->isNot(tok::l_brace)) 216 InsertReplacement(NewlineCount); 217 } else if (IsNeverStyle) { 218 InsertReplacement(OpeningLineIndex != 0); 219 } 220 } 221 } 222 223 // Not the last token. 224 if (IsDefBlock && I + 1 < Lines.size()) { 225 OpeningLineIndex = I + 1; 226 TargetLine = Lines[OpeningLineIndex]; 227 TargetToken = TargetLine->First; 228 229 // No empty line for continuously closing scopes. The token will be 230 // handled in another case if the line following is opening a 231 // definition. 232 if (!TargetToken->closesScope() && !IsPPConditional(OpeningLineIndex)) { 233 // Check whether current line may precede a definition line. 234 while (OpeningLineIndex + 1 < Lines.size() && 235 MayPrecedeDefinition(/*Direction=*/0)) { 236 ++OpeningLineIndex; 237 } 238 TargetLine = Lines[OpeningLineIndex]; 239 if (!LikelyDefinition(TargetLine)) { 240 OpeningLineIndex = I + 1; 241 TargetLine = Lines[I + 1]; 242 TargetToken = TargetLine->First; 243 InsertReplacement(NewlineCount); 244 } 245 } else if (IsNeverStyle) { 246 InsertReplacement(/*NewlineToInsert=*/1); 247 } 248 } 249 } 250 for (const auto &R : Whitespaces.generateReplacements()) { 251 // The add method returns an Error instance which simulates program exit 252 // code through overloading boolean operator, thus false here indicates 253 // success. 254 if (Result.add(R)) 255 return; 256 } 257 } 258 } // namespace format 259 } // namespace clang 260