1 //===--- FormatToken.cpp - Format C++ code --------------------------------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 /// 10 /// \file 11 /// \brief This file implements specific functions of \c FormatTokens and their 12 /// roles. 13 /// 14 //===----------------------------------------------------------------------===// 15 16 #include "FormatToken.h" 17 #include "ContinuationIndenter.h" 18 #include "clang/Format/Format.h" 19 #include "llvm/ADT/SmallVector.h" 20 #include "llvm/Support/Debug.h" 21 #include <climits> 22 23 namespace clang { 24 namespace format { 25 26 // FIXME: This is copy&pasted from Sema. Put it in a common place and remove 27 // duplication. 28 bool FormatToken::isSimpleTypeSpecifier() const { 29 switch (Tok.getKind()) { 30 case tok::kw_short: 31 case tok::kw_long: 32 case tok::kw___int64: 33 case tok::kw___int128: 34 case tok::kw_signed: 35 case tok::kw_unsigned: 36 case tok::kw_void: 37 case tok::kw_char: 38 case tok::kw_int: 39 case tok::kw_half: 40 case tok::kw_float: 41 case tok::kw_double: 42 case tok::kw_wchar_t: 43 case tok::kw_bool: 44 case tok::kw___underlying_type: 45 case tok::annot_typename: 46 case tok::kw_char16_t: 47 case tok::kw_char32_t: 48 case tok::kw_typeof: 49 case tok::kw_decltype: 50 return true; 51 default: 52 return false; 53 } 54 } 55 56 TokenRole::~TokenRole() {} 57 58 void TokenRole::precomputeFormattingInfos(const FormatToken *Token) {} 59 60 unsigned CommaSeparatedList::formatAfterToken(LineState &State, 61 ContinuationIndenter *Indenter, 62 bool DryRun) { 63 if (State.NextToken == nullptr || !State.NextToken->Previous) 64 return 0; 65 66 // Ensure that we start on the opening brace. 67 const FormatToken *LBrace = 68 State.NextToken->Previous->getPreviousNonComment(); 69 if (!LBrace || LBrace->isNot(tok::l_brace) || LBrace->BlockKind == BK_Block || 70 LBrace->Type == TT_DictLiteral || 71 LBrace->Next->Type == TT_DesignatedInitializerPeriod) 72 return 0; 73 74 // Calculate the number of code points we have to format this list. As the 75 // first token is already placed, we have to subtract it. 76 unsigned RemainingCodePoints = 77 Style.ColumnLimit - State.Column + State.NextToken->Previous->ColumnWidth; 78 79 // Find the best ColumnFormat, i.e. the best number of columns to use. 80 const ColumnFormat *Format = getColumnFormat(RemainingCodePoints); 81 // If no ColumnFormat can be used, the braced list would generally be 82 // bin-packed. Add a severe penalty to this so that column layouts are 83 // preferred if possible. 84 if (!Format) 85 return 10000; 86 87 // Format the entire list. 88 unsigned Penalty = 0; 89 unsigned Column = 0; 90 unsigned Item = 0; 91 while (State.NextToken != LBrace->MatchingParen) { 92 bool NewLine = false; 93 unsigned ExtraSpaces = 0; 94 95 // If the previous token was one of our commas, we are now on the next item. 96 if (Item < Commas.size() && State.NextToken->Previous == Commas[Item]) { 97 if (!State.NextToken->isTrailingComment()) { 98 ExtraSpaces += Format->ColumnSizes[Column] - ItemLengths[Item]; 99 ++Column; 100 } 101 ++Item; 102 } 103 104 if (Column == Format->Columns || State.NextToken->MustBreakBefore) { 105 Column = 0; 106 NewLine = true; 107 } 108 109 // Place token using the continuation indenter and store the penalty. 110 Penalty += Indenter->addTokenToState(State, NewLine, DryRun, ExtraSpaces); 111 } 112 return Penalty; 113 } 114 115 unsigned CommaSeparatedList::formatFromToken(LineState &State, 116 ContinuationIndenter *Indenter, 117 bool DryRun) { 118 if (HasNestedBracedList) 119 State.Stack.back().AvoidBinPacking = true; 120 return 0; 121 } 122 123 // Returns the lengths in code points between Begin and End (both included), 124 // assuming that the entire sequence is put on a single line. 125 static unsigned CodePointsBetween(const FormatToken *Begin, 126 const FormatToken *End) { 127 assert(End->TotalLength >= Begin->TotalLength); 128 return End->TotalLength - Begin->TotalLength + Begin->ColumnWidth; 129 } 130 131 void CommaSeparatedList::precomputeFormattingInfos(const FormatToken *Token) { 132 // FIXME: At some point we might want to do this for other lists, too. 133 if (!Token->MatchingParen || Token->isNot(tok::l_brace)) 134 return; 135 136 // In C++11 braced list style, we should not format in columns unless they 137 // have many items (20 or more) or we allow bin-packing of function call 138 // arguments. 139 if (Style.Cpp11BracedListStyle && !Style.BinPackArguments && 140 Commas.size() < 19) 141 return; 142 143 // Column format doesn't really make sense if we don't align after brackets. 144 if (!Style.AlignAfterOpenBracket) 145 return; 146 147 FormatToken *ItemBegin = Token->Next; 148 while (ItemBegin->isTrailingComment()) 149 ItemBegin = ItemBegin->Next; 150 SmallVector<bool, 8> MustBreakBeforeItem; 151 152 // The lengths of an item if it is put at the end of the line. This includes 153 // trailing comments which are otherwise ignored for column alignment. 154 SmallVector<unsigned, 8> EndOfLineItemLength; 155 156 bool HasSeparatingComment = false; 157 for (unsigned i = 0, e = Commas.size() + 1; i != e; ++i) { 158 // Skip comments on their own line. 159 while (ItemBegin->HasUnescapedNewline && ItemBegin->isTrailingComment()) { 160 ItemBegin = ItemBegin->Next; 161 HasSeparatingComment = i > 0; 162 } 163 164 MustBreakBeforeItem.push_back(ItemBegin->MustBreakBefore); 165 if (ItemBegin->is(tok::l_brace)) 166 HasNestedBracedList = true; 167 const FormatToken *ItemEnd = nullptr; 168 if (i == Commas.size()) { 169 ItemEnd = Token->MatchingParen; 170 const FormatToken *NonCommentEnd = ItemEnd->getPreviousNonComment(); 171 ItemLengths.push_back(CodePointsBetween(ItemBegin, NonCommentEnd)); 172 if (Style.Cpp11BracedListStyle) { 173 // In Cpp11 braced list style, the } and possibly other subsequent 174 // tokens will need to stay on a line with the last element. 175 while (ItemEnd->Next && !ItemEnd->Next->CanBreakBefore) 176 ItemEnd = ItemEnd->Next; 177 } else { 178 // In other braced lists styles, the "}" can be wrapped to the new line. 179 ItemEnd = Token->MatchingParen->Previous; 180 } 181 } else { 182 ItemEnd = Commas[i]; 183 // The comma is counted as part of the item when calculating the length. 184 ItemLengths.push_back(CodePointsBetween(ItemBegin, ItemEnd)); 185 186 // Consume trailing comments so the are included in EndOfLineItemLength. 187 if (ItemEnd->Next && !ItemEnd->Next->HasUnescapedNewline && 188 ItemEnd->Next->isTrailingComment()) 189 ItemEnd = ItemEnd->Next; 190 } 191 EndOfLineItemLength.push_back(CodePointsBetween(ItemBegin, ItemEnd)); 192 // If there is a trailing comma in the list, the next item will start at the 193 // closing brace. Don't create an extra item for this. 194 if (ItemEnd->getNextNonComment() == Token->MatchingParen) 195 break; 196 ItemBegin = ItemEnd->Next; 197 } 198 199 // Don't use column layout for nested lists, lists with few elements and in 200 // presence of separating comments. 201 if (Token->NestingLevel != 0 || Commas.size() < 5 || HasSeparatingComment) 202 return; 203 204 // We can never place more than ColumnLimit / 3 items in a row (because of the 205 // spaces and the comma). 206 unsigned MaxItems = Style.ColumnLimit / 3; 207 std::vector<unsigned> MinSizeInColumn; 208 MinSizeInColumn.reserve(MaxItems); 209 for (unsigned Columns = 1; Columns <= MaxItems; ++Columns) { 210 ColumnFormat Format; 211 Format.Columns = Columns; 212 Format.ColumnSizes.resize(Columns); 213 MinSizeInColumn.assign(Columns, UINT_MAX); 214 Format.LineCount = 1; 215 bool HasRowWithSufficientColumns = false; 216 unsigned Column = 0; 217 for (unsigned i = 0, e = ItemLengths.size(); i != e; ++i) { 218 assert(i < MustBreakBeforeItem.size()); 219 if (MustBreakBeforeItem[i] || Column == Columns) { 220 ++Format.LineCount; 221 Column = 0; 222 } 223 if (Column == Columns - 1) 224 HasRowWithSufficientColumns = true; 225 unsigned Length = 226 (Column == Columns - 1) ? EndOfLineItemLength[i] : ItemLengths[i]; 227 Format.ColumnSizes[Column] = std::max(Format.ColumnSizes[Column], Length); 228 MinSizeInColumn[Column] = std::min(MinSizeInColumn[Column], Length); 229 ++Column; 230 } 231 // If all rows are terminated early (e.g. by trailing comments), we don't 232 // need to look further. 233 if (!HasRowWithSufficientColumns) 234 break; 235 Format.TotalWidth = Columns - 1; // Width of the N-1 spaces. 236 237 for (unsigned i = 0; i < Columns; ++i) 238 Format.TotalWidth += Format.ColumnSizes[i]; 239 240 // Don't use this Format, if the difference between the longest and shortest 241 // element in a column exceeds a threshold to avoid excessive spaces. 242 if ([&] { 243 for (unsigned i = 0; i < Columns - 1; ++i) 244 if (Format.ColumnSizes[i] - MinSizeInColumn[i] > 10) 245 return true; 246 return false; 247 }()) 248 continue; 249 250 // Ignore layouts that are bound to violate the column limit. 251 if (Format.TotalWidth > Style.ColumnLimit) 252 continue; 253 254 Formats.push_back(Format); 255 } 256 } 257 258 const CommaSeparatedList::ColumnFormat * 259 CommaSeparatedList::getColumnFormat(unsigned RemainingCharacters) const { 260 const ColumnFormat *BestFormat = nullptr; 261 for (SmallVector<ColumnFormat, 4>::const_reverse_iterator 262 I = Formats.rbegin(), 263 E = Formats.rend(); 264 I != E; ++I) { 265 if (I->TotalWidth <= RemainingCharacters) { 266 if (BestFormat && I->LineCount > BestFormat->LineCount) 267 break; 268 BestFormat = &*I; 269 } 270 } 271 return BestFormat; 272 } 273 274 } // namespace format 275 } // namespace clang 276