xref: /aosp_15_r20/external/clang/lib/Format/WhitespaceManager.cpp (revision 67e74705e28f6214e480b399dd47ea732279e315)
//===--- WhitespaceManager.cpp - Format C++ code --------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
///
/// \file
/// \brief This file implements the WhitespaceManager class.
///
//===----------------------------------------------------------------------===//
14*67e74705SXin Li 
15*67e74705SXin Li #include "WhitespaceManager.h"
16*67e74705SXin Li #include "llvm/ADT/STLExtras.h"
17*67e74705SXin Li 
18*67e74705SXin Li namespace clang {
19*67e74705SXin Li namespace format {
20*67e74705SXin Li 
21*67e74705SXin Li bool WhitespaceManager::Change::IsBeforeInFile::
operator ()(const Change & C1,const Change & C2) const22*67e74705SXin Li operator()(const Change &C1, const Change &C2) const {
23*67e74705SXin Li   return SourceMgr.isBeforeInTranslationUnit(
24*67e74705SXin Li       C1.OriginalWhitespaceRange.getBegin(),
25*67e74705SXin Li       C2.OriginalWhitespaceRange.getBegin());
26*67e74705SXin Li }
27*67e74705SXin Li 
Change(bool CreateReplacement,SourceRange OriginalWhitespaceRange,unsigned IndentLevel,int Spaces,unsigned StartOfTokenColumn,unsigned NewlinesBefore,StringRef PreviousLinePostfix,StringRef CurrentLinePrefix,tok::TokenKind Kind,bool ContinuesPPDirective,bool IsStartOfDeclName,bool IsInsideToken)28*67e74705SXin Li WhitespaceManager::Change::Change(
29*67e74705SXin Li     bool CreateReplacement, SourceRange OriginalWhitespaceRange,
30*67e74705SXin Li     unsigned IndentLevel, int Spaces, unsigned StartOfTokenColumn,
31*67e74705SXin Li     unsigned NewlinesBefore, StringRef PreviousLinePostfix,
32*67e74705SXin Li     StringRef CurrentLinePrefix, tok::TokenKind Kind, bool ContinuesPPDirective,
33*67e74705SXin Li     bool IsStartOfDeclName, bool IsInsideToken)
34*67e74705SXin Li     : CreateReplacement(CreateReplacement),
35*67e74705SXin Li       OriginalWhitespaceRange(OriginalWhitespaceRange),
36*67e74705SXin Li       StartOfTokenColumn(StartOfTokenColumn), NewlinesBefore(NewlinesBefore),
37*67e74705SXin Li       PreviousLinePostfix(PreviousLinePostfix),
38*67e74705SXin Li       CurrentLinePrefix(CurrentLinePrefix), Kind(Kind),
39*67e74705SXin Li       ContinuesPPDirective(ContinuesPPDirective),
40*67e74705SXin Li       IsStartOfDeclName(IsStartOfDeclName), IndentLevel(IndentLevel),
41*67e74705SXin Li       Spaces(Spaces), IsInsideToken(IsInsideToken), IsTrailingComment(false),
42*67e74705SXin Li       TokenLength(0), PreviousEndOfTokenColumn(0), EscapedNewlineColumn(0),
43*67e74705SXin Li       StartOfBlockComment(nullptr), IndentationOffset(0) {}
44*67e74705SXin Li 
reset()45*67e74705SXin Li void WhitespaceManager::reset() {
46*67e74705SXin Li   Changes.clear();
47*67e74705SXin Li   Replaces.clear();
48*67e74705SXin Li }
49*67e74705SXin Li 
replaceWhitespace(FormatToken & Tok,unsigned Newlines,unsigned IndentLevel,unsigned Spaces,unsigned StartOfTokenColumn,bool InPPDirective)50*67e74705SXin Li void WhitespaceManager::replaceWhitespace(FormatToken &Tok, unsigned Newlines,
51*67e74705SXin Li                                           unsigned IndentLevel, unsigned Spaces,
52*67e74705SXin Li                                           unsigned StartOfTokenColumn,
53*67e74705SXin Li                                           bool InPPDirective) {
54*67e74705SXin Li   if (Tok.Finalized)
55*67e74705SXin Li     return;
56*67e74705SXin Li   Tok.Decision = (Newlines > 0) ? FD_Break : FD_Continue;
57*67e74705SXin Li   Changes.push_back(
58*67e74705SXin Li       Change(/*CreateReplacement=*/true, Tok.WhitespaceRange, IndentLevel,
59*67e74705SXin Li              Spaces, StartOfTokenColumn, Newlines, "", "", Tok.Tok.getKind(),
60*67e74705SXin Li              InPPDirective && !Tok.IsFirst,
61*67e74705SXin Li              Tok.is(TT_StartOfName) || Tok.is(TT_FunctionDeclarationName),
62*67e74705SXin Li              /*IsInsideToken=*/false));
63*67e74705SXin Li }
64*67e74705SXin Li 
addUntouchableToken(const FormatToken & Tok,bool InPPDirective)65*67e74705SXin Li void WhitespaceManager::addUntouchableToken(const FormatToken &Tok,
66*67e74705SXin Li                                             bool InPPDirective) {
67*67e74705SXin Li   if (Tok.Finalized)
68*67e74705SXin Li     return;
69*67e74705SXin Li   Changes.push_back(Change(
70*67e74705SXin Li       /*CreateReplacement=*/false, Tok.WhitespaceRange, /*IndentLevel=*/0,
71*67e74705SXin Li       /*Spaces=*/0, Tok.OriginalColumn, Tok.NewlinesBefore, "", "",
72*67e74705SXin Li       Tok.Tok.getKind(), InPPDirective && !Tok.IsFirst,
73*67e74705SXin Li       Tok.is(TT_StartOfName) || Tok.is(TT_FunctionDeclarationName),
74*67e74705SXin Li       /*IsInsideToken=*/false));
75*67e74705SXin Li }
76*67e74705SXin Li 
replaceWhitespaceInToken(const FormatToken & Tok,unsigned Offset,unsigned ReplaceChars,StringRef PreviousPostfix,StringRef CurrentPrefix,bool InPPDirective,unsigned Newlines,unsigned IndentLevel,int Spaces)77*67e74705SXin Li void WhitespaceManager::replaceWhitespaceInToken(
78*67e74705SXin Li     const FormatToken &Tok, unsigned Offset, unsigned ReplaceChars,
79*67e74705SXin Li     StringRef PreviousPostfix, StringRef CurrentPrefix, bool InPPDirective,
80*67e74705SXin Li     unsigned Newlines, unsigned IndentLevel, int Spaces) {
81*67e74705SXin Li   if (Tok.Finalized)
82*67e74705SXin Li     return;
83*67e74705SXin Li   SourceLocation Start = Tok.getStartOfNonWhitespace().getLocWithOffset(Offset);
84*67e74705SXin Li   Changes.push_back(Change(
85*67e74705SXin Li       true, SourceRange(Start, Start.getLocWithOffset(ReplaceChars)),
86*67e74705SXin Li       IndentLevel, Spaces, std::max(0, Spaces), Newlines, PreviousPostfix,
87*67e74705SXin Li       CurrentPrefix, Tok.is(TT_LineComment) ? tok::comment : tok::unknown,
88*67e74705SXin Li       InPPDirective && !Tok.IsFirst,
89*67e74705SXin Li       Tok.is(TT_StartOfName) || Tok.is(TT_FunctionDeclarationName),
90*67e74705SXin Li       /*IsInsideToken=*/Newlines == 0));
91*67e74705SXin Li }
92*67e74705SXin Li 
generateReplacements()93*67e74705SXin Li const tooling::Replacements &WhitespaceManager::generateReplacements() {
94*67e74705SXin Li   if (Changes.empty())
95*67e74705SXin Li     return Replaces;
96*67e74705SXin Li 
97*67e74705SXin Li   std::sort(Changes.begin(), Changes.end(), Change::IsBeforeInFile(SourceMgr));
98*67e74705SXin Li   calculateLineBreakInformation();
99*67e74705SXin Li   alignConsecutiveDeclarations();
100*67e74705SXin Li   alignConsecutiveAssignments();
101*67e74705SXin Li   alignTrailingComments();
102*67e74705SXin Li   alignEscapedNewlines();
103*67e74705SXin Li   generateChanges();
104*67e74705SXin Li 
105*67e74705SXin Li   return Replaces;
106*67e74705SXin Li }
107*67e74705SXin Li 
calculateLineBreakInformation()108*67e74705SXin Li void WhitespaceManager::calculateLineBreakInformation() {
109*67e74705SXin Li   Changes[0].PreviousEndOfTokenColumn = 0;
110*67e74705SXin Li   Change *LastOutsideTokenChange = &Changes[0];
111*67e74705SXin Li   for (unsigned i = 1, e = Changes.size(); i != e; ++i) {
112*67e74705SXin Li     unsigned OriginalWhitespaceStart =
113*67e74705SXin Li         SourceMgr.getFileOffset(Changes[i].OriginalWhitespaceRange.getBegin());
114*67e74705SXin Li     unsigned PreviousOriginalWhitespaceEnd = SourceMgr.getFileOffset(
115*67e74705SXin Li         Changes[i - 1].OriginalWhitespaceRange.getEnd());
116*67e74705SXin Li     Changes[i - 1].TokenLength = OriginalWhitespaceStart -
117*67e74705SXin Li                                  PreviousOriginalWhitespaceEnd +
118*67e74705SXin Li                                  Changes[i].PreviousLinePostfix.size() +
119*67e74705SXin Li                                  Changes[i - 1].CurrentLinePrefix.size();
120*67e74705SXin Li 
121*67e74705SXin Li     // If there are multiple changes in this token, sum up all the changes until
122*67e74705SXin Li     // the end of the line.
123*67e74705SXin Li     if (Changes[i - 1].IsInsideToken)
124*67e74705SXin Li       LastOutsideTokenChange->TokenLength +=
125*67e74705SXin Li           Changes[i - 1].TokenLength + Changes[i - 1].Spaces;
126*67e74705SXin Li     else
127*67e74705SXin Li       LastOutsideTokenChange = &Changes[i - 1];
128*67e74705SXin Li 
129*67e74705SXin Li     Changes[i].PreviousEndOfTokenColumn =
130*67e74705SXin Li         Changes[i - 1].StartOfTokenColumn + Changes[i - 1].TokenLength;
131*67e74705SXin Li 
132*67e74705SXin Li     Changes[i - 1].IsTrailingComment =
133*67e74705SXin Li         (Changes[i].NewlinesBefore > 0 || Changes[i].Kind == tok::eof ||
134*67e74705SXin Li          (Changes[i].IsInsideToken && Changes[i].Kind == tok::comment)) &&
135*67e74705SXin Li         Changes[i - 1].Kind == tok::comment;
136*67e74705SXin Li   }
137*67e74705SXin Li   // FIXME: The last token is currently not always an eof token; in those
138*67e74705SXin Li   // cases, setting TokenLength of the last token to 0 is wrong.
139*67e74705SXin Li   Changes.back().TokenLength = 0;
140*67e74705SXin Li   Changes.back().IsTrailingComment = Changes.back().Kind == tok::comment;
141*67e74705SXin Li 
142*67e74705SXin Li   const WhitespaceManager::Change *LastBlockComment = nullptr;
143*67e74705SXin Li   for (auto &Change : Changes) {
144*67e74705SXin Li     // Reset the IsTrailingComment flag for changes inside of trailing comments
145*67e74705SXin Li     // so they don't get realigned later.
146*67e74705SXin Li     if (Change.IsInsideToken)
147*67e74705SXin Li       Change.IsTrailingComment = false;
148*67e74705SXin Li     Change.StartOfBlockComment = nullptr;
149*67e74705SXin Li     Change.IndentationOffset = 0;
150*67e74705SXin Li     if (Change.Kind == tok::comment) {
151*67e74705SXin Li       LastBlockComment = &Change;
152*67e74705SXin Li     } else if (Change.Kind == tok::unknown) {
153*67e74705SXin Li       if ((Change.StartOfBlockComment = LastBlockComment))
154*67e74705SXin Li         Change.IndentationOffset =
155*67e74705SXin Li             Change.StartOfTokenColumn -
156*67e74705SXin Li             Change.StartOfBlockComment->StartOfTokenColumn;
157*67e74705SXin Li     } else {
158*67e74705SXin Li       LastBlockComment = nullptr;
159*67e74705SXin Li     }
160*67e74705SXin Li   }
161*67e74705SXin Li }
162*67e74705SXin Li 
163*67e74705SXin Li // Align a single sequence of tokens, see AlignTokens below.
164*67e74705SXin Li template <typename F>
165*67e74705SXin Li static void
AlignTokenSequence(unsigned Start,unsigned End,unsigned Column,F && Matches,SmallVector<WhitespaceManager::Change,16> & Changes)166*67e74705SXin Li AlignTokenSequence(unsigned Start, unsigned End, unsigned Column, F &&Matches,
167*67e74705SXin Li                    SmallVector<WhitespaceManager::Change, 16> &Changes) {
168*67e74705SXin Li   bool FoundMatchOnLine = false;
169*67e74705SXin Li   int Shift = 0;
170*67e74705SXin Li   for (unsigned i = Start; i != End; ++i) {
171*67e74705SXin Li     if (Changes[i].NewlinesBefore > 0) {
172*67e74705SXin Li       FoundMatchOnLine = false;
173*67e74705SXin Li       Shift = 0;
174*67e74705SXin Li     }
175*67e74705SXin Li 
176*67e74705SXin Li     // If this is the first matching token to be aligned, remember by how many
177*67e74705SXin Li     // spaces it has to be shifted, so the rest of the changes on the line are
178*67e74705SXin Li     // shifted by the same amount
179*67e74705SXin Li     if (!FoundMatchOnLine && Matches(Changes[i])) {
180*67e74705SXin Li       FoundMatchOnLine = true;
181*67e74705SXin Li       Shift = Column - Changes[i].StartOfTokenColumn;
182*67e74705SXin Li       Changes[i].Spaces += Shift;
183*67e74705SXin Li     }
184*67e74705SXin Li 
185*67e74705SXin Li     assert(Shift >= 0);
186*67e74705SXin Li     Changes[i].StartOfTokenColumn += Shift;
187*67e74705SXin Li     if (i + 1 != Changes.size())
188*67e74705SXin Li       Changes[i + 1].PreviousEndOfTokenColumn += Shift;
189*67e74705SXin Li   }
190*67e74705SXin Li }
191*67e74705SXin Li 
192*67e74705SXin Li // Walk through all of the changes and find sequences of matching tokens to
193*67e74705SXin Li // align. To do so, keep track of the lines and whether or not a matching token
194*67e74705SXin Li // was found on a line. If a matching token is found, extend the current
195*67e74705SXin Li // sequence. If the current line cannot be part of a sequence, e.g. because
196*67e74705SXin Li // there is an empty line before it or it contains only non-matching tokens,
197*67e74705SXin Li // finalize the previous sequence.
198*67e74705SXin Li template <typename F>
AlignTokens(const FormatStyle & Style,F && Matches,SmallVector<WhitespaceManager::Change,16> & Changes)199*67e74705SXin Li static void AlignTokens(const FormatStyle &Style, F &&Matches,
200*67e74705SXin Li                         SmallVector<WhitespaceManager::Change, 16> &Changes) {
201*67e74705SXin Li   unsigned MinColumn = 0;
202*67e74705SXin Li   unsigned MaxColumn = UINT_MAX;
203*67e74705SXin Li 
204*67e74705SXin Li   // Line number of the start and the end of the current token sequence.
205*67e74705SXin Li   unsigned StartOfSequence = 0;
206*67e74705SXin Li   unsigned EndOfSequence = 0;
207*67e74705SXin Li 
208*67e74705SXin Li   // Keep track of the nesting level of matching tokens, i.e. the number of
209*67e74705SXin Li   // surrounding (), [], or {}. We will only align a sequence of matching
210*67e74705SXin Li   // token that share the same scope depth.
211*67e74705SXin Li   //
212*67e74705SXin Li   // FIXME: This could use FormatToken::NestingLevel information, but there is
213*67e74705SXin Li   // an outstanding issue wrt the brace scopes.
214*67e74705SXin Li   unsigned NestingLevelOfLastMatch = 0;
215*67e74705SXin Li   unsigned NestingLevel = 0;
216*67e74705SXin Li 
217*67e74705SXin Li   // Keep track of the number of commas before the matching tokens, we will only
218*67e74705SXin Li   // align a sequence of matching tokens if they are preceded by the same number
219*67e74705SXin Li   // of commas.
220*67e74705SXin Li   unsigned CommasBeforeLastMatch = 0;
221*67e74705SXin Li   unsigned CommasBeforeMatch = 0;
222*67e74705SXin Li 
223*67e74705SXin Li   // Whether a matching token has been found on the current line.
224*67e74705SXin Li   bool FoundMatchOnLine = false;
225*67e74705SXin Li 
226*67e74705SXin Li   // Aligns a sequence of matching tokens, on the MinColumn column.
227*67e74705SXin Li   //
228*67e74705SXin Li   // Sequences start from the first matching token to align, and end at the
229*67e74705SXin Li   // first token of the first line that doesn't need to be aligned.
230*67e74705SXin Li   //
231*67e74705SXin Li   // We need to adjust the StartOfTokenColumn of each Change that is on a line
232*67e74705SXin Li   // containing any matching token to be aligned and located after such token.
233*67e74705SXin Li   auto AlignCurrentSequence = [&] {
234*67e74705SXin Li     if (StartOfSequence > 0 && StartOfSequence < EndOfSequence)
235*67e74705SXin Li       AlignTokenSequence(StartOfSequence, EndOfSequence, MinColumn, Matches,
236*67e74705SXin Li                          Changes);
237*67e74705SXin Li     MinColumn = 0;
238*67e74705SXin Li     MaxColumn = UINT_MAX;
239*67e74705SXin Li     StartOfSequence = 0;
240*67e74705SXin Li     EndOfSequence = 0;
241*67e74705SXin Li   };
242*67e74705SXin Li 
243*67e74705SXin Li   for (unsigned i = 0, e = Changes.size(); i != e; ++i) {
244*67e74705SXin Li     if (Changes[i].NewlinesBefore != 0) {
245*67e74705SXin Li       CommasBeforeMatch = 0;
246*67e74705SXin Li       EndOfSequence = i;
247*67e74705SXin Li       // If there is a blank line, or if the last line didn't contain any
248*67e74705SXin Li       // matching token, the sequence ends here.
249*67e74705SXin Li       if (Changes[i].NewlinesBefore > 1 || !FoundMatchOnLine)
250*67e74705SXin Li         AlignCurrentSequence();
251*67e74705SXin Li 
252*67e74705SXin Li       FoundMatchOnLine = false;
253*67e74705SXin Li     }
254*67e74705SXin Li 
255*67e74705SXin Li     if (Changes[i].Kind == tok::comma) {
256*67e74705SXin Li       ++CommasBeforeMatch;
257*67e74705SXin Li     } else if (Changes[i].Kind == tok::r_brace ||
258*67e74705SXin Li                Changes[i].Kind == tok::r_paren ||
259*67e74705SXin Li                Changes[i].Kind == tok::r_square) {
260*67e74705SXin Li       --NestingLevel;
261*67e74705SXin Li     } else if (Changes[i].Kind == tok::l_brace ||
262*67e74705SXin Li                Changes[i].Kind == tok::l_paren ||
263*67e74705SXin Li                Changes[i].Kind == tok::l_square) {
264*67e74705SXin Li       // We want sequences to skip over child scopes if possible, but not the
265*67e74705SXin Li       // other way around.
266*67e74705SXin Li       NestingLevelOfLastMatch = std::min(NestingLevelOfLastMatch, NestingLevel);
267*67e74705SXin Li       ++NestingLevel;
268*67e74705SXin Li     }
269*67e74705SXin Li 
270*67e74705SXin Li     if (!Matches(Changes[i]))
271*67e74705SXin Li       continue;
272*67e74705SXin Li 
273*67e74705SXin Li     // If there is more than one matching token per line, or if the number of
274*67e74705SXin Li     // preceding commas, or the scope depth, do not match anymore, end the
275*67e74705SXin Li     // sequence.
276*67e74705SXin Li     if (FoundMatchOnLine || CommasBeforeMatch != CommasBeforeLastMatch ||
277*67e74705SXin Li         NestingLevel != NestingLevelOfLastMatch)
278*67e74705SXin Li       AlignCurrentSequence();
279*67e74705SXin Li 
280*67e74705SXin Li     CommasBeforeLastMatch = CommasBeforeMatch;
281*67e74705SXin Li     NestingLevelOfLastMatch = NestingLevel;
282*67e74705SXin Li     FoundMatchOnLine = true;
283*67e74705SXin Li 
284*67e74705SXin Li     if (StartOfSequence == 0)
285*67e74705SXin Li       StartOfSequence = i;
286*67e74705SXin Li 
287*67e74705SXin Li     unsigned ChangeMinColumn = Changes[i].StartOfTokenColumn;
288*67e74705SXin Li     int LineLengthAfter = -Changes[i].Spaces;
289*67e74705SXin Li     for (unsigned j = i; j != e && Changes[j].NewlinesBefore == 0; ++j)
290*67e74705SXin Li       LineLengthAfter += Changes[j].Spaces + Changes[j].TokenLength;
291*67e74705SXin Li     unsigned ChangeMaxColumn = Style.ColumnLimit - LineLengthAfter;
292*67e74705SXin Li 
293*67e74705SXin Li     // If we are restricted by the maximum column width, end the sequence.
294*67e74705SXin Li     if (ChangeMinColumn > MaxColumn || ChangeMaxColumn < MinColumn ||
295*67e74705SXin Li         CommasBeforeLastMatch != CommasBeforeMatch) {
296*67e74705SXin Li       AlignCurrentSequence();
297*67e74705SXin Li       StartOfSequence = i;
298*67e74705SXin Li     }
299*67e74705SXin Li 
300*67e74705SXin Li     MinColumn = std::max(MinColumn, ChangeMinColumn);
301*67e74705SXin Li     MaxColumn = std::min(MaxColumn, ChangeMaxColumn);
302*67e74705SXin Li   }
303*67e74705SXin Li 
304*67e74705SXin Li   EndOfSequence = Changes.size();
305*67e74705SXin Li   AlignCurrentSequence();
306*67e74705SXin Li }
307*67e74705SXin Li 
alignConsecutiveAssignments()308*67e74705SXin Li void WhitespaceManager::alignConsecutiveAssignments() {
309*67e74705SXin Li   if (!Style.AlignConsecutiveAssignments)
310*67e74705SXin Li     return;
311*67e74705SXin Li 
312*67e74705SXin Li   AlignTokens(Style,
313*67e74705SXin Li               [&](const Change &C) {
314*67e74705SXin Li                 // Do not align on equal signs that are first on a line.
315*67e74705SXin Li                 if (C.NewlinesBefore > 0)
316*67e74705SXin Li                   return false;
317*67e74705SXin Li 
318*67e74705SXin Li                 // Do not align on equal signs that are last on a line.
319*67e74705SXin Li                 if (&C != &Changes.back() && (&C + 1)->NewlinesBefore > 0)
320*67e74705SXin Li                   return false;
321*67e74705SXin Li 
322*67e74705SXin Li                 return C.Kind == tok::equal;
323*67e74705SXin Li               },
324*67e74705SXin Li               Changes);
325*67e74705SXin Li }
326*67e74705SXin Li 
alignConsecutiveDeclarations()327*67e74705SXin Li void WhitespaceManager::alignConsecutiveDeclarations() {
328*67e74705SXin Li   if (!Style.AlignConsecutiveDeclarations)
329*67e74705SXin Li     return;
330*67e74705SXin Li 
331*67e74705SXin Li   // FIXME: Currently we don't handle properly the PointerAlignment: Right
332*67e74705SXin Li   // The * and & are not aligned and are left dangling. Something has to be done
333*67e74705SXin Li   // about it, but it raises the question of alignment of code like:
334*67e74705SXin Li   //   const char* const* v1;
335*67e74705SXin Li   //   float const* v2;
336*67e74705SXin Li   //   SomeVeryLongType const& v3;
337*67e74705SXin Li 
338*67e74705SXin Li   AlignTokens(Style, [](Change const &C) { return C.IsStartOfDeclName; },
339*67e74705SXin Li               Changes);
340*67e74705SXin Li }
341*67e74705SXin Li 
alignTrailingComments()342*67e74705SXin Li void WhitespaceManager::alignTrailingComments() {
343*67e74705SXin Li   unsigned MinColumn = 0;
344*67e74705SXin Li   unsigned MaxColumn = UINT_MAX;
345*67e74705SXin Li   unsigned StartOfSequence = 0;
346*67e74705SXin Li   bool BreakBeforeNext = false;
347*67e74705SXin Li   unsigned Newlines = 0;
348*67e74705SXin Li   for (unsigned i = 0, e = Changes.size(); i != e; ++i) {
349*67e74705SXin Li     if (Changes[i].StartOfBlockComment)
350*67e74705SXin Li       continue;
351*67e74705SXin Li     Newlines += Changes[i].NewlinesBefore;
352*67e74705SXin Li     if (!Changes[i].IsTrailingComment)
353*67e74705SXin Li       continue;
354*67e74705SXin Li 
355*67e74705SXin Li     unsigned ChangeMinColumn = Changes[i].StartOfTokenColumn;
356*67e74705SXin Li     unsigned ChangeMaxColumn = Style.ColumnLimit - Changes[i].TokenLength;
357*67e74705SXin Li 
358*67e74705SXin Li     // If we don't create a replacement for this change, we have to consider
359*67e74705SXin Li     // it to be immovable.
360*67e74705SXin Li     if (!Changes[i].CreateReplacement)
361*67e74705SXin Li       ChangeMaxColumn = ChangeMinColumn;
362*67e74705SXin Li 
363*67e74705SXin Li     if (i + 1 != e && Changes[i + 1].ContinuesPPDirective)
364*67e74705SXin Li       ChangeMaxColumn -= 2;
365*67e74705SXin Li     // If this comment follows an } in column 0, it probably documents the
366*67e74705SXin Li     // closing of a namespace and we don't want to align it.
367*67e74705SXin Li     bool FollowsRBraceInColumn0 = i > 0 && Changes[i].NewlinesBefore == 0 &&
368*67e74705SXin Li                                   Changes[i - 1].Kind == tok::r_brace &&
369*67e74705SXin Li                                   Changes[i - 1].StartOfTokenColumn == 0;
370*67e74705SXin Li     bool WasAlignedWithStartOfNextLine = false;
371*67e74705SXin Li     if (Changes[i].NewlinesBefore == 1) { // A comment on its own line.
372*67e74705SXin Li       unsigned CommentColumn = SourceMgr.getSpellingColumnNumber(
373*67e74705SXin Li           Changes[i].OriginalWhitespaceRange.getEnd());
374*67e74705SXin Li       for (unsigned j = i + 1; j != e; ++j) {
375*67e74705SXin Li         if (Changes[j].Kind == tok::comment ||
376*67e74705SXin Li             Changes[j].Kind == tok::unknown)
377*67e74705SXin Li           // Skip over comments and unknown tokens. "unknown tokens are used for
378*67e74705SXin Li           // the continuation of multiline comments.
379*67e74705SXin Li           continue;
380*67e74705SXin Li 
381*67e74705SXin Li         unsigned NextColumn = SourceMgr.getSpellingColumnNumber(
382*67e74705SXin Li             Changes[j].OriginalWhitespaceRange.getEnd());
383*67e74705SXin Li         // The start of the next token was previously aligned with the
384*67e74705SXin Li         // start of this comment.
385*67e74705SXin Li         WasAlignedWithStartOfNextLine =
386*67e74705SXin Li             CommentColumn == NextColumn ||
387*67e74705SXin Li             CommentColumn == NextColumn + Style.IndentWidth;
388*67e74705SXin Li         break;
389*67e74705SXin Li       }
390*67e74705SXin Li     }
391*67e74705SXin Li     if (!Style.AlignTrailingComments || FollowsRBraceInColumn0) {
392*67e74705SXin Li       alignTrailingComments(StartOfSequence, i, MinColumn);
393*67e74705SXin Li       MinColumn = ChangeMinColumn;
394*67e74705SXin Li       MaxColumn = ChangeMinColumn;
395*67e74705SXin Li       StartOfSequence = i;
396*67e74705SXin Li     } else if (BreakBeforeNext || Newlines > 1 ||
397*67e74705SXin Li                (ChangeMinColumn > MaxColumn || ChangeMaxColumn < MinColumn) ||
398*67e74705SXin Li                // Break the comment sequence if the previous line did not end
399*67e74705SXin Li                // in a trailing comment.
400*67e74705SXin Li                (Changes[i].NewlinesBefore == 1 && i > 0 &&
401*67e74705SXin Li                 !Changes[i - 1].IsTrailingComment) ||
402*67e74705SXin Li                WasAlignedWithStartOfNextLine) {
403*67e74705SXin Li       alignTrailingComments(StartOfSequence, i, MinColumn);
404*67e74705SXin Li       MinColumn = ChangeMinColumn;
405*67e74705SXin Li       MaxColumn = ChangeMaxColumn;
406*67e74705SXin Li       StartOfSequence = i;
407*67e74705SXin Li     } else {
408*67e74705SXin Li       MinColumn = std::max(MinColumn, ChangeMinColumn);
409*67e74705SXin Li       MaxColumn = std::min(MaxColumn, ChangeMaxColumn);
410*67e74705SXin Li     }
411*67e74705SXin Li     BreakBeforeNext =
412*67e74705SXin Li         (i == 0) || (Changes[i].NewlinesBefore > 1) ||
413*67e74705SXin Li         // Never start a sequence with a comment at the beginning of
414*67e74705SXin Li         // the line.
415*67e74705SXin Li         (Changes[i].NewlinesBefore == 1 && StartOfSequence == i);
416*67e74705SXin Li     Newlines = 0;
417*67e74705SXin Li   }
418*67e74705SXin Li   alignTrailingComments(StartOfSequence, Changes.size(), MinColumn);
419*67e74705SXin Li }
420*67e74705SXin Li 
alignTrailingComments(unsigned Start,unsigned End,unsigned Column)421*67e74705SXin Li void WhitespaceManager::alignTrailingComments(unsigned Start, unsigned End,
422*67e74705SXin Li                                               unsigned Column) {
423*67e74705SXin Li   for (unsigned i = Start; i != End; ++i) {
424*67e74705SXin Li     int Shift = 0;
425*67e74705SXin Li     if (Changes[i].IsTrailingComment) {
426*67e74705SXin Li       Shift = Column - Changes[i].StartOfTokenColumn;
427*67e74705SXin Li     }
428*67e74705SXin Li     if (Changes[i].StartOfBlockComment) {
429*67e74705SXin Li       Shift = Changes[i].IndentationOffset +
430*67e74705SXin Li               Changes[i].StartOfBlockComment->StartOfTokenColumn -
431*67e74705SXin Li               Changes[i].StartOfTokenColumn;
432*67e74705SXin Li     }
433*67e74705SXin Li     assert(Shift >= 0);
434*67e74705SXin Li     Changes[i].Spaces += Shift;
435*67e74705SXin Li     if (i + 1 != End)
436*67e74705SXin Li       Changes[i + 1].PreviousEndOfTokenColumn += Shift;
437*67e74705SXin Li     Changes[i].StartOfTokenColumn += Shift;
438*67e74705SXin Li   }
439*67e74705SXin Li }
440*67e74705SXin Li 
alignEscapedNewlines()441*67e74705SXin Li void WhitespaceManager::alignEscapedNewlines() {
442*67e74705SXin Li   unsigned MaxEndOfLine =
443*67e74705SXin Li       Style.AlignEscapedNewlinesLeft ? 0 : Style.ColumnLimit;
444*67e74705SXin Li   unsigned StartOfMacro = 0;
445*67e74705SXin Li   for (unsigned i = 1, e = Changes.size(); i < e; ++i) {
446*67e74705SXin Li     Change &C = Changes[i];
447*67e74705SXin Li     if (C.NewlinesBefore > 0) {
448*67e74705SXin Li       if (C.ContinuesPPDirective) {
449*67e74705SXin Li         MaxEndOfLine = std::max(C.PreviousEndOfTokenColumn + 2, MaxEndOfLine);
450*67e74705SXin Li       } else {
451*67e74705SXin Li         alignEscapedNewlines(StartOfMacro + 1, i, MaxEndOfLine);
452*67e74705SXin Li         MaxEndOfLine = Style.AlignEscapedNewlinesLeft ? 0 : Style.ColumnLimit;
453*67e74705SXin Li         StartOfMacro = i;
454*67e74705SXin Li       }
455*67e74705SXin Li     }
456*67e74705SXin Li   }
457*67e74705SXin Li   alignEscapedNewlines(StartOfMacro + 1, Changes.size(), MaxEndOfLine);
458*67e74705SXin Li }
459*67e74705SXin Li 
alignEscapedNewlines(unsigned Start,unsigned End,unsigned Column)460*67e74705SXin Li void WhitespaceManager::alignEscapedNewlines(unsigned Start, unsigned End,
461*67e74705SXin Li                                              unsigned Column) {
462*67e74705SXin Li   for (unsigned i = Start; i < End; ++i) {
463*67e74705SXin Li     Change &C = Changes[i];
464*67e74705SXin Li     if (C.NewlinesBefore > 0) {
465*67e74705SXin Li       assert(C.ContinuesPPDirective);
466*67e74705SXin Li       if (C.PreviousEndOfTokenColumn + 1 > Column)
467*67e74705SXin Li         C.EscapedNewlineColumn = 0;
468*67e74705SXin Li       else
469*67e74705SXin Li         C.EscapedNewlineColumn = Column;
470*67e74705SXin Li     }
471*67e74705SXin Li   }
472*67e74705SXin Li }
473*67e74705SXin Li 
generateChanges()474*67e74705SXin Li void WhitespaceManager::generateChanges() {
475*67e74705SXin Li   for (unsigned i = 0, e = Changes.size(); i != e; ++i) {
476*67e74705SXin Li     const Change &C = Changes[i];
477*67e74705SXin Li     if (i > 0) {
478*67e74705SXin Li       assert(Changes[i - 1].OriginalWhitespaceRange.getBegin() !=
479*67e74705SXin Li                  C.OriginalWhitespaceRange.getBegin() &&
480*67e74705SXin Li              "Generating two replacements for the same location");
481*67e74705SXin Li     }
482*67e74705SXin Li     if (C.CreateReplacement) {
483*67e74705SXin Li       std::string ReplacementText = C.PreviousLinePostfix;
484*67e74705SXin Li       if (C.ContinuesPPDirective)
485*67e74705SXin Li         appendNewlineText(ReplacementText, C.NewlinesBefore,
486*67e74705SXin Li                           C.PreviousEndOfTokenColumn, C.EscapedNewlineColumn);
487*67e74705SXin Li       else
488*67e74705SXin Li         appendNewlineText(ReplacementText, C.NewlinesBefore);
489*67e74705SXin Li       appendIndentText(ReplacementText, C.IndentLevel, std::max(0, C.Spaces),
490*67e74705SXin Li                        C.StartOfTokenColumn - std::max(0, C.Spaces));
491*67e74705SXin Li       ReplacementText.append(C.CurrentLinePrefix);
492*67e74705SXin Li       storeReplacement(C.OriginalWhitespaceRange, ReplacementText);
493*67e74705SXin Li     }
494*67e74705SXin Li   }
495*67e74705SXin Li }
496*67e74705SXin Li 
storeReplacement(SourceRange Range,StringRef Text)497*67e74705SXin Li void WhitespaceManager::storeReplacement(SourceRange Range,
498*67e74705SXin Li                                          StringRef Text) {
499*67e74705SXin Li   unsigned WhitespaceLength = SourceMgr.getFileOffset(Range.getEnd()) -
500*67e74705SXin Li                               SourceMgr.getFileOffset(Range.getBegin());
501*67e74705SXin Li   // Don't create a replacement, if it does not change anything.
502*67e74705SXin Li   if (StringRef(SourceMgr.getCharacterData(Range.getBegin()),
503*67e74705SXin Li                 WhitespaceLength) == Text)
504*67e74705SXin Li     return;
505*67e74705SXin Li   Replaces.insert(tooling::Replacement(
506*67e74705SXin Li       SourceMgr, CharSourceRange::getCharRange(Range), Text));
507*67e74705SXin Li }
508*67e74705SXin Li 
appendNewlineText(std::string & Text,unsigned Newlines)509*67e74705SXin Li void WhitespaceManager::appendNewlineText(std::string &Text,
510*67e74705SXin Li                                           unsigned Newlines) {
511*67e74705SXin Li   for (unsigned i = 0; i < Newlines; ++i)
512*67e74705SXin Li     Text.append(UseCRLF ? "\r\n" : "\n");
513*67e74705SXin Li }
514*67e74705SXin Li 
appendNewlineText(std::string & Text,unsigned Newlines,unsigned PreviousEndOfTokenColumn,unsigned EscapedNewlineColumn)515*67e74705SXin Li void WhitespaceManager::appendNewlineText(std::string &Text, unsigned Newlines,
516*67e74705SXin Li                                           unsigned PreviousEndOfTokenColumn,
517*67e74705SXin Li                                           unsigned EscapedNewlineColumn) {
518*67e74705SXin Li   if (Newlines > 0) {
519*67e74705SXin Li     unsigned Offset =
520*67e74705SXin Li         std::min<int>(EscapedNewlineColumn - 1, PreviousEndOfTokenColumn);
521*67e74705SXin Li     for (unsigned i = 0; i < Newlines; ++i) {
522*67e74705SXin Li       Text.append(EscapedNewlineColumn - Offset - 1, ' ');
523*67e74705SXin Li       Text.append(UseCRLF ? "\\\r\n" : "\\\n");
524*67e74705SXin Li       Offset = 0;
525*67e74705SXin Li     }
526*67e74705SXin Li   }
527*67e74705SXin Li }
528*67e74705SXin Li 
appendIndentText(std::string & Text,unsigned IndentLevel,unsigned Spaces,unsigned WhitespaceStartColumn)529*67e74705SXin Li void WhitespaceManager::appendIndentText(std::string &Text,
530*67e74705SXin Li                                          unsigned IndentLevel, unsigned Spaces,
531*67e74705SXin Li                                          unsigned WhitespaceStartColumn) {
532*67e74705SXin Li   switch (Style.UseTab) {
533*67e74705SXin Li   case FormatStyle::UT_Never:
534*67e74705SXin Li     Text.append(Spaces, ' ');
535*67e74705SXin Li     break;
536*67e74705SXin Li   case FormatStyle::UT_Always: {
537*67e74705SXin Li     unsigned FirstTabWidth =
538*67e74705SXin Li         Style.TabWidth - WhitespaceStartColumn % Style.TabWidth;
539*67e74705SXin Li     // Indent with tabs only when there's at least one full tab.
540*67e74705SXin Li     if (FirstTabWidth + Style.TabWidth <= Spaces) {
541*67e74705SXin Li       Spaces -= FirstTabWidth;
542*67e74705SXin Li       Text.append("\t");
543*67e74705SXin Li     }
544*67e74705SXin Li     Text.append(Spaces / Style.TabWidth, '\t');
545*67e74705SXin Li     Text.append(Spaces % Style.TabWidth, ' ');
546*67e74705SXin Li     break;
547*67e74705SXin Li   }
548*67e74705SXin Li   case FormatStyle::UT_ForIndentation:
549*67e74705SXin Li     if (WhitespaceStartColumn == 0) {
550*67e74705SXin Li       unsigned Indentation = IndentLevel * Style.IndentWidth;
551*67e74705SXin Li       // This happens, e.g. when a line in a block comment is indented less than
552*67e74705SXin Li       // the first one.
553*67e74705SXin Li       if (Indentation > Spaces)
554*67e74705SXin Li         Indentation = Spaces;
555*67e74705SXin Li       unsigned Tabs = Indentation / Style.TabWidth;
556*67e74705SXin Li       Text.append(Tabs, '\t');
557*67e74705SXin Li       Spaces -= Tabs * Style.TabWidth;
558*67e74705SXin Li     }
559*67e74705SXin Li     Text.append(Spaces, ' ');
560*67e74705SXin Li     break;
561*67e74705SXin Li   case FormatStyle::UT_ForContinuationAndIndentation:
562*67e74705SXin Li     if (WhitespaceStartColumn == 0) {
563*67e74705SXin Li       unsigned Tabs = Spaces / Style.TabWidth;
564*67e74705SXin Li       Text.append(Tabs, '\t');
565*67e74705SXin Li       Spaces -= Tabs * Style.TabWidth;
566*67e74705SXin Li     }
567*67e74705SXin Li     Text.append(Spaces, ' ');
568*67e74705SXin Li     break;
569*67e74705SXin Li   }
570*67e74705SXin Li }
571*67e74705SXin Li 
572*67e74705SXin Li } // namespace format
573*67e74705SXin Li } // namespace clang
574