WhitespaceManager.cpp 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448
  1. //===--- WhitespaceManager.cpp - Format C++ code --------------------------===//
  2. //
  3. // The LLVM Compiler Infrastructure
  4. //
  5. // This file is distributed under the University of Illinois Open Source
  6. // License. See LICENSE.TXT for details.
  7. //
  8. //===----------------------------------------------------------------------===//
  9. ///
  10. /// \file
  11. /// \brief This file implements WhitespaceManager class.
  12. ///
  13. //===----------------------------------------------------------------------===//
  14. #include "WhitespaceManager.h"
  15. #include "llvm/ADT/STLExtras.h"
  16. namespace clang {
  17. namespace format {
  18. bool WhitespaceManager::Change::IsBeforeInFile::
  19. operator()(const Change &C1, const Change &C2) const {
  20. return SourceMgr.isBeforeInTranslationUnit(
  21. C1.OriginalWhitespaceRange.getBegin(),
  22. C2.OriginalWhitespaceRange.getBegin());
  23. }
  24. WhitespaceManager::Change::Change(
  25. bool CreateReplacement, const SourceRange &OriginalWhitespaceRange,
  26. unsigned IndentLevel, int Spaces, unsigned StartOfTokenColumn,
  27. unsigned NewlinesBefore, StringRef PreviousLinePostfix,
  28. StringRef CurrentLinePrefix, tok::TokenKind Kind, bool ContinuesPPDirective)
  29. : CreateReplacement(CreateReplacement),
  30. OriginalWhitespaceRange(OriginalWhitespaceRange),
  31. StartOfTokenColumn(StartOfTokenColumn), NewlinesBefore(NewlinesBefore),
  32. PreviousLinePostfix(PreviousLinePostfix),
  33. CurrentLinePrefix(CurrentLinePrefix), Kind(Kind),
  34. ContinuesPPDirective(ContinuesPPDirective), IndentLevel(IndentLevel),
  35. Spaces(Spaces), IsTrailingComment(false), TokenLength(0),
  36. PreviousEndOfTokenColumn(0), EscapedNewlineColumn(0),
  37. StartOfBlockComment(nullptr), IndentationOffset(0) {}
  38. void WhitespaceManager::reset() {
  39. Changes.clear();
  40. Replaces.clear();
  41. }
  42. void WhitespaceManager::replaceWhitespace(FormatToken &Tok, unsigned Newlines,
  43. unsigned IndentLevel, unsigned Spaces,
  44. unsigned StartOfTokenColumn,
  45. bool InPPDirective) {
  46. if (Tok.Finalized)
  47. return;
  48. Tok.Decision = (Newlines > 0) ? FD_Break : FD_Continue;
  49. Changes.push_back(Change(true, Tok.WhitespaceRange, IndentLevel, Spaces,
  50. StartOfTokenColumn, Newlines, "", "",
  51. Tok.Tok.getKind(), InPPDirective && !Tok.IsFirst));
  52. }
  53. void WhitespaceManager::addUntouchableToken(const FormatToken &Tok,
  54. bool InPPDirective) {
  55. if (Tok.Finalized)
  56. return;
  57. Changes.push_back(Change(false, Tok.WhitespaceRange, /*IndentLevel=*/0,
  58. /*Spaces=*/0, Tok.OriginalColumn, Tok.NewlinesBefore,
  59. "", "", Tok.Tok.getKind(),
  60. InPPDirective && !Tok.IsFirst));
  61. }
  62. void WhitespaceManager::replaceWhitespaceInToken(
  63. const FormatToken &Tok, unsigned Offset, unsigned ReplaceChars,
  64. StringRef PreviousPostfix, StringRef CurrentPrefix, bool InPPDirective,
  65. unsigned Newlines, unsigned IndentLevel, int Spaces) {
  66. if (Tok.Finalized)
  67. return;
  68. SourceLocation Start = Tok.getStartOfNonWhitespace().getLocWithOffset(Offset);
  69. Changes.push_back(Change(
  70. true, SourceRange(Start, Start.getLocWithOffset(ReplaceChars)),
  71. IndentLevel, Spaces, std::max(0, Spaces), Newlines, PreviousPostfix,
  72. CurrentPrefix,
  73. // If we don't add a newline this change doesn't start a comment. Thus,
  74. // when we align line comments, we don't need to treat this change as one.
  75. // FIXME: We still need to take this change in account to properly
  76. // calculate the new length of the comment and to calculate the changes
  77. // for which to do the alignment when aligning comments.
  78. Tok.is(TT_LineComment) && Newlines > 0 ? tok::comment : tok::unknown,
  79. InPPDirective && !Tok.IsFirst));
  80. }
  81. const tooling::Replacements &WhitespaceManager::generateReplacements() {
  82. if (Changes.empty())
  83. return Replaces;
  84. std::sort(Changes.begin(), Changes.end(), Change::IsBeforeInFile(SourceMgr));
  85. calculateLineBreakInformation();
  86. alignConsecutiveAssignments();
  87. alignTrailingComments();
  88. alignEscapedNewlines();
  89. generateChanges();
  90. return Replaces;
  91. }
  92. void WhitespaceManager::calculateLineBreakInformation() {
  93. Changes[0].PreviousEndOfTokenColumn = 0;
  94. for (unsigned i = 1, e = Changes.size(); i != e; ++i) {
  95. unsigned OriginalWhitespaceStart =
  96. SourceMgr.getFileOffset(Changes[i].OriginalWhitespaceRange.getBegin());
  97. unsigned PreviousOriginalWhitespaceEnd = SourceMgr.getFileOffset(
  98. Changes[i - 1].OriginalWhitespaceRange.getEnd());
  99. Changes[i - 1].TokenLength = OriginalWhitespaceStart -
  100. PreviousOriginalWhitespaceEnd +
  101. Changes[i].PreviousLinePostfix.size() +
  102. Changes[i - 1].CurrentLinePrefix.size();
  103. Changes[i].PreviousEndOfTokenColumn =
  104. Changes[i - 1].StartOfTokenColumn + Changes[i - 1].TokenLength;
  105. Changes[i - 1].IsTrailingComment =
  106. (Changes[i].NewlinesBefore > 0 || Changes[i].Kind == tok::eof) &&
  107. Changes[i - 1].Kind == tok::comment;
  108. }
  109. // FIXME: The last token is currently not always an eof token; in those
  110. // cases, setting TokenLength of the last token to 0 is wrong.
  111. Changes.back().TokenLength = 0;
  112. Changes.back().IsTrailingComment = Changes.back().Kind == tok::comment;
  113. const WhitespaceManager::Change *LastBlockComment = nullptr;
  114. for (auto &Change : Changes) {
  115. Change.StartOfBlockComment = nullptr;
  116. Change.IndentationOffset = 0;
  117. if (Change.Kind == tok::comment) {
  118. LastBlockComment = &Change;
  119. } else if (Change.Kind == tok::unknown) {
  120. if ((Change.StartOfBlockComment = LastBlockComment))
  121. Change.IndentationOffset =
  122. Change.StartOfTokenColumn -
  123. Change.StartOfBlockComment->StartOfTokenColumn;
  124. } else {
  125. LastBlockComment = nullptr;
  126. }
  127. }
  128. }
  129. // Walk through all of the changes and find sequences of "=" to align. To do
  130. // so, keep track of the lines and whether or not an "=" was found on align. If
  131. // a "=" is found on a line, extend the current sequence. If the current line
  132. // cannot be part of a sequence, e.g. because there is an empty line before it
  133. // or it contains non-assignments, finalize the previous sequence.
  134. void WhitespaceManager::alignConsecutiveAssignments() {
  135. if (!Style.AlignConsecutiveAssignments)
  136. return;
  137. unsigned MinColumn = 0;
  138. unsigned StartOfSequence = 0;
  139. unsigned EndOfSequence = 0;
  140. bool FoundAssignmentOnLine = false;
  141. bool FoundLeftParenOnLine = false;
  142. unsigned CurrentLine = 0;
  143. auto AlignSequence = [&] {
  144. alignConsecutiveAssignments(StartOfSequence, EndOfSequence, MinColumn);
  145. MinColumn = 0;
  146. StartOfSequence = 0;
  147. EndOfSequence = 0;
  148. };
  149. for (unsigned i = 0, e = Changes.size(); i != e; ++i) {
  150. if (Changes[i].NewlinesBefore != 0) {
  151. CurrentLine += Changes[i].NewlinesBefore;
  152. if (StartOfSequence > 0 &&
  153. (Changes[i].NewlinesBefore > 1 || !FoundAssignmentOnLine)) {
  154. EndOfSequence = i;
  155. AlignSequence();
  156. }
  157. FoundAssignmentOnLine = false;
  158. FoundLeftParenOnLine = false;
  159. }
  160. if ((Changes[i].Kind == tok::equal &&
  161. (FoundAssignmentOnLine || ((Changes[i].NewlinesBefore > 0 ||
  162. Changes[i + 1].NewlinesBefore > 0)))) ||
  163. (!FoundLeftParenOnLine && Changes[i].Kind == tok::r_paren)) {
  164. if (StartOfSequence > 0)
  165. AlignSequence();
  166. } else if (Changes[i].Kind == tok::l_paren) {
  167. FoundLeftParenOnLine = true;
  168. if (!FoundAssignmentOnLine && StartOfSequence > 0)
  169. AlignSequence();
  170. } else if (!FoundAssignmentOnLine && !FoundLeftParenOnLine &&
  171. Changes[i].Kind == tok::equal) {
  172. FoundAssignmentOnLine = true;
  173. EndOfSequence = i;
  174. if (StartOfSequence == 0)
  175. StartOfSequence = i;
  176. unsigned ChangeMinColumn = Changes[i].StartOfTokenColumn;
  177. MinColumn = std::max(MinColumn, ChangeMinColumn);
  178. }
  179. }
  180. if (StartOfSequence > 0) {
  181. EndOfSequence = Changes.size();
  182. AlignSequence();
  183. }
  184. }
  185. void WhitespaceManager::alignConsecutiveAssignments(unsigned Start,
  186. unsigned End,
  187. unsigned Column) {
  188. bool AlignedAssignment = false;
  189. int PreviousShift = 0;
  190. for (unsigned i = Start; i != End; ++i) {
  191. int Shift = 0;
  192. if (Changes[i].NewlinesBefore > 0)
  193. AlignedAssignment = false;
  194. if (!AlignedAssignment && Changes[i].Kind == tok::equal) {
  195. Shift = Column - Changes[i].StartOfTokenColumn;
  196. AlignedAssignment = true;
  197. PreviousShift = Shift;
  198. }
  199. assert(Shift >= 0);
  200. Changes[i].Spaces += Shift;
  201. if (i + 1 != Changes.size())
  202. Changes[i + 1].PreviousEndOfTokenColumn += Shift;
  203. Changes[i].StartOfTokenColumn += Shift;
  204. if (AlignedAssignment) {
  205. Changes[i].StartOfTokenColumn += PreviousShift;
  206. if (i + 1 != Changes.size())
  207. Changes[i + 1].PreviousEndOfTokenColumn += PreviousShift;
  208. }
  209. }
  210. }
  211. void WhitespaceManager::alignTrailingComments() {
  212. unsigned MinColumn = 0;
  213. unsigned MaxColumn = UINT_MAX;
  214. unsigned StartOfSequence = 0;
  215. bool BreakBeforeNext = false;
  216. unsigned Newlines = 0;
  217. for (unsigned i = 0, e = Changes.size(); i != e; ++i) {
  218. if (Changes[i].StartOfBlockComment)
  219. continue;
  220. Newlines += Changes[i].NewlinesBefore;
  221. if (!Changes[i].IsTrailingComment)
  222. continue;
  223. unsigned ChangeMinColumn = Changes[i].StartOfTokenColumn;
  224. unsigned ChangeMaxColumn = Style.ColumnLimit - Changes[i].TokenLength;
  225. if (i + 1 != e && Changes[i + 1].ContinuesPPDirective)
  226. ChangeMaxColumn -= 2;
  227. // If this comment follows an } in column 0, it probably documents the
  228. // closing of a namespace and we don't want to align it.
  229. bool FollowsRBraceInColumn0 = i > 0 && Changes[i].NewlinesBefore == 0 &&
  230. Changes[i - 1].Kind == tok::r_brace &&
  231. Changes[i - 1].StartOfTokenColumn == 0;
  232. bool WasAlignedWithStartOfNextLine = false;
  233. if (Changes[i].NewlinesBefore == 1) { // A comment on its own line.
  234. unsigned CommentColumn = SourceMgr.getSpellingColumnNumber(
  235. Changes[i].OriginalWhitespaceRange.getEnd());
  236. for (unsigned j = i + 1; j != e; ++j) {
  237. if (Changes[j].Kind != tok::comment) { // Skip over comments.
  238. unsigned NextColumn = SourceMgr.getSpellingColumnNumber(
  239. Changes[j].OriginalWhitespaceRange.getEnd());
  240. // The start of the next token was previously aligned with the
  241. // start of this comment.
  242. WasAlignedWithStartOfNextLine =
  243. CommentColumn == NextColumn ||
  244. CommentColumn == NextColumn + Style.IndentWidth;
  245. break;
  246. }
  247. }
  248. }
  249. if (!Style.AlignTrailingComments || FollowsRBraceInColumn0) {
  250. alignTrailingComments(StartOfSequence, i, MinColumn);
  251. MinColumn = ChangeMinColumn;
  252. MaxColumn = ChangeMinColumn;
  253. StartOfSequence = i;
  254. } else if (BreakBeforeNext || Newlines > 1 ||
  255. (ChangeMinColumn > MaxColumn || ChangeMaxColumn < MinColumn) ||
  256. // Break the comment sequence if the previous line did not end
  257. // in a trailing comment.
  258. (Changes[i].NewlinesBefore == 1 && i > 0 &&
  259. !Changes[i - 1].IsTrailingComment) ||
  260. WasAlignedWithStartOfNextLine) {
  261. alignTrailingComments(StartOfSequence, i, MinColumn);
  262. MinColumn = ChangeMinColumn;
  263. MaxColumn = ChangeMaxColumn;
  264. StartOfSequence = i;
  265. } else {
  266. MinColumn = std::max(MinColumn, ChangeMinColumn);
  267. MaxColumn = std::min(MaxColumn, ChangeMaxColumn);
  268. }
  269. BreakBeforeNext =
  270. (i == 0) || (Changes[i].NewlinesBefore > 1) ||
  271. // Never start a sequence with a comment at the beginning of
  272. // the line.
  273. (Changes[i].NewlinesBefore == 1 && StartOfSequence == i);
  274. Newlines = 0;
  275. }
  276. alignTrailingComments(StartOfSequence, Changes.size(), MinColumn);
  277. }
  278. void WhitespaceManager::alignTrailingComments(unsigned Start, unsigned End,
  279. unsigned Column) {
  280. for (unsigned i = Start; i != End; ++i) {
  281. int Shift = 0;
  282. if (Changes[i].IsTrailingComment) {
  283. Shift = Column - Changes[i].StartOfTokenColumn;
  284. }
  285. if (Changes[i].StartOfBlockComment) {
  286. Shift = Changes[i].IndentationOffset +
  287. Changes[i].StartOfBlockComment->StartOfTokenColumn -
  288. Changes[i].StartOfTokenColumn;
  289. }
  290. assert(Shift >= 0);
  291. Changes[i].Spaces += Shift;
  292. if (i + 1 != End)
  293. Changes[i + 1].PreviousEndOfTokenColumn += Shift;
  294. Changes[i].StartOfTokenColumn += Shift;
  295. }
  296. }
  297. void WhitespaceManager::alignEscapedNewlines() {
  298. unsigned MaxEndOfLine =
  299. Style.AlignEscapedNewlinesLeft ? 0 : Style.ColumnLimit;
  300. unsigned StartOfMacro = 0;
  301. for (unsigned i = 1, e = Changes.size(); i < e; ++i) {
  302. Change &C = Changes[i];
  303. if (C.NewlinesBefore > 0) {
  304. if (C.ContinuesPPDirective) {
  305. MaxEndOfLine = std::max(C.PreviousEndOfTokenColumn + 2, MaxEndOfLine);
  306. } else {
  307. alignEscapedNewlines(StartOfMacro + 1, i, MaxEndOfLine);
  308. MaxEndOfLine = Style.AlignEscapedNewlinesLeft ? 0 : Style.ColumnLimit;
  309. StartOfMacro = i;
  310. }
  311. }
  312. }
  313. alignEscapedNewlines(StartOfMacro + 1, Changes.size(), MaxEndOfLine);
  314. }
  315. void WhitespaceManager::alignEscapedNewlines(unsigned Start, unsigned End,
  316. unsigned Column) {
  317. for (unsigned i = Start; i < End; ++i) {
  318. Change &C = Changes[i];
  319. if (C.NewlinesBefore > 0) {
  320. assert(C.ContinuesPPDirective);
  321. if (C.PreviousEndOfTokenColumn + 1 > Column)
  322. C.EscapedNewlineColumn = 0;
  323. else
  324. C.EscapedNewlineColumn = Column;
  325. }
  326. }
  327. }
  328. void WhitespaceManager::generateChanges() {
  329. for (unsigned i = 0, e = Changes.size(); i != e; ++i) {
  330. const Change &C = Changes[i];
  331. if (i > 0) {
  332. assert(Changes[i - 1].OriginalWhitespaceRange.getBegin() !=
  333. C.OriginalWhitespaceRange.getBegin() &&
  334. "Generating two replacements for the same location");
  335. }
  336. if (C.CreateReplacement) {
  337. std::string ReplacementText = C.PreviousLinePostfix;
  338. if (C.ContinuesPPDirective)
  339. appendNewlineText(ReplacementText, C.NewlinesBefore,
  340. C.PreviousEndOfTokenColumn, C.EscapedNewlineColumn);
  341. else
  342. appendNewlineText(ReplacementText, C.NewlinesBefore);
  343. appendIndentText(ReplacementText, C.IndentLevel, std::max(0, C.Spaces),
  344. C.StartOfTokenColumn - std::max(0, C.Spaces));
  345. ReplacementText.append(C.CurrentLinePrefix);
  346. storeReplacement(C.OriginalWhitespaceRange, ReplacementText);
  347. }
  348. }
  349. }
  350. void WhitespaceManager::storeReplacement(const SourceRange &Range,
  351. StringRef Text) {
  352. unsigned WhitespaceLength = SourceMgr.getFileOffset(Range.getEnd()) -
  353. SourceMgr.getFileOffset(Range.getBegin());
  354. // Don't create a replacement, if it does not change anything.
  355. if (StringRef(SourceMgr.getCharacterData(Range.getBegin()),
  356. WhitespaceLength) == Text)
  357. return;
  358. Replaces.insert(tooling::Replacement(
  359. SourceMgr, CharSourceRange::getCharRange(Range), Text));
  360. }
  361. void WhitespaceManager::appendNewlineText(std::string &Text,
  362. unsigned Newlines) {
  363. for (unsigned i = 0; i < Newlines; ++i)
  364. Text.append(UseCRLF ? "\r\n" : "\n");
  365. }
  366. void WhitespaceManager::appendNewlineText(std::string &Text, unsigned Newlines,
  367. unsigned PreviousEndOfTokenColumn,
  368. unsigned EscapedNewlineColumn) {
  369. if (Newlines > 0) {
  370. unsigned Offset =
  371. std::min<int>(EscapedNewlineColumn - 1, PreviousEndOfTokenColumn);
  372. for (unsigned i = 0; i < Newlines; ++i) {
  373. Text.append(EscapedNewlineColumn - Offset - 1, ' ');
  374. Text.append(UseCRLF ? "\\\r\n" : "\\\n");
  375. Offset = 0;
  376. }
  377. }
  378. }
  379. void WhitespaceManager::appendIndentText(std::string &Text,
  380. unsigned IndentLevel, unsigned Spaces,
  381. unsigned WhitespaceStartColumn) {
  382. switch (Style.UseTab) {
  383. case FormatStyle::UT_Never:
  384. Text.append(Spaces, ' ');
  385. break;
  386. case FormatStyle::UT_Always: {
  387. unsigned FirstTabWidth =
  388. Style.TabWidth - WhitespaceStartColumn % Style.TabWidth;
  389. // Indent with tabs only when there's at least one full tab.
  390. if (FirstTabWidth + Style.TabWidth <= Spaces) {
  391. Spaces -= FirstTabWidth;
  392. Text.append("\t");
  393. }
  394. Text.append(Spaces / Style.TabWidth, '\t');
  395. Text.append(Spaces % Style.TabWidth, ' ');
  396. break;
  397. }
  398. case FormatStyle::UT_ForIndentation:
  399. if (WhitespaceStartColumn == 0) {
  400. unsigned Indentation = IndentLevel * Style.IndentWidth;
  401. // This happens, e.g. when a line in a block comment is indented less than
  402. // the first one.
  403. if (Indentation > Spaces)
  404. Indentation = Spaces;
  405. unsigned Tabs = Indentation / Style.TabWidth;
  406. Text.append(Tabs, '\t');
  407. Spaces -= Tabs * Style.TabWidth;
  408. }
  409. Text.append(Spaces, ' ');
  410. break;
  411. }
  412. }
  413. } // namespace format
  414. } // namespace clang