CbC/CbC_llvm: clang/lib/Format/BreakableToken.cpp annotate

annotate clang/lib/Format/BreakableToken.cpp @ 150:1d019706d866

LLVM10

author	anatofuz
date	Thu, 13 Feb 2020 15:10:13 +0900
parents
children	0572611fdcc8

rev	line source
150 1d019706d866 LLVM10 anatofuz parents: diff changeset	1 //===--- BreakableToken.cpp - Format C++ code -----------------------------===//
1d019706d866 LLVM10 anatofuz parents: diff changeset	2 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
1d019706d866 LLVM10 anatofuz parents: diff changeset	4 // See https://llvm.org/LICENSE.txt for license information.
1d019706d866 LLVM10 anatofuz parents: diff changeset	5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
1d019706d866 LLVM10 anatofuz parents: diff changeset	6 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	7 //===----------------------------------------------------------------------===//
1d019706d866 LLVM10 anatofuz parents: diff changeset	8 ///
1d019706d866 LLVM10 anatofuz parents: diff changeset	9 /// \file
1d019706d866 LLVM10 anatofuz parents: diff changeset	10 /// Contains implementation of BreakableToken class and classes derived
1d019706d866 LLVM10 anatofuz parents: diff changeset	11 /// from it.
1d019706d866 LLVM10 anatofuz parents: diff changeset	12 ///
1d019706d866 LLVM10 anatofuz parents: diff changeset	13 //===----------------------------------------------------------------------===//
1d019706d866 LLVM10 anatofuz parents: diff changeset	14
1d019706d866 LLVM10 anatofuz parents: diff changeset	15 #include "BreakableToken.h"
1d019706d866 LLVM10 anatofuz parents: diff changeset	16 #include "ContinuationIndenter.h"
1d019706d866 LLVM10 anatofuz parents: diff changeset	17 #include "clang/Basic/CharInfo.h"
1d019706d866 LLVM10 anatofuz parents: diff changeset	18 #include "clang/Format/Format.h"
1d019706d866 LLVM10 anatofuz parents: diff changeset	19 #include "llvm/ADT/STLExtras.h"
1d019706d866 LLVM10 anatofuz parents: diff changeset	20 #include "llvm/Support/Debug.h"
1d019706d866 LLVM10 anatofuz parents: diff changeset	21 #include <algorithm>
1d019706d866 LLVM10 anatofuz parents: diff changeset	22
1d019706d866 LLVM10 anatofuz parents: diff changeset	23 #define DEBUG_TYPE "format-token-breaker"
1d019706d866 LLVM10 anatofuz parents: diff changeset	24
1d019706d866 LLVM10 anatofuz parents: diff changeset	25 namespace clang {
1d019706d866 LLVM10 anatofuz parents: diff changeset	26 namespace format {
1d019706d866 LLVM10 anatofuz parents: diff changeset	27
/// The set of characters treated as horizontal blanks when splitting tokens.
/// Note that '\n' is deliberately not part of this set.
static const char *const Blanks = " \t\v\f\r";

/// Returns true if \p C is one of the characters listed in Blanks
/// (space, tab, vertical tab, form feed or carriage return).
static bool IsBlank(char C) {
  return C == ' ' || C == '\t' || C == '\v' || C == '\f' || C == '\r';
}
1d019706d866 LLVM10 anatofuz parents: diff changeset	41
1d019706d866 LLVM10 anatofuz parents: diff changeset	42 static StringRef getLineCommentIndentPrefix(StringRef Comment,
1d019706d866 LLVM10 anatofuz parents: diff changeset	43 const FormatStyle &Style) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	44 static const char *const KnownCStylePrefixes[] = {"///<", "//!<", "///", "//",
1d019706d866 LLVM10 anatofuz parents: diff changeset	45 "//!"};
1d019706d866 LLVM10 anatofuz parents: diff changeset	46 static const char *const KnownTextProtoPrefixes[] = {"//", "#", "##", "###",
1d019706d866 LLVM10 anatofuz parents: diff changeset	47 "####"};
1d019706d866 LLVM10 anatofuz parents: diff changeset	48 ArrayRef<const char *> KnownPrefixes(KnownCStylePrefixes);
1d019706d866 LLVM10 anatofuz parents: diff changeset	49 if (Style.Language == FormatStyle::LK_TextProto)
1d019706d866 LLVM10 anatofuz parents: diff changeset	50 KnownPrefixes = KnownTextProtoPrefixes;
1d019706d866 LLVM10 anatofuz parents: diff changeset	51
1d019706d866 LLVM10 anatofuz parents: diff changeset	52 StringRef LongestPrefix;
1d019706d866 LLVM10 anatofuz parents: diff changeset	53 for (StringRef KnownPrefix : KnownPrefixes) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	54 if (Comment.startswith(KnownPrefix)) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	55 size_t PrefixLength = KnownPrefix.size();
1d019706d866 LLVM10 anatofuz parents: diff changeset	56 while (PrefixLength < Comment.size() && Comment[PrefixLength] == ' ')
1d019706d866 LLVM10 anatofuz parents: diff changeset	57 ++PrefixLength;
1d019706d866 LLVM10 anatofuz parents: diff changeset	58 if (PrefixLength > LongestPrefix.size())
1d019706d866 LLVM10 anatofuz parents: diff changeset	59 LongestPrefix = Comment.substr(0, PrefixLength);
1d019706d866 LLVM10 anatofuz parents: diff changeset	60 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	61 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	62 return LongestPrefix;
1d019706d866 LLVM10 anatofuz parents: diff changeset	63 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	64
1d019706d866 LLVM10 anatofuz parents: diff changeset	65 static BreakableToken::Split
1d019706d866 LLVM10 anatofuz parents: diff changeset	66 getCommentSplit(StringRef Text, unsigned ContentStartColumn,
1d019706d866 LLVM10 anatofuz parents: diff changeset	67 unsigned ColumnLimit, unsigned TabWidth,
1d019706d866 LLVM10 anatofuz parents: diff changeset	68 encoding::Encoding Encoding, const FormatStyle &Style,
1d019706d866 LLVM10 anatofuz parents: diff changeset	69 bool DecorationEndsWithStar = false) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	70 LLVM_DEBUG(llvm::dbgs() << "Comment split: \"" << Text
1d019706d866 LLVM10 anatofuz parents: diff changeset	71 << "\", Column limit: " << ColumnLimit
1d019706d866 LLVM10 anatofuz parents: diff changeset	72 << ", Content start: " << ContentStartColumn << "\n");
1d019706d866 LLVM10 anatofuz parents: diff changeset	73 if (ColumnLimit <= ContentStartColumn + 1)
1d019706d866 LLVM10 anatofuz parents: diff changeset	74 return BreakableToken::Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	75
1d019706d866 LLVM10 anatofuz parents: diff changeset	76 unsigned MaxSplit = ColumnLimit - ContentStartColumn + 1;
1d019706d866 LLVM10 anatofuz parents: diff changeset	77 unsigned MaxSplitBytes = 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	78
1d019706d866 LLVM10 anatofuz parents: diff changeset	79 for (unsigned NumChars = 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	80 NumChars < MaxSplit && MaxSplitBytes < Text.size();) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	81 unsigned BytesInChar =
1d019706d866 LLVM10 anatofuz parents: diff changeset	82 encoding::getCodePointNumBytes(Text[MaxSplitBytes], Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	83 NumChars +=
1d019706d866 LLVM10 anatofuz parents: diff changeset	84 encoding::columnWidthWithTabs(Text.substr(MaxSplitBytes, BytesInChar),
1d019706d866 LLVM10 anatofuz parents: diff changeset	85 ContentStartColumn, TabWidth, Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	86 MaxSplitBytes += BytesInChar;
1d019706d866 LLVM10 anatofuz parents: diff changeset	87 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	88
1d019706d866 LLVM10 anatofuz parents: diff changeset	89 StringRef::size_type SpaceOffset = Text.find_last_of(Blanks, MaxSplitBytes);
1d019706d866 LLVM10 anatofuz parents: diff changeset	90
1d019706d866 LLVM10 anatofuz parents: diff changeset	91 static const auto kNumberedListRegexp = llvm::Regex("^[1-9][0-9]?\\.");
1d019706d866 LLVM10 anatofuz parents: diff changeset	92 while (SpaceOffset != StringRef::npos) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	93 // Do not split before a number followed by a dot: this would be interpreted
1d019706d866 LLVM10 anatofuz parents: diff changeset	94 // as a numbered list, which would prevent re-flowing in subsequent passes.
1d019706d866 LLVM10 anatofuz parents: diff changeset	95 if (kNumberedListRegexp.match(Text.substr(SpaceOffset).ltrim(Blanks)))
1d019706d866 LLVM10 anatofuz parents: diff changeset	96 SpaceOffset = Text.find_last_of(Blanks, SpaceOffset);
1d019706d866 LLVM10 anatofuz parents: diff changeset	97 // In JavaScript, some @tags can be followed by {, and machinery that parses
1d019706d866 LLVM10 anatofuz parents: diff changeset	98 // these comments will fail to understand the comment if followed by a line
1d019706d866 LLVM10 anatofuz parents: diff changeset	99 // break. So avoid ever breaking before a {.
1d019706d866 LLVM10 anatofuz parents: diff changeset	100 else if (Style.Language == FormatStyle::LK_JavaScript &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	101 SpaceOffset + 1 < Text.size() && Text[SpaceOffset + 1] == '{')
1d019706d866 LLVM10 anatofuz parents: diff changeset	102 SpaceOffset = Text.find_last_of(Blanks, SpaceOffset);
1d019706d866 LLVM10 anatofuz parents: diff changeset	103 else
1d019706d866 LLVM10 anatofuz parents: diff changeset	104 break;
1d019706d866 LLVM10 anatofuz parents: diff changeset	105 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	106
1d019706d866 LLVM10 anatofuz parents: diff changeset	107 if (SpaceOffset == StringRef::npos \|\|
1d019706d866 LLVM10 anatofuz parents: diff changeset	108 // Don't break at leading whitespace.
1d019706d866 LLVM10 anatofuz parents: diff changeset	109 Text.find_last_not_of(Blanks, SpaceOffset) == StringRef::npos) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	110 // Make sure that we don't break at leading whitespace that
1d019706d866 LLVM10 anatofuz parents: diff changeset	111 // reaches past MaxSplit.
1d019706d866 LLVM10 anatofuz parents: diff changeset	112 StringRef::size_type FirstNonWhitespace = Text.find_first_not_of(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	113 if (FirstNonWhitespace == StringRef::npos)
1d019706d866 LLVM10 anatofuz parents: diff changeset	114 // If the comment is only whitespace, we cannot split.
1d019706d866 LLVM10 anatofuz parents: diff changeset	115 return BreakableToken::Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	116 SpaceOffset = Text.find_first_of(
1d019706d866 LLVM10 anatofuz parents: diff changeset	117 Blanks, std::max<unsigned>(MaxSplitBytes, FirstNonWhitespace));
1d019706d866 LLVM10 anatofuz parents: diff changeset	118 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	119 if (SpaceOffset != StringRef::npos && SpaceOffset != 0) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	120 // adaptStartOfLine will break after lines starting with /** if the comment
1d019706d866 LLVM10 anatofuz parents: diff changeset	121 // is broken anywhere. Avoid emitting this break twice here.
1d019706d866 LLVM10 anatofuz parents: diff changeset	122 // Example: in /** longtextcomesherethatbreaks */ (with ColumnLimit 20) will
1d019706d866 LLVM10 anatofuz parents: diff changeset	123 // insert a break after /**, so this code must not insert the same break.
1d019706d866 LLVM10 anatofuz parents: diff changeset	124 if (SpaceOffset == 1 && Text[SpaceOffset - 1] == '*')
1d019706d866 LLVM10 anatofuz parents: diff changeset	125 return BreakableToken::Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	126 StringRef BeforeCut = Text.substr(0, SpaceOffset).rtrim(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	127 StringRef AfterCut = Text.substr(SpaceOffset);
1d019706d866 LLVM10 anatofuz parents: diff changeset	128 // Don't trim the leading blanks if it would create a */ after the break.
1d019706d866 LLVM10 anatofuz parents: diff changeset	129 if (!DecorationEndsWithStar \|\| AfterCut.size() <= 1 \|\| AfterCut[1] != '/')
1d019706d866 LLVM10 anatofuz parents: diff changeset	130 AfterCut = AfterCut.ltrim(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	131 return BreakableToken::Split(BeforeCut.size(),
1d019706d866 LLVM10 anatofuz parents: diff changeset	132 AfterCut.begin() - BeforeCut.end());
1d019706d866 LLVM10 anatofuz parents: diff changeset	133 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	134 return BreakableToken::Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	135 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	136
1d019706d866 LLVM10 anatofuz parents: diff changeset	137 static BreakableToken::Split
1d019706d866 LLVM10 anatofuz parents: diff changeset	138 getStringSplit(StringRef Text, unsigned UsedColumns, unsigned ColumnLimit,
1d019706d866 LLVM10 anatofuz parents: diff changeset	139 unsigned TabWidth, encoding::Encoding Encoding) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	140 // FIXME: Reduce unit test case.
1d019706d866 LLVM10 anatofuz parents: diff changeset	141 if (Text.empty())
1d019706d866 LLVM10 anatofuz parents: diff changeset	142 return BreakableToken::Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	143 if (ColumnLimit <= UsedColumns)
1d019706d866 LLVM10 anatofuz parents: diff changeset	144 return BreakableToken::Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	145 unsigned MaxSplit = ColumnLimit - UsedColumns;
1d019706d866 LLVM10 anatofuz parents: diff changeset	146 StringRef::size_type SpaceOffset = 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	147 StringRef::size_type SlashOffset = 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	148 StringRef::size_type WordStartOffset = 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	149 StringRef::size_type SplitPoint = 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	150 for (unsigned Chars = 0;;) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	151 unsigned Advance;
1d019706d866 LLVM10 anatofuz parents: diff changeset	152 if (Text[0] == '\\') {
1d019706d866 LLVM10 anatofuz parents: diff changeset	153 Advance = encoding::getEscapeSequenceLength(Text);
1d019706d866 LLVM10 anatofuz parents: diff changeset	154 Chars += Advance;
1d019706d866 LLVM10 anatofuz parents: diff changeset	155 } else {
1d019706d866 LLVM10 anatofuz parents: diff changeset	156 Advance = encoding::getCodePointNumBytes(Text[0], Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	157 Chars += encoding::columnWidthWithTabs(
1d019706d866 LLVM10 anatofuz parents: diff changeset	158 Text.substr(0, Advance), UsedColumns + Chars, TabWidth, Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	159 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	160
1d019706d866 LLVM10 anatofuz parents: diff changeset	161 if (Chars > MaxSplit \|\| Text.size() <= Advance)
1d019706d866 LLVM10 anatofuz parents: diff changeset	162 break;
1d019706d866 LLVM10 anatofuz parents: diff changeset	163
1d019706d866 LLVM10 anatofuz parents: diff changeset	164 if (IsBlank(Text[0]))
1d019706d866 LLVM10 anatofuz parents: diff changeset	165 SpaceOffset = SplitPoint;
1d019706d866 LLVM10 anatofuz parents: diff changeset	166 if (Text[0] == '/')
1d019706d866 LLVM10 anatofuz parents: diff changeset	167 SlashOffset = SplitPoint;
1d019706d866 LLVM10 anatofuz parents: diff changeset	168 if (Advance == 1 && !isAlphanumeric(Text[0]))
1d019706d866 LLVM10 anatofuz parents: diff changeset	169 WordStartOffset = SplitPoint;
1d019706d866 LLVM10 anatofuz parents: diff changeset	170
1d019706d866 LLVM10 anatofuz parents: diff changeset	171 SplitPoint += Advance;
1d019706d866 LLVM10 anatofuz parents: diff changeset	172 Text = Text.substr(Advance);
1d019706d866 LLVM10 anatofuz parents: diff changeset	173 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	174
1d019706d866 LLVM10 anatofuz parents: diff changeset	175 if (SpaceOffset != 0)
1d019706d866 LLVM10 anatofuz parents: diff changeset	176 return BreakableToken::Split(SpaceOffset + 1, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	177 if (SlashOffset != 0)
1d019706d866 LLVM10 anatofuz parents: diff changeset	178 return BreakableToken::Split(SlashOffset + 1, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	179 if (WordStartOffset != 0)
1d019706d866 LLVM10 anatofuz parents: diff changeset	180 return BreakableToken::Split(WordStartOffset + 1, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	181 if (SplitPoint != 0)
1d019706d866 LLVM10 anatofuz parents: diff changeset	182 return BreakableToken::Split(SplitPoint, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	183 return BreakableToken::Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	184 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	185
1d019706d866 LLVM10 anatofuz parents: diff changeset	186 bool switchesFormatting(const FormatToken &Token) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	187 assert((Token.is(TT_BlockComment) \|\| Token.is(TT_LineComment)) &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	188 "formatting regions are switched by comment tokens");
1d019706d866 LLVM10 anatofuz parents: diff changeset	189 StringRef Content = Token.TokenText.substr(2).ltrim();
1d019706d866 LLVM10 anatofuz parents: diff changeset	190 return Content.startswith("clang-format on") \|\|
1d019706d866 LLVM10 anatofuz parents: diff changeset	191 Content.startswith("clang-format off");
1d019706d866 LLVM10 anatofuz parents: diff changeset	192 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	193
1d019706d866 LLVM10 anatofuz parents: diff changeset	194 unsigned
1d019706d866 LLVM10 anatofuz parents: diff changeset	195 BreakableToken::getLengthAfterCompression(unsigned RemainingTokenColumns,
1d019706d866 LLVM10 anatofuz parents: diff changeset	196 Split Split) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	197 // Example: consider the content
1d019706d866 LLVM10 anatofuz parents: diff changeset	198 // lala lala
1d019706d866 LLVM10 anatofuz parents: diff changeset	199 // - RemainingTokenColumns is the original number of columns, 10;
1d019706d866 LLVM10 anatofuz parents: diff changeset	200 // - Split is (4, 2), denoting the two spaces between the two words;
1d019706d866 LLVM10 anatofuz parents: diff changeset	201 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	202 // We compute the number of columns when the split is compressed into a single
1d019706d866 LLVM10 anatofuz parents: diff changeset	203 // space, like:
1d019706d866 LLVM10 anatofuz parents: diff changeset	204 // lala lala
1d019706d866 LLVM10 anatofuz parents: diff changeset	205 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	206 // FIXME: Correctly measure the length of whitespace in Split.second so it
1d019706d866 LLVM10 anatofuz parents: diff changeset	207 // works with tabs.
1d019706d866 LLVM10 anatofuz parents: diff changeset	208 return RemainingTokenColumns + 1 - Split.second;
1d019706d866 LLVM10 anatofuz parents: diff changeset	209 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	210
1d019706d866 LLVM10 anatofuz parents: diff changeset	211 unsigned BreakableStringLiteral::getLineCount() const { return 1; }
1d019706d866 LLVM10 anatofuz parents: diff changeset	212
1d019706d866 LLVM10 anatofuz parents: diff changeset	213 unsigned BreakableStringLiteral::getRangeLength(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	214 unsigned Offset,
1d019706d866 LLVM10 anatofuz parents: diff changeset	215 StringRef::size_type Length,
1d019706d866 LLVM10 anatofuz parents: diff changeset	216 unsigned StartColumn) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	217 llvm_unreachable("Getting the length of a part of the string literal "
1d019706d866 LLVM10 anatofuz parents: diff changeset	218 "indicates that the code tries to reflow it.");
1d019706d866 LLVM10 anatofuz parents: diff changeset	219 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	220
1d019706d866 LLVM10 anatofuz parents: diff changeset	221 unsigned
1d019706d866 LLVM10 anatofuz parents: diff changeset	222 BreakableStringLiteral::getRemainingLength(unsigned LineIndex, unsigned Offset,
1d019706d866 LLVM10 anatofuz parents: diff changeset	223 unsigned StartColumn) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	224 return UnbreakableTailLength + Postfix.size() +
1d019706d866 LLVM10 anatofuz parents: diff changeset	225 encoding::columnWidthWithTabs(Line.substr(Offset, StringRef::npos),
1d019706d866 LLVM10 anatofuz parents: diff changeset	226 StartColumn, Style.TabWidth, Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	227 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	228
1d019706d866 LLVM10 anatofuz parents: diff changeset	229 unsigned BreakableStringLiteral::getContentStartColumn(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	230 bool Break) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	231 return StartColumn + Prefix.size();
1d019706d866 LLVM10 anatofuz parents: diff changeset	232 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	233
1d019706d866 LLVM10 anatofuz parents: diff changeset	234 BreakableStringLiteral::BreakableStringLiteral(
1d019706d866 LLVM10 anatofuz parents: diff changeset	235 const FormatToken &Tok, unsigned StartColumn, StringRef Prefix,
1d019706d866 LLVM10 anatofuz parents: diff changeset	236 StringRef Postfix, unsigned UnbreakableTailLength, bool InPPDirective,
1d019706d866 LLVM10 anatofuz parents: diff changeset	237 encoding::Encoding Encoding, const FormatStyle &Style)
1d019706d866 LLVM10 anatofuz parents: diff changeset	238 : BreakableToken(Tok, InPPDirective, Encoding, Style),
1d019706d866 LLVM10 anatofuz parents: diff changeset	239 StartColumn(StartColumn), Prefix(Prefix), Postfix(Postfix),
1d019706d866 LLVM10 anatofuz parents: diff changeset	240 UnbreakableTailLength(UnbreakableTailLength) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	241 assert(Tok.TokenText.startswith(Prefix) && Tok.TokenText.endswith(Postfix));
1d019706d866 LLVM10 anatofuz parents: diff changeset	242 Line = Tok.TokenText.substr(
1d019706d866 LLVM10 anatofuz parents: diff changeset	243 Prefix.size(), Tok.TokenText.size() - Prefix.size() - Postfix.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	244 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	245
1d019706d866 LLVM10 anatofuz parents: diff changeset	246 BreakableToken::Split BreakableStringLiteral::getSplit(
1d019706d866 LLVM10 anatofuz parents: diff changeset	247 unsigned LineIndex, unsigned TailOffset, unsigned ColumnLimit,
1d019706d866 LLVM10 anatofuz parents: diff changeset	248 unsigned ContentStartColumn, const llvm::Regex &CommentPragmasRegex) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	249 return getStringSplit(Line.substr(TailOffset), ContentStartColumn,
1d019706d866 LLVM10 anatofuz parents: diff changeset	250 ColumnLimit - Postfix.size(), Style.TabWidth, Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	251 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	252
1d019706d866 LLVM10 anatofuz parents: diff changeset	253 void BreakableStringLiteral::insertBreak(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	254 unsigned TailOffset, Split Split,
1d019706d866 LLVM10 anatofuz parents: diff changeset	255 unsigned ContentIndent,
1d019706d866 LLVM10 anatofuz parents: diff changeset	256 WhitespaceManager &Whitespaces) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	257 Whitespaces.replaceWhitespaceInToken(
1d019706d866 LLVM10 anatofuz parents: diff changeset	258 Tok, Prefix.size() + TailOffset + Split.first, Split.second, Postfix,
1d019706d866 LLVM10 anatofuz parents: diff changeset	259 Prefix, InPPDirective, 1, StartColumn);
1d019706d866 LLVM10 anatofuz parents: diff changeset	260 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	261
1d019706d866 LLVM10 anatofuz parents: diff changeset	262 BreakableComment::BreakableComment(const FormatToken &Token,
1d019706d866 LLVM10 anatofuz parents: diff changeset	263 unsigned StartColumn, bool InPPDirective,
1d019706d866 LLVM10 anatofuz parents: diff changeset	264 encoding::Encoding Encoding,
1d019706d866 LLVM10 anatofuz parents: diff changeset	265 const FormatStyle &Style)
1d019706d866 LLVM10 anatofuz parents: diff changeset	266 : BreakableToken(Token, InPPDirective, Encoding, Style),
1d019706d866 LLVM10 anatofuz parents: diff changeset	267 StartColumn(StartColumn) {}
1d019706d866 LLVM10 anatofuz parents: diff changeset	268
1d019706d866 LLVM10 anatofuz parents: diff changeset	269 unsigned BreakableComment::getLineCount() const { return Lines.size(); }
1d019706d866 LLVM10 anatofuz parents: diff changeset	270
1d019706d866 LLVM10 anatofuz parents: diff changeset	271 BreakableToken::Split
1d019706d866 LLVM10 anatofuz parents: diff changeset	272 BreakableComment::getSplit(unsigned LineIndex, unsigned TailOffset,
1d019706d866 LLVM10 anatofuz parents: diff changeset	273 unsigned ColumnLimit, unsigned ContentStartColumn,
1d019706d866 LLVM10 anatofuz parents: diff changeset	274 const llvm::Regex &CommentPragmasRegex) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	275 // Don't break lines matching the comment pragmas regex.
1d019706d866 LLVM10 anatofuz parents: diff changeset	276 if (CommentPragmasRegex.match(Content[LineIndex]))
1d019706d866 LLVM10 anatofuz parents: diff changeset	277 return Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	278 return getCommentSplit(Content[LineIndex].substr(TailOffset),
1d019706d866 LLVM10 anatofuz parents: diff changeset	279 ContentStartColumn, ColumnLimit, Style.TabWidth,
1d019706d866 LLVM10 anatofuz parents: diff changeset	280 Encoding, Style);
1d019706d866 LLVM10 anatofuz parents: diff changeset	281 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	282
1d019706d866 LLVM10 anatofuz parents: diff changeset	283 void BreakableComment::compressWhitespace(
1d019706d866 LLVM10 anatofuz parents: diff changeset	284 unsigned LineIndex, unsigned TailOffset, Split Split,
1d019706d866 LLVM10 anatofuz parents: diff changeset	285 WhitespaceManager &Whitespaces) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	286 StringRef Text = Content[LineIndex].substr(TailOffset);
1d019706d866 LLVM10 anatofuz parents: diff changeset	287 // Text is relative to the content line, but Whitespaces operates relative to
1d019706d866 LLVM10 anatofuz parents: diff changeset	288 // the start of the corresponding token, so compute the start of the Split
1d019706d866 LLVM10 anatofuz parents: diff changeset	289 // that needs to be compressed into a single space relative to the start of
1d019706d866 LLVM10 anatofuz parents: diff changeset	290 // its token.
1d019706d866 LLVM10 anatofuz parents: diff changeset	291 unsigned BreakOffsetInToken =
1d019706d866 LLVM10 anatofuz parents: diff changeset	292 Text.data() - tokenAt(LineIndex).TokenText.data() + Split.first;
1d019706d866 LLVM10 anatofuz parents: diff changeset	293 unsigned CharsToRemove = Split.second;
1d019706d866 LLVM10 anatofuz parents: diff changeset	294 Whitespaces.replaceWhitespaceInToken(
1d019706d866 LLVM10 anatofuz parents: diff changeset	295 tokenAt(LineIndex), BreakOffsetInToken, CharsToRemove, "", "",
1d019706d866 LLVM10 anatofuz parents: diff changeset	296 /InPPDirective=/false, /Newlines=/0, /Spaces=/1);
1d019706d866 LLVM10 anatofuz parents: diff changeset	297 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	298
1d019706d866 LLVM10 anatofuz parents: diff changeset	299 const FormatToken &BreakableComment::tokenAt(unsigned LineIndex) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	300 return Tokens[LineIndex] ? *Tokens[LineIndex] : Tok;
1d019706d866 LLVM10 anatofuz parents: diff changeset	301 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	302
1d019706d866 LLVM10 anatofuz parents: diff changeset	303 static bool mayReflowContent(StringRef Content) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	304 Content = Content.trim(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	305 // Lines starting with '@' commonly have special meaning.
1d019706d866 LLVM10 anatofuz parents: diff changeset	306 // Lines starting with '-', '-#', '+' or '*' are bulleted/numbered lists.
1d019706d866 LLVM10 anatofuz parents: diff changeset	307 bool hasSpecialMeaningPrefix = false;
1d019706d866 LLVM10 anatofuz parents: diff changeset	308 for (StringRef Prefix :
1d019706d866 LLVM10 anatofuz parents: diff changeset	309 {"@", "TODO", "FIXME", "XXX", "-# ", "- ", "+ ", "* "}) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	310 if (Content.startswith(Prefix)) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	311 hasSpecialMeaningPrefix = true;
1d019706d866 LLVM10 anatofuz parents: diff changeset	312 break;
1d019706d866 LLVM10 anatofuz parents: diff changeset	313 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	314 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	315
1d019706d866 LLVM10 anatofuz parents: diff changeset	316 // Numbered lists may also start with a number followed by '.'
1d019706d866 LLVM10 anatofuz parents: diff changeset	317 // To avoid issues if a line starts with a number which is actually the end
1d019706d866 LLVM10 anatofuz parents: diff changeset	318 // of a previous line, we only consider numbers with up to 2 digits.
1d019706d866 LLVM10 anatofuz parents: diff changeset	319 static const auto kNumberedListRegexp = llvm::Regex("^[1-9][0-9]?\\. ");
1d019706d866 LLVM10 anatofuz parents: diff changeset	320 hasSpecialMeaningPrefix =
1d019706d866 LLVM10 anatofuz parents: diff changeset	321 hasSpecialMeaningPrefix \|\| kNumberedListRegexp.match(Content);
1d019706d866 LLVM10 anatofuz parents: diff changeset	322
1d019706d866 LLVM10 anatofuz parents: diff changeset	323 // Simple heuristic for what to reflow: content should contain at least two
1d019706d866 LLVM10 anatofuz parents: diff changeset	324 // characters and either the first or second character must be
1d019706d866 LLVM10 anatofuz parents: diff changeset	325 // non-punctuation.
1d019706d866 LLVM10 anatofuz parents: diff changeset	326 return Content.size() >= 2 && !hasSpecialMeaningPrefix &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	327 !Content.endswith("\\") &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	328 // Note that this is UTF-8 safe, since if isPunctuation(Content[0]) is
1d019706d866 LLVM10 anatofuz parents: diff changeset	329 // true, then the first code point must be 1 byte long.
1d019706d866 LLVM10 anatofuz parents: diff changeset	330 (!isPunctuation(Content[0]) \|\| !isPunctuation(Content[1]));
1d019706d866 LLVM10 anatofuz parents: diff changeset	331 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	332
1d019706d866 LLVM10 anatofuz parents: diff changeset	333 BreakableBlockComment::BreakableBlockComment(
1d019706d866 LLVM10 anatofuz parents: diff changeset	334 const FormatToken &Token, unsigned StartColumn,
1d019706d866 LLVM10 anatofuz parents: diff changeset	335 unsigned OriginalStartColumn, bool FirstInLine, bool InPPDirective,
1d019706d866 LLVM10 anatofuz parents: diff changeset	336 encoding::Encoding Encoding, const FormatStyle &Style, bool UseCRLF)
1d019706d866 LLVM10 anatofuz parents: diff changeset	337 : BreakableComment(Token, StartColumn, InPPDirective, Encoding, Style),
1d019706d866 LLVM10 anatofuz parents: diff changeset	338 DelimitersOnNewline(false),
1d019706d866 LLVM10 anatofuz parents: diff changeset	339 UnbreakableTailLength(Token.UnbreakableTailLength) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	340 assert(Tok.is(TT_BlockComment) &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	341 "block comment section must start with a block comment");
1d019706d866 LLVM10 anatofuz parents: diff changeset	342
1d019706d866 LLVM10 anatofuz parents: diff changeset	343 StringRef TokenText(Tok.TokenText);
1d019706d866 LLVM10 anatofuz parents: diff changeset	344 assert(TokenText.startswith("/") && TokenText.endswith("/"));
1d019706d866 LLVM10 anatofuz parents: diff changeset	345 TokenText.substr(2, TokenText.size() - 4)
1d019706d866 LLVM10 anatofuz parents: diff changeset	346 .split(Lines, UseCRLF ? "\r\n" : "\n");
1d019706d866 LLVM10 anatofuz parents: diff changeset	347
1d019706d866 LLVM10 anatofuz parents: diff changeset	348 int IndentDelta = StartColumn - OriginalStartColumn;
1d019706d866 LLVM10 anatofuz parents: diff changeset	349 Content.resize(Lines.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	350 Content[0] = Lines[0];
1d019706d866 LLVM10 anatofuz parents: diff changeset	351 ContentColumn.resize(Lines.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	352 // Account for the initial '/*'.
1d019706d866 LLVM10 anatofuz parents: diff changeset	353 ContentColumn[0] = StartColumn + 2;
1d019706d866 LLVM10 anatofuz parents: diff changeset	354 Tokens.resize(Lines.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	355 for (size_t i = 1; i < Lines.size(); ++i)
1d019706d866 LLVM10 anatofuz parents: diff changeset	356 adjustWhitespace(i, IndentDelta);
1d019706d866 LLVM10 anatofuz parents: diff changeset	357
1d019706d866 LLVM10 anatofuz parents: diff changeset	358 // Align decorations with the column of the star on the first line,
1d019706d866 LLVM10 anatofuz parents: diff changeset	359 // that is one column after the start "/*".
1d019706d866 LLVM10 anatofuz parents: diff changeset	360 DecorationColumn = StartColumn + 1;
1d019706d866 LLVM10 anatofuz parents: diff changeset	361
1d019706d866 LLVM10 anatofuz parents: diff changeset	362 // Account for comment decoration patterns like this:
1d019706d866 LLVM10 anatofuz parents: diff changeset	363 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	364 // /*
1d019706d866 LLVM10 anatofuz parents: diff changeset	365 // ** blah blah blah
1d019706d866 LLVM10 anatofuz parents: diff changeset	366 // */
1d019706d866 LLVM10 anatofuz parents: diff changeset	367 if (Lines.size() >= 2 && Content[1].startswith("**") &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	368 static_cast<unsigned>(ContentColumn[1]) == StartColumn) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	369 DecorationColumn = StartColumn;
1d019706d866 LLVM10 anatofuz parents: diff changeset	370 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	371
1d019706d866 LLVM10 anatofuz parents: diff changeset	372 Decoration = "* ";
1d019706d866 LLVM10 anatofuz parents: diff changeset	373 if (Lines.size() == 1 && !FirstInLine) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	374 // Comments for which FirstInLine is false can start on arbitrary column,
1d019706d866 LLVM10 anatofuz parents: diff changeset	375 // and available horizontal space can be too small to align consecutive
1d019706d866 LLVM10 anatofuz parents: diff changeset	376 // lines with the first one.
1d019706d866 LLVM10 anatofuz parents: diff changeset	377 // FIXME: We could, probably, align them to current indentation level, but
1d019706d866 LLVM10 anatofuz parents: diff changeset	378 // now we just wrap them without stars.
1d019706d866 LLVM10 anatofuz parents: diff changeset	379 Decoration = "";
1d019706d866 LLVM10 anatofuz parents: diff changeset	380 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	381 for (size_t i = 1, e = Lines.size(); i < e && !Decoration.empty(); ++i) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	382 // If the last line is empty, the closing "*/" will have a star.
1d019706d866 LLVM10 anatofuz parents: diff changeset	383 if (i + 1 == e && Content[i].empty())
1d019706d866 LLVM10 anatofuz parents: diff changeset	384 break;
1d019706d866 LLVM10 anatofuz parents: diff changeset	385 if (!Content[i].empty() && i + 1 != e && Decoration.startswith(Content[i]))
1d019706d866 LLVM10 anatofuz parents: diff changeset	386 continue;
1d019706d866 LLVM10 anatofuz parents: diff changeset	387 while (!Content[i].startswith(Decoration))
1d019706d866 LLVM10 anatofuz parents: diff changeset	388 Decoration = Decoration.substr(0, Decoration.size() - 1);
1d019706d866 LLVM10 anatofuz parents: diff changeset	389 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	390
1d019706d866 LLVM10 anatofuz parents: diff changeset	391 LastLineNeedsDecoration = true;
1d019706d866 LLVM10 anatofuz parents: diff changeset	392 IndentAtLineBreak = ContentColumn[0] + 1;
1d019706d866 LLVM10 anatofuz parents: diff changeset	393 for (size_t i = 1, e = Lines.size(); i < e; ++i) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	394 if (Content[i].empty()) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	395 if (i + 1 == e) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	396 // Empty last line means that we already have a star as a part of the
1d019706d866 LLVM10 anatofuz parents: diff changeset	397 // trailing /. We also need to preserve whitespace, so that / is
1d019706d866 LLVM10 anatofuz parents: diff changeset	398 // correctly indented.
1d019706d866 LLVM10 anatofuz parents: diff changeset	399 LastLineNeedsDecoration = false;
1d019706d866 LLVM10 anatofuz parents: diff changeset	400 // Align the star in the last '*/' with the stars on the previous lines.
1d019706d866 LLVM10 anatofuz parents: diff changeset	401 if (e >= 2 && !Decoration.empty()) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	402 ContentColumn[i] = DecorationColumn;
1d019706d866 LLVM10 anatofuz parents: diff changeset	403 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	404 } else if (Decoration.empty()) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	405 // For all other lines, set the start column to 0 if they're empty, so
1d019706d866 LLVM10 anatofuz parents: diff changeset	406 // we do not insert trailing whitespace anywhere.
1d019706d866 LLVM10 anatofuz parents: diff changeset	407 ContentColumn[i] = 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	408 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	409 continue;
1d019706d866 LLVM10 anatofuz parents: diff changeset	410 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	411
1d019706d866 LLVM10 anatofuz parents: diff changeset	412 // The first line already excludes the star.
1d019706d866 LLVM10 anatofuz parents: diff changeset	413 // The last line excludes the star if LastLineNeedsDecoration is false.
1d019706d866 LLVM10 anatofuz parents: diff changeset	414 // For all other lines, adjust the line to exclude the star and
1d019706d866 LLVM10 anatofuz parents: diff changeset	415 // (optionally) the first whitespace.
1d019706d866 LLVM10 anatofuz parents: diff changeset	416 unsigned DecorationSize = Decoration.startswith(Content[i])
1d019706d866 LLVM10 anatofuz parents: diff changeset	417 ? Content[i].size()
1d019706d866 LLVM10 anatofuz parents: diff changeset	418 : Decoration.size();
1d019706d866 LLVM10 anatofuz parents: diff changeset	419 if (DecorationSize) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	420 ContentColumn[i] = DecorationColumn + DecorationSize;
1d019706d866 LLVM10 anatofuz parents: diff changeset	421 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	422 Content[i] = Content[i].substr(DecorationSize);
1d019706d866 LLVM10 anatofuz parents: diff changeset	423 if (!Decoration.startswith(Content[i]))
1d019706d866 LLVM10 anatofuz parents: diff changeset	424 IndentAtLineBreak =
1d019706d866 LLVM10 anatofuz parents: diff changeset	425 std::min<int>(IndentAtLineBreak, std::max(0, ContentColumn[i]));
1d019706d866 LLVM10 anatofuz parents: diff changeset	426 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	427 IndentAtLineBreak = std::max<unsigned>(IndentAtLineBreak, Decoration.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	428
1d019706d866 LLVM10 anatofuz parents: diff changeset	429 // Detect a multiline jsdoc comment and set DelimitersOnNewline in that case.
1d019706d866 LLVM10 anatofuz parents: diff changeset	430 if (Style.Language == FormatStyle::LK_JavaScript \|\|
1d019706d866 LLVM10 anatofuz parents: diff changeset	431 Style.Language == FormatStyle::LK_Java) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	432 if ((Lines[0] == "" \|\| Lines[0].startswith(" ")) && Lines.size() > 1) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	433 // This is a multiline jsdoc comment.
1d019706d866 LLVM10 anatofuz parents: diff changeset	434 DelimitersOnNewline = true;
1d019706d866 LLVM10 anatofuz parents: diff changeset	435 } else if (Lines[0].startswith("* ") && Lines.size() == 1) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	436 // Detect a long single-line comment, like:
1d019706d866 LLVM10 anatofuz parents: diff changeset	437 // /** long long long */
1d019706d866 LLVM10 anatofuz parents: diff changeset	438 // Below, '2' is the width of '*/'.
1d019706d866 LLVM10 anatofuz parents: diff changeset	439 unsigned EndColumn =
1d019706d866 LLVM10 anatofuz parents: diff changeset	440 ContentColumn[0] +
1d019706d866 LLVM10 anatofuz parents: diff changeset	441 encoding::columnWidthWithTabs(Lines[0], ContentColumn[0],
1d019706d866 LLVM10 anatofuz parents: diff changeset	442 Style.TabWidth, Encoding) +
1d019706d866 LLVM10 anatofuz parents: diff changeset	443 2;
1d019706d866 LLVM10 anatofuz parents: diff changeset	444 DelimitersOnNewline = EndColumn > Style.ColumnLimit;
1d019706d866 LLVM10 anatofuz parents: diff changeset	445 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	446 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	447
1d019706d866 LLVM10 anatofuz parents: diff changeset	448 LLVM_DEBUG({
1d019706d866 LLVM10 anatofuz parents: diff changeset	449 llvm::dbgs() << "IndentAtLineBreak " << IndentAtLineBreak << "\n";
1d019706d866 LLVM10 anatofuz parents: diff changeset	450 llvm::dbgs() << "DelimitersOnNewline " << DelimitersOnNewline << "\n";
1d019706d866 LLVM10 anatofuz parents: diff changeset	451 for (size_t i = 0; i < Lines.size(); ++i) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	452 llvm::dbgs() << i << " \|" << Content[i] << "\| "
1d019706d866 LLVM10 anatofuz parents: diff changeset	453 << "CC=" << ContentColumn[i] << "\| "
1d019706d866 LLVM10 anatofuz parents: diff changeset	454 << "IN=" << (Content[i].data() - Lines[i].data()) << "\n";
1d019706d866 LLVM10 anatofuz parents: diff changeset	455 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	456 });
1d019706d866 LLVM10 anatofuz parents: diff changeset	457 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	458
1d019706d866 LLVM10 anatofuz parents: diff changeset	459 BreakableToken::Split BreakableBlockComment::getSplit(
1d019706d866 LLVM10 anatofuz parents: diff changeset	460 unsigned LineIndex, unsigned TailOffset, unsigned ColumnLimit,
1d019706d866 LLVM10 anatofuz parents: diff changeset	461 unsigned ContentStartColumn, const llvm::Regex &CommentPragmasRegex) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	462 // Don't break lines matching the comment pragmas regex.
1d019706d866 LLVM10 anatofuz parents: diff changeset	463 if (CommentPragmasRegex.match(Content[LineIndex]))
1d019706d866 LLVM10 anatofuz parents: diff changeset	464 return Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	465 return getCommentSplit(Content[LineIndex].substr(TailOffset),
1d019706d866 LLVM10 anatofuz parents: diff changeset	466 ContentStartColumn, ColumnLimit, Style.TabWidth,
1d019706d866 LLVM10 anatofuz parents: diff changeset	467 Encoding, Style, Decoration.endswith("*"));
1d019706d866 LLVM10 anatofuz parents: diff changeset	468 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	469
1d019706d866 LLVM10 anatofuz parents: diff changeset	470 void BreakableBlockComment::adjustWhitespace(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	471 int IndentDelta) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	472 // When in a preprocessor directive, the trailing backslash in a block comment
1d019706d866 LLVM10 anatofuz parents: diff changeset	473 // is not needed, but can serve a purpose of uniformity with necessary escaped
1d019706d866 LLVM10 anatofuz parents: diff changeset	474 // newlines outside the comment. In this case we remove it here before
1d019706d866 LLVM10 anatofuz parents: diff changeset	475 // trimming the trailing whitespace. The backslash will be re-added later when
1d019706d866 LLVM10 anatofuz parents: diff changeset	476 // inserting a line break.
1d019706d866 LLVM10 anatofuz parents: diff changeset	477 size_t EndOfPreviousLine = Lines[LineIndex - 1].size();
1d019706d866 LLVM10 anatofuz parents: diff changeset	478 if (InPPDirective && Lines[LineIndex - 1].endswith("\\"))
1d019706d866 LLVM10 anatofuz parents: diff changeset	479 --EndOfPreviousLine;
1d019706d866 LLVM10 anatofuz parents: diff changeset	480
1d019706d866 LLVM10 anatofuz parents: diff changeset	481 // Calculate the end of the non-whitespace text in the previous line.
1d019706d866 LLVM10 anatofuz parents: diff changeset	482 EndOfPreviousLine =
1d019706d866 LLVM10 anatofuz parents: diff changeset	483 Lines[LineIndex - 1].find_last_not_of(Blanks, EndOfPreviousLine);
1d019706d866 LLVM10 anatofuz parents: diff changeset	484 if (EndOfPreviousLine == StringRef::npos)
1d019706d866 LLVM10 anatofuz parents: diff changeset	485 EndOfPreviousLine = 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	486 else
1d019706d866 LLVM10 anatofuz parents: diff changeset	487 ++EndOfPreviousLine;
1d019706d866 LLVM10 anatofuz parents: diff changeset	488 // Calculate the start of the non-whitespace text in the current line.
1d019706d866 LLVM10 anatofuz parents: diff changeset	489 size_t StartOfLine = Lines[LineIndex].find_first_not_of(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	490 if (StartOfLine == StringRef::npos)
1d019706d866 LLVM10 anatofuz parents: diff changeset	491 StartOfLine = Lines[LineIndex].size();
1d019706d866 LLVM10 anatofuz parents: diff changeset	492
1d019706d866 LLVM10 anatofuz parents: diff changeset	493 StringRef Whitespace = Lines[LineIndex].substr(0, StartOfLine);
1d019706d866 LLVM10 anatofuz parents: diff changeset	494 // Adjust Lines to only contain relevant text.
1d019706d866 LLVM10 anatofuz parents: diff changeset	495 size_t PreviousContentOffset =
1d019706d866 LLVM10 anatofuz parents: diff changeset	496 Content[LineIndex - 1].data() - Lines[LineIndex - 1].data();
1d019706d866 LLVM10 anatofuz parents: diff changeset	497 Content[LineIndex - 1] = Lines[LineIndex - 1].substr(
1d019706d866 LLVM10 anatofuz parents: diff changeset	498 PreviousContentOffset, EndOfPreviousLine - PreviousContentOffset);
1d019706d866 LLVM10 anatofuz parents: diff changeset	499 Content[LineIndex] = Lines[LineIndex].substr(StartOfLine);
1d019706d866 LLVM10 anatofuz parents: diff changeset	500
1d019706d866 LLVM10 anatofuz parents: diff changeset	501 // Adjust the start column uniformly across all lines.
1d019706d866 LLVM10 anatofuz parents: diff changeset	502 ContentColumn[LineIndex] =
1d019706d866 LLVM10 anatofuz parents: diff changeset	503 encoding::columnWidthWithTabs(Whitespace, 0, Style.TabWidth, Encoding) +
1d019706d866 LLVM10 anatofuz parents: diff changeset	504 IndentDelta;
1d019706d866 LLVM10 anatofuz parents: diff changeset	505 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	506
1d019706d866 LLVM10 anatofuz parents: diff changeset	507 unsigned BreakableBlockComment::getRangeLength(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	508 unsigned Offset,
1d019706d866 LLVM10 anatofuz parents: diff changeset	509 StringRef::size_type Length,
1d019706d866 LLVM10 anatofuz parents: diff changeset	510 unsigned StartColumn) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	511 unsigned LineLength =
1d019706d866 LLVM10 anatofuz parents: diff changeset	512 encoding::columnWidthWithTabs(Content[LineIndex].substr(Offset, Length),
1d019706d866 LLVM10 anatofuz parents: diff changeset	513 StartColumn, Style.TabWidth, Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	514 // FIXME: This should go into getRemainingLength instead, but we currently
1d019706d866 LLVM10 anatofuz parents: diff changeset	515 // break tests when putting it there. Investigate how to fix those tests.
1d019706d866 LLVM10 anatofuz parents: diff changeset	516 // The last line gets a "*/" postfix.
1d019706d866 LLVM10 anatofuz parents: diff changeset	517 if (LineIndex + 1 == Lines.size()) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	518 LineLength += 2;
1d019706d866 LLVM10 anatofuz parents: diff changeset	519 // We never need a decoration when breaking just the trailing "*/" postfix.
1d019706d866 LLVM10 anatofuz parents: diff changeset	520 // Note that checking that Length == 0 is not enough, since Length could
1d019706d866 LLVM10 anatofuz parents: diff changeset	521 // also be StringRef::npos.
1d019706d866 LLVM10 anatofuz parents: diff changeset	522 if (Content[LineIndex].substr(Offset, StringRef::npos).empty()) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	523 LineLength -= Decoration.size();
1d019706d866 LLVM10 anatofuz parents: diff changeset	524 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	525 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	526 return LineLength;
1d019706d866 LLVM10 anatofuz parents: diff changeset	527 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	528
1d019706d866 LLVM10 anatofuz parents: diff changeset	529 unsigned BreakableBlockComment::getRemainingLength(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	530 unsigned Offset,
1d019706d866 LLVM10 anatofuz parents: diff changeset	531 unsigned StartColumn) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	532 return UnbreakableTailLength +
1d019706d866 LLVM10 anatofuz parents: diff changeset	533 getRangeLength(LineIndex, Offset, StringRef::npos, StartColumn);
1d019706d866 LLVM10 anatofuz parents: diff changeset	534 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	535
1d019706d866 LLVM10 anatofuz parents: diff changeset	536 unsigned BreakableBlockComment::getContentStartColumn(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	537 bool Break) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	538 if (Break)
1d019706d866 LLVM10 anatofuz parents: diff changeset	539 return IndentAtLineBreak;
1d019706d866 LLVM10 anatofuz parents: diff changeset	540 return std::max(0, ContentColumn[LineIndex]);
1d019706d866 LLVM10 anatofuz parents: diff changeset	541 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	542
1d019706d866 LLVM10 anatofuz parents: diff changeset	543 const llvm::StringSet<>
1d019706d866 LLVM10 anatofuz parents: diff changeset	544 BreakableBlockComment::ContentIndentingJavadocAnnotations = {
1d019706d866 LLVM10 anatofuz parents: diff changeset	545 "@param", "@return", "@returns", "@throws", "@type", "@template",
1d019706d866 LLVM10 anatofuz parents: diff changeset	546 "@see", "@deprecated", "@define", "@exports", "@mods", "@private",
1d019706d866 LLVM10 anatofuz parents: diff changeset	547 };
1d019706d866 LLVM10 anatofuz parents: diff changeset	548
1d019706d866 LLVM10 anatofuz parents: diff changeset	549 unsigned BreakableBlockComment::getContentIndent(unsigned LineIndex) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	550 if (Style.Language != FormatStyle::LK_Java &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	551 Style.Language != FormatStyle::LK_JavaScript)
1d019706d866 LLVM10 anatofuz parents: diff changeset	552 return 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	553 // The content at LineIndex 0 of a comment like:
1d019706d866 LLVM10 anatofuz parents: diff changeset	554 // /** line 0 */
1d019706d866 LLVM10 anatofuz parents: diff changeset	555 // is "* line 0", so we need to skip over the decoration in that case.
1d019706d866 LLVM10 anatofuz parents: diff changeset	556 StringRef ContentWithNoDecoration = Content[LineIndex];
1d019706d866 LLVM10 anatofuz parents: diff changeset	557 if (LineIndex == 0 && ContentWithNoDecoration.startswith("*")) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	558 ContentWithNoDecoration = ContentWithNoDecoration.substr(1).ltrim(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	559 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	560 StringRef FirstWord = ContentWithNoDecoration.substr(
1d019706d866 LLVM10 anatofuz parents: diff changeset	561 0, ContentWithNoDecoration.find_first_of(Blanks));
1d019706d866 LLVM10 anatofuz parents: diff changeset	562 if (ContentIndentingJavadocAnnotations.find(FirstWord) !=
1d019706d866 LLVM10 anatofuz parents: diff changeset	563 ContentIndentingJavadocAnnotations.end())
1d019706d866 LLVM10 anatofuz parents: diff changeset	564 return Style.ContinuationIndentWidth;
1d019706d866 LLVM10 anatofuz parents: diff changeset	565 return 0;
1d019706d866 LLVM10 anatofuz parents: diff changeset	566 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	567
1d019706d866 LLVM10 anatofuz parents: diff changeset	568 void BreakableBlockComment::insertBreak(unsigned LineIndex, unsigned TailOffset,
1d019706d866 LLVM10 anatofuz parents: diff changeset	569 Split Split, unsigned ContentIndent,
1d019706d866 LLVM10 anatofuz parents: diff changeset	570 WhitespaceManager &Whitespaces) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	571 StringRef Text = Content[LineIndex].substr(TailOffset);
1d019706d866 LLVM10 anatofuz parents: diff changeset	572 StringRef Prefix = Decoration;
1d019706d866 LLVM10 anatofuz parents: diff changeset	573 // We need this to account for the case when we have a decoration "* " for all
1d019706d866 LLVM10 anatofuz parents: diff changeset	574 // the lines except for the last one, where the star in "*/" acts as a
1d019706d866 LLVM10 anatofuz parents: diff changeset	575 // decoration.
1d019706d866 LLVM10 anatofuz parents: diff changeset	576 unsigned LocalIndentAtLineBreak = IndentAtLineBreak;
1d019706d866 LLVM10 anatofuz parents: diff changeset	577 if (LineIndex + 1 == Lines.size() &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	578 Text.size() == Split.first + Split.second) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	579 // For the last line we need to break before "/", but not to add " ".
1d019706d866 LLVM10 anatofuz parents: diff changeset	580 Prefix = "";
1d019706d866 LLVM10 anatofuz parents: diff changeset	581 if (LocalIndentAtLineBreak >= 2)
1d019706d866 LLVM10 anatofuz parents: diff changeset	582 LocalIndentAtLineBreak -= 2;
1d019706d866 LLVM10 anatofuz parents: diff changeset	583 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	584 // The split offset is from the beginning of the line. Convert it to an offset
1d019706d866 LLVM10 anatofuz parents: diff changeset	585 // from the beginning of the token text.
1d019706d866 LLVM10 anatofuz parents: diff changeset	586 unsigned BreakOffsetInToken =
1d019706d866 LLVM10 anatofuz parents: diff changeset	587 Text.data() - tokenAt(LineIndex).TokenText.data() + Split.first;
1d019706d866 LLVM10 anatofuz parents: diff changeset	588 unsigned CharsToRemove = Split.second;
1d019706d866 LLVM10 anatofuz parents: diff changeset	589 assert(LocalIndentAtLineBreak >= Prefix.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	590 std::string PrefixWithTrailingIndent = std::string(Prefix);
1d019706d866 LLVM10 anatofuz parents: diff changeset	591 for (unsigned I = 0; I < ContentIndent; ++I)
1d019706d866 LLVM10 anatofuz parents: diff changeset	592 PrefixWithTrailingIndent += " ";
1d019706d866 LLVM10 anatofuz parents: diff changeset	593 Whitespaces.replaceWhitespaceInToken(
1d019706d866 LLVM10 anatofuz parents: diff changeset	594 tokenAt(LineIndex), BreakOffsetInToken, CharsToRemove, "",
1d019706d866 LLVM10 anatofuz parents: diff changeset	595 PrefixWithTrailingIndent, InPPDirective, /Newlines=/1,
1d019706d866 LLVM10 anatofuz parents: diff changeset	596 /Spaces=/LocalIndentAtLineBreak + ContentIndent -
1d019706d866 LLVM10 anatofuz parents: diff changeset	597 PrefixWithTrailingIndent.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	598 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	599
1d019706d866 LLVM10 anatofuz parents: diff changeset	600 BreakableToken::Split BreakableBlockComment::getReflowSplit(
1d019706d866 LLVM10 anatofuz parents: diff changeset	601 unsigned LineIndex, const llvm::Regex &CommentPragmasRegex) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	602 if (!mayReflow(LineIndex, CommentPragmasRegex))
1d019706d866 LLVM10 anatofuz parents: diff changeset	603 return Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	604
1d019706d866 LLVM10 anatofuz parents: diff changeset	605 // If we're reflowing into a line with content indent, only reflow the next
1d019706d866 LLVM10 anatofuz parents: diff changeset	606 // line if its starting whitespace matches the content indent.
1d019706d866 LLVM10 anatofuz parents: diff changeset	607 size_t Trimmed = Content[LineIndex].find_first_not_of(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	608 if (LineIndex) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	609 unsigned PreviousContentIndent = getContentIndent(LineIndex - 1);
1d019706d866 LLVM10 anatofuz parents: diff changeset	610 if (PreviousContentIndent && Trimmed != StringRef::npos &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	611 Trimmed != PreviousContentIndent)
1d019706d866 LLVM10 anatofuz parents: diff changeset	612 return Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	613 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	614
1d019706d866 LLVM10 anatofuz parents: diff changeset	615 return Split(0, Trimmed != StringRef::npos ? Trimmed : 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	616 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	617
1d019706d866 LLVM10 anatofuz parents: diff changeset	618 bool BreakableBlockComment::introducesBreakBeforeToken() const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	619 // A break is introduced when we want delimiters on newline.
1d019706d866 LLVM10 anatofuz parents: diff changeset	620 return DelimitersOnNewline &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	621 Lines[0].substr(1).find_first_not_of(Blanks) != StringRef::npos;
1d019706d866 LLVM10 anatofuz parents: diff changeset	622 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	623
1d019706d866 LLVM10 anatofuz parents: diff changeset	624 void BreakableBlockComment::reflow(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	625 WhitespaceManager &Whitespaces) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	626 StringRef TrimmedContent = Content[LineIndex].ltrim(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	627 // Here we need to reflow.
1d019706d866 LLVM10 anatofuz parents: diff changeset	628 assert(Tokens[LineIndex - 1] == Tokens[LineIndex] &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	629 "Reflowing whitespace within a token");
1d019706d866 LLVM10 anatofuz parents: diff changeset	630 // This is the offset of the end of the last line relative to the start of
1d019706d866 LLVM10 anatofuz parents: diff changeset	631 // the token text in the token.
1d019706d866 LLVM10 anatofuz parents: diff changeset	632 unsigned WhitespaceOffsetInToken = Content[LineIndex - 1].data() +
1d019706d866 LLVM10 anatofuz parents: diff changeset	633 Content[LineIndex - 1].size() -
1d019706d866 LLVM10 anatofuz parents: diff changeset	634 tokenAt(LineIndex).TokenText.data();
1d019706d866 LLVM10 anatofuz parents: diff changeset	635 unsigned WhitespaceLength = TrimmedContent.data() -
1d019706d866 LLVM10 anatofuz parents: diff changeset	636 tokenAt(LineIndex).TokenText.data() -
1d019706d866 LLVM10 anatofuz parents: diff changeset	637 WhitespaceOffsetInToken;
1d019706d866 LLVM10 anatofuz parents: diff changeset	638 Whitespaces.replaceWhitespaceInToken(
1d019706d866 LLVM10 anatofuz parents: diff changeset	639 tokenAt(LineIndex), WhitespaceOffsetInToken,
1d019706d866 LLVM10 anatofuz parents: diff changeset	640 /ReplaceChars=/WhitespaceLength, /PreviousPostfix=/"",
1d019706d866 LLVM10 anatofuz parents: diff changeset	641 /CurrentPrefix=/ReflowPrefix, InPPDirective, /Newlines=/0,
1d019706d866 LLVM10 anatofuz parents: diff changeset	642 /Spaces=/0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	643 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	644
1d019706d866 LLVM10 anatofuz parents: diff changeset	645 void BreakableBlockComment::adaptStartOfLine(
1d019706d866 LLVM10 anatofuz parents: diff changeset	646 unsigned LineIndex, WhitespaceManager &Whitespaces) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	647 if (LineIndex == 0) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	648 if (DelimitersOnNewline) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	649 // Since we're breaking at index 1 below, the break position and the
1d019706d866 LLVM10 anatofuz parents: diff changeset	650 // break length are the same.
1d019706d866 LLVM10 anatofuz parents: diff changeset	651 // Note: this works because getCommentSplit is careful never to split at
1d019706d866 LLVM10 anatofuz parents: diff changeset	652 // the beginning of a line.
1d019706d866 LLVM10 anatofuz parents: diff changeset	653 size_t BreakLength = Lines[0].substr(1).find_first_not_of(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	654 if (BreakLength != StringRef::npos)
1d019706d866 LLVM10 anatofuz parents: diff changeset	655 insertBreak(LineIndex, 0, Split(1, BreakLength), /ContentIndent=/0,
1d019706d866 LLVM10 anatofuz parents: diff changeset	656 Whitespaces);
1d019706d866 LLVM10 anatofuz parents: diff changeset	657 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	658 return;
1d019706d866 LLVM10 anatofuz parents: diff changeset	659 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	660 // Here no reflow with the previous line will happen.
1d019706d866 LLVM10 anatofuz parents: diff changeset	661 // Fix the decoration of the line at LineIndex.
1d019706d866 LLVM10 anatofuz parents: diff changeset	662 StringRef Prefix = Decoration;
1d019706d866 LLVM10 anatofuz parents: diff changeset	663 if (Content[LineIndex].empty()) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	664 if (LineIndex + 1 == Lines.size()) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	665 if (!LastLineNeedsDecoration) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	666 // If the last line was empty, we don't need a prefix, as the */ will
1d019706d866 LLVM10 anatofuz parents: diff changeset	667 // line up with the decoration (if it exists).
1d019706d866 LLVM10 anatofuz parents: diff changeset	668 Prefix = "";
1d019706d866 LLVM10 anatofuz parents: diff changeset	669 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	670 } else if (!Decoration.empty()) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	671 // For other empty lines, if we do have a decoration, adapt it to not
1d019706d866 LLVM10 anatofuz parents: diff changeset	672 // contain a trailing whitespace.
1d019706d866 LLVM10 anatofuz parents: diff changeset	673 Prefix = Prefix.substr(0, 1);
1d019706d866 LLVM10 anatofuz parents: diff changeset	674 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	675 } else {
1d019706d866 LLVM10 anatofuz parents: diff changeset	676 if (ContentColumn[LineIndex] == 1) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	677 // This line starts immediately after the decorating *.
1d019706d866 LLVM10 anatofuz parents: diff changeset	678 Prefix = Prefix.substr(0, 1);
1d019706d866 LLVM10 anatofuz parents: diff changeset	679 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	680 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	681 // This is the offset of the end of the last line relative to the start of the
1d019706d866 LLVM10 anatofuz parents: diff changeset	682 // token text in the token.
1d019706d866 LLVM10 anatofuz parents: diff changeset	683 unsigned WhitespaceOffsetInToken = Content[LineIndex - 1].data() +
1d019706d866 LLVM10 anatofuz parents: diff changeset	684 Content[LineIndex - 1].size() -
1d019706d866 LLVM10 anatofuz parents: diff changeset	685 tokenAt(LineIndex).TokenText.data();
1d019706d866 LLVM10 anatofuz parents: diff changeset	686 unsigned WhitespaceLength = Content[LineIndex].data() -
1d019706d866 LLVM10 anatofuz parents: diff changeset	687 tokenAt(LineIndex).TokenText.data() -
1d019706d866 LLVM10 anatofuz parents: diff changeset	688 WhitespaceOffsetInToken;
1d019706d866 LLVM10 anatofuz parents: diff changeset	689 Whitespaces.replaceWhitespaceInToken(
1d019706d866 LLVM10 anatofuz parents: diff changeset	690 tokenAt(LineIndex), WhitespaceOffsetInToken, WhitespaceLength, "", Prefix,
1d019706d866 LLVM10 anatofuz parents: diff changeset	691 InPPDirective, /Newlines=/1, ContentColumn[LineIndex] - Prefix.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	692 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	693
1d019706d866 LLVM10 anatofuz parents: diff changeset	694 BreakableToken::Split
1d019706d866 LLVM10 anatofuz parents: diff changeset	695 BreakableBlockComment::getSplitAfterLastLine(unsigned TailOffset) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	696 if (DelimitersOnNewline) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	697 // Replace the trailing whitespace of the last line with a newline.
1d019706d866 LLVM10 anatofuz parents: diff changeset	698 // In case the last line is empty, the ending '*/' is already on its own
1d019706d866 LLVM10 anatofuz parents: diff changeset	699 // line.
1d019706d866 LLVM10 anatofuz parents: diff changeset	700 StringRef Line = Content.back().substr(TailOffset);
1d019706d866 LLVM10 anatofuz parents: diff changeset	701 StringRef TrimmedLine = Line.rtrim(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	702 if (!TrimmedLine.empty())
1d019706d866 LLVM10 anatofuz parents: diff changeset	703 return Split(TrimmedLine.size(), Line.size() - TrimmedLine.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	704 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	705 return Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	706 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	707
1d019706d866 LLVM10 anatofuz parents: diff changeset	708 bool BreakableBlockComment::mayReflow(
1d019706d866 LLVM10 anatofuz parents: diff changeset	709 unsigned LineIndex, const llvm::Regex &CommentPragmasRegex) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	710 // Content[LineIndex] may exclude the indent after the '*' decoration. In that
1d019706d866 LLVM10 anatofuz parents: diff changeset	711 // case, we compute the start of the comment pragma manually.
1d019706d866 LLVM10 anatofuz parents: diff changeset	712 StringRef IndentContent = Content[LineIndex];
1d019706d866 LLVM10 anatofuz parents: diff changeset	713 if (Lines[LineIndex].ltrim(Blanks).startswith("*")) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	714 IndentContent = Lines[LineIndex].ltrim(Blanks).substr(1);
1d019706d866 LLVM10 anatofuz parents: diff changeset	715 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	716 return LineIndex > 0 && !CommentPragmasRegex.match(IndentContent) &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	717 mayReflowContent(Content[LineIndex]) && !Tok.Finalized &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	718 !switchesFormatting(tokenAt(LineIndex));
1d019706d866 LLVM10 anatofuz parents: diff changeset	719 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	720
1d019706d866 LLVM10 anatofuz parents: diff changeset	721 BreakableLineCommentSection::BreakableLineCommentSection(
1d019706d866 LLVM10 anatofuz parents: diff changeset	722 const FormatToken &Token, unsigned StartColumn,
1d019706d866 LLVM10 anatofuz parents: diff changeset	723 unsigned OriginalStartColumn, bool FirstInLine, bool InPPDirective,
1d019706d866 LLVM10 anatofuz parents: diff changeset	724 encoding::Encoding Encoding, const FormatStyle &Style)
1d019706d866 LLVM10 anatofuz parents: diff changeset	725 : BreakableComment(Token, StartColumn, InPPDirective, Encoding, Style) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	726 assert(Tok.is(TT_LineComment) &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	727 "line comment section must start with a line comment");
1d019706d866 LLVM10 anatofuz parents: diff changeset	728 FormatToken *LineTok = nullptr;
1d019706d866 LLVM10 anatofuz parents: diff changeset	729 for (const FormatToken *CurrentTok = &Tok;
1d019706d866 LLVM10 anatofuz parents: diff changeset	730 CurrentTok && CurrentTok->is(TT_LineComment);
1d019706d866 LLVM10 anatofuz parents: diff changeset	731 CurrentTok = CurrentTok->Next) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	732 LastLineTok = LineTok;
1d019706d866 LLVM10 anatofuz parents: diff changeset	733 StringRef TokenText(CurrentTok->TokenText);
1d019706d866 LLVM10 anatofuz parents: diff changeset	734 assert((TokenText.startswith("//") \|\| TokenText.startswith("#")) &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	735 "unsupported line comment prefix, '//' and '#' are supported");
1d019706d866 LLVM10 anatofuz parents: diff changeset	736 size_t FirstLineIndex = Lines.size();
1d019706d866 LLVM10 anatofuz parents: diff changeset	737 TokenText.split(Lines, "\n");
1d019706d866 LLVM10 anatofuz parents: diff changeset	738 Content.resize(Lines.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	739 ContentColumn.resize(Lines.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	740 OriginalContentColumn.resize(Lines.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	741 Tokens.resize(Lines.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	742 Prefix.resize(Lines.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	743 OriginalPrefix.resize(Lines.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	744 for (size_t i = FirstLineIndex, e = Lines.size(); i < e; ++i) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	745 Lines[i] = Lines[i].ltrim(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	746 // We need to trim the blanks in case this is not the first line in a
1d019706d866 LLVM10 anatofuz parents: diff changeset	747 // multiline comment. Then the indent is included in Lines[i].
1d019706d866 LLVM10 anatofuz parents: diff changeset	748 StringRef IndentPrefix =
1d019706d866 LLVM10 anatofuz parents: diff changeset	749 getLineCommentIndentPrefix(Lines[i].ltrim(Blanks), Style);
1d019706d866 LLVM10 anatofuz parents: diff changeset	750 assert((TokenText.startswith("//") \|\| TokenText.startswith("#")) &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	751 "unsupported line comment prefix, '//' and '#' are supported");
1d019706d866 LLVM10 anatofuz parents: diff changeset	752 OriginalPrefix[i] = Prefix[i] = IndentPrefix;
1d019706d866 LLVM10 anatofuz parents: diff changeset	753 if (Lines[i].size() > Prefix[i].size() &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	754 isAlphanumeric(Lines[i][Prefix[i].size()])) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	755 if (Prefix[i] == "//")
1d019706d866 LLVM10 anatofuz parents: diff changeset	756 Prefix[i] = "// ";
1d019706d866 LLVM10 anatofuz parents: diff changeset	757 else if (Prefix[i] == "///")
1d019706d866 LLVM10 anatofuz parents: diff changeset	758 Prefix[i] = "/// ";
1d019706d866 LLVM10 anatofuz parents: diff changeset	759 else if (Prefix[i] == "//!")
1d019706d866 LLVM10 anatofuz parents: diff changeset	760 Prefix[i] = "//! ";
1d019706d866 LLVM10 anatofuz parents: diff changeset	761 else if (Prefix[i] == "///<")
1d019706d866 LLVM10 anatofuz parents: diff changeset	762 Prefix[i] = "///< ";
1d019706d866 LLVM10 anatofuz parents: diff changeset	763 else if (Prefix[i] == "//!<")
1d019706d866 LLVM10 anatofuz parents: diff changeset	764 Prefix[i] = "//!< ";
1d019706d866 LLVM10 anatofuz parents: diff changeset	765 else if (Prefix[i] == "#" &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	766 Style.Language == FormatStyle::LK_TextProto)
1d019706d866 LLVM10 anatofuz parents: diff changeset	767 Prefix[i] = "# ";
1d019706d866 LLVM10 anatofuz parents: diff changeset	768 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	769
1d019706d866 LLVM10 anatofuz parents: diff changeset	770 Tokens[i] = LineTok;
1d019706d866 LLVM10 anatofuz parents: diff changeset	771 Content[i] = Lines[i].substr(IndentPrefix.size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	772 OriginalContentColumn[i] =
1d019706d866 LLVM10 anatofuz parents: diff changeset	773 StartColumn + encoding::columnWidthWithTabs(OriginalPrefix[i],
1d019706d866 LLVM10 anatofuz parents: diff changeset	774 StartColumn,
1d019706d866 LLVM10 anatofuz parents: diff changeset	775 Style.TabWidth, Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	776 ContentColumn[i] =
1d019706d866 LLVM10 anatofuz parents: diff changeset	777 StartColumn + encoding::columnWidthWithTabs(Prefix[i], StartColumn,
1d019706d866 LLVM10 anatofuz parents: diff changeset	778 Style.TabWidth, Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	779
1d019706d866 LLVM10 anatofuz parents: diff changeset	780 // Calculate the end of the non-whitespace text in this line.
1d019706d866 LLVM10 anatofuz parents: diff changeset	781 size_t EndOfLine = Content[i].find_last_not_of(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	782 if (EndOfLine == StringRef::npos)
1d019706d866 LLVM10 anatofuz parents: diff changeset	783 EndOfLine = Content[i].size();
1d019706d866 LLVM10 anatofuz parents: diff changeset	784 else
1d019706d866 LLVM10 anatofuz parents: diff changeset	785 ++EndOfLine;
1d019706d866 LLVM10 anatofuz parents: diff changeset	786 Content[i] = Content[i].substr(0, EndOfLine);
1d019706d866 LLVM10 anatofuz parents: diff changeset	787 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	788 LineTok = CurrentTok->Next;
1d019706d866 LLVM10 anatofuz parents: diff changeset	789 if (CurrentTok->Next && !CurrentTok->Next->ContinuesLineCommentSection) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	790 // A line comment section needs to broken by a line comment that is
1d019706d866 LLVM10 anatofuz parents: diff changeset	791 // preceded by at least two newlines. Note that we put this break here
1d019706d866 LLVM10 anatofuz parents: diff changeset	792 // instead of breaking at a previous stage during parsing, since that
1d019706d866 LLVM10 anatofuz parents: diff changeset	793 // would split the contents of the enum into two unwrapped lines in this
1d019706d866 LLVM10 anatofuz parents: diff changeset	794 // example, which is undesirable:
1d019706d866 LLVM10 anatofuz parents: diff changeset	795 // enum A {
1d019706d866 LLVM10 anatofuz parents: diff changeset	796 // a, // comment about a
1d019706d866 LLVM10 anatofuz parents: diff changeset	797 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	798 // // comment about b
1d019706d866 LLVM10 anatofuz parents: diff changeset	799 // b
1d019706d866 LLVM10 anatofuz parents: diff changeset	800 // };
1d019706d866 LLVM10 anatofuz parents: diff changeset	801 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	802 // FIXME: Consider putting separate line comment sections as children to
1d019706d866 LLVM10 anatofuz parents: diff changeset	803 // the unwrapped line instead.
1d019706d866 LLVM10 anatofuz parents: diff changeset	804 break;
1d019706d866 LLVM10 anatofuz parents: diff changeset	805 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	806 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	807 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	808
1d019706d866 LLVM10 anatofuz parents: diff changeset	809 unsigned
1d019706d866 LLVM10 anatofuz parents: diff changeset	810 BreakableLineCommentSection::getRangeLength(unsigned LineIndex, unsigned Offset,
1d019706d866 LLVM10 anatofuz parents: diff changeset	811 StringRef::size_type Length,
1d019706d866 LLVM10 anatofuz parents: diff changeset	812 unsigned StartColumn) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	813 return encoding::columnWidthWithTabs(
1d019706d866 LLVM10 anatofuz parents: diff changeset	814 Content[LineIndex].substr(Offset, Length), StartColumn, Style.TabWidth,
1d019706d866 LLVM10 anatofuz parents: diff changeset	815 Encoding);
1d019706d866 LLVM10 anatofuz parents: diff changeset	816 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	817
1d019706d866 LLVM10 anatofuz parents: diff changeset	818 unsigned BreakableLineCommentSection::getContentStartColumn(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	819 bool Break) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	820 if (Break)
1d019706d866 LLVM10 anatofuz parents: diff changeset	821 return OriginalContentColumn[LineIndex];
1d019706d866 LLVM10 anatofuz parents: diff changeset	822 return ContentColumn[LineIndex];
1d019706d866 LLVM10 anatofuz parents: diff changeset	823 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	824
1d019706d866 LLVM10 anatofuz parents: diff changeset	825 void BreakableLineCommentSection::insertBreak(
1d019706d866 LLVM10 anatofuz parents: diff changeset	826 unsigned LineIndex, unsigned TailOffset, Split Split,
1d019706d866 LLVM10 anatofuz parents: diff changeset	827 unsigned ContentIndent, WhitespaceManager &Whitespaces) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	828 StringRef Text = Content[LineIndex].substr(TailOffset);
1d019706d866 LLVM10 anatofuz parents: diff changeset	829 // Compute the offset of the split relative to the beginning of the token
1d019706d866 LLVM10 anatofuz parents: diff changeset	830 // text.
1d019706d866 LLVM10 anatofuz parents: diff changeset	831 unsigned BreakOffsetInToken =
1d019706d866 LLVM10 anatofuz parents: diff changeset	832 Text.data() - tokenAt(LineIndex).TokenText.data() + Split.first;
1d019706d866 LLVM10 anatofuz parents: diff changeset	833 unsigned CharsToRemove = Split.second;
1d019706d866 LLVM10 anatofuz parents: diff changeset	834 // Compute the size of the new indent, including the size of the new prefix of
1d019706d866 LLVM10 anatofuz parents: diff changeset	835 // the newly broken line.
1d019706d866 LLVM10 anatofuz parents: diff changeset	836 unsigned IndentAtLineBreak = OriginalContentColumn[LineIndex] +
1d019706d866 LLVM10 anatofuz parents: diff changeset	837 Prefix[LineIndex].size() -
1d019706d866 LLVM10 anatofuz parents: diff changeset	838 OriginalPrefix[LineIndex].size();
1d019706d866 LLVM10 anatofuz parents: diff changeset	839 assert(IndentAtLineBreak >= Prefix[LineIndex].size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	840 Whitespaces.replaceWhitespaceInToken(
1d019706d866 LLVM10 anatofuz parents: diff changeset	841 tokenAt(LineIndex), BreakOffsetInToken, CharsToRemove, "",
1d019706d866 LLVM10 anatofuz parents: diff changeset	842 Prefix[LineIndex], InPPDirective, /Newlines=/1,
1d019706d866 LLVM10 anatofuz parents: diff changeset	843 /Spaces=/IndentAtLineBreak - Prefix[LineIndex].size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	844 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	845
1d019706d866 LLVM10 anatofuz parents: diff changeset	846 BreakableComment::Split BreakableLineCommentSection::getReflowSplit(
1d019706d866 LLVM10 anatofuz parents: diff changeset	847 unsigned LineIndex, const llvm::Regex &CommentPragmasRegex) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	848 if (!mayReflow(LineIndex, CommentPragmasRegex))
1d019706d866 LLVM10 anatofuz parents: diff changeset	849 return Split(StringRef::npos, 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	850
1d019706d866 LLVM10 anatofuz parents: diff changeset	851 size_t Trimmed = Content[LineIndex].find_first_not_of(Blanks);
1d019706d866 LLVM10 anatofuz parents: diff changeset	852
1d019706d866 LLVM10 anatofuz parents: diff changeset	853 // In a line comment section each line is a separate token; thus, after a
1d019706d866 LLVM10 anatofuz parents: diff changeset	854 // split we replace all whitespace before the current line comment token
1d019706d866 LLVM10 anatofuz parents: diff changeset	855 // (which does not need to be included in the split), plus the start of the
1d019706d866 LLVM10 anatofuz parents: diff changeset	856 // line up to where the content starts.
1d019706d866 LLVM10 anatofuz parents: diff changeset	857 return Split(0, Trimmed != StringRef::npos ? Trimmed : 0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	858 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	859
1d019706d866 LLVM10 anatofuz parents: diff changeset	860 void BreakableLineCommentSection::reflow(unsigned LineIndex,
1d019706d866 LLVM10 anatofuz parents: diff changeset	861 WhitespaceManager &Whitespaces) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	862 if (LineIndex > 0 && Tokens[LineIndex] != Tokens[LineIndex - 1]) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	863 // Reflow happens between tokens. Replace the whitespace between the
1d019706d866 LLVM10 anatofuz parents: diff changeset	864 // tokens by the empty string.
1d019706d866 LLVM10 anatofuz parents: diff changeset	865 Whitespaces.replaceWhitespace(
1d019706d866 LLVM10 anatofuz parents: diff changeset	866 Tokens[LineIndex], /Newlines=/0, /Spaces=*/0,
1d019706d866 LLVM10 anatofuz parents: diff changeset	867 /StartOfTokenColumn=/StartColumn, /InPPDirective=/false);
1d019706d866 LLVM10 anatofuz parents: diff changeset	868 } else if (LineIndex > 0) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	869 // In case we're reflowing after the '\' in:
1d019706d866 LLVM10 anatofuz parents: diff changeset	870 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	871 // // line comment \
1d019706d866 LLVM10 anatofuz parents: diff changeset	872 // // line 2
1d019706d866 LLVM10 anatofuz parents: diff changeset	873 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	874 // the reflow happens inside the single comment token (it is a single line
1d019706d866 LLVM10 anatofuz parents: diff changeset	875 // comment with an unescaped newline).
1d019706d866 LLVM10 anatofuz parents: diff changeset	876 // Replace the whitespace between the '\' and '//' with the empty string.
1d019706d866 LLVM10 anatofuz parents: diff changeset	877 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	878 // Offset points to after the '\' relative to start of the token.
1d019706d866 LLVM10 anatofuz parents: diff changeset	879 unsigned Offset = Lines[LineIndex - 1].data() +
1d019706d866 LLVM10 anatofuz parents: diff changeset	880 Lines[LineIndex - 1].size() -
1d019706d866 LLVM10 anatofuz parents: diff changeset	881 tokenAt(LineIndex - 1).TokenText.data();
1d019706d866 LLVM10 anatofuz parents: diff changeset	882 // WhitespaceLength is the number of chars between the '\' and the '//' on
1d019706d866 LLVM10 anatofuz parents: diff changeset	883 // the next line.
1d019706d866 LLVM10 anatofuz parents: diff changeset	884 unsigned WhitespaceLength =
1d019706d866 LLVM10 anatofuz parents: diff changeset	885 Lines[LineIndex].data() - tokenAt(LineIndex).TokenText.data() - Offset;
1d019706d866 LLVM10 anatofuz parents: diff changeset	886 Whitespaces.replaceWhitespaceInToken(*Tokens[LineIndex], Offset,
1d019706d866 LLVM10 anatofuz parents: diff changeset	887 /ReplaceChars=/WhitespaceLength,
1d019706d866 LLVM10 anatofuz parents: diff changeset	888 /PreviousPostfix=/"",
1d019706d866 LLVM10 anatofuz parents: diff changeset	889 /CurrentPrefix=/"",
1d019706d866 LLVM10 anatofuz parents: diff changeset	890 /InPPDirective=/false,
1d019706d866 LLVM10 anatofuz parents: diff changeset	891 /Newlines=/0,
1d019706d866 LLVM10 anatofuz parents: diff changeset	892 /Spaces=/0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	893 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	894 // Replace the indent and prefix of the token with the reflow prefix.
1d019706d866 LLVM10 anatofuz parents: diff changeset	895 unsigned Offset =
1d019706d866 LLVM10 anatofuz parents: diff changeset	896 Lines[LineIndex].data() - tokenAt(LineIndex).TokenText.data();
1d019706d866 LLVM10 anatofuz parents: diff changeset	897 unsigned WhitespaceLength =
1d019706d866 LLVM10 anatofuz parents: diff changeset	898 Content[LineIndex].data() - Lines[LineIndex].data();
1d019706d866 LLVM10 anatofuz parents: diff changeset	899 Whitespaces.replaceWhitespaceInToken(*Tokens[LineIndex], Offset,
1d019706d866 LLVM10 anatofuz parents: diff changeset	900 /ReplaceChars=/WhitespaceLength,
1d019706d866 LLVM10 anatofuz parents: diff changeset	901 /PreviousPostfix=/"",
1d019706d866 LLVM10 anatofuz parents: diff changeset	902 /CurrentPrefix=/ReflowPrefix,
1d019706d866 LLVM10 anatofuz parents: diff changeset	903 /InPPDirective=/false,
1d019706d866 LLVM10 anatofuz parents: diff changeset	904 /Newlines=/0,
1d019706d866 LLVM10 anatofuz parents: diff changeset	905 /Spaces=/0);
1d019706d866 LLVM10 anatofuz parents: diff changeset	906 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	907
1d019706d866 LLVM10 anatofuz parents: diff changeset	908 void BreakableLineCommentSection::adaptStartOfLine(
1d019706d866 LLVM10 anatofuz parents: diff changeset	909 unsigned LineIndex, WhitespaceManager &Whitespaces) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	910 // If this is the first line of a token, we need to inform Whitespace Manager
1d019706d866 LLVM10 anatofuz parents: diff changeset	911 // about it: either adapt the whitespace range preceding it, or mark it as an
1d019706d866 LLVM10 anatofuz parents: diff changeset	912 // untouchable token.
1d019706d866 LLVM10 anatofuz parents: diff changeset	913 // This happens for instance here:
1d019706d866 LLVM10 anatofuz parents: diff changeset	914 // // line 1 \
1d019706d866 LLVM10 anatofuz parents: diff changeset	915 // // line 2
1d019706d866 LLVM10 anatofuz parents: diff changeset	916 if (LineIndex > 0 && Tokens[LineIndex] != Tokens[LineIndex - 1]) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	917 // This is the first line for the current token, but no reflow with the
1d019706d866 LLVM10 anatofuz parents: diff changeset	918 // previous token is necessary. However, we still may need to adjust the
1d019706d866 LLVM10 anatofuz parents: diff changeset	919 // start column. Note that ContentColumn[LineIndex] is the expected
1d019706d866 LLVM10 anatofuz parents: diff changeset	920 // content column after a possible update to the prefix, hence the prefix
1d019706d866 LLVM10 anatofuz parents: diff changeset	921 // length change is included.
1d019706d866 LLVM10 anatofuz parents: diff changeset	922 unsigned LineColumn =
1d019706d866 LLVM10 anatofuz parents: diff changeset	923 ContentColumn[LineIndex] -
1d019706d866 LLVM10 anatofuz parents: diff changeset	924 (Content[LineIndex].data() - Lines[LineIndex].data()) +
1d019706d866 LLVM10 anatofuz parents: diff changeset	925 (OriginalPrefix[LineIndex].size() - Prefix[LineIndex].size());
1d019706d866 LLVM10 anatofuz parents: diff changeset	926
1d019706d866 LLVM10 anatofuz parents: diff changeset	927 // We always want to create a replacement instead of adding an untouchable
1d019706d866 LLVM10 anatofuz parents: diff changeset	928 // token, even if LineColumn is the same as the original column of the
1d019706d866 LLVM10 anatofuz parents: diff changeset	929 // token. This is because WhitespaceManager doesn't align trailing
1d019706d866 LLVM10 anatofuz parents: diff changeset	930 // comments if they are untouchable.
1d019706d866 LLVM10 anatofuz parents: diff changeset	931 Whitespaces.replaceWhitespace(*Tokens[LineIndex],
1d019706d866 LLVM10 anatofuz parents: diff changeset	932 /Newlines=/1,
1d019706d866 LLVM10 anatofuz parents: diff changeset	933 /Spaces=/LineColumn,
1d019706d866 LLVM10 anatofuz parents: diff changeset	934 /StartOfTokenColumn=/LineColumn,
1d019706d866 LLVM10 anatofuz parents: diff changeset	935 /InPPDirective=/false);
1d019706d866 LLVM10 anatofuz parents: diff changeset	936 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	937 if (OriginalPrefix[LineIndex] != Prefix[LineIndex]) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	938 // Adjust the prefix if necessary.
1d019706d866 LLVM10 anatofuz parents: diff changeset	939
1d019706d866 LLVM10 anatofuz parents: diff changeset	940 // Take care of the space possibly introduced after a decoration.
1d019706d866 LLVM10 anatofuz parents: diff changeset	941 assert(Prefix[LineIndex] == (OriginalPrefix[LineIndex] + " ").str() &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	942 "Expecting a line comment prefix to differ from original by at most "
1d019706d866 LLVM10 anatofuz parents: diff changeset	943 "a space");
1d019706d866 LLVM10 anatofuz parents: diff changeset	944 Whitespaces.replaceWhitespaceInToken(
1d019706d866 LLVM10 anatofuz parents: diff changeset	945 tokenAt(LineIndex), OriginalPrefix[LineIndex].size(), 0, "", "",
1d019706d866 LLVM10 anatofuz parents: diff changeset	946 /InPPDirective=/false, /Newlines=/0, /Spaces=/1);
1d019706d866 LLVM10 anatofuz parents: diff changeset	947 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	948 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	949
1d019706d866 LLVM10 anatofuz parents: diff changeset	950 void BreakableLineCommentSection::updateNextToken(LineState &State) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	951 if (LastLineTok) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	952 State.NextToken = LastLineTok->Next;
1d019706d866 LLVM10 anatofuz parents: diff changeset	953 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	954 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	955
1d019706d866 LLVM10 anatofuz parents: diff changeset	956 bool BreakableLineCommentSection::mayReflow(
1d019706d866 LLVM10 anatofuz parents: diff changeset	957 unsigned LineIndex, const llvm::Regex &CommentPragmasRegex) const {
1d019706d866 LLVM10 anatofuz parents: diff changeset	958 // Line comments have the indent as part of the prefix, so we need to
1d019706d866 LLVM10 anatofuz parents: diff changeset	959 // recompute the start of the line.
1d019706d866 LLVM10 anatofuz parents: diff changeset	960 StringRef IndentContent = Content[LineIndex];
1d019706d866 LLVM10 anatofuz parents: diff changeset	961 if (Lines[LineIndex].startswith("//")) {
1d019706d866 LLVM10 anatofuz parents: diff changeset	962 IndentContent = Lines[LineIndex].substr(2);
1d019706d866 LLVM10 anatofuz parents: diff changeset	963 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	964 // FIXME: Decide whether we want to reflow non-regular indents:
1d019706d866 LLVM10 anatofuz parents: diff changeset	965 // Currently, we only reflow when the OriginalPrefix[LineIndex] matches the
1d019706d866 LLVM10 anatofuz parents: diff changeset	966 // OriginalPrefix[LineIndex-1]. That means we don't reflow
1d019706d866 LLVM10 anatofuz parents: diff changeset	967 // // text that protrudes
1d019706d866 LLVM10 anatofuz parents: diff changeset	968 // // into text with different indent
1d019706d866 LLVM10 anatofuz parents: diff changeset	969 // We do reflow in that case in block comments.
1d019706d866 LLVM10 anatofuz parents: diff changeset	970 return LineIndex > 0 && !CommentPragmasRegex.match(IndentContent) &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	971 mayReflowContent(Content[LineIndex]) && !Tok.Finalized &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	972 !switchesFormatting(tokenAt(LineIndex)) &&
1d019706d866 LLVM10 anatofuz parents: diff changeset	973 OriginalPrefix[LineIndex] == OriginalPrefix[LineIndex - 1];
1d019706d866 LLVM10 anatofuz parents: diff changeset	974 }
1d019706d866 LLVM10 anatofuz parents: diff changeset	975
1d019706d866 LLVM10 anatofuz parents: diff changeset	976 } // namespace format
1d019706d866 LLVM10 anatofuz parents: diff changeset	977 } // namespace clang

Mercurial > hg > CbC > CbC_llvm

annotate clang/lib/Format/BreakableToken.cpp @ 150:1d019706d866