clang-tools-extra/clangd/support/Markup.cpp - llvm-project - Git at Google

 //===--- Markup.cpp -----------------------------------------*- C++-*------===//
 //
 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 // See https://llvm.org/LICENSE.txt for license information.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//
 #include "support/Markup.h"
 #include "clang/Basic/CharInfo.h"
 #include "llvm/ADT/ArrayRef.h"
 #include "llvm/ADT/STLExtras.h"
 #include "llvm/ADT/SmallVector.h"
 #include "llvm/ADT/StringExtras.h"
 #include "llvm/ADT/StringRef.h"
 #include "llvm/Support/raw_ostream.h"
 #include <cstddef>
 #include <iterator>
 #include <memory>
 #include <string>
 #include <vector>

 namespace clang {
 namespace clangd {
 namespace markup {
 namespace {

 // Is <contents a plausible start to an HTML tag?
 // Contents may not be the rest of the line, but it's the rest of the plain
 // text, so we expect to see at least the tag name.
 bool looksLikeTag(llvm::StringRef Contents) {
   if (Contents.empty())
     return false;
   if (Contents.front() == '!' || Contents.front() == '?' ||
       Contents.front() == '/')
     return true;
   // Check the start of the tag name.
   if (!llvm::isAlpha(Contents.front()))
     return false;
   // Drop rest of the tag name, and following whitespace.
   Contents = Contents
                  .drop_while([](char C) {
                    return llvm::isAlnum(C) || C == '-' || C == '_' || C == ':';
                  })
                  .drop_while(llvm::isSpace);
   // The rest of the tag consists of attributes, which have restrictive names.
   // If we hit '=', all bets are off (attribute values can contain anything).
   for (; !Contents.empty(); Contents = Contents.drop_front()) {
     if (llvm::isAlnum(Contents.front()) || llvm::isSpace(Contents.front()))
       continue;
     if (Contents.front() == '>' || Contents.starts_with("/>"))
       return true; // May close the tag.
     if (Contents.front() == '=')
       return true; // Don't try to parse attribute values.
     return false;  // Random punctuation means this isn't a tag.
   }
   return true; // Potentially incomplete tag.
 }

 // Tests whether C should be backslash-escaped in markdown.
 // The string being escaped is Before + C + After. This is part of a paragraph.
 // StartsLine indicates whether `Before` is the start of the line.
 // After may not be everything until the end of the line.
 //
 // It's always safe to escape punctuation, but want minimal escaping.
 // The strategy is to escape the first character of anything that might start
 // a markdown grammar construct.
 bool needsLeadingEscapePlaintext(char C, llvm::StringRef Before,
                                  llvm::StringRef After, bool StartsLine) {
   assert(Before.take_while(llvm::isSpace).empty());
   auto RulerLength = [&]() -> /*Length*/ unsigned {
     if (!StartsLine || !Before.empty())
       return false;
     llvm::StringRef A = After.rtrim();
     return llvm::all_of(A, [C](char D) { return C == D; }) ? 1 + A.size() : 0;
   };
   auto IsBullet = [&]() {
     return StartsLine && Before.empty() &&
            (After.empty() || After.starts_with(" "));
   };
   auto SpaceSurrounds = [&]() {
     return (After.empty() || llvm::isSpace(After.front())) &&
            (Before.empty() || llvm::isSpace(Before.back()));
   };
   auto WordSurrounds = [&]() {
     return (!After.empty() && llvm::isAlnum(After.front())) &&
            (!Before.empty() && llvm::isAlnum(Before.back()));
   };

   switch (C) {
   case '\\': // Escaped character.
     return true;
   case '`': // Code block or inline code
     // Any number of backticks can delimit an inline code block that can end
     // anywhere (including on another line). We must escape them all.
     return true;
   case '~': // Code block
     return StartsLine && Before.empty() && After.starts_with("~~");
   case '#': { // ATX heading.
     if (!StartsLine || !Before.empty())
       return false;
     llvm::StringRef Rest = After.ltrim(C);
     return Rest.empty() || Rest.starts_with(" ");
   }
   case ']': // Link or link reference.
     // We escape ] rather than [ here, because it's more constrained:
     //   ](...) is an in-line link
     //   ]: is a link reference
     // The following are only links if the link reference exists:
     //   ] by itself is a shortcut link
     //   ][...] is an out-of-line link
     // Because we never emit link references, we don't need to handle these.
     return After.starts_with(":") || After.starts_with("(");
   case '=': // Setex heading.
     return RulerLength() > 0;
   case '_': // Horizontal ruler or matched delimiter.
     if (RulerLength() >= 3)
       return true;
     // Not a delimiter if surrounded by space, or inside a word.
     // (The rules at word boundaries are subtle).
     return !(SpaceSurrounds() || WordSurrounds());
   case '-': // Setex heading, horizontal ruler, or bullet.
     if (RulerLength() > 0)
       return true;
     return IsBullet();
   case '+': // Bullet list.
     return IsBullet();
   case '*': // Bullet list, horizontal ruler, or delimiter.
     return IsBullet() || RulerLength() >= 3 || !SpaceSurrounds();
   case '<': // HTML tag (or autolink, which we choose not to escape)
     return looksLikeTag(After);
   case '>': // Quote marker. Needs escaping at start of line.
     return StartsLine && Before.empty();
   case '&': { // HTML entity reference
     auto End = After.find(';');
     if (End == llvm::StringRef::npos)
       return false;
     llvm::StringRef Content = After.substr(0, End);
     if (Content.consume_front("#")) {
       if (Content.consume_front("x") || Content.consume_front("X"))
         return llvm::all_of(Content, llvm::isHexDigit);
       return llvm::all_of(Content, llvm::isDigit);
     }
     return llvm::all_of(Content, llvm::isAlpha);
   }
   case '.': // Numbered list indicator. Escape 12. -> 12\. at start of line.
   case ')':
     return StartsLine && !Before.empty() &&
            llvm::all_of(Before, llvm::isDigit) && After.starts_with(" ");
   default:
     return false;
   }
 }

 /// \brief Tests whether \p C should be backslash-escaped in markdown.
 ///
 /// The MarkupContent LSP specification defines that `markdown` content needs to
 /// follow GFM (GitHub Flavored Markdown) rules. And we can assume that markdown
 /// is rendered on the client side. This means we do not need to escape any
 /// markdown constructs.
 /// The only exception is when the client does not support HTML rendering in
 /// markdown. In that case, we need to escape HTML tags and HTML entities.
 ///
 /// **FIXME:** handle the case when the client does support HTML rendering in
 /// markdown. For this, the LSP server needs to check the
 /// [supportsHtml
 /// capability](https://github.com/microsoft/language-server-protocol/issues/1344)
 /// of the client.
 ///
 /// \param C The character to check.
 /// \param After The string that follows \p C .
 /// This is used to determine if \p C is part of a tag or an entity reference.
 ///
 /// \returns true if \p C should be escaped, false otherwise.
 bool needsLeadingEscapeMarkdown(char C, llvm::StringRef After) {
   switch (C) {
   case '<': // HTML tag (or autolink, which we choose not to escape)
     return looksLikeTag(After);
   case '&': { // HTML entity reference
     auto End = After.find(';');
     if (End == llvm::StringRef::npos)
       return false;
     llvm::StringRef Content = After.substr(0, End);
     if (Content.consume_front("#")) {
       if (Content.consume_front("x") || Content.consume_front("X"))
         return llvm::all_of(Content, llvm::isHexDigit);
       return llvm::all_of(Content, llvm::isDigit);
     }
     return llvm::all_of(Content, llvm::isAlpha);
   }
   default:
     return false;
   }
 }

 bool needsLeadingEscape(char C, llvm::StringRef Before, llvm::StringRef After,
                         bool StartsLine, bool EscapeMarkdown) {
   if (EscapeMarkdown)
     return needsLeadingEscapePlaintext(C, Before, After, StartsLine);
   return needsLeadingEscapeMarkdown(C, After);
 }

 /// Escape a markdown text block.
 /// If \p EscapeMarkdown is true it ensures the punctuation will not introduce
 /// any of the markdown constructs.
 /// Else, markdown syntax is not escaped, only HTML tags and entities.
 std::string renderText(llvm::StringRef Input, bool StartsLine,
                        bool EscapeMarkdown) {
   std::string R;
   R.reserve(Input.size());

   // split the input into lines, and escape each line separately.
   llvm::StringRef Line, Rest;

   bool IsFirstLine = true;

   for (std::tie(Line, Rest) = Input.split('\n');
        !(Line.empty() && Rest.empty());
        std::tie(Line, Rest) = Rest.split('\n')) {

     bool StartsLineIntern = IsFirstLine ? StartsLine : true;

     // Ignore leading spaces for the escape logic, but preserve them in the
     // output.
     StringRef LeadingSpaces = Line.take_while(llvm::isSpace);
     if (!LeadingSpaces.empty()) {
       R.append(LeadingSpaces);
     }

     for (unsigned I = LeadingSpaces.size(); I < Line.size(); ++I) {
       if (needsLeadingEscape(Line[I], Line.substr(LeadingSpaces.size(), I),
                              Line.substr(I + 1), StartsLineIntern,
                              EscapeMarkdown))
         R.push_back('\\');
       R.push_back(Line[I]);
     }

     IsFirstLine = false;
     if (!Rest.empty())
       R.push_back('\n');
   }

   return R;
 }

 /// Renders \p Input as an inline block of code in markdown. The returned value
 /// is surrounded by backticks and the inner contents are properly escaped.
 std::string renderInlineBlock(llvm::StringRef Input) {
   std::string R;
   R.reserve(Input.size());
   // Double all backticks to make sure we don't close the inline block early.
   for (size_t From = 0; From < Input.size();) {
     size_t Next = Input.find("`", From);
     R += Input.substr(From, Next - From);
     if (Next == llvm::StringRef::npos)
       break;
     R += "``"; // double the found backtick.

     From = Next + 1;
   }
   // If results starts with a backtick, add spaces on both sides. The spaces
   // are ignored by markdown renderers.
   if (llvm::StringRef(R).starts_with("`") || llvm::StringRef(R).ends_with("`"))
     return "` " + std::move(R) + " `";
   // Markdown render should ignore first and last space if both are there. We
   // add an extra pair of spaces in that case to make sure we render what the
   // user intended.
   if (llvm::StringRef(R).starts_with(" ") && llvm::StringRef(R).ends_with(" "))
     return "` " + std::move(R) + " `";
   return "`" + std::move(R) + "`";
 }

 /// Get marker required for \p Input to represent a markdown codeblock. It
 /// consists of at least 3 backticks(`). Although markdown also allows to use
 /// tilde(~) for code blocks, they are never used.
 std::string getMarkerForCodeBlock(llvm::StringRef Input) {
   // Count the maximum number of consecutive backticks in \p Input. We need to
   // start and end the code block with more.
   unsigned MaxBackticks = 0;
   unsigned Backticks = 0;
   for (char C : Input) {
     if (C == '`') {
       ++Backticks;
       continue;
     }
     MaxBackticks = std::max(MaxBackticks, Backticks);
     Backticks = 0;
   }
   MaxBackticks = std::max(Backticks, MaxBackticks);
   // Use the corresponding number of backticks to start and end a code block.
   return std::string(/*Repeat=*/std::max(3u, MaxBackticks + 1), '`');
 }

 // Trims the input and concatenates whitespace blocks into a single ` `.
 std::string canonicalizeSpaces(llvm::StringRef Input) {
   llvm::SmallVector<llvm::StringRef> Words;
   llvm::SplitString(Input, Words);
   return llvm::join(Words, " ");
 }

 std::string renderBlocks(llvm::ArrayRef<std::unique_ptr<Block>> Children,
                          void (Block::*RenderFunc)(llvm::raw_ostream &) const) {
   std::string R;
   llvm::raw_string_ostream OS(R);

   // Trim rulers.
   Children = Children.drop_while(
       [](const std::unique_ptr<Block> &C) { return C->isRuler(); });
   auto Last = llvm::find_if(
       llvm::reverse(Children),
       [](const std::unique_ptr<Block> &C) { return !C->isRuler(); });
   Children = Children.drop_back(Children.end() - Last.base());

   bool LastBlockWasRuler = true;
   for (const auto &C : Children) {
     if (C->isRuler() && LastBlockWasRuler)
       continue;
     LastBlockWasRuler = C->isRuler();
     ((*C).*RenderFunc)(OS);
   }

   // Get rid of redundant empty lines introduced in plaintext while imitating
   // padding in markdown.
   std::string AdjustedResult;
   llvm::StringRef TrimmedText(OS.str());
   TrimmedText = TrimmedText.trim();

   llvm::copy_if(TrimmedText, std::back_inserter(AdjustedResult),
                 [&TrimmedText](const char &C) {
                   return !llvm::StringRef(TrimmedText.data(),
                                           &C - TrimmedText.data() + 1)
                               // We allow at most two newlines.
                               .ends_with("\n\n\n");
                 });

   return AdjustedResult;
 }

 // Separates two blocks with extra spacing. Note that it might render strangely
 // in vscode if the trailing block is a codeblock, see
 // https://github.com/microsoft/vscode/issues/88416 for details.
 class Ruler : public Block {
 public:
   void renderEscapedMarkdown(llvm::raw_ostream &OS) const override {
     renderMarkdown(OS);
   }
   void renderMarkdown(llvm::raw_ostream &OS) const override {
     // Note that we need an extra new line before the ruler, otherwise we might
     // make previous block a title instead of introducing a ruler.
     OS << "\n---\n";
   }
   void renderPlainText(llvm::raw_ostream &OS) const override { OS << '\n'; }
   std::unique_ptr<Block> clone() const override {
     return std::make_unique<Ruler>(*this);
   }
   bool isRuler() const override { return true; }
 };

 class CodeBlock : public Block {
 public:
   void renderEscapedMarkdown(llvm::raw_ostream &OS) const override {
     renderMarkdown(OS);
   }
   void renderMarkdown(llvm::raw_ostream &OS) const override {
     std::string Marker = getMarkerForCodeBlock(Contents);
     // No need to pad from previous blocks, as they should end with a new line.
     OS << Marker << Language << '\n' << Contents;
     if (!Contents.empty() && Contents.back() != '\n')
       OS << '\n';
     // Always end with an empty line to separate code blocks from following
     // paragraphs.
     OS << Marker << "\n\n";
   }

   void renderPlainText(llvm::raw_ostream &OS) const override {
     // In plaintext we want one empty line before and after codeblocks.
     OS << '\n' << Contents << "\n\n";
   }

   std::unique_ptr<Block> clone() const override {
     return std::make_unique<CodeBlock>(*this);
   }

   CodeBlock(std::string Contents, std::string Language)
       : Contents(std::move(Contents)), Language(std::move(Language)) {}

 private:
   std::string Contents;
   std::string Language;
 };

 // Inserts two spaces after each `\n` to indent each line. First line is not
 // indented.
 std::string indentLines(llvm::StringRef Input) {
   assert(!Input.ends_with("\n") && "Input should've been trimmed.");
   std::string IndentedR;
   // We'll add 2 spaces after each new line which is not followed by another new
   // line.
   IndentedR.reserve(Input.size() + Input.count('\n') * 2);
   for (size_t I = 0; I < Input.size(); ++I) {
     char C = Input[I];
     IndentedR += C;
     if (C == '\n' && (((I + 1) < Input.size()) && (Input[I + 1] != '\n')))
       IndentedR.append("  ");
   }
   return IndentedR;
 }

 class Heading : public Paragraph {
 public:
   Heading(size_t Level) : Level(Level) {}

   void renderEscapedMarkdown(llvm::raw_ostream &OS) const override {
     insertHeadingMarkers(OS);
     Paragraph::renderEscapedMarkdown(OS);
   }

   void renderMarkdown(llvm::raw_ostream &OS) const override {
     insertHeadingMarkers(OS);
     Paragraph::renderMarkdown(OS);
   }

 private:
   size_t Level;

   void insertHeadingMarkers(llvm::raw_ostream &OS) const {
     OS << std::string(Level, '#') << ' ';
   }
 };

 } // namespace

 std::string Block::asEscapedMarkdown() const {
   std::string R;
   llvm::raw_string_ostream OS(R);
   renderEscapedMarkdown(OS);
   return llvm::StringRef(OS.str()).trim().str();
 }

 std::string Block::asMarkdown() const {
   std::string R;
   llvm::raw_string_ostream OS(R);
   renderMarkdown(OS);
   return llvm::StringRef(OS.str()).trim().str();
 }

 std::string Block::asPlainText() const {
   std::string R;
   llvm::raw_string_ostream OS(R);
   renderPlainText(OS);
   return llvm::StringRef(OS.str()).trim().str();
 }

 void Paragraph::renderEscapedMarkdown(llvm::raw_ostream &OS) const {
   bool NeedsSpace = false;
   bool HasChunks = false;
   for (auto &C : Chunks) {
     if (C.SpaceBefore || NeedsSpace)
       OS << " ";
     switch (C.Kind) {
     case ChunkKind::PlainText:
       OS << renderText(C.Contents, !HasChunks, /*EscapeMarkdown=*/true);
       break;
     case ChunkKind::InlineCode:
       OS << renderInlineBlock(C.Contents);
       break;
     case ChunkKind::Bold:
       OS << renderText("**" + C.Contents + "**", !HasChunks,
                        /*EscapeMarkdown=*/true);
       break;
     case ChunkKind::Emphasized:
       OS << renderText("*" + C.Contents + "*", !HasChunks,
                        /*EscapeMarkdown=*/true);
       break;
     }
     HasChunks = true;
     NeedsSpace = C.SpaceAfter;
   }
   // A paragraph in markdown is separated by a blank line.
   OS << "\n\n";
 }

 void Paragraph::renderMarkdown(llvm::raw_ostream &OS) const {
   bool NeedsSpace = false;
   bool HasChunks = false;
   for (auto &C : Chunks) {
     if (C.SpaceBefore || NeedsSpace)
       OS << " ";
     switch (C.Kind) {
     case ChunkKind::PlainText:
       OS << renderText(C.Contents, !HasChunks, /*EscapeMarkdown=*/false);
       break;
     case ChunkKind::InlineCode:
       OS << renderInlineBlock(C.Contents);
       break;
     case ChunkKind::Bold:
       OS << "**" << renderText(C.Contents, !HasChunks, /*EscapeMarkdown=*/false)
          << "**";
       break;
     case ChunkKind::Emphasized:
       OS << "*" << renderText(C.Contents, !HasChunks, /*EscapeMarkdown=*/false)
          << "*";
       break;
     }
     HasChunks = true;
     NeedsSpace = C.SpaceAfter;
   }
   // A paragraph in markdown is separated by a blank line.
   OS << "\n\n";
 }

 std::unique_ptr<Block> Paragraph::clone() const {
   return std::make_unique<Paragraph>(*this);
 }

 /// Choose a marker to delimit `Text` from a prioritized list of options.
 /// This is more readable than escaping for plain-text.
 llvm::StringRef Paragraph::chooseMarker(llvm::ArrayRef<llvm::StringRef> Options,
                                         llvm::StringRef Text) const {
   // Prefer a delimiter whose characters don't appear in the text.
   for (llvm::StringRef S : Options)
     if (Text.find_first_of(S) == llvm::StringRef::npos)
       return S;
   return Options.front();
 }

 bool Paragraph::punctuationIndicatesLineBreak(llvm::StringRef Line) const {
   constexpr llvm::StringLiteral Punctuation = R"txt(.:,;!?)txt";

   Line = Line.rtrim();
   return !Line.empty() && Punctuation.contains(Line.back());
 }

 bool Paragraph::isHardLineBreakIndicator(llvm::StringRef Rest) const {
   // '-'/'*' md list, '@'/'\' documentation command, '>' md blockquote,
   // '#' headings, '`' code blocks, two spaces (markdown force newline)
   constexpr llvm::StringLiteral LinebreakIndicators = R"txt(-*@\>#`)txt";

   Rest = Rest.ltrim(" \t");
   if (Rest.empty())
     return false;

   if (LinebreakIndicators.contains(Rest.front()))
     return true;

   if (llvm::isDigit(Rest.front())) {
     llvm::StringRef AfterDigit = Rest.drop_while(llvm::isDigit);
     if (AfterDigit.starts_with(".") || AfterDigit.starts_with(")"))
       return true;
   }
   return false;
 }

 bool Paragraph::isHardLineBreakAfter(llvm::StringRef Line,
                                      llvm::StringRef Rest) const {
   // In Markdown, 2 spaces before a line break forces a line break.
   // Add a line break for plaintext in this case too.
   // Should we also consider whether Line is short?
   return Line.ends_with("  ") || punctuationIndicatesLineBreak(Line) ||
          isHardLineBreakIndicator(Rest);
 }

 void Paragraph::renderPlainText(llvm::raw_ostream &OS) const {
   bool NeedsSpace = false;
   std::string ConcatenatedText;
   ConcatenatedText.reserve(EstimatedStringSize);

   llvm::raw_string_ostream ConcatenatedOS(ConcatenatedText);

   for (auto &C : Chunks) {

     if (C.Kind == ChunkKind::PlainText) {
       if (C.SpaceBefore || NeedsSpace)
         ConcatenatedOS << ' ';

       ConcatenatedOS << C.Contents;
       NeedsSpace = llvm::isSpace(C.Contents.back()) || C.SpaceAfter;
       continue;
     }

     if (C.SpaceBefore || NeedsSpace)
       ConcatenatedOS << ' ';
     llvm::StringRef Marker = "";
     if (C.Preserve && C.Kind == ChunkKind::InlineCode)
       Marker = chooseMarker({"`", "'", "\""}, C.Contents);
     else if (C.Kind == ChunkKind::Bold)
       Marker = "**";
     else if (C.Kind == ChunkKind::Emphasized)
       Marker = "*";
     ConcatenatedOS << Marker << C.Contents << Marker;
     NeedsSpace = C.SpaceAfter;
   }

   // We go through the contents line by line to handle the newlines
   // and required spacing correctly.
   //
   // Newlines are added if:
   // - the line ends with 2 spaces and a newline follows
   // - the line ends with punctuation that indicates a line break (.:,;!?)
   // - the next line starts with a hard line break indicator (-@>#`, or a digit
   //   followed by '.' or ')'), ignoring leading whitespace.
   //
   // Otherwise, newlines in the input are replaced with a single space.
   //
   // Multiple spaces are collapsed into a single space.
   //
   // Lines containing only whitespace are ignored.
   llvm::StringRef Line, Rest;

   for (std::tie(Line, Rest) =
            llvm::StringRef(ConcatenatedText).trim().split('\n');
        !(Line.empty() && Rest.empty());
        std::tie(Line, Rest) = Rest.split('\n')) {

     // Remove lines which only contain whitespace.
     //
     // Note: this also handles the case when there are multiple newlines
     // in a row, since all leading newlines are removed.
     //
     // The documentation parsing treats multiple newlines as paragraph
     // separators, hence it will create a new Paragraph instead of adding
     // multiple newlines to the same Paragraph.
     // Therfore multiple newlines are never added to a paragraph
     // except if the user explicitly adds them using
     // e.g. appendText("user text\n\nnext text").
     Line = Line.ltrim();
     if (Line.empty())
       continue;

     OS << canonicalizeSpaces(Line);

     if (isHardLineBreakAfter(Line, Rest))
       OS << '\n';
     else if (!Rest.empty())
       // Since we removed any trailing whitespace from the input using trim(),
       // we know that the next line contains non-whitespace characters.
       // Therefore, we can add a space without worrying about trailing spaces.
       OS << ' ';
   }

   // Paragraphs are separated by a blank line.
   OS << "\n\n";
 }

 BulletList::BulletList() = default;
 BulletList::~BulletList() = default;

 void BulletList::renderEscapedMarkdown(llvm::raw_ostream &OS) const {
   for (auto &D : Items) {
     std::string M = D.asEscapedMarkdown();
     // Instead of doing this we might prefer passing Indent to children to get
     // rid of the copies, if it turns out to be a bottleneck.
     OS << "- " << indentLines(M) << '\n';
   }
   // We add 2 newlines after list to terminate it in markdown.
   OS << "\n\n";
 }

 void BulletList::renderMarkdown(llvm::raw_ostream &OS) const {
   for (auto &D : Items) {
     std::string M = D.asMarkdown();
     // Instead of doing this we might prefer passing Indent to children to get
     // rid of the copies, if it turns out to be a bottleneck.
     OS << "- " << indentLines(M) << '\n';
   }
   // We add 2 newlines after list to terminate it in markdown.
   OS << "\n\n";
 }

 void BulletList::renderPlainText(llvm::raw_ostream &OS) const {
   for (auto &D : Items) {
     // Instead of doing this we might prefer passing Indent to children to get
     // rid of the copies, if it turns out to be a bottleneck.
     OS << "- " << indentLines(D.asPlainText()) << '\n';
   }
   OS << '\n';
 }

 Paragraph &Paragraph::appendSpace() {
   if (!Chunks.empty())
     Chunks.back().SpaceAfter = true;
   return *this;
 }

 Paragraph &Paragraph::appendChunk(llvm::StringRef Contents, ChunkKind K) {
   if (Contents.empty())
     return *this;
   Chunks.emplace_back();
   Chunk &C = Chunks.back();
   C.Contents = Contents;
   C.Kind = K;

   EstimatedStringSize += Contents.size();
   return *this;
 }

 Paragraph &Paragraph::appendText(llvm::StringRef Text) {
   if (!Chunks.empty() && Chunks.back().Kind == ChunkKind::PlainText) {
     Chunks.back().Contents += std::move(Text);
     return *this;
   }

   return appendChunk(std::move(Text), ChunkKind::PlainText);
 }

 Paragraph &Paragraph::appendEmphasizedText(llvm::StringRef Text) {
   return appendChunk(canonicalizeSpaces(std::move(Text)),
                      ChunkKind::Emphasized);
 }

 Paragraph &Paragraph::appendBoldText(llvm::StringRef Text) {
   return appendChunk(canonicalizeSpaces(std::move(Text)), ChunkKind::Bold);
 }

 Paragraph &Paragraph::appendCode(llvm::StringRef Code, bool Preserve) {
   bool AdjacentCode =
       !Chunks.empty() && Chunks.back().Kind == ChunkKind::InlineCode;
   std::string Norm = canonicalizeSpaces(std::move(Code));
   if (Norm.empty())
     return *this;
   EstimatedStringSize += Norm.size();
   Chunks.emplace_back();
   Chunk &C = Chunks.back();
   C.Contents = std::move(Norm);
   C.Kind = ChunkKind::InlineCode;
   C.Preserve = Preserve;
   // Disallow adjacent code spans without spaces, markdown can't render them.
   C.SpaceBefore = AdjacentCode;

   return *this;
 }

 std::unique_ptr<Block> BulletList::clone() const {
   return std::make_unique<BulletList>(*this);
 }

 class Document &BulletList::addItem() {
   Items.emplace_back();
   return Items.back();
 }

 Document &Document::operator=(const Document &Other) {
   Children.clear();
   for (const auto &C : Other.Children)
     Children.push_back(C->clone());
   return *this;
 }

 void Document::append(Document Other) {
   std::move(Other.Children.begin(), Other.Children.end(),
             std::back_inserter(Children));
 }

 Paragraph &Document::addParagraph() {
   Children.push_back(std::make_unique<Paragraph>());
   return *static_cast<Paragraph *>(Children.back().get());
 }

 void Document::addRuler() { Children.push_back(std::make_unique<Ruler>()); }

 void Document::addCodeBlock(std::string Code, std::string Language) {
   Children.emplace_back(
       std::make_unique<CodeBlock>(std::move(Code), std::move(Language)));
 }

 std::string Document::asEscapedMarkdown() const {
   return renderBlocks(Children, &Block::renderEscapedMarkdown);
 }

 std::string Document::asMarkdown() const {
   return renderBlocks(Children, &Block::renderMarkdown);
 }

 std::string Document::asPlainText() const {
   return renderBlocks(Children, &Block::renderPlainText);
 }

 BulletList &Document::addBulletList() {
   Children.emplace_back(std::make_unique<BulletList>());
   return *static_cast<BulletList *>(Children.back().get());
 }

 Paragraph &Document::addHeading(size_t Level) {
   assert(Level > 0);
   Children.emplace_back(std::make_unique<Heading>(Level));
   return *static_cast<Paragraph *>(Children.back().get());
 }
 } // namespace markup
 } // namespace clangd
 } // namespace clang