cppalliance
diff --git a/‎include/mrdocs/Support/String.hpp
Lines changed: 3 additions & 1 deletion b/‎include/mrdocs/Support/String.hpp
Lines changed: 3 additions & 1 deletion
diff --git a/‎src/lib/AST/ASTVisitor.cpp
Lines changed: 0 additions & 7 deletions b/‎src/lib/AST/ASTVisitor.cpp
Lines changed: 0 additions & 7 deletions
diff --git a/‎src/lib/AST/ParseJavadoc.cpp
Lines changed: 173 additions & 9 deletions b/‎src/lib/AST/ParseJavadoc.cpp
Lines changed: 173 additions & 9 deletions
diff --git a/‎src/lib/Gen/adoc/DocVisitor.cpp
Lines changed: 25 additions & 21 deletions b/‎src/lib/Gen/adoc/DocVisitor.cpp
Lines changed: 25 additions & 21 deletions
@@ -45,8 +45,10 @@ rtrim(std::string_view s) noexcept
 {
     auto it = s.end() - 1;
     while(it > s.begin() && std::isspace(*it))
+    {
         --it;
-    return s.substr(0, it - s.begin());
+    }
+    return s.substr(0, it - s.begin() + 1);
 }
 
 /** Return the substring without leading and trailing horizontal whitespace.
 
@@ -1754,13 +1754,6 @@ generateJavadoc(
     {
         return false;
     }
-    // KRYSTIAN FIXME: clang ignores documentation comments
-    // when there is a preprocessor directive between the end
-    // of the comment and the declaration location. there are two
-    // ways to fix this: either set the declaration begin location
-    // to be before and preprocessor directives, or submit a patch
-    // which disables this behavior (it's not entirely clear why
-    // this check occurs anyways, so some investigation is needed)
     parseJavadoc(javadoc, FC, D, config_, diags_);
     return true;
 }
 
@@ -16,6 +16,7 @@
 #include <mrdocs/Support/Error.hpp>
 #include <mrdocs/Support/Path.hpp>
 #include <mrdocs/Support/String.hpp>
+#include <mrdocs/Support/ScopeExit.hpp>
 #include <clang/AST/CommentCommandTraits.h>
 #include <clang/AST/ASTContext.h>
 #include <clang/AST/RawCommentList.h>
@@ -397,22 +398,183 @@ ensureUTF8(
     return s;
 }
 
+/*  Parse the inline content of a text
+
+    This function takes a string from a comment
+    and parses it into a sequence of styled text
+    nodes.
+
+    The string may contain inline commands that
+    change the style of the text:
+
+    Regular text is stored as a doc::Text.
+    Styled text is stored as a doc::Styled.
+
+    The styles can be one of: mono, bold, or italic.
+
+    The tags "`", "*", and "_" are used to indicate
+    the start and end of styled text. They can be
+    escaped by prefixing them with a backslash.
+
+ */
+doc::List<doc::Text>
+parseStyled(StringRef s)
+{
+    doc::List<doc::Text> result;
+    std::string currentText;
+    doc::Style currentStyle = doc::Style::none;
+    bool escapeNext = false;
+
+    auto isStyleMarker = [](char c) {
+        return c == '`' || c == '*' || c == '_';
+    };
+
+    auto flushCurrentText = [&]() {
+        if (!currentText.empty()) {
+            if (currentStyle == doc::Style::none) {
+                bool const lastIsSame =
+                    !result.empty() &&
+                    result.back()->kind == doc::Kind::text;
+                if (lastIsSame)
+                {
+                    auto& lastText = static_cast<doc::Text&>(*result.back());
+                    lastText.string.append(currentText);
+                }
+                else
+                {
+                    result.emplace_back(std::make_unique<doc::Text>(std::move(currentText)));
+                }
+            } else {
+                bool const lastIsSame =
+                    !result.empty() &&
+                    result.back()->kind == doc::Kind::styled &&
+                    static_cast<doc::Styled&>(*result.back()).style == currentStyle;
+                if (lastIsSame)
+                {
+                    auto& lastStyled = static_cast<doc::Styled&>(*result.back());
+                    lastStyled.string.append(currentText);
+                }
+                else
+                {
+                    result.emplace_back(std::make_unique<doc::Styled>(std::move(currentText), currentStyle));
+                }
+            }
+            currentText.clear();
+        }
+    };
+
+    auto isPunctuationOrSpace = [](char c) {
+        return std::isspace(c) || std::ispunct(c);
+    };
+
+    for (std::size_t i = 0; i < s.size(); ++i) {
+        char c = s[i];
+        if (escapeNext) {
+            currentText.push_back(c);
+            escapeNext = false;
+        } else if (c == '\\') {
+            escapeNext = true;
+        } else if (isStyleMarker(c)) {
+            bool const atWordBoundary =
+                (currentStyle == doc::Style::none && ((i == 0) || isPunctuationOrSpace(s[i - 1]))) ||
+                (currentStyle != doc::Style::none && ((i == s.size() - 1) || isPunctuationOrSpace(s[i + 1])));
+            if (atWordBoundary) {
+                flushCurrentText();
+                if (c == '`') {
+                    currentStyle = (currentStyle == doc::Style::mono) ? doc::Style::none : doc::Style::mono;
+                } else if (c == '*') {
+                    currentStyle = (currentStyle == doc::Style::bold) ? doc::Style::none : doc::Style::bold;
+                } else if (c == '_') {
+                    currentStyle = (currentStyle == doc::Style::italic) ? doc::Style::none : doc::Style::italic;
+                }
+            } else {
+                currentText.push_back(c);
+            }
+        } else {
+            currentText.push_back(c);
+        }
+    }
+
+    // Whatever style we started, we should end it because
+    // we reached the end of the string without a closing
+    // marker.
+    currentStyle = doc::Style::none;
+    flushCurrentText();
+
+    return result;
+}
+
 void
 JavadocVisitor::
 visitChildren(
     Comment const* C)
 {
-    auto const it0 = it_;
-    auto const end0 = end_;
-    it_ = C->child_begin();
-    end_ = C->child_end();
+    ScopeExitRestore s1(it_, C->child_begin());
+    ScopeExitRestore s2(end_, C->child_end());
     while(it_ != end_)
     {
         visit(*it_);
         ++it_; // must happen after
     }
-    it_ = it0;
-    end_ = end0;
+
+    if (!block_)
+    {
+        return;
+    }
+
+    bool const isVerbatim = block_->kind == doc::Kind::code;
+    if (isVerbatim)
+    {
+        return;
+    }
+
+    // Merge consecutive plain text nodes in the current block
+    auto it = block_->children.begin();
+    while(it != block_->children.end())
+    {
+        auto& child = *it;
+        if (child.get()->kind == doc::Kind::text)
+        {
+            auto* text = dynamic_cast<doc::Text*>(child.get());
+            MRDOCS_ASSERT(text);
+            auto next = std::next(it);
+            if(next != block_->children.end())
+            {
+                if(next->get()->kind == doc::Kind::text)
+                {
+                    auto* next_text = dynamic_cast<doc::Text*>(next->get());
+                    MRDOCS_ASSERT(next_text);
+                    text->string.append(next_text->string);
+                    it = block_->children.erase(next);
+                    continue;
+                }
+            }
+        }
+        ++it;
+    }
+
+    // Parse any Text nodes for styled text
+    for (auto it = block_->children.begin(); it != block_->children.end();)
+    {
+        MRDOCS_ASSERT(it->get());
+        if (it->get()->kind == doc::Kind::text)
+        {
+            auto* text = dynamic_cast<doc::Text*>(it->get());
+            auto styledText = parseStyled(text->string);
+            std::size_t const offset = std::distance(block_->children.begin(), it);
+            std::size_t const n = styledText.size();
+            block_->children.erase(it);
+            block_->children.insert(
+                block_->children.begin() + offset,
+                std::make_move_iterator(styledText.begin()),
+                std::make_move_iterator(styledText.end()));
+            it = block_->children.begin() + offset + n;
+        }
+        else
+        {
+            ++it;
+        }
+    }
 }
 
 //------------------------------------------------
@@ -462,16 +624,18 @@ visitTextComment(
     // If this is the first text comment in the
     // paragraph then remove all the leading space.
     // Otherwise, just remove the trailing space.
-    if(block_->children.empty())
+    if (block_->children.empty())
+    {
         s = s.ltrim();
-    else
-        s = s.rtrim();
+    }
 
     // Only insert non-empty text nodes
     if(! s.empty())
+    {
         emplaceText<doc::Text>(
             C->hasTrailingNewline(),
             ensureUTF8(s.str()));
+    }
 }
 
 Expected<JavadocVisitor::TagComponents>
 
@@ -18,6 +18,7 @@
 #include <llvm/Support/raw_ostream.h>
 #include <mrdocs/Support/RangeFor.hpp>
 #include <mrdocs/Support/String.hpp>
+#include <ranges>
 
 namespace clang::mrdocs::adoc {
 
@@ -65,7 +66,7 @@ operator()(
         doc::visit(*it.value,
             [&]<class T>(T const& text)
             {
-                if constexpr(std::is_same_v<T, doc::Text>)
+                if constexpr(std::derived_from<T, doc::Text>)
                 {
                     if(! text.string.empty())
                     {
@@ -89,7 +90,7 @@ DocVisitor::
 operator()(
     doc::Heading const& I) const
 {
-    fmt::format_to(ins_, "\n=== {}\n", AdocEscape(I.string));
+    fmt::format_to(ins_, "\n=== {}\n\n", AdocEscape(I.string));
 }
 
 // Also handles doc::Brief
@@ -103,15 +104,23 @@ operator()(
     {
         return;
     }
-    bool non_empty = write(*children.front(), *this);
-    for(auto const& child : children.subspan(1))
+
+    std::size_t i = 0;
+    for (auto it = children.begin(); it != children.end(); ++it)
     {
-        if (non_empty)
+        auto& child = *it;
+        if (i == 0)
         {
-            dest_.push_back('\n');
+            child->string = ltrim(child->string);
         }
-        non_empty = write(*child, *this);
+        if (i == children.size() - 1)
+        {
+            child->string = rtrim(child->string);
+        }
+        write(*child, *this);
+        i = i + 1;
     }
+
     dest_.push_back('\n');
     dest_.push_back('\n');
 }
@@ -188,37 +197,32 @@ void
 DocVisitor::
 operator()(doc::Text const& I) const
 {
-    // Asciidoc text must not have leading
-    // else they can be rendered up as code.
-    std::string_view s = trim(I.string);
-    // Render empty lines as paragraph delimiters.
-    if (s.empty())
+    if (I.string.empty())
+    {
+        dest_.append("\n\n");
+    } else
     {
-        s = "\n";
+        dest_.append(AdocEscape(I.string));
     }
-    dest_.append(AdocEscape(s));
 }
 
 void
 DocVisitor::
 operator()(doc::Styled const& I) const
 {
-    // VFALCO We need to apply Asciidoc escaping
-    // depending on the contents of the string.
-    std::string_view s = trim(I.string);
     switch(I.style)
     {
     case doc::Style::none:
-        dest_.append(s);
+        dest_.append(AdocEscape(I.string));
         break;
     case doc::Style::bold:
-        fmt::format_to(std::back_inserter(dest_), "*{}*", s);
+        fmt::format_to(std::back_inserter(dest_), "*{}*", AdocEscape(I.string));
         break;
     case doc::Style::mono:
-        fmt::format_to(std::back_inserter(dest_), "`{}`", s);
+        fmt::format_to(std::back_inserter(dest_), "`{}`", AdocEscape(I.string));
         break;
     case doc::Style::italic:
-        fmt::format_to(std::back_inserter(dest_), "_{}_", s);
+        fmt::format_to(std::back_inserter(dest_), "_{}_", AdocEscape(I.string));
         break;
     default:
         MRDOCS_UNREACHABLE();
Original file line number	Diff line number	Diff line change
`@@ -45,8 +45,10 @@ rtrim(std::string_view s) noexcept`
`45`	`45`	`{`
`46`	`46`	`auto it = s.end() - 1;`
`47`	`47`	`while(it > s.begin() && std::isspace(*it))`
	`48`	`+ {`
`48`	`49`	`--it;`
`49`		`- return s.substr(0, it - s.begin());`
	`50`	`+ }`
	`51`	`+ return s.substr(0, it - s.begin() + 1);`
`50`	`52`	`}`
`51`	`53`
`52`	`54`	`/** Return the substring without leading and trailing horizontal whitespace.`
Original file line number	Diff line number	Diff line change
`@@ -1754,13 +1754,6 @@ generateJavadoc(`
`1754`	`1754`	`{`
`1755`	`1755`	`return false;`
`1756`	`1756`	`}`
`1757`		`- // KRYSTIAN FIXME: clang ignores documentation comments`
`1758`		`- // when there is a preprocessor directive between the end`
`1759`		`- // of the comment and the declaration location. there are two`
`1760`		`- // ways to fix this: either set the declaration begin location`
`1761`		`- // to be before and preprocessor directives, or submit a patch`
`1762`		`- // which disables this behavior (it's not entirely clear why`
`1763`		`- // this check occurs anyways, so some investigation is needed)`
`1764`	`1757`	`parseJavadoc(javadoc, FC, D, config_, diags_);`
`1765`	`1758`	`return true;`
`1766`	`1759`	`}`
Original file line number	Diff line number	Diff line change
`@@ -18,6 +18,7 @@`
`18`	`18`	`#include <llvm/Support/raw_ostream.h>`
`19`	`19`	`#include <mrdocs/Support/RangeFor.hpp>`
`20`	`20`	`#include <mrdocs/Support/String.hpp>`
	`21`	`+#include <ranges>`
`21`	`22`
`22`	`23`	`namespace clang::mrdocs::adoc {`
`23`	`24`
`@@ -65,7 +66,7 @@ operator()(`
`65`	`66`	`doc::visit(*it.value,`
`66`	`67`	`[&]<class T>(T const& text)`
`67`	`68`	`{`
`68`		`- if constexpr(std::is_same_v<T, doc::Text>)`
	`69`	`+ if constexpr(std::derived_from<T, doc::Text>)`
`69`	`70`	`{`
`70`	`71`	`if(! text.string.empty())`
`71`	`72`	`{`
`@@ -89,7 +90,7 @@ DocVisitor::`
`89`	`90`	`operator()(`
`90`	`91`	`doc::Heading const& I) const`
`91`	`92`	`{`
`92`		`- fmt::format_to(ins_, "\n=== {}\n", AdocEscape(I.string));`
	`93`	`+ fmt::format_to(ins_, "\n=== {}\n\n", AdocEscape(I.string));`
`93`	`94`	`}`
`94`	`95`
`95`	`96`	`// Also handles doc::Brief`
`@@ -103,15 +104,23 @@ operator()(`
`103`	`104`	`{`
`104`	`105`	`return;`
`105`	`106`	`}`
`106`		`- bool non_empty = write(*children.front(), *this);`
`107`		`- for(auto const& child : children.subspan(1))`
	`107`	`+`
	`108`	`+ std::size_t i = 0;`
	`109`	`+ for (auto it = children.begin(); it != children.end(); ++it)`
`108`	`110`	`{`
`109`		`- if (non_empty)`
	`111`	`+ auto& child = *it;`
	`112`	`+ if (i == 0)`
`110`	`113`	`{`
`111`		`- dest_.push_back('\n');`
	`114`	`+ child->string = ltrim(child->string);`
`112`	`115`	`}`
`113`		`- non_empty = write(*child, *this);`
	`116`	`+ if (i == children.size() - 1)`
	`117`	`+ {`
	`118`	`+ child->string = rtrim(child->string);`
	`119`	`+ }`
	`120`	`+ write(*child, *this);`
	`121`	`+ i = i + 1;`
`114`	`122`	`}`
	`123`	`+`
`115`	`124`	`dest_.push_back('\n');`
`116`	`125`	`dest_.push_back('\n');`
`117`	`126`	`}`
`@@ -188,37 +197,32 @@ void`
`188`	`197`	`DocVisitor::`
`189`	`198`	`operator()(doc::Text const& I) const`
`190`	`199`	`{`
`191`		`- // Asciidoc text must not have leading`
`192`		`- // else they can be rendered up as code.`
`193`		`- std::string_view s = trim(I.string);`
`194`		`- // Render empty lines as paragraph delimiters.`
`195`		`- if (s.empty())`
	`200`	`+ if (I.string.empty())`
	`201`	`+ {`
	`202`	`+ dest_.append("\n\n");`
	`203`	`+ } else`
`196`	`204`	`{`
`197`		`- s = "\n";`
	`205`	`+ dest_.append(AdocEscape(I.string));`
`198`	`206`	`}`
`199`		`- dest_.append(AdocEscape(s));`
`200`	`207`	`}`
`201`	`208`
`202`	`209`	`void`
`203`	`210`	`DocVisitor::`
`204`	`211`	`operator()(doc::Styled const& I) const`
`205`	`212`	`{`
`206`		`- // VFALCO We need to apply Asciidoc escaping`
`207`		`- // depending on the contents of the string.`
`208`		`- std::string_view s = trim(I.string);`
`209`	`213`	`switch(I.style)`
`210`	`214`	`{`
`211`	`215`	`case doc::Style::none:`
`212`		`- dest_.append(s);`
	`216`	`+ dest_.append(AdocEscape(I.string));`
`213`	`217`	`break;`
`214`	`218`	`case doc::Style::bold:`
`215`		`- fmt::format_to(std::back_inserter(dest_), "*{}*", s);`
	`219`	`+ fmt::format_to(std::back_inserter(dest_), "*{}*", AdocEscape(I.string));`
`216`	`220`	`break;`
`217`	`221`	`case doc::Style::mono:`
`218`		``- fmt::format_to(std::back_inserter(dest_), "`{}`", s);``
	`222`	``+ fmt::format_to(std::back_inserter(dest_), "`{}`", AdocEscape(I.string));``
`219`	`223`	`break;`
`220`	`224`	`case doc::Style::italic:`
`221`		`- fmt::format_to(std::back_inserter(dest_), "_{}_", s);`
	`225`	`+ fmt::format_to(std::back_inserter(dest_), "_{}_", AdocEscape(I.string));`
`222`	`226`	`break;`
`223`	`227`	`default:`
`224`	`228`	`MRDOCS_UNREACHABLE();`