From 0c3a0d2f2f81aa87738c3304251eaa4a23240b36 Mon Sep 17 00:00:00 2001
From: Jeremy Daer <jeremy@37signals.com>
Date: Thu, 9 Apr 2026 13:37:51 -0700
Subject: [PATCH] Replace hand-rolled MarkdownToHTML with goldmark
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Replace the ~350-line regex pipeline (convertInline, placeholder
extraction/restoration, line-by-line parser) with goldmark configured
for Trix editor compatibility via three custom components:

- trixTransformer: forces tight lists, converts soft breaks to hard
  inside list items and blockquotes, inserts <br> between
  blank-line-separated blocks for Trix paragraph spacing
- trixRenderer: compact blockquote output, HTML escaping for raw
  HTML (inline and block, vs <!-- raw HTML omitted -->), fenced code
  blocks as <pre language="X">, TrixBreak and EscapedAt node rendering
- escapedAtParser: intercepts \@ before goldmark's standard escape
  handling to preserve mention-suppression syntax

HTMLToMarkdown gains <br>-aware round-trip support: blockquote and
list handlers now normalize <br> tags before splitting, so multiline
blockquotes and list continuations survive the edit loop
(MarkdownToHTML → HTMLToMarkdown) faithfully. Also fixes multiline
blockquote/paragraph regex matching ((?i) → (?is)), anchors tag
patterns so short names no longer match longer tags (<p> vs <pre>,
<b> vs <br>), and trims trailing newlines from code fence content.

Promotes goldmark from indirect to direct dependency (v1.7.13, already
present via glamour).
---
 go.mod                             |   2 +-
 internal/richtext/richtext.go      | 962 +++++++++++++++--------------
 internal/richtext/richtext_test.go | 519 +++++++++++++++-
 3 files changed, 995 insertions(+), 488 deletions(-)
diff --git a/go.mod b/go.mod
index 97ef1cf2..957cd115 100644
--- a/go.mod
+++ b/go.mod
@@ -19,6 +19,7 @@ require (
 	github.com/spf13/cobra v1.10.2
 	github.com/spf13/pflag v1.0.10
 	github.com/stretchr/testify v1.11.1
+	github.com/yuin/goldmark v1.7.13
 	github.com/zalando/go-keyring v0.2.8
 	golang.org/x/mod v0.34.0
 	golang.org/x/sys v0.42.0
@@ -70,7 +71,6 @@ require (
 	github.com/rivo/uniseg v0.4.7 // indirect
 	github.com/rogpeppe/go-internal v1.14.1 // indirect
 	github.com/xo/terminfo v0.0.0-20220910002029-abceb7e1c41e // indirect
-	github.com/yuin/goldmark v1.7.13 // indirect
 	github.com/yuin/goldmark-emoji v1.0.6 // indirect
 	golang.org/x/net v0.38.0 // indirect
 	golang.org/x/sync v0.20.0 // indirect
diff --git a/internal/richtext/richtext.go b/internal/richtext/richtext.go
index 04f3f210..730a0b5b 100644
--- a/internal/richtext/richtext.go
+++ b/internal/richtext/richtext.go
@@ -3,6 +3,7 @@
 package richtext
 
 import (
+	"bytes"
 	"errors"
 	"fmt"
 	"html"
@@ -15,40 +16,18 @@ import (
 	"unicode/utf8"
 
 	"github.com/charmbracelet/glamour"
+	"github.com/yuin/goldmark"
+	"github.com/yuin/goldmark/ast"
+	"github.com/yuin/goldmark/extension"
+	"github.com/yuin/goldmark/parser"
+	"github.com/yuin/goldmark/renderer"
+	gmhtml "github.com/yuin/goldmark/renderer/html"
+	"github.com/yuin/goldmark/text"
+	"github.com/yuin/goldmark/util"
 )
 
-// Pre-compiled regexes for MarkdownToHTML list detection
-var (
-	ulPattern = regexp.MustCompile(`^(\s*)[-*+]\s+(.*)$`)
-	olPattern = regexp.MustCompile(`^(\s*)\d+\.\s+(.*)$`)
-)
-
-// CommonMark §2.4: any ASCII punctuation may be backslash-escaped.
-// Exact set: !"#$%&'()*+,-./:;<=>?@[\]^_`{|}~
-//
-// We intentionally omit @ from the set: in Basecamp context \@ is the
-// idiomatic way to suppress a mention ping, so it must pass through
-// literally and not be unescaped into a bare @ that ResolveMentions
-// would convert into a <bc-attachment> mention.
-const commonMarkEscapablePunctuation = "!\"#$%&'()*+,-./:;<=>?[\\]^_`{|}~"
-
-// Pre-compiled regexes for convertInline (Markdown → HTML inline elements)
-var (
-	reCodeSpan      = regexp.MustCompile("`([^`]+)`")
-	reBoldStar      = regexp.MustCompile(`\*\*([^*]+)\*\*`)
-	reBoldUnder     = regexp.MustCompile(`__([^_]+)__`)
-	reItalicStar    = regexp.MustCompile(`\*([^*]+)\*`)
-	reItalicUnder   = regexp.MustCompile(`(?:^|[^a-zA-Z0-9])_([^_]+)_(?:[^a-zA-Z0-9]|$)`)
-	reItalicInner   = regexp.MustCompile(`_([^_]+)_`)
-	reImage         = regexp.MustCompile(`!\[([^\]]*)\]\(([^)]+)\)`)
-	reLink          = regexp.MustCompile(`\[([^\]]+)\]\(([^)]+)\)`)
-	reStrikethrough = regexp.MustCompile(`~~([^~]+)~~`)
-
-	// Protect escaped backticks before code-span detection so \` does not start a code span.
-	reEscapedBacktick = regexp.MustCompile("\\\\`")
-	// Matches a backslash followed by any CommonMark-escapable ASCII punctuation character.
-	reBackslashEscape = regexp.MustCompile(`\\([` + regexp.QuoteMeta(commonMarkEscapablePunctuation) + `])`)
-)
+// Pre-compiled regex for IsHTML detection (code span stripping).
+var reCodeSpan = regexp.MustCompile("`([^`]+)`")
 
 // Pre-compiled regexes for HTMLToMarkdown (HTML → Markdown block elements)
 var (
@@ -58,32 +37,34 @@ var (
 	reH4         = regexp.MustCompile(`(?i)<h4[^>]*>(.*?)</h4>`)
 	reH5         = regexp.MustCompile(`(?i)<h5[^>]*>(.*?)</h5>`)
 	reH6         = regexp.MustCompile(`(?i)<h6[^>]*>(.*?)</h6>`)
-	reBlockquote = regexp.MustCompile(`(?i)<blockquote[^>]*>(.*?)</blockquote>`)
+	reBlockquote = regexp.MustCompile(`(?is)<blockquote[^>]*>(.*?)</blockquote>`)
 	reCodeBlock  = regexp.MustCompile(`(?is)<pre[^>]*><code[^>]*(?:class="language-([^"]*)")?[^>]*>(.*?)</code></pre>`)
 	reCodeLang   = regexp.MustCompile(`class="language-([^"]*)"`)
+	rePreLang    = regexp.MustCompile(`(?i)<pre[^>]*\blanguage="([^"]*)"`)
 	reCodeInner  = regexp.MustCompile(`(?is)<code[^>]*>([\s\S]*?)</code>`)
-	reUL         = regexp.MustCompile(`(?is)<ul[^>]*>(.*?)</ul>`)
-	reOL         = regexp.MustCompile(`(?is)<ol[^>]*>(.*?)</ol>`)
-	reLI         = regexp.MustCompile(`(?is)<li[^>]*>(.*?)</li>`)
-	reP          = regexp.MustCompile(`(?i)<p[^>]*>(.*?)</p>`)
-	reBR         = regexp.MustCompile(`(?i)<br\s*/?\s*>`)
-	reHR         = regexp.MustCompile(`(?i)<hr\s*/?\s*>`)
+	// Tag-match patterns use (?:\s[^>]*)? to require whitespace or `>` after the
+	// tag name, preventing false matches against longer tag names with the same
+	// prefix (e.g. <p> vs <pre>, <b> vs <br>, <em> vs <embed>, <i> vs <img>,
+	// <s> vs <script>, <del> vs <details>, <a> vs <abbr>).
+	reP  = regexp.MustCompile(`(?is)<p(?:\s[^>]*)?>(.*?)</p>`)
+	reBR = regexp.MustCompile(`(?i)<br\s*/?\s*>`)
+	reHR = regexp.MustCompile(`(?i)<hr\s*/?\s*>`)
 )
 
 // Pre-compiled regexes for HTMLToMarkdown inline elements
 var (
-	reHTMLStrong        = regexp.MustCompile(`(?i)<strong[^>]*>(.*?)</strong>`)
-	reHTMLB             = regexp.MustCompile(`(?i)<b[^>]*>(.*?)</b>`)
-	reHTMLEm            = regexp.MustCompile(`(?i)<em[^>]*>(.*?)</em>`)
-	reHTMLI             = regexp.MustCompile(`(?i)<i[^>]*>(.*?)</i>`)
-	reHTMLCode          = regexp.MustCompile(`(?i)<code[^>]*>(.*?)</code>`)
-	reHTMLLink          = regexp.MustCompile(`(?i)<a[^>]*href="([^"]*)"[^>]*>(.*?)</a>`)
-	reHTMLImgSA         = regexp.MustCompile(`(?i)<img[^>]*src="([^"]*)"[^>]*alt="([^"]*)"[^>]*/?\s*>`)
-	reHTMLImgAS         = regexp.MustCompile(`(?i)<img[^>]*alt="([^"]*)"[^>]*src="([^"]*)"[^>]*/?\s*>`)
-	reHTMLImgS          = regexp.MustCompile(`(?i)<img[^>]*src="([^"]*)"[^>]*/?\s*>`)
-	reHTMLDel           = regexp.MustCompile(`(?i)<del[^>]*>(.*?)</del>`)
-	reHTMLS             = regexp.MustCompile(`(?i)<s[^>]*>(.*?)</s>`)
-	reHTMLStrike        = regexp.MustCompile(`(?i)<strike[^>]*>(.*?)</strike>`)
+	reHTMLStrong        = regexp.MustCompile(`(?i)<strong(?:\s[^>]*)?>(.*?)</strong>`)
+	reHTMLB             = regexp.MustCompile(`(?i)<b(?:\s[^>]*)?>(.*?)</b>`)
+	reHTMLEm            = regexp.MustCompile(`(?i)<em(?:\s[^>]*)?>(.*?)</em>`)
+	reHTMLI             = regexp.MustCompile(`(?i)<i(?:\s[^>]*)?>(.*?)</i>`)
+	reHTMLCode          = regexp.MustCompile(`(?i)<code(?:\s[^>]*)?>(.*?)</code>`)
+	reHTMLLink          = regexp.MustCompile(`(?i)<a\s[^>]*href="([^"]*)"[^>]*>(.*?)</a>`)
+	reHTMLImgSA         = regexp.MustCompile(`(?i)<img\s[^>]*src="([^"]*)"[^>]*alt="([^"]*)"[^>]*/?\s*>`)
+	reHTMLImgAS         = regexp.MustCompile(`(?i)<img\s[^>]*alt="([^"]*)"[^>]*src="([^"]*)"[^>]*/?\s*>`)
+	reHTMLImgS          = regexp.MustCompile(`(?i)<img\s[^>]*src="([^"]*)"[^>]*/?\s*>`)
+	reHTMLDel           = regexp.MustCompile(`(?i)<del(?:\s[^>]*)?>(.*?)</del>`)
+	reHTMLS             = regexp.MustCompile(`(?i)<s(?:\s[^>]*)?>(.*?)</s>`)
+	reHTMLStrike        = regexp.MustCompile(`(?i)<strike(?:\s[^>]*)?>(.*?)</strike>`)
 	reMentionAttachment = regexp.MustCompile(`(?is)<bc-attachment[^>]*content-type="application/vnd\.basecamp\.mention"[^>]*>(.*?)</bc-attachment>`)
 	reMentionFigcaption = regexp.MustCompile(`(?is)<figcaption[^>]*>(.*?)</figcaption>`)
 	reMentionImgAlt     = regexp.MustCompile(`(?is)<img[^>]*alt="([^"]+)"[^>]*>`)
@@ -131,355 +112,257 @@ var reMarkdownPatterns = []*regexp.Regexp{
 	regexp.MustCompile(`^>\s`),
 }
 
-// MarkdownToHTML converts Markdown text to HTML suitable for Basecamp's rich text fields.
-// It handles common Markdown syntax: headings, bold, italic, links, lists, code blocks, and blockquotes.
-// If the input already appears to be HTML, it is returned unchanged to preserve existing formatting.
-func MarkdownToHTML(md string) string {
-	if md == "" {
-		return ""
-	}
+// mdConverter is the goldmark Markdown-to-HTML converter configured for Trix compatibility.
+var mdConverter = goldmark.New(
+	goldmark.WithExtensions(extension.Strikethrough),
+	goldmark.WithRendererOptions(gmhtml.WithUnsafe()),
+	goldmark.WithParserOptions(
+		parser.WithInlineParsers(
+			util.Prioritized(&escapedAtParser{}, 900),
+		),
+		parser.WithASTTransformers(
+			util.Prioritized(&trixTransformer{}, 100),
+		),
+	),
+	goldmark.WithRendererOptions(
+		renderer.WithNodeRenderers(
+			util.Prioritized(&trixRenderer{}, 500),
+		),
+	),
+)
 
-	// If input is already HTML, return unchanged to preserve existing content
-	if IsHTML(md) {
-		return md
-	}
+// TrixBreak is a custom block node that renders as <br>\n for Trix paragraph spacing.
+type TrixBreak struct{ ast.BaseBlock }
 
-	// Normalize line endings
-	md = strings.ReplaceAll(md, "\r\n", "\n")
-	md = strings.ReplaceAll(md, "\r", "\n")
+// KindTrixBreak is the node kind for TrixBreak.
+var KindTrixBreak = ast.NewNodeKind("TrixBreak")
 
-	var result strings.Builder
-	lines := strings.Split(md, "\n")
-
-	var inCodeBlock bool
-	var codeBlockLang string
-	var codeLines []string
-	var inList bool
-	var listItems []string
-	var listType string // "ul" or "ol"
-	var pendingBreak bool
-	var paraLines []string
-
-	flushPendingBreak := func() {
-		if pendingBreak {
-			result.WriteString("<br>\n")
-			pendingBreak = false
-		}
-	}
+func (n *TrixBreak) Kind() ast.NodeKind            { return KindTrixBreak }
+func (n *TrixBreak) Dump(source []byte, level int) { ast.DumpHelper(n, source, level, nil, nil) }
 
-	flushParagraph := func() {
-		if len(paraLines) > 0 {
-			flushPendingBreak()
-			text := strings.Join(paraLines, " ")
-			result.WriteString("<p>" + convertInline(text) + "</p>\n")
-			paraLines = nil
-		}
-	}
+// EscapedAt is a custom inline node that renders as literal \@.
+type EscapedAt struct{ ast.BaseInline }
 
-	flushList := func() {
-		if len(listItems) > 0 {
-			result.WriteString("<" + listType + ">\n")
-			for _, item := range listItems {
-				result.WriteString("<li>" + item + "</li>\n")
-			}
-			result.WriteString("</" + listType + ">\n")
-			listItems = nil
-			inList = false
-		}
-	}
+// KindEscapedAt is the node kind for EscapedAt.
+var KindEscapedAt = ast.NewNodeKind("EscapedAt")
 
-	for i := range lines {
-		line := lines[i]
+func (n *EscapedAt) Kind() ast.NodeKind            { return KindEscapedAt }
+func (n *EscapedAt) Dump(source []byte, level int) { ast.DumpHelper(n, source, level, nil, nil) }
 
-		// Handle code blocks
-		if after, ok := strings.CutPrefix(line, "```"); ok {
-			if inCodeBlock {
-				// End code block
-				code := strings.Join(codeLines, "\n")
-				code = escapeHTML(code)
-				if codeBlockLang != "" {
-					// Sanitize language to prevent attribute injection
-					safeLang := sanitizeLanguage(codeBlockLang)
-					result.WriteString("<pre><code class=\"language-" + safeLang + "\">" + code + "</code></pre>\n")
-				} else {
-					result.WriteString("<pre><code>" + code + "</code></pre>\n")
-				}
-				inCodeBlock = false
-				codeLines = nil
-				codeBlockLang = ""
-			} else {
-				// Start code block
-				flushParagraph()
-				flushList()
-				flushPendingBreak()
-				inCodeBlock = true
-				codeBlockLang = after
-			}
-			continue
-		}
+// escapedAtParser intercepts \@ before goldmark's standard backslash escape handling.
+type escapedAtParser struct{}
 
-		if inCodeBlock {
-			codeLines = append(codeLines, line)
-			continue
-		}
+func (p *escapedAtParser) Trigger() []byte { return []byte{'\\'} }
 
-		// Check for list items (using precompiled regexes)
-		ulMatch := ulPattern.FindStringSubmatch(line)
-		olMatch := olPattern.FindStringSubmatch(line)
-
-		if ulMatch != nil {
-			flushParagraph()
-			if !inList || listType != "ul" {
-				flushList()
-				flushPendingBreak()
-				inList = true
-				listType = "ul"
-			}
-			pendingBreak = false // blank was between items, not after the list
-			listItems = append(listItems, convertInline(ulMatch[2]))
-			continue
-		}
+func (p *escapedAtParser) Parse(_ ast.Node, block text.Reader, _ parser.Context) ast.Node {
+	line, _ := block.PeekLine()
+	if len(line) < 2 || line[0] != '\\' || line[1] != '@' {
+		return nil
+	}
+	block.Advance(2)
+	return &EscapedAt{}
+}
 
-		if olMatch != nil {
-			flushParagraph()
-			if !inList || listType != "ol" {
-				flushList()
-				flushPendingBreak()
-				inList = true
-				listType = "ol"
-			}
-			pendingBreak = false // blank was between items, not after the list
-			listItems = append(listItems, convertInline(olMatch[2]))
-			continue
-		}
+// trixTransformer modifies the AST for Trix-compatible HTML output.
+type trixTransformer struct{}
 
-		// Empty line - handle differently based on context
-		if strings.TrimSpace(line) == "" {
-			if inList {
-				// In a list: empty lines between items create spacing but don't break the list.
-				// Record pending break so content after the list gets proper separation.
-				pendingBreak = true
-				continue
-			}
-			// Not in a list: flush paragraph and record break
-			flushParagraph()
-			if result.Len() > 0 {
-				pendingBreak = true
-			}
-			continue
+func (t *trixTransformer) Transform(node *ast.Document, reader text.Reader, pc parser.Context) {
+	// Phase 1: Force tight lists; in list items and blockquotes, replace paragraphs with
+	// text blocks and soft breaks with hard ones; blockquotes also get TrixBreak separators
+	_ = ast.Walk(node, func(n ast.Node, entering bool) (ast.WalkStatus, error) {
+		if !entering {
+			return ast.WalkContinue, nil
 		}
-
-		// Check for list continuation lines (indented text that continues previous list item)
-		if inList && len(listItems) > 0 {
-			// Check if line is indented (starts with spaces or tabs)
-			if strings.HasPrefix(line, " ") || strings.HasPrefix(line, "\t") {
-				// This is a continuation of the last list item
-				trimmedLine := strings.TrimSpace(line)
-				// Append to last list item with <br> separator
-				lastItemIndex := len(listItems) - 1
-				listItems[lastItemIndex] = listItems[lastItemIndex] + "<br>\n" + convertInline(trimmedLine)
-				pendingBreak = false // blank was before continuation, not after the list
-				continue
+		switch v := n.(type) {
+		case *ast.List:
+			v.IsTight = true
+			for li := v.FirstChild(); li != nil; li = li.NextSibling() {
+				replaceParagraphsWithTextBlocks(li)
+				convertSoftBreaksToHard(li)
 			}
+		case *ast.Blockquote:
+			replaceParagraphsWithTextBlocks(v)
+			convertSoftBreaksToHard(v)
+			insertBreaksBetweenTextBlocks(v)
 		}
+		return ast.WalkContinue, nil
+	})
 
-		// Not a list item or continuation, flush any pending list
-		flushList()
-
-		// Headings
-		if strings.HasPrefix(line, "#") {
-			flushParagraph()
-			flushPendingBreak()
-		}
-		if after, ok := strings.CutPrefix(line, "######"); ok {
-			result.WriteString("<h6>" + convertInline(strings.TrimSpace(after)) + "</h6>\n")
-			continue
-		}
-		if after, ok := strings.CutPrefix(line, "#####"); ok {
-			result.WriteString("<h5>" + convertInline(strings.TrimSpace(after)) + "</h5>\n")
-			continue
-		}
-		if after, ok := strings.CutPrefix(line, "####"); ok {
-			result.WriteString("<h4>" + convertInline(strings.TrimSpace(after)) + "</h4>\n")
-			continue
+	// Phase 2: Insert TrixBreak nodes before blank-line-separated top-level blocks
+	for child := node.FirstChild(); child != nil; child = child.NextSibling() {
+		if child.HasBlankPreviousLines() && child.PreviousSibling() != nil {
+			br := &TrixBreak{}
+			node.InsertBefore(node, child, br)
 		}
-		if after, ok := strings.CutPrefix(line, "###"); ok {
-			result.WriteString("<h3>" + convertInline(strings.TrimSpace(after)) + "</h3>\n")
-			continue
-		}
-		if after, ok := strings.CutPrefix(line, "##"); ok {
-			result.WriteString("<h2>" + convertInline(strings.TrimSpace(after)) + "</h2>\n")
-			continue
-		}
-		if after, ok := strings.CutPrefix(line, "#"); ok {
-			result.WriteString("<h1>" + convertInline(strings.TrimSpace(after)) + "</h1>\n")
-			continue
+	}
+}
+
+func replaceParagraphsWithTextBlocks(parent ast.Node) {
+	for child := parent.FirstChild(); child != nil; {
+		next := child.NextSibling()
+		if p, ok := child.(*ast.Paragraph); ok {
+			tb := ast.NewTextBlock()
+			for gc := p.FirstChild(); gc != nil; {
+				gnext := gc.NextSibling()
+				tb.AppendChild(tb, gc)
+				gc = gnext
+			}
+			tb.SetLines(p.Lines())
+			parent.ReplaceChild(parent, p, tb)
 		}
+		child = next
+	}
+}
 
-		// Blockquote
-		if strings.HasPrefix(line, ">") {
-			flushParagraph()
-			flushPendingBreak()
+func convertSoftBreaksToHard(parent ast.Node) {
+	_ = ast.Walk(parent, func(n ast.Node, entering bool) (ast.WalkStatus, error) {
+		if !entering {
+			return ast.WalkContinue, nil
 		}
-		if after, ok := strings.CutPrefix(line, ">"); ok {
-			quote := strings.TrimSpace(after)
-			result.WriteString("<blockquote>" + convertInline(quote) + "</blockquote>\n")
-			continue
+		if t, ok := n.(*ast.Text); ok && t.SoftLineBreak() {
+			t.SetSoftLineBreak(false)
+			t.SetHardLineBreak(true)
 		}
+		return ast.WalkContinue, nil
+	})
+}
 
-		// Horizontal rule
-		trimmed := strings.TrimSpace(line)
-		if len(trimmed) >= 3 && (allChars(trimmed, '-') || allChars(trimmed, '*') || allChars(trimmed, '_')) {
-			flushParagraph()
-			flushPendingBreak()
-			result.WriteString("<hr>\n")
-			continue
+func insertBreaksBetweenTextBlocks(parent ast.Node) {
+	for child := parent.FirstChild(); child != nil; child = child.NextSibling() {
+		if _, ok := child.(*ast.TextBlock); ok {
+			if next := child.NextSibling(); next != nil {
+				if _, ok := next.(*ast.TextBlock); ok {
+					br := &TrixBreak{}
+					parent.InsertAfter(parent, child, br)
+				}
+			}
 		}
-
-		// Accumulate paragraph lines
-		paraLines = append(paraLines, line)
-	}
-
-	// Flush any remaining paragraph or list
-	flushParagraph()
-	flushList()
-
-	// Handle unclosed code block
-	if inCodeBlock && len(codeLines) > 0 {
-		code := strings.Join(codeLines, "\n")
-		code = escapeHTML(code)
-		result.WriteString("<pre><code>" + code + "</code></pre>\n")
 	}
-
-	return strings.TrimSpace(result.String())
 }
 
-// convertInline converts inline Markdown elements (bold, italic, links, code) to HTML.
-// Code spans and backslash escapes are protected from further processing to preserve
-// their literal content.
-func convertInline(text string) string {
-	// Protect escaped backticks before code-span detection so \` remains literal
-	// and cannot be interpreted as a code-span delimiter.
-	var escapedBackticks []string
-	text = reEscapedBacktick.ReplaceAllStringFunc(text, func(_ string) string {
-		idx := len(escapedBackticks)
-		escapedBackticks = append(escapedBackticks, "`")
-		return "\x00ESCBT" + strconv.Itoa(idx) + "\x00"
-	})
+// trixRenderer provides custom rendering for Trix-compatible HTML output.
+type trixRenderer struct{}
 
-	// Extract code spans — their content must be completely literal.
-	var codeSpans []string
-	text = reCodeSpan.ReplaceAllStringFunc(text, func(match string) string {
-		inner := reCodeSpan.FindStringSubmatch(match)
-		if len(inner) >= 2 {
-			idx := len(codeSpans)
-			codeSpans = append(codeSpans, inner[1])
-			return "\x00CODE" + strconv.Itoa(idx) + "\x00"
-		}
-		return match
-	})
-
-	// Process backslash escapes (CommonMark §2.4): a backslash before an ASCII
-	// punctuation character produces the literal character. We extract these into
-	// placeholders so they are not treated as Markdown delimiters and restore
-	// them afterward. We use attribute-safe escaping on restore because escaped
-	// punctuation can be captured inside href/src values before link/image HTML is built.
-	var escaped []string
-	text = reBackslashEscape.ReplaceAllStringFunc(text, func(match string) string {
-		idx := len(escaped)
-		escaped = append(escaped, match[1:]) // the punctuation character after the backslash
-		return "\x00ESC" + strconv.Itoa(idx) + "\x00"
-	})
+func (r *trixRenderer) RegisterFuncs(reg renderer.NodeRendererFuncRegisterer) {
+	reg.Register(ast.KindRawHTML, r.renderRawHTML)
+	reg.Register(ast.KindHTMLBlock, r.renderHTMLBlock)
+	reg.Register(ast.KindBlockquote, r.renderBlockquote)
+	reg.Register(ast.KindFencedCodeBlock, r.renderFencedCodeBlock)
+	reg.Register(KindTrixBreak, r.renderTrixBreak)
+	reg.Register(KindEscapedAt, r.renderEscapedAt)
+}
 
-	// Escape HTML entities
-	text = escapeHTML(text)
+func (r *trixRenderer) renderBlockquote(w util.BufWriter, _ []byte, _ ast.Node, entering bool) (ast.WalkStatus, error) {
+	if entering {
+		_, _ = w.WriteString("<blockquote>")
+	} else {
+		_, _ = w.WriteString("</blockquote>\n")
+	}
+	return ast.WalkContinue, nil
+}
 
-	// Bold with ** or __
-	text = reBoldStar.ReplaceAllString(text, "<strong>$1</strong>")
-	text = reBoldUnder.ReplaceAllString(text, "<strong>$1</strong>")
+func (r *trixRenderer) renderRawHTML(w util.BufWriter, source []byte, node ast.Node, entering bool) (ast.WalkStatus, error) {
+	if !entering {
+		return ast.WalkContinue, nil
+	}
+	n, ok := node.(*ast.RawHTML)
+	if !ok {
+		return ast.WalkContinue, nil
+	}
+	for i := 0; i < n.Segments.Len(); i++ {
+		seg := n.Segments.At(i)
+		_, _ = w.Write(util.EscapeHTML(seg.Value(source)))
+	}
+	return ast.WalkContinue, nil
+}
 
-	// Italic with * or _ (but not inside words for _)
-	text = reItalicStar.ReplaceAllString(text, "<em>$1</em>")
-	text = reItalicUnder.ReplaceAllStringFunc(text, func(s string) string {
-		inner := reItalicInner.FindStringSubmatch(s)
-		if len(inner) >= 2 {
-			prefix := ""
-			suffix := ""
-			if len(s) > 0 && s[0] != '_' {
-				prefix = string(s[0])
-			}
-			if len(s) > 0 && s[len(s)-1] != '_' {
-				suffix = string(s[len(s)-1])
-			}
-			return prefix + "<em>" + inner[1] + "</em>" + suffix
-		}
-		return s
-	})
+func (r *trixRenderer) renderHTMLBlock(w util.BufWriter, source []byte, node ast.Node, entering bool) (ast.WalkStatus, error) {
+	if !entering {
+		return ast.WalkContinue, nil
+	}
+	n, ok := node.(*ast.HTMLBlock)
+	if !ok {
+		return ast.WalkContinue, nil
+	}
+	lines := n.Lines()
+	parts := make([]string, 0, lines.Len()+1)
+	for i := 0; i < lines.Len(); i++ {
+		seg := lines.At(i)
+		escaped := strings.TrimRight(string(util.EscapeHTML(seg.Value(source))), "\n")
+		parts = append(parts, escaped)
+	}
+	if n.HasClosure() {
+		escaped := strings.TrimRight(string(util.EscapeHTML(n.ClosureLine.Value(source))), "\n")
+		parts = append(parts, escaped)
+	}
+	_, _ = w.WriteString("<p>" + strings.Join(parts, " ") + "</p>\n")
+	return ast.WalkContinue, nil
+}
 
-	// Images ![alt](url) - MUST come before links since image syntax contains link syntax
-	text = reImage.ReplaceAllStringFunc(text, func(match string) string {
-		parts := reImage.FindStringSubmatch(match)
-		if len(parts) >= 3 {
-			alt := escapeAttr(parts[1])
-			src := resolveDestinationEscapes(parts[2], escaped, escapedBackticks)
-			src = escapeAttr(src)
-			return `<img src="` + src + `" alt="` + alt + `">`
+// renderFencedCodeBlock emits <pre language="X"><code>...</code></pre> for syntax
+// highlighting in BC5. The SyntaxHighlightFilter looks for the language attribute
+// on <pre>, not class="language-X" on <code> (the CommonMark default).
+func (r *trixRenderer) renderFencedCodeBlock(w util.BufWriter, source []byte, node ast.Node, entering bool) (ast.WalkStatus, error) {
+	n, ok := node.(*ast.FencedCodeBlock)
+	if !ok {
+		return ast.WalkContinue, nil
+	}
+	if entering {
+		if language := n.Language(source); language != nil {
+			_, _ = w.WriteString(`<pre language="`)
+			_, _ = w.Write(util.EscapeHTML(language))
+			_, _ = w.WriteString(`"><code>`)
+		} else {
+			_, _ = w.WriteString("<pre><code>")
 		}
-		return match
-	})
-
-	// Links [text](url)
-	text = reLink.ReplaceAllStringFunc(text, func(match string) string {
-		parts := reLink.FindStringSubmatch(match)
-		if len(parts) >= 3 {
-			linkText := parts[1]
-			href := resolveDestinationEscapes(parts[2], escaped, escapedBackticks)
-			href = escapeAttr(href)
-			return `<a href="` + href + `">` + linkText + `</a>`
+		lines := n.Lines()
+		for i := 0; i < lines.Len(); i++ {
+			line := lines.At(i)
+			_, _ = w.Write(util.EscapeHTML(line.Value(source)))
 		}
-		return match
-	})
-
-	// Strikethrough ~~text~~
-	text = reStrikethrough.ReplaceAllString(text, "<del>$1</del>")
-
-	// Restore backslash-escaped characters in body text. Placeholders inside
-	// link/image destinations were already resolved with percent-encoding above.
-	escapedRendered := make([]string, len(escaped))
-	for i, ch := range escaped {
-		escapedRendered[i] = escapeAttr(ch)
+	} else {
+		_, _ = w.WriteString("</code></pre>\n")
 	}
-	text = restorePlaceholders(text, "ESC", escapedRendered)
-	text = restorePlaceholders(text, "ESCBT", escapedRenderedBackticks(escapedBackticks))
+	return ast.WalkContinue, nil
+}
 
-	// Restore code spans (HTML-escape their content since extraction now
-	// happens before escapeHTML to allow backslash-escape processing).
-	codeRendered := make([]string, len(codeSpans))
-	for i, code := range codeSpans {
-		codeRendered[i] = "<code>" + escapeHTML(code) + "</code>"
+func (r *trixRenderer) renderTrixBreak(w util.BufWriter, _ []byte, _ ast.Node, entering bool) (ast.WalkStatus, error) {
+	if !entering {
+		return ast.WalkContinue, nil
 	}
-	text = restorePlaceholders(text, "CODE", codeRendered)
-
-	return text
+	_, _ = w.WriteString("<br>\n")
+	return ast.WalkContinue, nil
 }
 
-func escapedRenderedBackticks(backticks []string) []string {
-	rendered := make([]string, len(backticks))
-	for i, bt := range backticks {
-		rendered[i] = escapeAttr(bt)
+func (r *trixRenderer) renderEscapedAt(w util.BufWriter, _ []byte, _ ast.Node, entering bool) (ast.WalkStatus, error) {
+	if !entering {
+		return ast.WalkContinue, nil
 	}
-	return rendered
+	_, _ = w.WriteString(`\@`)
+	return ast.WalkContinue, nil
 }
 
-func restorePlaceholders(text, prefix string, replacements []string) string {
-	if len(replacements) == 0 {
-		return text
+// MarkdownToHTML converts Markdown text to HTML suitable for Basecamp's rich text fields.
+// It uses goldmark with custom AST transformations for Trix editor compatibility.
+// If the input already appears to be HTML, it is returned unchanged to preserve existing formatting.
+func MarkdownToHTML(md string) string {
+	if md == "" {
+		return ""
+	}
+
+	if IsHTML(md) {
+		return md
 	}
-	pairs := make([]string, 0, len(replacements)*2)
-	for i, repl := range replacements {
-		pairs = append(pairs, "\x00"+prefix+strconv.Itoa(i)+"\x00", repl)
+
+	md = strings.ReplaceAll(md, "\r\n", "\n")
+	md = strings.ReplaceAll(md, "\r", "\n")
+
+	var buf bytes.Buffer
+	if err := mdConverter.Convert([]byte(md), &buf); err != nil {
+		return "<p>" + html.EscapeString(md) + "</p>"
 	}
-	return strings.NewReplacer(pairs...).Replace(text)
+
+	return strings.TrimSpace(buf.String())
 }
 
 // escapeHTML escapes special HTML characters.
@@ -498,73 +381,6 @@ func escapeAttr(s string) string {
 	return s
 }
 
-// percentEncodeChar percent-encodes a single byte for use in URL destinations.
-// Characters left literal match the destination-safe set derived from markdown-it:
-// !$&'()*+,-./:;=?@_~#
-// Everything else gets %XX hex encoding.
-func percentEncodeChar(ch byte) string {
-	switch {
-	case ch >= 'A' && ch <= 'Z', ch >= 'a' && ch <= 'z', ch >= '0' && ch <= '9':
-		return string(ch)
-	case ch == '!' || ch == '$' || ch == '&' || ch == '\'' ||
-		ch == '(' || ch == ')' || ch == '*' || ch == '+' ||
-		ch == ',' || ch == '-' || ch == '.' || ch == '/' ||
-		ch == ':' || ch == ';' || ch == '=' || ch == '?' ||
-		ch == '@' || ch == '_' || ch == '~' || ch == '#':
-		return string(ch)
-	default:
-		return fmt.Sprintf("%%%02X", ch)
-	}
-}
-
-// resolveDestinationEscapes restores ESC and ESCBT placeholders within a link/image
-// destination using percent-encoding instead of HTML entity escaping.
-func resolveDestinationEscapes(dest string, escaped []string, escapedBackticks []string) string {
-	for i, ch := range escaped {
-		placeholder := "\x00ESC" + strconv.Itoa(i) + "\x00"
-		if strings.Contains(dest, placeholder) {
-			var encoded strings.Builder
-			for j := range len(ch) {
-				encoded.WriteString(percentEncodeChar(ch[j]))
-			}
-			dest = strings.ReplaceAll(dest, placeholder, encoded.String())
-		}
-	}
-	for i, bt := range escapedBackticks {
-		placeholder := "\x00ESCBT" + strconv.Itoa(i) + "\x00"
-		if strings.Contains(dest, placeholder) {
-			var encoded strings.Builder
-			for j := range len(bt) {
-				encoded.WriteString(percentEncodeChar(bt[j]))
-			}
-			dest = strings.ReplaceAll(dest, placeholder, encoded.String())
-		}
-	}
-	return dest
-}
-
-// sanitizeLanguage sanitizes a code block language identifier to prevent attribute injection.
-// Only allows alphanumeric characters, hyphens, and underscores.
-func sanitizeLanguage(lang string) string {
-	var result strings.Builder
-	for _, r := range lang {
-		if unicode.IsLetter(r) || unicode.IsDigit(r) || r == '-' || r == '_' {
-			result.WriteRune(r)
-		}
-	}
-	return result.String()
-}
-
-// allChars returns true if the string consists entirely of the given character.
-func allChars(s string, c byte) bool {
-	for i := range len(s) {
-		if s[i] != c && s[i] != ' ' {
-			return false
-		}
-	}
-	return true
-}
-
 // glamourCache caches glamour renderers by width to avoid repeated construction.
 var (
 	glamourMu    sync.Mutex
@@ -647,66 +463,38 @@ func HTMLToMarkdown(html string) string {
 	html = reH5.ReplaceAllString(html, "##### $1\n\n")
 	html = reH6.ReplaceAllString(html, "###### $1\n\n")
 
-	// Blockquotes
-	html = reBlockquote.ReplaceAllStringFunc(html, func(s string) string {
+	// Blockquotes — convert inner block elements (lists, code, paragraphs) to
+	// Markdown first, then prefix each line with >. Loop handles nesting:
+	// the lazy regex matches outermost open → innermost close, so each pass
+	// converts one level and the next pass handles the enclosing level.
+	convertBlockquote := func(s string) string {
 		inner := reBlockquote.FindStringSubmatch(s)
 		if len(inner) >= 2 {
-			lines := strings.Split(strings.TrimSpace(inner[1]), "\n")
+			content := blockquoteInnerToMarkdown(inner[1])
+			lines := strings.Split(content, "\n")
 			result := make([]string, 0, len(lines))
 			for _, line := range lines {
-				result = append(result, "> "+strings.TrimSpace(line))
+				if line == "" {
+					result = append(result, ">")
+				} else {
+					result = append(result, "> "+line)
+				}
 			}
 			return strings.Join(result, "\n") + "\n\n"
 		}
 		return s
-	})
+	}
+	for reBlockquote.MatchString(html) {
+		html = reBlockquote.ReplaceAllStringFunc(html, convertBlockquote)
+	}
 
-	// Code blocks (use (?is) for case-insensitive and dotall mode to match multi-line content)
+	// Code blocks
 	html = reCodeBlock.ReplaceAllStringFunc(html, func(s string) string {
-		langMatch := reCodeLang.FindStringSubmatch(s)
-		lang := ""
-		if len(langMatch) >= 2 {
-			lang = langMatch[1]
-		}
-		codeMatch := reCodeInner.FindStringSubmatch(s)
-		if len(codeMatch) >= 2 {
-			code := unescapeHTML(codeMatch[1])
-			return "```" + lang + "\n" + code + "\n```\n\n"
-		}
-		return s
+		return convertCodeBlockHTML(s) + "\n\n"
 	})
 
-	// Unordered lists
-	html = reUL.ReplaceAllStringFunc(html, func(s string) string {
-		inner := reUL.FindStringSubmatch(s)
-		if len(inner) >= 2 {
-			items := reLI.FindAllStringSubmatch(inner[1], -1)
-			var result []string
-			for _, item := range items {
-				if len(item) >= 2 {
-					result = append(result, "- "+strings.TrimSpace(item[1]))
-				}
-			}
-			return strings.Join(result, "\n") + "\n\n"
-		}
-		return s
-	})
-
-	// Ordered lists
-	html = reOL.ReplaceAllStringFunc(html, func(s string) string {
-		inner := reOL.FindStringSubmatch(s)
-		if len(inner) >= 2 {
-			items := reLI.FindAllStringSubmatch(inner[1], -1)
-			var result []string
-			for i, item := range items {
-				if len(item) >= 2 {
-					result = append(result, strconv.Itoa(i+1)+". "+strings.TrimSpace(item[1]))
-				}
-			}
-			return strings.Join(result, "\n") + "\n\n"
-		}
-		return s
-	})
+	// Lists — use balanced-tag replacement to handle nesting correctly.
+	html = replaceBalancedListBlocks(html)
 
 	// Paragraphs
 	html = reP.ReplaceAllString(html, "$1\n\n")
@@ -789,6 +577,232 @@ func HTMLToMarkdown(html string) string {
 	return strings.TrimSpace(html)
 }
 
+// reBRLine matches a <br> tag (any case, optional "/") together with one optional
+// trailing newline, so callers can replace the pair with a single \n.
+// goldmark's hard-break output is <br>\n; Trix API content may have standalone <br>.
+var reBRLine = regexp.MustCompile(`(?i)<br\s*/?\s*>\n?`)
+
+// formatListItem converts one list item's HTML content to Markdown lines: the first
+// line gets prefix (e.g. "- " or "1. "); every later line (from <br> or \n) gets indent.
+func formatListItem(prefix, indent, content string) string {
+	content = strings.TrimSpace(content)
+	content = reBRLine.ReplaceAllString(content, "\n")
+	lines := strings.Split(content, "\n")
+	var parts []string
+	for i, line := range lines {
+		if i == 0 {
+			parts = append(parts, prefix+strings.TrimSpace(line))
+		} else {
+			// Not trimmed: preserve existing indentation from nested list conversion
+			parts = append(parts, indent+line)
+		}
+	}
+	return strings.Join(parts, "\n")
+}
+
+// convertCodeBlockHTML converts a <pre><code>...</code></pre> match to a fenced
+// Markdown block (one trailing newline of the code is trimmed); s is returned
+// unchanged when reCodeInner does not match. Entities are left escaped so that later
+// regex passes (reP, reStripTags) don't corrupt code like &lt;p&gt;; HTMLToMarkdown's final unescapeHTML converts them.
+func convertCodeBlockHTML(s string) string {
+	lang := ""
+	// Prefer <pre language="X"> (Trix/BC5 format). Fall back to
+	// <code class="language-X"> for CommonMark-formatted content (e.g. legacy
+	// stored HTML or output from other markdown renderers).
+	if match := rePreLang.FindStringSubmatch(s); len(match) >= 2 {
+		lang = match[1]
+	} else if match := reCodeLang.FindStringSubmatch(s); len(match) >= 2 {
+		lang = match[1]
+	}
+	codeMatch := reCodeInner.FindStringSubmatch(s)
+	if len(codeMatch) >= 2 {
+		code := strings.TrimSuffix(codeMatch[1], "\n")
+		return "```" + lang + "\n" + code + "\n```"
+	}
+	return s
+}
+
+// reLIOpen matches an opening <li> tag (with optional attributes); the \s guard keeps <link>/<listing> from matching.
+var reLIOpen = regexp.MustCompile(`(?i)<li(?:\s[^>]*)?>`)
+
+// hasPrefixFold reports whether s starts with prefix under strings.EqualFold (Unicode simple
+// case folding; plain case-insensitivity for the ASCII tag prefixes used here). Avoids ToLower index desync.
+func hasPrefixFold(s, prefix string) bool {
+	return len(s) >= len(prefix) && strings.EqualFold(s[:len(prefix)], prefix)
+}
+
+// extractListItems returns the content of each top-level <li> in html, tracking
+// <li> nesting depth so nested items stay inside their parent's content.
+// Nested <ul>/<ol> inside items are recursively converted to Markdown; an <li> with no matching </li> is skipped.
+func extractListItems(html string) []string {
+	var items []string
+	i := 0
+	for {
+		// Find next top-level <li> opening tag (regex is case-insensitive)
+		loc := reLIOpen.FindStringIndex(html[i:])
+		if loc == nil {
+			break
+		}
+		contentStart := i + loc[1]
+
+		// Walk forward tracking <li> depth to find the matching </li>, hopping '<' to '<'.
+		// The nested-<li> probe only looks as far as the tag's own '>' so the walk stays linear.
+		depth := 1
+		j := contentStart
+		for j < len(html) && depth > 0 {
+			idx := strings.IndexByte(html[j:], '<')
+			if idx == -1 {
+				j = len(html)
+				break
+			}
+			j += idx
+			if hasPrefixFold(html[j:], "</li>") {
+				depth--
+				if depth == 0 {
+					content := html[contentStart:j]
+					content = replaceBalancedListBlocks(content)
+					items = append(items, content)
+					j += 5
+					break
+				}
+				j += 5
+			} else if loc := reLIOpen.FindStringIndex(html[j : j+1+max(0, strings.IndexByte(html[j:], '>'))]); loc != nil && loc[0] == 0 {
+				depth++
+				j += loc[1]
+			} else {
+				j++
+			}
+		}
+		i = j
+	}
+	return items
+}
+
+var reListOpen = regexp.MustCompile(`(?i)<(ul|ol)(?:\s[^>]*)?>`) // opening <ul>/<ol> tag; group 1 is the tag name
+
+// replaceBalancedListBlocks finds top-level <ul>/<ol> blocks by tracking tag depth and
+// replaces each with its Markdown plus a blank line; text outside lists is copied through.
+// Handles nesting where lazy/greedy regexes cannot. An unclosed list and everything after it is emitted unchanged.
+func replaceBalancedListBlocks(html string) string {
+	var result strings.Builder
+	// Track last written byte to avoid materializing result.String() in the loop.
+	var lastByte byte
+	writeString := func(s string) {
+		if len(s) > 0 {
+			lastByte = s[len(s)-1]
+			result.WriteString(s)
+		}
+	}
+	writeByte := func(b byte) {
+		lastByte = b
+		result.WriteByte(b)
+	}
+
+	i := 0
+	for {
+		loc := reListOpen.FindStringSubmatchIndex(html[i:])
+		if loc == nil {
+			writeString(html[i:])
+			break
+		}
+		matchStart := i + loc[0]
+		tag := strings.ToLower(html[i+loc[2] : i+loc[3]]) // "ul" or "ol"
+		contentStart := i + loc[1]
+
+		writeString(html[i:matchStart])
+
+		depth := 1
+		j := contentStart
+		for j < len(html) && depth > 0 {
+			// Jump to next '<'; the nested-open probe below is capped at the tag's '>' so the walk stays linear
+			idx := strings.IndexByte(html[j:], '<')
+			if idx == -1 {
+				j = len(html)
+				break
+			}
+			j += idx
+			// Decrement for any list close tag (handles mixed <ul>/<ol> nesting)
+			if hasPrefixFold(html[j:], "</ul>") || hasPrefixFold(html[j:], "</ol>") {
+				closeLen := 5 // len("</ul>") == len("</ol>")
+				depth--
+				if depth == 0 {
+					inner := html[contentStart:j]
+					var md string
+					if tag == "ul" {
+						md = convertULInner(inner)
+					} else {
+						md = convertOLInner(inner)
+					}
+					if lastByte != 0 && lastByte != '\n' {
+						writeByte('\n')
+					}
+					writeString(md + "\n\n")
+					j += closeLen
+					break
+				}
+				j += closeLen
+			} else if loc := reListOpen.FindStringIndex(html[j : j+1+max(0, strings.IndexByte(html[j:], '>'))]); loc != nil && loc[0] == 0 {
+				depth++
+				j += loc[1]
+			} else {
+				j++
+			}
+		}
+		if depth > 0 {
+			// Unclosed tag — write original text
+			writeString(html[matchStart:])
+			break
+		}
+		i = j
+	}
+	return result.String()
+}
+
+// convertULInner converts inner <ul> content (between <ul> and </ul>) to Markdown: one "- " bullet per top-level <li>, continuation lines indented two spaces.
+func convertULInner(inner string) string {
+	items := extractListItems(inner)
+	result := make([]string, 0, len(items))
+	for _, content := range items {
+		result = append(result, formatListItem("- ", "  ", content))
+	}
+	return strings.Join(result, "\n")
+}
+
+// convertOLInner converts inner <ol> content (between <ol> and </ol>) to Markdown: items are numbered 1, 2, 3… by position, continuation lines indented to the prefix width.
+func convertOLInner(inner string) string {
+	items := extractListItems(inner)
+	result := make([]string, 0, len(items))
+	for i, content := range items {
+		prefix := strconv.Itoa(i+1) + ". "
+		indent := strings.Repeat(" ", len(prefix))
+		result = append(result, formatListItem(prefix, indent, content))
+	}
+	return strings.Join(result, "\n")
+}
+
+// blockquoteInnerToMarkdown converts the inner HTML of a blockquote to Markdown without "> " prefixes,
+// handling nested block elements (code blocks first, then lists) before line-level operations.
+func blockquoteInnerToMarkdown(inner string) string {
+	content := strings.TrimSpace(inner)
+	content = reCodeBlock.ReplaceAllStringFunc(content, func(s string) string {
+		return convertCodeBlockHTML(s) + "\n\n"
+	})
+	content = replaceBalancedListBlocks(content)
+	// Replace </p> with double newline (paragraph break) to separate adjacent blocks,
+	// then strip <p> openers. Two passes so <p>para1</p><p>para2</p> produces
+	// "para1\n\npara2" (the blank line separates the paragraphs) rather than "para1para2".
+	content = reClosingP.ReplaceAllString(content, "\n\n")
+	content = reOpeningP.ReplaceAllString(content, "")
+	content = reBRLine.ReplaceAllString(content, "\n")
+	content = reMultiNewline.ReplaceAllString(content, "\n\n")
+	return strings.TrimSpace(content)
+}
+
+var (
+	reOpeningP = regexp.MustCompile(`(?i)<p(?:\s[^>]*)?>`) // <p> or <p attrs>; the \s guard keeps <pre> from matching
+	reClosingP = regexp.MustCompile(`(?i)</p>`)            // closing </p>, any case
+)
+
 // unescapeHTML converts HTML entities back to their characters.
 func unescapeHTML(s string) string {
 	s = strings.ReplaceAll(s, "&amp;", "&")
@@ -934,7 +948,7 @@ func resolveMentionAnchors(html string, lookupByID PersonByIDFunc) (string, erro
 		switch scheme {
 		case "mention":
 			// Zero API calls — use value as SGID, link text as display name (caller-trusted).
-			// Unescape HTML because convertInline already escaped the link text (e.g. & → &amp;)
+			// Unescape HTML because goldmark already escaped the link text (e.g. & → &amp;)
 			// and MentionToHTML will re-escape — without this we'd double-encode.
 			name := unescapeHTML(strings.TrimPrefix(displayText, "@"))
 			tag = MentionToHTML(value, name)
diff --git a/internal/richtext/richtext_test.go b/internal/richtext/richtext_test.go
index 42796be7..46726ca4 100644
--- a/internal/richtext/richtext_test.go
+++ b/internal/richtext/richtext_test.go
@@ -80,7 +80,7 @@ func TestMarkdownToHTML(t *testing.T) {
 		{
 			name:     "ordered list with trailing spaces and descriptions",
 			input:    "1. **Item** - [Link](url) (time)  \n   Description here\n\n2. **Next** - [Link](url)",
-			expected: "<ol>\n<li><strong>Item</strong> - <a href=\"url\">Link</a> (time)  <br>\nDescription here</li>\n<li><strong>Next</strong> - <a href=\"url\">Link</a></li>\n</ol>",
+			expected: "<ol>\n<li><strong>Item</strong> - <a href=\"url\">Link</a> (time)<br>\nDescription here</li>\n<li><strong>Next</strong> - <a href=\"url\">Link</a></li>\n</ol>",
 		},
 		{
 			name:     "list followed by blank line then paragraph",
@@ -88,9 +88,12 @@ func TestMarkdownToHTML(t *testing.T) {
 			expected: "<ul>\n<li>Item 1</li>\n<li>Item 2</li>\n</ul>\n<br>\n<p>Following paragraph.</p>",
 		},
 		{
-			name:     "blank between list items does not leak break after list",
+			// CommonMark §5.2 (list items, laziness rule): "After" is a lazy continuation of the second list item.
+			// goldmark treats non-indented continuation lines as part of the list item,
+			// unlike our previous hand-rolled parser which ended the list.
+			name:     "lazy continuation stays in list item",
 			input:    "- One\n\n- Two\nAfter",
-			expected: "<ul>\n<li>One</li>\n<li>Two</li>\n</ul>\n<p>After</p>",
+			expected: "<ul>\n<li>One</li>\n<li>Two<br>\nAfter</li>\n</ul>",
 		},
 		{
 			name:     "blockquote",
@@ -100,12 +103,12 @@ func TestMarkdownToHTML(t *testing.T) {
 		{
 			name:     "code block",
 			input:    "```go\nfunc main() {}\n```",
-			expected: `<pre><code class="language-go">func main() {}</code></pre>`,
+			expected: "<pre language=\"go\"><code>func main() {}\n</code></pre>",
 		},
 		{
 			name:     "code block without language",
 			input:    "```\nsome code\n```",
-			expected: "<pre><code>some code</code></pre>",
+			expected: "<pre><code>some code\n</code></pre>",
 		},
 		{
 			name:     "horizontal rule with dashes",
@@ -150,7 +153,7 @@ func TestMarkdownToHTML(t *testing.T) {
 		{
 			name:     "consecutive lines join into one paragraph",
 			input:    "Line one\nLine two",
-			expected: "<p>Line one Line two</p>",
+			expected: "<p>Line one\nLine two</p>",
 		},
 		{
 			name:     "blank line before list",
@@ -160,7 +163,7 @@ func TestMarkdownToHTML(t *testing.T) {
 		{
 			name:     "blank line before code block",
 			input:    "Intro\n\n```\ncode\n```",
-			expected: "<p>Intro</p>\n<br>\n<pre><code>code</code></pre>",
+			expected: "<p>Intro</p>\n<br>\n<pre><code>code\n</code></pre>",
 		},
 		{
 			name:     "leading blank lines ignored",
@@ -195,12 +198,13 @@ func TestMarkdownToHTML(t *testing.T) {
 		{
 			name:     "code fence flushes accumulated paragraph",
 			input:    "Text\n```go\nx\n```",
-			expected: "<p>Text</p>\n<pre><code class=\"language-go\">x</code></pre>",
+			expected: "<p>Text</p>\n<pre language=\"go\"><code>x\n</code></pre>",
 		},
 		{
-			name:     "horizontal rule flushes accumulated paragraph",
+			// CommonMark: "Text\n---" is a setext heading (h2), not paragraph + hr
+			name:     "setext heading level 2",
 			input:    "Text\n---",
-			expected: "<p>Text</p>\n<hr>",
+			expected: "<h2>Text</h2>",
 		},
 		{
 			name:     "code span containing HTML tag is converted not passthrough",
@@ -210,7 +214,7 @@ func TestMarkdownToHTML(t *testing.T) {
 		{
 			name:     "fenced code block containing HTML tags is converted",
 			input:    "intro\n\n```\n<div>hello</div>\n```",
-			expected: "<p>intro</p>\n<br>\n<pre><code>&lt;div&gt;hello&lt;/div&gt;</code></pre>",
+			expected: "<p>intro</p>\n<br>\n<pre><code>&lt;div&gt;hello&lt;/div&gt;\n</code></pre>",
 		},
 	}
 
@@ -301,9 +305,10 @@ func TestMarkdownToHTMLBackslashEscapes(t *testing.T) {
 			expected: `<p><a href="https://example.com/?q=%22hi%22">x</a></p>`,
 		},
 		{
+			// goldmark treats \% as literal % in URLs (CommonMark spec)
 			name:     "escaped percent in link destination",
 			input:    `[x](https://example.com/\%20)`,
-			expected: `<p><a href="https://example.com/%2520">x</a></p>`,
+			expected: `<p><a href="https://example.com/%20">x</a></p>`,
 		},
 		{
 			name:     "escaped backslash in link destination",
@@ -323,7 +328,7 @@ func TestMarkdownToHTMLBackslashEscapes(t *testing.T) {
 		{
 			name:     "escaped percent in image src",
 			input:    `![alt](https://example.com/\%20.png)`,
-			expected: `<p><img src="https://example.com/%2520.png" alt="alt"></p>`,
+			expected: `<p><img src="https://example.com/%20.png" alt="alt"></p>`,
 		},
 		{
 			name:     "literal-safe chars stay literal in link destination",
@@ -393,6 +398,494 @@ func TestMarkdownToHTMLBackslashEscapes(t *testing.T) {
 	}
 }
 
+func TestMarkdownToHTMLBackslashAtCounts(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		expected string
+	}{
+		{
+			name:     "single backslash at",
+			input:    `\@John`,
+			expected: `<p>\@John</p>`,
+		},
+		{
+			name:     "double backslash at",
+			input:    `\\@John`,
+			expected: `<p>\@John</p>`,
+		},
+		{
+			name:     "triple backslash at",
+			input:    `\\\@John`,
+			expected: `<p>\\@John</p>`,
+		},
+		{
+			name:     "quadruple backslash at",
+			input:    `\\\\@John`,
+			expected: `<p>\\@John</p>`,
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := MarkdownToHTML(tt.input)
+			if result != tt.expected {
+				t.Errorf("MarkdownToHTML(%q)\ngot:  %q\nwant: %q", tt.input, result, tt.expected)
+			}
+		})
+	}
+}
+
+func TestMarkdownToHTMLMultiParagraphBlockquote(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		expected string
+	}{
+		{
+			name:     "single line",
+			input:    "> text",
+			expected: "<blockquote>text</blockquote>",
+		},
+		{
+			name:     "multiline",
+			input:    "> line1\n> line2",
+			expected: "<blockquote>line1<br>\nline2</blockquote>",
+		},
+		{
+			name:     "multi-paragraph",
+			input:    "> para1\n>\n> para2",
+			expected: "<blockquote>para1\n<br>\npara2</blockquote>",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := MarkdownToHTML(tt.input)
+			if result != tt.expected {
+				t.Errorf("MarkdownToHTML(%q)\ngot:  %q\nwant: %q", tt.input, result, tt.expected)
+			}
+		})
+	}
+}
+
+func TestMarkdownToHTMLRawHTMLBlock(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		expected string
+	}{
+		{
+			name:     "single-line script tag",
+			input:    "<script>alert(1)</script>",
+			expected: "<p>&lt;script&gt;alert(1)&lt;/script&gt;</p>",
+		},
+		{
+			name:     "multiline script tag",
+			input:    "<script>\nalert(1)\n</script>",
+			expected: "<p>&lt;script&gt; alert(1) &lt;/script&gt;</p>",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := MarkdownToHTML(tt.input)
+			if result != tt.expected {
+				t.Errorf("MarkdownToHTML(%q)\ngot:  %q\nwant: %q", tt.input, result, tt.expected)
+			}
+		})
+	}
+}
+
+// Tag-match regexes use (?:\s[^>]*)? to require whitespace or `>` after the
+// tag name. Without that, `<p[^>]*>` false-matches `<pre>`, `<b[^>]*>` matches
+// `<br>`, `<em[^>]*>` matches `<embed>`, etc. — leading to garbled output when
+// such tag prefixes coexist with their matching close tags elsewhere.
+func TestHTMLToMarkdownTagBoundaries(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		expected string
+	}{
+		{
+			// Without the boundary, <p[^>]*>.*?</p> would match
+			// "<pre>" ... "</p>" across the pre block.
+			name:     "p does not match pre",
+			input:    "<pre><code>keep</code></pre><p>tail</p>",
+			expected: "```\nkeep\n```\n\ntail",
+		},
+		{
+			// Without the boundary, <b[^>]*>.*?</b> would match
+			// "<br>" ... "</b>" eating the line break.
+			name:     "b does not match br",
+			input:    "text<br>and <b>bold</b>",
+			expected: "text\nand **bold**",
+		},
+		{
+			// Without the boundary, <em[^>]*>.*?</em> would match
+			// "<embed" ... "</em>".
+			name:     "em does not match embed",
+			input:    "<embed src=\"x\"><em>real</em>",
+			expected: "*real*",
+		},
+		{
+			// Without the boundary, <i[^>]*>.*?</i> would match
+			// "<img" ... "</i>".
+			name:     "i does not match img",
+			input:    "<img src=\"x.png\" alt=\"a\"> then <i>italic</i>",
+			expected: "![a](x.png) then *italic*",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := HTMLToMarkdown(tt.input)
+			if result != tt.expected {
+				t.Errorf("HTMLToMarkdown(%q)\ngot:  %q\nwant: %q", tt.input, result, tt.expected)
+			}
+		})
+	}
+}
+
+// BC5's SyntaxHighlightFilter converts <pre language="X"> into a Stimulus
+// controller that triggers Prism.js. The CommonMark convention
+// (<code class="language-X">) does not trigger highlighting.
+func TestMarkdownToHTMLCodeBlockSyntaxHighlight(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		expected string
+	}{
+		{
+			name:     "language emits pre[language] not code[class]",
+			input:    "```ruby\ndef hello; end\n```",
+			expected: "<pre language=\"ruby\"><code>def hello; end\n</code></pre>",
+		},
+		{
+			name:     "language with hyphen",
+			input:    "```objective-c\nreturn nil;\n```",
+			expected: "<pre language=\"objective-c\"><code>return nil;\n</code></pre>",
+		},
+		{
+			name:     "no language omits attribute",
+			input:    "```\nplain\n```",
+			expected: "<pre><code>plain\n</code></pre>",
+		},
+		{
+			name:     "html content escaped",
+			input:    "```html\n<div>hi</div>\n```",
+			expected: "<pre language=\"html\"><code>&lt;div&gt;hi&lt;/div&gt;\n</code></pre>",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := MarkdownToHTML(tt.input)
+			if result != tt.expected {
+				t.Errorf("MarkdownToHTML(%q)\ngot:  %q\nwant: %q", tt.input, result, tt.expected)
+			}
+		})
+	}
+}
+
+// HTMLToMarkdown must recognize both the Trix/BC5 format (<pre language="X">)
+// and the legacy CommonMark format (<code class="language-X">) so round-trips
+// work for content stored in either form.
+func TestHTMLToMarkdownCodeBlockLanguageFormats(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		expected string
+	}{
+		{
+			name:     "pre language attribute",
+			input:    `<pre language="go"><code>func main() {}</code></pre>`,
+			expected: "```go\nfunc main() {}\n```",
+		},
+		{
+			name:     "code class attribute (legacy)",
+			input:    `<pre><code class="language-go">func main() {}</code></pre>`,
+			expected: "```go\nfunc main() {}\n```",
+		},
+		{
+			name:     "pre language preferred over code class",
+			input:    `<pre language="ruby"><code class="language-go">x</code></pre>`,
+			expected: "```ruby\nx\n```",
+		},
+		{
+			name:     "no language",
+			input:    `<pre><code>plain</code></pre>`,
+			expected: "```\nplain\n```",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := HTMLToMarkdown(tt.input)
+			if result != tt.expected {
+				t.Errorf("HTMLToMarkdown(%q)\ngot:  %q\nwant: %q", tt.input, result, tt.expected)
+			}
+		})
+	}
+}
+
+func TestHTMLToMarkdownMultilineBlockquote(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		expected string
+	}{
+		{
+			name:     "single paragraph",
+			input:    "<blockquote>\n<p>text</p>\n</blockquote>",
+			expected: "> text",
+		},
+		{
+			name:     "adjacent paragraphs",
+			input:    "<blockquote><p>para1</p><p>para2</p></blockquote>",
+			expected: "> para1\n>\n> para2",
+		},
+		{
+			name:     "paragraph then list",
+			input:    "<blockquote><p>intro</p><ul><li>one</li><li>two</li></ul></blockquote>",
+			expected: "> intro\n>\n> - one\n> - two",
+		},
+		{
+			name:     "paragraph then code block",
+			input:    "<blockquote><p>intro</p><pre><code>code</code></pre></blockquote>",
+			expected: "> intro\n>\n> ```\n> code\n> ```",
+		},
+		{
+			name:     "code block then paragraph",
+			input:    "<blockquote><pre><code>code</code></pre><p>tail</p></blockquote>",
+			expected: "> ```\n> code\n> ```\n>\n> tail",
+		},
+		{
+			name:     "code block then nested blockquote",
+			input:    "<blockquote><pre><code>code</code></pre><blockquote>nested</blockquote></blockquote>",
+			expected: "> ```\n> code\n> ```\n>\n> > nested",
+		},
+		{
+			name:     "whitespace-separated paragraphs",
+			input:    "<blockquote>\n<p>para1</p>\n<p>para2</p>\n</blockquote>",
+			expected: "> para1\n>\n> para2",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := HTMLToMarkdown(tt.input)
+			if result != tt.expected {
+				t.Errorf("HTMLToMarkdown(%q)\ngot:  %q\nwant: %q", tt.input, result, tt.expected)
+			}
+		})
+	}
+}
+
+func TestHTMLToMarkdownMultilineParagraph(t *testing.T) {
+	input := "<p>line1\nline2</p>"
+	result := HTMLToMarkdown(input)
+	if !strings.Contains(result, "line1") || !strings.Contains(result, "line2") {
+		t.Errorf("HTMLToMarkdown(%q)\ngot:  %q\nmissing content", input, result)
+	}
+}
+
+func TestHTMLToMarkdownCodeFenceNewline(t *testing.T) {
+	input := "<pre><code>func main() {}\n</code></pre>"
+	result := HTMLToMarkdown(input)
+	if strings.Contains(result, "\n\n```") {
+		t.Errorf("HTMLToMarkdown(%q) has extra blank line before closing fence\ngot: %q", input, result)
+	}
+	if !strings.Contains(result, "func main() {}") {
+		t.Errorf("HTMLToMarkdown(%q) missing code content\ngot: %q", input, result)
+	}
+}
+
+func TestHTMLToMarkdownCodePreservesHTMLEntities(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		contains string
+	}{
+		{
+			name:     "p tags in code block survive reP and reStripTags",
+			input:    "<pre><code>&lt;p&gt;\nhi\n&lt;/p&gt;\n</code></pre>",
+			contains: "<p>\nhi\n</p>",
+		},
+		{
+			name:     "div tags in code block survive reStripTags",
+			input:    "<pre><code>&lt;div&gt;hello&lt;/div&gt;</code></pre>",
+			contains: "<div>hello</div>",
+		},
+		{
+			name:     "p tags in blockquoted code block",
+			input:    "<blockquote><pre><code>&lt;p&gt;\nhi\n&lt;/p&gt;\n</code></pre></blockquote>",
+			contains: "<p>\n> hi\n> </p>",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := HTMLToMarkdown(tt.input)
+			if !strings.Contains(result, tt.contains) {
+				t.Errorf("HTMLToMarkdown(%q)\ngot:     %q\nmissing: %q", tt.input, result, tt.contains)
+			}
+		})
+	}
+}
+
+func TestHTMLToMarkdownNestedLists(t *testing.T) {
+	tests := []struct {
+		name     string
+		input    string
+		expected string
+	}{
+		{
+			name:     "nested ul compact",
+			input:    "<ul><li>parent<ul><li>child</li></ul></li></ul>",
+			expected: "- parent\n  - child",
+		},
+		{
+			name:     "nested ul with whitespace",
+			input:    "<ul>\n<li>parent\n<ul>\n<li>child</li>\n</ul>\n</li>\n</ul>",
+			expected: "- parent\n  - child",
+		},
+		{
+			name:     "nested ol",
+			input:    "<ol><li>parent<ol><li>child</li></ol></li></ol>",
+			expected: "1. parent\n   1. child",
+		},
+		{
+			name:     "mixed nesting ul then ol",
+			input:    "<ul><li>parent<ol><li>child</li></ol></li></ul>",
+			expected: "- parent\n  1. child",
+		},
+		{
+			name:     "mixed nesting ol then ul",
+			input:    "<ol><li>parent<ul><li>child</li></ul></li></ol>",
+			expected: "1. parent\n   - child",
+		},
+		{
+			name:     "3-level nesting",
+			input:    "<ul><li>a<ul><li>b<ul><li>c</li></ul></li></ul></li></ul>",
+			expected: "- a\n  - b\n    - c",
+		},
+		{
+			name:     "uppercase tags",
+			input:    "<UL><LI>one</LI><LI>two</LI></UL>",
+			expected: "- one\n- two",
+		},
+		{
+			name:     "nested blockquote",
+			input:    "<blockquote><blockquote>nested</blockquote></blockquote>",
+			expected: "> > nested",
+		},
+		{
+			name:     "sibling lists preserved",
+			input:    "<ul><li>a</li></ul><p>text</p><ul><li>b</li></ul>",
+			expected: "- a\n\ntext\n\n- b",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			result := HTMLToMarkdown(tt.input)
+			if result != tt.expected {
+				t.Errorf("HTMLToMarkdown(%q)\ngot:  %q\nwant: %q", tt.input, result, tt.expected)
+			}
+		})
+	}
+}
+
+func TestEditLoopRoundTrip(t *testing.T) {
+	tests := []struct {
+		name     string
+		markdown string
+		expected string // exact expected round-trip output
+	}{
+		{
+			name:     "blockquote",
+			markdown: "> A quote",
+			expected: "> A quote",
+		},
+		{
+			name:     "multiline blockquote",
+			markdown: "> line1\n> line2",
+			expected: "> line1\n> line2",
+		},
+		{
+			name:     "multi-paragraph blockquote",
+			markdown: "> para1\n>\n> para2",
+			expected: "> para1\n>\n> para2",
+		},
+		{
+			name:     "unordered list",
+			markdown: "- One\n- Two\n- Three",
+			expected: "- One\n- Two\n- Three",
+		},
+		{
+			name:     "list with continuation",
+			markdown: "1. First\n   Desc\n\n2. Second\n   More",
+			expected: "1. First\n   Desc\n2. Second\n   More",
+		},
+		{
+			name:     "code fence",
+			markdown: "```go\nfunc main() {}\n```",
+			expected: "```go\nfunc main() {}\n```",
+		},
+		{
+			name:     "heading",
+			markdown: "# Title",
+			expected: "# Title",
+		},
+		{
+			name:     "quoted list",
+			markdown: "> - One\n>   Two",
+			expected: "> - One\n>   Two",
+		},
+		{
+			name:     "quoted code fence",
+			markdown: "> ```\n> code\n> ```",
+			expected: "> ```\n> code\n> ```",
+		},
+		{
+			name:     "quoted ordered list",
+			markdown: "> 1. First\n> 2. Second",
+			expected: "> 1. First\n> 2. Second",
+		},
+		{
+			name:     "nested unordered list",
+			markdown: "- parent\n  - child",
+			expected: "- parent\n  - child",
+		},
+		{
+			name:     "nested ordered list",
+			markdown: "1. parent\n   1. child",
+			expected: "1. parent\n   1. child",
+		},
+		{
+			name:     "nested blockquote",
+			markdown: "> > nested",
+			expected: "> > nested",
+		},
+		{
+			name:     "mixed content",
+			markdown: "# Title\n\nSome **bold** text.\n\n- Item 1\n- Item 2\n\n> A quote\n\n```\ncode\n```",
+			expected: "# Title\n\nSome **bold** text.\n\n- Item 1\n- Item 2\n\n> A quote\n\n```\ncode\n```",
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			html := MarkdownToHTML(tt.markdown)
+			back := HTMLToMarkdown(html)
+			if back != tt.expected {
+				t.Errorf("round-trip mismatch\nmarkdown: %q\nhtml:     %q\ngot:      %q\nwant:     %q", tt.markdown, html, back, tt.expected)
+			}
+		})
+	}
+}
+
 func TestHTMLToMarkdown(t *testing.T) {
 	tests := []struct {
 		name     string