fix(ui): allow XML tag for markdown rich input (#6095)

jocelynlin-wd · web-flow · commit 7df6e95c40fa · 2026-04-02T09:02:07.000-07:00
* fix(ui): allow XML tag for rich input

- Introduced utilities for escaping and unescaping non-standard XML/HTML tags to preserve them during markdown processing.
- Updated RichInput and ExpandRichInputDialog components to utilize the new XML tag utilities for handling custom tags.
- Added Jest configuration for the UI package and created tests for the XML tag utilities to ensure functionality.
- Updated package.json to include Jest as a dependency and added a test script.

* address code review comments from Gemini

* allow html tag in markdown editor

* add test case for markdown format

* update dependency in ui
diff --git a/packages/server/src/utils/buildAgentflow.ts b/packages/server/src/utils/buildAgentflow.ts
@@ -247,8 +247,11 @@ export const resolveVariables = async (
         // If value is not a string, return as is
         if (typeof value !== 'string') return value
 
-        // Convert legacy HTML content to markdown, preserving any markdown syntax within
-        if (/<[a-z][a-z0-9]*[^>]*>/i.test(value)) {
+        // Convert legacy HTML content to markdown, preserving any markdown syntax within.
+        // Legacy content from old getHTML() starts with a TipTap block tag (e.g. <p>text</p>).
+        // Anchor with ^ to avoid matching intentional HTML/XML tags in user prompts
+        // (e.g. <instruction><div>...</div></instruction>).
+        if (/^\s*<(?:p|div|h[1-6]|ul|ol|blockquote|pre|table)\b/i.test(value)) {
             const turndownService = new TurndownService()
             // Disable escaping so markdown characters (e.g. ###, -, *) inside HTML are preserved as-is
             turndownService.escape = (str: string) => str
diff --git a/packages/ui/jest.config.js b/packages/ui/jest.config.js
@@ -0,0 +1,14 @@
+// Jest setup for the UI package: runs *.test.js files under src/ in a Node environment.
+const jestConfig = {
+    // Only look for tests and modules below src/
+    roots: ['<rootDir>/src'],
+    testEnvironment: 'node',
+    testMatch: ['<rootDir>/src/**/*.test.js'],
+    testPathIgnorePatterns: ['/node_modules/', '/build/'],
+    moduleNameMapper: {
+        // Style and image imports resolve to an empty stub module
+        '\\.(css|less|scss|sass|svg|png|jpg|jpeg|gif|webp)$': '<rootDir>/src/__mocks__/styleMock.js',
+        // Resolve the "@/..." import alias to src/
+        '^@/(.*)$': '<rootDir>/src/$1'
+    },
+    // .js and .jsx sources go through babel-jest; node_modules is left untransformed
+    transform: {
+        '^.+\\.jsx?$': 'babel-jest'
+    },
+    transformIgnorePatterns: ['/node_modules/']
+}
+
+module.exports = jestConfig
diff --git a/packages/ui/package.json b/packages/ui/package.json
@@ -26,6 +26,7 @@
         "@mui/x-tree-view": "^7.25.0",
         "@reduxjs/toolkit": "^2.2.7",
         "@tabler/icons-react": "^3.30.0",
+        "@tiptap/core": "^3.20.4",
         "@tiptap/extension-code-block-lowlight": "^3.20.4",
         "@tiptap/extension-mention": "^3.20.4",
         "@tiptap/extension-placeholder": "^3.20.4",
@@ -81,11 +82,20 @@
         "dev": "vite",
         "start": "vite",
         "build": "vite build",
+        "test": "jest",
         "clean": "rimraf build",
         "nuke": "rimraf build node_modules .turbo"
     },
     "babel": {
         "presets": [
+            [
+                "@babel/preset-env",
+                {
+                    "targets": {
+                        "node": "current"
+                    }
+                }
+            ],
             "@babel/preset-react"
         ]
     },
@@ -108,6 +118,7 @@
         "@testing-library/react": "^14.0.0",
         "@testing-library/user-event": "^12.8.3",
         "@vitejs/plugin-react": "^4.2.0",
+        "jest": "^29.7.0",
         "pretty-quick": "^3.1.3",
         "react-scripts": "^5.0.1",
         "rimraf": "^5.0.5",
diff --git a/packages/ui/src/__mocks__/styleMock.js b/packages/ui/src/__mocks__/styleMock.js
@@ -0,0 +1 @@
+// Empty stub that Jest substitutes for style and image imports (see moduleNameMapper in jest.config.js).
+module.exports = {}
diff --git a/packages/ui/src/ui-component/dialog/ExpandRichInputDialog.jsx b/packages/ui/src/ui-component/dialog/ExpandRichInputDialog.jsx
@@ -23,15 +23,10 @@ import { common, createLowlight } from 'lowlight'
 import { suggestionOptions } from '@/ui-component/input/suggestionOption'
 import { getAvailableNodesForVariable } from '@/utils/genericHelper'
 import { CustomMention } from '@/utils/customMention'
+import { isHtmlContent, escapeXmlTags, unescapeXmlEntities, unescapeXmlTags } from '@/utils/xmlTagUtils'
 
 const lowlight = createLowlight(common)
 
-// Detect if content is legacy HTML (from old getHTML() storage) vs markdown
-const isHtmlContent = (content) => {
-    if (!content || typeof content !== 'string') return false
-    return /<(?:p|div|span|h[1-6]|ul|ol|li|br|code|pre|blockquote|table|strong|em)\b/i.test(content)
-}
-
 // Store
 import { HIDE_CANVAS_DIALOG, SHOW_CANVAS_DIALOG } from '@/store/actions'
 
@@ -221,7 +216,7 @@ const ExpandRichInputDialog = ({ show, dialogProps, onCancel, onInputHintDialogC
             onUpdate: ({ editor }) => {
                 if (!isSwitchingRef.current) {
                     try {
-                        setInputValue(editor.getMarkdown())
+                        setInputValue(unescapeXmlTags(editor.getMarkdown()))
                     } catch {
                         setInputValue(editor.getHTML())
                     }
@@ -239,12 +234,13 @@ const ExpandRichInputDialog = ({ show, dialogProps, onCancel, onInputHintDialogC
             if (isHtmlContent(inputValue)) {
                 editor.commands.setContent(inputValue)
                 try {
-                    setInputValue(editor.getMarkdown())
+                    setInputValue(unescapeXmlTags(editor.getMarkdown()))
                 } catch {
                     // keep original value if conversion fails
                 }
             } else {
-                editor.commands.setContent(inputValue, { contentType: 'markdown' })
+                editor.commands.setContent(escapeXmlTags(inputValue), { contentType: 'markdown' })
+                editor.commands.setContent(unescapeXmlEntities(editor.getJSON()))
             }
             isSwitchingRef.current = false
         }
@@ -265,13 +261,17 @@ const ExpandRichInputDialog = ({ show, dialogProps, onCancel, onInputHintDialogC
 
             if (newMode === 'preview' && editor) {
                 isSwitchingRef.current = true
-                const contentType = isHtmlContent(inputValue) ? 'html' : 'markdown'
-                editor.commands.setContent(inputValue, { contentType })
+                if (isHtmlContent(inputValue)) {
+                    editor.commands.setContent(inputValue, { contentType: 'html' })
+                } else {
+                    editor.commands.setContent(escapeXmlTags(inputValue), { contentType: 'markdown' })
+                    editor.commands.setContent(unescapeXmlEntities(editor.getJSON()))
+                }
                 isSwitchingRef.current = false
                 setTimeout(() => editor.commands.focus(), 50)
             } else if (newMode === 'raw' && editor) {
                 try {
-                    setInputValue(editor.getMarkdown())
+                    setInputValue(unescapeXmlTags(editor.getMarkdown()))
                 } catch {
                     setInputValue(editor.getHTML())
                 }
diff --git a/packages/ui/src/ui-component/input/RichInput.jsx b/packages/ui/src/ui-component/input/RichInput.jsx
@@ -13,15 +13,10 @@ import { common, createLowlight } from 'lowlight'
 import { suggestionOptions } from './suggestionOption'
 import { getAvailableNodesForVariable } from '@/utils/genericHelper'
 import { CustomMention } from '@/utils/customMention'
+import { isHtmlContent, escapeXmlTags, unescapeXmlEntities, unescapeXmlTags } from '@/utils/xmlTagUtils'
 
 const lowlight = createLowlight(common)
 
-// Detect if content is legacy HTML (from old getHTML() storage) vs markdown
-const isHtmlContent = (content) => {
-    if (!content || typeof content !== 'string') return false
-    return /<(?:p|div|span|h[1-6]|ul|ol|li|br|code|pre|blockquote|table|strong|em)\b/i.test(content)
-}
-
 // define your extension array
 const extensions = (
     availableNodesForVariable,
@@ -154,7 +149,7 @@ export const RichInput = ({ inputParam, value, nodes, edges, nodeId, onChange, d
             onUpdate: ({ editor }) => {
                 if (useMarkdown) {
                     try {
-                        onChange(editor.getMarkdown())
+                        onChange(unescapeXmlTags(editor.getMarkdown()))
                     } catch {
                         onChange(editor.getHTML())
                     }
@@ -173,7 +168,10 @@ export const RichInput = ({ inputParam, value, nodes, edges, nodeId, onChange, d
             if (!useMarkdown || isHtmlContent(value)) {
                 editor.commands.setContent(value)
             } else {
-                editor.commands.setContent(value, { contentType: 'markdown' })
+                // Step 1: Escape XML tags to entities so marked treats them as text
+                editor.commands.setContent(escapeXmlTags(value), { contentType: 'markdown' })
+                // Step 2: Decode entities in the ProseMirror doc for proper display
+                editor.commands.setContent(unescapeXmlEntities(editor.getJSON()))
             }
         }
     }, [editor]) // eslint-disable-line react-hooks/exhaustive-deps
diff --git a/packages/ui/src/utils/xmlTagUtils.js b/packages/ui/src/utils/xmlTagUtils.js
@@ -0,0 +1,107 @@
+/**
+ * Utilities for preserving XML/HTML tags in prompt text through TipTap's markdown roundtrip.
+ *
+ * Problem: When content like `<question>text</question>` is parsed by marked (via @tiptap/markdown),
+ * the lexer tokenizes tags as HTML tokens. TipTap's parseHTMLToken then calls generateJSON which
+ * creates DOM elements — unrecognized tags are stripped and only inner text survives.
+ *
+ * Solution: Three-step process:
+ *   1. escapeXmlTags: Convert all tags to HTML entities before markdown parsing
+ *      so marked treats them as text, not HTML tokens.
+ *   2. unescapeXmlEntities: After TipTap builds the ProseMirror document, walk the JSON tree
+ *      and decode &lt; and &gt; back to < and > in text nodes for proper visual display.
+ *   3. unescapeXmlTags: After getMarkdown(), reverse any remaining entity-escaped tags
+ *      in the serialized output (safety net — typically a no-op).
+ */
+
+/**
+ * Detect whether content is legacy HTML (stored by the old getHTML() path) rather than markdown.
+ *
+ * Legacy content starts with a block-level tag such as <p>, so the pattern is anchored with ^
+ * to ignore HTML tags that merely appear somewhere inside a user prompt.
+ *
+ * The tag name must be followed by whitespace, `/`, `>` or end of input. A plain \b is not
+ * sufficient here: a word boundary also exists between `p` and `-`, `.` or `:`, so a prompt
+ * starting with a custom XML tag such as <p-rule> or <table.row> would be treated as legacy HTML.
+ *
+ * @example
+ * isHtmlContent('<p>some text</p>')                // → true  (legacy getHTML output)
+ * isHtmlContent('<instruction>text</instruction>') // → false (user prompt)
+ * isHtmlContent('<p-rule>text</p-rule>')           // → false (custom tag that only shares a prefix)
+ *
+ * @param {string} content - Content to check
+ * @returns {boolean} True if content looks like legacy HTML; false for empty or non-string input
+ */
+export const isHtmlContent = (content) => {
+    if (!content || typeof content !== 'string') return false
+    return /^\s*<(?:p|div|h[1-6]|ul|ol|blockquote|pre|table)(?=[\s/>]|$)/i.test(content)
+}
+
+/**
+ * Pattern for one opening, closing, or self-closing XML/HTML tag.
+ * Groups: (1) leading slash of a closing tag, (2) tag name, (3) attribute text, (4) trailing self-close slash.
+ */
+const XML_TAG_REGEX = /<(\/?)([a-zA-Z][a-zA-Z0-9_.-]*)(\s[^>]*)?(\/?)>/g
+
+/**
+ * Replace the angle brackets of every XML/HTML tag with &lt; / &gt; entities so that marked
+ * reads the tag as plain text instead of an HTML token. Prompt authors want tags kept
+ * literally, not rendered.
+ *
+ * @example
+ * escapeXmlTags('<instructions>Be helpful</instructions>')
+ * // → '&lt;instructions&gt;Be helpful&lt;/instructions&gt;'
+ *
+ * escapeXmlTags('<div><question>text</question></div>')
+ * // → '&lt;div&gt;&lt;question&gt;text&lt;/question&gt;&lt;/div&gt;'
+ *
+ * @param {string} text - Raw markdown/text content
+ * @returns {string} Content with tag brackets escaped; empty or non-string input is returned as-is
+ */
+export function escapeXmlTags(text) {
+    if (typeof text !== 'string' || text.length === 0) return text
+    // The four groups cover everything between the brackets, so only the brackets need swapping.
+    return text.replace(XML_TAG_REGEX, (tag) => '&lt;' + tag.slice(1, -1) + '&gt;')
+}
+
+/**
+ * Unescape XML tag entities in the text nodes of a ProseMirror JSON tree.
+ * Call this after setContent() to fix the visual display in the editor.
+ * Mutates the JSON in-place and returns it.
+ *
+ * Any node with a string `text` property has it passed through unescapeXmlTags; any node
+ * with an array `content` property is walked recursively. A null, undefined or non-object
+ * argument is returned unchanged rather than throwing.
+ *
+ * @example
+ * const json = { type: 'doc', content: [
+ *   { type: 'paragraph', content: [{ type: 'text', text: '&lt;question&gt;What?&lt;/question&gt;' }] }
+ * ]}
+ * unescapeXmlEntities(json)
+ * // json.content[0].content[0].text → '<question>What?</question>'
+ *
+ * @param {object} json - ProseMirror document JSON from editor.getJSON()
+ * @returns {object} The same JSON with decoded entities in text nodes
+ */
+export function unescapeXmlEntities(json) {
+    // Nothing to walk: hand the value back instead of failing on a property access.
+    if (!json || typeof json !== 'object') return json
+    if (typeof json.text === 'string') {
+        json.text = unescapeXmlTags(json.text)
+    }
+    // Only recurse into a real child list; a malformed `content` is left untouched.
+    if (Array.isArray(json.content)) {
+        for (const child of json.content) {
+            unescapeXmlEntities(child)
+        }
+    }
+    return json
+}
+
+/**
+ * Unescape all entity-escaped XML/HTML tags after markdown serialization.
+ *
+ * The attribute group uses the same character class as the escaping pattern ([^>]), so it
+ * also matches line breaks. Tags whose attributes wrap across several lines are therefore
+ * restored too, which a `.`-based group would miss.
+ *
+ * @example
+ * unescapeXmlTags('&lt;question&gt;text&lt;/question&gt;')
+ * // → '<question>text</question>'
+ *
+ * unescapeXmlTags('&lt;div&gt;text&lt;/div&gt;')
+ * // → '<div>text</div>'
+ *
+ * unescapeXmlTags('&lt;a href="x"\n   class="y"&gt;')
+ * // → '<a href="x"\n   class="y">'  (multi-line attributes)
+ *
+ * unescapeXmlTags('<question>text</question>')
+ * // → '<question>text</question>'  (raw tags pass through unchanged)
+ *
+ * @param {string} text - Markdown output from TipTap
+ * @returns {string} Content with tags restored to angle brackets; empty or non-string input is returned as-is
+ */
+export function unescapeXmlTags(text) {
+    if (!text || typeof text !== 'string') return text
+    // Lazy attribute match stops at the first &gt; so adjacent tags are restored one by one.
+    return text.replace(/&lt;(\/?)([a-zA-Z][a-zA-Z0-9_.-]*)(\s[^>]*?)?(\/?)&gt;/g, (match, slash, tagName, attrs, selfClose) => {
+        return `<${slash}${tagName}${attrs || ''}${selfClose}>`
+    })
+}
diff --git a/packages/ui/src/utils/xmlTagUtils.test.js b/packages/ui/src/utils/xmlTagUtils.test.js
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml