test(x-markdown): add test cases to justify protecting all newlines in custom tags

yanghuanrong · yanghuanrong · commit b0231dd8595d · 2026-01-28T17:14:50.000+08:00
- Add test case to verify single \n alone does not cause block separation per CommonMark spec
- Add test cases to explain why all \n are protected (using /\n/g) instead of just \n\n:
  - \n followed by list marker (-) causes block change
  - \n followed by ordered list marker (1.) causes block change
  - \n followed by heading marker (#) causes block change
  - \n followed by code fence (```) causes block change
- Add test case for blockquote marker (>) being escaped by marked
diff --git a/packages/x-markdown/src/XMarkdown/__tests__/Parser.test.ts b/packages/x-markdown/src/XMarkdown/__tests__/Parser.test.ts
@@ -56,18 +56,134 @@ describe('Parser', () => {
   });
 
   describe('protectCustomTagNewlines', () => {
-    it('should protect newlines inside custom tags (both single and double)', () => {
+    it('should protect double newlines inside custom tags (block separation)', () => {
       const parser = new Parser({
         protectCustomTagNewlines: true,
         components: { CustomComponent: 'div' },
       });
-      const result1 = parser.parse('<CustomComponent>First line\n\nSecond line</CustomComponent>');
-      expect(result1).toContain('<CustomComponent>First line\n\nSecond line</CustomComponent>');
-      expect(result1).not.toMatch(/<CustomComponent>First line<\/p>\s*<p>Second line/);
+      // A double newline splits paragraphs in CommonMark, so it must be protected
+      const result = parser.parse('<CustomComponent>First line\n\nSecond line</CustomComponent>');
+      expect(result).toContain('<CustomComponent>First line\n\nSecond line</CustomComponent>');
+      expect(result).not.toMatch(/<CustomComponent>First line<\/p>\s*<p>Second line/);
+    });
+
+    it('single newline alone does not cause block separation per CommonMark spec', () => {
+      // Per the CommonMark spec, a lone \n does not split a paragraph into blocks
+      // so for a bare \n the result is the same whether or not protectCustomTagNewlines is enabled
+      const parserWithProtect = new Parser({
+        protectCustomTagNewlines: true,
+        components: { CustomComponent: 'div' },
+      });
+      const parserWithoutProtect = new Parser({
+        protectCustomTagNewlines: false,
+        components: { CustomComponent: 'div' },
+      });
+      const content = '<CustomComponent>Line1\nLine2</CustomComponent>';
 
-      const result2 = parser.parse('<CustomComponent>Line1\nLine2</CustomComponent>');
-      expect(result2).toContain('<CustomComponent>Line1\nLine2</CustomComponent>');
-      expect(result2).not.toMatch(/<CustomComponent>Line1<\/p>\s*<p>Line2/);
+      // In both cases the lone \n does not cause block separation
+      const resultWith = parserWithProtect.parse(content);
+      const resultWithout = parserWithoutProtect.parse(content);
+
+      expect(resultWith).toContain('<CustomComponent>Line1\nLine2</CustomComponent>');
+      expect(resultWithout).toContain('<CustomComponent>Line1\nLine2</CustomComponent>');
+    });
+
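+    // =======================================================================
+    // The tests below show why every \n is protected (via /\n/g) rather than only \n\n.
+    // A lone \n does not split blocks, but a \n followed by certain Markdown markers changes the block structure.
+    // Protecting every \n is a conservative but safe strategy intended to cover all Markdown block-level syntax.
+    // =======================================================================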
+
+    it('why protect all newlines: \\n followed by list marker causes block change', () => {
+      // \n- is parsed by Markdown as an unordered list, so it needs protection
+      const parserWithProtect = new Parser({
+        protectCustomTagNewlines: true,
+        components: { CustomComponent: 'div' },
+      });
+      const parserWithoutProtect = new Parser({
+        protectCustomTagNewlines: false,
+        components: { CustomComponent: 'div' },
+      });
+      const content = '<CustomComponent>Text\n- item1</CustomComponent>';
+
+      // Without protection, \n- is parsed as a list and breaks the custom tag structure
+      const resultWithout = parserWithoutProtect.parse(content);
+      expect(resultWithout).toContain('<ul>');
+      expect(resultWithout).toContain('<li>');
+
+      // With protection, the content stays intact
+      const resultWith = parserWithProtect.parse(content);
+      expect(resultWith).toContain('<CustomComponent>Text\n- item1</CustomComponent>');
+      expect(resultWith).not.toContain('<ul>');
+    });
+
+    it('why protect all newlines: \\n followed by ordered list marker causes block change', () => {
+      // \n1. is parsed by Markdown as an ordered list, so it needs protection
+      const parserWithProtect = new Parser({
+        protectCustomTagNewlines: true,
+        components: { CustomComponent: 'div' },
+      });
+      const parserWithoutProtect = new Parser({
+        protectCustomTagNewlines: false,
+        components: { CustomComponent: 'div' },
+      });
+      const content = '<CustomComponent>Text\n1. first</CustomComponent>';
+
+      // Without protection, \n1. is parsed as an ordered list
+      const resultWithout = parserWithoutProtect.parse(content);
+      expect(resultWithout).toContain('<ol>');
+      expect(resultWithout).toContain('<li>');
+
+      // With protection, the content stays intact
+      const resultWith = parserWithProtect.parse(content);
+      expect(resultWith).toContain('<CustomComponent>Text\n1. first</CustomComponent>');
+      expect(resultWith).not.toContain('<ol>');
+    });
+
+    it('why protect all newlines: \\n followed by heading marker causes block change', () => {
+      // \n# is parsed by Markdown as a heading, so it needs protection
+      const parserWithProtect = new Parser({
+        protectCustomTagNewlines: true,
+        components: { CustomComponent: 'div' },
+      });
+      const parserWithoutProtect = new Parser({
+        protectCustomTagNewlines: false,
+        components: { CustomComponent: 'div' },
+      });
+      const content = '<CustomComponent>Text\n# heading</CustomComponent>';
+
+      // Without protection, \n# is parsed as a heading
+      const resultWithout = parserWithoutProtect.parse(content);
+      expect(resultWithout).toContain('<h1>');
+
+      // With protection, the content stays intact
+      const resultWith = parserWithProtect.parse(content);
+      expect(resultWith).toContain('<CustomComponent>Text\n# heading</CustomComponent>');
+      expect(resultWith).not.toContain('<h1>');
+    });
+
+    it('why protect all newlines: \\n followed by code fence causes block change', () => {
+      // \n``` is parsed by Markdown as a code block, so it needs protection
+      const parserWithProtect = new Parser({
+        protectCustomTagNewlines: true,
+        components: { CustomComponent: 'div' },
+      });
+      const parserWithoutProtect = new Parser({
+        protectCustomTagNewlines: false,
+        components: { CustomComponent: 'div' },
+      });
+      const content = '<CustomComponent>Text\n```\ncode\n```</CustomComponent>';
+
+      // Without protection, \n``` is parsed as a code block and breaks the custom tag structure
+      const resultWithout = parserWithoutProtect.parse(content);
+      expect(resultWithout).toMatch(/<pre>|<code>/);
+
+      // With protection, the content stays intact (note: marked may still render ``` inside HTML as <code>)
+      const resultWith = parserWithProtect.parse(content);
+      expect(resultWith).toContain('<CustomComponent>');
+      expect(resultWith).toContain('code');
+      // Key check: no <pre> code block structure is generated
+      expect(resultWith).not.toContain('<pre>');
     });
 
     it('should not protect newlines when protectCustomTagNewlines is false', () => {
@@ -80,6 +196,19 @@ describe('Parser', () => {
       expect(result).toContain('<p>');
     });
 
+    it('blockquote marker (>) inside custom tags is escaped by marked', () => {
+      // A > character inside an HTML tag is escaped by marked to &gt; and is not parsed as a blockquote
+      // This appears to be default marked behavior, so no special protection is added for it
+      const parser = new Parser({
+        protectCustomTagNewlines: true,
+        components: { CustomComponent: 'div' },
+      });
+      const content = '<CustomComponent>Text\n> quote here</CustomComponent>';
+      const result = parser.parse(content);
+      expect(result).toContain('&gt;');
+      expect(result).not.toContain('<blockquote>');
+    });
+
     it('should work normally when protectCustomTagNewlines is true but no custom components', () => {
       const parser = new Parser({
         protectCustomTagNewlines: true,