From d2c1137a4cacea0f997b053b1c795b8dcf8780b5 Mon Sep 17 00:00:00 2001
From: Ricardo Amaral <ricardo@doist.com>
Date: Thu, 5 Jan 2023 11:16:42 +0000
Subject: [PATCH] fix: Disables more tokenizers if marks/nodes are not found in
 the editor schema

---
 src/helpers/serializer.test.ts              |  21 +-
 src/helpers/serializer.ts                   |  29 +-
 src/serializers/html/extensions/disabled.ts | 160 +++++++++++
 src/serializers/html/extensions/link.ts     |  16 +-
 src/serializers/html/html.test.ts           | 304 +++++++++++++++-----
 src/serializers/html/html.ts                |  54 +---
 src/serializers/markdown/markdown.ts        |   4 +
 7 files changed, 456 insertions(+), 132 deletions(-)
 create mode 100644 src/serializers/html/extensions/disabled.ts

diff --git a/src/helpers/serializer.test.ts b/src/helpers/serializer.test.ts
index 94f38f38..847f90e5 100644
--- a/src/helpers/serializer.test.ts
+++ b/src/helpers/serializer.test.ts
@@ -1,10 +1,29 @@
 import { getSchema } from '@tiptap/core'
 
 import { RichTextKit } from '../extensions/rich-text/rich-text-kit'
+import { createSuggestionExtension } from '../factories/create-suggestion-extension'
 
-import { extractTagsFromParseRules } from './serializer'
+import { buildSuggestionSchemaPartialRegex, extractTagsFromParseRules } from './serializer'
 
 describe('Helper: Serializer', () => {
+    describe('#buildSuggestionSchemaPartialRegex', () => {
+        test('returns `null` when there are no suggestion nodes in the schema', () => {
+            expect(buildSuggestionSchemaPartialRegex(getSchema([RichTextKit]))).toBeNull()
+        })
+
+        test('returns a partial regular expression including valid URL schemas', () => {
+            expect(
+                buildSuggestionSchemaPartialRegex(
+                    getSchema([
+                        RichTextKit,
+                        createSuggestionExtension('mention'),
+                        createSuggestionExtension('channel'),
+                    ]),
+                ),
+            ).toBe('(?:mention|channel)://')
+        })
+    })
+
     describe('#extractTagsFromParseRules', () => {
         test('returns an array of all tags from the given parse rules', () => {
             expect(
diff --git a/src/helpers/serializer.ts b/src/helpers/serializer.ts
index 42eb085c..dad66eb2 100644
--- a/src/helpers/serializer.ts
+++ b/src/helpers/serializer.ts
@@ -1,4 +1,29 @@
-import type { ParseRule } from 'prosemirror-model'
+import { kebabCase } from 'lodash-es'
+
+import type { ParseRule, Schema } from 'prosemirror-model'
+
+/**
+ * Collects the URL schemes of every suggestion node found in the given editor schema, and joins
+ * them into the source of a partial regular expression.
+ *
+ * @param schema The editor schema that is inspected for nodes whose name ends in `Suggestion`.
+ *
+ * @returns The partial regular expression source (a non-capturing alternation followed by `://`),
+ * or `null` when the editor schema has no suggestion nodes.
+ */
+function buildSuggestionSchemaPartialRegex(schema: Schema) {
+    // Strip the `Suggestion` suffix and kebab-case the remainder to get each node's URL scheme
+    const urlSchemes = Object.values(schema.nodes)
+        .map((node) => node.name)
+        .filter((name) => name.endsWith('Suggestion'))
+        .map((name) => kebabCase(name.replace(/Suggestion$/, '')))
+
+    if (urlSchemes.length === 0) {
+        return null
+    }
+
+    return `(?:${urlSchemes.join('|')})://`
+}
 
 /**
  * Extract all tags from the given parse rules argument, and returns an array of said tags.
@@ -19,4 +44,4 @@ function extractTagsFromParseRules(
         .map((rule) => rule.tag as keyof HTMLElementTagNameMap)
 }
 
-export { extractTagsFromParseRules }
+export { buildSuggestionSchemaPartialRegex, extractTagsFromParseRules }
diff --git a/src/serializers/html/extensions/disabled.ts b/src/serializers/html/extensions/disabled.ts
new file mode 100644
index 00000000..1f93aded
--- /dev/null
+++ b/src/serializers/html/extensions/disabled.ts
@@ -0,0 +1,160 @@
+import { marked } from 'marked'
+
+import { buildSuggestionSchemaPartialRegex } from '../../../helpers/serializer'
+import { INITIAL_MARKED_OPTIONS } from '../html'
+
+import type { Schema } from 'prosemirror-model'
+
+/**
+ * A version of `marked.TokenizerObject` that lets tokenizer functions return `undefined`.
+ */
+type MarkedTokenizerObjectAsUndefined = Partial<
+    Omit<marked.Tokenizer<undefined>, 'constructor' | 'options'>
+>
+
+/**
+ * A Marked extension which disables tokenizers for marks/nodes missing from the editor schema.
+ *
+ * @param schema The editor schema to be used for nodes and marks detection.
+ * @returns A Marked extension with the `tokenizer` overrides for the unavailable marks/nodes.
+ */
+function disabled(schema: Schema): marked.MarkedExtension {
+    const markedTokenizer = new marked.Tokenizer(INITIAL_MARKED_OPTIONS)
+
+    const tokenizer: marked.TokenizerObject = {}
+
+    if (!schema.nodes.blockquote) {
+        Object.assign(tokenizer, {
+            blockquote() {
+                return undefined
+            },
+        })
+    }
+
+    if (!schema.marks.bold || !schema.marks.italic) {
+        Object.assign(tokenizer, {
+            emStrong() {
+                return undefined
+            },
+        })
+    }
+
+    // Marked handles bullet and ordered lists with a single `list` tokenizer, so that tokenizer is
+    // only delegated to when the list type found at the start of the input exists in the schema
+    if (!schema.nodes.bulletList || !schema.nodes.orderedList) {
+        Object.assign<marked.TokenizerObject, MarkedTokenizerObjectAsUndefined>(tokenizer, {
+            list(src) {
+                // Ordered list markers are 1-9 digits followed by `.` or `)`, and like any list
+                // marker they can be indented by up to 3 spaces
+                const isOrdered = /^ {0,3}\d{1,9}[.)]/.test(src)
+                const listNode = isOrdered ? schema.nodes.orderedList : schema.nodes.bulletList
+
+                if (listNode) {
+                    return markedTokenizer.list.apply(this, [src])
+                }
+
+                return undefined
+            },
+        })
+    }
+
+    if (!schema.marks.code) {
+        Object.assign(tokenizer, {
+            codespan() {
+                return undefined
+            },
+        })
+    }
+
+    if (!schema.nodes.codeBlock) {
+        Object.assign(tokenizer, {
+            code() {
+                return undefined
+            },
+            fences() {
+                return undefined
+            },
+        })
+    }
+
+    if (!schema.nodes.hardBreak) {
+        Object.assign(tokenizer, {
+            br() {
+                return undefined
+            },
+        })
+    }
+
+    if (!schema.nodes.heading) {
+        Object.assign(tokenizer, {
+            heading() {
+                return undefined
+            },
+        })
+    }
+
+    if (!schema.nodes.horizontalRule) {
+        Object.assign(tokenizer, {
+            hr() {
+                return undefined
+            },
+        })
+    }
+
+    if (!schema.marks.link) {
+        Object.assign(tokenizer, {
+            url() {
+                return undefined
+            },
+        })
+    }
+
+    // Given that there isn't a one to one mapping between the link/image mark/node and Marked
+    // tokenizers, nor does Marked support our custom Markdown syntax for suggestions, we need to
+    // conditionally disable the `link` tokenizer based on the input
+    if (!schema.marks.link || !schema.nodes.image) {
+        const suggestionSchemaPartialRegex = buildSuggestionSchemaPartialRegex(schema)
+        const suggestionSchemaRegex = suggestionSchemaPartialRegex
+            ? new RegExp(`^\\[[^\\]]*\\]\\(${suggestionSchemaPartialRegex}`)
+            : null
+
+        Object.assign<marked.TokenizerObject, MarkedTokenizerObjectAsUndefined>(tokenizer, {
+            link(src) {
+                const isImage = /^!\[[^\]]*\]\([^)]+\)/.test(src)
+                const isSuggestion = suggestionSchemaRegex?.test(src)
+
+                if (
+                    (isImage && schema.nodes.image) ||
+                    (!isImage && schema.marks.link) ||
+                    isSuggestion
+                ) {
+                    return markedTokenizer.link.apply(this, [src])
+                }
+
+                return undefined
+            },
+        })
+    }
+
+    if (!schema.marks.strike) {
+        Object.assign(tokenizer, {
+            del() {
+                return undefined
+            },
+        })
+    }
+
+    if (!schema.nodes.table) {
+        Object.assign(tokenizer, {
+            table() {
+                return undefined
+            },
+        })
+    }
+
+    return {
+        tokenizer,
+    }
+}
+
+export { disabled }
diff --git a/src/serializers/html/extensions/link.ts b/src/serializers/html/extensions/link.ts
index 9aa15007..44e54d00 100644
--- a/src/serializers/html/extensions/link.ts
+++ b/src/serializers/html/extensions/link.ts
@@ -1,27 +1,19 @@
-import { kebabCase } from 'lodash-es'
 import { marked } from 'marked'
 
-import type { NodeType } from 'prosemirror-model'
-
 const markedRenderer = new marked.Renderer()
 
 /**
  * A Marked extension which tweaks the `link` renderer to add support for suggestion nodes, while
  * preserving the original renderer for standard links.
  *
- * @param suggestionNodes An array of the suggestion nodes to serialize.
+ * @param suggestionSchemaRegex A regular expression with valid URL schemas for the available
+ * suggestion nodes.
  */
-function link(suggestionNodes: NodeType[]): marked.MarkedExtension {
-    const linkSchemaRegex = new RegExp(
-        `^(?:${suggestionNodes
-            .map((suggestionNode) => kebabCase(suggestionNode.name.replace(/Suggestion$/, '')))
-            .join('|')})://`,
-    )
-
+function link(suggestionSchemaRegex: RegExp): marked.MarkedExtension {
     return {
         renderer: {
             link(href, title, text) {
-                if (href && linkSchemaRegex.test(href)) {
+                if (href && suggestionSchemaRegex?.test(href)) {
                     const [, schema, id] = /^([a-z-]+):\/\/(\S+)$/i.exec(href) || []
 
                     if (schema && id && text) {
diff --git a/src/serializers/html/html.test.ts b/src/serializers/html/html.test.ts
index 0238a92d..49f76cbe 100644
--- a/src/serializers/html/html.test.ts
+++ b/src/serializers/html/html.test.ts
@@ -60,7 +60,7 @@ const MARKDOWN_INPUT_BLOCKQUOTES = `> Dorothy followed her through many of the b
 > - Revenue was off the chart.
 > - Profits were higher than ever.
 >
-> *Everything* is going according to **plan**.`
+> _Everything_ is going according to **plan**.`
 
 const MARKDOWN_INPUT_ORDERED_LISTS = `1. First item
 2. Second item
@@ -222,6 +222,25 @@ const MARKDOWN_INPUT_STYLED_LINKS = `I love supporting the **[EFF](https://eff.o
 This is the *[Markdown Guide](https://www.markdownguide.org)*.
 See the section on [\`code\`](#code).`
 
+const MARKDOWN_INPUT_TABLES = `| Syntax      | Description |
+| ----------- | ----------- |
+| Header      | Title       |
+| Paragraph   | Text        |
+
+---
+
+| Syntax | Description |
+| --- | ----------- |
+| Header | Title |
+| Paragraph | Text |
+
+---
+
+| Syntax      | Description | Test Text     |
+| :---        |    :----:   |          ---: |
+| Header      | Title       | Here's this   |
+| Paragraph   | Text        | And more      |`
+
 describe('HTML Serializer', () => {
     describe('Plain-text Document', () => {
         describe('with default extensions', () => {
@@ -263,7 +282,7 @@ describe('HTML Serializer', () => {
 
             test('blockquotes syntax is preserved', () => {
                 expect(htmlSerializer.serialize(MARKDOWN_INPUT_BLOCKQUOTES)).toBe(
-                    '<p>&gt; Dorothy followed her through many of the beautiful rooms in her castle.</p><p></p><p>&gt; Dorothy followed her through many of the beautiful rooms in her castle.</p><p>&gt;</p><p>&gt; The Witch bade her clean the pots and kettles and sweep the floor and keep the fire fed with wood.</p><p></p><p>&gt; Dorothy followed her through many of the beautiful rooms in her castle.</p><p>&gt;</p><p>&gt; &gt; The Witch bade her clean the pots and kettles and sweep the floor and keep the fire fed with wood.</p><p></p><p>&gt; #### The quarterly results look great!</p><p>&gt;</p><p>&gt; - Revenue was off the chart.</p><p>&gt; - Profits were higher than ever.</p><p>&gt;</p><p>&gt; *Everything* is going according to **plan**.</p>',
+                    '<p>&gt; Dorothy followed her through many of the beautiful rooms in her castle.</p><p></p><p>&gt; Dorothy followed her through many of the beautiful rooms in her castle.</p><p>&gt;</p><p>&gt; The Witch bade her clean the pots and kettles and sweep the floor and keep the fire fed with wood.</p><p></p><p>&gt; Dorothy followed her through many of the beautiful rooms in her castle.</p><p>&gt;</p><p>&gt; &gt; The Witch bade her clean the pots and kettles and sweep the floor and keep the fire fed with wood.</p><p></p><p>&gt; #### The quarterly results look great!</p><p>&gt;</p><p>&gt; - Revenue was off the chart.</p><p>&gt; - Profits were higher than ever.</p><p>&gt;</p><p>&gt; _Everything_ is going according to **plan**.</p>',
                 )
             })
 
@@ -309,7 +328,7 @@ describe('HTML Serializer', () => {
                 )
             })
 
-            test('line rules syntax is preserved', () => {
+            test('horizontal rules syntax is preserved', () => {
                 expect(htmlSerializer.serialize(MARKDOWN_INPUT_LINE_RULES)).toBe(
                     '<p>***</p><p></p><p>_________________</p><p></p><p>---</p>',
                 )
@@ -413,12 +432,6 @@ Answer: [Doist Frontend](channel://190200)`),
                 )
             })
 
-            test('task lists syntax is preserved (unsupported by default)', () => {
-                expect(htmlSerializer.serialize(MARKDOWN_INPUT_TASK_LISTS)).toBe(
-                    '<ul><li>[ ] First item</li><li>[x] Second item</li><li>[x] Third item</li><li>[ ] Fourth item</li></ul><hr><ul><li>[x] First item</li><li>[ ] Second item</li><li>[ ] Third item</li><li>[x] Fourth item</li></ul><hr><ul><li>[x] First item</li><li>[ ] Second item</li><li>[x] Third item</li><li>[ ] Fourth item</li></ul><hr><ul><li>First item</li><li>Second item</li><li>Third item<ul><li>[ ] Indented item</li><li>[ ] Indented item</li></ul></li><li>Fourth item</li></ul><hr><ul><li>[ ] 1968. A great year!</li><li>[x] I think 1969 was second best.</li></ul><hr><ul><li>[ ] This is the first list item.</li><li>[ ] Here&#39;s the second list item.<br>  I need to add another paragraph below the second list item.</li><li>[ ] And here&#39;s the third list item.</li></ul>',
-                )
-            })
-
             test('images HTML output is correct', () => {
                 expect(htmlSerializer.serialize(MARKDOWN_INPUT_IMAGES)).toBe(
                     '<img src="https://octodex.github.com/images/octobiwan.jpg" alt="Octobi Wan Catnobi"><img src="https://octodex.github.com/images/octobiwan.jpg" alt=""><img src="https://octodex.github.com/images/octobiwan.jpg" alt=""><img src="https://octodex.github.com/images/octobiwan.jpg" alt="Octobi Wan Catnobi" title="Octobi Wan Catnobi"><p><a href="https://octodex.github.com/octobiwan/"><img src="https://octodex.github.com/images/octobiwan.jpg" alt="Octobi Wan Catnobi" title="Octobi Wan Catnobi"></a></p><p>Octobi Wan Catnobi: </p><p>Octobi Wan Catnobi:  - These are not the droids you\'re looking for!</p><p> - These are not the droids you\'re looking for!</p>',
@@ -449,7 +462,7 @@ Answer: [Doist Frontend](channel://190200)`),
 &lt;/html&gt;</code></pre></li></ol>`)
             })
 
-            test('line rules HTML output is correct', () => {
+            test('horizontal rules HTML output is correct', () => {
                 expect(htmlSerializer.serialize(MARKDOWN_INPUT_LINE_RULES)).toBe('<hr><hr><hr>')
             })
 
@@ -466,77 +479,176 @@ Answer: [Doist Frontend](channel://190200)`),
             })
         })
 
-        describe('without `heading` extension', () => {
-            test("HTML output doesn't have heading elements", () => {
-                const customSerializer = createHTMLSerializer(
+        describe('without non-essential extensions', () => {
+            let htmlSerializer: HTMLSerializerReturnType
+
+            beforeEach(() => {
+                htmlSerializer = createHTMLSerializer(
                     getSchema([
+                        // Although we can disable pretty much any extension in the `RichTextKit`,
+                        // only non-essential nodes/marks extensions are disabled (these are the
+                        // only ones that have an effect on the serializer output)
                         RichTextKit.configure({
+                            blockquote: false,
+                            bold: false,
+                            bulletList: false,
+                            code: false,
+                            codeBlock: false,
+                            hardBreak: false,
                             heading: false,
+                            horizontalRule: false,
+                            image: false,
+                            italic: false,
+                            link: false,
+                            orderedList: false,
+                            strike: false,
                         }),
                     ]),
                 )
+            })
 
-                expect(customSerializer.serialize(MARKDOWN_INPUT_HEADINGS)).toBe(
+            test('headings HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_HEADINGS)).toBe(
                     '<p># Heading level 1</p><p>## Heading level 2</p><p>### Heading level 3</p><p>#### Heading level 4</p><p>##### Heading level 5</p><p>###### Heading level 6</p>',
                 )
             })
-        })
 
-        describe('without `strike` extension', () => {
-            test("HTML output doesn't have `del` elements", () => {
-                const customSerializer = createHTMLSerializer(
-                    getSchema([
-                        RichTextKit.configure({
-                            strike: false,
-                        }),
-                    ]),
+            test('paragraphs HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_PARAGRAPHS)).toBe(
+                    "<p>I really like using Markdown.</p><p>I think I'll use it to format all of my documents from now on.</p>",
                 )
+            })
 
-                expect(customSerializer.serialize(MARKDOWN_INPUT_STYLED_TEXT)).toBe(
-                    "<p>I just love <strong>bold text</strong>.<br>I just love <strong>bold text</strong>.</p><p>Italicized text is the <em>cat's meow</em>.<br>Italicized text is the <em>cat's meow</em>.</p><p>This text is <em><strong>really important</strong></em>.<br>This text is <em><strong>really important</strong></em>.<br>This text is <strong><em>really important</em></strong>.<br>This text is <strong><em>really important</em></strong>.<br>This is really <em><strong>very</strong></em> important text.</p><p>Strikethrough uses two tildes: ~~scratch this~~</p>",
+            test('line breaks HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_LINE_BREAKS)).toBe(
+                    `<p>This is the first line.
+And this is the second line.</p>`,
                 )
             })
-        })
 
-        describe('without `codeblock` extension', () => {
-            test('code block HTML output is correct', () => {
-                const customSerializer = createHTMLSerializer(
-                    getSchema([
-                        RichTextKit.configure({
-                            codeBlock: false,
-                        }),
-                    ]),
+            test('styled text HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_STYLED_TEXT))
+                    .toBe(`<p>I just love **bold text**.
+I just love __bold text__.</p><p>Italicized text is the *cat's meow*.
+Italicized text is the _cat's meow_.</p><p>This text is ***really important***.
+This text is ___really important___.
+This text is __*really important*__.
+This text is **_really important_**.
+This is really ***very*** important text.</p><p>Strikethrough uses two tildes: ~~scratch this~~</p>`)
+            })
+
+            test('blockquotes HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_BLOCKQUOTES)).toBe(
+                    '<p>&gt; Dorothy followed her through many of the beautiful rooms in her castle.</p><p>&gt; Dorothy followed her through many of the beautiful rooms in her castle.</p><p>&gt;</p><p>&gt; The Witch bade her clean the pots and kettles and sweep the floor and keep the fire fed with wood.</p><p>&gt; Dorothy followed her through many of the beautiful rooms in her castle.</p><p>&gt;</p><p>&gt; &gt; The Witch bade her clean the pots and kettles and sweep the floor and keep the fire fed with wood.</p><p>&gt; #### The quarterly results look great!</p><p>&gt;</p><p>&gt; - Revenue was off the chart.</p><p>&gt; - Profits were higher than ever.</p><p>&gt;</p><p>&gt; _Everything_ is going according to **plan**.</p>',
                 )
+            })
 
-                expect(customSerializer.serialize(MARKDOWN_INPUT_CODE_BLOCK))
-                    .toBe(`<pre><code>&lt;html&gt;
+            test('ordered lists HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_ORDERED_LISTS))
+                    .toBe(`<p>1. First item
+2. Second item
+3. Third item
+4. Fourth item</p><p>---</p><p>1. First item</p><p>1. Second item</p><p>1. Third item</p><p>1. Fourth item</p><p>---</p><p>1. First item
+8. Second item
+3. Third item
+5. Fourth item</p><p>---</p><p>1. First item
+2. Second item
+3. Third item
+    1. Indented item
+    2. Indented item
+4. Fourth item</p>`)
+            })
+
+            test('unordered lists HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_UNORDERED_LISTS))
+                    .toBe(`<p>- First item</p><p>- Second item</p><p>- Third item</p><p>- Fourth item</p><p>---</p><p>* First item</p><p>* Second item</p><p>* Third item</p><p>* Fourth item</p><p>---</p><p>+ First item</p><p>+ Second item</p><p>+ Third item</p><p>+ Fourth item</p><p>---</p><p>- First item</p><p>- Second item</p><p>- Third item
+    - Indented item
+    - Indented item</p><p>- Fourth item</p><p>---</p><p>- 1968. A great year!</p><p>- I think 1969 was second best.</p><p>---</p><p>* This is the first list item.</p><p>* Here's the second list item.
+    I need to add another paragraph below the second list item.</p><p>* And here's the third list item.</p>`)
+            })
+
+            test('images HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_IMAGES)).toBe(
+                    '<p>![Octobi Wan Catnobi](https://octodex.github.com/images/octobiwan.jpg)</p><p>![](https://octodex.github.com/images/octobiwan.jpg)![](https://octodex.github.com/images/octobiwan.jpg)</p><p>![Octobi Wan Catnobi](https://octodex.github.com/images/octobiwan.jpg "Octobi Wan Catnobi")</p><p>[![Octobi Wan Catnobi](https://octodex.github.com/images/octobiwan.jpg "Octobi Wan Catnobi")](https://octodex.github.com/octobiwan/)</p><p>Octobi Wan Catnobi: ![](https://octodex.github.com/images/octobiwan.jpg)</p><p>Octobi Wan Catnobi: ![](https://octodex.github.com/images/octobiwan.jpg) - These are not the droids you\'re looking for!</p><p>![](https://octodex.github.com/images/octobiwan.jpg) - These are not the droids you\'re looking for!</p>',
+                )
+            })
+
+            test('code HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_CODE)).toBe(
+                    '<p>At the command prompt, type `nano`.</p><p>``Use `code` in your Markdown file.``</p>',
+                )
+            })
+
+            test('code block HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_CODE_BLOCK)).toBe(
+                    `<p>\`\`\`</p>&lt;html&gt;
   &lt;head&gt;
     &lt;title&gt;Test&lt;/title&gt;
   &lt;/head&gt;
 &lt;/html&gt;
-</code></pre>`)
+\`\`\``,
+                )
+            })
+
+            test('block elements HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_INDENTED_BLOCK_ELEMENTS))
+                    .toBe(`<p>1. Blockquote:
+    &gt; Dorothy followed her through many of the beautiful rooms in her castle.
+2. Image:
+    ![Octobi Wan Catnobi](https://octodex.github.com/images/octobiwan.jpg)
+3. Codeblock:
+    \`\`\`
+    &lt;html&gt;
+      &lt;head&gt;
+        &lt;title&gt;Test&lt;/title&gt;
+      &lt;/head&gt;
+    &lt;/html&gt;
+    \`\`\`</p>`)
+            })
+
+            test('horizontal rules HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_LINE_RULES)).toBe(
+                    '<p>***</p><p>_________________</p><p>---</p>',
+                )
+            })
+
+            test('links HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_LINKS))
+                    .toBe(`<p>My favorite search engine is [Duck Duck Go](https://duckduckgo.com).
+My favorite search engine is [Duck Duck Go](https://duckduckgo.com "The best search engine for privacy").</p>`)
+            })
+
+            test('styled links HTML output is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_STYLED_LINKS))
+                    .toBe(`<p>I love supporting the **[EFF](https://eff.org)**.
+This is the *[Markdown Guide](https://www.markdownguide.org)*.
+See the section on [\`code\`](#code).</p>`)
             })
         })
 
-        describe('without `image` extension', () => {
-            test('images HTML output is correct', () => {
-                const customSerializer = createHTMLSerializer(
-                    getSchema([
-                        RichTextKit.configure({
-                            image: false,
-                        }),
-                    ]),
+        describe('without support for certain extensions', () => {
+            let htmlSerializer: HTMLSerializerReturnType
+
+            beforeEach(() => {
+                htmlSerializer = createHTMLSerializer(getSchema([RichTextKit]))
+            })
+
+            test('task lists syntax is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_TASK_LISTS)).toBe(
+                    '<ul><li>[ ] First item</li><li>[x] Second item</li><li>[x] Third item</li><li>[ ] Fourth item</li></ul><hr><ul><li>[x] First item</li><li>[ ] Second item</li><li>[ ] Third item</li><li>[x] Fourth item</li></ul><hr><ul><li>[x] First item</li><li>[ ] Second item</li><li>[x] Third item</li><li>[ ] Fourth item</li></ul><hr><ul><li>First item</li><li>Second item</li><li>Third item<ul><li>[ ] Indented item</li><li>[ ] Indented item</li></ul></li><li>Fourth item</li></ul><hr><ul><li>[ ] 1968. A great year!</li><li>[x] I think 1969 was second best.</li></ul><hr><ul><li>[ ] This is the first list item.</li><li>[ ] Here&#39;s the second list item.<br>  I need to add another paragraph below the second list item.</li><li>[ ] And here&#39;s the third list item.</li></ul>',
                 )
+            })
 
-                expect(customSerializer.serialize(MARKDOWN_INPUT_IMAGES)).toBe(
-                    '<img src="https://octodex.github.com/images/octobiwan.jpg" alt="Octobi Wan Catnobi"><img src="https://octodex.github.com/images/octobiwan.jpg" alt=""><img src="https://octodex.github.com/images/octobiwan.jpg" alt=""><img src="https://octodex.github.com/images/octobiwan.jpg" alt="Octobi Wan Catnobi" title="Octobi Wan Catnobi"><p><a href="https://octodex.github.com/octobiwan/"><img src="https://octodex.github.com/images/octobiwan.jpg" alt="Octobi Wan Catnobi" title="Octobi Wan Catnobi"></a></p><p>Octobi Wan Catnobi: </p><p>Octobi Wan Catnobi:  - These are not the droids you\'re looking for!</p><p> - These are not the droids you\'re looking for!</p>',
+            test('tables syntax is preserved', () => {
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_TABLES)).toBe(
+                    "<p>| Syntax      | Description |<br>| ----------- | ----------- |<br>| Header      | Title       |<br>| Paragraph   | Text        |</p><hr><p>| Syntax | Description |<br>| --- | ----------- |<br>| Header | Title |<br>| Paragraph | Text |</p><hr><p>| Syntax      | Description | Test Text     |<br>| :---        |    :----:   |          ---: |<br>| Header      | Title       | Here's this   |<br>| Paragraph   | Text        | And more      |</p>",
                 )
             })
         })
 
-        describe('with `image` extension (inline)', () => {
+        describe('with `image` extension (inline node rendering)', () => {
             test('images HTML output is correct', () => {
-                const customSerializer = createHTMLSerializer(
+                const htmlSerializer = createHTMLSerializer(
                     getSchema([
                         RichTextKit.configure({
                             image: {
@@ -546,19 +658,19 @@ Answer: [Doist Frontend](channel://190200)`),
                     ]),
                 )
 
-                expect(customSerializer.serialize(MARKDOWN_INPUT_IMAGES)).toBe(
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_IMAGES)).toBe(
                     '<p><img src="https://octodex.github.com/images/octobiwan.jpg" alt="Octobi Wan Catnobi"></p><p><img src="https://octodex.github.com/images/octobiwan.jpg" alt=""><img src="https://octodex.github.com/images/octobiwan.jpg" alt=""></p><p><img src="https://octodex.github.com/images/octobiwan.jpg" alt="Octobi Wan Catnobi" title="Octobi Wan Catnobi"></p><p><a href="https://octodex.github.com/octobiwan/"><img src="https://octodex.github.com/images/octobiwan.jpg" alt="Octobi Wan Catnobi" title="Octobi Wan Catnobi"></a></p><p>Octobi Wan Catnobi: <img src="https://octodex.github.com/images/octobiwan.jpg" alt=""></p><p>Octobi Wan Catnobi: <img src="https://octodex.github.com/images/octobiwan.jpg" alt=""> - These are not the droids you\'re looking for!</p><p><img src="https://octodex.github.com/images/octobiwan.jpg" alt=""> - These are not the droids you\'re looking for!</p>',
                 )
             })
         })
 
-        describe('with custom `taskList` extension', () => {
+        describe('with official `taskList`/`taskItem` extensions', () => {
             test('task lists HTML output is correct', () => {
-                const customSerializer = createHTMLSerializer(
+                const htmlSerializer = createHTMLSerializer(
                     getSchema([RichTextKit, TaskList, TaskItem]),
                 )
 
-                expect(customSerializer.serialize(MARKDOWN_INPUT_TASK_LISTS)).toBe(
+                expect(htmlSerializer.serialize(MARKDOWN_INPUT_TASK_LISTS)).toBe(
                     '<ul data-type="taskList"><li data-type="taskItem" data-checked="false">First item</li><li data-type="taskItem" data-checked="true">Second item</li><li data-type="taskItem" data-checked="true">Third item</li><li data-type="taskItem" data-checked="false">Fourth item</li></ul><hr><ul data-type="taskList"><li data-type="taskItem" data-checked="true">First item</li><li data-type="taskItem" data-checked="false">Second item</li><li data-type="taskItem" data-checked="false">Third item</li><li data-type="taskItem" data-checked="true">Fourth item</li></ul><hr><ul data-type="taskList"><li data-type="taskItem" data-checked="true">First item</li><li data-type="taskItem" data-checked="false">Second item</li><li data-type="taskItem" data-checked="true">Third item</li><li data-type="taskItem" data-checked="false">Fourth item</li></ul><hr><ul data-type="taskList"><li>First item</li><li>Second item</li><li>Third item<ul data-type="taskList"><li data-type="taskItem" data-checked="false">Indented item</li><li data-type="taskItem" data-checked="false">Indented item</li></ul></li><li>Fourth item</li></ul><hr><ul data-type="taskList"><li data-type="taskItem" data-checked="false">1968. A great year!</li><li data-type="taskItem" data-checked="true">I think 1969 was second best.</li></ul><hr><ul data-type="taskList"><li data-type="taskItem" data-checked="false">This is the first list item.</li><li data-type="taskItem" data-checked="false">Here&#39;s the second list item.<br>  I need to add another paragraph below the second list item.</li><li data-type="taskItem" data-checked="false">And here&#39;s the third list item.</li></ul>',
                 )
             })
@@ -566,42 +678,82 @@ Answer: [Doist Frontend](channel://190200)`),
 
         describe('with custom `*Suggestion` extensions', () => {
             test('suggestion extensions support alphanumeric IDs', () => {
-                const customSerializer = createHTMLSerializer(
+                const htmlSerializer = createHTMLSerializer(
                     getSchema([RichTextKit, createSuggestionExtension('mention')]),
                 )
 
                 expect(
-                    customSerializer.serialize(`Question: Who's the head of the Frontend team?
+                    htmlSerializer.serialize(`Question: Who's the head of the Frontend team?
 Answer: [Henning M](mention://user:190200@doist.dev)`),
                 ).toBe(
                     '<p>Question: Who\'s the head of the Frontend team?<br>Answer: <span data-mention="" data-id="user:190200@doist.dev" data-label="Henning M"></span></p>',
                 )
             })
 
-            test('mention suggestions HTML output is correct', () => {
-                const customSerializer = createHTMLSerializer(
-                    getSchema([RichTextKit, createSuggestionExtension('mention')]),
-                )
+            describe('with the `Link` extension enabled', () => {
+                let htmlSerializer: HTMLSerializerReturnType
 
-                expect(
-                    customSerializer.serialize(`Question: Who's the head of the Frontend team?
-Answer: [Henning M](mention://963827)`),
-                ).toBe(
-                    '<p>Question: Who\'s the head of the Frontend team?<br>Answer: <span data-mention="" data-id="963827" data-label="Henning M"></span></p>',
-                )
-            })
+                beforeEach(() => {
+                    htmlSerializer = createHTMLSerializer(
+                        getSchema([
+                            RichTextKit,
+                            createSuggestionExtension('mention'),
+                            createSuggestionExtension('channel'),
+                        ]),
+                    )
+                })
 
-            test('channel suggestions HTML output is correct', () => {
-                const customSerializer = createHTMLSerializer(
-                    getSchema([RichTextKit, createSuggestionExtension('channel')]),
-                )
-
-                expect(
-                    customSerializer.serialize(`Question: What's the best channel on Twist?
+                test('mention suggestions HTML output is correct', () => {
+                    expect(
+                        htmlSerializer.serialize(`Question: Who's the head of the Frontend team?
+Answer: [Henning M](mention://963827)`),
+                    ).toBe(
+                        '<p>Question: Who\'s the head of the Frontend team?<br>Answer: <span data-mention="" data-id="963827" data-label="Henning M"></span></p>',
+                    )
+                })
+
+                test('channel suggestions HTML output is correct', () => {
+                    expect(
+                        htmlSerializer.serialize(`Question: What's the best channel on Twist?
 Answer: [Doist Frontend](channel://190200)`),
-                ).toBe(
-                    '<p>Question: What\'s the best channel on Twist?<br>Answer: <span data-channel="" data-id="190200" data-label="Doist Frontend"></span></p>',
-                )
+                    ).toBe(
+                        '<p>Question: What\'s the best channel on Twist?<br>Answer: <span data-channel="" data-id="190200" data-label="Doist Frontend"></span></p>',
+                    )
+                })
+            })
+
+            describe('with the `Link` extension disabled', () => {
+                let htmlSerializer: HTMLSerializerReturnType
+
+                beforeEach(() => {
+                    htmlSerializer = createHTMLSerializer(
+                        getSchema([
+                            RichTextKit.configure({
+                                link: false,
+                            }),
+                            createSuggestionExtension('mention'),
+                            createSuggestionExtension('channel'),
+                        ]),
+                    )
+                })
+
+                test('mention suggestions HTML output is correct', () => {
+                    expect(
+                        htmlSerializer.serialize(`Question: Who's the head of the Frontend team?
+Answer: [Henning M](mention://963827)`),
+                    ).toBe(
+                        '<p>Question: Who\'s the head of the Frontend team?<br>Answer: <span data-mention="" data-id="963827" data-label="Henning M"></span></p>',
+                    )
+                })
+
+                test('channel suggestions HTML output is correct', () => {
+                    expect(
+                        htmlSerializer.serialize(`Question: What's the best channel on Twist?
+Answer: [Doist Frontend](channel://190200)`),
+                    ).toBe(
+                        '<p>Question: What\'s the best channel on Twist?<br>Answer: <span data-channel="" data-id="190200" data-label="Doist Frontend"></span></p>',
+                    )
+                })
             })
         })
     })
diff --git a/src/serializers/html/html.ts b/src/serializers/html/html.ts
index cf90531e..17f48c32 100644
--- a/src/serializers/html/html.ts
+++ b/src/serializers/html/html.ts
@@ -3,9 +3,11 @@ import { marked } from 'marked'
 
 import { REGEX_LINE_BREAKS } from '../../constants/regular-expressions'
 import { isPlainTextDocument } from '../../helpers/schema'
+import { buildSuggestionSchemaPartialRegex } from '../../helpers/serializer'
 
 import { checkbox } from './extensions/checkbox'
 import { code } from './extensions/code'
+import { disabled } from './extensions/disabled'
 import { html } from './extensions/html'
 import { link } from './extensions/link'
 import { paragraph } from './extensions/paragraph'
@@ -33,6 +35,7 @@ type HTMLSerializerReturnType = {
  * @see https://marked.js.org/using_advanced#options
  */
 const INITIAL_MARKED_OPTIONS: marked.MarkedOptions = {
+    ...marked.getDefaults(),
     breaks: true,
     gfm: true,
     headerIds: false,
@@ -87,40 +90,11 @@ function createHTMLSerializer(schema: Schema): HTMLSerializerReturnType {
         return createHTMLSerializerForPlainTextEditor(schema)
     }
 
-    // Reset Marked to the defaults and set custom options
-    marked.setOptions({
-        ...marked.getDefaults(),
-        ...INITIAL_MARKED_OPTIONS,
-    })
-
-    // Disable built-in rules that the editor does not yet support
-    marked.use({
-        // eslint-disable-next-line @typescript-eslint/ban-ts-comment
-        // @ts-ignore: Returning `undefined` is acceptable to disable tokens
-        tokenizer: {
-            ...(!schema.marks.strike
-                ? {
-                      del() {
-                          /* noop: disables tokenizer */
-                      },
-                  }
-                : {}),
-            ...(!schema.nodes.heading
-                ? {
-                      heading() {
-                          /* noop: disables tokenizer */
-                      },
-                  }
-                : {}),
-            ...(!schema.nodes.table
-                ? {
-                      table() {
-                          /* noop: disables tokenizer */
-                      },
-                  }
-                : {}),
-        },
-    })
+    // Reset Marked instance to the initial options
+    marked.setOptions(INITIAL_MARKED_OPTIONS)
+
+    // Disable built-in rules that are not supported by the schema
+    marked.use(disabled(schema))
 
     // Overwrite some built-in rules for handling of special behaviours
     // (see documentation for each extension for more details)
@@ -136,14 +110,12 @@ function createHTMLSerializer(schema: Schema): HTMLSerializerReturnType {
         marked.use(taskList)
     }
 
-    // Get all the available suggestion nodes from the schema
-    const suggestionNodes = Object.values(schema.nodes).filter((node) =>
-        node.name.endsWith('Suggestion'),
-    )
+    // Build a partial regular expression from the suggestion nodes available in the schema
+    const suggestionSchemaPartialRegex = buildSuggestionSchemaPartialRegex(schema)
 
     // Overwrite the built-in link rule if any suggestion node exists in the schema
-    if (suggestionNodes.length > 0) {
-        marked.use(link(suggestionNodes))
+    if (suggestionSchemaPartialRegex) {
+        marked.use(link(new RegExp(`^${suggestionSchemaPartialRegex}`)))
     }
 
     return {
@@ -163,6 +135,6 @@ function createHTMLSerializer(schema: Schema): HTMLSerializerReturnType {
     }
 }
 
-export { createHTMLSerializer }
+export { createHTMLSerializer, INITIAL_MARKED_OPTIONS }
 
 export type { HTMLSerializerReturnType }
diff --git a/src/serializers/markdown/markdown.ts b/src/serializers/markdown/markdown.ts
index 7119599b..8f7c5261 100644
--- a/src/serializers/markdown/markdown.ts
+++ b/src/serializers/markdown/markdown.ts
@@ -89,6 +89,10 @@ const INITIAL_TURNDOWN_OPTIONS: Turndown.Options = {
  * a plain-text editor. The editor schema is used to detect which nodes and marks are available in
  * the editor, and only parses the input with the minimal required rules.
  *
+ * **Note:** Unlike the HTML serializer, built-in rules not supported by the schema are not
+ * disabled here: when the schema lacks certain nodes/marks, the editor HTML output never contains
+ * the corresponding elements, so those rules have nothing to match.
+ *
  * @param schema The editor schema to be used for nodes and marks detection.
  *
  * @returns A normalized object for the Markdown serializer.