From 49bd13d2595aecfa25b1bb9f10c05bf89af483db Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jind=C5=99ich=20B=C3=A4r?= Date: Thu, 12 Dec 2024 13:51:26 +0100 Subject: [PATCH] fix: parse project changelogs with `remark` (#1342) This PR adds actual parsing of the Markdown content instead of using RegExp-based transformations. This mitigates the problems with mismatched token delimiters (nested Markdown links etc.). Fixes the documentation build in https://github.com/apify/apify-client-js (which in turn unblocks the releases there). related to https://github.com/facebook/docusaurus/issues/10739 --- apify-docs-theme/package.json | 6 +- apify-docs-theme/src/markdown.js | 137 ++++++++++++++++++++++++++----- package-lock.json | 64 ++++++++++++++- 3 files changed, 186 insertions(+), 21 deletions(-) diff --git a/apify-docs-theme/package.json b/apify-docs-theme/package.json index 1e60c7b6c..bdf396e35 100644 --- a/apify-docs-theme/package.json +++ b/apify-docs-theme/package.json @@ -26,7 +26,11 @@ "babel-loader": "^9.1.3", "docusaurus-gtm-plugin": "^0.0.2", "postcss-preset-env": "^9.3.0", - "prism-react-renderer": "^2.0.6" + "prism-react-renderer": "^2.0.6", + "remark-parse": "^11.0.0", + "remark-stringify": "^11.0.0", + "unified": "^11.0.5", + "unist-util-visit-parents": "^3.1.1" }, "peerDependencies": { "clsx": "*", diff --git a/apify-docs-theme/src/markdown.js b/apify-docs-theme/src/markdown.js index de9504d73..d1d5b295b 100644 --- a/apify-docs-theme/src/markdown.js +++ b/apify-docs-theme/src/markdown.js @@ -1,33 +1,132 @@ +const remarkParse = require('remark-parse'); +const remarkStringify = require('remark-stringify'); +const { unified } = require('unified'); +const visitParents = require('unist-util-visit-parents'); + +/** + * Updates the markdown content for better UX and compatibility with Docusaurus v3. + * @param {string} changelog The markdown content. + * @returns {string} The updated markdown content. + */ function updateChangelog(changelog) { + const pipeline = unified() + .use(remarkParse) + .use(incrementHeadingLevels) + .use(prettifyPRLinks) + .use(linkifyUserTags) + .use(remarkStringify); + + changelog = pipeline.processSync(changelog).toString(); changelog = addFrontmatter(changelog); - changelog = pushHeadings(changelog); - changelog = fixUserLinks(changelog); - changelog = fixPRLinks(changelog); changelog = escapeMDXCharacters(changelog); return changelog; } -function addFrontmatter(changelog, header = 'Changelog') { - return `--- -title: ${header} -sidebar_label: ${header} -toc_max_heading_level: 2 ---- -${changelog}`; -} +/** + * Bumps the headings levels in the markdown content. This function increases the depth + * of all headings in the content by 1. This is useful when the content is included in + * another markdown file with a higher-level heading. + * @param {*} tree Remark AST tree. + * @returns {void} Nothing. This function modifies the tree in place. + */ +const incrementHeadingLevels = () => (tree) => { + visitParents(tree, 'heading', (node) => { + node.depth += 1; + }); +}; -function pushHeadings(changelog) { - return changelog.replaceAll(/\n#[^#]/g, '\n## '); -} +/** + * Links user tags in the markdown content. This function replaces the user tags + * (e.g. `@username`) with a link to the user's GitHub profile (just like GitHub's UI). + * @param {*} tree Remark AST tree. + * @returns {void} Nothing. This function modifies the tree in place. + */ +const linkifyUserTags = () => (tree) => { + visitParents(tree, 'text', (node, parents) => { + const userTagRegex = /@([a-zA-Z0-9-]+)(\s|$)/g; + const match = userTagRegex.exec(node.value); -function fixUserLinks(changelog) { - return changelog.replaceAll(/by @([a-zA-Z0-9-]+)/g, 'by [@$1](https://github.com/$1)'); -} + if (!match) return; + + const directParent = parents[parents.length - 1]; + const nodeIndexInParent = directParent.children.findIndex((x) => x === node); + + const username = match[1]; + const ending = match[2] === ' ' ? ' ' : ''; + const before = node.value.slice(0, match.index); + const after = node.value.slice(userTagRegex.lastIndex); -function fixPRLinks(changelog) { - return changelog.replaceAll(/(((https?:\/\/)?(www.)?)?github.com\/[^\s]*?\/pull\/([0-9]+))/g, '[#$5]($1)'); + const link = { + type: 'link', + url: `https://github.com/${username}`, + children: [{ type: 'text', value: `@${username}` }], + }; + node.value = before; + directParent.children.splice(nodeIndexInParent + 1, 0, link); + + if (!after) return nodeIndexInParent + 2; + + directParent.children.splice(nodeIndexInParent + 2, 0, { type: 'text', value: `${ending}${after}` }); + return nodeIndexInParent + 3; + }); +}; + +/** + * Prettifies PR links in the markdown content. Just like GitHub's UI, this function + * replaces the full PR URL with a link represented by the PR number (prefixed by a hashtag). + * @param {*} tree Remark AST tree. + * @returns {void} Nothing. This function modifies the tree in place. + */ +const prettifyPRLinks = () => (tree) => { + visitParents(tree, 'text', (node, parents) => { + const prLinkRegex = /https:\/\/github.com\/[^\s]+\/pull\/(\d+)/g; + const match = prLinkRegex.exec(node.value); + + if (!match) return; + + const directParent = parents[parents.length - 1]; + const nodeIndexInParent = directParent.children.findIndex((x) => x === node); + + const prNumber = match[1]; + const before = node.value.slice(0, match.index); + const after = node.value.slice(prLinkRegex.lastIndex); + + const link = { + type: 'link', + url: match[0], + children: [{ type: 'text', value: `#${prNumber}` }], + }; + node.value = before; + + directParent.children.splice(nodeIndexInParent + 1, 0, link); + if (!after) return nodeIndexInParent + 1; + + directParent.children.splice(nodeIndexInParent + 2, 0, { type: 'text', value: after }); + return nodeIndexInParent + 2; + }); +}; + +/** + * Adds frontmatter to the markdown content. + * @param {string} changelog The markdown content. + * @param {string} title The frontmatter title. + * @returns {string} The markdown content with frontmatter. + */ +function addFrontmatter(changelog, title = 'Changelog') { + return `--- +title: ${title} +sidebar_label: ${title} +toc_max_heading_level: 3 +--- +${changelog}`; } +/** + * Escapes the MDX-related characters in the markdown content. + * This is required by Docusaurus v3 and its dependencies (see the v3 [migration guide](https://docusaurus.io/docs/migration/v3#common-mdx-problems)). + * @param {string} changelog The markdown content. + * @returns {string} The markdown content with escaped MDX characters. + */ function escapeMDXCharacters(changelog) { return changelog.replaceAll(/<|>/g, (match) => { return match === '<' ? '<' : '>'; diff --git a/package-lock.json b/package-lock.json index be60408ad..d1864da3c 100644 --- a/package-lock.json +++ b/package-lock.json @@ -84,7 +84,11 @@ "babel-loader": "^9.1.3", "docusaurus-gtm-plugin": "^0.0.2", "postcss-preset-env": "^9.3.0", - "prism-react-renderer": "^2.0.6" + "prism-react-renderer": "^2.0.6", + "remark-parse": "^11.0.0", + "remark-stringify": "^11.0.0", + "unified": "^11.0.5", + "unist-util-visit-parents": "^3.1.1" }, "peerDependencies": { "clsx": "*", @@ -20007,6 +20011,20 @@ "integrity": "sha512-CmBKiL6NNo/OqgmMn95Fk9Whlp2mtvIv+KNpQKN2F4SjvrEesubTRWGYSg+BnWZOnlCaSTU1sMpsBOzgbYhnsA==", "license": "MIT" }, + "node_modules/mdast-util-directive/node_modules/unist-util-visit-parents": { + "version": "6.0.1", + "resolved": "https://registry.npmjs.org/unist-util-visit-parents/-/unist-util-visit-parents-6.0.1.tgz", + "integrity": "sha512-L/PqWzfTP9lzzEa6CKs0k2nARxTdZduw3zyh8d2NVBnsyvHjSX4TWse388YrrQKbvI8w20fGjGlhgT96WwKykw==", + "license": "MIT", + "dependencies": { + "@types/unist": "^3.0.0", + "unist-util-is": "^6.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, "node_modules/mdast-util-find-and-replace": { "version": "3.0.1", "resolved": "https://registry.npmjs.org/mdast-util-find-and-replace/-/mdast-util-find-and-replace-3.0.1.tgz", @@ -20044,6 +20062,20 @@ "url": "https://github.com/sponsors/sindresorhus" } }, + "node_modules/mdast-util-find-and-replace/node_modules/unist-util-visit-parents": { + "version": "6.0.1", + "resolved": "https://registry.npmjs.org/unist-util-visit-parents/-/unist-util-visit-parents-6.0.1.tgz", + "integrity": "sha512-L/PqWzfTP9lzzEa6CKs0k2nARxTdZduw3zyh8d2NVBnsyvHjSX4TWse388YrrQKbvI8w20fGjGlhgT96WwKykw==", + "license": "MIT", + "dependencies": { + "@types/unist": "^3.0.0", + "unist-util-is": "^6.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, "node_modules/mdast-util-from-markdown": { "version": "0.8.5", "resolved": "https://registry.npmjs.org/mdast-util-from-markdown/-/mdast-util-from-markdown-0.8.5.tgz", @@ -33213,6 +33245,36 @@ } }, "node_modules/unist-util-visit-parents": { + "version": "3.1.1", + "resolved": "https://registry.npmjs.org/unist-util-visit-parents/-/unist-util-visit-parents-3.1.1.tgz", + "integrity": "sha512-1KROIZWo6bcMrZEwiH2UrXDyalAa0uqzWCxCJj6lPOvTve2WkfgCytoDTPaMnodXh1WrXOq0haVYHj99ynJlsg==", + "license": "MIT", + "dependencies": { + "@types/unist": "^2.0.0", + "unist-util-is": "^4.0.0" + }, + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, + "node_modules/unist-util-visit-parents/node_modules/@types/unist": { + "version": "2.0.11", + "resolved": "https://registry.npmjs.org/@types/unist/-/unist-2.0.11.tgz", + "integrity": "sha512-CmBKiL6NNo/OqgmMn95Fk9Whlp2mtvIv+KNpQKN2F4SjvrEesubTRWGYSg+BnWZOnlCaSTU1sMpsBOzgbYhnsA==", + "license": "MIT" + }, + "node_modules/unist-util-visit-parents/node_modules/unist-util-is": { + "version": "4.1.0", + "resolved": "https://registry.npmjs.org/unist-util-is/-/unist-util-is-4.1.0.tgz", + "integrity": "sha512-ZOQSsnce92GrxSqlnEEseX0gi7GH9zTJZ0p9dtu87WRb/37mMPO2Ilx1s/t9vBHrFhbgweUwb+t7cIn5dxPhZg==", + "license": "MIT", + "funding": { + "type": "opencollective", + "url": "https://opencollective.com/unified" + } + }, + "node_modules/unist-util-visit/node_modules/unist-util-visit-parents": { "version": "6.0.1", "resolved": "https://registry.npmjs.org/unist-util-visit-parents/-/unist-util-visit-parents-6.0.1.tgz", "integrity": "sha512-L/PqWzfTP9lzzEa6CKs0k2nARxTdZduw3zyh8d2NVBnsyvHjSX4TWse388YrrQKbvI8w20fGjGlhgT96WwKykw==",