1
0
mirror of synced 2025-12-19 18:10:59 -05:00
Files
docs/src/automated-pipelines/lib/update-markdown.ts
2025-07-09 18:12:39 +00:00

547 lines
19 KiB
TypeScript

import walk from 'walk-sync'
import { existsSync, lstatSync, unlinkSync } from 'fs'
import path from 'path'
import { readFile, writeFile, readdir } from 'fs/promises'
import matter from 'gray-matter'
import { rimraf } from 'rimraf'
import { mkdirp } from 'mkdirp'
import { difference, isEqual } from 'lodash-es'
import { allVersions } from '@/versions/lib/all-versions'
import getApplicableVersions from '@/versions/lib/get-applicable-versions.js'
import type { MarkdownFrontmatter } from '@/types'
// Type definitions - extending existing type to add missing fields and make most fields optional
type FrontmatterData = Partial<MarkdownFrontmatter> & {
autogenerated?: string
[key: string]: any
}
type SourceContentItem = {
data: FrontmatterData
content: string
}
type SourceContent = {
[key: string]: SourceContentItem
}
type IndexOrder = {
[key: string]: {
startsWith?: string[]
}
}
type UpdateContentDirectoryOptions = {
targetDirectory: string
sourceContent: SourceContent
frontmatter: FrontmatterData
indexOrder?: IndexOrder
}
type UpdateDirectoryOptions = {
rootDirectoryOnly?: boolean
shortTitle?: boolean
indexOrder?: IndexOrder
}
type ChildUpdates = {
itemsToAdd: string[]
itemsToRemove: string[]
}
type DirectoryInfo = {
directoryContents: string[]
directoryFiles: string[]
childDirectories: string[]
}
type ChildrenComparison = {
childrenOnDisk: string[]
indexChildren: string[]
}
const ROOT_INDEX_FILE = 'content/index.md'
export const MARKDOWN_COMMENT = '\n<!-- Content after this section is automatically generated -->\n'
// Main entrypoint into this module. This function adds, removes, and updates
// versions frontmatter in all directories under the targetDirectory.
export async function updateContentDirectory({
targetDirectory,
sourceContent,
frontmatter,
indexOrder,
}: UpdateContentDirectoryOptions): Promise<void> {
const sourceFiles = Object.keys(sourceContent)
await createDirectory(targetDirectory)
await removeMarkdownFiles(targetDirectory, sourceFiles, frontmatter.autogenerated)
await updateMarkdownFiles(targetDirectory, sourceContent, frontmatter, indexOrder)
}
// Remove markdown files that are no longer in the source data
async function removeMarkdownFiles(
targetDirectory: string,
sourceFiles: string[],
autogeneratedType: string | undefined,
): Promise<void> {
// Copy the autogenerated Markdown files to the target directory
const autogeneratedFiles = await getAutogeneratedFiles(targetDirectory, autogeneratedType)
// If the first array contains items that the second array does not,
// it means that a Markdown page was deleted from the OpenAPI schema
const filesToRemove = difference(autogeneratedFiles, sourceFiles)
// Markdown files that need to be deleted
for (const file of filesToRemove) {
unlinkSync(file)
}
}
// Gets a list of all files under targetDirectory that have the
// `autogenerated` frontmatter set to `autogeneratedType`.
async function getAutogeneratedFiles(
targetDirectory: string,
autogeneratedType: string | undefined,
): Promise<string[]> {
const files = walk(targetDirectory, {
includeBasePath: true,
directories: false,
globs: ['**/*.md'],
ignore: ['**/README.md', '**/index.md'],
})
return (
await Promise.all(
files.map(async (file: string) => {
const { data } = matter(await readFile(file, 'utf-8'))
if (data.autogenerated === autogeneratedType) {
return file
}
}),
)
).filter(Boolean) as string[]
}
// The `sourceContent` object contains the new content and target file
// path for the Markdown files. Ex:
// { <targetFile>: { data: <frontmatter>, content: <markdownContent> } }
async function updateMarkdownFiles(
targetDirectory: string,
sourceContent: SourceContent,
frontmatter: FrontmatterData,
indexOrder: IndexOrder = {},
): Promise<void> {
for (const [file, newContent] of Object.entries(sourceContent)) {
await updateMarkdownFile(file, newContent.data, newContent.content)
}
// This function recursively updates the index.md files in each
// of the directories under targetDirectory
await updateDirectory(targetDirectory, frontmatter, { indexOrder })
// We don't want to update directories that the pipelines don't affect
// so we make one call to update only the root index.md file
// in targetDirectory to prevent any unintended changes
await updateDirectory(path.dirname(targetDirectory), frontmatter, { rootDirectoryOnly: true })
}
// If the Markdown file already exists on disk, we only update the
// content and version frontmatter to allow writers to manually
// edit the modifiable content of the file. If the Markdown file doesn't
// exists, we create a new Markdown file.
async function updateMarkdownFile(
file: string,
sourceData: FrontmatterData,
sourceContent: string,
commentDelimiter: string = MARKDOWN_COMMENT,
): Promise<void> {
if (existsSync(file)) {
// update only the versions property of the file, assuming
// the other properties have already been added and edited
const { data, content } = matter(await readFile(file, 'utf-8'))
// Double check that the comment delimiter is only used once
const matcher = new RegExp(commentDelimiter, 'g')
const matches = content.match(matcher)
if (matches && matches.length > 1) {
throw new Error(`Error: ${file} has multiple comment delimiters`)
}
const [manuallyCreatedContent, automatedContent] = matches
? content.split(commentDelimiter)
: [content, '']
const isDelimiterMissing = !matches
const isContentSame = automatedContent === sourceContent
const isVersionsSame = isEqual(sourceData.versions, data.versions)
// Only proceed if the content or versions have changed
if (isContentSame && isVersionsSame && !isDelimiterMissing) {
return
}
// Create a new object so that we don't mutate the original data
const newData = { ...data }
// Only modify the versions property when a file already exists
newData.versions = sourceData.versions
const targetContent = manuallyCreatedContent + commentDelimiter + sourceContent
const newFileContent = appendVersionComment(matter.stringify(targetContent, newData))
await writeFile(file, newFileContent)
} else {
await createDirectory(path.dirname(file))
const newFileContent = appendVersionComment(
matter.stringify(commentDelimiter + sourceContent, sourceData),
)
await writeFile(file, newFileContent)
}
}
// Recursively walks through the directory structure and updates the
// index.md files to match the disk. Before calling this function
// ensure that the Markdown files have been updated and any files
// that need to be deleted have been removed.
async function updateDirectory(
directory: string,
frontmatter: FrontmatterData,
{ rootDirectoryOnly = false, shortTitle = false, indexOrder = {} }: UpdateDirectoryOptions = {},
): Promise<void> {
const initialDirectoryListing = await getDirectoryInfo(directory)
// If there are no children on disk, remove the directory
if (initialDirectoryListing.directoryContents.length === 0 && !rootDirectoryOnly) {
await rimraf(directory)
return
}
// Recursively update child directories
if (!rootDirectoryOnly) {
await Promise.all(
initialDirectoryListing.childDirectories.map(async (subDirectory) => {
await updateDirectory(`${directory}/${subDirectory}`, frontmatter, { indexOrder })
}),
)
}
const indexFile = `${directory}/index.md`
const { data, content } = await getIndexFileContents(indexFile, frontmatter, shortTitle)
// We need to re-get the directory contents because a recursive call
// may have removed a directory since the initial directory read.
const { directoryContents, childDirectories, directoryFiles } = await getDirectoryInfo(directory)
const { childrenOnDisk, indexChildren } = getChildrenToCompare(
indexFile,
directoryContents,
data.children || [],
)
const itemsToAdd = difference(childrenOnDisk, indexChildren)
const itemsToRemove = difference(indexChildren, childrenOnDisk)
if (itemsToRemove.length === 0 && itemsToAdd.length === 0) {
return
}
if (!rootDirectoryOnly) {
// Update the versions in the index.md file to match the directory contents
directoryFiles.push(...childDirectories.map((dir) => path.join(dir, 'index.md')))
const newVersions = await getIndexFileVersions(directory, directoryFiles)
const isVersionEqual = isEqual(newVersions, data.versions)
if (!isVersionEqual) {
data.versions = newVersions
}
}
// Update the index.md file contents and write the file to disk
const dataUpdatedChildren = updateIndexChildren(
data,
{ itemsToAdd, itemsToRemove },
indexFile,
indexOrder,
isRootIndexFile(indexFile),
)
await writeFile(indexFile, matter.stringify(content, dataUpdatedChildren))
}
// Takes the children properties from the index.md file and the
// files/directories on disk and normalizes them to be comparable
// against each other.
// Children properties include a leading slash except when the
// index.md file is the root index.md file. We also want to
// remove the file extension from the files on disk.
function getChildrenToCompare(
indexFile: string,
directoryContents: string[],
fmChildren: string[] | undefined,
): ChildrenComparison {
if (!fmChildren) {
throw new Error(`No children property found in ${indexFile}`)
}
const isEarlyAccess = (item: string) => isRootIndexFile(indexFile) && item === 'early-access'
// Get the list of children from the directory contents
const childrenOnDisk = directoryContents
.map((file) => `${path.basename(file, '.md')}`)
.filter((item) => !isEarlyAccess(item))
const indexChildren = fmChildren
.map((child) => child.replace('/', ''))
.filter((item) => !isEarlyAccess(item))
return { childrenOnDisk, indexChildren }
}
// Adds and removes children properties to the index.md file.
// There are three possible scenarios that we want to handle:
//
// 1. If the lib/config.json file for the pipeline defines a sort
// order for the index file we're currently processing, then
// we want to use that sort order. Currently, the config files
// only defined a startsWith parameter. This property defines
// the order of the first items in the index files children
// property. All other items are sorted and appended to list.
//
// 2. If not config is defined and the index file is an
// autogenerated file, we sort all the children alphabetically.
//
// 3. If the index file is not autogenerated, we leave the ordering
// as is and append new children to the end.
function updateIndexChildren(
data: FrontmatterData,
childUpdates: ChildUpdates,
indexFile: string,
indexOrder: IndexOrder,
rootIndex: boolean = false,
): FrontmatterData {
const { itemsToAdd, itemsToRemove } = childUpdates
const childPrefix = rootIndex ? '' : '/'
// Get a new list of children with added and removed items
const children = [...(data.children || [])]
// remove the '/' prefix used in index.md children
.map((item) => item.replace(childPrefix, ''))
.filter((item) => !itemsToRemove.includes(item))
children.push(...itemsToAdd)
const orderedIndexChildren: string[] = []
// Only used for tests. During testing, the content directory is
// in a temp directory so the paths are not relative to
// the current working directory. This gets the relative path
// from the full path to the index file.
const indexRelativePath = process.env.TEST_OS_ROOT_DIR
? indexFile.replace(`${process.env.TEST_OS_ROOT_DIR}/`, '')
: indexFile
const indexOrderConfig = indexOrder[indexRelativePath]
const isAutogenerated = data.autogenerated
if (indexOrderConfig && isAutogenerated) {
if (indexOrderConfig.startsWith) {
const sortableChildren = difference(children, indexOrderConfig.startsWith).sort()
orderedIndexChildren.push(...indexOrderConfig.startsWith, ...sortableChildren)
}
} else if (isAutogenerated) {
// always sort autogenerated index files that have no override config
orderedIndexChildren.push(...children)
orderedIndexChildren.sort()
} else {
// just leave the children in the order they are in the index file
// so they can be manually sorted
orderedIndexChildren.push(...children)
}
const updatedData = { ...data }
// add the '/' prefix back to the children
updatedData.children = orderedIndexChildren.map((item) => `${childPrefix}${item}`)
return updatedData
}
// Gets the contents of the index.md file from disk if it exits or
// creates a new index.md file with the default frontmatter.
async function getIndexFileContents(
indexFile: string,
frontmatter: FrontmatterData,
shortTitle: boolean = false,
): Promise<{ data: FrontmatterData; content: string }> {
const directory = path.dirname(indexFile)
const indexFileContent = {
data: {
title: path.basename(directory),
...frontmatter,
children: [],
},
content: '',
}
if (shortTitle) {
indexFileContent.data.shortTitle = path.basename(directory)
}
return existsSync(indexFile) ? matter(await readFile(indexFile, 'utf-8')) : indexFileContent
}
// Builds the index.md versions frontmatter by consolidating
// the versions from each Markdown file in the directory + the
// index.md files in any subdirectories of directory.
async function getIndexFileVersions(
directory: string,
files: string[],
): Promise<{ [key: string]: string }> {
const versions = new Set<string>()
await Promise.all(
files.map(async (file) => {
const filepath = path.join(directory, file)
if (!existsSync(filepath)) {
throw new Error(
`File ${filepath} does not exist while assembling directory index.md files to create parent version.`,
)
}
// If not a markdown(x) file, skip it
if (!file.endsWith('.md') && !file.endsWith('.mdx')) {
return
}
const { data } = matter(await readFile(filepath, 'utf-8'))
if (!data || !data.versions) {
throw new Error(`Frontmatter in ${filepath} does not contain versions.`)
}
const fmVersions = getApplicableVersions(data.versions)
fmVersions.forEach((version: string) => versions.add(version))
}),
)
const versionArray = [...versions]
return await convertVersionsToFrontmatter(versionArray)
}
/* Takes a list of versions in the format:
[
'free-pro-team@latest',
'enterprise-cloud@latest',
'enterprise-server@3.3',
'enterprise-server@3.4',
'enterprise-server@3.5',
'enterprise-server@3.6',
'enterprise-server@3.7'
]
and returns the frontmatter equivalent JSON:
{
fpt: '*',
ghec: '*',
ghes: '*'
}
*/
export async function convertVersionsToFrontmatter(
versions: string[],
): Promise<{ [key: string]: string }> {
const frontmatterVersions: { [key: string]: string } = {}
const numberedReleases: { [key: string]: { availableReleases: (string | undefined)[] } } = {}
// Currently, only GHES is numbered. Number releases have to be
// handled differently because they use semantic versioning.
versions.forEach((version) => {
const docsVersion = allVersions[version]
if (!docsVersion.hasNumberedReleases) {
frontmatterVersions[docsVersion.shortName] = '*'
} else {
// Each version that has numbered releases in allVersions
// has a string for the number (currentRelease) and an array
// of all of the available releases (e.g. ['3.3', '3.4', '3.5'])
// This creates an array of the applicable releases in the same
// order as the available releases array. This is used to track when
// a release is no longer supported.
const i = docsVersion.releases.indexOf(docsVersion.currentRelease)
if (!numberedReleases[docsVersion.shortName]) {
const availableReleases: (string | undefined)[] = Array(docsVersion.releases.length).fill(
undefined,
)
availableReleases[i] = docsVersion.currentRelease
numberedReleases[docsVersion.shortName] = {
availableReleases,
}
} else {
numberedReleases[docsVersion.shortName].availableReleases[i] = docsVersion.currentRelease
}
}
})
// Create semantic versions for numbered releases
Object.keys(numberedReleases).forEach((key) => {
const availableReleases = numberedReleases[key].availableReleases
const versionContinuity = checkVersionContinuity(availableReleases)
if (availableReleases.every(Boolean)) {
frontmatterVersions[key] = '*'
} else if (!versionContinuity) {
// If there happens to be version gaps, just enumerate each version
// using syntax like =3.x || =3.x
const semVer = availableReleases
.filter(Boolean)
.map((release) => `=${release}`)
.join(' || ')
frontmatterVersions[key] = semVer
} else {
const semVer: string[] = []
if (!availableReleases[availableReleases.length - 1]) {
const startVersion = availableReleases.filter(Boolean).pop()
semVer.push(`>=${startVersion}`)
}
if (!availableReleases[0]) {
const endVersion = availableReleases.filter(Boolean).shift()
semVer.push(`<=${endVersion}`)
}
frontmatterVersions[key] = semVer.join(' ')
}
})
const sortedFrontmatterVersions = Object.keys(frontmatterVersions)
.sort()
.reduce((acc: { [key: string]: string }, key) => {
acc[key] = frontmatterVersions[key]
return acc
}, {})
return sortedFrontmatterVersions
}
// This is uncommon, but we potentially could have the case where an
// article was versioned for say 3.2, not for 3.3, and then again
// versioned for 3.4. This will result in a custom semantic version range
function checkVersionContinuity(versions: (string | undefined)[]): boolean {
const availableVersions = [...versions]
// values at the beginning or end of the array are not gaps but normal
// starts and ends of version ranges
while (!availableVersions[0]) {
availableVersions.shift()
}
while (!availableVersions[availableVersions.length - 1]) {
availableVersions.pop()
}
return availableVersions.every(Boolean)
}
// Returns true if the indexFile is the root index.md file
function isRootIndexFile(indexFile: string): boolean {
return indexFile === ROOT_INDEX_FILE
}
// Creates a new directory if it doesn't exist
async function createDirectory(targetDirectory: string): Promise<void> {
if (!existsSync(targetDirectory)) {
await mkdirp(targetDirectory)
}
}
async function getDirectoryInfo(directory: string): Promise<DirectoryInfo> {
if (!existsSync(directory)) {
throw new Error(`Directory ${directory} did not exist when attempting to get directory info.`)
}
const directoryContents = (await readdir(directory)).filter(
(file) => file !== 'README.md' && file !== 'index.md',
)
const childDirectories = directoryContents.filter((item) =>
lstatSync(`${directory}/${item}`).isDirectory(),
)
const directoryFiles = difference(directoryContents, childDirectories)
return { directoryContents, directoryFiles, childDirectories }
}
function appendVersionComment(stringifiedContent: string): string {
return stringifiedContent.replace(
'\nversions:\n',
`\nversions: # DO NOT MANUALLY EDIT. CHANGES WILL BE OVERWRITTEN BY A 🤖\n`,
)
}