1
0
mirror of synced 2025-12-19 18:10:59 -05:00
Files
docs/src/automated-pipelines/lib/update-markdown.js
dependabot[bot] 50dcd77129 Bump rimraf from 4.1.2 to 5.0.0 (#36328)
Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
Co-authored-by: Grace Park <gracepark@github.com>
2023-04-12 20:19:14 +00:00

450 lines
17 KiB
JavaScript

import walk from 'walk-sync'
import { existsSync, lstatSync, unlinkSync } from 'fs'
import path from 'path'
import { readFile, writeFile, readdir } from 'fs/promises'
import matter from 'gray-matter'
import { rimraf } from 'rimraf'
import { mkdirp } from 'mkdirp'
import { difference, isEqual } from 'lodash-es'
import { allVersions } from '../../../lib/all-versions.js'
import getApplicableVersions from '../../../lib/get-applicable-versions.js'
const ROOT_INDEX_FILE = 'content/index.md'
export const MARKDOWN_COMMENT = '\n<!-- Content after this section is automatically generated -->\n'
// Main entrypoint into this module. This function adds, removes, and updates
// versions frontmatter in all directories under the targetDirectory.
export async function updateContentDirectory({
targetDirectory,
sourceContent,
frontmatter,
indexOrder,
}) {
const sourceFiles = Object.keys(sourceContent)
await createDirectory(targetDirectory)
await removeMarkdownFiles(targetDirectory, sourceFiles, frontmatter.autogenerated)
await updateMarkdownFiles(targetDirectory, sourceContent, frontmatter, indexOrder)
}
// Remove markdown files that are no longer in the source data
async function removeMarkdownFiles(targetDirectory, sourceFiles, autogeneratedType) {
// Copy the autogenerated Markdown files to the target directory
const autogeneratedFiles = await getAutogeneratedFiles(targetDirectory, autogeneratedType)
// If the first array contains items that the second array does not,
// it means that a Markdown page was deleted from the OpenAPI schema
const filesToRemove = difference(autogeneratedFiles, sourceFiles)
// Markdown files that need to be deleted
for (const file of filesToRemove) {
unlinkSync(file)
}
}
// Gets a list of all files under targetDirectory that have the
// `autogenerated` frontmatter set to `autogeneratedType`.
async function getAutogeneratedFiles(targetDirectory, autogeneratedType) {
const files = walk(targetDirectory, {
includeBasePath: true,
childDirectories: false,
globs: ['**/*.md'],
ignore: ['**/README.md', '**/index.md'],
})
return (
await Promise.all(
files.map(async (file) => {
const { data } = matter(await readFile(file, 'utf-8'))
if (data.autogenerated === autogeneratedType) {
return file
}
})
)
).filter(Boolean)
}
// The `sourceContent` object contains the new content and target file
// path for the Markdown files. Ex:
// { <targetFile>: { data: <frontmatter>, content: <markdownContent> } }
async function updateMarkdownFiles(targetDirectory, sourceContent, frontmatter, indexOrder = {}) {
for (const [file, newContent] of Object.entries(sourceContent)) {
await updateMarkdownFile(file, newContent.data, newContent.content)
}
// This function recursively updates the index.md files in each
// of the directories under targetDirectory
await updateDirectory(targetDirectory, frontmatter, { indexOrder })
// We don't want to update directories that the pipelines don't affect
// so we make one call to update only only the root index.md file
// in targetDirectory to prevent any unintended changes
await updateDirectory(path.dirname(targetDirectory), frontmatter, { rootDirectoryOnly: true })
}
// If the Markdown file already exists on disk, we only update the
// content and version frontmatter to allow writers to manually
// edit the modifiable content of the file. If the Markdown file doesn't
// exists, we create a new Markdown file.
async function updateMarkdownFile(
file,
sourceData,
sourceContent,
commentDelimiter = MARKDOWN_COMMENT
) {
if (existsSync(file)) {
// update only the versions property of the file, assuming
// the other properties have already been added and edited
const { data, content } = matter(await readFile(file, 'utf-8'))
// Double check that the comment delimiter is only used once
const matcher = new RegExp(commentDelimiter, 'g')
const matches = content.match(matcher)
if (matches && matches.length > 1) {
throw new Error(`Error: ${file} has multiple comment delimiters`)
}
const [manuallyCreatedContent, automatedContent] = matches
? content.split(commentDelimiter)
: [content, '']
const isDelimiterMissing = !matches
const isContentSame = automatedContent === sourceContent
const isVersionsSame = isEqual(sourceData.versions, data.versions)
// Only proceed if the content or versions have changed
if (isContentSame && isVersionsSame && !isDelimiterMissing) {
return
}
// Create a new object so that we don't mutate the original data
const newData = { ...data }
// Only modify the versions property when a file already existss
newData.versions = sourceData.versions
const targetContent = manuallyCreatedContent + commentDelimiter + sourceContent
await writeFile(file, matter.stringify(targetContent, newData))
} else {
await createDirectory(path.dirname(file))
await writeFile(file, matter.stringify(commentDelimiter + sourceContent, sourceData))
}
}
// Recursively walks through the directory structure and updates the
// index.md files to match the disk. Before calling this function
// ensure that the Markdown files have been updated and any files
// that need to be deleted have been removed.
async function updateDirectory(
directory,
frontmatter,
{ rootDirectoryOnly = false, shortTitle = false, indexOrder = {} } = {}
) {
const initialDirectoryListing = await getDirectoryInfo(directory)
// If there are no children on disk, remove the directory
if (initialDirectoryListing.directoryContents.length === 0 && !rootDirectoryOnly) {
rimraf(directory)
return
}
// Recursively update child directories
if (!rootDirectoryOnly) {
await Promise.all(
initialDirectoryListing.childDirectories.map(async (subDirectory) => {
await updateDirectory(`${directory}/${subDirectory}`, frontmatter, { indexOrder })
})
)
}
const indexFile = `${directory}/index.md`
const { data, content } = await getIndexFileContents(indexFile, frontmatter, shortTitle)
// We need to re-get the directory contents because a recursive call
// may have removed a directory since the initial directory read.
const { directoryContents, childDirectories, directoryFiles } = await getDirectoryInfo(directory)
const { childrenOnDisk, indexChildren } = getChildrenToCompare(
indexFile,
directoryContents,
data.children
)
const itemsToAdd = difference(childrenOnDisk, indexChildren)
const itemsToRemove = difference(indexChildren, childrenOnDisk)
if (itemsToRemove.length === 0 && itemsToAdd.length === 0) {
return
}
if (!rootDirectoryOnly) {
// Update the versions in the index.md file to match the directory contents
directoryFiles.push(...childDirectories.map((dir) => path.join(dir, 'index.md')))
const newVersions = await getIndexFileVersions(directory, directoryFiles)
const isVersionEqual = isEqual(newVersions, data.versions)
if (!isVersionEqual) {
data.versions = newVersions
}
}
// Update the index.md file contents and write the file to disk
const dataUpdatedChildren = updateIndexChildren(
data,
{ itemsToAdd, itemsToRemove },
indexFile,
indexOrder,
isRootIndexFile(indexFile)
)
await writeFile(indexFile, matter.stringify(content, dataUpdatedChildren))
}
// Takes the children properties from the index.md file and the
// files/directories on disk and normalizes them to be comparable
// against each other.
// Children properties include a leading slash except when the
// index.md file is the root index.md file. We also want to
// remove the file extension from the files on disk.
function getChildrenToCompare(indexFile, directoryContents, fmChildren) {
if (!fmChildren) {
throw new Error(`No children property found in ${indexFile}`)
}
const isEarlyAccess = (item) => isRootIndexFile(indexFile) && item === 'early-access'
// Get the list of children from the directory contents
const childrenOnDisk = directoryContents
.map((file) => `${path.basename(file, '.md')}`)
.filter((item) => !isEarlyAccess(item))
const indexChildren = fmChildren
.map((child) => child.replace('/', ''))
.filter((item) => !isEarlyAccess(item))
return { childrenOnDisk, indexChildren }
}
// Adds and removes children properties to the index.md file.
// There are three possible scenarios that we want to handle:
//
// 1. If the lib/config.json file for the pipeline defines a sort
// order for the index file we're currently processing, then
// we want to use that sort order. Currently, the config files
// only defined a startsWith parameter. This property defines
// the order of the first items in the index files children
// property. All other items are sorted and appended to list.
//
// 2. If not config is defined and the index file is an
// autogenerated file, we sort all the children alphabetically.
//
// 3. If the index file is not autogenerated, we leave the ordering
// as is and append new children to the end.
function updateIndexChildren(data, childUpdates, indexFile, indexOrder, rootIndex = false) {
const { itemsToAdd, itemsToRemove } = childUpdates
const childPrefix = rootIndex ? '' : '/'
// Get a new list of children with added and removed items
const children = [...data.children]
// remove the '/' prefix used in index.md children
.map((item) => item.replace(childPrefix, ''))
.filter((item) => !itemsToRemove.includes(item))
children.push(...itemsToAdd)
const orderedIndexChildren = []
// Only used for tests. During testing, the content directory is
// in a temp directory so the paths are not relative to
// the current working directory. This gets the relative path
// from the full path to the index file.
const indexRelativePath = process.env.TEST_OS_ROOT_DIR
? indexFile.replace(`${process.env.TEST_OS_ROOT_DIR}/`, '')
: indexFile
const indexOrderConfig = indexOrder[indexRelativePath]
const isAutogenerated = data.autogenerated
if (indexOrderConfig && isAutogenerated) {
if (indexOrderConfig.startsWith) {
const sortableChildren = difference(children, indexOrderConfig.startsWith).sort()
orderedIndexChildren.push(...indexOrderConfig.startsWith, ...sortableChildren)
}
} else if (isAutogenerated) {
// always sort autogenerated index files that have no override config
orderedIndexChildren.push(...children)
orderedIndexChildren.sort()
} else {
// just leave the children in the order they are in the index file
// so they can be manually sorted
orderedIndexChildren.push(...children)
}
const updatedData = { ...data }
// add the '/' prefix back to the children
updatedData.children = orderedIndexChildren.map((item) => `${childPrefix}${item}`)
return updatedData
}
// Gets the contents of the index.md file from disk if it exits or
// creates a new index.md file with the default frontmatter.
async function getIndexFileContents(indexFile, frontmatter, shortTitle = false) {
const directory = path.dirname(indexFile)
const indexFileContent = {
data: {
title: path.basename(directory),
...frontmatter,
children: [],
},
content: '',
}
if (shortTitle) {
indexFileContent.data.shortTitle = path.basename(directory)
}
return existsSync(indexFile) ? matter(await readFile(indexFile, 'utf-8')) : indexFileContent
}
// Builds the index.md versions frontmatter by consolidating
// the versions from each Markdown file in the directory + the
// index.md files in any subdirectories of directory.
async function getIndexFileVersions(directory, files) {
const versions = new Set()
await Promise.all(
files.map(async (file) => {
const filepath = path.join(directory, file)
if (!existsSync(filepath)) {
throw new Error(
`File ${filepath} does not exist while assembling directory index.md files to create parent version.`
)
}
const { data } = matter(await readFile(filepath, 'utf-8'))
if (!data || !data.versions) {
throw new Error(`Frontmatter in ${filepath} does not contain versions.`)
}
const fmVersions = getApplicableVersions(data.versions)
fmVersions.forEach((version) => versions.add(version))
})
)
const versionArray = [...versions]
return await convertVersionsToFrontmatter(versionArray)
}
/* Takes a list of versions in the format:
[
'free-pro-team@latest',
'enterprise-cloud@latest',
'enterprise-server@3.3',
'enterprise-server@3.4',
'enterprise-server@3.5',
'enterprise-server@3.6',
'enterprise-server@3.7',
'github-ae@latest'
]
and returns the frontmatter equivalent JSON:
{
fpt: '*',
ghae: '*',
ghec: '*',
ghes: '*'
}
*/
export async function convertVersionsToFrontmatter(versions) {
const frontmatterVersions = {}
const numberedReleases = {}
// Currently, only GHES is numbered. Number releases have to be
// handled differently because they use semantic versioning.
versions.forEach((version) => {
const docsVersion = allVersions[version]
if (!docsVersion.hasNumberedReleases) {
frontmatterVersions[docsVersion.shortName] = '*'
} else {
// Each version that has numbered releases in allVersions
// has a string for the number (currentRelease) and an array
// of all of the available releases (e.g. ['3.3', '3.4', '3.5'])
// This creates an array of the applicable releases in the same
// order as the available releases array. This is used to track when
// a release is no longer supported.
const i = docsVersion.releases.sort().indexOf(docsVersion.currentRelease)
if (!numberedReleases[docsVersion.shortName]) {
const availableReleases = Array(docsVersion.releases.length).fill(undefined)
availableReleases[i] = docsVersion.currentRelease
numberedReleases[docsVersion.shortName] = {
availableReleases,
}
} else {
numberedReleases[docsVersion.shortName].availableReleases[i] = docsVersion.currentRelease
}
}
})
// Create semantic versions for numbered releases
Object.keys(numberedReleases).forEach((key) => {
const availableReleases = numberedReleases[key].availableReleases
const versionContinuity = checkVersionContinuity(availableReleases)
if (availableReleases.every(Boolean)) {
frontmatterVersions[key] = '*'
} else if (!versionContinuity) {
// If there happens to be version gaps, just enumerate each version
// using syntax like =3.x || =3.x
const semVer = availableReleases
.filter(Boolean)
.map((release) => `=${release}`)
.join(' || ')
frontmatterVersions[key] = semVer
} else {
const semVer = []
if (!availableReleases[availableReleases.length - 1]) {
const endVersion = availableReleases.filter(Boolean).pop()
semVer.push(`<=${endVersion}`)
}
if (!availableReleases[0]) {
const startVersion = availableReleases.filter(Boolean).shift()
semVer.push(`>=${startVersion}`)
}
frontmatterVersions[key] = semVer.join(' ')
}
})
const sortedFrontmatterVersions = Object.keys(frontmatterVersions)
.sort()
.reduce((acc, key) => {
acc[key] = frontmatterVersions[key]
return acc
}, {})
return sortedFrontmatterVersions
}
// This is uncommon, but we potentially could have the case where an
// article was versioned for say 3.2, not for 3.3, and then again
// versioned for 3.4. This will result in a custom semantic version range
function checkVersionContinuity(versions) {
const availableVersions = [...versions]
// values at the beginning or end of the array are not gaps but normal
// starts and ends of version ranges
while (!availableVersions[0]) {
availableVersions.shift()
}
while (!availableVersions[availableVersions.length - 1]) {
availableVersions.pop()
}
return availableVersions.every(Boolean)
}
// Returns true if the indexFile is the root index.md file
function isRootIndexFile(indexFile) {
return indexFile === ROOT_INDEX_FILE
}
// Creates a new directory if it doesn't exist
async function createDirectory(targetDirectory) {
if (!existsSync(targetDirectory)) {
await mkdirp(targetDirectory)
}
}
async function getDirectoryInfo(directory) {
if (!existsSync(directory)) {
throw new Error(`Directory ${directory} did not exist when attempting to get directory info.`)
}
const directoryContents = (await readdir(directory)).filter(
(file) => file !== 'README.md' && file !== 'index.md'
)
const childDirectories = directoryContents.filter((item) =>
lstatSync(`${directory}/${item}`).isDirectory()
)
const directoryFiles = difference(directoryContents, childDirectories)
return { directoryContents, directoryFiles, childDirectories }
}