overleaf/services/web/scripts/learn/checkSanitize/index.mjs

import checkSanitizeOptions from './checkSanitizeOptions.mjs'
import Scrape from './scrape.mjs'
import { fileURLToPath } from 'node:url'

// Pull the two scraping helpers off the default export of ./scrape.mjs.
const getAllPagesAndCache = Scrape.getAllPagesAndCache
const scrapeAndCachePage = Scrape.scrapeAndCachePage

/**
 * Run the sanitize check over every page returned by `getAllPagesAndCache`.
 *
 * The base URL is taken from the last command-line argument. Each page is
 * loaded with `scrapeAndCachePage` and its title and text are handed to
 * `checkSanitizeOptions`. Pages are processed one at a time, in order.
 *
 * @returns {Promise<void>}
 * @throws {Error} A usage error when the last argument does not start with
 *   'http'. Any error raised while scraping or checking a page is logged
 *   together with the page and then re-thrown, which stops the run.
 */
async function main() {
  // Read the last argument without popping it: process.argv is process-wide
  // state and must not be mutated as a side effect of parsing it.
  const BASE_URL = process.argv[process.argv.length - 1]
  if (!BASE_URL.startsWith('http')) {
    throw new Error(
      'Usage: node scripts/learn/checkSanitize/index.mjs https://LEARN_WIKI'
    )
  }

  const pages = await getAllPagesAndCache(BASE_URL)

  for (const page of pages) {
    try {
      const parsed = await scrapeAndCachePage(BASE_URL, page)

      const title = parsed.title
      // The page body lives under the '*' key of `parsed.text`; a page
      // without a `text` entry is checked as an empty string.
      const text = parsed.text ? parsed.text['*'] : ''

      checkSanitizeOptions(page, title, text)
    } catch (e) {
      // Log which page failed before propagating, so the failure is traceable.
      console.error('---')
      console.error(page, e)
      throw e
    }
  }
}

// Only run when this module is the script passed to node (not when imported).
if (process.argv[1] === fileURLToPath(import.meta.url)) {
  // Exit explicitly in both outcomes: 0 on success, 1 after logging a failure.
  let exitCode = 0
  try {
    await main()
  } catch (error) {
    console.error(error)
    exitCode = 1
  }
  process.exit(exitCode)
}
Merge pull request #21282 from overleaf/ls-scripts-to-esm-5 Migrate rest of the scripts to esm GitOrigin-RevId: 421f3ccd15342d34113be8d22e343d08533177ea 2024-10-24 07:14:00 -04:00			`import checkSanitizeOptions from './checkSanitizeOptions.mjs'`
			`import Scrape from './scrape.mjs'`
[web] Add `prefer-node-protocol` ESLint rule (#21523) * Add `unicorn/prefer-node-protocol` * Revert non-web changes * Run `npm run lint:fix` (prefer-node-protocol) GitOrigin-RevId: c3cdd88ff9e6b3de6a4397d45935c4d026c1c1ed 2024-11-04 04:09:11 -05:00			`import { fileURLToPath } from 'node:url'`
Merge pull request #21282 from overleaf/ls-scripts-to-esm-5 Migrate rest of the scripts to esm GitOrigin-RevId: 421f3ccd15342d34113be8d22e343d08533177ea 2024-10-24 07:14:00 -04:00
			`const { getAllPagesAndCache, scrapeAndCachePage } = Scrape`
Merge pull request #3998 from overleaf/jpa-learn-sanitize [learn] sanitize the wiki content GitOrigin-RevId: c114bbd94479e926c0621953fe9c03f6d380a19d 2021-05-07 09:16:12 -04:00
			`async function main() {`
			`const BASE_URL = process.argv.pop()`
			`if (!BASE_URL.startsWith('http')) {`
			`throw new Error(`
Merge pull request #21282 from overleaf/ls-scripts-to-esm-5 Migrate rest of the scripts to esm GitOrigin-RevId: 421f3ccd15342d34113be8d22e343d08533177ea 2024-10-24 07:14:00 -04:00			`'Usage: node scripts/learn/checkSanitize/index.mjs https://LEARN_WIKI'`
Merge pull request #3998 from overleaf/jpa-learn-sanitize [learn] sanitize the wiki content GitOrigin-RevId: c114bbd94479e926c0621953fe9c03f6d380a19d 2021-05-07 09:16:12 -04:00			`)`
			`}`

			`const pages = await getAllPagesAndCache(BASE_URL)`

			`for (const page of pages) {`
			`try {`
			`const parsed = await scrapeAndCachePage(BASE_URL, page)`

			`const title = parsed.title`
			`const text = parsed.text ? parsed.text['*'] : ''`

			`checkSanitizeOptions(page, title, text)`
			`} catch (e) {`
			`console.error('---')`
			`console.error(page, e)`
			`throw e`
			`}`
			`}`
			`}`

Merge pull request #21282 from overleaf/ls-scripts-to-esm-5 Migrate rest of the scripts to esm GitOrigin-RevId: 421f3ccd15342d34113be8d22e343d08533177ea 2024-10-24 07:14:00 -04:00			`if (fileURLToPath(import.meta.url) === process.argv[1]) {`
			`try {`
			`await main()`
			`process.exit(0)`
			`} catch (error) {`
			`console.error(error)`
Merge pull request #3998 from overleaf/jpa-learn-sanitize [learn] sanitize the wiki content GitOrigin-RevId: c114bbd94479e926c0621953fe9c03f6d380a19d 2021-05-07 09:16:12 -04:00			`process.exit(1)`
Merge pull request #21282 from overleaf/ls-scripts-to-esm-5 Migrate rest of the scripts to esm GitOrigin-RevId: 421f3ccd15342d34113be8d22e343d08533177ea 2024-10-24 07:14:00 -04:00			`}`
Merge pull request #3998 from overleaf/jpa-learn-sanitize [learn] sanitize the wiki content GitOrigin-RevId: c114bbd94479e926c0621953fe9c03f6d380a19d 2021-05-07 09:16:12 -04:00			`}`