overleaf/services/web/scripts/delete-orphaned-docs/delete-orphaned-docs.js
Timothée Alby 6734d9e107 Merge pull request #2641 from overleaf/ew-delete-orphaned-docs
Process and Script to Delete Orphaned Docs

GitOrigin-RevId: 0c428e36973a9131e3d379fdf4657e802576b23d
2020-03-10 04:14:46 +00:00

139 lines
3.2 KiB
JavaScript

'use strict'
const fs = require('fs')
const minimist = require('minimist')
const readline = require('readline')
const { db, ObjectId } = require('../../app/src/infrastructure/mongojs')
const DocstoreManager = require('../../app/src/Features/Docstore/DocstoreManager')
.promises
const argv = minimist(process.argv.slice(2))
const commit = argv.commit !== undefined
const offset = parseInt(argv.offset) || 0
const limit = parseInt(argv.limit) || 0
if (!commit) {
console.log('DOING DRY RUN. TO SAVE CHANGES PASS --commit')
}
const input = fs.createReadStream(argv._[0])
const rl = readline.createInterface({
crlfDelay: Infinity,
input
})
const orphanedDocs = {}
console.log('Loading Data')
let idx = 0
let processed = 0
rl.on('line', async line => {
if (offset && idx++ < offset) {
return
}
if (limit && processed++ >= limit) {
return
}
let [docId, projectId] = line.split(',')
docId = docId.replace(/^ObjectId\(/, '').replace(/\)$/, '')
projectId = projectId.replace(/^ObjectId\(/, '').replace(/\)$/, '')
try {
docId = ObjectId(docId).toString()
projectId = ObjectId(projectId).toString()
} catch (err) {
console.error(`Invalid id: ${docId}, ${projectId}`)
return
}
if (!orphanedDocs[projectId]) {
orphanedDocs[projectId] = []
}
orphanedDocs[projectId].push(docId)
})
rl.on('close', async () => {
const docCount = Object.values(orphanedDocs).reduce((i, v) => i + v.length, 0)
const projectCount = Object.keys(orphanedDocs).length
console.log(`Loaded Data for ${docCount} docs in ${projectCount} Projects`)
for (const projectId of Object.keys(orphanedDocs)) {
await deleteOrphanedDocs(projectId, orphanedDocs[projectId])
}
console.log('DONE')
process.exit()
})
async function deleteOrphanedDocs(projectId, docIds) {
try {
if (await projectIdExists(projectId)) {
console.error(`Project id exists: ${projectId}`)
return
}
} catch (err) {
console.error(`Error checking if project exists: ${projectId}`, err.stack)
return
}
console.log(`Delete docs ${docIds.join(', ')} for project ${projectId}`)
if (!commit) {
return
}
try {
await DocstoreManager.destroyProject(projectId)
} catch (err) {
console.error(`Error deleting project ${projectId}`, err)
}
}
async function projectIdExists(projectId) {
// check both projects and deletedProjects to see if project id exists
const [project, deletedProject] = await Promise.all([
findProject(projectId),
findDeletedProject(projectId)
])
return project !== null || deletedProject !== null
}
async function findProject(projectId) {
return new Promise((resolve, reject) => {
db.projects.findOne(
{ _id: ObjectId(projectId) },
{ _id: 1 },
(err, project) => {
if (err) {
reject(err)
} else {
resolve(project)
}
}
)
})
}
async function findDeletedProject(projectId) {
return new Promise((resolve, reject) => {
db.deletedProjects.findOne(
{ 'project._id': ObjectId(projectId) },
{ _id: 1 },
(err, project) => {
if (err) {
reject(err)
} else {
resolve(project)
}
}
)
})
}