mirror of
https://github.com/overleaf/overleaf.git
synced 2025-01-09 22:43:12 +00:00
6c9d4fb522
Fix translation of tracked deletes GitOrigin-RevId: 4124db6953cbed46eea61f62118fc8e1ddfff4a0
374 lines
12 KiB
JavaScript
374 lines
12 KiB
JavaScript
// @ts-check
|
||
|
||
const { callbackifyAll } = require('@overleaf/promise-utils')
|
||
const LockManager = require('./LockManager')
|
||
const RedisManager = require('./RedisManager')
|
||
const ProjectHistoryRedisManager = require('./ProjectHistoryRedisManager')
|
||
const RealTimeRedisManager = require('./RealTimeRedisManager')
|
||
const ShareJsUpdateManager = require('./ShareJsUpdateManager')
|
||
const HistoryManager = require('./HistoryManager')
|
||
const logger = require('@overleaf/logger')
|
||
const Metrics = require('./Metrics')
|
||
const Errors = require('./Errors')
|
||
const DocumentManager = require('./DocumentManager')
|
||
const RangesManager = require('./RangesManager')
|
||
const SnapshotManager = require('./SnapshotManager')
|
||
const Profiler = require('./Profiler')
|
||
const { isInsert, isDelete, getDocLength } = require('./Utils')
|
||
|
||
/**
|
||
* @typedef {import("./types").DeleteOp} DeleteOp
|
||
* @typedef {import("./types").HistoryUpdate } HistoryUpdate
|
||
* @typedef {import("./types").InsertOp} InsertOp
|
||
* @typedef {import("./types").Op} Op
|
||
* @typedef {import("./types").Ranges} Ranges
|
||
* @typedef {import("./types").Update} Update
|
||
*/
|
||
|
||
const UpdateManager = {
|
||
async processOutstandingUpdates(projectId, docId) {
|
||
const timer = new Metrics.Timer('updateManager.processOutstandingUpdates')
|
||
try {
|
||
await UpdateManager.fetchAndApplyUpdates(projectId, docId)
|
||
timer.done({ status: 'success' })
|
||
} catch (err) {
|
||
timer.done({ status: 'error' })
|
||
throw err
|
||
}
|
||
},
|
||
|
||
async processOutstandingUpdatesWithLock(projectId, docId) {
|
||
const profile = new Profiler('processOutstandingUpdatesWithLock', {
|
||
project_id: projectId,
|
||
doc_id: docId,
|
||
})
|
||
|
||
const lockValue = await LockManager.promises.tryLock(docId)
|
||
if (lockValue == null) {
|
||
return
|
||
}
|
||
profile.log('tryLock')
|
||
|
||
try {
|
||
await UpdateManager.processOutstandingUpdates(projectId, docId)
|
||
profile.log('processOutstandingUpdates')
|
||
} finally {
|
||
await LockManager.promises.releaseLock(docId, lockValue)
|
||
profile.log('releaseLock').end()
|
||
}
|
||
|
||
await UpdateManager.continueProcessingUpdatesWithLock(projectId, docId)
|
||
},
|
||
|
||
async continueProcessingUpdatesWithLock(projectId, docId) {
|
||
const length = await RealTimeRedisManager.promises.getUpdatesLength(docId)
|
||
if (length > 0) {
|
||
await UpdateManager.processOutstandingUpdatesWithLock(projectId, docId)
|
||
}
|
||
},
|
||
|
||
async fetchAndApplyUpdates(projectId, docId) {
|
||
const profile = new Profiler('fetchAndApplyUpdates', {
|
||
project_id: projectId,
|
||
doc_id: docId,
|
||
})
|
||
|
||
const updates =
|
||
await RealTimeRedisManager.promises.getPendingUpdatesForDoc(docId)
|
||
logger.debug(
|
||
{ projectId, docId, count: updates.length },
|
||
'processing updates'
|
||
)
|
||
if (updates.length === 0) {
|
||
return
|
||
}
|
||
profile.log('getPendingUpdatesForDoc')
|
||
|
||
for (const update of updates) {
|
||
await UpdateManager.applyUpdate(projectId, docId, update)
|
||
profile.log('applyUpdate')
|
||
}
|
||
profile.log('async done').end()
|
||
},
|
||
|
||
/**
|
||
* Apply an update to the given document
|
||
*
|
||
* @param {string} projectId
|
||
* @param {string} docId
|
||
* @param {Update} update
|
||
*/
|
||
async applyUpdate(projectId, docId, update) {
|
||
const profile = new Profiler('applyUpdate', {
|
||
project_id: projectId,
|
||
doc_id: docId,
|
||
})
|
||
|
||
UpdateManager._sanitizeUpdate(update)
|
||
profile.log('sanitizeUpdate', { sync: true })
|
||
|
||
try {
|
||
let {
|
||
lines,
|
||
version,
|
||
ranges,
|
||
pathname,
|
||
projectHistoryId,
|
||
historyRangesSupport,
|
||
} = await DocumentManager.promises.getDoc(projectId, docId)
|
||
profile.log('getDoc')
|
||
|
||
if (lines == null || version == null) {
|
||
throw new Errors.NotFoundError(`document not found: ${docId}`)
|
||
}
|
||
|
||
const previousVersion = version
|
||
const incomingUpdateVersion = update.v
|
||
let updatedDocLines, appliedOps
|
||
;({ updatedDocLines, version, appliedOps } =
|
||
await ShareJsUpdateManager.promises.applyUpdate(
|
||
projectId,
|
||
docId,
|
||
update,
|
||
lines,
|
||
version
|
||
))
|
||
profile.log('sharejs.applyUpdate', {
|
||
// only synchronous when the update applies directly to the
|
||
// doc version, otherwise getPreviousDocOps is called.
|
||
sync: incomingUpdateVersion === previousVersion,
|
||
})
|
||
|
||
const { newRanges, rangesWereCollapsed, historyUpdates } =
|
||
RangesManager.applyUpdate(
|
||
projectId,
|
||
docId,
|
||
ranges,
|
||
appliedOps,
|
||
updatedDocLines,
|
||
{ historyRangesSupport }
|
||
)
|
||
profile.log('RangesManager.applyUpdate', { sync: true })
|
||
|
||
await RedisManager.promises.updateDocument(
|
||
projectId,
|
||
docId,
|
||
updatedDocLines,
|
||
version,
|
||
appliedOps,
|
||
newRanges,
|
||
update.meta
|
||
)
|
||
profile.log('RedisManager.updateDocument')
|
||
|
||
UpdateManager._adjustHistoryUpdatesMetadata(
|
||
historyUpdates,
|
||
pathname,
|
||
projectHistoryId,
|
||
lines,
|
||
ranges,
|
||
historyRangesSupport
|
||
)
|
||
|
||
if (historyUpdates.length > 0) {
|
||
Metrics.inc('history-queue', 1, { status: 'project-history' })
|
||
try {
|
||
const projectOpsLength =
|
||
await ProjectHistoryRedisManager.promises.queueOps(
|
||
projectId,
|
||
...historyUpdates.map(op => JSON.stringify(op))
|
||
)
|
||
HistoryManager.recordAndFlushHistoryOps(
|
||
projectId,
|
||
historyUpdates,
|
||
projectOpsLength
|
||
)
|
||
profile.log('recordAndFlushHistoryOps')
|
||
} catch (err) {
|
||
// The full project history can re-sync a project in case
|
||
// updates went missing.
|
||
// Just record the error here and acknowledge the write-op.
|
||
Metrics.inc('history-queue-error')
|
||
}
|
||
}
|
||
|
||
if (rangesWereCollapsed) {
|
||
Metrics.inc('doc-snapshot')
|
||
logger.debug(
|
||
{
|
||
projectId,
|
||
docId,
|
||
previousVersion,
|
||
lines,
|
||
ranges,
|
||
update,
|
||
},
|
||
'update collapsed some ranges, snapshotting previous content'
|
||
)
|
||
|
||
// Do this last, since it's a mongo call, and so potentially longest running
|
||
// If it overruns the lock, it's ok, since all of our redis work is done
|
||
await SnapshotManager.promises.recordSnapshot(
|
||
projectId,
|
||
docId,
|
||
previousVersion,
|
||
pathname,
|
||
lines,
|
||
ranges
|
||
)
|
||
}
|
||
} catch (error) {
|
||
RealTimeRedisManager.sendData({
|
||
project_id: projectId,
|
||
doc_id: docId,
|
||
error: error instanceof Error ? error.message : error,
|
||
})
|
||
profile.log('sendData')
|
||
throw error
|
||
} finally {
|
||
profile.end()
|
||
}
|
||
},
|
||
|
||
async lockUpdatesAndDo(method, projectId, docId, ...args) {
|
||
const profile = new Profiler('lockUpdatesAndDo', {
|
||
project_id: projectId,
|
||
doc_id: docId,
|
||
})
|
||
|
||
const lockValue = await LockManager.promises.getLock(docId)
|
||
profile.log('getLock')
|
||
|
||
let result
|
||
try {
|
||
await UpdateManager.processOutstandingUpdates(projectId, docId)
|
||
profile.log('processOutstandingUpdates')
|
||
|
||
result = await method(projectId, docId, ...args)
|
||
profile.log('method')
|
||
} finally {
|
||
await LockManager.promises.releaseLock(docId, lockValue)
|
||
profile.log('releaseLock').end()
|
||
}
|
||
|
||
// We held the lock for a while so updates might have queued up
|
||
UpdateManager.continueProcessingUpdatesWithLock(projectId, docId).catch(
|
||
err => {
|
||
// The processing may fail for invalid user updates.
|
||
// This can be very noisy, put them on level DEBUG
|
||
// and record a metric.
|
||
Metrics.inc('background-processing-updates-error')
|
||
logger.debug(
|
||
{ err, projectId, docId },
|
||
'error processing updates in background'
|
||
)
|
||
}
|
||
)
|
||
|
||
return result
|
||
},
|
||
|
||
_sanitizeUpdate(update) {
|
||
// In Javascript, characters are 16-bits wide. It does not understand surrogates as characters.
|
||
//
|
||
// From Wikipedia (http://en.wikipedia.org/wiki/Plane_(Unicode)#Basic_Multilingual_Plane):
|
||
// "The High Surrogates (U+D800–U+DBFF) and Low Surrogate (U+DC00–U+DFFF) codes are reserved
|
||
// for encoding non-BMP characters in UTF-16 by using a pair of 16-bit codes: one High Surrogate
|
||
// and one Low Surrogate. A single surrogate code point will never be assigned a character.""
|
||
//
|
||
// The main offender seems to be \uD835 as a stand alone character, which would be the first
|
||
// 16-bit character of a blackboard bold character (http://www.fileformat.info/info/unicode/char/1d400/index.htm).
|
||
// Something must be going on client side that is screwing up the encoding and splitting the
|
||
// two 16-bit characters so that \uD835 is standalone.
|
||
for (const op of update.op || []) {
|
||
if (op.i != null) {
|
||
// Replace high and low surrogate characters with 'replacement character' (\uFFFD)
|
||
op.i = op.i.replace(/[\uD800-\uDFFF]/g, '\uFFFD')
|
||
}
|
||
}
|
||
return update
|
||
},
|
||
|
||
/**
|
||
* Add metadata that will be useful to project history
|
||
*
|
||
* @param {HistoryUpdate[]} updates
|
||
* @param {string} pathname
|
||
* @param {string} projectHistoryId
|
||
* @param {string[]} lines
|
||
* @param {Ranges} ranges
|
||
* @param {boolean} historyRangesSupport
|
||
*/
|
||
_adjustHistoryUpdatesMetadata(
|
||
updates,
|
||
pathname,
|
||
projectHistoryId,
|
||
lines,
|
||
ranges,
|
||
historyRangesSupport
|
||
) {
|
||
let docLength = getDocLength(lines)
|
||
let historyDocLength = docLength
|
||
for (const change of ranges.changes ?? []) {
|
||
if ('d' in change.op) {
|
||
historyDocLength += change.op.d.length
|
||
}
|
||
}
|
||
|
||
for (const update of updates) {
|
||
update.projectHistoryId = projectHistoryId
|
||
if (!update.meta) {
|
||
update.meta = {}
|
||
}
|
||
update.meta.pathname = pathname
|
||
update.meta.doc_length = docLength
|
||
if (historyRangesSupport && historyDocLength !== docLength) {
|
||
update.meta.history_doc_length = historyDocLength
|
||
}
|
||
|
||
// Each update may contain multiple ops, i.e.
|
||
// [{
|
||
// ops: [{i: "foo", p: 4}, {d: "bar", p:8}]
|
||
// }, {
|
||
// ops: [{d: "baz", p: 40}, {i: "qux", p:8}]
|
||
// }]
|
||
// We want to include the doc_length at the start of each update,
|
||
// before it's ops are applied. However, we need to track any
|
||
// changes to it for the next update.
|
||
for (const op of update.op) {
|
||
if (isInsert(op)) {
|
||
docLength += op.i.length
|
||
if (!op.trackedDeleteRejection) {
|
||
// Tracked delete rejections end up retaining characters rather
|
||
// than inserting
|
||
historyDocLength += op.i.length
|
||
}
|
||
}
|
||
if (isDelete(op)) {
|
||
docLength -= op.d.length
|
||
if (update.meta.tc) {
|
||
// This is a tracked delete. It will be translated into a retain in
|
||
// history, except any enclosed tracked inserts, which will be
|
||
// translated into regular deletes.
|
||
for (const change of op.trackedChanges ?? []) {
|
||
if (change.type === 'insert') {
|
||
historyDocLength -= change.length
|
||
}
|
||
}
|
||
} else {
|
||
// This is a regular delete. It will be translated to a delete in
|
||
// history.
|
||
historyDocLength -= op.d.length
|
||
}
|
||
}
|
||
}
|
||
|
||
if (!historyRangesSupport) {
|
||
// Prevent project-history from processing tracked changes
|
||
delete update.meta.tc
|
||
}
|
||
}
|
||
},
|
||
}
|
||
|
||
module.exports = { ...callbackifyAll(UpdateManager), promises: UpdateManager }
|