mirror of
https://github.com/yu-i-i/overleaf-cep.git
synced 2026-05-24 01:29:35 +02:00
* fix: correct typedef for Document in helpers.mjs * add move-migrations codemod * update migration paths to use shared migrations directory * move migrations to shared location * fix: update Dockerfile and docker-compose.ci.yml to include migrations directory * feat: add migrations tool to workspaces in package.json * [monorepo] Fix order of docker ignore rules * [web] remove unused docker ignore file * [monorepo] replace old references to migrations folder * [server-ce] copy migrations from new place * [migrations] Inline web scripts Co-authored-by: Brian Gough <brian.gough@overleaf.com> * [migrations] move three web scripts over Co-authored-by: Brian Gough <brian.gough@overleaf.com> * [migrations] add missing collection Co-authored-by: Brian Gough <brian.gough@overleaf.com> * [migrations] remove lodash dependency Co-authored-by: Brian Gough <brian.gough@overleaf.com> * [migrations] avoid mongodb-legacy dependency Co-authored-by: Brian Gough <brian.gough@overleaf.com> * [monorepo] run migrations from tools/migrations Co-authored-by: Brian Gough <brian.gough@overleaf.com> * [migrations] simplify migration for adding gitBridge feature to users * [monorepo] run migrations from tests in all the services * [migrations] add Jenkins pipeline for linting/formatting * [monorepo] fixup running web migrations everywhere * [monorepo] trigger Jenkins builds on changes to mongo migrations * [migrations] add Jenkins pipeline for linting/formatting * [monorepo] build scripts: update devDependencies before deps scanning * [monorepo] build scripts: formerly depend on tools/migrations * [monorepo] run eslint on .mjs files * [migrations] enable more eslint rules and fix all the errors * [rake] fix migrations:list task --------- Co-authored-by: Jakob Ackermann <jakob.ackermann@overleaf.com> GitOrigin-RevId: 14cf69cc1b9405bbc75adbb9a000e555500e0614
116 lines
3.2 KiB
JavaScript
116 lines
3.2 KiB
JavaScript
import mongodb from 'mongodb'
|
|
import { db, READ_PREFERENCE_SECONDARY } from '../lib/mongodb.mjs'
|
|
|
|
const { ObjectId } = mongodb
|
|
|
|
const NOW_IN_S = Date.now() / 1000
|
|
const ONE_WEEK_IN_S = 60 * 60 * 24 * 7
|
|
|
|
const DUMMY_NAME = 'unknown.tex'
|
|
const DUMMY_TIME = new Date('2021-04-12T00:00:00.000Z')
|
|
|
|
let deletedProjectsCache = null
|
|
|
|
function getSecondsFromObjectId(id) {
|
|
return id.getTimestamp().getTime() / 1000
|
|
}
|
|
|
|
async function main(firstProjectId) {
|
|
const options = {
|
|
firstProjectId,
|
|
incrementByS: parseInt(process.env.INCREMENT_BY_S, 10) || ONE_WEEK_IN_S,
|
|
batchSize: parseInt(process.env.BATCH_SIZE, 10) || 1000,
|
|
stopAtS: parseInt(process.env.STOP_AT_S, 10) || NOW_IN_S,
|
|
}
|
|
|
|
deletedProjectsCache = new Map()
|
|
|
|
let startId = options.firstProjectId
|
|
|
|
let nProcessed = 0
|
|
while (getSecondsFromObjectId(startId) <= options.stopAtS) {
|
|
const end = getSecondsFromObjectId(startId) + options.incrementByS
|
|
let endId = ObjectId.createFromTime(end)
|
|
const query = {
|
|
project_id: {
|
|
// include edge
|
|
$gte: startId,
|
|
// exclude edge
|
|
$lt: endId,
|
|
},
|
|
deleted: true,
|
|
name: {
|
|
$exists: false,
|
|
},
|
|
}
|
|
const docs = await db.docs
|
|
.find(query, { readPreference: READ_PREFERENCE_SECONDARY })
|
|
.project({ _id: 1, project_id: 1 })
|
|
.limit(options.batchSize)
|
|
.toArray()
|
|
|
|
if (docs.length) {
|
|
const docIds = docs.map(doc => doc._id)
|
|
console.log('Back filling dummy meta data for', JSON.stringify(docIds))
|
|
await processBatch(docs, options)
|
|
nProcessed += docIds.length
|
|
|
|
if (docs.length === options.batchSize) {
|
|
endId = docs[docs.length - 1].project_id
|
|
}
|
|
}
|
|
console.error('Processed %d until %s', nProcessed, endId)
|
|
|
|
startId = endId
|
|
}
|
|
}
|
|
|
|
async function getDeletedProject(projectId) {
|
|
const cacheKey = projectId.toString()
|
|
if (deletedProjectsCache.has(cacheKey)) {
|
|
return deletedProjectsCache.get(cacheKey)
|
|
}
|
|
const deletedProject = await db.deletedProjects.findOne(
|
|
{ 'deleterData.deletedProjectId': projectId },
|
|
{
|
|
projection: {
|
|
_id: 1,
|
|
'project.deletedDocs': 1,
|
|
},
|
|
}
|
|
)
|
|
deletedProjectsCache.set(cacheKey, deletedProject)
|
|
return deletedProject
|
|
}
|
|
|
|
async function processBatch(docs, options) {
|
|
for (const doc of docs) {
|
|
const { _id: docId, project_id: projectId } = doc
|
|
const deletedProject = await getDeletedProject(projectId)
|
|
let name = DUMMY_NAME
|
|
let deletedAt = DUMMY_TIME
|
|
if (deletedProject) {
|
|
const project = deletedProject.project
|
|
if (project) {
|
|
const deletedDoc =
|
|
project.deletedDocs &&
|
|
project.deletedDocs.find(deletedDoc => docId.equals(deletedDoc._id))
|
|
if (deletedDoc) {
|
|
console.log('Found deletedDoc for %s', docId)
|
|
name = deletedDoc.name
|
|
deletedAt = deletedDoc.deletedAt
|
|
} else {
|
|
console.log('Missing deletedDoc for %s', docId)
|
|
}
|
|
} else {
|
|
console.log('Orphaned deleted doc %s (failed hard deletion)', docId)
|
|
}
|
|
} else {
|
|
console.log('Orphaned deleted doc %s (no deletedProjects entry)', docId)
|
|
}
|
|
await db.docs.updateOne({ _id: docId }, { $set: { name, deletedAt } })
|
|
}
|
|
}
|
|
|
|
export default main
|