Files
overleaf-cep/services/web/app/src/Features/Uploads/ArchiveManager.js
Eric Mc Sween 5fc6d7dcb3 Merge pull request #5740 from overleaf/em-gcp-logging-web
Improve GCP logging for web

GitOrigin-RevId: b304c87a3fe46c29189f665eb3daf22c23d6eb8f
2021-11-11 09:03:09 +00:00

272 lines
7.8 KiB
JavaScript

/* eslint-disable
node/handle-callback-err,
max-len,
no-return-assign,
*/
// TODO: This file was created by bulk-decaffeinate.
// Fix any style issues and re-enable lint.
/*
* decaffeinate suggestions:
* DS101: Remove unnecessary use of Array.from
* DS102: Remove unnecessary code created because of implicit returns
* DS207: Consider shorter variations of null checks
* Full docs: https://github.com/decaffeinate/decaffeinate/blob/master/docs/suggestions.md
*/
const logger = require('@overleaf/logger')
const OError = require('@overleaf/o-error')
const metrics = require('@overleaf/metrics')
const fs = require('fs')
const Path = require('path')
const fse = require('fs-extra')
const yauzl = require('yauzl')
const Settings = require('@overleaf/settings')
const {
InvalidZipFileError,
EmptyZipFileError,
ZipContentsTooLargeError,
} = require('./ArchiveErrors')
const _ = require('underscore')
const { promisifyAll } = require('../../util/promises')
const ONE_MEG = 1024 * 1024
const ArchiveManager = {
_isZipTooLarge(source, callback) {
if (callback == null) {
callback = function () {}
}
callback = _.once(callback)
let totalSizeInBytes = null
return yauzl.open(source, { lazyEntries: true }, function (err, zipfile) {
if (err != null) {
return callback(new InvalidZipFileError().withCause(err))
}
if (
Settings.maxEntitiesPerProject != null &&
zipfile.entryCount > Settings.maxEntitiesPerProject
) {
return callback(null, true) // too many files in zip file
}
zipfile.on('error', callback)
// read all the entries
zipfile.readEntry()
zipfile.on('entry', function (entry) {
totalSizeInBytes += entry.uncompressedSize
return zipfile.readEntry()
}) // get the next entry
// no more entries to read
return zipfile.on('end', function () {
if (totalSizeInBytes == null || isNaN(totalSizeInBytes)) {
logger.warn(
{ source, totalSizeInBytes },
'error getting bytes of zip'
)
return callback(
new InvalidZipFileError({ info: { totalSizeInBytes } })
)
}
const isTooLarge = totalSizeInBytes > ONE_MEG * 300
return callback(null, isTooLarge)
})
})
},
_checkFilePath(entry, destination, callback) {
// transform backslashes to forwardslashes to accommodate badly-behaved zip archives
if (callback == null) {
callback = function () {}
}
const transformedFilename = entry.fileName.replace(/\\/g, '/')
// check if the entry is a directory
const endsWithSlash = /\/$/
if (endsWithSlash.test(transformedFilename)) {
return callback() // don't give a destfile for directory
}
// check that the file does not use a relative path
for (const dir of Array.from(transformedFilename.split('/'))) {
if (dir === '..') {
return callback(new Error('relative path'))
}
}
// check that the destination file path is normalized
const dest = `${destination}/${transformedFilename}`
if (dest !== Path.normalize(dest)) {
return callback(new Error('unnormalized path'))
} else {
return callback(null, dest)
}
},
_writeFileEntry(zipfile, entry, destFile, callback) {
if (callback == null) {
callback = function () {}
}
callback = _.once(callback)
return zipfile.openReadStream(entry, function (err, readStream) {
if (err != null) {
return callback(err)
}
readStream.on('error', callback)
readStream.on('end', callback)
const errorHandler = function (err) {
// clean up before calling callback
readStream.unpipe()
readStream.destroy()
return callback(err)
}
return fse.ensureDir(Path.dirname(destFile), function (err) {
if (err != null) {
return errorHandler(err)
}
const writeStream = fs.createWriteStream(destFile)
writeStream.on('error', errorHandler)
return readStream.pipe(writeStream)
})
})
},
_extractZipFiles(source, destination, callback) {
if (callback == null) {
callback = function () {}
}
callback = _.once(callback)
return yauzl.open(source, { lazyEntries: true }, function (err, zipfile) {
if (err != null) {
return callback(err)
}
zipfile.on('error', callback)
// read all the entries
zipfile.readEntry()
let entryFileCount = 0
zipfile.on('entry', function (entry) {
return ArchiveManager._checkFilePath(
entry,
destination,
function (err, destFile) {
if (err != null) {
logger.warn(
{ err, source, destination },
'skipping bad file path'
)
zipfile.readEntry() // bad path, just skip to the next file
return
}
if (destFile != null) {
// only write files
return ArchiveManager._writeFileEntry(
zipfile,
entry,
destFile,
function (err) {
if (err != null) {
OError.tag(err, 'error unzipping file entry', {
source,
destFile,
})
zipfile.close() // bail out, stop reading file entries
return callback(err)
} else {
entryFileCount++
return zipfile.readEntry()
}
}
) // continue to the next file
} else {
// if it's a directory, continue
return zipfile.readEntry()
}
}
)
})
// no more entries to read
return zipfile.on('end', () => {
if (entryFileCount > 0) {
callback()
} else {
callback(new EmptyZipFileError())
}
})
})
},
extractZipArchive(source, destination, _callback) {
if (_callback == null) {
_callback = function () {}
}
const callback = function (...args) {
_callback(...Array.from(args || []))
return (_callback = function () {})
}
return ArchiveManager._isZipTooLarge(source, function (err, isTooLarge) {
if (err != null) {
OError.tag(err, 'error checking size of zip file')
return callback(err)
}
if (isTooLarge) {
return callback(new ZipContentsTooLargeError())
}
const timer = new metrics.Timer('unzipDirectory')
logger.log({ source, destination }, 'unzipping file')
return ArchiveManager._extractZipFiles(
source,
destination,
function (err) {
timer.done()
if (err != null) {
OError.tag(err, 'unzip failed', {
source,
destination,
})
return callback(err)
} else {
return callback()
}
}
)
})
},
findTopLevelDirectory(directory, callback) {
if (callback == null) {
callback = function () {}
}
return fs.readdir(directory, function (error, files) {
if (error != null) {
return callback(error)
}
if (files.length === 1) {
const childPath = Path.join(directory, files[0])
return fs.stat(childPath, function (error, stat) {
if (error != null) {
return callback(error)
}
if (stat.isDirectory()) {
return callback(null, childPath)
} else {
return callback(null, directory)
}
})
} else {
return callback(null, directory)
}
})
},
}
ArchiveManager.promises = promisifyAll(ArchiveManager)
module.exports = ArchiveManager