overleaf/services/clsi/app/js/UrlFetcher.js

/* eslint-disable
    no-return-assign,
    no-unused-vars,
    n/no-deprecated-api,
*/
// TODO: This file was created by bulk-decaffeinate.
// Fix any style issues and re-enable lint.
/*
 * decaffeinate suggestions:
 * DS102: Remove unnecessary code created because of implicit returns
 * DS207: Consider shorter variations of null checks
 * Full docs: https://github.com/decaffeinate/decaffeinate/blob/master/docs/suggestions.md
 */
let UrlFetcher
const request = require('request').defaults({ jar: false })
const fs = require('fs')
const logger = require('@overleaf/logger')
const settings = require('@overleaf/settings')
const async = require('async')
const { URL } = require('url')
const { promisify } = require('util')

const oneMinute = 60 * 1000

module.exports = UrlFetcher = {
  pipeUrlToFileWithRetry(url, filePath, callback) {
    const doDownload = function (cb) {
      UrlFetcher.pipeUrlToFile(url, filePath, cb)
    }
    async.retry(3, doDownload, callback)
  },

  pipeUrlToFile(url, filePath, _callback) {
    if (_callback == null) {
      _callback = function () {}
    }
    const callbackOnce = function (error) {
      if (timeoutHandler != null) {
        clearTimeout(timeoutHandler)
      }
      _callback(error)
      return (_callback = function () {})
    }

    const u = new URL(url)
    if (
      settings.filestoreDomainOveride &&
      u.host !== settings.apis.clsiPerf.host
    ) {
      url = `${settings.filestoreDomainOveride}${u.pathname}${u.search}`
    }
    let timeoutHandler = setTimeout(
      function () {
        timeoutHandler = null
        logger.error({ url, filePath }, 'Timed out downloading file to cache')
        return callbackOnce(
          new Error(`Timed out downloading file to cache ${url}`)
        )
      },
      // FIXME: maybe need to close fileStream here
      3 * oneMinute
    )

    logger.debug({ url, filePath }, 'started downloading url to cache')
    const urlStream = request.get({ url, timeout: oneMinute })
    urlStream.pause() // stop data flowing until we are ready

    // attach handlers before setting up pipes
    urlStream.on('error', function (error) {
      logger.error({ err: error, url, filePath }, 'error downloading url')
      return callbackOnce(
        error || new Error(`Something went wrong downloading the URL ${url}`)
      )
    })

    urlStream.on('end', () =>
      logger.debug({ url, filePath }, 'finished downloading file into cache')
    )

    return urlStream.on('response', function (res) {
      if (res.statusCode >= 200 && res.statusCode < 300) {
        const atomicWrite = filePath + '~'
        const fileStream = fs.createWriteStream(atomicWrite)

        // attach handlers before setting up pipes
        fileStream.on('error', function (error) {
          logger.error(
            { err: error, url, filePath },
            'error writing file into cache'
          )
          return fs.unlink(atomicWrite, function (err) {
            if (err != null) {
              logger.err({ err, filePath }, 'error deleting file from cache')
            }
            return callbackOnce(error)
          })
        })

        fileStream.on('finish', function () {
          logger.debug({ url, filePath }, 'finished writing file into cache')
          fs.rename(atomicWrite, filePath, error => {
            if (error) {
              fs.unlink(atomicWrite, () => callbackOnce(error))
            } else {
              callbackOnce()
            }
          })
        })

        fileStream.on('pipe', () =>
          logger.debug({ url, filePath }, 'piping into filestream')
        )

        urlStream.pipe(fileStream)
        return urlStream.resume() // now we are ready to handle the data
      } else {
        logger.error(
          { statusCode: res.statusCode, url, filePath },
          'unexpected status code downloading url to cache'
        )
        // https://nodejs.org/api/http.html#http_class_http_clientrequest
        // If you add a 'response' event handler, then you must consume
        // the data from the response object, either by calling
        // response.read() whenever there is a 'readable' event, or by
        // adding a 'data' handler, or by calling the .resume()
        // method. Until the data is consumed, the 'end' event will not
        // fire. Also, until the data is read it will consume memory
        // that can eventually lead to a 'process out of memory' error.
        urlStream.resume() // discard the data
        return callbackOnce(
          new Error(
            `URL returned non-success status code: ${res.statusCode} ${url}`
          )
        )
      }
    })
  },
}

// Promise-returning counterpart of the callback API: resolves when the
// download succeeded and rejects with the error the callback would receive.
const pipeUrlToFileWithRetryPromise = promisify(
  UrlFetcher.pipeUrlToFileWithRetry
)

module.exports.promises = {
  pipeUrlToFileWithRetry: pipeUrlToFileWithRetryPromise,
}
decaffeinate: Run post-processing cleanups on CommandRunner.coffee and 25 other files 2020-02-19 11:14:28 +00:00			`/* eslint-disable`
			`no-return-assign,`
			`no-unused-vars,`
Merge pull request #7986 from overleaf/jpa-eslint-8 [misc] upgrade eslint packages to the latest version everywhere GitOrigin-RevId: f1480d4a171acef82fb26c4aa54be3a6088b0ab3 2022-05-16 14:25:49 +00:00			`n/no-deprecated-api,`
decaffeinate: Run post-processing cleanups on CommandRunner.coffee and 25 other files 2020-02-19 11:14:28 +00:00			`*/`
			`// TODO: This file was created by bulk-decaffeinate.`
			`// Fix any style issues and re-enable lint.`
decaffeinate: Convert CommandRunner.coffee and 25 other files to JS 2020-02-19 11:14:14 +00:00			`/*`
			`* decaffeinate suggestions:`
			`* DS102: Remove unnecessary code created because of implicit returns`
			`* DS207: Consider shorter variations of null checks`
			`* Full docs: https://github.com/decaffeinate/decaffeinate/blob/master/docs/suggestions.md`
			`*/`
fix eslint errors 2020-06-02 08:51:34 +00:00			`let UrlFetcher`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`const request = require('request').defaults({ jar: false })`
			`const fs = require('fs')`
Merge pull request #6926 from overleaf/jpa-clsi-bump-logger-metrics [clsi] upgrade logger and metrics module GitOrigin-RevId: 85c346b5eed683672a77d86d6a434dc313b7824b 2022-03-01 15:09:36 +00:00			`const logger = require('@overleaf/logger')`
[misc] switch from settings-sharelatex to @overleaf/settings 2021-07-12 16:47:21 +00:00			`const settings = require('@overleaf/settings')`
add pipeUrlToFileWithRetry function to retry file downloads 3 times 2020-05-14 12:09:57 +00:00			`const async = require('async')`
Merge pull request #5349 from overleaf/jpa-no-depreacted-api [misc] fix eslint violations for node/no-depreacted-api GitOrigin-RevId: 0f7d64984da9e789c4ab95381db34afb89fa1a94 2021-10-20 10:17:59 +00:00			`const { URL } = require('url')`
Merge pull request #4649 from overleaf/jpa-fs-based-caching [perf] UrlCache: pure fs based cache state for downloads GitOrigin-RevId: d19afc396324d4c3318b31620c8ad0c04e0544ce 2021-10-06 08:11:59 +00:00			`const { promisify } = require('util')`
Initial open source commit 2014-02-12 17:27:43 +00:00
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`const oneMinute = 60 * 1000`
clean up error handling in UrlFetcher 2015-05-15 13:07:15 +00:00
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`module.exports = UrlFetcher = {`
add pipeUrlToFileWithRetry function to retry file downloads 3 times 2020-05-14 12:09:57 +00:00			`pipeUrlToFileWithRetry(url, filePath, callback) {`
[misc] bump the dev-env to 3.3.2 2020-08-10 16:01:11 +00:00			`const doDownload = function (cb) {`
add pipeUrlToFileWithRetry function to retry file downloads 3 times 2020-05-14 12:09:57 +00:00			`UrlFetcher.pipeUrlToFile(url, filePath, cb)`
			`}`
			`async.retry(3, doDownload, callback)`
			`},`

prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`pipeUrlToFile(url, filePath, _callback) {`
			`if (_callback == null) {`
Merge pull request #5367 from overleaf/jpa-node-handle-callback-err [misc] fix eslint violations for node/handle-callback-err GitOrigin-RevId: 83a4900e8861010df1917bff49382bd9c93375bd 2021-10-27 09:49:18 +00:00			`_callback = function () {}`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`}`
[misc] bump the dev-env to 3.3.2 2020-08-10 16:01:11 +00:00			`const callbackOnce = function (error) {`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`if (timeoutHandler != null) {`
			`clearTimeout(timeoutHandler)`
			`}`
			`_callback(error)`
[misc] bump the dev-env to 3.3.2 2020-08-10 16:01:11 +00:00			`return (_callback = function () {})`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`}`
clean up error handling in UrlFetcher 2015-05-15 13:07:15 +00:00
Merge pull request #5349 from overleaf/jpa-no-depreacted-api [misc] fix eslint violations for node/no-depreacted-api GitOrigin-RevId: 0f7d64984da9e789c4ab95381db34afb89fa1a94 2021-10-20 10:17:59 +00:00			`const u = new URL(url)`
[UrlFetcher] do not override domain for clsi-perf requests 2021-07-02 08:17:29 +00:00			`if (`
			`settings.filestoreDomainOveride &&`
			`u.host !== settings.apis.clsiPerf.host`
			`) {`
Merge pull request #5349 from overleaf/jpa-no-depreacted-api [misc] fix eslint violations for node/no-depreacted-api GitOrigin-RevId: 0f7d64984da9e789c4ab95381db34afb89fa1a94 2021-10-20 10:17:59 +00:00			url = `${settings.filestoreDomainOveride}${u.pathname}${u.search}`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`}`
Merge pull request #5352 from overleaf/jpa-no-var [misc] fix eslint violations for `no-var` GitOrigin-RevId: c52e82f3a8a993b8662cc5aa56e7b95ca3c55832 2021-10-26 08:08:56 +00:00			`let timeoutHandler = setTimeout(`
[misc] bump the dev-env to 3.3.2 2020-08-10 16:01:11 +00:00			`function () {`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`timeoutHandler = null`
			`logger.error({ url, filePath }, 'Timed out downloading file to cache')`
			`return callbackOnce(`
			new Error(`Timed out downloading file to cache ${url}`)
			`)`
			`},`
			`// FIXME: maybe need to close fileStream here`
			`3 * oneMinute`
			`)`
clean up error handling in UrlFetcher 2015-05-15 13:07:15 +00:00
Merge pull request #7906 from overleaf/em-downgrade-logs Downgrade all INFO logs to DEBUG GitOrigin-RevId: 05ed582ef0721fcada059f0ad158565f50feca27 2022-05-16 12:38:18 +00:00			`logger.debug({ url, filePath }, 'started downloading url to cache')`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`const urlStream = request.get({ url, timeout: oneMinute })`
			`urlStream.pause() // stop data flowing until we are ready`
clean up error handling in UrlFetcher 2015-05-15 13:07:15 +00:00
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`// attach handlers before setting up pipes`
[misc] bump the dev-env to 3.3.2 2020-08-10 16:01:11 +00:00			`urlStream.on('error', function (error) {`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`logger.error({ err: error, url, filePath }, 'error downloading url')`
			`return callbackOnce(`
			error \|\| new Error(`Something went wrong downloading the URL ${url}`)
			`)`
			`})`
Initial open source commit 2014-02-12 17:27:43 +00:00
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`urlStream.on('end', () =>`
Merge pull request #7906 from overleaf/em-downgrade-logs Downgrade all INFO logs to DEBUG GitOrigin-RevId: 05ed582ef0721fcada059f0ad158565f50feca27 2022-05-16 12:38:18 +00:00			`logger.debug({ url, filePath }, 'finished downloading file into cache')`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`)`
Initial open source commit 2014-02-12 17:27:43 +00:00
[misc] bump the dev-env to 3.3.2 2020-08-10 16:01:11 +00:00			`return urlStream.on('response', function (res) {`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`if (res.statusCode >= 200 && res.statusCode < 300) {`
Merge pull request #4649 from overleaf/jpa-fs-based-caching [perf] UrlCache: pure fs based cache state for downloads GitOrigin-RevId: d19afc396324d4c3318b31620c8ad0c04e0544ce 2021-10-06 08:11:59 +00:00			`const atomicWrite = filePath + '~'`
			`const fileStream = fs.createWriteStream(atomicWrite)`
clean up error handling in UrlFetcher 2015-05-15 13:07:15 +00:00
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`// attach handlers before setting up pipes`
[misc] bump the dev-env to 3.3.2 2020-08-10 16:01:11 +00:00			`fileStream.on('error', function (error) {`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`logger.error(`
			`{ err: error, url, filePath },`
			`'error writing file into cache'`
			`)`
Merge pull request #4649 from overleaf/jpa-fs-based-caching [perf] UrlCache: pure fs based cache state for downloads GitOrigin-RevId: d19afc396324d4c3318b31620c8ad0c04e0544ce 2021-10-06 08:11:59 +00:00			`return fs.unlink(atomicWrite, function (err) {`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`if (err != null) {`
			`logger.err({ err, filePath }, 'error deleting file from cache')`
			`}`
			`return callbackOnce(error)`
			`})`
			`})`
clean up error handling in UrlFetcher 2015-05-15 13:07:15 +00:00
[misc] bump the dev-env to 3.3.2 2020-08-10 16:01:11 +00:00			`fileStream.on('finish', function () {`
Merge pull request #7906 from overleaf/em-downgrade-logs Downgrade all INFO logs to DEBUG GitOrigin-RevId: 05ed582ef0721fcada059f0ad158565f50feca27 2022-05-16 12:38:18 +00:00			`logger.debug({ url, filePath }, 'finished writing file into cache')`
Merge pull request #4649 from overleaf/jpa-fs-based-caching [perf] UrlCache: pure fs based cache state for downloads GitOrigin-RevId: d19afc396324d4c3318b31620c8ad0c04e0544ce 2021-10-06 08:11:59 +00:00			`fs.rename(atomicWrite, filePath, error => {`
			`if (error) {`
			`fs.unlink(atomicWrite, () => callbackOnce(error))`
			`} else {`
			`callbackOnce()`
			`}`
			`})`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`})`
clean up error handling in UrlFetcher 2015-05-15 13:07:15 +00:00
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`fileStream.on('pipe', () =>`
Merge pull request #7906 from overleaf/em-downgrade-logs Downgrade all INFO logs to DEBUG GitOrigin-RevId: 05ed582ef0721fcada059f0ad158565f50feca27 2022-05-16 12:38:18 +00:00			`logger.debug({ url, filePath }, 'piping into filestream')`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`)`
clean up error handling in UrlFetcher 2015-05-15 13:07:15 +00:00
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`urlStream.pipe(fileStream)`
			`return urlStream.resume() // now we are ready to handle the data`
			`} else {`
			`logger.error(`
			`{ statusCode: res.statusCode, url, filePath },`
			`'unexpected status code downloading url to cache'`
			`)`
			`// https://nodejs.org/api/http.html#http_class_http_clientrequest`
			`// If you add a 'response' event handler, then you must consume`
			`// the data from the response object, either by calling`
			`// response.read() whenever there is a 'readable' event, or by`
			`// adding a 'data' handler, or by calling the .resume()`
			`// method. Until the data is consumed, the 'end' event will not`
			`// fire. Also, until the data is read it will consume memory`
			`// that can eventually lead to a 'process out of memory' error.`
			`urlStream.resume() // discard the data`
			`return callbackOnce(`
			`new Error(`
			`URL returned non-success status code: ${res.statusCode} ${url}`
			`)`
			`)`
			`}`
			`})`
[misc] run format_fix and lint:fix 2021-07-13 11:04:48 +00:00			`},`
prettier: convert app/js decaffeinated files to Prettier format 2020-02-19 11:14:37 +00:00			`}`
Merge pull request #4649 from overleaf/jpa-fs-based-caching [perf] UrlCache: pure fs based cache state for downloads GitOrigin-RevId: d19afc396324d4c3318b31620c8ad0c04e0544ce 2021-10-06 08:11:59 +00:00
			`module.exports.promises = {`
			`pipeUrlToFileWithRetry: promisify(UrlFetcher.pipeUrlToFileWithRetry),`
			`}`