etherpad-lite/src/node/utils/Minify.js

342 lines
12 KiB
JavaScript
Raw Normal View History

'use strict';
/**
* This Module manages all /minified/* requests. It controls the
* minification && compression of Javascript and CSS.
*/
2011-05-30 15:53:11 +01:00
/*
* 2011 Peter 'Pita' Martischka (Primary Technology Ltd)
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS-IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
const assert = require('assert').strict;
2020-11-23 13:24:19 -05:00
const settings = require('./Settings');
2021-02-11 18:19:31 -05:00
const fs = require('fs').promises;
2020-11-23 13:24:19 -05:00
const path = require('path');
const plugins = require('../../static/js/pluginfw/plugin_defs');
2020-11-23 13:24:19 -05:00
const RequireKernel = require('etherpad-require-kernel');
const mime = require('mime-types');
const Threads = require('threads');
const log4js = require('log4js');
const logger = log4js.getLogger('Minify');
const ROOT_DIR = path.join(settings.root, 'src/static/');
2020-11-23 13:24:19 -05:00
const threadsPool = new Threads.Pool(() => Threads.spawn(new Threads.Worker('./MinifyWorker')), 2);
2020-11-23 13:24:19 -05:00
const LIBRARY_WHITELIST = [
'async',
'js-cookie',
'security',
'tinycon',
'underscore',
'unorm',
];
2012-05-11 18:01:10 -07:00
// What follows is a terrible hack to avoid loop-back within the server.
// TODO: Serve files from another service, or directly from the file system.
const requestURI = async (url, method, headers) => await new Promise((resolve, reject) => {
const parsedUrl = new URL(url);
let status = 500;
const content = [];
const mockRequest = {
url,
method,
params: {filename: (parsedUrl.pathname + parsedUrl.search).replace(/^\/static\//, '')},
headers,
};
const mockResponse = {
writeHead: (_status, _headers) => {
status = _status;
for (const header in _headers) {
if (Object.prototype.hasOwnProperty.call(_headers, header)) {
headers[header] = _headers[header];
}
}
},
setHeader: (header, value) => {
headers[header.toLowerCase()] = value.toString();
},
header: (header, value) => {
headers[header.toLowerCase()] = value.toString();
},
write: (_content) => {
_content && content.push(_content);
},
end: (_content) => {
_content && content.push(_content);
resolve([status, headers, content.join('')]);
},
};
minify(mockRequest, mockResponse).catch(reject);
});
const requestURIs = (locations, method, headers, callback) => {
Promise.all(locations.map((loc) => requestURI(loc, method, headers))).then((responses) => {
2020-11-23 13:24:19 -05:00
const statuss = responses.map((x) => x[0]);
const headerss = responses.map((x) => x[1]);
const contentss = responses.map((x) => x[2]);
callback(statuss, headerss, contentss);
});
};
const sanitizePathname = (p) => {
// Replace all backslashes with forward slashes to support Windows. This MUST be done BEFORE path
// normalization, otherwise an attacker will be able to read arbitrary files anywhere on the
// filesystem. See https://nvd.nist.gov/vuln/detail/CVE-2015-3297. Node.js treats both the
// backlash and the forward slash characters as pathname component separators on Windows so this
// does not change the meaning of the pathname.
p = p.replace(/\\/g, '/');
// The Node.js documentation says that path.join() normalizes, and the documentation for
// path.normalize() says that it resolves '..' and '.' components. The word "resolve" implies that
// it examines the filesystem to resolve symbolic links, so 'a/../b' might not be the same thing
// as 'b'. Most path normalization functions from other libraries (e.g. Python's
// os.path.normpath()) clearly state that they do not examine the filesystem -- they are simple
// string manipulations. Node.js's path.normalize() probably also does a simple string
// manipulation, but if not it must be given a real pathname. Join with ROOT_DIR here just in
// case. ROOT_DIR will be removed later.
p = path.join(ROOT_DIR, p);
// Prevent attempts to read outside of ROOT_DIR via extra '..' components. ROOT_DIR is assumed to
// be normalized.
assert(ROOT_DIR.endsWith(path.sep));
if (!p.startsWith(ROOT_DIR)) throw new Error(`attempt to read outside ROOT_DIR (${ROOT_DIR})`);
// Convert back to a relative pathname.
p = p.slice(ROOT_DIR.length);
// On Windows, path.normalize replaces forward slashes with backslashes. Convert back to forward
// slashes. THIS IS DANGEROUS UNLESS BACKSLASHES ARE REPLACED WITH FORWARD SLASHES BEFORE PATH
// NORMALIZATION, otherwise on POSIXish systems '..\\' in the input pathname would not be
// normalized away before being converted to '../'.
p = p.replace(/\\/g, '/');
return p;
};
const compatPaths = {
'js/browser.js': 'js/vendors/browser.js',
'js/farbtastic.js': 'js/vendors/farbtastic.js',
'js/gritter.js': 'js/vendors/gritter.js',
'js/html10n.js': 'js/vendors/html10n.js',
'js/jquery.js': 'js/vendors/jquery.js',
'js/nice-select.js': 'js/vendors/nice-select.js',
};
/**
* creates the minifed javascript for the given minified name
2011-05-30 15:53:11 +01:00
* @param req the Express request
* @param res the Express response
*/
2021-02-11 17:15:31 -05:00
const minify = async (req, res) => {
2020-11-23 13:24:19 -05:00
let filename = req.params.filename;
try {
filename = sanitizePathname(filename);
} catch (err) {
logger.error(`sanitization of pathname "${filename}" failed: ${err.stack || err}`);
res.writeHead(404, {});
res.end();
return;
}
2012-01-05 11:31:39 +01:00
// Backward compatibility for plugins that require() files from old paths.
const newLocation = compatPaths[filename.replace(/^plugins\/ep_etherpad-lite\/static\//, '')];
if (newLocation != null) {
logger.warn(`request for deprecated path "${filename}", replacing with "${newLocation}"`);
filename = newLocation;
}
2012-05-11 18:01:10 -07:00
/* Handle static files for plugins/libraries:
paths like "plugins/ep_myplugin/static/js/test.js"
are rewritten into ROOT_PATH_OF_MYPLUGIN/static/js/test.js,
commonly ETHERPAD_ROOT/node_modules/ep_myplugin/static/js/test.js
*/
const match = filename.match(/^plugins\/([^/]+)(\/(?:(static\/.*)|.*))?$/);
if (match) {
2020-11-23 13:24:19 -05:00
const library = match[1];
const libraryPath = match[2] || '';
2012-05-11 18:01:10 -07:00
if (plugins.plugins[library] && match[3]) {
2020-11-23 13:24:19 -05:00
const plugin = plugins.plugins[library];
const pluginPath = plugin.package.realPath;
filename = path.relative(ROOT_DIR, path.join(pluginPath, libraryPath));
// On Windows, path.relative converts forward slashes to backslashes. Convert them back
// because some of the code below assumes forward slashes. Node.js treats both the backlash
// and the forward slash characters as pathname component separators on Windows so this does
// not change the meaning of the pathname. This conversion does not introduce a directory
// traversal vulnerability because all '..\\' substrings have already been removed by
// sanitizePathname.
filename = filename.replace(/\\/g, '/');
} else if (LIBRARY_WHITELIST.indexOf(library) !== -1) {
2012-05-11 18:01:10 -07:00
// Go straight into node_modules
// Avoid `require.resolve()`, since 'mustache' and 'mustache/index.js'
// would end up resolving to logically distinct resources.
filename = path.join('../node_modules/', library, libraryPath);
}
}
2020-11-23 13:24:19 -05:00
const contentType = mime.lookup(filename);
2012-02-26 22:01:52 +01:00
const [date, exists] = await statFile(filename, 3);
2021-02-11 17:15:31 -05:00
if (date) {
date.setMilliseconds(0);
res.setHeader('last-modified', date.toUTCString());
res.setHeader('date', (new Date()).toUTCString());
if (settings.maxAge !== undefined) {
const expiresDate = new Date(Date.now() + settings.maxAge * 1000);
res.setHeader('expires', expiresDate.toUTCString());
res.setHeader('cache-control', `max-age=${settings.maxAge}`);
}
2021-02-11 17:15:31 -05:00
}
2021-02-11 17:15:31 -05:00
if (!exists) {
res.writeHead(404, {});
res.end();
} else if (new Date(req.headers['if-modified-since']) >= date) {
res.writeHead(304, {});
res.end();
} else if (req.method === 'HEAD') {
res.header('Content-Type', contentType);
res.writeHead(200, {});
res.end();
} else if (req.method === 'GET') {
const content = await getFileCompressed(filename, contentType);
2021-02-11 17:15:31 -05:00
res.header('Content-Type', contentType);
res.writeHead(200, {});
res.write(content);
res.end();
} else {
res.writeHead(405, {allow: 'HEAD, GET'});
res.end();
}
};
// Check for the existance of the file and get the last modification date.
2021-02-11 16:54:25 -05:00
const statFile = async (filename, dirStatLimit) => {
/*
* The only external call to this function provides an explicit value for
* dirStatLimit: this check could be removed.
*/
2012-09-11 22:25:44 -07:00
if (typeof dirStatLimit === 'undefined') {
dirStatLimit = 3;
}
if (dirStatLimit < 1 || filename === '' || filename === '/') {
2021-02-11 16:54:25 -05:00
return [null, false];
} else if (filename === 'js/ace.js') {
// Sometimes static assets are inlined into this file, so we have to stat
// everything.
2021-02-11 16:54:25 -05:00
return [await lastModifiedDateOfEverything(), true];
} else if (filename === 'js/require-kernel.js') {
return [_requireLastModified, true];
} else {
2021-02-11 16:54:25 -05:00
let stats;
try {
stats = await fs.stat(path.join(ROOT_DIR, filename));
2021-02-11 16:54:25 -05:00
} catch (err) {
if (err.code === 'ENOENT') {
// Stat the directory instead.
const [date] = await statFile(path.dirname(filename), dirStatLimit - 1);
return [date, false];
2012-01-22 18:29:00 -08:00
}
2021-02-11 16:54:25 -05:00
throw err;
}
return [stats.mtime, stats.isFile()];
}
};
const lastModifiedDateOfEverything = async () => {
const folders2check = [path.join(ROOT_DIR, 'js/'), path.join(ROOT_DIR, 'css/')];
let latestModification = null;
2021-02-03 00:30:07 +01:00
// go through this two folders
await Promise.all(folders2check.map(async (dir) => {
2020-11-23 13:24:19 -05:00
// read the files in the folder
const files = await fs.readdir(dir);
2020-11-23 13:24:19 -05:00
// we wanna check the directory itself for changes too
files.push('.');
2020-11-23 13:24:19 -05:00
// go through all files in this folder
await Promise.all(files.map(async (filename) => {
// get the stat data of this file
const stats = await fs.stat(path.join(dir, filename));
2020-11-23 13:24:19 -05:00
// compare the modification time to the highest found
if (latestModification == null || stats.mtime > latestModification) {
latestModification = stats.mtime;
}
}));
}));
return latestModification;
};
2012-01-22 18:29:00 -08:00
// This should be provided by the module, but until then, just use startup
// time.
2020-11-23 13:24:19 -05:00
const _requireLastModified = new Date();
const requireDefinition = () => `var require = ${RequireKernel.kernelSource};\n`;
2021-02-11 17:10:13 -05:00
const getFileCompressed = async (filename, contentType) => {
let content = await getFile(filename);
if (!content || !settings.minify) {
return content;
} else if (contentType === 'application/javascript') {
return await new Promise((resolve) => {
2020-11-23 13:24:19 -05:00
threadsPool.queue(async ({compressJS}) => {
try {
2020-11-23 13:24:19 -05:00
logger.info('Compress JS file %s.', filename);
content = content.toString();
const compressResult = await compressJS(content);
if (compressResult.error) {
console.error(`Error compressing JS (${filename}) using terser`, compressResult.error);
} else {
content = compressResult.code.toString(); // Convert content obj code to string
}
} catch (error) {
console.error('getFile() returned an error in ' +
`getFileCompressed(${filename}, ${contentType}): ${error}`);
}
2021-02-11 17:10:13 -05:00
resolve(content);
2020-11-23 13:24:19 -05:00
});
2021-02-11 17:10:13 -05:00
});
} else if (contentType === 'text/css') {
return await new Promise((resolve) => {
2020-11-23 13:24:19 -05:00
threadsPool.queue(async ({compressCSS}) => {
try {
2020-11-23 13:24:19 -05:00
logger.info('Compress CSS file %s.', filename);
content = await compressCSS(filename, ROOT_DIR);
} catch (error) {
console.error(`CleanCSS.minify() returned an error on ${filename}: ${error}`);
}
2021-02-11 17:10:13 -05:00
resolve(content);
2020-11-23 13:24:19 -05:00
});
2021-02-11 17:10:13 -05:00
});
} else {
return content;
}
};
2012-01-15 17:23:48 -08:00
2021-02-11 16:32:29 -05:00
const getFile = async (filename) => {
if (filename === 'js/require-kernel.js') return requireDefinition();
return await fs.readFile(path.join(ROOT_DIR, filename));
};
2021-02-11 17:15:31 -05:00
exports.minify = (req, res, next) => minify(req, res).catch((err) => next(err || new Error(err)));
exports.requestURIs = requestURIs;
exports.shutdown = async (hookName, context) => {
await threadsPool.terminate();
};