mirror of
https://github.com/ether/etherpad-lite.git
synced 2025-04-23 08:56:17 -04:00
Tidy HTML before trying to convert it with abiword
This commit is contained in:
parent
9e9207d8b6
commit
786b43efc8
4 changed files with 87 additions and 35 deletions
|
@ -28,6 +28,7 @@ var fs = require("fs");
|
|||
var settings = require('../utils/Settings');
|
||||
var os = require('os');
|
||||
var hooks = require("ep_etherpad-lite/static/js/pluginfw/hooks");
|
||||
var TidyHtml = require('../utils/TidyHtml');
|
||||
|
||||
//load abiword only if its enabled
|
||||
if(settings.abiword != null)
|
||||
|
@ -35,28 +36,28 @@ if(settings.abiword != null)
|
|||
|
||||
var tempDirectory = "/tmp";
|
||||
|
||||
//tempDirectory changes if the operating system is windows
|
||||
//tempDirectory changes if the operating system is windows
|
||||
if(os.type().indexOf("Windows") > -1)
|
||||
{
|
||||
tempDirectory = process.env.TEMP;
|
||||
}
|
||||
|
||||
|
||||
/**
|
||||
* do a requested export
|
||||
*/
|
||||
*/
|
||||
exports.doExport = function(req, res, padId, type)
|
||||
{
|
||||
var fileName = padId;
|
||||
|
||||
// allow fileName to be overwritten by a hook, the type type is kept static for security reasons
|
||||
hooks.aCallFirst("exportFileName", padId,
|
||||
hooks.aCallFirst("exportFileName", padId,
|
||||
function(err, hookFileName){
|
||||
// if fileName is set then set it to the padId, note that fileName is returned as an array.
|
||||
if(hookFileName.length) fileName = hookFileName;
|
||||
|
||||
//tell the browser that this is a downloadable file
|
||||
res.attachment(fileName + "." + type);
|
||||
|
||||
|
||||
//if this is a plain text export, we can do this directly
|
||||
// We have to over engineer this because tabs are stored as attributes and not plain text
|
||||
if(type == "etherpad"){
|
||||
|
@ -72,7 +73,7 @@ exports.doExport = function(req, res, padId, type)
|
|||
var txt;
|
||||
var randNum;
|
||||
var srcFile, destFile;
|
||||
|
||||
|
||||
async.series([
|
||||
//render the txt document
|
||||
function(callback)
|
||||
|
@ -96,7 +97,7 @@ exports.doExport = function(req, res, padId, type)
|
|||
{
|
||||
//ensure html can be collected by the garbage collector
|
||||
txt = null;
|
||||
|
||||
|
||||
destFile = tempDirectory + "/etherpad_export_" + randNum + "." + type;
|
||||
abiword.convertFile(srcFile, destFile, type, callback);
|
||||
},
|
||||
|
@ -140,7 +141,7 @@ exports.doExport = function(req, res, padId, type)
|
|||
var html;
|
||||
var randNum;
|
||||
var srcFile, destFile;
|
||||
|
||||
|
||||
async.series([
|
||||
//render the html document
|
||||
function(callback)
|
||||
|
@ -150,7 +151,7 @@ exports.doExport = function(req, res, padId, type)
|
|||
if(ERR(err, callback)) return;
|
||||
html = _html;
|
||||
callback();
|
||||
});
|
||||
});
|
||||
},
|
||||
//decide what to do with the html export
|
||||
function(callback)
|
||||
|
@ -162,22 +163,29 @@ exports.doExport = function(req, res, padId, type)
|
|||
hooks.aCallFirst("exportHTMLSend", html, function(err, newHTML){
|
||||
if(newHTML.length) html = newHTML;
|
||||
res.send(html);
|
||||
callback("stop");
|
||||
callback("stop");
|
||||
});
|
||||
}
|
||||
else //write the html export to a file
|
||||
{
|
||||
randNum = Math.floor(Math.random()*0xFFFFFFFF);
|
||||
srcFile = tempDirectory + "/etherpad_export_" + randNum + ".html";
|
||||
fs.writeFile(srcFile, html, callback);
|
||||
fs.writeFile(srcFile, html, callback);
|
||||
}
|
||||
},
|
||||
//send the convert job to abiword
|
||||
|
||||
// Tidy up the exported HTML
|
||||
function(callback)
|
||||
{
|
||||
//ensure html can be collected by the garbage collector
|
||||
html = null;
|
||||
|
||||
|
||||
TidyHtml.tidy(srcFile, callback);
|
||||
},
|
||||
|
||||
//send the convert job to abiword
|
||||
function(callback)
|
||||
{
|
||||
destFile = tempDirectory + "/etherpad_export_" + randNum + "." + type;
|
||||
abiword.convertFile(srcFile, destFile, type, callback);
|
||||
},
|
||||
|
@ -199,7 +207,7 @@ exports.doExport = function(req, res, padId, type)
|
|||
//100ms delay to accomidate for slow windows fs
|
||||
if(os.type().indexOf("Windows") > -1)
|
||||
{
|
||||
setTimeout(function()
|
||||
setTimeout(function()
|
||||
{
|
||||
fs.unlink(destFile, callback);
|
||||
}, 100);
|
||||
|
|
|
@ -152,6 +152,11 @@ exports.minify = true;
|
|||
*/
|
||||
exports.abiword = null;
|
||||
|
||||
/**
|
||||
* The path of the tidy executable
|
||||
*/
|
||||
exports.tidyHtml = null;
|
||||
|
||||
/**
|
||||
* Should we support none natively supported file types on import?
|
||||
*/
|
||||
|
@ -167,7 +172,7 @@ exports.loglevel = "INFO";
|
|||
*/
|
||||
exports.disableIPlogging = false;
|
||||
|
||||
/**
|
||||
/**
|
||||
* Disable Load Testing
|
||||
*/
|
||||
exports.loadTest = false;
|
||||
|
@ -239,7 +244,7 @@ exports.reloadSettings = function reloadSettings() {
|
|||
} else {
|
||||
settingsFilename = path.resolve(path.join(exports.root, settingsFilename));
|
||||
}
|
||||
|
||||
|
||||
var settingsStr;
|
||||
try{
|
||||
//read the settings sync
|
||||
|
|
35
src/node/utils/TidyHtml.js
Normal file
35
src/node/utils/TidyHtml.js
Normal file
|
@ -0,0 +1,35 @@
|
|||
/**
|
||||
* Tidy up the HTML in a given file
|
||||
*/
|
||||
|
||||
var settings = require("./Settings");
|
||||
var spawn = require('child_process').spawn;
|
||||
|
||||
exports.tidy = function(srcFile, callback) {
|
||||
// Don't do anything if Tidy hasn't been enabled
|
||||
if (!settings.tidyHtml) {
|
||||
return callback(null);
|
||||
}
|
||||
|
||||
var errMessage = '';
|
||||
|
||||
// Spawn a new tidy instance that cleans up the file inline
|
||||
var tidy = spawn(settings.tidyHtml, ['-modify', srcFile]);
|
||||
|
||||
// Keep track of any error messages
|
||||
tidy.stderr.on('data', function (data) {
|
||||
errMessage += data.toString();
|
||||
});
|
||||
|
||||
// Wait until Tidy is done
|
||||
tidy.on('close', function(code) {
|
||||
// Tidy returns a 0 when no errors occur and a 1 exit code when
|
||||
// the file could be tidied but a few warnings were generated
|
||||
if (code === 0 || code === 1) {
|
||||
return callback(null);
|
||||
} else {
|
||||
console.error(errMessage);
|
||||
return callback('Tidy died with exit code ' + code);
|
||||
}
|
||||
});
|
||||
};
|
Loading…
Add table
Add a link
Reference in a new issue