pad.libre-service.eu-etherpad/src/node/handler/ImportHandler.js

320 lines
9.8 KiB
JavaScript
Raw Normal View History

2011-07-21 21:13:58 +02:00
/**
* Handles the import requests
*/
/*
* 2011 Peter 'Pita' Martischka (Primary Technology Ltd)
2012-11-27 00:11:45 +01:00
* 2012 Iván Eixarch
2014-12-30 00:12:26 +01:00
* 2014 John McLear (Etherpad Foundation / McLear Ltd)
2011-07-21 21:13:58 +02:00
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS-IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
2012-11-23 19:06:18 +01:00
var ERR = require("async-stacktrace")
, padManager = require("../db/PadManager")
, padMessageHandler = require("./PadMessageHandler")
, async = require("async")
, fs = require("fs")
, path = require("path")
2012-11-23 19:06:18 +01:00
, settings = require('../utils/Settings')
, formidable = require('formidable')
, os = require("os")
2013-09-27 15:47:34 +02:00
, importHtml = require("../utils/ImportHtml")
2014-12-29 20:57:58 +01:00
, importEtherpad = require("../utils/ImportEtherpad")
2013-11-27 01:23:11 +01:00
, log4js = require("log4js")
, hooks = require("ep_etherpad-lite/static/js/pluginfw/hooks.js");
// Converter module used to turn uploaded documents into HTML (null = none
// configured) and the file extension requested from it.
var convertor = null;
var exportExtension = "htm";

if (settings.soffice != null) {
  // soffice is enabled, so it takes precedence and produces ".html" output
  convertor = require("../utils/LibreOffice");
  exportExtension = "html";
} else if (settings.soffice === null && settings.abiword != null) {
  // abiword is only loaded when it is enabled and soffice is explicitly null
  convertor = require("../utils/Abiword");
}

// for node 0.6 compatibility, os.tmpDir() only works from 0.8:
// use the first non-empty candidate, ending with the '/tmp' fallback
var tmpDirectory = [
  process.env.TEMP,
  process.env.TMPDIR,
  process.env.TMP,
  '/tmp'
].filter(Boolean)[0];
2011-07-21 21:13:58 +02:00
/**
 * Handles an import request for a pad.
 *
 * The uploaded file is stored in the temp directory, optionally handed to
 * "import" plugin hooks, then either written straight into the database
 * (".etherpad" files) or converted/renamed to an HTML/text file whose content
 * is set on the pad. Connected clients are updated afterwards and the
 * temporary files are removed.
 *
 * The response is always a small HTML page that calls
 * window.parent.padimpexp.handleFrameCall(directDatabaseAccess, status),
 * where status is "ok", "uploadFailed", "convertFailed" or "padHasData".
 * Any other error is passed to ERR() without a callback.
 *
 * @param {Object} req   incoming HTTP request carrying the upload (parsed with formidable)
 * @param {Object} res   HTTP response, answered via res.send()
 * @param {String} padId id of the pad that receives the imported content
 */
exports.doImport = function(req, res, padId)
{
  var apiLogger = log4js.getLogger("ImportHandler");

  //pipe to a file
  //convert file to html via abiword or soffice
  //set html in the pad

  var srcFile, destFile
    , pad
    , text
    , importHandledByPlugin
    , directDatabaseAccess
    , useConvertor;

  var randNum = Math.floor(Math.random()*0xFFFFFFFF);

  // setting flag for whether to use convertor or not
  useConvertor = (convertor != null);

  //for node < 0.7 compatibility
  var fileExists = fs.exists || path.exists;

  // Removes a temporary file if it exists; paths that were never assigned
  // (e.g. the upload failed before srcFile was known) are skipped.
  function removeTempFile(file, done) {
    if (!file) return done();
    fileExists(file, function(exist) {
      if (exist) {
        fs.unlink(file, done);
      } else {
        done();
      }
    });
  }

  async.series([
    //save the uploaded file to /tmp
    function(callback) {
      var form = new formidable.IncomingForm();
      form.keepExtensions = true;
      form.uploadDir = tmpDirectory;

      form.parse(req, function(err, fields, files) {
        //the upload failed, stop at this point
        if(err || files.file === undefined) {
          if(err) console.warn("Uploading Error: " + err.stack);
          callback("uploadFailed");
        }
        //everything ok, continue
        else {
          //save the path of the uploaded file
          srcFile = files.file.path;
          callback();
        }
      });
    },

    //ensure this is a file ending we know, else we change the file ending to .txt
    //this allows us to accept source code files like .c or .java
    function(callback) {
      var fileEnding = path.extname(srcFile).toLowerCase()
        , knownFileEndings = [".txt", ".doc", ".docx", ".pdf", ".odt", ".html", ".htm", ".etherpad", ".rtf"]
        , fileEndingKnown = (knownFileEndings.indexOf(fileEnding) > -1);

      //if the file ending is known, continue as normal
      if(fileEndingKnown) {
        callback();
        return;
      }

      if(settings.allowUnknownFileEnds !== true){
        console.warn("Not allowing unknown file type to be imported", fileEnding);
        callback("uploadFailed");
        return;
      }

      //we need to rename this file with a .txt ending
      var renamedFile = path.join(path.dirname(srcFile), path.basename(srcFile, fileEnding)+".txt");
      fs.rename(srcFile, renamedFile, function(err){
        if(ERR(err, callback)) return;
        //only track the new name once the rename really happened, so the
        //cleanup at the end still finds the upload if the rename failed
        srcFile = renamedFile;
        callback();
      });
    },

    function(callback){
      destFile = path.join(tmpDirectory, "etherpad_import_" + randNum + "." + exportExtension);

      // Logic for allowing external Import Plugins
      hooks.aCallAll("import", {srcFile: srcFile, destFile: destFile}, function(err, result){
        //ERR() already forwards the error to callback, do not call it again
        if(ERR(err, callback)) return;
        if(result.length > 0){ // This feels hacky and wrong..
          importHandledByPlugin = true;
        }
        callback();
      });
    },

    //.etherpad files are written directly into the database
    function(callback) {
      var fileEnding = path.extname(srcFile).toLowerCase();
      var fileIsNotEtherpad = (fileEnding !== ".etherpad");

      if (fileIsNotEtherpad) {
        callback();
        return;
      }

      // we do this here so we can see if the pad has quite a few edits
      padManager.getPad(padId, function(err, _pad){
        if(ERR(err, callback)) return;

        var headCount = _pad.head;
        if(headCount >= 10){
          apiLogger.warn("Direct database Import attempt of a pad that already has content, we wont be doing this")
          return callback("padHasData");
        }

        fs.readFile(srcFile, "utf8", function(err, _text){
          if(ERR(err, callback)) return;

          directDatabaseAccess = true;
          importEtherpad.setPadRaw(padId, _text, function(err){
            if(ERR(err, callback)) return;
            callback();
          });
        });
      });
    },

    //convert file to html
    function(callback) {
      if (importHandledByPlugin || directDatabaseAccess) {
        callback();
        return;
      }

      var fileEnding = path.extname(srcFile).toLowerCase();
      var fileIsHTML = (fileEnding === ".html" || fileEnding === ".htm");
      var fileIsTXT = (fileEnding === ".txt");

      if (fileIsTXT) useConvertor = false; // Don't use convertor for text files

      // See https://github.com/ether/etherpad-lite/issues/2572
      if (fileIsHTML || (useConvertor === false)) {
        // if no convertor only rename
        fs.rename(srcFile, destFile, callback);
        return;
      }

      convertor.convertFile(srcFile, destFile, exportExtension, function(err) {
        //catch convert errors
        if(err) {
          console.warn("Converting Error:", err);
          return callback("convertFailed");
        }
        callback();
      });
    },

    //without a convertor, reject files that contain unexpected bytes
    function(callback) {
      if (useConvertor || directDatabaseAccess) {
        callback();
        return;
      }

      // Read the file with no encoding for raw buffer access.
      fs.readFile(destFile, function(err, buf) {
        //report through the series callback instead of throwing inside the fs callback
        if(ERR(err, callback)) return;

        // NOTE(review): the flag is called "isAscii" but the threshold is 240,
        // not 127 -- only bytes above 240 are rejected. Confirm this is intended.
        var isAscii = true;
        for (var i=0, len=buf.length; i<len; i++) {
          if (buf[i] > 240) {
            isAscii=false;
            break;
          }
        }

        if (isAscii) {
          callback();
        } else {
          callback("uploadFailed");
        }
      });
    },

    //get the pad object
    function(callback) {
      padManager.getPad(padId, function(err, _pad){
        if(ERR(err, callback)) return;
        pad = _pad;
        callback();
      });
    },

    //read the text
    function(callback) {
      if(directDatabaseAccess){
        callback();
        return;
      }

      fs.readFile(destFile, "utf8", function(err, _text){
        if(ERR(err, callback)) return;
        text = _text;
        // Title needs to be stripped out else it appends it to the pad..
        text = text.replace("<title>", "<!-- <title>");
        text = text.replace("</title>","</title>-->");

        //node on windows has a delay on releasing of the file lock.
        //We add a 100ms delay to work around this
        if(os.type().indexOf("Windows") > -1){
          setTimeout(function() {callback();}, 100);
        } else {
          callback();
        }
      });
    },

    //change text of the pad and broadcast the changeset
    function(callback) {
      if(!directDatabaseAccess){
        var fileEnding = path.extname(srcFile).toLowerCase();
        if (importHandledByPlugin || useConvertor || fileEnding == ".htm" || fileEnding == ".html") {
          // NOTE(review): the code below does not wait for this callback, so
          // setPadHTML is presumably synchronous -- confirm against ImportHtml.
          importHtml.setPadHTML(pad, text, function(e){
            if(e) apiLogger.warn("Error importing, possibly caused by malformed HTML");
          });
        } else {
          pad.setText(text);
        }
      }

      // Load the Pad into memory then broadcast updates to all clients
      padManager.unloadPad(padId);
      padManager.getPad(padId, function(err, _pad){
        if(ERR(err, callback)) return;

        var reloadedPad = _pad;
        padManager.unloadPad(padId);

        // direct Database Access means a pad user should perform a switchToPad
        // and not attempt to receive updated pad data..
        if(!directDatabaseAccess){
          padMessageHandler.updatePadClients(reloadedPad, function(){
            callback();
          });
        }else{
          callback();
        }
      });
    }
  ], function(err) {
    //clean up temporary files, on success as well as on failure, so aborted
    //imports and direct database imports do not pile up in the temp directory
    async.parallel([
      function(done){ removeTempFile(srcFile, done); },
      function(done){ removeTempFile(destFile, done); }
    ], function(cleanupErr) {
      var status = "ok";
      var knownErrors = ["uploadFailed", "convertFailed", "padHasData"];

      //check for known errors and replace the status
      if(knownErrors.indexOf(err) > -1)
      {
        status = err;
        //a failed cleanup must not hide the status the client is waiting for
        if(cleanupErr) console.warn("Could not remove temporary import files:", cleanupErr);
      }
      else
      {
        //unexpected errors (including cleanup failures) are handed to ERR
        ERR(err || cleanupErr);
      }

      //close the connection
      res.send(
        "<head> " +
        "<script type='text/javascript' src='../../static/js/jquery.js'></script> " +
        "</head> " +
        "<script> " +
        "$(window).load(function(){ " +
        "var impexp = window.parent.padimpexp.handleFrameCall('" + directDatabaseAccess +"', '" + status + "'); " +
        "}) " +
        "</script>"
      );
    });
  });
};