Merge branch 'develop' of github.com:ether/etherpad-lite into mochawesome

This commit is contained in:
John McLear 2021-01-27 20:11:53 +00:00
commit 7696ec0a02
7 changed files with 333 additions and 356 deletions

View file

@ -421,7 +421,20 @@ Things in context:
4. text - the text for that line 4. text - the text for that line
This hook allows you to validate/manipulate the text before it's sent to the This hook allows you to validate/manipulate the text before it's sent to the
server side. The return value should be the validated/manipulated text. server side. To change the text, either:
* Set the `text` context property to the desired value and return `undefined`.
* (Deprecated) Return a string. If a hook function changes the `text` context
property, the return value is ignored. If no hook function changes `text` but
multiple hook functions return a string, the first one wins.
Example:
```
exports.collectContentLineText = (hookName, context) => {
context.text = tweakText(context.text);
};
```
## collectContentLineBreak ## collectContentLineBreak

View file

@ -391,9 +391,9 @@ const defaultResponseRefs = {
// convert to a dictionary of operation objects // convert to a dictionary of operation objects
const operations = {}; const operations = {};
for (const resource in resources) { for (const [resource, actions] of Object.entries(resources)) {
for (const action in resources[resource]) { for (const [action, spec] of Object.entries(actions)) {
const {operationId, responseSchema, ...operation} = resources[resource][action]; const {operationId, responseSchema, ...operation} = spec;
// add response objects // add response objects
const responses = {...defaultResponseRefs}; const responses = {...defaultResponseRefs};
@ -623,7 +623,7 @@ exports.expressCreateServer = (hookName, args, cb) => {
} else { } else {
// an unknown error happened // an unknown error happened
// log it and throw internal error // log it and throw internal error
apiLogger.error(err); apiLogger.error(err.stack || err.toString());
throw new createHTTPError.InternalError('internal error'); throw new createHTTPError.InternalError('internal error');
} }
}); });

View file

@ -1139,7 +1139,7 @@ function Ace2Inner() {
lastDirtyNode = (lastDirtyNode && isNodeDirty(lastDirtyNode) && lastDirtyNode); lastDirtyNode = (lastDirtyNode && isNodeDirty(lastDirtyNode) && lastDirtyNode);
if (firstDirtyNode && lastDirtyNode) { if (firstDirtyNode && lastDirtyNode) {
const cc = makeContentCollector(isStyled, browser, rep.apool, null, className2Author); const cc = makeContentCollector(isStyled, browser, rep.apool, className2Author);
cc.notifySelection(selection); cc.notifySelection(selection);
const dirtyNodes = []; const dirtyNodes = [];
for (let n = firstDirtyNode; n && for (let n = firstDirtyNode; n &&

View file

@ -32,30 +32,31 @@ const hooks = require('./pluginfw/hooks');
const sanitizeUnicode = (s) => UNorm.nfc(s); const sanitizeUnicode = (s) => UNorm.nfc(s);
const makeContentCollector = (collectStyles, abrowser, apool, domInterface, className2Author) => { // This file is used both in browsers and with cheerio in Node.js (for importing HTML). Cheerio's
const dom = domInterface || { // Node-like objects are not 100% API compatible with the DOM specification; the following functions
isNodeText: (n) => n.nodeType === 3, // abstract away the differences.
nodeTagName: (n) => n.tagName,
nodeValue: (n) => n.nodeValue,
nodeNumChildren: (n) => {
if (n.childNodes == null) return 0;
return n.childNodes.length;
},
nodeChild: (n, i) => {
if (n.childNodes.item == null) {
return n.childNodes[i];
}
return n.childNodes.item(i);
},
nodeProp: (n, p) => n[p],
nodeAttr: (n, a) => {
if (n.getAttribute != null) return n.getAttribute(a);
if (n.attribs != null) return n.attribs[a];
return null;
},
optNodeInnerHTML: (n) => n.innerHTML,
};
// .nodeType works with DOM and cheerio 0.22.0, but cheerio 0.22.0 does not provide the Node.*_NODE
// constants so they cannot be used here.
const isElementNode = (n) => n.nodeType === 1; // Node.ELEMENT_NODE
const isTextNode = (n) => n.nodeType === 3; // Node.TEXT_NODE
// .tagName works with DOM and cheerio 0.22.0, but:
// * With DOM, .tagName is an uppercase string.
// * With cheerio 0.22.0, .tagName is a lowercase string.
// For consistency, this function always returns a lowercase string.
const tagName = (n) => n.tagName && n.tagName.toLowerCase();
// .childNodes works with DOM and cheerio 0.22.0, except in cheerio the .childNodes property does
// not exist on text nodes (and maybe other non-element nodes).
const childNodes = (n) => n.childNodes || [];
const getAttribute = (n, a) => {
// .getAttribute() works with DOM but not with cheerio 0.22.0.
if (n.getAttribute != null) return n.getAttribute(a);
// .attribs[] works with cheerio 0.22.0 but not with DOM.
if (n.attribs != null) return n.attribs[a];
return null;
};
const makeContentCollector = (collectStyles, abrowser, apool, className2Author) => {
const _blockElems = { const _blockElems = {
div: 1, div: 1,
p: 1, p: 1,
@ -67,7 +68,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
_blockElems[element] = 1; _blockElems[element] = 1;
}); });
const isBlockElement = (n) => !!_blockElems[(dom.nodeTagName(n) || '').toLowerCase()]; const isBlockElement = (n) => !!_blockElems[tagName(n) || ''];
const textify = (str) => sanitizeUnicode( const textify = (str) => sanitizeUnicode(
str.replace(/(\n | \n)/g, ' ') str.replace(/(\n | \n)/g, ' ')
@ -75,7 +76,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
.replace(/\xa0/g, ' ') .replace(/\xa0/g, ' ')
.replace(/\t/g, ' ')); .replace(/\t/g, ' '));
const getAssoc = (node, name) => dom.nodeProp(node, `_magicdom_${name}`); const getAssoc = (node, name) => node[`_magicdom_${name}`];
const lines = (() => { const lines = (() => {
const textArray = []; const textArray = [];
@ -123,13 +124,17 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
let selEnd = [-1, -1]; let selEnd = [-1, -1];
const _isEmpty = (node, state) => { const _isEmpty = (node, state) => {
// consider clean blank lines pasted in IE to be empty // consider clean blank lines pasted in IE to be empty
if (dom.nodeNumChildren(node) === 0) return true; if (childNodes(node).length === 0) return true;
if (dom.nodeNumChildren(node) === 1 && if (childNodes(node).length === 1 &&
getAssoc(node, 'shouldBeEmpty') && getAssoc(node, 'shouldBeEmpty') &&
dom.optNodeInnerHTML(node) === ' ' && // Note: The .innerHTML property exists on DOM Element objects but not on cheerio's
// Element-like objects (cheerio v0.22.0) so this equality check will always be false.
// Cheerio's Element-like objects have no equivalent to .innerHTML. (Cheerio objects have an
// .html() method, but that isn't accessible here.)
node.innerHTML === ' ' &&
!getAssoc(node, 'unpasted')) { !getAssoc(node, 'unpasted')) {
if (state) { if (state) {
const child = dom.nodeChild(node, 0); const child = childNodes(node)[0];
_reachPoint(child, 0, state); _reachPoint(child, 0, state);
_reachPoint(child, 1, state); _reachPoint(child, 1, state);
} }
@ -149,7 +154,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
}; };
const _reachBlockPoint = (nd, idx, state) => { const _reachBlockPoint = (nd, idx, state) => {
if (!dom.isNodeText(nd)) _reachPoint(nd, idx, state); if (!isTextNode(nd)) _reachPoint(nd, idx, state);
}; };
const _reachPoint = (nd, idx, state) => { const _reachPoint = (nd, idx, state) => {
@ -228,25 +233,24 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
const _recalcAttribString = (state) => { const _recalcAttribString = (state) => {
const lst = []; const lst = [];
for (const a in state.attribs) { for (const [a, count] of Object.entries(state.attribs)) {
if (state.attribs[a]) { if (!count) continue;
// The following splitting of the attribute name is a workaround // The following splitting of the attribute name is a workaround
// to enable the content collector to store key-value attributes // to enable the content collector to store key-value attributes
// see https://github.com/ether/etherpad-lite/issues/2567 for more information // see https://github.com/ether/etherpad-lite/issues/2567 for more information
// in long term the contentcollector should be refactored to get rid of this workaround // in long term the contentcollector should be refactored to get rid of this workaround
const ATTRIBUTE_SPLIT_STRING = '::'; const ATTRIBUTE_SPLIT_STRING = '::';
// see if attributeString is splittable // see if attributeString is splittable
const attributeSplits = a.split(ATTRIBUTE_SPLIT_STRING); const attributeSplits = a.split(ATTRIBUTE_SPLIT_STRING);
if (attributeSplits.length > 1) { if (attributeSplits.length > 1) {
// the attribute name follows the convention key::value // the attribute name follows the convention key::value
// so save it as a key value attribute // so save it as a key value attribute
lst.push([attributeSplits[0], attributeSplits[1]]); lst.push([attributeSplits[0], attributeSplits[1]]);
} else { } else {
// the "normal" case, the attribute is just a switch // the "normal" case, the attribute is just a switch
// so set it true // so set it true
lst.push([a, 'true']); lst.push([a, 'true']);
}
} }
} }
if (state.authorLevel > 0) { if (state.authorLevel > 0) {
@ -316,25 +320,15 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
const startLine = lines.length() - 1; const startLine = lines.length() - 1;
_reachBlockPoint(node, 0, state); _reachBlockPoint(node, 0, state);
if (dom.isNodeText(node)) { if (isTextNode(node)) {
let txt = dom.nodeValue(node); const tname = getAttribute(node.parentNode, 'name');
const tname = dom.nodeAttr(node.parentNode, 'name'); const context = {cc: this, state, tname, node, text: node.nodeValue};
// Hook functions may either return a string (deprecated) or modify context.text. If any hook
const txtFromHook = hooks.callAll('collectContentLineText', { // function modifies context.text then all returned strings are ignored. If no hook functions
cc: this, // modify context.text, the first hook function to return a string wins.
state, const [hookTxt] =
tname, hooks.callAll('collectContentLineText', context).filter((s) => typeof s === 'string');
node, let txt = context.text === node.nodeValue && hookTxt != null ? hookTxt : context.text;
text: txt,
styl: null,
cls: null,
});
if (typeof (txtFromHook) === 'object') {
txt = dom.nodeValue(node);
} else if (txtFromHook) {
txt = txtFromHook;
}
let rest = ''; let rest = '';
let x = 0; // offset into original text let x = 0; // offset into original text
@ -384,8 +378,8 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
cc.startNewLine(state); cc.startNewLine(state);
} }
} }
} else { } else if (isElementNode(node)) {
const tname = (dom.nodeTagName(node) || '').toLowerCase(); const tname = tagName(node) || '';
if (tname === 'img') { if (tname === 'img') {
hooks.callAll('collectContentImage', { hooks.callAll('collectContentImage', {
@ -403,8 +397,8 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
if (tname === 'br') { if (tname === 'br') {
this.breakLine = true; this.breakLine = true;
const tvalue = dom.nodeAttr(node, 'value'); const tvalue = getAttribute(node, 'value');
const induceLineBreak = hooks.callAll('collectContentLineBreak', { const [startNewLine = true] = hooks.callAll('collectContentLineBreak', {
cc: this, cc: this,
state, state,
tname, tname,
@ -412,17 +406,14 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
styl: null, styl: null,
cls: null, cls: null,
}); });
const startNewLine = (
typeof (induceLineBreak) === 'object' &&
induceLineBreak.length === 0) ? true : induceLineBreak[0];
if (startNewLine) { if (startNewLine) {
cc.startNewLine(state); cc.startNewLine(state);
} }
} else if (tname === 'script' || tname === 'style') { } else if (tname === 'script' || tname === 'style') {
// ignore // ignore
} else if (!isEmpty) { } else if (!isEmpty) {
let styl = dom.nodeAttr(node, 'style'); let styl = getAttribute(node, 'style');
let cls = dom.nodeAttr(node, 'class'); let cls = getAttribute(node, 'class');
let isPre = (tname === 'pre'); let isPre = (tname === 'pre');
if ((!isPre) && abrowser && abrowser.safari) { if ((!isPre) && abrowser && abrowser.safari) {
isPre = (styl && /\bwhite-space:\s*pre\b/i.exec(styl)); isPre = (styl && /\bwhite-space:\s*pre\b/i.exec(styl));
@ -469,26 +460,23 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
cc.doAttrib(state, 'strikethrough'); cc.doAttrib(state, 'strikethrough');
} }
if (tname === 'ul' || tname === 'ol') { if (tname === 'ul' || tname === 'ol') {
let type = node.attribs ? node.attribs.class : null; let type = getAttribute(node, 'class');
const rr = cls && /(?:^| )list-([a-z]+[0-9]+)\b/.exec(cls); const rr = cls && /(?:^| )list-([a-z]+[0-9]+)\b/.exec(cls);
// lists do not need to have a type, so before we make a wrong guess // lists do not need to have a type, so before we make a wrong guess
// check if we find a better hint within the node's children // check if we find a better hint within the node's children
if (!rr && !type) { if (!rr && !type) {
for (const i in node.children) { for (const child of childNodes(node)) {
if (node.children[i] && node.children[i].name === 'ul') { if (tagName(child) !== 'ul') continue;
type = node.children[i].attribs.class; type = getAttribute(child, 'class');
if (type) { if (type) break;
break;
}
}
} }
} }
if (rr && rr[1]) { if (rr && rr[1]) {
type = rr[1]; type = rr[1];
} else { } else {
if (tname === 'ul') { if (tname === 'ul') {
if ((type && type.match('indent')) || const cls = getAttribute(node, 'class');
(node.attribs && node.attribs.class && node.attribs.class.match('indent'))) { if ((type && type.match('indent')) || (cls && cls.match('indent'))) {
type = 'indent'; type = 'indent';
} else { } else {
type = 'bullet'; type = 'bullet';
@ -503,7 +491,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
// This has undesirable behavior in Chrome but is right in other browsers. // This has undesirable behavior in Chrome but is right in other browsers.
// See https://github.com/ether/etherpad-lite/issues/2412 for reasoning // See https://github.com/ether/etherpad-lite/issues/2412 for reasoning
if (!abrowser.chrome) oldListTypeOrNull = (_enterList(state, undefined) || 'none'); if (!abrowser.chrome) oldListTypeOrNull = (_enterList(state, undefined) || 'none');
} else if ((tname === 'li')) { } else if (tname === 'li') {
state.lineAttributes.start = state.start || 0; state.lineAttributes.start = state.start || 0;
_recalcAttribString(state); _recalcAttribString(state);
if (state.lineAttributes.list.indexOf('number') !== -1) { if (state.lineAttributes.list.indexOf('number') !== -1) {
@ -513,7 +501,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
Note how the <ol> item has to be inside a <li> Note how the <ol> item has to be inside a <li>
Because of this we don't increment the start number Because of this we don't increment the start number
*/ */
if (node.parent && node.parent.name !== 'ol') { if (node.parentNode && tagName(node.parentNode) !== 'ol') {
/* /*
TODO: start number has to increment based on indentLevel(numberX) TODO: start number has to increment based on indentLevel(numberX)
This means we have to build an object IE This means we have to build an object IE
@ -530,7 +518,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
} }
} }
// UL list items never modify the start value. // UL list items never modify the start value.
if (node.parent && node.parent.name === 'ul') { if (node.parentNode && tagName(node.parentNode) === 'ul') {
state.start++; state.start++;
// TODO, this is hacky. // TODO, this is hacky.
// Because if the first item is an UL it will increment a list no? // Because if the first item is an UL it will increment a list no?
@ -559,9 +547,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
} }
} }
const nc = dom.nodeNumChildren(node); for (const c of childNodes(node)) {
for (let i = 0; i < nc; i++) {
const c = dom.nodeChild(node, i);
cc.collectContent(c, state); cc.collectContent(c, state);
} }

View file

@ -1,3 +1,5 @@
'use strict';
/* /*
* This file is copied & modified from <basedir>/tests/backend/specs/api/pad.js * This file is copied & modified from <basedir>/tests/backend/specs/api/pad.js
* *

View file

@ -6,151 +6,148 @@
* TODO: unify those two files, and merge in a single one. * TODO: unify those two files, and merge in a single one.
*/ */
/* eslint-disable max-len */
const common = require('../../common'); const common = require('../../common');
const supertest = require(`${__dirname}/../../../../src/node_modules/supertest`); const settings = require('../../../container/loadSettings.js').loadSettings();
const settings = require(`${__dirname}/../../../../tests/container/loadSettings.js`).loadSettings(); const supertest = require('ep_etherpad-lite/node_modules/supertest');
const api = supertest(`http://${settings.ip}:${settings.port}`);
const api = supertest(`http://${settings.ip}:${settings.port}`);
const apiKey = common.apiKey; const apiKey = common.apiKey;
const apiVersion = 1; const apiVersion = 1;
const testImports = { const testImports = {
'malformed': { 'malformed': {
input: '<html><body><li>wtf</ul></body></html>', input: '<html><body><li>wtf</ul></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>wtf<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>wtf<br><br></body></html>',
expectedText: 'wtf\n\n', wantText: 'wtf\n\n',
disabled: true, disabled: true,
}, },
'nonelistiteminlist #3620': { 'nonelistiteminlist #3620': {
input: '<html><body><ul>test<li>FOO</li></ul></body></html>', input: '<html><body><ul>test<li>FOO</li></ul></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body><ul class="bullet">test<li>FOO</ul><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body><ul class="bullet">test<li>FOO</ul><br></body></html>',
expectedText: '\ttest\n\t* FOO\n\n', wantText: '\ttest\n\t* FOO\n\n',
disabled: true, disabled: true,
}, },
'whitespaceinlist #3620': { 'whitespaceinlist #3620': {
input: '<html><body><ul> <li>FOO</li></ul></body></html>', input: '<html><body><ul> <li>FOO</li></ul></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body><ul class="bullet"><li>FOO</ul><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body><ul class="bullet"><li>FOO</ul><br></body></html>',
expectedText: '\t* FOO\n\n', wantText: '\t* FOO\n\n',
disabled: true,
}, },
'prefixcorrectlinenumber': { 'prefixcorrectlinenumber': {
input: '<html><body><ol><li>should be 1</li><li>should be 2</li></ol></body></html>', input: '<html><body><ol><li>should be 1</li><li>should be 2</li></ol></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1</li><li>should be 2</ol><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1</li><li>should be 2</ol><br></body></html>',
expectedText: '\t1. should be 1\n\t2. should be 2\n\n', wantText: '\t1. should be 1\n\t2. should be 2\n\n',
}, },
'prefixcorrectlinenumbernested': { 'prefixcorrectlinenumbernested': {
input: '<html><body><ol><li>should be 1</li><ol><li>foo</li></ol><li>should be 2</li></ol></body></html>', input: '<html><body><ol><li>should be 1</li><ol><li>foo</li></ol><li>should be 2</li></ol></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1<ol start="2" class="number"><li>foo</ol><li>should be 2</ol><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1<ol start="2" class="number"><li>foo</ol><li>should be 2</ol><br></body></html>',
expectedText: '\t1. should be 1\n\t\t1.1. foo\n\t2. should be 2\n\n', wantText: '\t1. should be 1\n\t\t1.1. foo\n\t2. should be 2\n\n',
}, },
/* /*
"prefixcorrectlinenumber when introduced none list item - currently not supported see #3450":{ "prefixcorrectlinenumber when introduced none list item - currently not supported see #3450": {
input: '<html><body><ol><li>should be 1</li>test<li>should be 2</li></ol></body></html>', input: '<html><body><ol><li>should be 1</li>test<li>should be 2</li></ol></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1</li>test<li>should be 2</li></ol><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1</li>test<li>should be 2</li></ol><br></body></html>',
expectedText: '\t1. should be 1\n\ttest\n\t2. should be 2\n\n' wantText: '\t1. should be 1\n\ttest\n\t2. should be 2\n\n',
} }
, ,
"newlinesshouldntresetlinenumber #2194":{ "newlinesshouldntresetlinenumber #2194": {
input: '<html><body><ol><li>should be 1</li>test<li>should be 2</li></ol></body></html>', input: '<html><body><ol><li>should be 1</li>test<li>should be 2</li></ol></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body><ol class="number"><li>should be 1</li>test<li>should be 2</li></ol><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body><ol class="number"><li>should be 1</li>test<li>should be 2</li></ol><br></body></html>',
expectedText: '\t1. should be 1\n\ttest\n\t2. should be 2\n\n' wantText: '\t1. should be 1\n\ttest\n\t2. should be 2\n\n',
} }
*/ */
'ignoreAnyTagsOutsideBody': { 'ignoreAnyTagsOutsideBody': {
description: 'Content outside body should be ignored', description: 'Content outside body should be ignored',
input: '<html><head><title>title</title><style></style></head><body>empty<br></body></html>', input: '<html><head><title>title</title><style></style></head><body>empty<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>empty<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>empty<br><br></body></html>',
expectedText: 'empty\n\n', wantText: 'empty\n\n',
}, },
'indentedListsAreNotBullets': { 'indentedListsAreNotBullets': {
description: 'Indented lists are represented with tabs and without bullets', description: 'Indented lists are represented with tabs and without bullets',
input: '<html><body><ul class="indent"><li>indent</li><li>indent</ul></body></html>', input: '<html><body><ul class="indent"><li>indent</li><li>indent</ul></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body><ul class="indent"><li>indent</li><li>indent</ul><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body><ul class="indent"><li>indent</li><li>indent</ul><br></body></html>',
expectedText: '\tindent\n\tindent\n\n' wantText: '\tindent\n\tindent\n\n',
}, },
lineWithMultipleSpaces: { 'lineWithMultipleSpaces': {
description: 'Multiple spaces should be collapsed', description: 'Multiple spaces should be collapsed',
input: '<html><body>Text with more than one space.<br></body></html>', input: '<html><body>Text with more than one space.<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>Text with more than one space.<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>Text with more than one space.<br><br></body></html>',
expectedText: 'Text with more than one space.\n\n' wantText: 'Text with more than one space.\n\n',
}, },
lineWithMultipleNonBreakingAndNormalSpaces: { 'lineWithMultipleNonBreakingAndNormalSpaces': {
// XXX the HTML between "than" and "one" looks strange // XXX the HTML between "than" and "one" looks strange
description: 'non-breaking space should be preserved, but can be replaced when it', description: 'non-breaking space should be preserved, but can be replaced when it',
input: '<html><body>Text&nbsp;with&nbsp; more&nbsp;&nbsp;&nbsp;than &nbsp;one space.<br></body></html>', input: '<html><body>Text&nbsp;with&nbsp; more&nbsp;&nbsp;&nbsp;than &nbsp;one space.<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>Text with&nbsp; more&nbsp;&nbsp; than&nbsp; one space.<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>Text with&nbsp; more&nbsp;&nbsp; than&nbsp; one space.<br><br></body></html>',
expectedText: 'Text with more than one space.\n\n' wantText: 'Text with more than one space.\n\n',
}, },
multiplenbsp: { 'multiplenbsp': {
description: 'Multiple non-breaking space should be preserved', description: 'Multiple non-breaking space should be preserved',
input: '<html><body>&nbsp;&nbsp;<br></body></html>', input: '<html><body>&nbsp;&nbsp;<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>&nbsp;&nbsp;<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>&nbsp;&nbsp;<br><br></body></html>',
expectedText: ' \n\n' wantText: ' \n\n',
}, },
multipleNonBreakingSpaceBetweenWords: { 'multipleNonBreakingSpaceBetweenWords': {
description: 'A normal space is always inserted before a word', description: 'A normal space is always inserted before a word',
input: '<html><body>&nbsp;&nbsp;word1&nbsp;&nbsp;word2&nbsp;&nbsp;&nbsp;word3<br></body></html>', input: '<html><body>&nbsp;&nbsp;word1&nbsp;&nbsp;word2&nbsp;&nbsp;&nbsp;word3<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>&nbsp; word1&nbsp; word2&nbsp;&nbsp; word3<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>&nbsp; word1&nbsp; word2&nbsp;&nbsp; word3<br><br></body></html>',
expectedText: ' word1 word2 word3\n\n' wantText: ' word1 word2 word3\n\n',
}, },
nonBreakingSpacePreceededBySpaceBetweenWords: { 'nonBreakingSpacePreceededBySpaceBetweenWords': {
description: 'A non-breaking space preceeded by a normal space', description: 'A non-breaking space preceeded by a normal space',
input: '<html><body> &nbsp;word1 &nbsp;word2 &nbsp;word3<br></body></html>', input: '<html><body> &nbsp;word1 &nbsp;word2 &nbsp;word3<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>&nbsp;word1&nbsp; word2&nbsp; word3<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>&nbsp;word1&nbsp; word2&nbsp; word3<br><br></body></html>',
expectedText: ' word1 word2 word3\n\n' wantText: ' word1 word2 word3\n\n',
}, },
nonBreakingSpaceFollowededBySpaceBetweenWords: { 'nonBreakingSpaceFollowededBySpaceBetweenWords': {
description: 'A non-breaking space followed by a normal space', description: 'A non-breaking space followed by a normal space',
input: '<html><body>&nbsp; word1&nbsp; word2&nbsp; word3<br></body></html>', input: '<html><body>&nbsp; word1&nbsp; word2&nbsp; word3<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>&nbsp; word1&nbsp; word2&nbsp; word3<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>&nbsp; word1&nbsp; word2&nbsp; word3<br><br></body></html>',
expectedText: ' word1 word2 word3\n\n' wantText: ' word1 word2 word3\n\n',
}, },
spacesAfterNewline: { 'spacesAfterNewline': {
description: 'Collapse spaces that follow a newline', description: 'Collapse spaces that follow a newline',
input:'<!doctype html><html><body>something<br> something<br></body></html>', input: '<!doctype html><html><body>something<br> something<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>something<br>something<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>something<br>something<br><br></body></html>',
expectedText: 'something\nsomething\n\n' wantText: 'something\nsomething\n\n',
}, },
spacesAfterNewlineP: { 'spacesAfterNewlineP': {
description: 'Collapse spaces that follow a paragraph', description: 'Collapse spaces that follow a paragraph',
input:'<!doctype html><html><body>something<p></p> something<br></body></html>', input: '<!doctype html><html><body>something<p></p> something<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>something<br><br>something<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>something<br><br>something<br><br></body></html>',
expectedText: 'something\n\nsomething\n\n' wantText: 'something\n\nsomething\n\n',
}, },
spacesAtEndOfLine: { 'spacesAtEndOfLine': {
description: 'Collapse spaces that preceed/follow a newline', description: 'Collapse spaces that preceed/follow a newline',
input:'<html><body>something <br> something<br></body></html>', input: '<html><body>something <br> something<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>something<br>something<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>something<br>something<br><br></body></html>',
expectedText: 'something\nsomething\n\n' wantText: 'something\nsomething\n\n',
}, },
spacesAtEndOfLineP: { 'spacesAtEndOfLineP': {
description: 'Collapse spaces that preceed/follow a paragraph', description: 'Collapse spaces that preceed/follow a paragraph',
input:'<html><body>something <p></p> something<br></body></html>', input: '<html><body>something <p></p> something<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>something<br><br>something<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>something<br><br>something<br><br></body></html>',
expectedText: 'something\n\nsomething\n\n' wantText: 'something\n\nsomething\n\n',
}, },
nonBreakingSpacesAfterNewlines: { 'nonBreakingSpacesAfterNewlines': {
description: 'Don\'t collapse non-breaking spaces that follow a newline', description: 'Don\'t collapse non-breaking spaces that follow a newline',
input:'<html><body>something<br>&nbsp;&nbsp;&nbsp;something<br></body></html>', input: '<html><body>something<br>&nbsp;&nbsp;&nbsp;something<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>something<br>&nbsp;&nbsp; something<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>something<br>&nbsp;&nbsp; something<br><br></body></html>',
expectedText: 'something\n something\n\n' wantText: 'something\n something\n\n',
}, },
nonBreakingSpacesAfterNewlinesP: { 'nonBreakingSpacesAfterNewlinesP': {
description: 'Don\'t collapse non-breaking spaces that follow a paragraph', description: 'Don\'t collapse non-breaking spaces that follow a paragraph',
input:'<html><body>something<p></p>&nbsp;&nbsp;&nbsp;something<br></body></html>', input: '<html><body>something<p></p>&nbsp;&nbsp;&nbsp;something<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>something<br><br>&nbsp;&nbsp; something<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>something<br><br>&nbsp;&nbsp; something<br><br></body></html>',
expectedText: 'something\n\n something\n\n' wantText: 'something\n\n something\n\n',
}, },
collapseSpacesInsideElements: { 'collapseSpacesInsideElements': {
description: 'Preserve only one space when multiple are present', description: 'Preserve only one space when multiple are present',
input: '<html><body>Need <span> more </span> space<i> s </i> !<br></body></html>', input: '<html><body>Need <span> more </span> space<i> s </i> !<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s </em>!<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s </em>!<br><br></body></html>',
expectedText: 'Need more space s !\n\n' wantText: 'Need more space s !\n\n',
}, },
collapseSpacesAcrossNewlines: { 'collapseSpacesAcrossNewlines': {
description: 'Newlines and multiple spaces across newlines should be collapsed', description: 'Newlines and multiple spaces across newlines should be collapsed',
input: ` input: `
<html><body>Need <html><body>Need
@ -158,30 +155,30 @@ const testImports = {
space space
<i> s </i> <i> s </i>
!<br></body></html>`, !<br></body></html>`,
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s </em>!<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s </em>!<br><br></body></html>',
expectedText: 'Need more space s !\n\n' wantText: 'Need more space s !\n\n',
}, },
multipleNewLinesAtBeginning: { 'multipleNewLinesAtBeginning': {
description: 'Multiple new lines and paragraphs at the beginning should be preserved', description: 'Multiple new lines and paragraphs at the beginning should be preserved',
input: '<html><body><br><br><p></p><p></p>first line<br><br>second line<br></body></html>', input: '<html><body><br><br><p></p><p></p>first line<br><br>second line<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body><br><br><br><br>first line<br><br>second line<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body><br><br><br><br>first line<br><br>second line<br><br></body></html>',
expectedText: '\n\n\n\nfirst line\n\nsecond line\n\n' wantText: '\n\n\n\nfirst line\n\nsecond line\n\n',
}, },
multiLineParagraph:{ 'multiLineParagraph': {
description: "A paragraph with multiple lines should not loose spaces when lines are combined", description: 'A paragraph with multiple lines should not loose spaces when lines are combined',
input:`<html><body> input: `<html><body>
<p> <p>
а б в г ґ д е є ж з и і ї й к л м н о а б в г ґ д е є ж з и і ї й к л м н о
п р с т у ф х ц ч ш щ ю я ь п р с т у ф х ц ч ш щ ю я ь
</p> </p>
</body></html>`, </body></html>`,
expectedHTML: '<!DOCTYPE HTML><html><body>&#1072; &#1073; &#1074; &#1075; &#1169; &#1076; &#1077; &#1108; &#1078; &#1079; &#1080; &#1110; &#1111; &#1081; &#1082; &#1083; &#1084; &#1085; &#1086; &#1087; &#1088; &#1089; &#1090; &#1091; &#1092; &#1093; &#1094; &#1095; &#1096; &#1097; &#1102; &#1103; &#1100;<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>&#1072; &#1073; &#1074; &#1075; &#1169; &#1076; &#1077; &#1108; &#1078; &#1079; &#1080; &#1110; &#1111; &#1081; &#1082; &#1083; &#1084; &#1085; &#1086; &#1087; &#1088; &#1089; &#1090; &#1091; &#1092; &#1093; &#1094; &#1095; &#1096; &#1097; &#1102; &#1103; &#1100;<br><br></body></html>',
expectedText: 'а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь\n\n' wantText: 'а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь\n\n',
}, },
multiLineParagraphWithPre:{ 'multiLineParagraphWithPre': {
//XXX why is there &nbsp; before "in"? // XXX why is there &nbsp; before "in"?
description: "lines in preformatted text should be kept intact", description: 'lines in preformatted text should be kept intact',
input:`<html><body> input: `<html><body>
<p> <p>
а б в г ґ д е є ж з и і ї й к л м н о<pre>multiple а б в г ґ д е є ж з и і ї й к л м н о<pre>multiple
lines lines
@ -190,55 +187,55 @@ const testImports = {
</pre></p><p>п р с т у ф х ц ч ш щ ю я </pre></p><p>п р с т у ф х ц ч ш щ ю я
ь</p> ь</p>
</body></html>`, </body></html>`,
expectedHTML: '<!DOCTYPE HTML><html><body>&#1072; &#1073; &#1074; &#1075; &#1169; &#1076; &#1077; &#1108; &#1078; &#1079; &#1080; &#1110; &#1111; &#1081; &#1082; &#1083; &#1084; &#1085; &#1086;<br>multiple<br>&nbsp;&nbsp; lines<br>&nbsp;in<br>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; pre<br><br>&#1087; &#1088; &#1089; &#1090; &#1091; &#1092; &#1093; &#1094; &#1095; &#1096; &#1097; &#1102; &#1103; &#1100;<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>&#1072; &#1073; &#1074; &#1075; &#1169; &#1076; &#1077; &#1108; &#1078; &#1079; &#1080; &#1110; &#1111; &#1081; &#1082; &#1083; &#1084; &#1085; &#1086;<br>multiple<br>&nbsp;&nbsp; lines<br>&nbsp;in<br>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp; pre<br><br>&#1087; &#1088; &#1089; &#1090; &#1091; &#1092; &#1093; &#1094; &#1095; &#1096; &#1097; &#1102; &#1103; &#1100;<br><br></body></html>',
expectedText: 'а б в г ґ д е є ж з и і ї й к л м н о\nmultiple\n lines\n in\n pre\n\nп р с т у ф х ц ч ш щ ю я ь\n\n' wantText: 'а б в г ґ д е є ж з и і ї й к л м н о\nmultiple\n lines\n in\n pre\n\nп р с т у ф х ц ч ш щ ю я ь\n\n',
}, },
preIntroducesASpace: { 'preIntroducesASpace': {
description: "pre should be on a new line not preceeded by a space", description: 'pre should be on a new line not preceeded by a space',
input:`<html><body><p> input: `<html><body><p>
1 1
<pre>preline <pre>preline
</pre></p></body></html>`, </pre></p></body></html>`,
expectedHTML: '<!DOCTYPE HTML><html><body>1<br>preline<br><br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>1<br>preline<br><br><br></body></html>',
expectedText: '1\npreline\n\n\n' wantText: '1\npreline\n\n\n',
}, },
dontDeleteSpaceInsideElements: { 'dontDeleteSpaceInsideElements': {
description: 'Preserve spaces inside elements', description: 'Preserve spaces inside elements',
input: '<html><body>Need<span> more </span>space<i> s </i>!<br></body></html>', input: '<html><body>Need<span> more </span>space<i> s </i>!<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s </em>!<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s </em>!<br><br></body></html>',
expectedText: 'Need more space s !\n\n' wantText: 'Need more space s !\n\n',
}, },
dontDeleteSpaceOutsideElements: { 'dontDeleteSpaceOutsideElements': {
description: 'Preserve spaces outside elements', description: 'Preserve spaces outside elements',
input: '<html><body>Need <span>more</span> space <i>s</i> !<br></body></html>', input: '<html><body>Need <span>more</span> space <i>s</i> !<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s</em> !<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s</em> !<br><br></body></html>',
expectedText: 'Need more space s !\n\n' wantText: 'Need more space s !\n\n',
}, },
dontDeleteSpaceAtEndOfElement: { 'dontDeleteSpaceAtEndOfElement': {
description: 'Preserve spaces at the end of an element', description: 'Preserve spaces at the end of an element',
input: '<html><body>Need <span>more </span>space <i>s </i>!<br></body></html>', input: '<html><body>Need <span>more </span>space <i>s </i>!<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s </em>!<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s </em>!<br><br></body></html>',
expectedText: 'Need more space s !\n\n' wantText: 'Need more space s !\n\n',
}, },
dontDeleteSpaceAtBeginOfElements: { 'dontDeleteSpaceAtBeginOfElements': {
description: 'Preserve spaces at the start of an element', description: 'Preserve spaces at the start of an element',
input: '<html><body>Need<span> more</span> space<i> s</i> !<br></body></html>', input: '<html><body>Need<span> more</span> space<i> s</i> !<br></body></html>',
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s</em> !<br><br></body></html>', wantHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s</em> !<br><br></body></html>',
expectedText: 'Need more space s !\n\n' wantText: 'Need more space s !\n\n',
}, },
}; };
describe(__filename, function () { describe(__filename, function () {
Object.keys(testImports).forEach((testName) => { Object.keys(testImports).forEach((testName) => {
const testPadId = makeid(); describe(testName, function () {
const test = testImports[testName]; const testPadId = makeid();
if (test.disabled) { const test = testImports[testName];
return xit(`DISABLED: ${testName}`, function (done) { if (test.disabled) {
done(); return xit(`DISABLED: ${testName}`, function (done) {
}); done();
} });
describe(`createPad ${testName}`, function () { }
it('creates a new Pad', function (done) { it('createPad', function (done) {
api.get(`${endPoint('createPad')}&padID=${testPadId}`) api.get(`${endPoint('createPad')}&padID=${testPadId}`)
.expect((res) => { .expect((res) => {
if (res.body.code !== 0) throw new Error('Unable to create new Pad'); if (res.body.code !== 0) throw new Error('Unable to create new Pad');
@ -246,10 +243,8 @@ describe(__filename, function () {
.expect('Content-Type', /json/) .expect('Content-Type', /json/)
.expect(200, done); .expect(200, done);
}); });
});
describe(`setHTML ${testName}`, function () { it('setHTML', function (done) {
it('Sets the HTML', function (done) {
api.get(`${endPoint('setHTML')}&padID=${testPadId}&html=${encodeURIComponent(test.input)}`) api.get(`${endPoint('setHTML')}&padID=${testPadId}&html=${encodeURIComponent(test.input)}`)
.expect((res) => { .expect((res) => {
if (res.body.code !== 0) throw new Error(`Error:${testName}`); if (res.body.code !== 0) throw new Error(`Error:${testName}`);
@ -257,23 +252,21 @@ describe(__filename, function () {
.expect('Content-Type', /json/) .expect('Content-Type', /json/)
.expect(200, done); .expect(200, done);
}); });
});
describe(`getHTML ${testName}`, function () { it('getHTML', function (done) {
it('Gets back the HTML of a Pad', function (done) {
api.get(`${endPoint('getHTML')}&padID=${testPadId}`) api.get(`${endPoint('getHTML')}&padID=${testPadId}`)
.expect((res) => { .expect((res) => {
const receivedHtml = res.body.data.html; const gotHtml = res.body.data.html;
if (receivedHtml !== test.expectedHTML) { if (gotHtml !== test.wantHTML) {
throw new Error(`HTML received from export is not the one we were expecting. throw new Error(`HTML received from export is not the one we were expecting.
Test Name: Test Name:
${testName} ${testName}
Received: Got:
${JSON.stringify(receivedHtml)} ${JSON.stringify(gotHtml)}
Expected: Want:
${JSON.stringify(test.expectedHTML)} ${JSON.stringify(test.wantHTML)}
Which is a different version of the originally imported one: Which is a different version of the originally imported one:
${test.input}`); ${test.input}`);
@ -282,23 +275,21 @@ describe(__filename, function () {
.expect('Content-Type', /json/) .expect('Content-Type', /json/)
.expect(200, done); .expect(200, done);
}); });
});
describe(`getText ${testName}`, function () { it('getText', function (done) {
it('Gets back the Text of a Pad', function (done) {
api.get(`${endPoint('getText')}&padID=${testPadId}`) api.get(`${endPoint('getText')}&padID=${testPadId}`)
.expect((res) => { .expect((res) => {
const receivedText = res.body.data.text; const gotText = res.body.data.text;
if (receivedText !== test.expectedText) { if (gotText !== test.wantText) {
throw new Error(`Text received from export is not the one we were expecting. throw new Error(`Text received from export is not the one we were expecting.
Test Name: Test Name:
${testName} ${testName}
Received: Got:
${JSON.stringify(receivedText)} ${JSON.stringify(gotText)}
Expected: Want:
${JSON.stringify(test.expectedText)} ${JSON.stringify(test.wantText)}
Which is a different version of the originally imported one: Which is a different version of the originally imported one:
${test.input}`); ${test.input}`);
@ -315,7 +306,7 @@ describe(__filename, function () {
function endPoint(point, version) { function endPoint(point, version) {
version = version || apiVersion; version = version || apiVersion;
return `/api/${version}/${point}?apikey=${apiKey}`; return `/api/${version}/${point}?apikey=${apiKey}`;
}; }
function makeid() { function makeid() {
let text = ''; let text = '';

View file

@ -1,34 +1,34 @@
'use strict'; 'use strict';
/* eslint-disable max-len */
/* /*
* While importexport tests target the `setHTML` API endpoint, which is nearly identical to what happens * While importexport tests target the `setHTML` API endpoint, which is nearly identical to what
* when a user manually imports a document via the UI, the contentcollector tests here don't use rehype to process * happens when a user manually imports a document via the UI, the contentcollector tests here don't
* the document. Rehype removes spaces and newĺines were applicable, so the expected results here can * use rehype to process the document. Rehype removes spaces and newĺines were applicable, so the
* differ from importexport.js. * expected results here can differ from importexport.js.
* *
* If you add tests here, please also add them to importexport.js * If you add tests here, please also add them to importexport.js
*/ */
const contentcollector = require('../../../src/static/js/contentcollector'); const AttributePool = require('ep_etherpad-lite/static/js/AttributePool');
const AttributePool = require('../../../src/static/js/AttributePool'); const assert = require('assert').strict;
const cheerio = require('../../../src/node_modules/cheerio'); const cheerio = require('ep_etherpad-lite/node_modules/cheerio');
const contentcollector = require('ep_etherpad-lite/static/js/contentcollector');
const tests = { const tests = {
nestedLi: { nestedLi: {
description: 'Complex nested Li', description: 'Complex nested Li',
html: '<!doctype html><html><body><ol><li>one</li><li><ol><li>1.1</li></ol></li><li>two</li></ol></body></html>', html: '<!doctype html><html><body><ol><li>one</li><li><ol><li>1.1</li></ol></li><li>two</li></ol></body></html>',
expectedLineAttribs: [ wantLineAttribs: [
'*0*1*2*3+1+3', '*0*4*2*5+1+3', '*0*1*2*5+1+3', '*0*1*2*3+1+3', '*0*4*2*5+1+3', '*0*1*2*5+1+3',
], ],
expectedText: [ wantText: [
'*one', '*1.1', '*two', '*one', '*1.1', '*two',
], ],
}, },
complexNest: { complexNest: {
description: 'Complex list of different types', description: 'Complex list of different types',
html: '<!doctype html><html><body><ul class="bullet"><li>one</li><li>two</li><li>0</li><li>1</li><li>2<ul class="bullet"><li>3</li><li>4</li></ul></li></ul><ol class="number"><li>item<ol class="number"><li>item1</li><li>item2</li></ol></li></ol></body></html>', html: '<!doctype html><html><body><ul class="bullet"><li>one</li><li>two</li><li>0</li><li>1</li><li>2<ul class="bullet"><li>3</li><li>4</li></ul></li></ul><ol class="number"><li>item<ol class="number"><li>item1</li><li>item2</li></ol></li></ol></body></html>',
expectedLineAttribs: [ wantLineAttribs: [
'*0*1*2+1+3', '*0*1*2+1+3',
'*0*1*2+1+3', '*0*1*2+1+3',
'*0*1*2+1+1', '*0*1*2+1+1',
@ -40,7 +40,7 @@ const tests = {
'*0*6*2*7+1+5', '*0*6*2*7+1+5',
'*0*6*2*7+1+5', '*0*6*2*7+1+5',
], ],
expectedText: [ wantText: [
'*one', '*one',
'*two', '*two',
'*0', '*0',
@ -56,148 +56,142 @@ const tests = {
ul: { ul: {
description: 'Tests if uls properly get attributes', description: 'Tests if uls properly get attributes',
html: '<html><body><ul><li>a</li><li>b</li></ul><div>div</div><p>foo</p></body></html>', html: '<html><body><ul><li>a</li><li>b</li></ul><div>div</div><p>foo</p></body></html>',
expectedLineAttribs: ['*0*1*2+1+1', '*0*1*2+1+1', '+3', '+3'], wantLineAttribs: ['*0*1*2+1+1', '*0*1*2+1+1', '+3', '+3'],
expectedText: ['*a', '*b', 'div', 'foo'], wantText: ['*a', '*b', 'div', 'foo'],
}, },
ulIndented: { ulIndented: {
description: 'Tests if indented uls properly get attributes', description: 'Tests if indented uls properly get attributes',
html: '<html><body><ul><li>a</li><ul><li>b</li></ul><li>a</li></ul><p>foo</p></body></html>', html: '<html><body><ul><li>a</li><ul><li>b</li></ul><li>a</li></ul><p>foo</p></body></html>',
expectedLineAttribs: ['*0*1*2+1+1', '*0*3*2+1+1', '*0*1*2+1+1', '+3'], wantLineAttribs: ['*0*1*2+1+1', '*0*3*2+1+1', '*0*1*2+1+1', '+3'],
expectedText: ['*a', '*b', '*a', 'foo'], wantText: ['*a', '*b', '*a', 'foo'],
}, },
ol: { ol: {
description: 'Tests if ols properly get line numbers when in a normal OL', description: 'Tests if ols properly get line numbers when in a normal OL',
html: '<html><body><ol><li>a</li><li>b</li><li>c</li></ol><p>test</p></body></html>', html: '<html><body><ol><li>a</li><li>b</li><li>c</li></ol><p>test</p></body></html>',
expectedLineAttribs: ['*0*1*2*3+1+1', '*0*1*2*3+1+1', '*0*1*2*3+1+1', '+4'], wantLineAttribs: ['*0*1*2*3+1+1', '*0*1*2*3+1+1', '*0*1*2*3+1+1', '+4'],
expectedText: ['*a', '*b', '*c', 'test'], wantText: ['*a', '*b', '*c', 'test'],
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?', noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
}, },
lineDoBreakInOl: { lineDoBreakInOl: {
description: 'A single completely empty line break within an ol should reset count if OL is closed off..', description: 'A single completely empty line break within an ol should reset count if OL is closed off..',
html: '<html><body><ol><li>should be 1</li></ol><p>hello</p><ol><li>should be 1</li><li>should be 2</li></ol><p></p></body></html>', html: '<html><body><ol><li>should be 1</li></ol><p>hello</p><ol><li>should be 1</li><li>should be 2</li></ol><p></p></body></html>',
expectedLineAttribs: ['*0*1*2*3+1+b', '+5', '*0*1*2*4+1+b', '*0*1*2*4+1+b', ''], wantLineAttribs: ['*0*1*2*3+1+b', '+5', '*0*1*2*4+1+b', '*0*1*2*4+1+b', ''],
expectedText: ['*should be 1', 'hello', '*should be 1', '*should be 2', ''], wantText: ['*should be 1', 'hello', '*should be 1', '*should be 2', ''],
noteToSelf: "Shouldn't include attribute marker in the <p> line", noteToSelf: "Shouldn't include attribute marker in the <p> line",
}, },
bulletListInOL: {
description: 'A bullet within an OL should not change numbering..',
html: '<html><body><ol><li>should be 1</li><ul><li>should be a bullet</li></ul><li>should be 2</li></ol><p></p></body></html>',
expectedLineAttribs: ['*0*1*2*3+1+b', '*0*4*2*3+1+i', '*0*1*2*5+1+b', ''],
expectedText: ['*should be 1', '*should be a bullet', '*should be 2', ''],
},
testP: { testP: {
description: 'A single <p></p> should create a new line', description: 'A single <p></p> should create a new line',
html: '<html><body><p></p><p></p></body></html>', html: '<html><body><p></p><p></p></body></html>',
expectedLineAttribs: ['', ''], wantLineAttribs: ['', ''],
expectedText: ['', ''], wantText: ['', ''],
noteToSelf: '<p></p>should create a line break but not break numbering', noteToSelf: '<p></p>should create a line break but not break numbering',
}, },
nestedOl: { nestedOl: {
description: 'Tests if ols properly get line numbers when in a normal OL', description: 'Tests if ols properly get line numbers when in a normal OL',
html: '<html><body>a<ol><li>b<ol><li>c</li></ol></ol>notlist<p>foo</p></body></html>', html: '<html><body>a<ol><li>b<ol><li>c</li></ol></ol>notlist<p>foo</p></body></html>',
expectedLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1', '+7', '+3'], wantLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1', '+7', '+3'],
expectedText: ['a', '*b', '*c', 'notlist', 'foo'], wantText: ['a', '*b', '*c', 'notlist', 'foo'],
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?', noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
}, },
nestedOl2: { nestedOl2: {
description: 'First item being an UL then subsequent being OL will fail', description: 'First item being an UL then subsequent being OL will fail',
html: '<html><body><ul><li>a<ol><li>b</li><li>c</li></ol></li></ul></body></html>', html: '<html><body><ul><li>a<ol><li>b</li><li>c</li></ol></li></ul></body></html>',
expectedLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1'], wantLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1'],
expectedText: ['a', '*b', '*c'], wantText: ['a', '*b', '*c'],
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?', noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
disabled: true, disabled: true,
}, },
lineDontBreakOL: { lineDontBreakOL: {
description: 'A single completely empty line break within an ol should NOT reset count', description: 'A single completely empty line break within an ol should NOT reset count',
html: '<html><body><ol><li>should be 1</li><p></p><li>should be 2</li><li>should be 3</li></ol><p></p></body></html>', html: '<html><body><ol><li>should be 1</li><p></p><li>should be 2</li><li>should be 3</li></ol><p></p></body></html>',
expectedLineAttribs: [], wantLineAttribs: [],
expectedText: ['*should be 1', '*should be 2', '*should be 3'], wantText: ['*should be 1', '*should be 2', '*should be 3'],
noteToSelf: "<p></p>should create a line break but not break numbering -- This is what I can't get working!", noteToSelf: "<p></p>should create a line break but not break numbering -- This is what I can't get working!",
disabled: true, disabled: true,
}, },
ignoreAnyTagsOutsideBody: { ignoreAnyTagsOutsideBody: {
description: 'Content outside body should be ignored', description: 'Content outside body should be ignored',
html: '<html><head><title>title</title><style></style></head><body>empty<br></body></html>', html: '<html><head><title>title</title><style></style></head><body>empty<br></body></html>',
expectedLineAttribs: ['+5'], wantLineAttribs: ['+5'],
expectedText: ['empty'], wantText: ['empty'],
}, },
lineWithMultipleSpaces: { lineWithMultipleSpaces: {
description: 'Multiple spaces should be preserved', description: 'Multiple spaces should be preserved',
html: '<html><body>Text with more than one space.<br></body></html>', html: '<html><body>Text with more than one space.<br></body></html>',
expectedLineAttribs: [ '+10' ], wantLineAttribs: ['+10'],
expectedText: ['Text with more than one space.'] wantText: ['Text with more than one space.'],
}, },
lineWithMultipleNonBreakingAndNormalSpaces: { lineWithMultipleNonBreakingAndNormalSpaces: {
description: 'non-breaking and normal space should be preserved', description: 'non-breaking and normal space should be preserved',
html: '<html><body>Text&nbsp;with&nbsp; more&nbsp;&nbsp;&nbsp;than &nbsp;one space.<br></body></html>', html: '<html><body>Text&nbsp;with&nbsp; more&nbsp;&nbsp;&nbsp;than &nbsp;one space.<br></body></html>',
expectedLineAttribs: [ '+10' ], wantLineAttribs: ['+10'],
expectedText: ['Text with more than one space.'] wantText: ['Text with more than one space.'],
}, },
multiplenbsp: { multiplenbsp: {
description: 'Multiple nbsp should be preserved', description: 'Multiple nbsp should be preserved',
html: '<html><body>&nbsp;&nbsp;<br></body></html>', html: '<html><body>&nbsp;&nbsp;<br></body></html>',
expectedLineAttribs: [ '+2' ], wantLineAttribs: ['+2'],
expectedText: [' '] wantText: [' '],
}, },
multipleNonBreakingSpaceBetweenWords: { multipleNonBreakingSpaceBetweenWords: {
description: 'Multiple nbsp between words ', description: 'Multiple nbsp between words ',
html: '<html><body>&nbsp;&nbsp;word1&nbsp;&nbsp;word2&nbsp;&nbsp;&nbsp;word3<br></body></html>', html: '<html><body>&nbsp;&nbsp;word1&nbsp;&nbsp;word2&nbsp;&nbsp;&nbsp;word3<br></body></html>',
expectedLineAttribs: [ '+m' ], wantLineAttribs: ['+m'],
expectedText: [' word1 word2 word3'] wantText: [' word1 word2 word3'],
}, },
nonBreakingSpacePreceededBySpaceBetweenWords: { nonBreakingSpacePreceededBySpaceBetweenWords: {
description: 'A non-breaking space preceeded by a normal space', description: 'A non-breaking space preceeded by a normal space',
html: '<html><body> &nbsp;word1 &nbsp;word2 &nbsp;word3<br></body></html>', html: '<html><body> &nbsp;word1 &nbsp;word2 &nbsp;word3<br></body></html>',
expectedLineAttribs: [ '+l' ], wantLineAttribs: ['+l'],
expectedText: [' word1 word2 word3'] wantText: [' word1 word2 word3'],
}, },
nonBreakingSpaceFollowededBySpaceBetweenWords: { nonBreakingSpaceFollowededBySpaceBetweenWords: {
description: 'A non-breaking space followed by a normal space', description: 'A non-breaking space followed by a normal space',
html: '<html><body>&nbsp; word1&nbsp; word2&nbsp; word3<br></body></html>', html: '<html><body>&nbsp; word1&nbsp; word2&nbsp; word3<br></body></html>',
expectedLineAttribs: [ '+l' ], wantLineAttribs: ['+l'],
expectedText: [' word1 word2 word3'] wantText: [' word1 word2 word3'],
}, },
spacesAfterNewline: { spacesAfterNewline: {
description: 'Don\'t collapse spaces that follow a newline', description: 'Don\'t collapse spaces that follow a newline',
html:'<!doctype html><html><body>something<br> something<br></body></html>', html: '<!doctype html><html><body>something<br> something<br></body></html>',
expectedLineAttribs: ['+9', '+m'], wantLineAttribs: ['+9', '+m'],
expectedText: ['something', ' something'] wantText: ['something', ' something'],
}, },
spacesAfterNewlineP: { spacesAfterNewlineP: {
description: 'Don\'t collapse spaces that follow a empty paragraph', description: 'Don\'t collapse spaces that follow a empty paragraph',
html:'<!doctype html><html><body>something<p></p> something<br></body></html>', html: '<!doctype html><html><body>something<p></p> something<br></body></html>',
expectedLineAttribs: ['+9', '', '+m'], wantLineAttribs: ['+9', '', '+m'],
expectedText: ['something', '', ' something'] wantText: ['something', '', ' something'],
}, },
spacesAtEndOfLine: { spacesAtEndOfLine: {
description: 'Don\'t collapse spaces that preceed/follow a newline', description: 'Don\'t collapse spaces that preceed/follow a newline',
html:'<html><body>something <br> something<br></body></html>', html: '<html><body>something <br> something<br></body></html>',
expectedLineAttribs: ['+l', '+m'], wantLineAttribs: ['+l', '+m'],
expectedText: ['something ', ' something'] wantText: ['something ', ' something'],
}, },
spacesAtEndOfLineP: { spacesAtEndOfLineP: {
description: 'Don\'t collapse spaces that preceed/follow a empty paragraph', description: 'Don\'t collapse spaces that preceed/follow a empty paragraph',
html:'<html><body>something <p></p> something<br></body></html>', html: '<html><body>something <p></p> something<br></body></html>',
expectedLineAttribs: ['+l', '', '+m'], wantLineAttribs: ['+l', '', '+m'],
expectedText: ['something ', '', ' something'] wantText: ['something ', '', ' something'],
}, },
nonBreakingSpacesAfterNewlines: { nonBreakingSpacesAfterNewlines: {
description: 'Don\'t collapse non-breaking spaces that follow a newline', description: 'Don\'t collapse non-breaking spaces that follow a newline',
html:'<html><body>something<br>&nbsp;&nbsp;&nbsp;something<br></body></html>', html: '<html><body>something<br>&nbsp;&nbsp;&nbsp;something<br></body></html>',
expectedLineAttribs: ['+9', '+c'], wantLineAttribs: ['+9', '+c'],
expectedText: ['something', ' something'] wantText: ['something', ' something'],
}, },
nonBreakingSpacesAfterNewlinesP: { nonBreakingSpacesAfterNewlinesP: {
description: 'Don\'t collapse non-breaking spaces that follow a paragraph', description: 'Don\'t collapse non-breaking spaces that follow a paragraph',
html:'<html><body>something<p></p>&nbsp;&nbsp;&nbsp;something<br></body></html>', html: '<html><body>something<p></p>&nbsp;&nbsp;&nbsp;something<br></body></html>',
expectedLineAttribs: ['+9', '', '+c'], wantLineAttribs: ['+9', '', '+c'],
expectedText: ['something', '', ' something'] wantText: ['something', '', ' something'],
}, },
preserveSpacesInsideElements: { preserveSpacesInsideElements: {
description: 'Preserve all spaces when multiple are present', description: 'Preserve all spaces when multiple are present',
html: '<html><body>Need <span> more </span> space<i> s </i> !<br></body></html>', html: '<html><body>Need <span> more </span> space<i> s </i> !<br></body></html>',
expectedLineAttribs: ['+h*0+4+2'], wantLineAttribs: ['+h*0+4+2'],
expectedText: ['Need more space s !'], wantText: ['Need more space s !'],
}, },
preserveSpacesAcrossNewlines: { preserveSpacesAcrossNewlines: {
description: 'Newlines and multiple spaces across newlines should be preserved', description: 'Newlines and multiple spaces across newlines should be preserved',
@ -207,69 +201,76 @@ const tests = {
space space
<i> s </i> <i> s </i>
!<br></body></html>`, !<br></body></html>`,
expectedLineAttribs: [ '+19*0+4+b' ], wantLineAttribs: ['+19*0+4+b'],
expectedText: [ 'Need more space s !' ] wantText: ['Need more space s !'],
}, },
multipleNewLinesAtBeginning: { multipleNewLinesAtBeginning: {
description: 'Multiple new lines at the beginning should be preserved', description: 'Multiple new lines at the beginning should be preserved',
html: '<html><body><br><br><p></p><p></p>first line<br><br>second line<br></body></html>', html: '<html><body><br><br><p></p><p></p>first line<br><br>second line<br></body></html>',
expectedLineAttribs: ['', '', '', '', '+a', '', '+b'], wantLineAttribs: ['', '', '', '', '+a', '', '+b'],
expectedText: [ '', '', '', '', 'first line', '', 'second line'] wantText: ['', '', '', '', 'first line', '', 'second line'],
}, },
multiLineParagraph:{ multiLineParagraph: {
description: "A paragraph with multiple lines should not loose spaces when lines are combined", description: 'A paragraph with multiple lines should not loose spaces when lines are combined',
html:`<html><body><p> html: `<html><body><p>
а б в г ґ д е є ж з и і ї й к л м н о а б в г ґ д е є ж з и і ї й к л м н о
п р с т у ф х ц ч ш щ ю я ь</p> п р с т у ф х ц ч ш щ ю я ь</p>
</body></html>`, </body></html>`,
expectedLineAttribs: [ '+1t' ], wantLineAttribs: ['+1t'],
expectedText: ["а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь"] wantText: ['а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь'],
}, },
multiLineParagraphWithPre:{ multiLineParagraphWithPre: {
description: "lines in preformatted text should be kept intact", description: 'lines in preformatted text should be kept intact',
html:`<html><body><p> html: `<html><body><p>
а б в г ґ д е є ж з и і ї й к л м н о<pre>multiple а б в г ґ д е є ж з и і ї й к л м н о</p><pre>multiple
lines lines
in in
pre pre
</pre></p><p>п р с т у ф х ц ч ш щ ю я </pre><p>п р с т у ф х ц ч ш щ ю я
ь</p> ь</p>
</body></html>`, </body></html>`,
expectedLineAttribs: [ '+11', '+8', '+5', '+2', '+3', '+r' ], wantLineAttribs: ['+11', '+8', '+5', '+2', '+3', '+r'],
expectedText: ['а б в г ґ д е є ж з и і ї й к л м н о', 'multiple', 'lines', 'in', 'pre', 'п р с т у ф х ц ч ш щ ю я ь'] wantText: [
'а б в г ґ д е є ж з и і ї й к л м н о',
'multiple',
'lines',
'in',
'pre',
'п р с т у ф х ц ч ш щ ю я ь',
],
}, },
preIntroducesASpace: { preIntroducesASpace: {
description: "pre should be on a new line not preceeded by a space", description: 'pre should be on a new line not preceeded by a space',
html:`<html><body><p> html: `<html><body><p>
1 1
<pre>preline </p><pre>preline
</pre></p></body></html>`, </pre></body></html>`,
expectedLineAttribs: [ '+6', '+7' ], wantLineAttribs: ['+6', '+7'],
expectedText: [' 1 ', 'preline'] wantText: [' 1 ', 'preline'],
}, },
dontDeleteSpaceInsideElements: { dontDeleteSpaceInsideElements: {
description: 'Preserve spaces on the beginning and end of a element', description: 'Preserve spaces on the beginning and end of a element',
html: '<html><body>Need<span> more </span>space<i> s </i>!<br></body></html>', html: '<html><body>Need<span> more </span>space<i> s </i>!<br></body></html>',
expectedLineAttribs: ['+f*0+3+1'], wantLineAttribs: ['+f*0+3+1'],
expectedText: ['Need more space s !'] wantText: ['Need more space s !'],
}, },
dontDeleteSpaceOutsideElements: { dontDeleteSpaceOutsideElements: {
description: 'Preserve spaces outside elements', description: 'Preserve spaces outside elements',
html: '<html><body>Need <span>more</span> space <i>s</i> !<br></body></html>', html: '<html><body>Need <span>more</span> space <i>s</i> !<br></body></html>',
expectedLineAttribs: ['+g*0+1+2'], wantLineAttribs: ['+g*0+1+2'],
expectedText: ['Need more space s !'] wantText: ['Need more space s !'],
}, },
dontDeleteSpaceAtEndOfElement: { dontDeleteSpaceAtEndOfElement: {
description: 'Preserve spaces at the end of an element', description: 'Preserve spaces at the end of an element',
html: '<html><body>Need <span>more </span>space <i>s </i>!<br></body></html>', html: '<html><body>Need <span>more </span>space <i>s </i>!<br></body></html>',
expectedLineAttribs: ['+g*0+2+1'], wantLineAttribs: ['+g*0+2+1'],
expectedText: ['Need more space s !'] wantText: ['Need more space s !'],
}, },
dontDeleteSpaceAtBeginOfElements: { dontDeleteSpaceAtBeginOfElements: {
description: 'Preserve spaces at the start of an element', description: 'Preserve spaces at the start of an element',
html: '<html><body>Need<span> more</span> space<i> s</i> !<br></body></html>', html: '<html><body>Need<span> more</span> space<i> s</i> !<br></body></html>',
expectedLineAttribs: ['+f*0+2+2'], wantLineAttribs: ['+f*0+2+2'],
expectedText: ['Need more space s !'] wantText: ['Need more space s !'],
}, },
}; };
@ -283,7 +284,7 @@ describe(__filename, function () {
}); });
} }
it(testObj.description, function (done) { it(testObj.description, async function () {
const $ = cheerio.load(testObj.html); // Load HTML into Cheerio const $ = cheerio.load(testObj.html); // Load HTML into Cheerio
const doc = $('body')[0]; // Creates a dom-like representation of HTML const doc = $('body')[0]; // Creates a dom-like representation of HTML
// Create an empty attribute pool // Create an empty attribute pool
@ -293,29 +294,13 @@ describe(__filename, function () {
const cc = contentcollector.makeContentCollector(true, null, apool); const cc = contentcollector.makeContentCollector(true, null, apool);
cc.collectContent(doc); cc.collectContent(doc);
const result = cc.finish(); const result = cc.finish();
const recievedAttributes = result.lineAttribs; const gotAttributes = result.lineAttribs;
const expectedAttributes = testObj.expectedLineAttribs; const wantAttributes = testObj.wantLineAttribs;
const recievedText = new Array(result.lines); const gotText = new Array(result.lines);
const expectedText = testObj.expectedText; const wantText = testObj.wantText;
// Check recieved text matches the expected text assert.deepEqual(gotText[0], wantText);
if (arraysEqual(recievedText[0], expectedText)) { assert.deepEqual(gotAttributes, wantAttributes);
// console.log("PASS: Recieved Text did match Expected Text\nRecieved:", recievedText[0], "\nExpected:", testObj.expectedText)
} else {
console.error('FAIL: Recieved Text did not match Expected Text\nRecieved:', recievedText[0], '\nExpected:', testObj.expectedText);
throw new Error();
}
// Check recieved attributes matches the expected attributes
if (arraysEqual(recievedAttributes, expectedAttributes)) {
// console.log("PASS: Recieved Attributes matched Expected Attributes");
done();
} else {
console.error('FAIL', test, testObj.description);
console.error('FAIL: Recieved Attributes did not match Expected Attributes\nRecieved: ', recievedAttributes, '\nExpected: ', expectedAttributes);
console.error('FAILING HTML', testObj.html);
throw new Error();
}
}); });
}); });
} }
@ -325,7 +310,7 @@ describe(__filename, function () {
function arraysEqual(a, b) { function arraysEqual(a, b) {
if (a === b) return true; if (a === b) return true;
if (a == null || b == null) return false; if (a == null || b == null) return false;
if (a.length != b.length) return false; if (a.length !== b.length) return false;
// If you don't care about the order of the elements inside // If you don't care about the order of the elements inside
// the array, you should sort both arrays here. // the array, you should sort both arrays here.