mirror of
https://github.com/ether/etherpad-lite.git
synced 2025-04-25 18:06:15 -04:00
Merge branch 'develop' of github.com:ether/etherpad-lite into mochawesome
This commit is contained in:
commit
7696ec0a02
7 changed files with 333 additions and 356 deletions
|
@ -421,7 +421,20 @@ Things in context:
|
||||||
4. text - the text for that line
|
4. text - the text for that line
|
||||||
|
|
||||||
This hook allows you to validate/manipulate the text before it's sent to the
|
This hook allows you to validate/manipulate the text before it's sent to the
|
||||||
server side. The return value should be the validated/manipulated text.
|
server side. To change the text, either:
|
||||||
|
|
||||||
|
* Set the `text` context property to the desired value and return `undefined`.
|
||||||
|
* (Deprecated) Return a string. If a hook function changes the `text` context
|
||||||
|
property, the return value is ignored. If no hook function changes `text` but
|
||||||
|
multiple hook functions return a string, the first one wins.
|
||||||
|
|
||||||
|
Example:
|
||||||
|
|
||||||
|
```
|
||||||
|
exports.collectContentLineText = (hookName, context) => {
|
||||||
|
context.text = tweakText(context.text);
|
||||||
|
};
|
||||||
|
```
|
||||||
|
|
||||||
## collectContentLineBreak
|
## collectContentLineBreak
|
||||||
|
|
||||||
|
|
|
@ -391,9 +391,9 @@ const defaultResponseRefs = {
|
||||||
|
|
||||||
// convert to a dictionary of operation objects
|
// convert to a dictionary of operation objects
|
||||||
const operations = {};
|
const operations = {};
|
||||||
for (const resource in resources) {
|
for (const [resource, actions] of Object.entries(resources)) {
|
||||||
for (const action in resources[resource]) {
|
for (const [action, spec] of Object.entries(actions)) {
|
||||||
const {operationId, responseSchema, ...operation} = resources[resource][action];
|
const {operationId, responseSchema, ...operation} = spec;
|
||||||
|
|
||||||
// add response objects
|
// add response objects
|
||||||
const responses = {...defaultResponseRefs};
|
const responses = {...defaultResponseRefs};
|
||||||
|
@ -623,7 +623,7 @@ exports.expressCreateServer = (hookName, args, cb) => {
|
||||||
} else {
|
} else {
|
||||||
// an unknown error happened
|
// an unknown error happened
|
||||||
// log it and throw internal error
|
// log it and throw internal error
|
||||||
apiLogger.error(err);
|
apiLogger.error(err.stack || err.toString());
|
||||||
throw new createHTTPError.InternalError('internal error');
|
throw new createHTTPError.InternalError('internal error');
|
||||||
}
|
}
|
||||||
});
|
});
|
||||||
|
|
|
@ -1139,7 +1139,7 @@ function Ace2Inner() {
|
||||||
|
|
||||||
lastDirtyNode = (lastDirtyNode && isNodeDirty(lastDirtyNode) && lastDirtyNode);
|
lastDirtyNode = (lastDirtyNode && isNodeDirty(lastDirtyNode) && lastDirtyNode);
|
||||||
if (firstDirtyNode && lastDirtyNode) {
|
if (firstDirtyNode && lastDirtyNode) {
|
||||||
const cc = makeContentCollector(isStyled, browser, rep.apool, null, className2Author);
|
const cc = makeContentCollector(isStyled, browser, rep.apool, className2Author);
|
||||||
cc.notifySelection(selection);
|
cc.notifySelection(selection);
|
||||||
const dirtyNodes = [];
|
const dirtyNodes = [];
|
||||||
for (let n = firstDirtyNode; n &&
|
for (let n = firstDirtyNode; n &&
|
||||||
|
|
|
@ -32,30 +32,31 @@ const hooks = require('./pluginfw/hooks');
|
||||||
|
|
||||||
const sanitizeUnicode = (s) => UNorm.nfc(s);
|
const sanitizeUnicode = (s) => UNorm.nfc(s);
|
||||||
|
|
||||||
const makeContentCollector = (collectStyles, abrowser, apool, domInterface, className2Author) => {
|
// This file is used both in browsers and with cheerio in Node.js (for importing HTML). Cheerio's
|
||||||
const dom = domInterface || {
|
// Node-like objects are not 100% API compatible with the DOM specification; the following functions
|
||||||
isNodeText: (n) => n.nodeType === 3,
|
// abstract away the differences.
|
||||||
nodeTagName: (n) => n.tagName,
|
|
||||||
nodeValue: (n) => n.nodeValue,
|
|
||||||
nodeNumChildren: (n) => {
|
|
||||||
if (n.childNodes == null) return 0;
|
|
||||||
return n.childNodes.length;
|
|
||||||
},
|
|
||||||
nodeChild: (n, i) => {
|
|
||||||
if (n.childNodes.item == null) {
|
|
||||||
return n.childNodes[i];
|
|
||||||
}
|
|
||||||
return n.childNodes.item(i);
|
|
||||||
},
|
|
||||||
nodeProp: (n, p) => n[p],
|
|
||||||
nodeAttr: (n, a) => {
|
|
||||||
if (n.getAttribute != null) return n.getAttribute(a);
|
|
||||||
if (n.attribs != null) return n.attribs[a];
|
|
||||||
return null;
|
|
||||||
},
|
|
||||||
optNodeInnerHTML: (n) => n.innerHTML,
|
|
||||||
};
|
|
||||||
|
|
||||||
|
// .nodeType works with DOM and cheerio 0.22.0, but cheerio 0.22.0 does not provide the Node.*_NODE
|
||||||
|
// constants so they cannot be used here.
|
||||||
|
const isElementNode = (n) => n.nodeType === 1; // Node.ELEMENT_NODE
|
||||||
|
const isTextNode = (n) => n.nodeType === 3; // Node.TEXT_NODE
|
||||||
|
// .tagName works with DOM and cheerio 0.22.0, but:
|
||||||
|
// * With DOM, .tagName is an uppercase string.
|
||||||
|
// * With cheerio 0.22.0, .tagName is a lowercase string.
|
||||||
|
// For consistency, this function always returns a lowercase string.
|
||||||
|
const tagName = (n) => n.tagName && n.tagName.toLowerCase();
|
||||||
|
// .childNodes works with DOM and cheerio 0.22.0, except in cheerio the .childNodes property does
|
||||||
|
// not exist on text nodes (and maybe other non-element nodes).
|
||||||
|
const childNodes = (n) => n.childNodes || [];
|
||||||
|
const getAttribute = (n, a) => {
|
||||||
|
// .getAttribute() works with DOM but not with cheerio 0.22.0.
|
||||||
|
if (n.getAttribute != null) return n.getAttribute(a);
|
||||||
|
// .attribs[] works with cheerio 0.22.0 but not with DOM.
|
||||||
|
if (n.attribs != null) return n.attribs[a];
|
||||||
|
return null;
|
||||||
|
};
|
||||||
|
|
||||||
|
const makeContentCollector = (collectStyles, abrowser, apool, className2Author) => {
|
||||||
const _blockElems = {
|
const _blockElems = {
|
||||||
div: 1,
|
div: 1,
|
||||||
p: 1,
|
p: 1,
|
||||||
|
@ -67,7 +68,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
_blockElems[element] = 1;
|
_blockElems[element] = 1;
|
||||||
});
|
});
|
||||||
|
|
||||||
const isBlockElement = (n) => !!_blockElems[(dom.nodeTagName(n) || '').toLowerCase()];
|
const isBlockElement = (n) => !!_blockElems[tagName(n) || ''];
|
||||||
|
|
||||||
const textify = (str) => sanitizeUnicode(
|
const textify = (str) => sanitizeUnicode(
|
||||||
str.replace(/(\n | \n)/g, ' ')
|
str.replace(/(\n | \n)/g, ' ')
|
||||||
|
@ -75,7 +76,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
.replace(/\xa0/g, ' ')
|
.replace(/\xa0/g, ' ')
|
||||||
.replace(/\t/g, ' '));
|
.replace(/\t/g, ' '));
|
||||||
|
|
||||||
const getAssoc = (node, name) => dom.nodeProp(node, `_magicdom_${name}`);
|
const getAssoc = (node, name) => node[`_magicdom_${name}`];
|
||||||
|
|
||||||
const lines = (() => {
|
const lines = (() => {
|
||||||
const textArray = [];
|
const textArray = [];
|
||||||
|
@ -123,13 +124,17 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
let selEnd = [-1, -1];
|
let selEnd = [-1, -1];
|
||||||
const _isEmpty = (node, state) => {
|
const _isEmpty = (node, state) => {
|
||||||
// consider clean blank lines pasted in IE to be empty
|
// consider clean blank lines pasted in IE to be empty
|
||||||
if (dom.nodeNumChildren(node) === 0) return true;
|
if (childNodes(node).length === 0) return true;
|
||||||
if (dom.nodeNumChildren(node) === 1 &&
|
if (childNodes(node).length === 1 &&
|
||||||
getAssoc(node, 'shouldBeEmpty') &&
|
getAssoc(node, 'shouldBeEmpty') &&
|
||||||
dom.optNodeInnerHTML(node) === ' ' &&
|
// Note: The .innerHTML property exists on DOM Element objects but not on cheerio's
|
||||||
|
// Element-like objects (cheerio v0.22.0) so this equality check will always be false.
|
||||||
|
// Cheerio's Element-like objects have no equivalent to .innerHTML. (Cheerio objects have an
|
||||||
|
// .html() method, but that isn't accessible here.)
|
||||||
|
node.innerHTML === ' ' &&
|
||||||
!getAssoc(node, 'unpasted')) {
|
!getAssoc(node, 'unpasted')) {
|
||||||
if (state) {
|
if (state) {
|
||||||
const child = dom.nodeChild(node, 0);
|
const child = childNodes(node)[0];
|
||||||
_reachPoint(child, 0, state);
|
_reachPoint(child, 0, state);
|
||||||
_reachPoint(child, 1, state);
|
_reachPoint(child, 1, state);
|
||||||
}
|
}
|
||||||
|
@ -149,7 +154,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
};
|
};
|
||||||
|
|
||||||
const _reachBlockPoint = (nd, idx, state) => {
|
const _reachBlockPoint = (nd, idx, state) => {
|
||||||
if (!dom.isNodeText(nd)) _reachPoint(nd, idx, state);
|
if (!isTextNode(nd)) _reachPoint(nd, idx, state);
|
||||||
};
|
};
|
||||||
|
|
||||||
const _reachPoint = (nd, idx, state) => {
|
const _reachPoint = (nd, idx, state) => {
|
||||||
|
@ -228,25 +233,24 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
|
|
||||||
const _recalcAttribString = (state) => {
|
const _recalcAttribString = (state) => {
|
||||||
const lst = [];
|
const lst = [];
|
||||||
for (const a in state.attribs) {
|
for (const [a, count] of Object.entries(state.attribs)) {
|
||||||
if (state.attribs[a]) {
|
if (!count) continue;
|
||||||
// The following splitting of the attribute name is a workaround
|
// The following splitting of the attribute name is a workaround
|
||||||
// to enable the content collector to store key-value attributes
|
// to enable the content collector to store key-value attributes
|
||||||
// see https://github.com/ether/etherpad-lite/issues/2567 for more information
|
// see https://github.com/ether/etherpad-lite/issues/2567 for more information
|
||||||
// in long term the contentcollector should be refactored to get rid of this workaround
|
// in long term the contentcollector should be refactored to get rid of this workaround
|
||||||
const ATTRIBUTE_SPLIT_STRING = '::';
|
const ATTRIBUTE_SPLIT_STRING = '::';
|
||||||
|
|
||||||
// see if attributeString is splittable
|
// see if attributeString is splittable
|
||||||
const attributeSplits = a.split(ATTRIBUTE_SPLIT_STRING);
|
const attributeSplits = a.split(ATTRIBUTE_SPLIT_STRING);
|
||||||
if (attributeSplits.length > 1) {
|
if (attributeSplits.length > 1) {
|
||||||
// the attribute name follows the convention key::value
|
// the attribute name follows the convention key::value
|
||||||
// so save it as a key value attribute
|
// so save it as a key value attribute
|
||||||
lst.push([attributeSplits[0], attributeSplits[1]]);
|
lst.push([attributeSplits[0], attributeSplits[1]]);
|
||||||
} else {
|
} else {
|
||||||
// the "normal" case, the attribute is just a switch
|
// the "normal" case, the attribute is just a switch
|
||||||
// so set it true
|
// so set it true
|
||||||
lst.push([a, 'true']);
|
lst.push([a, 'true']);
|
||||||
}
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if (state.authorLevel > 0) {
|
if (state.authorLevel > 0) {
|
||||||
|
@ -316,25 +320,15 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
const startLine = lines.length() - 1;
|
const startLine = lines.length() - 1;
|
||||||
_reachBlockPoint(node, 0, state);
|
_reachBlockPoint(node, 0, state);
|
||||||
|
|
||||||
if (dom.isNodeText(node)) {
|
if (isTextNode(node)) {
|
||||||
let txt = dom.nodeValue(node);
|
const tname = getAttribute(node.parentNode, 'name');
|
||||||
const tname = dom.nodeAttr(node.parentNode, 'name');
|
const context = {cc: this, state, tname, node, text: node.nodeValue};
|
||||||
|
// Hook functions may either return a string (deprecated) or modify context.text. If any hook
|
||||||
const txtFromHook = hooks.callAll('collectContentLineText', {
|
// function modifies context.text then all returned strings are ignored. If no hook functions
|
||||||
cc: this,
|
// modify context.text, the first hook function to return a string wins.
|
||||||
state,
|
const [hookTxt] =
|
||||||
tname,
|
hooks.callAll('collectContentLineText', context).filter((s) => typeof s === 'string');
|
||||||
node,
|
let txt = context.text === node.nodeValue && hookTxt != null ? hookTxt : context.text;
|
||||||
text: txt,
|
|
||||||
styl: null,
|
|
||||||
cls: null,
|
|
||||||
});
|
|
||||||
|
|
||||||
if (typeof (txtFromHook) === 'object') {
|
|
||||||
txt = dom.nodeValue(node);
|
|
||||||
} else if (txtFromHook) {
|
|
||||||
txt = txtFromHook;
|
|
||||||
}
|
|
||||||
|
|
||||||
let rest = '';
|
let rest = '';
|
||||||
let x = 0; // offset into original text
|
let x = 0; // offset into original text
|
||||||
|
@ -384,8 +378,8 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
cc.startNewLine(state);
|
cc.startNewLine(state);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
} else {
|
} else if (isElementNode(node)) {
|
||||||
const tname = (dom.nodeTagName(node) || '').toLowerCase();
|
const tname = tagName(node) || '';
|
||||||
|
|
||||||
if (tname === 'img') {
|
if (tname === 'img') {
|
||||||
hooks.callAll('collectContentImage', {
|
hooks.callAll('collectContentImage', {
|
||||||
|
@ -403,8 +397,8 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
|
|
||||||
if (tname === 'br') {
|
if (tname === 'br') {
|
||||||
this.breakLine = true;
|
this.breakLine = true;
|
||||||
const tvalue = dom.nodeAttr(node, 'value');
|
const tvalue = getAttribute(node, 'value');
|
||||||
const induceLineBreak = hooks.callAll('collectContentLineBreak', {
|
const [startNewLine = true] = hooks.callAll('collectContentLineBreak', {
|
||||||
cc: this,
|
cc: this,
|
||||||
state,
|
state,
|
||||||
tname,
|
tname,
|
||||||
|
@ -412,17 +406,14 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
styl: null,
|
styl: null,
|
||||||
cls: null,
|
cls: null,
|
||||||
});
|
});
|
||||||
const startNewLine = (
|
|
||||||
typeof (induceLineBreak) === 'object' &&
|
|
||||||
induceLineBreak.length === 0) ? true : induceLineBreak[0];
|
|
||||||
if (startNewLine) {
|
if (startNewLine) {
|
||||||
cc.startNewLine(state);
|
cc.startNewLine(state);
|
||||||
}
|
}
|
||||||
} else if (tname === 'script' || tname === 'style') {
|
} else if (tname === 'script' || tname === 'style') {
|
||||||
// ignore
|
// ignore
|
||||||
} else if (!isEmpty) {
|
} else if (!isEmpty) {
|
||||||
let styl = dom.nodeAttr(node, 'style');
|
let styl = getAttribute(node, 'style');
|
||||||
let cls = dom.nodeAttr(node, 'class');
|
let cls = getAttribute(node, 'class');
|
||||||
let isPre = (tname === 'pre');
|
let isPre = (tname === 'pre');
|
||||||
if ((!isPre) && abrowser && abrowser.safari) {
|
if ((!isPre) && abrowser && abrowser.safari) {
|
||||||
isPre = (styl && /\bwhite-space:\s*pre\b/i.exec(styl));
|
isPre = (styl && /\bwhite-space:\s*pre\b/i.exec(styl));
|
||||||
|
@ -469,26 +460,23 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
cc.doAttrib(state, 'strikethrough');
|
cc.doAttrib(state, 'strikethrough');
|
||||||
}
|
}
|
||||||
if (tname === 'ul' || tname === 'ol') {
|
if (tname === 'ul' || tname === 'ol') {
|
||||||
let type = node.attribs ? node.attribs.class : null;
|
let type = getAttribute(node, 'class');
|
||||||
const rr = cls && /(?:^| )list-([a-z]+[0-9]+)\b/.exec(cls);
|
const rr = cls && /(?:^| )list-([a-z]+[0-9]+)\b/.exec(cls);
|
||||||
// lists do not need to have a type, so before we make a wrong guess
|
// lists do not need to have a type, so before we make a wrong guess
|
||||||
// check if we find a better hint within the node's children
|
// check if we find a better hint within the node's children
|
||||||
if (!rr && !type) {
|
if (!rr && !type) {
|
||||||
for (const i in node.children) {
|
for (const child of childNodes(node)) {
|
||||||
if (node.children[i] && node.children[i].name === 'ul') {
|
if (tagName(child) !== 'ul') continue;
|
||||||
type = node.children[i].attribs.class;
|
type = getAttribute(child, 'class');
|
||||||
if (type) {
|
if (type) break;
|
||||||
break;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if (rr && rr[1]) {
|
if (rr && rr[1]) {
|
||||||
type = rr[1];
|
type = rr[1];
|
||||||
} else {
|
} else {
|
||||||
if (tname === 'ul') {
|
if (tname === 'ul') {
|
||||||
if ((type && type.match('indent')) ||
|
const cls = getAttribute(node, 'class');
|
||||||
(node.attribs && node.attribs.class && node.attribs.class.match('indent'))) {
|
if ((type && type.match('indent')) || (cls && cls.match('indent'))) {
|
||||||
type = 'indent';
|
type = 'indent';
|
||||||
} else {
|
} else {
|
||||||
type = 'bullet';
|
type = 'bullet';
|
||||||
|
@ -503,7 +491,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
// This has undesirable behavior in Chrome but is right in other browsers.
|
// This has undesirable behavior in Chrome but is right in other browsers.
|
||||||
// See https://github.com/ether/etherpad-lite/issues/2412 for reasoning
|
// See https://github.com/ether/etherpad-lite/issues/2412 for reasoning
|
||||||
if (!abrowser.chrome) oldListTypeOrNull = (_enterList(state, undefined) || 'none');
|
if (!abrowser.chrome) oldListTypeOrNull = (_enterList(state, undefined) || 'none');
|
||||||
} else if ((tname === 'li')) {
|
} else if (tname === 'li') {
|
||||||
state.lineAttributes.start = state.start || 0;
|
state.lineAttributes.start = state.start || 0;
|
||||||
_recalcAttribString(state);
|
_recalcAttribString(state);
|
||||||
if (state.lineAttributes.list.indexOf('number') !== -1) {
|
if (state.lineAttributes.list.indexOf('number') !== -1) {
|
||||||
|
@ -513,7 +501,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
Note how the <ol> item has to be inside a <li>
|
Note how the <ol> item has to be inside a <li>
|
||||||
Because of this we don't increment the start number
|
Because of this we don't increment the start number
|
||||||
*/
|
*/
|
||||||
if (node.parent && node.parent.name !== 'ol') {
|
if (node.parentNode && tagName(node.parentNode) !== 'ol') {
|
||||||
/*
|
/*
|
||||||
TODO: start number has to increment based on indentLevel(numberX)
|
TODO: start number has to increment based on indentLevel(numberX)
|
||||||
This means we have to build an object IE
|
This means we have to build an object IE
|
||||||
|
@ -530,7 +518,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
// UL list items never modify the start value.
|
// UL list items never modify the start value.
|
||||||
if (node.parent && node.parent.name === 'ul') {
|
if (node.parentNode && tagName(node.parentNode) === 'ul') {
|
||||||
state.start++;
|
state.start++;
|
||||||
// TODO, this is hacky.
|
// TODO, this is hacky.
|
||||||
// Because if the first item is an UL it will increment a list no?
|
// Because if the first item is an UL it will increment a list no?
|
||||||
|
@ -559,9 +547,7 @@ const makeContentCollector = (collectStyles, abrowser, apool, domInterface, clas
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
const nc = dom.nodeNumChildren(node);
|
for (const c of childNodes(node)) {
|
||||||
for (let i = 0; i < nc; i++) {
|
|
||||||
const c = dom.nodeChild(node, i);
|
|
||||||
cc.collectContent(c, state);
|
cc.collectContent(c, state);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -1,3 +1,5 @@
|
||||||
|
'use strict';
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* This file is copied & modified from <basedir>/tests/backend/specs/api/pad.js
|
* This file is copied & modified from <basedir>/tests/backend/specs/api/pad.js
|
||||||
*
|
*
|
||||||
|
|
|
@ -6,151 +6,148 @@
|
||||||
* TODO: unify those two files, and merge in a single one.
|
* TODO: unify those two files, and merge in a single one.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
/* eslint-disable max-len */
|
|
||||||
|
|
||||||
const common = require('../../common');
|
const common = require('../../common');
|
||||||
const supertest = require(`${__dirname}/../../../../src/node_modules/supertest`);
|
const settings = require('../../../container/loadSettings.js').loadSettings();
|
||||||
const settings = require(`${__dirname}/../../../../tests/container/loadSettings.js`).loadSettings();
|
const supertest = require('ep_etherpad-lite/node_modules/supertest');
|
||||||
const api = supertest(`http://${settings.ip}:${settings.port}`);
|
|
||||||
|
|
||||||
|
const api = supertest(`http://${settings.ip}:${settings.port}`);
|
||||||
const apiKey = common.apiKey;
|
const apiKey = common.apiKey;
|
||||||
const apiVersion = 1;
|
const apiVersion = 1;
|
||||||
|
|
||||||
const testImports = {
|
const testImports = {
|
||||||
'malformed': {
|
'malformed': {
|
||||||
input: '<html><body><li>wtf</ul></body></html>',
|
input: '<html><body><li>wtf</ul></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>wtf<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>wtf<br><br></body></html>',
|
||||||
expectedText: 'wtf\n\n',
|
wantText: 'wtf\n\n',
|
||||||
disabled: true,
|
disabled: true,
|
||||||
},
|
},
|
||||||
'nonelistiteminlist #3620': {
|
'nonelistiteminlist #3620': {
|
||||||
input: '<html><body><ul>test<li>FOO</li></ul></body></html>',
|
input: '<html><body><ul>test<li>FOO</li></ul></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body><ul class="bullet">test<li>FOO</ul><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body><ul class="bullet">test<li>FOO</ul><br></body></html>',
|
||||||
expectedText: '\ttest\n\t* FOO\n\n',
|
wantText: '\ttest\n\t* FOO\n\n',
|
||||||
disabled: true,
|
disabled: true,
|
||||||
},
|
},
|
||||||
'whitespaceinlist #3620': {
|
'whitespaceinlist #3620': {
|
||||||
input: '<html><body><ul> <li>FOO</li></ul></body></html>',
|
input: '<html><body><ul> <li>FOO</li></ul></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body><ul class="bullet"><li>FOO</ul><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body><ul class="bullet"><li>FOO</ul><br></body></html>',
|
||||||
expectedText: '\t* FOO\n\n',
|
wantText: '\t* FOO\n\n',
|
||||||
disabled: true,
|
|
||||||
},
|
},
|
||||||
'prefixcorrectlinenumber': {
|
'prefixcorrectlinenumber': {
|
||||||
input: '<html><body><ol><li>should be 1</li><li>should be 2</li></ol></body></html>',
|
input: '<html><body><ol><li>should be 1</li><li>should be 2</li></ol></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1</li><li>should be 2</ol><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1</li><li>should be 2</ol><br></body></html>',
|
||||||
expectedText: '\t1. should be 1\n\t2. should be 2\n\n',
|
wantText: '\t1. should be 1\n\t2. should be 2\n\n',
|
||||||
},
|
},
|
||||||
'prefixcorrectlinenumbernested': {
|
'prefixcorrectlinenumbernested': {
|
||||||
input: '<html><body><ol><li>should be 1</li><ol><li>foo</li></ol><li>should be 2</li></ol></body></html>',
|
input: '<html><body><ol><li>should be 1</li><ol><li>foo</li></ol><li>should be 2</li></ol></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1<ol start="2" class="number"><li>foo</ol><li>should be 2</ol><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1<ol start="2" class="number"><li>foo</ol><li>should be 2</ol><br></body></html>',
|
||||||
expectedText: '\t1. should be 1\n\t\t1.1. foo\n\t2. should be 2\n\n',
|
wantText: '\t1. should be 1\n\t\t1.1. foo\n\t2. should be 2\n\n',
|
||||||
},
|
},
|
||||||
|
|
||||||
/*
|
/*
|
||||||
"prefixcorrectlinenumber when introduced none list item - currently not supported see #3450":{
|
"prefixcorrectlinenumber when introduced none list item - currently not supported see #3450": {
|
||||||
input: '<html><body><ol><li>should be 1</li>test<li>should be 2</li></ol></body></html>',
|
input: '<html><body><ol><li>should be 1</li>test<li>should be 2</li></ol></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1</li>test<li>should be 2</li></ol><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body><ol start="1" class="number"><li>should be 1</li>test<li>should be 2</li></ol><br></body></html>',
|
||||||
expectedText: '\t1. should be 1\n\ttest\n\t2. should be 2\n\n'
|
wantText: '\t1. should be 1\n\ttest\n\t2. should be 2\n\n',
|
||||||
}
|
}
|
||||||
,
|
,
|
||||||
"newlinesshouldntresetlinenumber #2194":{
|
"newlinesshouldntresetlinenumber #2194": {
|
||||||
input: '<html><body><ol><li>should be 1</li>test<li>should be 2</li></ol></body></html>',
|
input: '<html><body><ol><li>should be 1</li>test<li>should be 2</li></ol></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body><ol class="number"><li>should be 1</li>test<li>should be 2</li></ol><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body><ol class="number"><li>should be 1</li>test<li>should be 2</li></ol><br></body></html>',
|
||||||
expectedText: '\t1. should be 1\n\ttest\n\t2. should be 2\n\n'
|
wantText: '\t1. should be 1\n\ttest\n\t2. should be 2\n\n',
|
||||||
}
|
}
|
||||||
*/
|
*/
|
||||||
'ignoreAnyTagsOutsideBody': {
|
'ignoreAnyTagsOutsideBody': {
|
||||||
description: 'Content outside body should be ignored',
|
description: 'Content outside body should be ignored',
|
||||||
input: '<html><head><title>title</title><style></style></head><body>empty<br></body></html>',
|
input: '<html><head><title>title</title><style></style></head><body>empty<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>empty<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>empty<br><br></body></html>',
|
||||||
expectedText: 'empty\n\n',
|
wantText: 'empty\n\n',
|
||||||
},
|
},
|
||||||
'indentedListsAreNotBullets': {
|
'indentedListsAreNotBullets': {
|
||||||
description: 'Indented lists are represented with tabs and without bullets',
|
description: 'Indented lists are represented with tabs and without bullets',
|
||||||
input: '<html><body><ul class="indent"><li>indent</li><li>indent</ul></body></html>',
|
input: '<html><body><ul class="indent"><li>indent</li><li>indent</ul></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body><ul class="indent"><li>indent</li><li>indent</ul><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body><ul class="indent"><li>indent</li><li>indent</ul><br></body></html>',
|
||||||
expectedText: '\tindent\n\tindent\n\n'
|
wantText: '\tindent\n\tindent\n\n',
|
||||||
},
|
},
|
||||||
lineWithMultipleSpaces: {
|
'lineWithMultipleSpaces': {
|
||||||
description: 'Multiple spaces should be collapsed',
|
description: 'Multiple spaces should be collapsed',
|
||||||
input: '<html><body>Text with more than one space.<br></body></html>',
|
input: '<html><body>Text with more than one space.<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>Text with more than one space.<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>Text with more than one space.<br><br></body></html>',
|
||||||
expectedText: 'Text with more than one space.\n\n'
|
wantText: 'Text with more than one space.\n\n',
|
||||||
},
|
},
|
||||||
lineWithMultipleNonBreakingAndNormalSpaces: {
|
'lineWithMultipleNonBreakingAndNormalSpaces': {
|
||||||
// XXX the HTML between "than" and "one" looks strange
|
// XXX the HTML between "than" and "one" looks strange
|
||||||
description: 'non-breaking space should be preserved, but can be replaced when it',
|
description: 'non-breaking space should be preserved, but can be replaced when it',
|
||||||
input: '<html><body>Text with more than one space.<br></body></html>',
|
input: '<html><body>Text with more than one space.<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>Text with more than one space.<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>Text with more than one space.<br><br></body></html>',
|
||||||
expectedText: 'Text with more than one space.\n\n'
|
wantText: 'Text with more than one space.\n\n',
|
||||||
},
|
},
|
||||||
multiplenbsp: {
|
'multiplenbsp': {
|
||||||
description: 'Multiple non-breaking space should be preserved',
|
description: 'Multiple non-breaking space should be preserved',
|
||||||
input: '<html><body> <br></body></html>',
|
input: '<html><body> <br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body> <br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body> <br><br></body></html>',
|
||||||
expectedText: ' \n\n'
|
wantText: ' \n\n',
|
||||||
},
|
},
|
||||||
multipleNonBreakingSpaceBetweenWords: {
|
'multipleNonBreakingSpaceBetweenWords': {
|
||||||
description: 'A normal space is always inserted before a word',
|
description: 'A normal space is always inserted before a word',
|
||||||
input: '<html><body> word1 word2 word3<br></body></html>',
|
input: '<html><body> word1 word2 word3<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body> word1 word2 word3<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body> word1 word2 word3<br><br></body></html>',
|
||||||
expectedText: ' word1 word2 word3\n\n'
|
wantText: ' word1 word2 word3\n\n',
|
||||||
},
|
},
|
||||||
nonBreakingSpacePreceededBySpaceBetweenWords: {
|
'nonBreakingSpacePreceededBySpaceBetweenWords': {
|
||||||
description: 'A non-breaking space preceeded by a normal space',
|
description: 'A non-breaking space preceeded by a normal space',
|
||||||
input: '<html><body> word1 word2 word3<br></body></html>',
|
input: '<html><body> word1 word2 word3<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body> word1 word2 word3<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body> word1 word2 word3<br><br></body></html>',
|
||||||
expectedText: ' word1 word2 word3\n\n'
|
wantText: ' word1 word2 word3\n\n',
|
||||||
},
|
},
|
||||||
nonBreakingSpaceFollowededBySpaceBetweenWords: {
|
'nonBreakingSpaceFollowededBySpaceBetweenWords': {
|
||||||
description: 'A non-breaking space followed by a normal space',
|
description: 'A non-breaking space followed by a normal space',
|
||||||
input: '<html><body> word1 word2 word3<br></body></html>',
|
input: '<html><body> word1 word2 word3<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body> word1 word2 word3<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body> word1 word2 word3<br><br></body></html>',
|
||||||
expectedText: ' word1 word2 word3\n\n'
|
wantText: ' word1 word2 word3\n\n',
|
||||||
},
|
},
|
||||||
spacesAfterNewline: {
|
'spacesAfterNewline': {
|
||||||
description: 'Collapse spaces that follow a newline',
|
description: 'Collapse spaces that follow a newline',
|
||||||
input:'<!doctype html><html><body>something<br> something<br></body></html>',
|
input: '<!doctype html><html><body>something<br> something<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>something<br>something<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>something<br>something<br><br></body></html>',
|
||||||
expectedText: 'something\nsomething\n\n'
|
wantText: 'something\nsomething\n\n',
|
||||||
},
|
},
|
||||||
spacesAfterNewlineP: {
|
'spacesAfterNewlineP': {
|
||||||
description: 'Collapse spaces that follow a paragraph',
|
description: 'Collapse spaces that follow a paragraph',
|
||||||
input:'<!doctype html><html><body>something<p></p> something<br></body></html>',
|
input: '<!doctype html><html><body>something<p></p> something<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>something<br><br>something<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>something<br><br>something<br><br></body></html>',
|
||||||
expectedText: 'something\n\nsomething\n\n'
|
wantText: 'something\n\nsomething\n\n',
|
||||||
},
|
},
|
||||||
spacesAtEndOfLine: {
|
'spacesAtEndOfLine': {
|
||||||
description: 'Collapse spaces that preceed/follow a newline',
|
description: 'Collapse spaces that preceed/follow a newline',
|
||||||
input:'<html><body>something <br> something<br></body></html>',
|
input: '<html><body>something <br> something<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>something<br>something<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>something<br>something<br><br></body></html>',
|
||||||
expectedText: 'something\nsomething\n\n'
|
wantText: 'something\nsomething\n\n',
|
||||||
},
|
},
|
||||||
spacesAtEndOfLineP: {
|
'spacesAtEndOfLineP': {
|
||||||
description: 'Collapse spaces that preceed/follow a paragraph',
|
description: 'Collapse spaces that preceed/follow a paragraph',
|
||||||
input:'<html><body>something <p></p> something<br></body></html>',
|
input: '<html><body>something <p></p> something<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>something<br><br>something<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>something<br><br>something<br><br></body></html>',
|
||||||
expectedText: 'something\n\nsomething\n\n'
|
wantText: 'something\n\nsomething\n\n',
|
||||||
},
|
},
|
||||||
nonBreakingSpacesAfterNewlines: {
|
'nonBreakingSpacesAfterNewlines': {
|
||||||
description: 'Don\'t collapse non-breaking spaces that follow a newline',
|
description: 'Don\'t collapse non-breaking spaces that follow a newline',
|
||||||
input:'<html><body>something<br> something<br></body></html>',
|
input: '<html><body>something<br> something<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>something<br> something<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>something<br> something<br><br></body></html>',
|
||||||
expectedText: 'something\n something\n\n'
|
wantText: 'something\n something\n\n',
|
||||||
},
|
},
|
||||||
nonBreakingSpacesAfterNewlinesP: {
|
'nonBreakingSpacesAfterNewlinesP': {
|
||||||
description: 'Don\'t collapse non-breaking spaces that follow a paragraph',
|
description: 'Don\'t collapse non-breaking spaces that follow a paragraph',
|
||||||
input:'<html><body>something<p></p> something<br></body></html>',
|
input: '<html><body>something<p></p> something<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>something<br><br> something<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>something<br><br> something<br><br></body></html>',
|
||||||
expectedText: 'something\n\n something\n\n'
|
wantText: 'something\n\n something\n\n',
|
||||||
},
|
},
|
||||||
collapseSpacesInsideElements: {
|
'collapseSpacesInsideElements': {
|
||||||
description: 'Preserve only one space when multiple are present',
|
description: 'Preserve only one space when multiple are present',
|
||||||
input: '<html><body>Need <span> more </span> space<i> s </i> !<br></body></html>',
|
input: '<html><body>Need <span> more </span> space<i> s </i> !<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s </em>!<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s </em>!<br><br></body></html>',
|
||||||
expectedText: 'Need more space s !\n\n'
|
wantText: 'Need more space s !\n\n',
|
||||||
},
|
},
|
||||||
collapseSpacesAcrossNewlines: {
|
'collapseSpacesAcrossNewlines': {
|
||||||
description: 'Newlines and multiple spaces across newlines should be collapsed',
|
description: 'Newlines and multiple spaces across newlines should be collapsed',
|
||||||
input: `
|
input: `
|
||||||
<html><body>Need
|
<html><body>Need
|
||||||
|
@ -158,30 +155,30 @@ const testImports = {
|
||||||
space
|
space
|
||||||
<i> s </i>
|
<i> s </i>
|
||||||
!<br></body></html>`,
|
!<br></body></html>`,
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s </em>!<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s </em>!<br><br></body></html>',
|
||||||
expectedText: 'Need more space s !\n\n'
|
wantText: 'Need more space s !\n\n',
|
||||||
},
|
},
|
||||||
multipleNewLinesAtBeginning: {
|
'multipleNewLinesAtBeginning': {
|
||||||
description: 'Multiple new lines and paragraphs at the beginning should be preserved',
|
description: 'Multiple new lines and paragraphs at the beginning should be preserved',
|
||||||
input: '<html><body><br><br><p></p><p></p>first line<br><br>second line<br></body></html>',
|
input: '<html><body><br><br><p></p><p></p>first line<br><br>second line<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body><br><br><br><br>first line<br><br>second line<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body><br><br><br><br>first line<br><br>second line<br><br></body></html>',
|
||||||
expectedText: '\n\n\n\nfirst line\n\nsecond line\n\n'
|
wantText: '\n\n\n\nfirst line\n\nsecond line\n\n',
|
||||||
},
|
},
|
||||||
multiLineParagraph:{
|
'multiLineParagraph': {
|
||||||
description: "A paragraph with multiple lines should not loose spaces when lines are combined",
|
description: 'A paragraph with multiple lines should not loose spaces when lines are combined',
|
||||||
input:`<html><body>
|
input: `<html><body>
|
||||||
<p>
|
<p>
|
||||||
а б в г ґ д е є ж з и і ї й к л м н о
|
а б в г ґ д е є ж з и і ї й к л м н о
|
||||||
п р с т у ф х ц ч ш щ ю я ь
|
п р с т у ф х ц ч ш щ ю я ь
|
||||||
</p>
|
</p>
|
||||||
</body></html>`,
|
</body></html>`,
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь<br><br></body></html>',
|
||||||
expectedText: 'а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь\n\n'
|
wantText: 'а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь\n\n',
|
||||||
},
|
},
|
||||||
multiLineParagraphWithPre:{
|
'multiLineParagraphWithPre': {
|
||||||
//XXX why is there before "in"?
|
// XXX why is there before "in"?
|
||||||
description: "lines in preformatted text should be kept intact",
|
description: 'lines in preformatted text should be kept intact',
|
||||||
input:`<html><body>
|
input: `<html><body>
|
||||||
<p>
|
<p>
|
||||||
а б в г ґ д е є ж з и і ї й к л м н о<pre>multiple
|
а б в г ґ д е є ж з и і ї й к л м н о<pre>multiple
|
||||||
lines
|
lines
|
||||||
|
@ -190,55 +187,55 @@ const testImports = {
|
||||||
</pre></p><p>п р с т у ф х ц ч ш щ ю я
|
</pre></p><p>п р с т у ф х ц ч ш щ ю я
|
||||||
ь</p>
|
ь</p>
|
||||||
</body></html>`,
|
</body></html>`,
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>а б в г ґ д е є ж з и і ї й к л м н о<br>multiple<br> lines<br> in<br> pre<br><br>п р с т у ф х ц ч ш щ ю я ь<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>а б в г ґ д е є ж з и і ї й к л м н о<br>multiple<br> lines<br> in<br> pre<br><br>п р с т у ф х ц ч ш щ ю я ь<br><br></body></html>',
|
||||||
expectedText: 'а б в г ґ д е є ж з и і ї й к л м н о\nmultiple\n lines\n in\n pre\n\nп р с т у ф х ц ч ш щ ю я ь\n\n'
|
wantText: 'а б в г ґ д е є ж з и і ї й к л м н о\nmultiple\n lines\n in\n pre\n\nп р с т у ф х ц ч ш щ ю я ь\n\n',
|
||||||
},
|
},
|
||||||
preIntroducesASpace: {
|
'preIntroducesASpace': {
|
||||||
description: "pre should be on a new line not preceeded by a space",
|
description: 'pre should be on a new line not preceeded by a space',
|
||||||
input:`<html><body><p>
|
input: `<html><body><p>
|
||||||
1
|
1
|
||||||
<pre>preline
|
<pre>preline
|
||||||
</pre></p></body></html>`,
|
</pre></p></body></html>`,
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>1<br>preline<br><br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>1<br>preline<br><br><br></body></html>',
|
||||||
expectedText: '1\npreline\n\n\n'
|
wantText: '1\npreline\n\n\n',
|
||||||
},
|
},
|
||||||
dontDeleteSpaceInsideElements: {
|
'dontDeleteSpaceInsideElements': {
|
||||||
description: 'Preserve spaces inside elements',
|
description: 'Preserve spaces inside elements',
|
||||||
input: '<html><body>Need<span> more </span>space<i> s </i>!<br></body></html>',
|
input: '<html><body>Need<span> more </span>space<i> s </i>!<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s </em>!<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s </em>!<br><br></body></html>',
|
||||||
expectedText: 'Need more space s !\n\n'
|
wantText: 'Need more space s !\n\n',
|
||||||
},
|
},
|
||||||
dontDeleteSpaceOutsideElements: {
|
'dontDeleteSpaceOutsideElements': {
|
||||||
description: 'Preserve spaces outside elements',
|
description: 'Preserve spaces outside elements',
|
||||||
input: '<html><body>Need <span>more</span> space <i>s</i> !<br></body></html>',
|
input: '<html><body>Need <span>more</span> space <i>s</i> !<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s</em> !<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s</em> !<br><br></body></html>',
|
||||||
expectedText: 'Need more space s !\n\n'
|
wantText: 'Need more space s !\n\n',
|
||||||
},
|
},
|
||||||
dontDeleteSpaceAtEndOfElement: {
|
'dontDeleteSpaceAtEndOfElement': {
|
||||||
description: 'Preserve spaces at the end of an element',
|
description: 'Preserve spaces at the end of an element',
|
||||||
input: '<html><body>Need <span>more </span>space <i>s </i>!<br></body></html>',
|
input: '<html><body>Need <span>more </span>space <i>s </i>!<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s </em>!<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>Need more space <em>s </em>!<br><br></body></html>',
|
||||||
expectedText: 'Need more space s !\n\n'
|
wantText: 'Need more space s !\n\n',
|
||||||
},
|
},
|
||||||
dontDeleteSpaceAtBeginOfElements: {
|
'dontDeleteSpaceAtBeginOfElements': {
|
||||||
description: 'Preserve spaces at the start of an element',
|
description: 'Preserve spaces at the start of an element',
|
||||||
input: '<html><body>Need<span> more</span> space<i> s</i> !<br></body></html>',
|
input: '<html><body>Need<span> more</span> space<i> s</i> !<br></body></html>',
|
||||||
expectedHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s</em> !<br><br></body></html>',
|
wantHTML: '<!DOCTYPE HTML><html><body>Need more space<em> s</em> !<br><br></body></html>',
|
||||||
expectedText: 'Need more space s !\n\n'
|
wantText: 'Need more space s !\n\n',
|
||||||
},
|
},
|
||||||
};
|
};
|
||||||
|
|
||||||
describe(__filename, function () {
|
describe(__filename, function () {
|
||||||
Object.keys(testImports).forEach((testName) => {
|
Object.keys(testImports).forEach((testName) => {
|
||||||
const testPadId = makeid();
|
describe(testName, function () {
|
||||||
const test = testImports[testName];
|
const testPadId = makeid();
|
||||||
if (test.disabled) {
|
const test = testImports[testName];
|
||||||
return xit(`DISABLED: ${testName}`, function (done) {
|
if (test.disabled) {
|
||||||
done();
|
return xit(`DISABLED: ${testName}`, function (done) {
|
||||||
});
|
done();
|
||||||
}
|
});
|
||||||
describe(`createPad ${testName}`, function () {
|
}
|
||||||
it('creates a new Pad', function (done) {
|
it('createPad', function (done) {
|
||||||
api.get(`${endPoint('createPad')}&padID=${testPadId}`)
|
api.get(`${endPoint('createPad')}&padID=${testPadId}`)
|
||||||
.expect((res) => {
|
.expect((res) => {
|
||||||
if (res.body.code !== 0) throw new Error('Unable to create new Pad');
|
if (res.body.code !== 0) throw new Error('Unable to create new Pad');
|
||||||
|
@ -246,10 +243,8 @@ describe(__filename, function () {
|
||||||
.expect('Content-Type', /json/)
|
.expect('Content-Type', /json/)
|
||||||
.expect(200, done);
|
.expect(200, done);
|
||||||
});
|
});
|
||||||
});
|
|
||||||
|
|
||||||
describe(`setHTML ${testName}`, function () {
|
it('setHTML', function (done) {
|
||||||
it('Sets the HTML', function (done) {
|
|
||||||
api.get(`${endPoint('setHTML')}&padID=${testPadId}&html=${encodeURIComponent(test.input)}`)
|
api.get(`${endPoint('setHTML')}&padID=${testPadId}&html=${encodeURIComponent(test.input)}`)
|
||||||
.expect((res) => {
|
.expect((res) => {
|
||||||
if (res.body.code !== 0) throw new Error(`Error:${testName}`);
|
if (res.body.code !== 0) throw new Error(`Error:${testName}`);
|
||||||
|
@ -257,23 +252,21 @@ describe(__filename, function () {
|
||||||
.expect('Content-Type', /json/)
|
.expect('Content-Type', /json/)
|
||||||
.expect(200, done);
|
.expect(200, done);
|
||||||
});
|
});
|
||||||
});
|
|
||||||
|
|
||||||
describe(`getHTML ${testName}`, function () {
|
it('getHTML', function (done) {
|
||||||
it('Gets back the HTML of a Pad', function (done) {
|
|
||||||
api.get(`${endPoint('getHTML')}&padID=${testPadId}`)
|
api.get(`${endPoint('getHTML')}&padID=${testPadId}`)
|
||||||
.expect((res) => {
|
.expect((res) => {
|
||||||
const receivedHtml = res.body.data.html;
|
const gotHtml = res.body.data.html;
|
||||||
if (receivedHtml !== test.expectedHTML) {
|
if (gotHtml !== test.wantHTML) {
|
||||||
throw new Error(`HTML received from export is not the one we were expecting.
|
throw new Error(`HTML received from export is not the one we were expecting.
|
||||||
Test Name:
|
Test Name:
|
||||||
${testName}
|
${testName}
|
||||||
|
|
||||||
Received:
|
Got:
|
||||||
${JSON.stringify(receivedHtml)}
|
${JSON.stringify(gotHtml)}
|
||||||
|
|
||||||
Expected:
|
Want:
|
||||||
${JSON.stringify(test.expectedHTML)}
|
${JSON.stringify(test.wantHTML)}
|
||||||
|
|
||||||
Which is a different version of the originally imported one:
|
Which is a different version of the originally imported one:
|
||||||
${test.input}`);
|
${test.input}`);
|
||||||
|
@ -282,23 +275,21 @@ describe(__filename, function () {
|
||||||
.expect('Content-Type', /json/)
|
.expect('Content-Type', /json/)
|
||||||
.expect(200, done);
|
.expect(200, done);
|
||||||
});
|
});
|
||||||
});
|
|
||||||
|
|
||||||
describe(`getText ${testName}`, function () {
|
it('getText', function (done) {
|
||||||
it('Gets back the Text of a Pad', function (done) {
|
|
||||||
api.get(`${endPoint('getText')}&padID=${testPadId}`)
|
api.get(`${endPoint('getText')}&padID=${testPadId}`)
|
||||||
.expect((res) => {
|
.expect((res) => {
|
||||||
const receivedText = res.body.data.text;
|
const gotText = res.body.data.text;
|
||||||
if (receivedText !== test.expectedText) {
|
if (gotText !== test.wantText) {
|
||||||
throw new Error(`Text received from export is not the one we were expecting.
|
throw new Error(`Text received from export is not the one we were expecting.
|
||||||
Test Name:
|
Test Name:
|
||||||
${testName}
|
${testName}
|
||||||
|
|
||||||
Received:
|
Got:
|
||||||
${JSON.stringify(receivedText)}
|
${JSON.stringify(gotText)}
|
||||||
|
|
||||||
Expected:
|
Want:
|
||||||
${JSON.stringify(test.expectedText)}
|
${JSON.stringify(test.wantText)}
|
||||||
|
|
||||||
Which is a different version of the originally imported one:
|
Which is a different version of the originally imported one:
|
||||||
${test.input}`);
|
${test.input}`);
|
||||||
|
@ -315,7 +306,7 @@ describe(__filename, function () {
|
||||||
function endPoint(point, version) {
|
function endPoint(point, version) {
|
||||||
version = version || apiVersion;
|
version = version || apiVersion;
|
||||||
return `/api/${version}/${point}?apikey=${apiKey}`;
|
return `/api/${version}/${point}?apikey=${apiKey}`;
|
||||||
};
|
}
|
||||||
|
|
||||||
function makeid() {
|
function makeid() {
|
||||||
let text = '';
|
let text = '';
|
||||||
|
|
|
@ -1,34 +1,34 @@
|
||||||
'use strict';
|
'use strict';
|
||||||
|
|
||||||
/* eslint-disable max-len */
|
|
||||||
/*
|
/*
|
||||||
* While importexport tests target the `setHTML` API endpoint, which is nearly identical to what happens
|
* While importexport tests target the `setHTML` API endpoint, which is nearly identical to what
|
||||||
* when a user manually imports a document via the UI, the contentcollector tests here don't use rehype to process
|
* happens when a user manually imports a document via the UI, the contentcollector tests here don't
|
||||||
* the document. Rehype removes spaces and newĺines were applicable, so the expected results here can
|
* use rehype to process the document. Rehype removes spaces and newĺines were applicable, so the
|
||||||
* differ from importexport.js.
|
* expected results here can differ from importexport.js.
|
||||||
*
|
*
|
||||||
* If you add tests here, please also add them to importexport.js
|
* If you add tests here, please also add them to importexport.js
|
||||||
*/
|
*/
|
||||||
|
|
||||||
const contentcollector = require('../../../src/static/js/contentcollector');
|
const AttributePool = require('ep_etherpad-lite/static/js/AttributePool');
|
||||||
const AttributePool = require('../../../src/static/js/AttributePool');
|
const assert = require('assert').strict;
|
||||||
const cheerio = require('../../../src/node_modules/cheerio');
|
const cheerio = require('ep_etherpad-lite/node_modules/cheerio');
|
||||||
|
const contentcollector = require('ep_etherpad-lite/static/js/contentcollector');
|
||||||
|
|
||||||
const tests = {
|
const tests = {
|
||||||
nestedLi: {
|
nestedLi: {
|
||||||
description: 'Complex nested Li',
|
description: 'Complex nested Li',
|
||||||
html: '<!doctype html><html><body><ol><li>one</li><li><ol><li>1.1</li></ol></li><li>two</li></ol></body></html>',
|
html: '<!doctype html><html><body><ol><li>one</li><li><ol><li>1.1</li></ol></li><li>two</li></ol></body></html>',
|
||||||
expectedLineAttribs: [
|
wantLineAttribs: [
|
||||||
'*0*1*2*3+1+3', '*0*4*2*5+1+3', '*0*1*2*5+1+3',
|
'*0*1*2*3+1+3', '*0*4*2*5+1+3', '*0*1*2*5+1+3',
|
||||||
],
|
],
|
||||||
expectedText: [
|
wantText: [
|
||||||
'*one', '*1.1', '*two',
|
'*one', '*1.1', '*two',
|
||||||
],
|
],
|
||||||
},
|
},
|
||||||
complexNest: {
|
complexNest: {
|
||||||
description: 'Complex list of different types',
|
description: 'Complex list of different types',
|
||||||
html: '<!doctype html><html><body><ul class="bullet"><li>one</li><li>two</li><li>0</li><li>1</li><li>2<ul class="bullet"><li>3</li><li>4</li></ul></li></ul><ol class="number"><li>item<ol class="number"><li>item1</li><li>item2</li></ol></li></ol></body></html>',
|
html: '<!doctype html><html><body><ul class="bullet"><li>one</li><li>two</li><li>0</li><li>1</li><li>2<ul class="bullet"><li>3</li><li>4</li></ul></li></ul><ol class="number"><li>item<ol class="number"><li>item1</li><li>item2</li></ol></li></ol></body></html>',
|
||||||
expectedLineAttribs: [
|
wantLineAttribs: [
|
||||||
'*0*1*2+1+3',
|
'*0*1*2+1+3',
|
||||||
'*0*1*2+1+3',
|
'*0*1*2+1+3',
|
||||||
'*0*1*2+1+1',
|
'*0*1*2+1+1',
|
||||||
|
@ -40,7 +40,7 @@ const tests = {
|
||||||
'*0*6*2*7+1+5',
|
'*0*6*2*7+1+5',
|
||||||
'*0*6*2*7+1+5',
|
'*0*6*2*7+1+5',
|
||||||
],
|
],
|
||||||
expectedText: [
|
wantText: [
|
||||||
'*one',
|
'*one',
|
||||||
'*two',
|
'*two',
|
||||||
'*0',
|
'*0',
|
||||||
|
@ -56,148 +56,142 @@ const tests = {
|
||||||
ul: {
|
ul: {
|
||||||
description: 'Tests if uls properly get attributes',
|
description: 'Tests if uls properly get attributes',
|
||||||
html: '<html><body><ul><li>a</li><li>b</li></ul><div>div</div><p>foo</p></body></html>',
|
html: '<html><body><ul><li>a</li><li>b</li></ul><div>div</div><p>foo</p></body></html>',
|
||||||
expectedLineAttribs: ['*0*1*2+1+1', '*0*1*2+1+1', '+3', '+3'],
|
wantLineAttribs: ['*0*1*2+1+1', '*0*1*2+1+1', '+3', '+3'],
|
||||||
expectedText: ['*a', '*b', 'div', 'foo'],
|
wantText: ['*a', '*b', 'div', 'foo'],
|
||||||
},
|
},
|
||||||
ulIndented: {
|
ulIndented: {
|
||||||
description: 'Tests if indented uls properly get attributes',
|
description: 'Tests if indented uls properly get attributes',
|
||||||
html: '<html><body><ul><li>a</li><ul><li>b</li></ul><li>a</li></ul><p>foo</p></body></html>',
|
html: '<html><body><ul><li>a</li><ul><li>b</li></ul><li>a</li></ul><p>foo</p></body></html>',
|
||||||
expectedLineAttribs: ['*0*1*2+1+1', '*0*3*2+1+1', '*0*1*2+1+1', '+3'],
|
wantLineAttribs: ['*0*1*2+1+1', '*0*3*2+1+1', '*0*1*2+1+1', '+3'],
|
||||||
expectedText: ['*a', '*b', '*a', 'foo'],
|
wantText: ['*a', '*b', '*a', 'foo'],
|
||||||
},
|
},
|
||||||
ol: {
|
ol: {
|
||||||
description: 'Tests if ols properly get line numbers when in a normal OL',
|
description: 'Tests if ols properly get line numbers when in a normal OL',
|
||||||
html: '<html><body><ol><li>a</li><li>b</li><li>c</li></ol><p>test</p></body></html>',
|
html: '<html><body><ol><li>a</li><li>b</li><li>c</li></ol><p>test</p></body></html>',
|
||||||
expectedLineAttribs: ['*0*1*2*3+1+1', '*0*1*2*3+1+1', '*0*1*2*3+1+1', '+4'],
|
wantLineAttribs: ['*0*1*2*3+1+1', '*0*1*2*3+1+1', '*0*1*2*3+1+1', '+4'],
|
||||||
expectedText: ['*a', '*b', '*c', 'test'],
|
wantText: ['*a', '*b', '*c', 'test'],
|
||||||
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
|
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
|
||||||
},
|
},
|
||||||
lineDoBreakInOl: {
|
lineDoBreakInOl: {
|
||||||
description: 'A single completely empty line break within an ol should reset count if OL is closed off..',
|
description: 'A single completely empty line break within an ol should reset count if OL is closed off..',
|
||||||
html: '<html><body><ol><li>should be 1</li></ol><p>hello</p><ol><li>should be 1</li><li>should be 2</li></ol><p></p></body></html>',
|
html: '<html><body><ol><li>should be 1</li></ol><p>hello</p><ol><li>should be 1</li><li>should be 2</li></ol><p></p></body></html>',
|
||||||
expectedLineAttribs: ['*0*1*2*3+1+b', '+5', '*0*1*2*4+1+b', '*0*1*2*4+1+b', ''],
|
wantLineAttribs: ['*0*1*2*3+1+b', '+5', '*0*1*2*4+1+b', '*0*1*2*4+1+b', ''],
|
||||||
expectedText: ['*should be 1', 'hello', '*should be 1', '*should be 2', ''],
|
wantText: ['*should be 1', 'hello', '*should be 1', '*should be 2', ''],
|
||||||
noteToSelf: "Shouldn't include attribute marker in the <p> line",
|
noteToSelf: "Shouldn't include attribute marker in the <p> line",
|
||||||
},
|
},
|
||||||
bulletListInOL: {
|
|
||||||
description: 'A bullet within an OL should not change numbering..',
|
|
||||||
html: '<html><body><ol><li>should be 1</li><ul><li>should be a bullet</li></ul><li>should be 2</li></ol><p></p></body></html>',
|
|
||||||
expectedLineAttribs: ['*0*1*2*3+1+b', '*0*4*2*3+1+i', '*0*1*2*5+1+b', ''],
|
|
||||||
expectedText: ['*should be 1', '*should be a bullet', '*should be 2', ''],
|
|
||||||
},
|
|
||||||
testP: {
|
testP: {
|
||||||
description: 'A single <p></p> should create a new line',
|
description: 'A single <p></p> should create a new line',
|
||||||
html: '<html><body><p></p><p></p></body></html>',
|
html: '<html><body><p></p><p></p></body></html>',
|
||||||
expectedLineAttribs: ['', ''],
|
wantLineAttribs: ['', ''],
|
||||||
expectedText: ['', ''],
|
wantText: ['', ''],
|
||||||
noteToSelf: '<p></p>should create a line break but not break numbering',
|
noteToSelf: '<p></p>should create a line break but not break numbering',
|
||||||
},
|
},
|
||||||
nestedOl: {
|
nestedOl: {
|
||||||
description: 'Tests if ols properly get line numbers when in a normal OL',
|
description: 'Tests if ols properly get line numbers when in a normal OL',
|
||||||
html: '<html><body>a<ol><li>b<ol><li>c</li></ol></ol>notlist<p>foo</p></body></html>',
|
html: '<html><body>a<ol><li>b<ol><li>c</li></ol></ol>notlist<p>foo</p></body></html>',
|
||||||
expectedLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1', '+7', '+3'],
|
wantLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1', '+7', '+3'],
|
||||||
expectedText: ['a', '*b', '*c', 'notlist', 'foo'],
|
wantText: ['a', '*b', '*c', 'notlist', 'foo'],
|
||||||
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
|
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
|
||||||
},
|
},
|
||||||
nestedOl2: {
|
nestedOl2: {
|
||||||
description: 'First item being an UL then subsequent being OL will fail',
|
description: 'First item being an UL then subsequent being OL will fail',
|
||||||
html: '<html><body><ul><li>a<ol><li>b</li><li>c</li></ol></li></ul></body></html>',
|
html: '<html><body><ul><li>a<ol><li>b</li><li>c</li></ol></li></ul></body></html>',
|
||||||
expectedLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1'],
|
wantLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1'],
|
||||||
expectedText: ['a', '*b', '*c'],
|
wantText: ['a', '*b', '*c'],
|
||||||
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
|
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
|
||||||
disabled: true,
|
disabled: true,
|
||||||
},
|
},
|
||||||
lineDontBreakOL: {
|
lineDontBreakOL: {
|
||||||
description: 'A single completely empty line break within an ol should NOT reset count',
|
description: 'A single completely empty line break within an ol should NOT reset count',
|
||||||
html: '<html><body><ol><li>should be 1</li><p></p><li>should be 2</li><li>should be 3</li></ol><p></p></body></html>',
|
html: '<html><body><ol><li>should be 1</li><p></p><li>should be 2</li><li>should be 3</li></ol><p></p></body></html>',
|
||||||
expectedLineAttribs: [],
|
wantLineAttribs: [],
|
||||||
expectedText: ['*should be 1', '*should be 2', '*should be 3'],
|
wantText: ['*should be 1', '*should be 2', '*should be 3'],
|
||||||
noteToSelf: "<p></p>should create a line break but not break numbering -- This is what I can't get working!",
|
noteToSelf: "<p></p>should create a line break but not break numbering -- This is what I can't get working!",
|
||||||
disabled: true,
|
disabled: true,
|
||||||
},
|
},
|
||||||
ignoreAnyTagsOutsideBody: {
|
ignoreAnyTagsOutsideBody: {
|
||||||
description: 'Content outside body should be ignored',
|
description: 'Content outside body should be ignored',
|
||||||
html: '<html><head><title>title</title><style></style></head><body>empty<br></body></html>',
|
html: '<html><head><title>title</title><style></style></head><body>empty<br></body></html>',
|
||||||
expectedLineAttribs: ['+5'],
|
wantLineAttribs: ['+5'],
|
||||||
expectedText: ['empty'],
|
wantText: ['empty'],
|
||||||
},
|
},
|
||||||
lineWithMultipleSpaces: {
|
lineWithMultipleSpaces: {
|
||||||
description: 'Multiple spaces should be preserved',
|
description: 'Multiple spaces should be preserved',
|
||||||
html: '<html><body>Text with more than one space.<br></body></html>',
|
html: '<html><body>Text with more than one space.<br></body></html>',
|
||||||
expectedLineAttribs: [ '+10' ],
|
wantLineAttribs: ['+10'],
|
||||||
expectedText: ['Text with more than one space.']
|
wantText: ['Text with more than one space.'],
|
||||||
},
|
},
|
||||||
lineWithMultipleNonBreakingAndNormalSpaces: {
|
lineWithMultipleNonBreakingAndNormalSpaces: {
|
||||||
description: 'non-breaking and normal space should be preserved',
|
description: 'non-breaking and normal space should be preserved',
|
||||||
html: '<html><body>Text with more than one space.<br></body></html>',
|
html: '<html><body>Text with more than one space.<br></body></html>',
|
||||||
expectedLineAttribs: [ '+10' ],
|
wantLineAttribs: ['+10'],
|
||||||
expectedText: ['Text with more than one space.']
|
wantText: ['Text with more than one space.'],
|
||||||
},
|
},
|
||||||
multiplenbsp: {
|
multiplenbsp: {
|
||||||
description: 'Multiple nbsp should be preserved',
|
description: 'Multiple nbsp should be preserved',
|
||||||
html: '<html><body> <br></body></html>',
|
html: '<html><body> <br></body></html>',
|
||||||
expectedLineAttribs: [ '+2' ],
|
wantLineAttribs: ['+2'],
|
||||||
expectedText: [' ']
|
wantText: [' '],
|
||||||
},
|
},
|
||||||
multipleNonBreakingSpaceBetweenWords: {
|
multipleNonBreakingSpaceBetweenWords: {
|
||||||
description: 'Multiple nbsp between words ',
|
description: 'Multiple nbsp between words ',
|
||||||
html: '<html><body> word1 word2 word3<br></body></html>',
|
html: '<html><body> word1 word2 word3<br></body></html>',
|
||||||
expectedLineAttribs: [ '+m' ],
|
wantLineAttribs: ['+m'],
|
||||||
expectedText: [' word1 word2 word3']
|
wantText: [' word1 word2 word3'],
|
||||||
},
|
},
|
||||||
nonBreakingSpacePreceededBySpaceBetweenWords: {
|
nonBreakingSpacePreceededBySpaceBetweenWords: {
|
||||||
description: 'A non-breaking space preceeded by a normal space',
|
description: 'A non-breaking space preceeded by a normal space',
|
||||||
html: '<html><body> word1 word2 word3<br></body></html>',
|
html: '<html><body> word1 word2 word3<br></body></html>',
|
||||||
expectedLineAttribs: [ '+l' ],
|
wantLineAttribs: ['+l'],
|
||||||
expectedText: [' word1 word2 word3']
|
wantText: [' word1 word2 word3'],
|
||||||
},
|
},
|
||||||
nonBreakingSpaceFollowededBySpaceBetweenWords: {
|
nonBreakingSpaceFollowededBySpaceBetweenWords: {
|
||||||
description: 'A non-breaking space followed by a normal space',
|
description: 'A non-breaking space followed by a normal space',
|
||||||
html: '<html><body> word1 word2 word3<br></body></html>',
|
html: '<html><body> word1 word2 word3<br></body></html>',
|
||||||
expectedLineAttribs: [ '+l' ],
|
wantLineAttribs: ['+l'],
|
||||||
expectedText: [' word1 word2 word3']
|
wantText: [' word1 word2 word3'],
|
||||||
},
|
},
|
||||||
spacesAfterNewline: {
|
spacesAfterNewline: {
|
||||||
description: 'Don\'t collapse spaces that follow a newline',
|
description: 'Don\'t collapse spaces that follow a newline',
|
||||||
html:'<!doctype html><html><body>something<br> something<br></body></html>',
|
html: '<!doctype html><html><body>something<br> something<br></body></html>',
|
||||||
expectedLineAttribs: ['+9', '+m'],
|
wantLineAttribs: ['+9', '+m'],
|
||||||
expectedText: ['something', ' something']
|
wantText: ['something', ' something'],
|
||||||
},
|
},
|
||||||
spacesAfterNewlineP: {
|
spacesAfterNewlineP: {
|
||||||
description: 'Don\'t collapse spaces that follow a empty paragraph',
|
description: 'Don\'t collapse spaces that follow a empty paragraph',
|
||||||
html:'<!doctype html><html><body>something<p></p> something<br></body></html>',
|
html: '<!doctype html><html><body>something<p></p> something<br></body></html>',
|
||||||
expectedLineAttribs: ['+9', '', '+m'],
|
wantLineAttribs: ['+9', '', '+m'],
|
||||||
expectedText: ['something', '', ' something']
|
wantText: ['something', '', ' something'],
|
||||||
},
|
},
|
||||||
spacesAtEndOfLine: {
|
spacesAtEndOfLine: {
|
||||||
description: 'Don\'t collapse spaces that preceed/follow a newline',
|
description: 'Don\'t collapse spaces that preceed/follow a newline',
|
||||||
html:'<html><body>something <br> something<br></body></html>',
|
html: '<html><body>something <br> something<br></body></html>',
|
||||||
expectedLineAttribs: ['+l', '+m'],
|
wantLineAttribs: ['+l', '+m'],
|
||||||
expectedText: ['something ', ' something']
|
wantText: ['something ', ' something'],
|
||||||
},
|
},
|
||||||
spacesAtEndOfLineP: {
|
spacesAtEndOfLineP: {
|
||||||
description: 'Don\'t collapse spaces that preceed/follow a empty paragraph',
|
description: 'Don\'t collapse spaces that preceed/follow a empty paragraph',
|
||||||
html:'<html><body>something <p></p> something<br></body></html>',
|
html: '<html><body>something <p></p> something<br></body></html>',
|
||||||
expectedLineAttribs: ['+l', '', '+m'],
|
wantLineAttribs: ['+l', '', '+m'],
|
||||||
expectedText: ['something ', '', ' something']
|
wantText: ['something ', '', ' something'],
|
||||||
},
|
},
|
||||||
nonBreakingSpacesAfterNewlines: {
|
nonBreakingSpacesAfterNewlines: {
|
||||||
description: 'Don\'t collapse non-breaking spaces that follow a newline',
|
description: 'Don\'t collapse non-breaking spaces that follow a newline',
|
||||||
html:'<html><body>something<br> something<br></body></html>',
|
html: '<html><body>something<br> something<br></body></html>',
|
||||||
expectedLineAttribs: ['+9', '+c'],
|
wantLineAttribs: ['+9', '+c'],
|
||||||
expectedText: ['something', ' something']
|
wantText: ['something', ' something'],
|
||||||
},
|
},
|
||||||
nonBreakingSpacesAfterNewlinesP: {
|
nonBreakingSpacesAfterNewlinesP: {
|
||||||
description: 'Don\'t collapse non-breaking spaces that follow a paragraph',
|
description: 'Don\'t collapse non-breaking spaces that follow a paragraph',
|
||||||
html:'<html><body>something<p></p> something<br></body></html>',
|
html: '<html><body>something<p></p> something<br></body></html>',
|
||||||
expectedLineAttribs: ['+9', '', '+c'],
|
wantLineAttribs: ['+9', '', '+c'],
|
||||||
expectedText: ['something', '', ' something']
|
wantText: ['something', '', ' something'],
|
||||||
},
|
},
|
||||||
preserveSpacesInsideElements: {
|
preserveSpacesInsideElements: {
|
||||||
description: 'Preserve all spaces when multiple are present',
|
description: 'Preserve all spaces when multiple are present',
|
||||||
html: '<html><body>Need <span> more </span> space<i> s </i> !<br></body></html>',
|
html: '<html><body>Need <span> more </span> space<i> s </i> !<br></body></html>',
|
||||||
expectedLineAttribs: ['+h*0+4+2'],
|
wantLineAttribs: ['+h*0+4+2'],
|
||||||
expectedText: ['Need more space s !'],
|
wantText: ['Need more space s !'],
|
||||||
},
|
},
|
||||||
preserveSpacesAcrossNewlines: {
|
preserveSpacesAcrossNewlines: {
|
||||||
description: 'Newlines and multiple spaces across newlines should be preserved',
|
description: 'Newlines and multiple spaces across newlines should be preserved',
|
||||||
|
@ -207,69 +201,76 @@ const tests = {
|
||||||
space
|
space
|
||||||
<i> s </i>
|
<i> s </i>
|
||||||
!<br></body></html>`,
|
!<br></body></html>`,
|
||||||
expectedLineAttribs: [ '+19*0+4+b' ],
|
wantLineAttribs: ['+19*0+4+b'],
|
||||||
expectedText: [ 'Need more space s !' ]
|
wantText: ['Need more space s !'],
|
||||||
},
|
},
|
||||||
multipleNewLinesAtBeginning: {
|
multipleNewLinesAtBeginning: {
|
||||||
description: 'Multiple new lines at the beginning should be preserved',
|
description: 'Multiple new lines at the beginning should be preserved',
|
||||||
html: '<html><body><br><br><p></p><p></p>first line<br><br>second line<br></body></html>',
|
html: '<html><body><br><br><p></p><p></p>first line<br><br>second line<br></body></html>',
|
||||||
expectedLineAttribs: ['', '', '', '', '+a', '', '+b'],
|
wantLineAttribs: ['', '', '', '', '+a', '', '+b'],
|
||||||
expectedText: [ '', '', '', '', 'first line', '', 'second line']
|
wantText: ['', '', '', '', 'first line', '', 'second line'],
|
||||||
},
|
},
|
||||||
multiLineParagraph:{
|
multiLineParagraph: {
|
||||||
description: "A paragraph with multiple lines should not loose spaces when lines are combined",
|
description: 'A paragraph with multiple lines should not loose spaces when lines are combined',
|
||||||
html:`<html><body><p>
|
html: `<html><body><p>
|
||||||
а б в г ґ д е є ж з и і ї й к л м н о
|
а б в г ґ д е є ж з и і ї й к л м н о
|
||||||
п р с т у ф х ц ч ш щ ю я ь</p>
|
п р с т у ф х ц ч ш щ ю я ь</p>
|
||||||
</body></html>`,
|
</body></html>`,
|
||||||
expectedLineAttribs: [ '+1t' ],
|
wantLineAttribs: ['+1t'],
|
||||||
expectedText: ["а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь"]
|
wantText: ['а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь'],
|
||||||
},
|
},
|
||||||
multiLineParagraphWithPre:{
|
multiLineParagraphWithPre: {
|
||||||
description: "lines in preformatted text should be kept intact",
|
description: 'lines in preformatted text should be kept intact',
|
||||||
html:`<html><body><p>
|
html: `<html><body><p>
|
||||||
а б в г ґ д е є ж з и і ї й к л м н о<pre>multiple
|
а б в г ґ д е є ж з и і ї й к л м н о</p><pre>multiple
|
||||||
lines
|
lines
|
||||||
in
|
in
|
||||||
pre
|
pre
|
||||||
</pre></p><p>п р с т у ф х ц ч ш щ ю я
|
</pre><p>п р с т у ф х ц ч ш щ ю я
|
||||||
ь</p>
|
ь</p>
|
||||||
</body></html>`,
|
</body></html>`,
|
||||||
expectedLineAttribs: [ '+11', '+8', '+5', '+2', '+3', '+r' ],
|
wantLineAttribs: ['+11', '+8', '+5', '+2', '+3', '+r'],
|
||||||
expectedText: ['а б в г ґ д е є ж з и і ї й к л м н о', 'multiple', 'lines', 'in', 'pre', 'п р с т у ф х ц ч ш щ ю я ь']
|
wantText: [
|
||||||
|
'а б в г ґ д е є ж з и і ї й к л м н о',
|
||||||
|
'multiple',
|
||||||
|
'lines',
|
||||||
|
'in',
|
||||||
|
'pre',
|
||||||
|
'п р с т у ф х ц ч ш щ ю я ь',
|
||||||
|
],
|
||||||
},
|
},
|
||||||
preIntroducesASpace: {
|
preIntroducesASpace: {
|
||||||
description: "pre should be on a new line not preceeded by a space",
|
description: 'pre should be on a new line not preceeded by a space',
|
||||||
html:`<html><body><p>
|
html: `<html><body><p>
|
||||||
1
|
1
|
||||||
<pre>preline
|
</p><pre>preline
|
||||||
</pre></p></body></html>`,
|
</pre></body></html>`,
|
||||||
expectedLineAttribs: [ '+6', '+7' ],
|
wantLineAttribs: ['+6', '+7'],
|
||||||
expectedText: [' 1 ', 'preline']
|
wantText: [' 1 ', 'preline'],
|
||||||
},
|
},
|
||||||
dontDeleteSpaceInsideElements: {
|
dontDeleteSpaceInsideElements: {
|
||||||
description: 'Preserve spaces on the beginning and end of a element',
|
description: 'Preserve spaces on the beginning and end of a element',
|
||||||
html: '<html><body>Need<span> more </span>space<i> s </i>!<br></body></html>',
|
html: '<html><body>Need<span> more </span>space<i> s </i>!<br></body></html>',
|
||||||
expectedLineAttribs: ['+f*0+3+1'],
|
wantLineAttribs: ['+f*0+3+1'],
|
||||||
expectedText: ['Need more space s !']
|
wantText: ['Need more space s !'],
|
||||||
},
|
},
|
||||||
dontDeleteSpaceOutsideElements: {
|
dontDeleteSpaceOutsideElements: {
|
||||||
description: 'Preserve spaces outside elements',
|
description: 'Preserve spaces outside elements',
|
||||||
html: '<html><body>Need <span>more</span> space <i>s</i> !<br></body></html>',
|
html: '<html><body>Need <span>more</span> space <i>s</i> !<br></body></html>',
|
||||||
expectedLineAttribs: ['+g*0+1+2'],
|
wantLineAttribs: ['+g*0+1+2'],
|
||||||
expectedText: ['Need more space s !']
|
wantText: ['Need more space s !'],
|
||||||
},
|
},
|
||||||
dontDeleteSpaceAtEndOfElement: {
|
dontDeleteSpaceAtEndOfElement: {
|
||||||
description: 'Preserve spaces at the end of an element',
|
description: 'Preserve spaces at the end of an element',
|
||||||
html: '<html><body>Need <span>more </span>space <i>s </i>!<br></body></html>',
|
html: '<html><body>Need <span>more </span>space <i>s </i>!<br></body></html>',
|
||||||
expectedLineAttribs: ['+g*0+2+1'],
|
wantLineAttribs: ['+g*0+2+1'],
|
||||||
expectedText: ['Need more space s !']
|
wantText: ['Need more space s !'],
|
||||||
},
|
},
|
||||||
dontDeleteSpaceAtBeginOfElements: {
|
dontDeleteSpaceAtBeginOfElements: {
|
||||||
description: 'Preserve spaces at the start of an element',
|
description: 'Preserve spaces at the start of an element',
|
||||||
html: '<html><body>Need<span> more</span> space<i> s</i> !<br></body></html>',
|
html: '<html><body>Need<span> more</span> space<i> s</i> !<br></body></html>',
|
||||||
expectedLineAttribs: ['+f*0+2+2'],
|
wantLineAttribs: ['+f*0+2+2'],
|
||||||
expectedText: ['Need more space s !']
|
wantText: ['Need more space s !'],
|
||||||
},
|
},
|
||||||
};
|
};
|
||||||
|
|
||||||
|
@ -283,7 +284,7 @@ describe(__filename, function () {
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
|
||||||
it(testObj.description, function (done) {
|
it(testObj.description, async function () {
|
||||||
const $ = cheerio.load(testObj.html); // Load HTML into Cheerio
|
const $ = cheerio.load(testObj.html); // Load HTML into Cheerio
|
||||||
const doc = $('body')[0]; // Creates a dom-like representation of HTML
|
const doc = $('body')[0]; // Creates a dom-like representation of HTML
|
||||||
// Create an empty attribute pool
|
// Create an empty attribute pool
|
||||||
|
@ -293,29 +294,13 @@ describe(__filename, function () {
|
||||||
const cc = contentcollector.makeContentCollector(true, null, apool);
|
const cc = contentcollector.makeContentCollector(true, null, apool);
|
||||||
cc.collectContent(doc);
|
cc.collectContent(doc);
|
||||||
const result = cc.finish();
|
const result = cc.finish();
|
||||||
const recievedAttributes = result.lineAttribs;
|
const gotAttributes = result.lineAttribs;
|
||||||
const expectedAttributes = testObj.expectedLineAttribs;
|
const wantAttributes = testObj.wantLineAttribs;
|
||||||
const recievedText = new Array(result.lines);
|
const gotText = new Array(result.lines);
|
||||||
const expectedText = testObj.expectedText;
|
const wantText = testObj.wantText;
|
||||||
|
|
||||||
// Check recieved text matches the expected text
|
assert.deepEqual(gotText[0], wantText);
|
||||||
if (arraysEqual(recievedText[0], expectedText)) {
|
assert.deepEqual(gotAttributes, wantAttributes);
|
||||||
// console.log("PASS: Recieved Text did match Expected Text\nRecieved:", recievedText[0], "\nExpected:", testObj.expectedText)
|
|
||||||
} else {
|
|
||||||
console.error('FAIL: Recieved Text did not match Expected Text\nRecieved:', recievedText[0], '\nExpected:', testObj.expectedText);
|
|
||||||
throw new Error();
|
|
||||||
}
|
|
||||||
|
|
||||||
// Check recieved attributes matches the expected attributes
|
|
||||||
if (arraysEqual(recievedAttributes, expectedAttributes)) {
|
|
||||||
// console.log("PASS: Recieved Attributes matched Expected Attributes");
|
|
||||||
done();
|
|
||||||
} else {
|
|
||||||
console.error('FAIL', test, testObj.description);
|
|
||||||
console.error('FAIL: Recieved Attributes did not match Expected Attributes\nRecieved: ', recievedAttributes, '\nExpected: ', expectedAttributes);
|
|
||||||
console.error('FAILING HTML', testObj.html);
|
|
||||||
throw new Error();
|
|
||||||
}
|
|
||||||
});
|
});
|
||||||
});
|
});
|
||||||
}
|
}
|
||||||
|
@ -325,7 +310,7 @@ describe(__filename, function () {
|
||||||
function arraysEqual(a, b) {
|
function arraysEqual(a, b) {
|
||||||
if (a === b) return true;
|
if (a === b) return true;
|
||||||
if (a == null || b == null) return false;
|
if (a == null || b == null) return false;
|
||||||
if (a.length != b.length) return false;
|
if (a.length !== b.length) return false;
|
||||||
|
|
||||||
// If you don't care about the order of the elements inside
|
// If you don't care about the order of the elements inside
|
||||||
// the array, you should sort both arrays here.
|
// the array, you should sort both arrays here.
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue