2020-12-18 06:40:33 +01:00
|
|
|
|
'use strict';
|
|
|
|
|
|
2020-12-20 07:18:19 +01:00
|
|
|
|
/*
|
2021-01-24 06:56:11 +01:00
|
|
|
|
* While importexport tests target the `setHTML` API endpoint, which is nearly identical to what
|
|
|
|
|
* happens when a user manually imports a document via the UI, the contentcollector tests here don't
|
|
|
|
|
* use rehype to process the document. Rehype removes spaces and newĺines were applicable, so the
|
|
|
|
|
* expected results here can differ from importexport.js.
|
2020-12-20 07:18:19 +01:00
|
|
|
|
*
|
|
|
|
|
* If you add tests here, please also add them to importexport.js
|
|
|
|
|
*/
|
2020-12-18 06:40:33 +01:00
|
|
|
|
|
2021-01-24 06:56:11 +01:00
|
|
|
|
const AttributePool = require('ep_etherpad-lite/static/js/AttributePool');
|
2021-01-24 07:34:28 +01:00
|
|
|
|
const assert = require('assert').strict;
|
2021-01-24 06:56:11 +01:00
|
|
|
|
const cheerio = require('ep_etherpad-lite/node_modules/cheerio');
|
|
|
|
|
const contentcollector = require('ep_etherpad-lite/static/js/contentcollector');
|
2020-06-05 21:54:16 +02:00
|
|
|
|
|
|
|
|
|
const tests = {
|
2020-11-23 19:21:51 +01:00
|
|
|
|
nestedLi: {
|
|
|
|
|
description: 'Complex nested Li',
|
2020-06-05 21:54:16 +02:00
|
|
|
|
html: '<!doctype html><html><body><ol><li>one</li><li><ol><li>1.1</li></ol></li><li>two</li></ol></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: [
|
2020-11-23 19:21:51 +01:00
|
|
|
|
'*0*1*2*3+1+3', '*0*4*2*5+1+3', '*0*1*2*5+1+3',
|
2020-06-05 21:54:16 +02:00
|
|
|
|
],
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantText: [
|
2020-11-23 19:21:51 +01:00
|
|
|
|
'*one', '*1.1', '*two',
|
|
|
|
|
],
|
2020-06-05 21:54:16 +02:00
|
|
|
|
},
|
2020-11-23 19:21:51 +01:00
|
|
|
|
complexNest: {
|
|
|
|
|
description: 'Complex list of different types',
|
2020-06-05 21:54:16 +02:00
|
|
|
|
html: '<!doctype html><html><body><ul class="bullet"><li>one</li><li>two</li><li>0</li><li>1</li><li>2<ul class="bullet"><li>3</li><li>4</li></ul></li></ul><ol class="number"><li>item<ol class="number"><li>item1</li><li>item2</li></ol></li></ol></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: [
|
2020-06-05 21:54:16 +02:00
|
|
|
|
'*0*1*2+1+3',
|
|
|
|
|
'*0*1*2+1+3',
|
|
|
|
|
'*0*1*2+1+1',
|
|
|
|
|
'*0*1*2+1+1',
|
|
|
|
|
'*0*1*2+1+1',
|
|
|
|
|
'*0*3*2+1+1',
|
|
|
|
|
'*0*3*2+1+1',
|
|
|
|
|
'*0*4*2*5+1+4',
|
|
|
|
|
'*0*6*2*7+1+5',
|
2020-11-23 19:21:51 +01:00
|
|
|
|
'*0*6*2*7+1+5',
|
2020-06-05 21:54:16 +02:00
|
|
|
|
],
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantText: [
|
2020-11-23 19:21:51 +01:00
|
|
|
|
'*one',
|
|
|
|
|
'*two',
|
|
|
|
|
'*0',
|
|
|
|
|
'*1',
|
|
|
|
|
'*2',
|
|
|
|
|
'*3',
|
|
|
|
|
'*4',
|
|
|
|
|
'*item',
|
|
|
|
|
'*item1',
|
|
|
|
|
'*item2',
|
|
|
|
|
],
|
2020-06-05 21:54:16 +02:00
|
|
|
|
},
|
|
|
|
|
ul: {
|
2020-11-23 19:21:51 +01:00
|
|
|
|
description: 'Tests if uls properly get attributes',
|
|
|
|
|
html: '<html><body><ul><li>a</li><li>b</li></ul><div>div</div><p>foo</p></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['*0*1*2+1+1', '*0*1*2+1+1', '+3', '+3'],
|
|
|
|
|
wantText: ['*a', '*b', 'div', 'foo'],
|
2020-11-23 19:21:51 +01:00
|
|
|
|
},
|
2020-06-05 21:54:16 +02:00
|
|
|
|
ulIndented: {
|
2020-11-23 19:21:51 +01:00
|
|
|
|
description: 'Tests if indented uls properly get attributes',
|
|
|
|
|
html: '<html><body><ul><li>a</li><ul><li>b</li></ul><li>a</li></ul><p>foo</p></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['*0*1*2+1+1', '*0*3*2+1+1', '*0*1*2+1+1', '+3'],
|
|
|
|
|
wantText: ['*a', '*b', '*a', 'foo'],
|
2020-06-05 21:54:16 +02:00
|
|
|
|
},
|
|
|
|
|
ol: {
|
2020-11-23 19:21:51 +01:00
|
|
|
|
description: 'Tests if ols properly get line numbers when in a normal OL',
|
|
|
|
|
html: '<html><body><ol><li>a</li><li>b</li><li>c</li></ol><p>test</p></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['*0*1*2*3+1+1', '*0*1*2*3+1+1', '*0*1*2*3+1+1', '+4'],
|
|
|
|
|
wantText: ['*a', '*b', '*c', 'test'],
|
2020-11-23 19:21:51 +01:00
|
|
|
|
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
|
2020-06-05 21:54:16 +02:00
|
|
|
|
},
|
2020-11-23 19:21:51 +01:00
|
|
|
|
lineDoBreakInOl: {
|
|
|
|
|
description: 'A single completely empty line break within an ol should reset count if OL is closed off..',
|
|
|
|
|
html: '<html><body><ol><li>should be 1</li></ol><p>hello</p><ol><li>should be 1</li><li>should be 2</li></ol><p></p></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['*0*1*2*3+1+b', '+5', '*0*1*2*4+1+b', '*0*1*2*4+1+b', ''],
|
|
|
|
|
wantText: ['*should be 1', 'hello', '*should be 1', '*should be 2', ''],
|
2020-11-23 19:21:51 +01:00
|
|
|
|
noteToSelf: "Shouldn't include attribute marker in the <p> line",
|
2020-06-05 21:54:16 +02:00
|
|
|
|
},
|
2020-11-23 19:21:51 +01:00
|
|
|
|
testP: {
|
|
|
|
|
description: 'A single <p></p> should create a new line',
|
|
|
|
|
html: '<html><body><p></p><p></p></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['', ''],
|
|
|
|
|
wantText: ['', ''],
|
2020-11-23 19:21:51 +01:00
|
|
|
|
noteToSelf: '<p></p>should create a line break but not break numbering',
|
2020-06-05 21:54:16 +02:00
|
|
|
|
},
|
|
|
|
|
nestedOl: {
|
2020-11-23 19:21:51 +01:00
|
|
|
|
description: 'Tests if ols properly get line numbers when in a normal OL',
|
|
|
|
|
html: '<html><body>a<ol><li>b<ol><li>c</li></ol></ol>notlist<p>foo</p></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1', '+7', '+3'],
|
|
|
|
|
wantText: ['a', '*b', '*c', 'notlist', 'foo'],
|
2020-11-23 19:21:51 +01:00
|
|
|
|
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
|
2020-06-05 21:54:16 +02:00
|
|
|
|
},
|
2020-12-18 06:40:33 +01:00
|
|
|
|
nestedOl2: {
|
2020-11-23 19:21:51 +01:00
|
|
|
|
description: 'First item being an UL then subsequent being OL will fail',
|
|
|
|
|
html: '<html><body><ul><li>a<ol><li>b</li><li>c</li></ol></li></ul></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+1', '*0*1*2*3+1+1', '*0*4*2*5+1+1'],
|
|
|
|
|
wantText: ['a', '*b', '*c'],
|
2020-11-23 19:21:51 +01:00
|
|
|
|
noteToSelf: 'Ensure empty P does not induce line attribute marker, wont this break the editor?',
|
|
|
|
|
disabled: true,
|
2020-06-05 21:54:16 +02:00
|
|
|
|
},
|
2020-11-23 19:21:51 +01:00
|
|
|
|
lineDontBreakOL: {
|
|
|
|
|
description: 'A single completely empty line break within an ol should NOT reset count',
|
|
|
|
|
html: '<html><body><ol><li>should be 1</li><p></p><li>should be 2</li><li>should be 3</li></ol><p></p></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: [],
|
|
|
|
|
wantText: ['*should be 1', '*should be 2', '*should be 3'],
|
2020-06-05 21:54:16 +02:00
|
|
|
|
noteToSelf: "<p></p>should create a line break but not break numbering -- This is what I can't get working!",
|
2020-11-23 19:21:51 +01:00
|
|
|
|
disabled: true,
|
|
|
|
|
},
|
2020-12-18 10:37:37 +01:00
|
|
|
|
ignoreAnyTagsOutsideBody: {
|
|
|
|
|
description: 'Content outside body should be ignored',
|
|
|
|
|
html: '<html><head><title>title</title><style></style></head><body>empty<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+5'],
|
|
|
|
|
wantText: ['empty'],
|
2020-12-18 10:37:37 +01:00
|
|
|
|
},
|
2020-12-20 07:18:19 +01:00
|
|
|
|
lineWithMultipleSpaces: {
|
|
|
|
|
description: 'Multiple spaces should be preserved',
|
|
|
|
|
html: '<html><body>Text with more than one space.<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+10'],
|
|
|
|
|
wantText: ['Text with more than one space.'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
lineWithMultipleNonBreakingAndNormalSpaces: {
|
|
|
|
|
description: 'non-breaking and normal space should be preserved',
|
|
|
|
|
html: '<html><body>Text with more than one space.<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+10'],
|
|
|
|
|
wantText: ['Text with more than one space.'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
multiplenbsp: {
|
|
|
|
|
description: 'Multiple nbsp should be preserved',
|
|
|
|
|
html: '<html><body> <br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+2'],
|
|
|
|
|
wantText: [' '],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
multipleNonBreakingSpaceBetweenWords: {
|
|
|
|
|
description: 'Multiple nbsp between words ',
|
|
|
|
|
html: '<html><body> word1 word2 word3<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+m'],
|
|
|
|
|
wantText: [' word1 word2 word3'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
nonBreakingSpacePreceededBySpaceBetweenWords: {
|
|
|
|
|
description: 'A non-breaking space preceeded by a normal space',
|
|
|
|
|
html: '<html><body> word1 word2 word3<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+l'],
|
|
|
|
|
wantText: [' word1 word2 word3'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
nonBreakingSpaceFollowededBySpaceBetweenWords: {
|
|
|
|
|
description: 'A non-breaking space followed by a normal space',
|
|
|
|
|
html: '<html><body> word1 word2 word3<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+l'],
|
|
|
|
|
wantText: [' word1 word2 word3'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
spacesAfterNewline: {
|
|
|
|
|
description: 'Don\'t collapse spaces that follow a newline',
|
2021-01-24 06:56:11 +01:00
|
|
|
|
html: '<!doctype html><html><body>something<br> something<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+9', '+m'],
|
|
|
|
|
wantText: ['something', ' something'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
spacesAfterNewlineP: {
|
|
|
|
|
description: 'Don\'t collapse spaces that follow a empty paragraph',
|
2021-01-24 06:56:11 +01:00
|
|
|
|
html: '<!doctype html><html><body>something<p></p> something<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+9', '', '+m'],
|
|
|
|
|
wantText: ['something', '', ' something'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
spacesAtEndOfLine: {
|
|
|
|
|
description: 'Don\'t collapse spaces that preceed/follow a newline',
|
2021-01-24 06:56:11 +01:00
|
|
|
|
html: '<html><body>something <br> something<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+l', '+m'],
|
|
|
|
|
wantText: ['something ', ' something'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
spacesAtEndOfLineP: {
|
|
|
|
|
description: 'Don\'t collapse spaces that preceed/follow a empty paragraph',
|
2021-01-24 06:56:11 +01:00
|
|
|
|
html: '<html><body>something <p></p> something<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+l', '', '+m'],
|
|
|
|
|
wantText: ['something ', '', ' something'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
nonBreakingSpacesAfterNewlines: {
|
|
|
|
|
description: 'Don\'t collapse non-breaking spaces that follow a newline',
|
2021-01-24 06:56:11 +01:00
|
|
|
|
html: '<html><body>something<br> something<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+9', '+c'],
|
|
|
|
|
wantText: ['something', ' something'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
nonBreakingSpacesAfterNewlinesP: {
|
|
|
|
|
description: 'Don\'t collapse non-breaking spaces that follow a paragraph',
|
2021-01-24 06:56:11 +01:00
|
|
|
|
html: '<html><body>something<p></p> something<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+9', '', '+c'],
|
|
|
|
|
wantText: ['something', '', ' something'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
preserveSpacesInsideElements: {
|
|
|
|
|
description: 'Preserve all spaces when multiple are present',
|
|
|
|
|
html: '<html><body>Need <span> more </span> space<i> s </i> !<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+h*0+4+2'],
|
|
|
|
|
wantText: ['Need more space s !'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
preserveSpacesAcrossNewlines: {
|
|
|
|
|
description: 'Newlines and multiple spaces across newlines should be preserved',
|
|
|
|
|
html: `
|
|
|
|
|
<html><body>Need
|
|
|
|
|
<span> more </span>
|
|
|
|
|
space
|
|
|
|
|
<i> s </i>
|
|
|
|
|
!<br></body></html>`,
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+19*0+4+b'],
|
|
|
|
|
wantText: ['Need more space s !'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
multipleNewLinesAtBeginning: {
|
|
|
|
|
description: 'Multiple new lines at the beginning should be preserved',
|
|
|
|
|
html: '<html><body><br><br><p></p><p></p>first line<br><br>second line<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['', '', '', '', '+a', '', '+b'],
|
|
|
|
|
wantText: ['', '', '', '', 'first line', '', 'second line'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
2021-01-24 06:56:11 +01:00
|
|
|
|
multiLineParagraph: {
|
|
|
|
|
description: 'A paragraph with multiple lines should not loose spaces when lines are combined',
|
|
|
|
|
html: `<html><body><p>
|
2020-12-20 07:18:19 +01:00
|
|
|
|
а б в г ґ д е є ж з и і ї й к л м н о
|
|
|
|
|
п р с т у ф х ц ч ш щ ю я ь</p>
|
|
|
|
|
</body></html>`,
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+1t'],
|
|
|
|
|
wantText: ['а б в г ґ д е є ж з и і ї й к л м н о п р с т у ф х ц ч ш щ ю я ь'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
2021-01-24 06:56:11 +01:00
|
|
|
|
multiLineParagraphWithPre: {
|
|
|
|
|
description: 'lines in preformatted text should be kept intact',
|
|
|
|
|
html: `<html><body><p>
|
2021-01-24 09:31:45 +01:00
|
|
|
|
а б в г ґ д е є ж з и і ї й к л м н о</p><pre>multiple
|
2020-12-20 07:18:19 +01:00
|
|
|
|
lines
|
|
|
|
|
in
|
|
|
|
|
pre
|
2021-01-24 09:31:45 +01:00
|
|
|
|
</pre><p>п р с т у ф х ц ч ш щ ю я
|
2020-12-20 07:18:19 +01:00
|
|
|
|
ь</p>
|
|
|
|
|
</body></html>`,
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+11', '+8', '+5', '+2', '+3', '+r'],
|
|
|
|
|
wantText: [
|
2021-01-24 06:56:11 +01:00
|
|
|
|
'а б в г ґ д е є ж з и і ї й к л м н о',
|
|
|
|
|
'multiple',
|
|
|
|
|
'lines',
|
|
|
|
|
'in',
|
|
|
|
|
'pre',
|
|
|
|
|
'п р с т у ф х ц ч ш щ ю я ь',
|
|
|
|
|
],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
preIntroducesASpace: {
|
2021-01-24 06:56:11 +01:00
|
|
|
|
description: 'pre should be on a new line not preceeded by a space',
|
|
|
|
|
html: `<html><body><p>
|
2020-12-20 07:18:19 +01:00
|
|
|
|
1
|
2021-01-24 09:31:45 +01:00
|
|
|
|
</p><pre>preline
|
|
|
|
|
</pre></body></html>`,
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+6', '+7'],
|
|
|
|
|
wantText: [' 1 ', 'preline'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
dontDeleteSpaceInsideElements: {
|
|
|
|
|
description: 'Preserve spaces on the beginning and end of a element',
|
|
|
|
|
html: '<html><body>Need<span> more </span>space<i> s </i>!<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+f*0+3+1'],
|
|
|
|
|
wantText: ['Need more space s !'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
dontDeleteSpaceOutsideElements: {
|
|
|
|
|
description: 'Preserve spaces outside elements',
|
|
|
|
|
html: '<html><body>Need <span>more</span> space <i>s</i> !<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+g*0+1+2'],
|
|
|
|
|
wantText: ['Need more space s !'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
dontDeleteSpaceAtEndOfElement: {
|
|
|
|
|
description: 'Preserve spaces at the end of an element',
|
|
|
|
|
html: '<html><body>Need <span>more </span>space <i>s </i>!<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+g*0+2+1'],
|
|
|
|
|
wantText: ['Need more space s !'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
|
|
|
|
dontDeleteSpaceAtBeginOfElements: {
|
|
|
|
|
description: 'Preserve spaces at the start of an element',
|
|
|
|
|
html: '<html><body>Need<span> more</span> space<i> s</i> !<br></body></html>',
|
2021-01-24 07:54:14 +01:00
|
|
|
|
wantLineAttribs: ['+f*0+2+2'],
|
|
|
|
|
wantText: ['Need more space s !'],
|
2020-12-20 07:18:19 +01:00
|
|
|
|
},
|
2020-11-23 19:21:51 +01:00
|
|
|
|
};
|
2020-06-05 21:54:16 +02:00
|
|
|
|
|
2020-11-23 19:21:51 +01:00
|
|
|
|
describe(__filename, function () {
|
2020-12-18 06:40:33 +01:00
|
|
|
|
for (const test of Object.keys(tests)) {
|
2020-11-23 19:21:51 +01:00
|
|
|
|
const testObj = tests[test];
|
|
|
|
|
describe(test, function () {
|
2020-10-10 00:19:46 +02:00
|
|
|
|
if (testObj.disabled) {
|
2020-11-23 19:21:51 +01:00
|
|
|
|
return xit('DISABLED:', test, function (done) {
|
2020-10-10 00:19:46 +02:00
|
|
|
|
done();
|
2020-11-23 19:21:51 +01:00
|
|
|
|
});
|
2020-06-05 21:54:16 +02:00
|
|
|
|
}
|
|
|
|
|
|
2021-01-24 07:57:11 +01:00
|
|
|
|
it(testObj.description, async function () {
|
2020-11-23 19:21:51 +01:00
|
|
|
|
const $ = cheerio.load(testObj.html); // Load HTML into Cheerio
|
2020-12-18 10:37:37 +01:00
|
|
|
|
const doc = $('body')[0]; // Creates a dom-like representation of HTML
|
2020-10-10 00:19:46 +02:00
|
|
|
|
// Create an empty attribute pool
|
2020-11-23 19:21:51 +01:00
|
|
|
|
const apool = new AttributePool();
|
2020-10-10 00:19:46 +02:00
|
|
|
|
// Convert a dom tree into a list of lines and attribute liens
|
|
|
|
|
// using the content collector object
|
2020-11-23 19:21:51 +01:00
|
|
|
|
const cc = contentcollector.makeContentCollector(true, null, apool);
|
2020-10-10 00:19:46 +02:00
|
|
|
|
cc.collectContent(doc);
|
2020-11-23 19:21:51 +01:00
|
|
|
|
const result = cc.finish();
|
2021-01-24 07:54:14 +01:00
|
|
|
|
const gotAttributes = result.lineAttribs;
|
|
|
|
|
const wantAttributes = testObj.wantLineAttribs;
|
|
|
|
|
const gotText = new Array(result.lines);
|
|
|
|
|
const wantText = testObj.wantText;
|
2020-06-05 21:54:16 +02:00
|
|
|
|
|
2021-01-24 07:54:14 +01:00
|
|
|
|
assert.deepEqual(gotText[0], wantText);
|
|
|
|
|
assert.deepEqual(gotAttributes, wantAttributes);
|
2020-10-10 00:19:46 +02:00
|
|
|
|
});
|
|
|
|
|
});
|
|
|
|
|
}
|
|
|
|
|
});
|
2020-06-05 21:54:16 +02:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
function arraysEqual(a, b) {
|
|
|
|
|
if (a === b) return true;
|
|
|
|
|
if (a == null || b == null) return false;
|
2021-01-24 06:56:11 +01:00
|
|
|
|
if (a.length !== b.length) return false;
|
2020-06-05 21:54:16 +02:00
|
|
|
|
|
|
|
|
|
// If you don't care about the order of the elements inside
|
|
|
|
|
// the array, you should sort both arrays here.
|
|
|
|
|
// Please note that calling sort on an array will modify that array.
|
|
|
|
|
// you might want to clone your array first.
|
|
|
|
|
|
2020-11-23 19:21:51 +01:00
|
|
|
|
for (let i = 0; i < a.length; ++i) {
|
2020-06-05 21:54:16 +02:00
|
|
|
|
if (a[i] !== b[i]) return false;
|
|
|
|
|
}
|
|
|
|
|
return true;
|
|
|
|
|
}
|