" and return root element', function () {
const root = parseHTML('
');
const div = new HTMLElement('div', {}, '');
const a = div.appendChild(new HTMLElement('a', {}, ''));
const img = a.appendChild(new HTMLElement('img', {}, ''));
const p = div.appendChild(new HTMLElement('p', {}, ''));
root.firstChild.should.eql(div);
});
it('should parse "
" and return root element without comments', function () {
const root = parseHTML('
');
const div = new HTMLElement('div', {}, '');
const a = div.appendChild(new HTMLElement('a', {}, ''));
root.firstChild.should.eql(div);
});
it('should parse "
" and return root element with comments', function () {
const root = parseHTML('
', { comment: true });
const div = new HTMLElement('div', {}, '');
const a = div.appendChild(new HTMLElement('a', {}, ''));
const comment = a.appendChild(new CommentNode(' my comment '));
root.firstChild.should.eql(div);
});
it('should not parse HTML inside comments', function () {
const root = parseHTML('', { comment: true });
const div = new HTMLElement('div', {}, '');
const comment = div.appendChild(new CommentNode(''));
root.firstChild.should.eql(div);
});
it('should parse picture element', function () {
const root = parseHTML('');
const picture = new HTMLElement('picture', {}, '');
const source = picture.appendChild(new HTMLElement('source', {}, 'srcset="/images/example-1.jpg 1200w, /images/example-2.jpg 1600w" sizes="100vw"'));
const img = picture.appendChild(new HTMLElement('img', {}, 'src="/images/example.jpg" alt="Example"'));
root.firstChild.should.eql(picture);
});
it('should not extract text in script and style by default', function () {
const root = parseHTML('');
root.firstChild.childNodes.should.be.empty;
root.lastChild.childNodes.should.be.empty;
});
it('should extract text in script and style when ask so', function () {
const root = parseHTML('', {
script: true,
style: true
});
root.firstChild.childNodes.should.not.be.empty;
root.firstChild.childNodes.should.eql([new TextNode('1')]);
root.firstChild.text.should.eql('1');
root.lastChild.childNodes.should.not.be.empty;
root.lastChild.childNodes.should.eql([new TextNode('2&')]);
root.lastChild.text.should.eql('2&');
root.lastChild.rawText.should.eql('2&');
});
it('should be able to parse "html/incomplete-script" file', function () {
const root = parseHTML(fs.readFileSync(__dirname + '/html/incomplete-script').toString(), {
script: true
});
});
it('should be able to parse namespaces', function () {
const namespacedXML = 'content';
parseHTML(namespacedXML).toString().should.eql(namespacedXML);
});
it('should parse "
.." very fast', function () {
for (let i = 0; i < 100; i++)
parseHTML('
');
});
it('should parse "
.." fast', function () {
for (let i = 0; i < 100; i++)
parseHTML('
', {
lowerCaseTagName: true
});
});
// Test for broken tags.
something
it('should parse "
content
other
" (fix h3, span closing tag) very fast', function () {
const root = parseHTML(fs.readFileSync(__dirname + '/html/incomplete-script').toString());
});
});
describe('parseWithValidation', function () {
// parse with validation tests
it('should return Object with valid: true. does not count
as error. instead fixes it to ', function () {
const result = parseHTML('');
result.valid.should.eql(true);
})
it('should return Object with valid: true. does not count as error. instead fixes it to ', function () {
const result = parseHTML('');
result.valid.should.eql(true);
})
it('should return Object with valid: false. does not count
as error', function () {
const result = parseHTML('
');
result.valid.should.eql(false);
})
it('hillcrestpartyrentals.html should return Object with valid: false. not closing
tag on line 476', function () {
const result = parseHTML(fs.readFileSync(__dirname + '/html/hillcrestpartyrentals.html').toString(), {
noFix: true
});
result.valid.should.eql(false);
})
it('google.html should return Object with valid: true', function () {
const result = parseHTML(fs.readFileSync(__dirname + '/html/google.html').toString(), {
noFix: true
});
result.valid.should.eql(true);
})
it('gmail.html should return Object with valid: true', function () {
const result = parseHTML(fs.readFileSync(__dirname + '/html/gmail.html').toString(), {
noFix: true
});
result.valid.should.eql(true);
})
it('ffmpeg.html should return Object with valid: false (extra opening
', function () {
const result = parseHTML(fs.readFileSync(__dirname + '/html/ffmpeg.html').toString(), {
noFix: true
});
result.valid.should.eql(false);
})
// fix issue speed test
it('should fix "
');
})
it('gmail.html should return Object with valid: true', function () {
const result = parseHTML(fs.readFileSync(__dirname + '/html/gmail.html').toString().replace(/<\//gi, '<'));
result.valid.should.eql(false);
})
it('gmail.html should return Object with valid: true', function () {
const result = parseHTML(fs.readFileSync(__dirname + '/html/nice.html').toString().replace(/<\//gi, '<'));
result.valid.should.eql(false);
})
});
describe('TextNode', function () {
describe('#isWhitespace', function () {
let node = new TextNode('');
node.isWhitespace.should.be.ok;
node = new TextNode(' \t');
node.isWhitespace.should.be.ok;
node = new TextNode(' \t \t');
node.isWhitespace.should.be.ok;
});
});
describe('HTMLElement', function () {
describe('#removeWhitespace()', function () {
it('should remove whitespaces while preserving nodes with content', function () {
const root = parseHTML('
\r \n \t
123
');
const p = new HTMLElement('p', {}, '');
p.appendChild(new HTMLElement('h5', {}, ''))
.appendChild(new TextNode('123'));
root.firstChild.removeWhitespace().should.eql(p);
});
});
describe('#rawAttributes', function () {
it('should return escaped attributes of the element', function () {
const root = parseHTML('');
root.firstChild.rawAttributes.should.eql({
'a': '12',
'data-id': '!$$&',
'yAz': '1'
});
});
});
describe('#attributes', function () {
it('should return attributes of the element', function () {
const root = parseHTML('');
root.firstChild.attributes.should.eql({
'a': '12',
'data-id': '!$$&',
'yAz': '1',
'disabled': '',
'class': ''
});
});
});
describe('#getAttribute', function () {
it('should return value of the attribute', function () {
const root = parseHTML('');
root.firstChild.getAttribute('a').should.eql('a1b');
});
it('should return null when there is no such attribute', function () {
const root = parseHTML('');
should.equal(root.firstChild.getAttribute('b'), null);
});
it('should return empty string as broser behavior', function () {
const root = parseHTML('');
const input = root.firstChild;
input.getAttribute('required').should.eql('');
});
it('should return null as broser behavior', function () {
const root = parseHTML('');
const input = root.firstChild;
input.setAttribute('readonly', null);
input.getAttribute('readonly').should.eql('null');
});
});
describe('#setAttribute', function () {
it('should edit the attributes of the element', function () {
const root = parseHTML('');
const attr = root.firstChild.attributes;
root.firstChild.setAttribute('a', 13);
attr.should.eql({
'a': '13',
});
root.firstChild.getAttribute('a').should.eql('13');
root.firstChild.toString().should.eql('');
});
it('should add an attribute to the element', function () {
const root = parseHTML('');
root.firstChild.setAttribute('b', 13);
root.firstChild.attributes.should.eql({
'a': '12',
'b': '13',
});
root.firstChild.toString().should.eql('');
root.firstChild.setAttribute('required', '');
root.firstChild.toString().should.eql('');
});
it('should convert value to string', function () {
const root = parseHTML('');
const p = root.firstChild;
p.setAttribute('b', null);
p.setAttribute('c', undefined);
p.getAttribute('b').should.eql('null');
p.getAttribute('c').should.eql('undefined');
p.toString().should.eql('');
});
it('should throw type Error', function () {
const root = parseHTML('');
const p = root.firstChild;
should.throws(function () { p.setAttribute('b') });
should.throws(function () { p.setAttribute() });
});
it('should keep quotes arount value', function () {
const root = parseHTML('');
root.firstChild.setAttribute('b', 13);
root.firstChild.setAttribute('c', '2');
root.firstChild.attributes.should.eql({
'a': '12',
'b': '13',
'c': '2'
});
root.firstChild.toString().should.eql('');
});
});
describe('#setAttributes', function () {
it('should return attributes of the element', function () {
const root = parseHTML('');
root.firstChild.setAttributes({
c: 12,
d: '&&<>foo'
});
root.firstChild.attributes.should.eql({
'c': '12',
d: '&&<>foo'
});
root.firstChild.toString().should.eql('');
// root.firstChild.toString().should.eql('');
});
});
describe('#removeAttribute', function () {
const root = parseHTML('');
const input = root.firstChild;
input.removeAttribute('required');
input.toString().should.eql('');
});
describe('#hasAttribute', function () {
it('should return true or false when has or has not some attribute', function () {
const root = parseHTML('');
const input = root.firstChild;
input.hasAttribute('required').should.eql(true);
input.removeAttribute('required');
input.hasAttribute('required').should.eql(false);
});
});
describe('#querySelector()', function () {
it('should return correct elements in DOM tree', function () {
const root = parseHTML('
');
root.querySelector('#id').should.eql(root.firstChild);
root.querySelector('span.a').should.eql(root.firstChild.firstChild.firstChild);
root.querySelector('span.b').should.eql(root.firstChild.firstChild.firstChild);
root.querySelector('span.a.b').should.eql(root.firstChild.firstChild.firstChild);
root.querySelector('#id .b').should.eql(root.firstChild.firstChild.firstChild);
root.querySelector('#id span').should.eql(root.firstChild.firstChild.firstChild);
root.querySelector('[data-id=myid]').should.eql(root.firstChild);
root.querySelector('[data-id="myid"]').should.eql(root.firstChild);
});
});
describe('#querySelectorAll()', function () {
it('should return correct elements in DOM tree', function () {
const root = parseHTML('
');
root.querySelectorAll('#id').should.eql([root.firstChild]);
root.querySelectorAll('span.a').should.eql([root.firstChild.firstChild.firstChild]);
root.querySelectorAll('span.b').should.eql([root.firstChild.firstChild.firstChild]);
root.querySelectorAll('span.a.b').should.eql([root.firstChild.firstChild.firstChild]);
root.querySelectorAll('#id .b').should.eql([root.firstChild.firstChild.firstChild]);
root.querySelectorAll('#id span').should.eql(root.firstChild.firstChild.childNodes);
root.querySelectorAll('#id, #id .b').should.eql([root.firstChild, root.firstChild.firstChild.firstChild]);
});
it('should return just one element', function () {
const root = parseHTML('