asynctest(
'browser.tinymce.core.html.SaxParserTest',
[
'ephox.mcagar.api.LegacyUnit',
'ephox.agar.api.Pipeline',
'tinymce.core.html.SaxParser',
'tinymce.core.html.Writer',
'tinymce.core.html.Schema',
'tinymce.core.util.Tools'
],
function (LegacyUnit, Pipeline, SaxParser, Writer, Schema, Tools) {
var success = arguments[arguments.length - 2];
var failure = arguments[arguments.length - 1];
var suite = LegacyUnit.createSuite();
var writer = new Writer(), schema = new Schema();
var createCounter = function (writer) {
var counts = {};
return {
counts: counts,
comment: function (text) {
if ("comment" in counts) {
counts.comment++;
} else {
counts.comment = 1;
}
writer.comment(text);
},
cdata: function (text) {
if ("cdata" in counts) {
counts.cdata++;
} else {
counts.cdata = 1;
}
writer.cdata(text);
},
text: function (text, raw) {
if ("text" in counts) {
counts.text++;
} else {
counts.text = 1;
}
writer.text(text, raw);
},
start: function (name, attrs, empty) {
if ("start" in counts) {
counts.start++;
} else {
counts.start = 1;
}
writer.start(name, attrs, empty);
},
end: function (name) {
if ("end" in counts) {
counts.end++;
} else {
counts.end = 1;
}
writer.end(name);
},
pi: function (name, text) {
if ("pi" in counts) {
counts.pi++;
} else {
counts.pi = 1;
}
writer.pi(name, text);
},
doctype: function (text) {
if ("doctype:" in counts) {
counts.doctype++;
} else {
counts.doctype = 1;
}
writer.doctype(text);
}
};
};
suite.test('Parse elements', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse(
'<span id=id1 title="title value" class=\'class1 class2\' data-value="value1" ' +
'MYATTR="val1" myns:myattr="val2" disabled empty=""></span>'
);
LegacyUnit.equal(
writer.getContent(),
'<span id="id1" title="title value" class="class1 class2" data-value="value1" myattr="val1" ' +
'myns:myattr="val2" disabled="disabled" empty=""></span>',
'Parse attribute formats.'
);
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1 }, 'Parse attribute formats counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<b href=\'"&<>\'></b>');
LegacyUnit.equal(writer.getContent(), '<b href=""&<>"></b>', 'Parse attributes with <> in them.');
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1 }, 'Parse attributes with <> in them (count).');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<span title=" "class=" "></span>');
LegacyUnit.equal(writer.getContent(), '<span title=" " class=" "></span>', 'Parse compressed attributes.');
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1 }, 'Parse compressed attributes (count).');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<span title></span>');
LegacyUnit.equal(writer.getContent(), '<span title=""></span>', 'Single empty attribute.');
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1 }, 'Single empty attributes (count).');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<span class="class" title></span>');
LegacyUnit.equal(writer.getContent(), '<span class="class" title=""></span>', 'Empty attribute at end.');
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1 }, 'Empty attribute at end (count).');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<span title class="class"></span>');
LegacyUnit.equal(writer.getContent(), '<span title="" class="class"></span>', 'Empty attribute at start.');
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1 }, 'Empty attribute at start (count).');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<img src="test">');
LegacyUnit.equal(writer.getContent(), '<img src="test" />', 'Parse empty element.');
LegacyUnit.deepEqual(counter.counts, { start: 1 }, 'Parse empty element counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<img\nsrc="test"\ntitle="row1\nrow2">');
LegacyUnit.equal(writer.getContent(), '<img src="test" title="row1\nrow2" />', 'Parse attributes with linebreak.');
LegacyUnit.deepEqual(counter.counts, { start: 1 }, 'Parse attributes with linebreak counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<img \t \t src="test" \t \t title="\t row1\t row2">');
LegacyUnit.equal(writer.getContent(), '<img src="test" title="\t row1\t row2" />', 'Parse attributes with whitespace.');
LegacyUnit.deepEqual(counter.counts, { start: 1 }, 'Parse attributes with whitespace counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<myns:mytag>text</myns:mytag>');
LegacyUnit.equal(writer.getContent(), '<myns:mytag>text</myns:mytag>', 'Parse element with namespace.');
LegacyUnit.deepEqual(counter.counts, { start: 1, text: 1, end: 1 }, 'Parse element with namespace counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<myns-mytag>text</myns-mytag>');
LegacyUnit.equal(writer.getContent(), '<myns-mytag>text</myns-mytag>', 'Parse element with dash name.');
LegacyUnit.deepEqual(counter.counts, { start: 1, text: 1, end: 1 }, 'Parse element with dash name counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<myns_mytag>text</myns_mytag>');
LegacyUnit.equal(writer.getContent(), '<myns_mytag>text</myns_mytag>', 'Parse element with underscore name.');
LegacyUnit.deepEqual(counter.counts, { start: 1, text: 1, end: 1 }, 'Parse element with underscore name counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<p>text2<b>text3</p>text4</b>text5');
LegacyUnit.equal(writer.getContent(), 'text1<p>text2<b>text3</b></p>text4text5', 'Parse tag soup 1.');
LegacyUnit.deepEqual(counter.counts, { text: 5, start: 2, end: 2 }, 'Parse tag soup 1 counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<P>text2<B>text3</p>text4</b>text5');
LegacyUnit.equal(writer.getContent(), 'text1<p>text2<b>text3</b></p>text4text5', 'Parse tag soup 2.');
LegacyUnit.deepEqual(counter.counts, { text: 5, start: 2, end: 2 }, 'Parse tag soup 2 counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<P>text2<B>tex<t3</p>te>xt4</b>text5');
LegacyUnit.equal(writer.getContent(), 'text1<p>text2<b>tex<t3</b></p>te>xt4text5', 'Parse tag soup 3.');
LegacyUnit.deepEqual(counter.counts, { text: 5, start: 2, end: 2 }, 'Parse tag soup 3 counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<p>text2<b>text3');
LegacyUnit.equal(writer.getContent(), 'text1<p>text2<b>text3</b></p>', 'Parse tag soup 4.');
LegacyUnit.deepEqual(counter.counts, { text: 3, start: 2, end: 2 }, 'Parse tag soup 4 counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<script>text2');
LegacyUnit.equal(writer.getContent(), 'text1<script>text2</s' + 'cript>', 'Parse tag soup 5.');
LegacyUnit.deepEqual(counter.counts, { text: 2, start: 1, end: 1 }, 'Parse tag soup 5 counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<style>text2');
LegacyUnit.equal(writer.getContent(), 'text1<style>text2</st' + 'yle>', 'Parse tag soup 6.');
LegacyUnit.deepEqual(counter.counts, { text: 2, start: 1, end: 1 }, 'Parse tag soup 6 counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<span title="<test" data-test="test>"></span>');
LegacyUnit.equal(
writer.getContent(),
'text1<span title="<test" data-test="test>"></span>',
'Parse element with </> in attributes.'
);
LegacyUnit.deepEqual(counter.counts, { text: 1, start: 1, end: 1 }, 'Parse element with </> in attributes counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse("text\n<SC" + "RIPT type=mce-text/javascript>// <![CDATA[\nalert('HELLO WORLD!');\n// ]]></SC" + "RIPT>");
LegacyUnit.equal(
writer.getContent(),
"text\n<sc" + "ript type=\"mce-text/javascript\">// <![CDATA[\nalert('HELLO WORLD!');\n// ]]></sc" + "ript>",
'Parse cdata script.'
);
LegacyUnit.deepEqual(counter.counts, { text: 2, start: 1, end: 1 }, 'Parse cdata script counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<noscript>te<br>xt2</noscript>text3');
LegacyUnit.equal(writer.getContent(), 'text1<noscript>te<br>xt2</noscript>text3', 'Parse noscript elements.');
LegacyUnit.deepEqual(counter.counts, { text: 3, start: 1, end: 1 }, 'Parse noscript elements counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<p>a</p><p /><p>b</p>');
LegacyUnit.equal(writer.getContent(), '<p>a</p><p></p><p>b</p>', 'Parse invalid closed element.');
LegacyUnit.deepEqual(counter.counts, { text: 2, start: 3, end: 3 }, 'Parse invalid closed element counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<br><br /><br/>');
LegacyUnit.equal(writer.getContent(), '<br /><br /><br />', 'Parse short ended elements.');
LegacyUnit.deepEqual(counter.counts, { start: 3 }, 'Parse short ended elements counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<p ></p>');
LegacyUnit.equal(writer.getContent(), '<p></p>', 'Parse start elements with whitespace only attribs part.');
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1 }, 'Parse start elements with whitespace only attribs part (counts).');
});
suite.test('Parse style elements', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<em><style>// <b>tag</b></st' + 'yle>text2</em>');
LegacyUnit.equal(writer.getContent(), 'text1<em><style>// <b>tag</b></st' + 'yle>text2</em>', 'Parse style element.');
LegacyUnit.deepEqual(counter.counts, { start: 2, end: 2, text: 3 }, 'Parse style element counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<em><style id="id">// <b>tag</b></st' + 'yle>text2</em>');
LegacyUnit.equal(
writer.getContent(),
'text1<em><style id="id">// <b>tag</b></st' + 'yle>text2</em>',
'Parse style element with attributes.'
);
LegacyUnit.deepEqual(counter.counts, { text: 3, start: 2, end: 2 }, 'Parse style element with attributes counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<em><style></st' + 'yle>text2</span>');
LegacyUnit.equal(writer.getContent(), 'text1<em><style></st' + 'yle>text2</em>', 'Parse empty style element.');
LegacyUnit.deepEqual(counter.counts, { text: 2, start: 2, end: 2 }, 'Parse empty style element counts.');
counter = createCounter(writer);
parser = new SaxParser(Tools.extend({ validate: true }, counter), new Schema({ invalid_elements: 'style' }));
writer.reset();
parser.parse('text1<em><style>text2</st' + 'yle>text3</em>');
LegacyUnit.equal(writer.getContent(), 'text1<em>text3</em>', 'Parse invalid style element.');
LegacyUnit.deepEqual(counter.counts, { text: 2, start: 1, end: 1 }, 'Parse invalid style element (count).');
});
suite.test('Parse script elements', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<em><script>// <b>tag</b></s' + 'cript>text2</em>');
LegacyUnit.equal(writer.getContent(), 'text1<em><script>// <b>tag</b></s' + 'cript>text2</em>', 'Parse script element.');
LegacyUnit.deepEqual(counter.counts, { start: 2, end: 2, text: 3 }, 'Parse script element counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<em><script id="id">// <b>tag</b></s' + 'cript>text2</em>');
LegacyUnit.equal(
writer.getContent(),
'text1<em><script id="id">// <b>tag</b></s' + 'cript>text2</em>',
'Parse script element with attributes.'
);
LegacyUnit.deepEqual(counter.counts, { start: 2, end: 2, text: 3 }, 'Parse script element with attributes counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<em><script></s' + 'cript>text2</em>');
LegacyUnit.equal(writer.getContent(), 'text1<em><script></s' + 'cript>text2</em>', 'Parse empty script element.');
LegacyUnit.deepEqual(counter.counts, { text: 2, start: 2, end: 2 }, 'Parse empty script element counts.');
counter = createCounter(writer);
parser = new SaxParser(Tools.extend({ validate: true }, counter), new Schema({ invalid_elements: 'script' }));
writer.reset();
parser.parse('text1<em><s' + 'cript>text2</s' + 'cript>text3</em>');
LegacyUnit.equal(writer.getContent(), 'text1<em>text3</em>', 'Parse invalid script element.');
LegacyUnit.deepEqual(counter.counts, { text: 2, start: 1, end: 1 }, 'Parse invalid script element (count).');
});
suite.test('Parse text', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('');
LegacyUnit.equal(writer.getContent(), '', 'Parse empty.');
LegacyUnit.deepEqual(counter.counts, {}, 'Parse empty counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text');
LegacyUnit.equal(writer.getContent(), 'text', 'Parse single text node.');
LegacyUnit.deepEqual(counter.counts, { text: 1 }, 'Parse single text node counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<b>text</b>');
LegacyUnit.equal(writer.getContent(), '<b>text</b>', 'Parse wrapped text.');
LegacyUnit.deepEqual(counter.counts, { start: 1, text: 1, end: 1 }, 'Parse wrapped text counts');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('text1<b>text2</b>');
LegacyUnit.equal(writer.getContent(), 'text1<b>text2</b>', 'Parse text at start.');
LegacyUnit.deepEqual(counter.counts, { start: 1, text: 2, end: 1 }, 'Parse text at start counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<b>text1</b>text2');
LegacyUnit.equal(writer.getContent(), '<b>text1</b>text2', 'Parse text at end.');
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1, text: 2 }, 'Parse text at end counts.');
});
suite.test('Parsing comments', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<!-- comment value -->');
LegacyUnit.equal(writer.getContent(), '<!-- comment value -->', 'Parse comment with value.');
LegacyUnit.deepEqual(counter.counts, { comment: 1 }, 'Parse comment with value count.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<!---->');
LegacyUnit.equal(writer.getContent(), '', 'Parse comment without value.');
LegacyUnit.deepEqual(counter.counts, {}, 'Parse comment without value count.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<!--<b></b>-->');
LegacyUnit.equal(writer.getContent(), '<!--<b></b>-->', 'Parse comment with tag inside.');
LegacyUnit.deepEqual(counter.counts, { comment: 1 }, 'Parse comment with tag inside counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<b>a<!-- value -->b</b>');
LegacyUnit.equal(writer.getContent(), '<b>a<!-- value -->b</b>', 'Parse comment with tags around it.');
LegacyUnit.deepEqual(counter.counts, { comment: 1, text: 2, start: 1, end: 1 }, 'Parse comment with tags around it counts.');
});
suite.test('Parsing cdata', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<![CDATA[test text]]>');
LegacyUnit.equal(writer.getContent(), '<![CDATA[test text]]>', 'Parse cdata with value.');
LegacyUnit.deepEqual(counter.counts, { cdata: 1 }, 'Parse cdata with value counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<![CDATA[]]>');
LegacyUnit.equal(writer.getContent(), '', 'Parse cdata without value.');
LegacyUnit.deepEqual(counter.counts, {}, 'Parse cdata without value counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<![CDATA[<b>a</b>]]>');
LegacyUnit.equal(writer.getContent(), '<![CDATA[<b>a</b>]]>', 'Parse cdata with tag inside.');
LegacyUnit.deepEqual(counter.counts, { cdata: 1 }, 'Parse cdata with tag inside counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<b>a<![CDATA[value]]>b</b>');
LegacyUnit.equal(writer.getContent(), '<b>a<![CDATA[value]]>b</b>', 'Parse cdata with tags around it.');
LegacyUnit.deepEqual(counter.counts, { cdata: 1, start: 1, end: 1, text: 2 }, 'Parse cdata with tags around it counts.');
});
suite.test('Parse PI', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<?xml version="1.0" encoding="UTF-8" ?>text1');
LegacyUnit.equal(writer.getContent(), '<?xml version="1.0" encoding="UTF-8" ?>text1', 'Parse PI with attributes.');
LegacyUnit.deepEqual(counter.counts, { pi: 1, text: 1 }, 'Parse PI with attributes counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<?xml?>text1');
LegacyUnit.equal(writer.getContent(), '<?xml?>text1', 'Parse PI with no data.');
LegacyUnit.deepEqual(counter.counts, { pi: 1, text: 1 }, 'Parse PI with data counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<?xml somevalue/>text1');
LegacyUnit.equal(writer.getContent(), '<?xml somevalue?>text1', 'Parse PI with IE style ending.');
LegacyUnit.deepEqual(counter.counts, { pi: 1, text: 1 }, 'Parse PI with IE style ending counts.');
});
suite.test('Parse doctype', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse(
'<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">text1'
);
LegacyUnit.equal(
writer.getContent(),
'<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">text1',
'Parse DOCTYPE.'
);
LegacyUnit.deepEqual(counter.counts, { doctype: 1, text: 1 }, 'Parse HTML5 DOCTYPE counts.');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<!DOCTYPE html>text1');
LegacyUnit.equal(writer.getContent(), '<!DOCTYPE html>text1', 'Parse HTML5 DOCTYPE.');
LegacyUnit.deepEqual(counter.counts, { doctype: 1, text: 1 }, 'Parse HTML5 DOCTYPE counts.');
});
suite.test('Parse (validate)', function () {
var counter, parser;
counter = createCounter(writer);
counter.validate = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<invalid1>123<invalid2 />456<span title="title" invalid3="value">789</span>012</invalid1>');
LegacyUnit.equal(writer.getContent(), '123456<span title="title">789</span>012', 'Parse invalid elements and attributes.');
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1, text: 4 }, 'Parse invalid elements and attributes counts.');
});
suite.test('Self closing', function () {
var counter, parser;
counter = createCounter(writer);
counter.validate = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<ul><li>1<li><b>2</b><li><em><b>3</b></em></ul>');
LegacyUnit.equal(
writer.getContent(),
'<ul><li>1</li><li><b>2</b></li><li><em><b>3</b></em></li></ul>',
'Parse list with self closing items.'
);
});
suite.test('Preserve internal elements', function () {
var counter, parser, schema;
schema = new Schema({ valid_elements: 'b' });
counter = createCounter(writer);
counter.validate = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<span id="id"><b>text</b></span><span id="id" data-mce-type="something"></span>');
LegacyUnit.equal(
writer.getContent(),
'<b>text</b><span id="id" data-mce-type="something"></span>',
'Preserve internal span element without any span schema rule.'
);
schema = new Schema({ valid_elements: 'b,span[class]' });
counter = createCounter(writer);
counter.validate = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<span id="id" class="class"><b>text</b></span><span id="id" data-mce-type="something"></span>');
LegacyUnit.equal(
writer.getContent(),
'<span class="class"><b>text</b></span><span id="id" data-mce-type="something"></span>',
'Preserve internal span element with a span schema rule.'
);
});
suite.test('Remove internal elements', function () {
var counter, parser, schema;
schema = new Schema({ valid_elements: 'b' });
counter = createCounter(writer);
counter.validate = true;
counter.remove_internals = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<span id="id"><b>text</b></span><span id="id" data-mce-type="something"></span>');
LegacyUnit.equal(writer.getContent(), '<b>text</b>', 'Remove internal span element without any span schema rule.');
schema = new Schema({ valid_elements: 'b,span[class]' });
counter = createCounter(writer);
counter.validate = true;
counter.remove_internals = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<span id="id" class="class"><b>text</b></span><span id="id" data-mce-type="something"></span>');
LegacyUnit.equal(
writer.getContent(),
'<span class="class"><b>text</b></span>',
'Remove internal span element with a span schema rule.'
);
// Reset
counter.remove_internals = false;
});
suite.test('Parse attr with backslash #5436', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<a title="\\" href="h">x</a>');
LegacyUnit.equal(writer.getContent(), '<a title="\\" href="h">x</a>');
});
suite.test('Parse no attributes span before strong', function () {
var counter, parser;
counter = createCounter(writer);
counter.validate = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<p><span>A</span> <strong>B</strong></p>');
LegacyUnit.equal(writer.getContent(), '<p>A <strong>B</strong></p>');
});
suite.test('Conditional comments (allowed)', function () {
var counter, parser;
counter = createCounter(writer);
counter.validate = false;
counter.allow_conditional_comments = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<!--[if gte IE 4]>alert(1)<![endif]-->');
LegacyUnit.equal(writer.getContent(), '<!--[if gte IE 4]>alert(1)<![endif]-->');
});
suite.test('Conditional comments (denied)', function () {
var counter, parser;
counter = createCounter(writer);
counter.validate = false;
counter.allow_conditional_comments = false;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<!--[if gte IE 4]>alert(1)<![endif]-->');
LegacyUnit.equal(writer.getContent(), '<!-- [if gte IE 4]>alert(1)<![endif]-->');
writer.reset();
parser.parse('<!--[if !IE]>alert(1)<![endif]-->');
LegacyUnit.equal(writer.getContent(), '<!-- [if !IE]>alert(1)<![endif]-->');
writer.reset();
parser.parse('<!--[iF !IE]>alert(1)<![endif]-->');
LegacyUnit.equal(writer.getContent(), '<!-- [iF !IE]>alert(1)<![endif]-->');
});
suite.test('Parse script urls (allowed)', function () {
var counter, parser;
counter = createCounter(writer);
counter.validate = false;
counter.allow_script_urls = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse(
'<a href="javascript:alert(1)">1</a>' +
'<a href=" 2 ">2</a>' +
'<a href="data:text/html;base64,PHN2Zy9vbmxvYWQ9YWxlcnQoMik+">3</a>'
);
LegacyUnit.equal(
writer.getContent(),
'<a href="javascript:alert(1)">1</a><a href=" 2 ">2</a>' +
'<a href="data:text/html;base64,PHN2Zy9vbmxvYWQ9YWxlcnQoMik+">3</a>'
);
});
suite.test('Parse script urls (allowed html data uris)', function () {
var counter, parser;
counter = createCounter(writer);
counter.validate = false;
counter.allow_html_data_urls = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse(
'<a href="javascript:alert(1)">1</a>' +
'<a href="data:text/html;base64,PHN2Zy9vbmxvYWQ9YWxlcnQoMik+">2</a>'
);
LegacyUnit.equal(
writer.getContent(),
'<a>1</a>' +
'<a href="data:text/html;base64,PHN2Zy9vbmxvYWQ9YWxlcnQoMik+">2</a>'
);
});
suite.test('Parse script urls (denied)', function () {
var counter, parser;
counter = createCounter(writer);
counter.validate = false;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse(
'<a href="jAvaScript:alert(1)">1</a>' +
'<a href="vbscript:alert(2)">2</a>' +
'<a href="java\u0000script:alert(3)">3</a>' +
'<a href="\njavascript:alert(4)">4</a>' +
'<a href="java\nscript:alert(5)">5</a>' +
'<a href="java\tscript:alert(6)">6</a>' +
'<a href="%6aavascript:alert(7)">7</a>' +
'<a href="data:text/html;base64,PHN2Zy9vbmxvYWQ9YWxlcnQoMik+">8</a>' +
'<a href=" dAt%61: tExt/html ; bAse64 , PHN2Zy9vbmxvYWQ9YWxlcnQoMik+">9</a>' +
'<object data="data:text/html;base64,PHN2Zy9vbmxvYWQ9YWxlcnQoMik+">10</object>' +
'<button formaction="javascript:alert(11)">11</button>' +
'<table background="javascript:alert(12)"><tr><tr>12</tr></tr></table>' +
'<a href="mhtml:13">13</a>' +
'<img src="">' +
'<a href="%E3%82%AA%E3%83%BC%E3%83">Invalid url</a>'
);
LegacyUnit.equal(
writer.getContent(),
'<a>1</a><a>2</a><a>3</a><a>4</a><a>5</a><a>6</a><a>7</a><a>8</a><a>9</a>' +
'<object>10</object><button>11</button><table><tr></tr><tr>12</tr></table><a>13</a>' +
'<img src="" />' +
'<a href="%E3%82%AA%E3%83%BC%E3%83">Invalid url</a>'
);
});
suite.test('Parse away bogus elements', function () {
var testBogusSaxParse = function (inputHtml, outputHtml, counters) {
var counter, parser;
counter = createCounter(writer);
counter.validate = true;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse(inputHtml);
LegacyUnit.equal(writer.getContent(), outputHtml);
LegacyUnit.deepEqual(counter.counts, counters);
};
testBogusSaxParse('a<b data-mce-bogus="1">b</b>c', 'abc', { text: 3 });
testBogusSaxParse('a<b data-mce-bogus="true">b</b>c', 'abc', { text: 3 });
testBogusSaxParse('a<b data-mce-bogus="1"></b>c', 'ac', { text: 2 });
testBogusSaxParse('a<b data-mce-bogus="all">b</b>c', 'ac', { text: 2 });
testBogusSaxParse('a<b data-mce-bogus="all"><!-- x --><?xml?></b>c', 'ac', { text: 2 });
testBogusSaxParse('a<b data-mce-bogus="all"><b>b</b></b>c', 'ac', { text: 2 });
testBogusSaxParse('a<b data-mce-bogus="all"><br>b</b><b>c</b>', 'a<b>c</b>', { start: 1, end: 1, text: 2 });
testBogusSaxParse('a<b data-mce-bogus="all"><img>b</b><b>c</b>', 'a<b>c</b>', { start: 1, end: 1, text: 2 });
testBogusSaxParse('a<b data-mce-bogus="all"><b attr="x">b</b></b>c', 'ac', { text: 2 });
testBogusSaxParse('a<b data-mce-bogus="all"></b>c', 'ac', { text: 2 });
testBogusSaxParse('a<b data-mce-bogus="all"></b><b>c</b>', 'a<b>c</b>', { start: 1, end: 1, text: 2 });
});
suite.test('findEndTag', function () {
var testFindEndTag = function (html, startIndex, expectedIndex) {
LegacyUnit.equal(SaxParser.findEndTag(schema, html, startIndex), expectedIndex);
};
testFindEndTag('<b>', 3, 3);
testFindEndTag('<img>', 3, 3);
testFindEndTag('<b></b>', 3, 7);
testFindEndTag('<b><img></b>', 3, 12);
testFindEndTag('<b><!-- </b> --></b>', 3, 20);
testFindEndTag('<span><b><i>a<img>b</i><b>c</b></b></span>', 9, 35);
});
suite.test('parse XSS PI', function () {
var counter, parser;
counter = createCounter(writer);
counter.validate = false;
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse(
'<?xml><iframe SRC=javascript:alert('XSS')>?>'
);
LegacyUnit.equal(
writer.getContent(),
'<?xml ><iframe SRC=&#106&#97&#118&#97&#115&#99&#114&#105&#112&' +
'#116&#58&#97&#108&#101&#114&#116&#40&#39&#88&#83&#83&#39&#41>?>'
);
});
suite.test('aria attributes', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(Tools.extend({ validate: true }, counter), schema);
writer.reset();
parser.parse('<span aria-label="test" role="myrole" unsupportedattr="2">a</span>');
LegacyUnit.equal(
writer.getContent(),
'<span aria-label="test" role="myrole">a</span>'
);
});
suite.test('Parse elements with numbers', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<a5>text</a5>');
LegacyUnit.equal(writer.getContent(), '<a5>text</a5>', 'Parse element with numbers.');
LegacyUnit.deepEqual(counter.counts, { start: 1, text: 1, end: 1 }, 'Parse element with numbers counts.');
});
suite.test('Parse internal elements with disallowed attributes', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<b data-mce-type="test" id="x" style="color: red" src="1" data="2" onclick="3"></b>');
LegacyUnit.equal(writer.getContent(), '<b data-mce-type="test" id="x" style="color: red"></b>');
LegacyUnit.deepEqual(counter.counts, { start: 1, end: 1 });
});
suite.test('Parse cdata with comments and trim those comments away', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<![CDATA[<!--x--><!--y-->--><!--]]>');
LegacyUnit.equal(writer.getContent(), '<![CDATA[xy]]>');
LegacyUnit.deepEqual(counter.counts, { cdata: 1 });
});
suite.test('Parse special elements', function () {
var counter, parser;
var specialHtml = (
'<b>' +
'<textarea></b></textarea><title></b></title><script></b></script>' +
'<noframes></b></noframes><noscript></b></noscript><style></b></style>' +
'<xmp></b></xmp>' +
'<noembed></b></noembed>' +
'</b>'
);
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse(specialHtml);
LegacyUnit.equal(writer.getContent(), specialHtml);
LegacyUnit.deepEqual(counter.counts, { start: 9, text: 8, end: 9 });
});
suite.test('Parse malformed elements that start with numbers', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('a <2 b b b b b b b b b b b b b b b b b b b b b b');
LegacyUnit.equal(writer.getContent(), 'a <2 b b b b b b b b b b b b b b b b b b b b b b');
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('a <2b>a</2b> b');
LegacyUnit.equal(writer.getContent(), 'a <2b>a</2b> b');
});
suite.test('Parse malformed elements without an end', function () {
var counter, parser;
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('<b b b b b b b b b b b b b b b b b b b b b b b');
LegacyUnit.equal(
writer.getContent(),
'<b b b b b b b b b b b b b b b b b b b b b b b'
);
counter = createCounter(writer);
parser = new SaxParser(counter, schema);
writer.reset();
parser.parse('a a<b c');
LegacyUnit.equal(
writer.getContent(),
'a a<b c'
);
});
Pipeline.async({}, suite.toSteps({}), function () {
success();
}, failure);
}
);
|