| {"tests": [ |
| |
| {"description":"DOCTYPE without name", |
| "input":"<!DOCTYPE>", |
| "output":["ParseError", "ParseError", ["DOCTYPE", null, null, null, false]]}, |
| |
| {"description":"DOCTYPE without space before name", |
| "input":"<!DOCTYPEhtml>", |
| "output":["ParseError", ["DOCTYPE", "html", null, null, true]]}, |
| |
| {"description":"Incorrect DOCTYPE without a space before name", |
| "input":"<!DOCTYPEfoo>", |
| "output":["ParseError", ["DOCTYPE", "foo", null, null, true]]}, |
| |
| {"description":"DOCTYPE with publicId", |
| "input":"<!DOCTYPE html PUBLIC \"-//W3C//DTD HTML Transitional 4.01//EN\">", |
| "output":[["DOCTYPE", "html", "-//W3C//DTD HTML Transitional 4.01//EN", null, true]]}, |
| |
| {"description":"DOCTYPE with EOF after PUBLIC", |
| "input":"<!DOCTYPE html PUBLIC", |
| "output":["ParseError", ["DOCTYPE", "html", null, null, false]]}, |
| |
| {"description":"DOCTYPE with EOF after PUBLIC '", |
| "input":"<!DOCTYPE html PUBLIC '", |
| "output":["ParseError", ["DOCTYPE", "html", "", null, false]]}, |
| |
| {"description":"DOCTYPE with EOF after PUBLIC 'x", |
| "input":"<!DOCTYPE html PUBLIC 'x", |
| "output":["ParseError", ["DOCTYPE", "html", "x", null, false]]}, |
| |
| {"description":"DOCTYPE with systemId", |
| "input":"<!DOCTYPE html SYSTEM \"-//W3C//DTD HTML Transitional 4.01//EN\">", |
| "output":[["DOCTYPE", "html", null, "-//W3C//DTD HTML Transitional 4.01//EN", true]]}, |
| |
| {"description":"DOCTYPE with publicId and systemId", |
| "input":"<!DOCTYPE html PUBLIC \"-//W3C//DTD HTML Transitional 4.01//EN\" \"-//W3C//DTD HTML Transitional 4.01//EN\">", |
| "output":[["DOCTYPE", "html", "-//W3C//DTD HTML Transitional 4.01//EN", "-//W3C//DTD HTML Transitional 4.01//EN", true]]}, |
| |
| {"description":"DOCTYPE with > in double-quoted publicId", |
| "input":"<!DOCTYPE html PUBLIC \">x", |
| "output":["ParseError", ["DOCTYPE", "html", "", null, false], ["Character", "x"]]}, |
| |
| {"description":"DOCTYPE with > in single-quoted publicId", |
| "input":"<!DOCTYPE html PUBLIC '>x", |
| "output":["ParseError", ["DOCTYPE", "html", "", null, false], ["Character", "x"]]}, |
| |
| {"description":"DOCTYPE with > in double-quoted systemId", |
| "input":"<!DOCTYPE html PUBLIC \"foo\" \">x", |
| "output":["ParseError", ["DOCTYPE", "html", "foo", "", false], ["Character", "x"]]}, |
| |
| {"description":"DOCTYPE with > in single-quoted systemId", |
| "input":"<!DOCTYPE html PUBLIC 'foo' '>x", |
| "output":["ParseError", ["DOCTYPE", "html", "foo", "", false], ["Character", "x"]]}, |
| |
| {"description":"Incomplete doctype", |
| "input":"<!DOCTYPE html ", |
| "output":["ParseError", ["DOCTYPE", "html", null, null, false]]}, |
| |
| {"description":"Numeric entity representing the NUL character", |
| "input":"�", |
| "output":["ParseError", ["Character", "\uFFFD"]]}, |
| |
| {"description":"Hexadecimal entity representing the NUL character", |
| "input":"�", |
| "output":["ParseError", ["Character", "\uFFFD"]]}, |
| |
| {"description":"Numeric entity representing a codepoint after 1114111 (U+10FFFF)", |
| "input":"�", |
| "output":["ParseError", ["Character", "\uFFFD"]]}, |
| |
| {"description":"Hexadecimal entity representing a codepoint after 1114111 (U+10FFFF)", |
| "input":"�", |
| "output":["ParseError", ["Character", "\uFFFD"]]}, |
| |
| {"description":"Hexadecimal entity pair representing a surrogate pair", |
| "input":"��", |
| "output":["ParseError", ["Character", "\uFFFD"], "ParseError", ["Character", "\uFFFD"]]}, |
| |
| {"description":"Hexadecimal entity with mixed uppercase and lowercase", |
| "input":"ꯍ", |
| "output":[["Character", "\uABCD"]]}, |
| |
| {"description":"Entity without a name", |
| "input":"&;", |
| "output":[["Character", "&;"]]}, |
| |
| {"description":"Unescaped ampersand in attribute value", |
| "input":"<h a='&'>", |
| "output":[["StartTag", "h", { "a":"&" }]]}, |
| |
| {"description":"StartTag containing <", |
| "input":"<a<b>", |
| "output":[["StartTag", "a<b", { }]]}, |
| |
| {"description":"Non-void element containing trailing /", |
| "input":"<h/>", |
| "output":[["StartTag","h",{},true]]}, |
| |
| {"description":"Void element with permitted slash", |
| "input":"<br/>", |
| "output":[["StartTag","br",{},true]]}, |
| |
| {"description":"Void element with permitted slash (with attribute)", |
| "input":"<br foo='bar'/>", |
| "output":[["StartTag","br",{"foo":"bar"},true]]}, |
| |
| {"description":"StartTag containing /", |
| "input":"<h/a='b'>", |
| "output":["ParseError", ["StartTag", "h", { "a":"b" }]]}, |
| |
| {"description":"Double-quoted attribute value", |
| "input":"<h a=\"b\">", |
| "output":[["StartTag", "h", { "a":"b" }]]}, |
| |
| {"description":"Unescaped </", |
| "input":"</", |
| "output":["ParseError", ["Character", "</"]]}, |
| |
| {"description":"Illegal end tag name", |
| "input":"</1>", |
| "output":["ParseError", ["Comment", "1"]]}, |
| |
| {"description":"Simili processing instruction", |
| "input":"<?namespace>", |
| "output":["ParseError", ["Comment", "?namespace"]]}, |
| |
| {"description":"A bogus comment stops at >, even if preceeded by two dashes", |
| "input":"<?foo-->", |
| "output":["ParseError", ["Comment", "?foo--"]]}, |
| |
| {"description":"Unescaped <", |
| "input":"foo < bar", |
| "output":[["Character", "foo "], "ParseError", ["Character", "< bar"]]}, |
| |
| {"description":"Null Byte Replacement", |
| "input":"\u0000", |
| "output":["ParseError", ["Character", "\u0000"]]}, |
| |
| {"description":"Comment with dash", |
| "input":"<!---x", |
| "output":["ParseError", ["Comment", "-x"]]}, |
| |
| {"description":"Entity + newline", |
| "input":"\nx\n>\n", |
| "output":[["Character","\nx\n>\n"]]}, |
| |
| {"description":"Start tag with no attributes but space before the greater-than sign", |
| "input":"<h >", |
| "output":[["StartTag", "h", {}]]}, |
| |
| {"description":"Empty attribute followed by uppercase attribute", |
| "input":"<h a B=''>", |
| "output":[["StartTag", "h", {"a":"", "b":""}]]}, |
| |
| {"description":"Double-quote after attribute name", |
| "input":"<h a \">", |
| "output":["ParseError", ["StartTag", "h", {"a":"", "\"":""}]]}, |
| |
| {"description":"Single-quote after attribute name", |
| "input":"<h a '>", |
| "output":["ParseError", ["StartTag", "h", {"a":"", "'":""}]]}, |
| |
| {"description":"Empty end tag with following characters", |
| "input":"a</>bc", |
| "output":[["Character", "a"], "ParseError", ["Character", "bc"]]}, |
| |
| {"description":"Empty end tag with following tag", |
| "input":"a</><b>c", |
| "output":[["Character", "a"], "ParseError", ["StartTag", "b", {}], ["Character", "c"]]}, |
| |
| {"description":"Empty end tag with following comment", |
| "input":"a</><!--b-->c", |
| "output":[["Character", "a"], "ParseError", ["Comment", "b"], ["Character", "c"]]}, |
| |
| {"description":"Empty end tag with following end tag", |
| "input":"a</></b>c", |
| "output":[["Character", "a"], "ParseError", ["EndTag", "b"], ["Character", "c"]]} |
| |
| ]} |