Source code

Revision control

Copy as Markdown

Other Tools

Test Info:

<!doctype html>
<html>
<head>
<meta charset="utf-8">
<title>Test for CSS parser diagnostics escaping unprintable
characters correctly</title>
<script src="/tests/SimpleTest/SimpleTest.js"></script>
<link rel="stylesheet" href="/tests/SimpleTest/test.css">
</head>
<body>
<a target="_blank"
>Mozilla Bug 229827</a>
<style id="testbench"></style>
<script type="application/javascript">
// This test has intimate knowledge of how to get the CSS parser to
// emit diagnostics that contain text under control of the user.
// That's not the point of the test, though; the point is only that
// *that text* is properly escaped.
SpecialPowers.wrap(window).docShell.cssErrorReportingEnabled = true;
// There is one "pattern" for each code path through the error reporter
// that might need to escape some kind of user-supplied text.
// Each "pattern" is tested once with each of the "substitution"s below:
// <t>, <i>, and <s> are replaced by the t:, i:, and s: fields of
// each substitution object in turn.
let patterns = [
// REPORT_UNEXPECTED_P (only ever used in contexts where identifier-like
// escaping is appropriate)
{ i: "<t>|x{}", o: "prefix \u2018<i>\u2019" },
// REPORT_UNEXPECTED_TOKEN with:
// _Ident
{ i: "@namespace fnord <t>;", o: "within @namespace: \u2018<i>\u2019" },
// _Ref
{ i: "@namespace fnord #<t>;", o: "within @namespace: \u2018#<i>\u2019" },
// _Function
{ i: "@namespace fnord <t>();", o: "within @namespace: \u2018<i>(\u2019" },
// _Dimension
{ i: "@namespace fnord 14<t>;", o: "within @namespace: \u201814<i>\u2019" },
// _AtKeyword
{ i: "x{@<t>: }", o: "declaration but found \u2018@<i>\u2019." },
// _String
{ i: "x{ color: '<t>'}" , o: 'color but found \u2018"<s>"\u2019.' },
// _Bad_String
{ i: "x{ color: '<t>\n}", o: 'color but found \u2018"<s>\u2019.' },
];
// Blocks of characters to test, and how they should be escaped when
// they appear in identifiers and string constants.
const substitutions = [
// ASCII printables that _can_ normally appear in identifiers,
// so should of course _not_ be escaped.
{ t: "-_0123456789", i: "-_0123456789",
s: "-_0123456789" },
{ t: "abcdefghijklmnopqrstuvwxyz", i: "abcdefghijklmnopqrstuvwxyz",
s: "abcdefghijklmnopqrstuvwxyz" },
{ t: "ABCDEFGHIJKLMNOPQRSTUVWXYZ", i: "ABCDEFGHIJKLMNOPQRSTUVWXYZ",
s: "ABCDEFGHIJKLMNOPQRSTUVWXYZ" },
// ASCII printables that are not normally valid as the first character
// of an identifier, or the character immediately after a leading dash,
// but can be forced into that position with escapes.
{ t: "\\-", i: "\\-", s: "-" },
{ t: "\\30 ", i: "\\30 ", s: "0" },
{ t: "\\31 ", i: "\\31 ", s: "1" },
{ t: "\\32 ", i: "\\32 ", s: "2" },
{ t: "\\33 ", i: "\\33 ", s: "3" },
{ t: "\\34 ", i: "\\34 ", s: "4" },
{ t: "\\35 ", i: "\\35 ", s: "5" },
{ t: "\\36 ", i: "\\36 ", s: "6" },
{ t: "\\37 ", i: "\\37 ", s: "7" },
{ t: "\\38 ", i: "\\38 ", s: "8" },
{ t: "\\39 ", i: "\\39 ", s: "9" },
{ t: "-\\-", i: "--", s: "--" },
{ t: "-\\30 ", i: "-\\30 ", s: "-0" },
{ t: "-\\31 ", i: "-\\31 ", s: "-1" },
{ t: "-\\32 ", i: "-\\32 ", s: "-2" },
{ t: "-\\33 ", i: "-\\33 ", s: "-3" },
{ t: "-\\34 ", i: "-\\34 ", s: "-4" },
{ t: "-\\35 ", i: "-\\35 ", s: "-5" },
{ t: "-\\36 ", i: "-\\36 ", s: "-6" },
{ t: "-\\37 ", i: "-\\37 ", s: "-7" },
{ t: "-\\38 ", i: "-\\38 ", s: "-8" },
{ t: "-\\39 ", i: "-\\39 ", s: "-9" },
// ASCII printables that must be escaped in identifiers.
// Most of these should not be escaped in strings.
{ t: "\\!\\\"\\#\\$", i: "\\!\\\"\\#\\$", s: "!\\\"#$" },
{ t: "\\%\\&\\'\\(", i: "\\%\\&\\'\\(", s: "%&'(" },
{ t: "\\)\\*\\+\\,", i: "\\)\\*\\+\\,", s: ")*+," },
{ t: "\\.\\/\\:\\;", i: "\\.\\/\\:\\;", s: "./:;" },
{ t: "\\<\\=\\>\\?", i: "\\<\\=\\>\\?", s: "<=>?", },
{ t: "\\@\\[\\\\\\]", i: "\\@\\[\\\\\\]", s: "@[\\\\]" },
{ t: "\\^\\`\\{\\}\\~", i: "\\^\\`\\{\\}\\~", s: "^`{}~" },
// U+0000 - U+0020 (C0 controls, space)
// U+000A LINE FEED, U+000C FORM FEED, and U+000D CARRIAGE RETURN
// cannot be put into a CSS token as escaped literal characters, so
// we do them with hex escapes instead.
// The parser replaces U+0000 with U+FFFD.
{ t: "\\\x00\\\x01\\\x02\\\x03", i: "�\\1 \\2 \\3 ",
s: "�\\1 \\2 \\3 " },
{ t: "\\\x04\\\x05\\\x06\\\x07", i: "\\4 \\5 \\6 \\7 ",
s: "\\4 \\5 \\6 \\7 " },
{ t: "\\\x08\\\x09\\000A\\\x0B", i: "\\8 \\9 \\a \\b ",
s: "\\8 \\9 \\a \\b " },
{ t: "\\000C\\000D\\\x0E\\\x0F", i: "\\c \\d \\e \\f ",
s: "\\c \\d \\e \\f " },
{ t: "\\\x10\\\x11\\\x12\\\x13", i: "\\10 \\11 \\12 \\13 ",
s: "\\10 \\11 \\12 \\13 " },
{ t: "\\\x14\\\x15\\\x16\\\x17", i: "\\14 \\15 \\16 \\17 ",
s: "\\14 \\15 \\16 \\17 " },
{ t: "\\\x18\\\x19\\\x1A\\\x1B", i: "\\18 \\19 \\1a \\1b ",
s: "\\18 \\19 \\1a \\1b " },
{ t: "\\\x1C\\\x1D\\\x1E\\\x1F\\ ", i: "\\1c \\1d \\1e \\1f \\ ",
s: "\\1c \\1d \\1e \\1f " },
// U+007F (DELETE) and U+0080 - U+009F (C1 controls)
{ t: "\\\x7f\\\x80\\\x81\\\x82", i: "\\7f \x80\x81\x82",
s: "\\7f \x80\x81\x82" },
{ t: "\\\x83\\\x84\\\x85\\\x86", i: "\x83\x84\x85\x86",
s: "\x83\x84\x85\x86" },
{ t: "\\\x87\\\x88\\\x89\\\x8A", i: "\x87\x88\x89\x8A",
s: "\x87\x88\x89\x8A" },
{ t: "\\\x8B\\\x8C\\\x8D\\\x8E", i: "\x8B\x8C\x8D\x8E",
s: "\x8B\x8C\x8D\x8E" },
{ t: "\\\x8F\\\x90\\\x91\\\x92", i: "\x8F\x90\x91\x92",
s: "\x8F\x90\x91\x92" },
{ t: "\\\x93\\\x94\\\x95\\\x96", i: "\x93\x94\x95\x96",
s: "\x93\x94\x95\x96" },
{ t: "\\\x97\\\x98\\\x99\\\x9A", i: "\x97\x98\x99\x9A",
s: "\x97\x98\x99\x9A" },
{ t: "\\\x9B\\\x9C\\\x9D\\\x9E\\\x9F", i: "\x9B\x9C\x9D\x9E\x9F",
s: "\x9B\x9C\x9D\x9E\x9F" },
// CSS doesn't bother with the full Unicode rules for identifiers,
// instead declaring that any code point greater than or equal to
// U+0080 is a valid identifier character. Test a small handful
// of both basic and astral plane characters.
// Arabic (caution to editors: there is a possibly-invisible U+200E
// LEFT-TO-RIGHT MARK in each string, just before the close quote)
{ t: "أبجدهوزحطيكلمنسعفصقرشتثخذضظغ‎",
i: "أبجدهوزحطيكلمنسعفصقرشتثخذضظغ‎",
s: "أبجدهوزحطيكلمنسعفصقرشتثخذضظغ‎" },
// Box drawing
{ t: "─│┌┐└┘├┤┬┴┼╭╮╯╰╴╵╶╷",
i: "─│┌┐└┘├┤┬┴┼╭╮╯╰╴╵╶╷",
s: "─│┌┐└┘├┤┬┴┼╭╮╯╰╴╵╶╷" },
// CJK Unified Ideographs
{ t: "一丁丂七丄丅丆万丈三上下丌不与丏",
i: "一丁丂七丄丅丆万丈三上下丌不与丏",
s: "一丁丂七丄丅丆万丈三上下丌不与丏" },
// CJK Unified Ideographs Extension B (astral)
{ t: "𠀀𠀁𠀂𠀃𠀄𠀅𠀆𠀇𠀈𠀉𠀊𠀋𠀌𠀍𠀎𠀏",
i: "𠀀𠀁𠀂𠀃𠀄𠀅𠀆𠀇𠀈𠀉𠀊𠀋𠀌𠀍𠀎𠀏",
s: "𠀀𠀁𠀂𠀃𠀄𠀅𠀆𠀇𠀈𠀉𠀊𠀋𠀌𠀍𠀎𠀏" },
// Devanagari
{ t: "कखगघङचछजझञटठडढणतथदधनपफबभमयरलळवशषसह",
i: "कखगघङचछजझञटठडढणतथदधनपफबभमयरलळवशषसह",
s: "कखगघङचछजझञटठडढणतथदधनपफबभमयरलळवशषसह" },
// Emoticons (astral)
{ t: "😁😂😃😄😅😆😇😈😉😊😋😌😍😎😏😐",
i: "😁😂😃😄😅😆😇😈😉😊😋😌😍😎😏😐",
s: "😁😂😃😄😅😆😇😈😉😊😋😌😍😎😏😐" },
// Greek
{ t: "αβγδεζηθικλμνξοπρςστυφχψω",
i: "αβγδεζηθικλμνξοπρςστυφχψω",
s: "αβγδεζηθικλμνξοπρςστυφχψω" }
];
const npatterns = patterns.length;
const nsubstitutions = substitutions.length;
function quotemeta(str) {
return str.replace(/[-[\]{}()*+?.,\\^$|#\s]/g, "\\$&");
}
function subst(str, sub) {
return str.replace("<t>", sub.t)
.replace("<i>", sub.i)
.replace("<s>", sub.s);
}
var curpat = 0;
var cursubst = -1;
var testbench = document.getElementById("testbench");
function nextTest() {
cursubst++;
if (cursubst == nsubstitutions) {
curpat++;
cursubst = 0;
}
if (curpat == npatterns) {
SimpleTest.finish();
return;
}
let css = subst(patterns[curpat].i, substitutions[cursubst]);
let msg = quotemeta(subst(patterns[curpat].o, substitutions[cursubst]));
info(css);
info(msg);
SimpleTest.expectConsoleMessages(function () { testbench.innerHTML = css },
[{ errorMessage: new RegExp(msg) }],
nextTest);
}
SimpleTest.waitForExplicitFinish();
nextTest();
</script>
</body>
</html>