You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
400 lines
15 KiB
JavaScript
400 lines
15 KiB
JavaScript
describe("PEG.js grammar parser", function() {
|
|
var trivialGrammar;
|
|
|
|
/*
 * Builds the AST expected for a grammar consisting of a single rule named
 * "start".
 *
 * displayName - value stored in the rule's |displayName| property
 * expression  - node stored in the rule's |expression| property
 *
 * Returns a "grammar" node with a null initializer, one rule, and "start" as
 * the start rule.
 */
function oneRuleGrammar(displayName, expression) {
  return {
    type:        "grammar",
    initializer: null,
    rules: [
      {
        type:        "rule",
        name:        "start",
        displayName: displayName,
        expression:  expression
      }
    ],
    startRule: "start"
  };
}
|
|
|
|
/*
 * Builds the expected AST for a one-rule grammar whose expression is a
 * reference to the rule called |name| (no display name).
 */
function ruleRefGrammar(name) {
  return oneRuleGrammar(null, { type: "rule_ref", name: name });
}
|
|
|
|
/*
 * Builds the expected AST for a one-rule grammar whose expression is a
 * literal (no display name).
 *
 * value      - the literal's string value
 * ignoreCase - optional second argument; treated as false when omitted
 */
function literalGrammar(value) {
  /* Read through |arguments| so that an omitted argument defaults to false. */
  var ignoreCase = arguments.length > 1 ? arguments[1] : false;

  return oneRuleGrammar(null, {
    type:       "literal",
    value:      value,
    ignoreCase: ignoreCase
  });
}
|
|
|
|
/*
 * Builds the expected AST for a one-rule grammar whose expression is a
 * character class (no display name).
 *
 * parts      - array stored as the class's |parts|
 * rawText    - string stored as the class's |rawText|
 * inverted   - optional third argument; treated as false when omitted
 * ignoreCase - optional fourth argument; treated as false when omitted
 */
function classGrammar(parts, rawText) {
  /* Optional flags are read through |arguments| so they default to false. */
  var inverted   = arguments.length > 2 ? arguments[2] : false,
      ignoreCase = arguments.length > 3 ? arguments[3] : false;

  return oneRuleGrammar(null, {
    type:       "class",
    inverted:   inverted,
    ignoreCase: ignoreCase,
    parts:      parts,
    rawText:    rawText
  });
}
|
|
|
|
/*
 * Runs before every spec: resets |trivialGrammar| and registers the custom
 * matchers |toParseAs| and |toFailToParse| on the current spec.
 */
beforeEach(function() {
  trivialGrammar = literalGrammar("abcd");

  this.addMatchers({
    /*
     * Feeds the actual value to |PEG.parser.parse| and compares the result
     * with |expected|. Returns false when parsing throws.
     */
    toParseAs: function(expected) {
      var result;

      try {
        result = PEG.parser.parse(this.actual);

        this.message = function() {
          return "Expected " + jasmine.pp(this.actual) + " "
               + (this.isNot ? "not " : "")
               + "to parse as " + jasmine.pp(expected) + ", "
               + "but it parsed as " + jasmine.pp(result) + ".";
        };

        return this.env.equals_(result, expected);
      } catch (e) {
        this.message = function() {
          return "Expected " + jasmine.pp(this.actual) + " "
               + "to parse as " + jasmine.pp(expected) + ", "
               + "but it failed to parse with message "
               + jasmine.pp(e.message) + ".";
        };

        return false;
      }
    },

    /*
     * Returns true when |PEG.parser.parse| throws for the actual value. When
     * |details| is given (and the matcher is not negated), every own property
     * of |details| must equal the same-named property of the thrown error.
     */
    toFailToParse: function(details) {
      /*
       * Extracted into a function just to silence JSHint complaining about
       * creating functions in a loop.
       */
      function buildKeyMessage(key, value) {
        return function() {
          return "Expected " + jasmine.pp(this.actual) + " to fail to parse"
               + (details ? " with details " + jasmine.pp(details) : "") + ", "
               + "but " + jasmine.pp(key) + " "
               + "is " + jasmine.pp(value) + ".";
        };
      }

      var result, key;

      try {
        result = PEG.parser.parse(this.actual);

        this.message = function() {
          return "Expected " + jasmine.pp(this.actual) + " to fail to parse"
               + (details ? " with details " + jasmine.pp(details) : "") + ", "
               + "but it parsed as " + jasmine.pp(result) + ".";
        };

        return false;
      } catch (e) {
        if (this.isNot) {
          this.message = function() {
            return "Expected " + jasmine.pp(this.actual) + " to parse, "
                 + "but it failed with message "
                 + jasmine.pp(e.message) + ".";
          };
        } else if (details) {
          for (key in details) {
            /* Only compare own properties; skip anything inherited. */
            if (!Object.prototype.hasOwnProperty.call(details, key)) {
              continue;
            }

            if (!this.env.equals_(e[key], details[key])) {
              this.message = buildKeyMessage(key, e[key]);

              return false;
            }
          }
        }

        return true;
      }
    }
  });
});
|
|
|
|
/* Canonical identifier is "a". */
it("parses identifier", function() {
  expect('start = a'   ).toParseAs(ruleRefGrammar("a"));
  expect('start = _'   ).toParseAs(ruleRefGrammar("_"));
  expect('start = $'   ).toParseAs(ruleRefGrammar("$"));
  expect('start = aa'  ).toParseAs(ruleRefGrammar("aa"));
  expect('start = a0'  ).toParseAs(ruleRefGrammar("a0"));
  expect('start = a_'  ).toParseAs(ruleRefGrammar("a_"));
  expect('start = a$'  ).toParseAs(ruleRefGrammar("a$"));
  expect('start = abcd').toParseAs(ruleRefGrammar("abcd"));

  /* A trailing newline must not change the resulting AST. */
  expect('start = a\n').toParseAs(ruleRefGrammar("a"));
});
|
|
|
|
/* Canonical literal is "\"abcd\"". */
it("parses literal", function() {
  expect('start = "abcd"' ).toParseAs(literalGrammar("abcd"));
  expect("start = 'abcd'" ).toParseAs(literalGrammar("abcd"));

  /* The "i" suffix sets |ignoreCase|. */
  expect('start = "abcd"i').toParseAs(literalGrammar("abcd", true));

  /* A trailing newline must not change the resulting AST. */
  expect('start = "abcd"\n').toParseAs(literalGrammar("abcd"));
});
|
|
|
|
/* Canonical string is "\"abcd\"". */
it("parses string", function() {
  /* The string under test ends up as the rule's |displayName|. */
  var grammar = oneRuleGrammar("abcd", {
    type:       "literal",
    value:      "abcd",
    ignoreCase: false
  });

  expect('start "abcd" = "abcd"'  ).toParseAs(grammar);
  expect('start \'abcd\' = "abcd"').toParseAs(grammar);

  expect('start "abcd"\n= "abcd"').toParseAs(grammar);
});
|
|
|
|
/* Canonical doubleQuotedString is "\"abcd\"". */
it("parses doubleQuotedString", function() {
  /* Zero, one and several characters between the quotes. */
  expect('start = ""'   ).toParseAs(literalGrammar(""));
  expect('start = "a"'  ).toParseAs(literalGrammar("a"));
  expect('start = "abc"').toParseAs(literalGrammar("abc"));
});
|
|
|
|
/* Canonical doubleQuotedCharacter is "a". */
it("parses doubleQuotedCharacter", function() {
  /* One input per alternative: plain character, then each escape form. */
  expect('start = "a"'      ).toParseAs(literalGrammar("a"));
  expect('start = "\\n"'    ).toParseAs(literalGrammar("\n"));
  expect('start = "\\0"'    ).toParseAs(literalGrammar("\x00"));
  expect('start = "\\xFF"'  ).toParseAs(literalGrammar("\xFF"));
  expect('start = "\\uFFFF"').toParseAs(literalGrammar("\uFFFF"));
  expect('start = "\\\n"'   ).toParseAs(literalGrammar("\n"));
});
|
|
|
|
/* Canonical simpleDoubleQuotedCharacter is "a". */
it("parses simpleDoubleQuotedCharacter", function() {
  expect('start = "a"').toParseAs(literalGrammar("a"));

  /* A bare quote, backslash or newline inside the quotes is rejected. */
  expect('start = """' ).toFailToParse();
  expect('start = "\\"').toFailToParse();
  expect('start = "\n"').toFailToParse();
});
|
|
|
|
/* Canonical singleQuotedString is "'abcd'". */
it("parses singleQuotedString", function() {
  /* Zero, one and several characters between the quotes. */
  expect("start = ''"   ).toParseAs(literalGrammar(""));
  expect("start = 'a'"  ).toParseAs(literalGrammar("a"));
  expect("start = 'abc'").toParseAs(literalGrammar("abc"));
});
|
|
|
|
/* Canonical singleQuotedCharacter is "a". */
it("parses singleQuotedCharacter", function() {
  /* One input per alternative: plain character, then each escape form. */
  expect("start = 'a'"      ).toParseAs(literalGrammar("a"));
  expect("start = '\\n'"    ).toParseAs(literalGrammar("\n"));
  expect("start = '\\0'"    ).toParseAs(literalGrammar("\x00"));
  expect("start = '\\xFF'"  ).toParseAs(literalGrammar("\xFF"));
  expect("start = '\\uFFFF'").toParseAs(literalGrammar("\uFFFF"));
  expect("start = '\\\n'"   ).toParseAs(literalGrammar("\n"));
});
|
|
|
|
/* Canonical simpleSingleQuotedCharacter is "a". */
it("parses simpleSingleQuotedCharacter", function() {
  expect("start = 'a'").toParseAs(literalGrammar("a"));

  /* A bare quote, backslash or newline inside the quotes is rejected. */
  expect("start = '''" ).toFailToParse();
  expect("start = '\\'").toFailToParse();
  expect("start = '\n'").toFailToParse();
});
|
|
|
|
/* Canonical class is "[a-d]". */
it("parses class", function() {
  expect('start = []'         ).toParseAs(classGrammar([], "[]"));
  expect('start = [a-d]'      ).toParseAs(classGrammar([["a", "d"]], "[a-d]"));
  expect('start = [a]'        ).toParseAs(classGrammar(["a"], "[a]"));
  expect('start = [a-de-hi-l]').toParseAs(
    classGrammar([["a", "d"], ["e", "h"], ["i", "l"]], "[a-de-hi-l]")
  );

  /* "^" prefix sets |inverted|; "i" suffix sets |ignoreCase|. */
  expect('start = [^a-d]').toParseAs(
    classGrammar([["a", "d"]], "[^a-d]", true, false)
  );
  expect('start = [a-d]i').toParseAs(
    classGrammar([["a", "d"]], "[a-d]i", false, true)
  );

  /* Non-ASCII characters are expected in escaped form in |rawText|. */
  expect('start = [\u0080\u0081\u0082]').toParseAs(
    classGrammar(["\u0080", "\u0081", "\u0082"], "[\\x80\\x81\\x82]")
  );

  expect('start = [a-d]\n').toParseAs(classGrammar([["a", "d"]], "[a-d]"));
});
|
|
|
|
/* Canonical classCharacterRange is "a-d". */
it("parses classCharacterRange", function() {
  expect('start = [a-d]').toParseAs(classGrammar([["a", "d"]], "[a-d]"));
  expect('start = [a-a]').toParseAs(classGrammar([["a", "a"]], "[a-a]"));

  /* A range whose start comes after its end is reported as an error. */
  expect('start = [b-a]').toFailToParse({
    message: "Invalid character range: b-a."
  });
  expect('start = [\u0081-\u0080]').toFailToParse({
    message: "Invalid character range: \\x81-\\x80."
  });
});
|
|
|
|
/* Canonical classCharacter is "a". */
it("parses classCharacter", function() {
  expect('start = [a]').toParseAs(classGrammar(["a"], "[a]"));

  /* This test demonstrates that |rawText| is not really "raw". */
  expect('start = [\u0080]').toParseAs(classGrammar(["\x80"], "[\\x80]"));
});
|
|
|
|
/* Canonical bracketDelimitedCharacter is "a". */
it("parses bracketDelimitedCharacter", function() {
  /* One input per alternative: plain character, then each escape form. */
  expect('start = [a]'      ).toParseAs(classGrammar(["a"], "[a]"));
  expect('start = [\\n]'    ).toParseAs(classGrammar(["\n"], "[\\n]"));
  expect('start = [\\0]'    ).toParseAs(classGrammar(["\x00"], "[\\0]"));
  expect('start = [\\xFF]'  ).toParseAs(classGrammar(["\xFF"], "[\\xFF]"));
  expect('start = [\\uFFFF]').toParseAs(classGrammar(["\uFFFF"], "[\\uFFFF]"));
  expect('start = [\\\n]'   ).toParseAs(classGrammar(["\n"], "[\\n]"));
});
|
|
|
|
/* Canonical simpleBracketDelimitedCharacter is "a". */
it("parses simpleBracketDelimitedCharacter", function() {
  expect('start = [a]').toParseAs(classGrammar(["a"], "[a]"));

  /* A bare "]", backslash or newline inside the brackets is rejected. */
  expect('start = []]' ).toFailToParse();
  expect('start = [\\]').toFailToParse();
  expect('start = [\n]').toFailToParse();
});
|
|
|
|
/* Canonical simpleEscapeSequence is "\\n". */
it("parses simpleEscapeSequence", function() {
  expect('start = "\\b"').toParseAs(literalGrammar("\b"));
  expect('start = "\\f"').toParseAs(literalGrammar("\f"));
  expect('start = "\\n"').toParseAs(literalGrammar("\n"));
  expect('start = "\\r"').toParseAs(literalGrammar("\r"));
  expect('start = "\\t"').toParseAs(literalGrammar("\t"));
  expect('start = "\\v"').toParseAs(literalGrammar("\x0B")); // no "\v" in IE
  /* An escaped character without special meaning stands for itself. */
  expect('start = "\\a"').toParseAs(literalGrammar("a"));

  /* Digits and incomplete "\x" / "\u" sequences are rejected. */
  expect('start = "\\1"').toFailToParse();
  expect('start = "\\x"').toFailToParse();
  expect('start = "\\u"').toFailToParse();
});
|
|
|
|
/* Canonical zeroEscapeSequence is "\\0". */
it("parses zeroEscapeSequence", function() {
  expect('start = "\\0"').toParseAs(literalGrammar("\x00"));

  /* "\0" immediately followed by another digit is rejected. */
  expect('start = "\\00"').toFailToParse();
  expect('start = "\\09"').toFailToParse();
});
|
|
|
|
/* Canonical hexEscapeSequence is "\\xFF". */
it("parses hexEscapeSequence", function() {
  expect('start = "\\xFF"').toParseAs(literalGrammar("\xFF"));
});
|
|
|
|
/* Canonical unicodeEscapeSequence is "\\uFFFF". */
it("parses unicodeEscapeSequence", function() {
  expect('start = "\\uFFFF"').toParseAs(literalGrammar("\uFFFF"));
});
|
|
|
|
/* Canonical eolEscapeSequence is "\\\n". */
it("parses eolEscapeSequence", function() {
  /* A backslash followed by an end-of-line sequence yields that sequence. */
  expect('start = "\\\n"'    ).toParseAs(literalGrammar("\n"));
  expect('start = "\\\r\n"'  ).toParseAs(literalGrammar("\r\n"));
  expect('start = "\\\r"'    ).toParseAs(literalGrammar("\r"));
  expect('start = "\\\u2028"').toParseAs(literalGrammar("\u2028"));
  expect('start = "\\\u2029"').toParseAs(literalGrammar("\u2029"));
});
|
|
|
|
/* Trivial character class rules are not tested. */
|
|
|
|
/* Canonical __ is "\n". */
it("parses __", function() {
  /* Nothing, one space, one newline and one comment between "=" and literal. */
  expect('start ="abcd"'             ).toParseAs(trivialGrammar);
  expect('start = "abcd"'            ).toParseAs(trivialGrammar);
  expect('start =\n"abcd"'           ).toParseAs(trivialGrammar);
  expect('start =/* comment */"abcd"').toParseAs(trivialGrammar);
  /* Several consecutive whitespace characters (distinct from the case above). */
  expect('start =   "abcd"'          ).toParseAs(trivialGrammar);
});
|
|
|
|
// Canonical comment is "/* comment */".
it("parses comment", function() {
  /* One single-line and one multi-line comment. */
  expect('start =// comment\n"abcd"' ).toParseAs(trivialGrammar);
  expect('start =/* comment */"abcd"').toParseAs(trivialGrammar);
});
|
|
|
|
/* Canonical singleLineComment is "// comment". */
it("parses singleLineComment", function() {
  /* Empty, one-character and multi-character comment bodies. */
  expect('start =//\n"abcd"'   ).toParseAs(trivialGrammar);
  expect('start =//a\n"abcd"'  ).toParseAs(trivialGrammar);
  expect('start =//aaa\n"abcd"').toParseAs(trivialGrammar);
});
|
|
|
|
// Canonical multiLineComment is "/* comment */".
it("parses multiLineComment", function() {
  /* Empty, one-character and multi-character bodies, plus a lone "*". */
  expect('start =/**/"abcd"'   ).toParseAs(trivialGrammar);
  expect('start =/*a*/"abcd"'  ).toParseAs(trivialGrammar);
  expect('start =/*aaa*/"abcd"').toParseAs(trivialGrammar);
  expect('start =/***/"abcd"'  ).toParseAs(trivialGrammar);

  /* Text left over after the first comment terminator is rejected. */
  expect('start =/**/*/"abcd"').toFailToParse();
});
|
|
|
|
/* Canonical eol is "\n". */
it("parses eol", function() {
  /* LF, CRLF, CR, U+2028 and U+2029 between "=" and the literal. */
  expect('start =\n"abcd"'    ).toParseAs(trivialGrammar);
  expect('start =\r\n"abcd"'  ).toParseAs(trivialGrammar);
  expect('start =\r"abcd"'    ).toParseAs(trivialGrammar);
  expect('start =\u2028"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2029"abcd"').toParseAs(trivialGrammar);
});
|
|
|
|
/* Canonical eolChar is "\n". */
it("parses eolChar", function() {
  /* Each single end-of-line character between "=" and the literal. */
  expect('start =\n"abcd"'    ).toParseAs(trivialGrammar);
  expect('start =\r"abcd"'    ).toParseAs(trivialGrammar);
  expect('start =\u2028"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2029"abcd"').toParseAs(trivialGrammar);
});
|
|
|
|
/* Canonical whitespace is " ". */
it("parses whitespace", function() {
  /* One whitespace character per input, placed between "=" and the literal. */
  expect('start =\t"abcd"'    ).toParseAs(trivialGrammar);
  expect('start =\x0B"abcd"'  ).toParseAs(trivialGrammar); // no "\v" in IE
  expect('start =\f"abcd"'    ).toParseAs(trivialGrammar);
  expect('start = "abcd"'     ).toParseAs(trivialGrammar);
  expect('start =\u00A0"abcd"').toParseAs(trivialGrammar);
  expect('start =\uFEFF"abcd"').toParseAs(trivialGrammar);
  expect('start =\u1680"abcd"').toParseAs(trivialGrammar);
  expect('start =\u180E"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2000"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2001"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2002"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2003"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2004"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2005"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2006"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2007"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2008"abcd"').toParseAs(trivialGrammar);
  expect('start =\u2009"abcd"').toParseAs(trivialGrammar);
  expect('start =\u200A"abcd"').toParseAs(trivialGrammar);
  expect('start =\u202F"abcd"').toParseAs(trivialGrammar);
  expect('start =\u205F"abcd"').toParseAs(trivialGrammar);
  expect('start =\u3000"abcd"').toParseAs(trivialGrammar);
});
|
|
});
|