(function() { var global = this; /* ===== Helpers ===== */ global.throws = function(block, exceptionType) { var exception = null; try { block(); } catch (e) { exception = e; } ok( exception !== null, exception !== null ? "okay: thrown something" : "failed, nothing thrown" ); if (exception !== null) { ok( exception instanceof exceptionType, exception instanceof exceptionType ? "okay: thrown " + exceptionType.name : "failed, thrown " + exception.name + " instead of " + exceptionType.name ); } return exception; }; global.parses = function(parser, input, expected) { deepEqual(parser.parse(input), expected); }; global.doesNotParse = function(parser, input) { throws(function() { parser.parse(input); }, PEG.Parser.SyntaxError); }; global.doesNotParseWithMessage = function(parser, input, message) { var exception = throws( function() { parser.parse(input); }, PEG.Parser.SyntaxError ); if (exception) { strictEqual(exception.message, message); } }; global.doesNotParseWithPos = function(parser, input, line, column) { var exception = throws( function() { parser.parse(input); }, PEG.Parser.SyntaxError ); if (exception) { strictEqual(exception.line, line); strictEqual(exception.column, column); } }; /* ===== PEG.Compiler ===== */ module("PEG.Compiler"); test("formatCode joins parts", function() { strictEqual(PEG.Compiler.formatCode("foo", "bar"), "foo\nbar"); }); test("formatCode interpolates variables", function() { strictEqual( PEG.Compiler.formatCode("foo", "${bar}", { bar: "baz" }), "foo\nbaz" ); throws(function() { PEG.Compiler.formatCode("foo", "${bar}"); }, Error); }); test("formatCode filters variables", function() { strictEqual( PEG.Compiler.formatCode("foo", "${bar|string}", { bar: "baz" }), "foo\n\"baz\"" ); throws(function() { PEG.Compiler.formatCode("foo", "${bar|eeek}", { bar: "baz" }); }, Error); }); test("formatCode indents multiline parts", function() { strictEqual( PEG.Compiler.formatCode("foo", "${bar}", { bar: " baz\nqux" }), "foo\n baz\n qux" ); }); test("generateUniqueIdentifier", function() { notStrictEqual( PEG.Compiler.generateUniqueIdentifier("prefix"), PEG.Compiler.generateUniqueIdentifier("prefix") ); }); /* ===== PEG ===== */ module("PEG"); test("buildParser reports invalid grammar object", function() { throws(function() { PEG.buildParser(42); }, PEG.Grammar.GrammarError); }); test("buildParser reports missing start rule", function() { throws(function() { PEG.buildParser({}); }, PEG.Grammar.GrammarError); }); test("buildParser allows custom start rule", function() { var parser = PEG.buildParser('s: "abcd"', "s"); parses(parser, "abcd", "abcd"); }); /* ===== Generated Parser ===== */ module("Generated Parser"); test("literals", function() { var parser = PEG.buildParser('start: "abcd"'); parses(parser, "abcd", "abcd"); doesNotParse(parser, ""); doesNotParse(parser, "abc"); doesNotParse(parser, "abcde"); doesNotParse(parser, "efgh"); /* * Test that the parsing position moves forward after successful parsing of * a literal. */ var posTestParser = PEG.buildParser('start: "a" "b"'); parses(posTestParser, "ab", ["a", "b"]); }); test("anys", function() { var parser = PEG.buildParser('start: .'); parses(parser, "a", "a"); doesNotParse(parser, ""); doesNotParse(parser, "ab"); /* * Test that the parsing position moves forward after successful parsing of * an any. */ var posTestParser = PEG.buildParser('start: . .'); parses(posTestParser, "ab", ["a", "b"]); }); test("classes", function() { var emptyClassParser = PEG.buildParser('start: []'); doesNotParse(emptyClassParser, ""); doesNotParse(emptyClassParser, "a"); doesNotParse(emptyClassParser, "ab"); var nonEmptyClassParser = PEG.buildParser('start: [ab-d]'); parses(nonEmptyClassParser, "a", "a"); parses(nonEmptyClassParser, "b", "b"); parses(nonEmptyClassParser, "c", "c"); parses(nonEmptyClassParser, "d", "d"); doesNotParse(nonEmptyClassParser, ""); doesNotParse(nonEmptyClassParser, "ab"); /* * Test that the parsing position moves forward after successful parsing of * a class. */ var posTestParser = PEG.buildParser('start: [ab-d] [ab-d]'); parses(posTestParser, "ab", ["a", "b"]); }); test("sequences", function() { var emptySequenceParser = PEG.buildParser('start: '); parses(emptySequenceParser, "", []); doesNotParse(emptySequenceParser, "abc"); var nonEmptySequenceParser = PEG.buildParser('start: "a" "b" "c"'); parses(nonEmptySequenceParser, "abc", ["a", "b", "c"]); doesNotParse(nonEmptySequenceParser, ""); doesNotParse(nonEmptySequenceParser, "ab"); doesNotParse(nonEmptySequenceParser, "abcd"); doesNotParse(nonEmptySequenceParser, "efg"); /* * Test that the parsing position returns after unsuccessful parsing of a * sequence. */ var posTestParser = PEG.buildParser('start: ("a" "b") / "a"'); parses(posTestParser, "a", "a"); }); test("choices", function() { var parser = PEG.buildParser('start: "a" / "b" / "c"'); parses(parser, "a", "a"); parses(parser, "b", "b"); parses(parser, "c", "c"); doesNotParse(parser, ""); doesNotParse(parser, "ab"); doesNotParse(parser, "d"); }); test("optional expressions", function() { var parser = PEG.buildParser('start: "a"?'); parses(parser, "", ""); parses(parser, "a", "a"); }); test("zero or more expressions", function() { var parser = PEG.buildParser('start: "a"*'); parses(parser, "", []); parses(parser, "a", ["a"]); parses(parser, "aaa", ["a", "a", "a"]); }); test("one or more expressions", function() { var parser = PEG.buildParser('start: "a"+'); doesNotParse(parser, ""); parses(parser, "a", ["a"]); parses(parser, "aaa", ["a", "a", "a"]); }); test("and predicate", function() { var parser = PEG.buildParser('start: "a" &"b" "b"'); parses(parser, "ab", ["a", "", "b"]); doesNotParse(parser, "ac"); /* * Test that the parsing position returns after successful parsing of a * predicate is not needed, it is implicit in the tests above. */ }); test("not predicate", function() { var parser = PEG.buildParser('start: "a" !"b"'); parses(parser, "a", ["a", ""]); doesNotParse(parser, "ab"); /* * Test that the parsing position returns after successful parsing of a * predicate. */ var posTestParser = PEG.buildParser('start: "a" !"b" "c"'); parses(posTestParser, "ac", ["a", "", "c"]); }); test("rule references", function() { var parser = PEG.buildParser([ 'start: static / dynamic', 'static: "C" / "C++" / "Java" / "C#"', 'dynamic: "Ruby" / "Python" / "JavaScript"' ].join("\n")); parses(parser, "Java", "Java"); parses(parser, "Python", "Python"); }); test("actions", function() { var singleMatchParser = PEG.buildParser( 'start: "a" { return Array.prototype.slice.call(arguments).join("").toUpperCase(); }' ); parses(singleMatchParser, "a", "A"); var multiMatchParser = PEG.buildParser( 'start: "a" "b" "c" { return Array.prototype.slice.call(arguments).join("").toUpperCase(); }' ); parses(multiMatchParser, "abc", "ABC"); var innerMatchParser = PEG.buildParser( 'start: "a" ("b" "c" "d" { return Array.prototype.slice.call(arguments).join("").toUpperCase(); }) "e"' ); parses(innerMatchParser, "abcde", ["a", "BCD", "e"]); /* Test that the action is not called when its expression does not match. */ var notAMatchParser = PEG.buildParser( 'start: "a" { ok(false, "action got called when it should not be"); }' ); doesNotParse(notAMatchParser, "b"); var variablesParser = PEG.buildParser([ 'start: "a" "b" "c" "d" "e" "f" "g" "h" "i" "j" {', ' return [$1, $2, $3, $4, $5, $6, $7, $8, $9, $10].join("").toUpperCase();', ' }' ].join("\n")); parses(variablesParser, "abcdefghij", "ABCDEFGHIJ"); }); test("cache", function() { /* * Should trigger a codepath where the cache is used (for the "a" rule). */ var parser = PEG.buildParser([ 'start: (a b) / (a c)', 'a: "a"', 'b: "b"', 'c: "c"' ].join("\n")); parses(parser, "ac", ["a", "c"]); }); test("indempotence", function() { var parser1 = PEG.buildParser('start: "abcd"'); var parser2 = PEG.buildParser('start: "abcd"'); strictEqual(parser1.toSource(), parser2.toSource()); }); test("error messages", function() { var literalParser = PEG.buildParser('start: "abcd"'); doesNotParseWithMessage( literalParser, "", 'Expected "abcd" but end of input found.' ); doesNotParseWithMessage( literalParser, "efgh", 'Expected "abcd" but "e" found.' ); doesNotParseWithMessage( literalParser, "abcde", 'Expected end of input but "e" found.' ); var anyParser = PEG.buildParser('start: .'); doesNotParseWithMessage( anyParser, "", 'Expected any character but end of input found.' ); var namedRuleWithLiteralParser = PEG.buildParser('start "digit": [0-9]'); doesNotParseWithMessage( namedRuleWithLiteralParser, "a", 'Expected digit but "a" found.' ); var namedRuleWithAnyParser = PEG.buildParser('start "whatever": .'); doesNotParseWithMessage( namedRuleWithAnyParser, "", 'Expected whatever but end of input found.' ); var namedRuleWithNamedRuleParser = PEG.buildParser([ 'start "digits": digit+', 'digit "digit": [0-9]' ].join("\n")); doesNotParseWithMessage( namedRuleWithNamedRuleParser, "", 'Expected digits but end of input found.' ); var choiceParser1 = PEG.buildParser('start: "a" / "b" / "c"'); doesNotParseWithMessage( choiceParser1, "def", 'Expected "a", "b" or "c" but "d" found.' ); var choiceParser2 = PEG.buildParser('start: "a" "b" "c" / "a"'); doesNotParseWithMessage( choiceParser2, "abd", 'Expected "c" but "d" found.' ); var notPredicateParser = PEG.buildParser('start: !"a" "b"'); doesNotParseWithMessage( notPredicateParser, "c", 'Expected "b" but "c" found.' ); var andPredicateParser = PEG.buildParser('start: &"a" [a-b]'); doesNotParseWithMessage( andPredicateParser, "c", 'Expected end of input but "c" found.' ); var emptyParser = PEG.buildParser('start: '); doesNotParseWithMessage( emptyParser, "something", 'Expected end of input but "s" found.' ); }); test("error positions", function() { var parser = PEG.buildParser([ 'start: line (("\\r" / "\\n" / "\\u2028" / "\\u2029")+ line)*', 'line: digit (" "+ digit)*', 'digit: [0-9]+ { return $1.join(""); }' ].join("\n")); doesNotParseWithPos(parser, "a", 1, 1); doesNotParseWithPos(parser, "1\n2\n\n3\n\n\n4 5 x", 7, 5); /* Non-Unix newlines */ doesNotParseWithPos(parser, "1\rx", 2, 1); // Old Mac doesNotParseWithPos(parser, "1\r\nx", 2, 1); // Windows doesNotParseWithPos(parser, "1\n\rx", 3, 1); // mismatched /* Strange newlines */ doesNotParseWithPos(parser, "1\u2028x", 2, 1); // line separator doesNotParseWithPos(parser, "1\u2029x", 2, 1); // paragraph separator }); /* * Following examples are from Wikipedia, see * http://en.wikipedia.org/w/index.php?title=Parsing_expression_grammar&oldid=335106938. */ test("arithmetics", function() { /* * Value ← [0-9]+ / '(' Expr ')' * Product ← Value (('*' / '/') Value)* * Sum ← Product (('+' / '-') Product)* * Expr ← Sum */ var parser = PEG.buildParser([ 'Value : [0-9]+ { return parseInt($1.join("")); }', ' / "(" Expr ")" { return $2; }', 'Product : Value (("*" / "/") Value)* {', ' var result = $1;', ' for (var i = 0; i < $2.length; i++) {', ' if ($2[i][0] == "*") { result *= $2[i][1]; }', ' if ($2[i][0] == "/") { result /= $2[i][1]; }', ' }', ' return result;', ' }', 'Sum : Product (("+" / "-") Product)* {', ' var result = $1;', ' for (var i = 0; i < $2.length; i++) {', ' if ($2[i][0] == "+") { result += $2[i][1]; }', ' if ($2[i][0] == "-") { result -= $2[i][1]; }', ' }', ' return result;', ' }', 'Expr : Sum' ].join("\n"), "Expr"); /* Test "value" rule. */ parses(parser, "0", 0); parses(parser, "123", 123); parses(parser, "(42+43)", 42+43); /* Test "product" rule. */ parses(parser, "42", 42); parses(parser, "42*43", 42*43); parses(parser, "42*43*44*45", 42*43*44*45); parses(parser, "42/43", 42/43); parses(parser, "42/43/44/45", 42/43/44/45); /* Test "sum" rule. */ parses(parser, "42*43", 42*43); parses(parser, "42*43+44*45", 42*43+44*45); parses(parser, "42*43+44*45+46*47+48*49", 42*43+44*45+46*47+48*49); parses(parser, "42*43-44*45", 42*43-44*45); parses(parser, "42*43-44*45-46*47-48*49", 42*43-44*45-46*47-48*49); /* Test "expr" rule. */ parses(parser, "42+43", 42+43); /* Complex test */ parses(parser, "(1+2)*(3+4)",(1+2)*(3+4)); }); test("non-context-free language", function() { /* The following parsing expression grammar describes the classic * non-context-free language { a^n b^n c^n : n >= 1 }: * * S ← &(A c) a+ B !(a/b/c) * A ← a A? b * B ← b B? c */ var parser = PEG.buildParser([ 'S: &(A "c") "a"+ B !("a" / "b" / "c") { return $2.join("") + $3; }', 'A: "a" A? "b" { return $1 + $2 + $3; }', 'B: "b" B? "c" { return $1 + $2 + $3; }', ].join("\n"), "S"); parses(parser, "abc", "abc"); parses(parser, "aaabbbccc", "aaabbbccc"); doesNotParse(parser, "aabbbccc"); doesNotParse(parser, "aaaabbbccc"); doesNotParse(parser, "aaabbccc"); doesNotParse(parser, "aaabbbbccc"); doesNotParse(parser, "aaabbbcc"); doesNotParse(parser, "aaabbbcccc"); }); test("nested comments", function() { /* * Begin ← "(*" * End ← "*)" * C ← Begin N* End * N ← C / (!Begin !End Z) * Z ← any single character */ var parser = PEG.buildParser([ 'Begin : "(*"', 'End : "*)"', 'C : Begin N* End { return $1 + $2.join("") + $3; }', 'N : C', ' / (!Begin !End Z) { return $3; }', 'Z : .' ].join("\n"), "C"); parses(parser, "(**)", "(**)"); parses(parser, "(*abc*)", "(*abc*)"); parses(parser, "(*(**)*)", "(*(**)*)"); parses( parser, "(*abc(*def*)ghi(*(*(*jkl*)*)*)mno*)", "(*abc(*def*)ghi(*(*(*jkl*)*)*)mno*)" ); }); })();