#define CATCH_CONFIG_MAIN #include "catch.hpp" #include #include TEST_CASE("Simple syntax test", "[general]") { peglib::peg parser( " ROOT <- _ " " _ <- ' ' " ); bool ret = parser; REQUIRE(ret == true); } TEST_CASE("Empty syntax test", "[general]") { peglib::peg parser(""); bool ret = parser; REQUIRE(ret == false); } TEST_CASE("String capture test", "[general]") { peglib::peg parser( " ROOT <- _ ('[' TAG_NAME ']' _)* " " TAG_NAME <- (!']' .)+ " " _ <- [ \t]* " ); std::vector tags; parser["TAG_NAME"] = [&](const char* s, size_t l) { tags.push_back(std::string(s, l)); }; auto ret = parser.parse(" [tag1] [tag:2] [tag-3] "); REQUIRE(ret == true); REQUIRE(tags.size() == 3); REQUIRE(tags[0] == "tag1"); REQUIRE(tags[1] == "tag:2"); REQUIRE(tags[2] == "tag-3"); } TEST_CASE("String capture test with match", "[general]") { peglib::match m; auto ret = peglib::peg_match( " ROOT <- _ ('[' $< TAG_NAME > ']' _)* " " TAG_NAME <- (!']' .)+ " " _ <- [ \t]* ", " [tag1] [tag:2] [tag-3] ", m); REQUIRE(ret == true); REQUIRE(m.size() == 4); REQUIRE(m.str(1) == "tag1"); REQUIRE(m.str(2) == "tag:2"); REQUIRE(m.str(3) == "tag-3"); } using namespace peglib; using namespace std; TEST_CASE("String capture test2", "[general]") { vector tags; rule ROOT, TAG, TAG_NAME, WS; ROOT <= seq(WS, zom(TAG)); TAG <= seq(chr('['), TAG_NAME, chr(']'), WS); TAG_NAME <= oom(seq(npd(chr(']')), dot())), [&](const char* s, size_t l) { tags.push_back(string(s, l)); }; WS <= zom(cls(" \t")); auto m = ROOT.parse(" [tag1] [tag:2] [tag-3] "); REQUIRE(m.ret == true); REQUIRE(tags.size() == 3); REQUIRE(tags[0] == "tag1"); REQUIRE(tags[1] == "tag:2"); REQUIRE(tags[2] == "tag-3"); } TEST_CASE("String capture test3", "[general]") { auto syntax = " ROOT <- _ TOKEN* " " TOKEN <- '[' < (!']' .)+ > ']' _ " " _ <- [ \t\r\n]* " ; peg pg(syntax); std::vector tags; pg["TOKEN"] = [&](const char* s, size_t l) { tags.push_back(std::string(s, l)); }; auto ret = pg.parse(" [tag1] [tag:2] [tag-3] "); REQUIRE(ret == true); REQUIRE(tags.size() == 3); REQUIRE(tags[0] == "tag1"); REQUIRE(tags[1] == "tag:2"); REQUIRE(tags[2] == "tag-3"); } TEST_CASE("String capture test with embedded match action", "[general]") { rule ROOT, TAG, TAG_NAME, WS; vector tags; ROOT <= seq(WS, zom(TAG)); TAG <= seq(chr('['), cap(TAG_NAME, [&](const char* s, size_t l, size_t id) { tags.push_back(string(s, l)); }), chr(']'), WS); TAG_NAME <= oom(seq(npd(chr(']')), dot())); WS <= zom(cls(" \t")); auto m = ROOT.parse(" [tag1] [tag:2] [tag-3] "); REQUIRE(m.ret == true); REQUIRE(tags.size() == 3); REQUIRE(tags[0] == "tag1"); REQUIRE(tags[1] == "tag:2"); REQUIRE(tags[2] == "tag-3"); } TEST_CASE("Cyclic grammer test", "[general]") { rule PARENT; rule CHILD; PARENT <= seq(CHILD); CHILD <= seq(PARENT); } TEST_CASE("Visit test", "[general]") { rule ROOT, TAG, TAG_NAME, WS; ROOT <= seq(WS, zom(TAG)); TAG <= seq(chr('['), TAG_NAME, chr(']'), WS); TAG_NAME <= oom(seq(npd(chr(']')), dot())); WS <= zom(cls(" \t")); DefinitionIDs defIds; ROOT.accept(defIds); REQUIRE(defIds.ids.size() == 4); } TEST_CASE("Lambda action test", "[general]") { peg parser( " START <- (CHAR)* " " CHAR <- . "); string ss; parser["CHAR"] = [&](const char* s, size_t l) { ss += *s; }; bool ret = parser.parse("hello"); REQUIRE(ret == true); REQUIRE(ss == "hello"); } TEST_CASE("Skip token test", "[general]") { peglib::peg parser( " ROOT <- _ ITEM (',' _ ITEM _)* " " ITEM <- ([a-z0-9])+ " " ~_ <- [ \t]* " ); parser["ROOT"] = [&](const SemanticValues& sv) { REQUIRE(sv.size() == 2); }; auto ret = parser.parse(" item1, item2 "); REQUIRE(ret == true); } TEST_CASE("Backtracking test", "[general]") { peg parser( " START <- PAT1 / PAT2 " " PAT1 <- HELLO ' One' " " PAT2 <- HELLO ' Two' " " HELLO <- 'Hello' " ); size_t count = 0; parser["HELLO"] = [&](const char* s, size_t l) { count++; }; bool ret = parser.parse("Hello Two", true, true); REQUIRE(ret == true); REQUIRE(count == 1); // Skip second time } TEST_CASE("Octal/Hex value test", "[general]") { peglib::peg parser( " ROOT <- '\132\x7a' " ); auto ret = parser.parse("Zz"); REQUIRE(ret == true); } TEST_CASE("mutable lambda test", "[general]") { vector vec; peg pg("ROOT <- 'mutable lambda test'"); // This test makes sure if the following code can be compiled. pg["TOKEN"] = [=](const char* s, size_t l) mutable { vec.push_back(string(s, l)); }; } TEST_CASE("Simple calculator test", "[general]") { auto syntax = " Additive <- Multitive '+' Additive / Multitive " " Multitive <- Primary '*' Multitive / Primary " " Primary <- '(' Additive ')' / Number " " Number <- [0-9]+ "; peg parser(syntax); parser["Additive"] = { // Default action nullptr, // Action for the first choice [](const SemanticValues& sv) { return sv[0].val.get() + sv[1].val.get(); }, // Action for the second choice [](const SemanticValues& sv) { return sv[0]; } }; parser["Multitive"] = [](const SemanticValues& sv) { switch (sv.choice) { case 0: // Action for the first choice return sv[0].val.get() * sv[1].val.get(); default: // Action for the second choice return sv[0].val.get(); } }; parser["Number"] = [](const char* s, size_t l) { return atoi(s); }; int val; parser.parse("(1+2)*3", val); REQUIRE(val == 9); } TEST_CASE("Calculator test", "[general]") { // Construct grammer rule EXPRESSION, TERM, FACTOR, TERM_OPERATOR, FACTOR_OPERATOR, NUMBER; EXPRESSION <= seq(TERM, zom(seq(TERM_OPERATOR, TERM))); TERM <= seq(FACTOR, zom(seq(FACTOR_OPERATOR, FACTOR))); FACTOR <= cho(NUMBER, seq(chr('('), EXPRESSION, chr(')'))); TERM_OPERATOR <= cls("+-"); FACTOR_OPERATOR <= cls("*/"); NUMBER <= oom(cls("0-9")); // Setup actions auto reduce = [](const SemanticValues& sv) -> long { long ret = sv[0].val.get(); for (auto i = 1u; i < sv.size(); i += 2) { auto num = sv[i + 1].val.get(); switch (sv[i].val.get()) { case '+': ret += num; break; case '-': ret -= num; break; case '*': ret *= num; break; case '/': ret /= num; break; } } return ret; }; EXPRESSION = reduce; TERM = reduce; TERM_OPERATOR = [](const char* s, size_t l) { return *s; }; FACTOR_OPERATOR = [](const char* s, size_t l) { return *s; }; NUMBER = [&](const char* s, size_t l) { return stol(string(s, l), nullptr, 10); }; // Parse long val; auto m = EXPRESSION.parse_with_value("1+2*3*(4-5+6)/7-8", val); REQUIRE(m.ret == true); REQUIRE(val == -3); } TEST_CASE("Calculator test2", "[general]") { // Parse syntax auto syntax = " # Grammar for Calculator...\n " " EXPRESSION <- TERM (TERM_OPERATOR TERM)* " " TERM <- FACTOR (FACTOR_OPERATOR FACTOR)* " " FACTOR <- NUMBER / '(' EXPRESSION ')' " " TERM_OPERATOR <- [-+] " " FACTOR_OPERATOR <- [/*] " " NUMBER <- [0-9]+ " ; string start; auto grammar = PEGParser::parse(syntax, strlen(syntax), start, nullptr, nullptr); auto& g = *grammar; // Setup actions auto reduce = [](const SemanticValues& sv) -> long { long ret = sv[0].val.get(); for (auto i = 1u; i < sv.size(); i += 2) { auto num = sv[i + 1].val.get(); switch (sv[i].val.get()) { case '+': ret += num; break; case '-': ret -= num; break; case '*': ret *= num; break; case '/': ret /= num; break; } } return ret; }; g["EXPRESSION"] = reduce; g["TERM"] = reduce; g["TERM_OPERATOR"] = [](const char* s, size_t l) { return *s; }; g["FACTOR_OPERATOR"] = [](const char* s, size_t l) { return *s; }; g["NUMBER"] = [](const char* s, size_t l) { return stol(string(s, l), nullptr, 10); }; // Parse long val; auto m = g[start].parse_with_value("1+2*3*(4-5+6)/7-8", val); REQUIRE(m.ret == true); REQUIRE(val == -3); } TEST_CASE("Calculator test3", "[general]") { // Parse syntax peg parser( " # Grammar for Calculator...\n " " EXPRESSION <- TERM (TERM_OPERATOR TERM)* " " TERM <- FACTOR (FACTOR_OPERATOR FACTOR)* " " FACTOR <- NUMBER / '(' EXPRESSION ')' " " TERM_OPERATOR <- [-+] " " FACTOR_OPERATOR <- [/*] " " NUMBER <- [0-9]+ " ); auto reduce = [](const SemanticValues& sv) -> long { long ret = sv[0].val.get(); for (auto i = 1u; i < sv.size(); i += 2) { auto num = sv[i + 1].val.get(); switch (sv[i].val.get()) { case '+': ret += num; break; case '-': ret -= num; break; case '*': ret *= num; break; case '/': ret /= num; break; } } return ret; }; // Setup actions parser["EXPRESSION"] = reduce; parser["TERM"] = reduce; parser["TERM_OPERATOR"] = [](const char* s, size_t l) { return (char)*s; }; parser["FACTOR_OPERATOR"] = [](const char* s, size_t l) { return (char)*s; }; parser["NUMBER"] = [](const char* s, size_t l) { return stol(string(s, l), nullptr, 10); }; // Parse long val; auto ret = parser.parse("1+2*3*(4-5+6)/7-8", val); REQUIRE(ret == true); REQUIRE(val == -3); } bool exact(Grammar& g, const char* d, const char* s) { auto l = strlen(s); auto r = g[d].parse(s, l); return r.ret && r.len == l; } Grammar& make_peg_grammar() { return PEGParser::grammar(); } TEST_CASE("PEG Grammar", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Grammar", " Definition <- a / ( b c ) / d \n rule2 <- [a-zA-Z][a-z0-9-]+ ") == true); } TEST_CASE("PEG Definition", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Definition", "Definition <- a / (b c) / d ") == true); REQUIRE(exact(g, "Definition", "Definition <- a / b c / d ") == true); REQUIRE(exact(g, "Definition", "Definition ") == false); REQUIRE(exact(g, "Definition", " ") == false); REQUIRE(exact(g, "Definition", "") == false); REQUIRE(exact(g, "Definition", "Definition = a / (b c) / d ") == false); } TEST_CASE("PEG Expression", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Expression", "a / (b c) / d ") == true); REQUIRE(exact(g, "Expression", "a / b c / d ") == true); REQUIRE(exact(g, "Expression", "a b ") == true); REQUIRE(exact(g, "Expression", "") == true); REQUIRE(exact(g, "Expression", " ") == false); REQUIRE(exact(g, "Expression", " a b ") == false); } TEST_CASE("PEG Sequence", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Sequence", "a b c d ") == true); REQUIRE(exact(g, "Sequence", "") == true); REQUIRE(exact(g, "Sequence", "!") == false); REQUIRE(exact(g, "Sequence", "<-") == false); REQUIRE(exact(g, "Sequence", " a") == false); } TEST_CASE("PEG Prefix", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Prefix", "&[a]") == true); REQUIRE(exact(g, "Prefix", "![']") == true); REQUIRE(exact(g, "Prefix", "-[']") == false); REQUIRE(exact(g, "Prefix", "") == false); REQUIRE(exact(g, "Sequence", " a") == false); } TEST_CASE("PEG Suffix", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Suffix", "aaa ") == true); REQUIRE(exact(g, "Suffix", "aaa? ") == true); REQUIRE(exact(g, "Suffix", "aaa* ") == true); REQUIRE(exact(g, "Suffix", "aaa+ ") == true); REQUIRE(exact(g, "Suffix", ". + ") == true); REQUIRE(exact(g, "Suffix", "?") == false); REQUIRE(exact(g, "Suffix", "") == false); REQUIRE(exact(g, "Sequence", " a") == false); } TEST_CASE("PEG Primary", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Primary", "_Identifier0_ ") == true); REQUIRE(exact(g, "Primary", "_Identifier0_<-") == false); REQUIRE(exact(g, "Primary", "( _Identifier0_ _Identifier1_ )") == true); REQUIRE(exact(g, "Primary", "'Literal String'") == true); REQUIRE(exact(g, "Primary", "\"Literal String\"") == true); REQUIRE(exact(g, "Primary", "[a-zA-Z]") == true); REQUIRE(exact(g, "Primary", ".") == true); REQUIRE(exact(g, "Primary", "") == false); REQUIRE(exact(g, "Primary", " ") == false); REQUIRE(exact(g, "Primary", " a") == false); REQUIRE(exact(g, "Primary", "") == false); } TEST_CASE("PEG Identifier", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Identifier", "_Identifier0_ ") == true); REQUIRE(exact(g, "Identifier", "0Identifier_ ") == false); REQUIRE(exact(g, "Identifier", "Iden|t ") == false); REQUIRE(exact(g, "Identifier", " ") == false); REQUIRE(exact(g, "Identifier", " a") == false); REQUIRE(exact(g, "Identifier", "") == false); } TEST_CASE("PEG IdentStart", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "IdentStart", "_") == true); REQUIRE(exact(g, "IdentStart", "a") == true); REQUIRE(exact(g, "IdentStart", "Z") == true); REQUIRE(exact(g, "IdentStart", "") == false); REQUIRE(exact(g, "IdentStart", " ") == false); REQUIRE(exact(g, "IdentStart", "0") == false); } TEST_CASE("PEG IdentRest", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "IdentRest", "_") == true); REQUIRE(exact(g, "IdentRest", "a") == true); REQUIRE(exact(g, "IdentRest", "Z") == true); REQUIRE(exact(g, "IdentRest", "") == false); REQUIRE(exact(g, "IdentRest", " ") == false); REQUIRE(exact(g, "IdentRest", "0") == true); } TEST_CASE("PEG Literal", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Literal", "'abc' ") == true); REQUIRE(exact(g, "Literal", "'a\\nb\\tc' ") == true); REQUIRE(exact(g, "Literal", "'a\\277\tc' ") == true); REQUIRE(exact(g, "Literal", "'a\\77\tc' ") == true); REQUIRE(exact(g, "Literal", "'a\\80\tc' ") == false); REQUIRE(exact(g, "Literal", "'\n' ") == true); REQUIRE(exact(g, "Literal", "'a\\'b' ") == true); REQUIRE(exact(g, "Literal", "'a'b' ") == false); REQUIRE(exact(g, "Literal", "'a\"'b' ") == false); REQUIRE(exact(g, "Literal", "\"'\\\"abc\\\"'\" ") == true); REQUIRE(exact(g, "Literal", "\"'\"abc\"'\" ") == false); REQUIRE(exact(g, "Literal", "abc") == false); REQUIRE(exact(g, "Literal", "") == false); REQUIRE(exact(g, "Literal", "日本語") == false); } TEST_CASE("PEG Class", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Class", "[]") == true); REQUIRE(exact(g, "Class", "[a]") == true); REQUIRE(exact(g, "Class", "[a-z]") == true); REQUIRE(exact(g, "Class", "[az]") == true); REQUIRE(exact(g, "Class", "[a-zA-Z-]") == true); REQUIRE(exact(g, "Class", "[a-zA-Z-0-9]") == true); REQUIRE(exact(g, "Class", "[a-]") == false); REQUIRE(exact(g, "Class", "[-a]") == true); REQUIRE(exact(g, "Class", "[") == false); REQUIRE(exact(g, "Class", "[a") == false); REQUIRE(exact(g, "Class", "]") == false); REQUIRE(exact(g, "Class", "a]") == false); REQUIRE(exact(g, "Class", "あ-ん") == false); REQUIRE(exact(g, "Class", "[-+]") == true); REQUIRE(exact(g, "Class", "[+-]") == false); } TEST_CASE("PEG Range", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Range", "a") == true); REQUIRE(exact(g, "Range", "a-z") == true); REQUIRE(exact(g, "Range", "az") == false); REQUIRE(exact(g, "Range", "") == false); REQUIRE(exact(g, "Range", "a-") == false); REQUIRE(exact(g, "Range", "-a") == false); } TEST_CASE("PEG Char", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Char", "\\n") == true); REQUIRE(exact(g, "Char", "\\r") == true); REQUIRE(exact(g, "Char", "\\t") == true); REQUIRE(exact(g, "Char", "\\'") == true); REQUIRE(exact(g, "Char", "\\\"") == true); REQUIRE(exact(g, "Char", "\\[") == true); REQUIRE(exact(g, "Char", "\\]") == true); REQUIRE(exact(g, "Char", "\\\\") == true); REQUIRE(exact(g, "Char", "\\000") == true); REQUIRE(exact(g, "Char", "\\377") == true); REQUIRE(exact(g, "Char", "\\477") == false); REQUIRE(exact(g, "Char", "\\087") == false); REQUIRE(exact(g, "Char", "\\079") == false); REQUIRE(exact(g, "Char", "\\00") == true); REQUIRE(exact(g, "Char", "\\77") == true); REQUIRE(exact(g, "Char", "\\80") == false); REQUIRE(exact(g, "Char", "\\08") == false); REQUIRE(exact(g, "Char", "\\0") == true); REQUIRE(exact(g, "Char", "\\7") == true); REQUIRE(exact(g, "Char", "\\8") == false); REQUIRE(exact(g, "Char", "a") == true); REQUIRE(exact(g, "Char", ".") == true); REQUIRE(exact(g, "Char", "0") == true); REQUIRE(exact(g, "Char", "\\") == false); REQUIRE(exact(g, "Char", " ") == true); REQUIRE(exact(g, "Char", " ") == false); REQUIRE(exact(g, "Char", "") == false); REQUIRE(exact(g, "Char", "あ") == false); } TEST_CASE("PEG Operators", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "LEFTARROW", "<-") == true); REQUIRE(exact(g, "SLASH", "/ ") == true); REQUIRE(exact(g, "AND", "& ") == true); REQUIRE(exact(g, "NOT", "! ") == true); REQUIRE(exact(g, "QUESTION", "? ") == true); REQUIRE(exact(g, "STAR", "* ") == true); REQUIRE(exact(g, "PLUS", "+ ") == true); REQUIRE(exact(g, "OPEN", "( ") == true); REQUIRE(exact(g, "CLOSE", ") ") == true); REQUIRE(exact(g, "DOT", ". ") == true); } TEST_CASE("PEG Comment", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Comment", "# Comment.\n") == true); REQUIRE(exact(g, "Comment", "# Comment.") == false); REQUIRE(exact(g, "Comment", " ") == false); REQUIRE(exact(g, "Comment", "a") == false); } TEST_CASE("PEG Space", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "Space", " ") == true); REQUIRE(exact(g, "Space", "\t") == true); REQUIRE(exact(g, "Space", "\n") == true); REQUIRE(exact(g, "Space", "") == false); REQUIRE(exact(g, "Space", "a") == false); } TEST_CASE("PEG EndOfLine", "[peg]") { auto g = PEGParser::grammar(); REQUIRE(exact(g, "EndOfLine", "\r\n") == true); REQUIRE(exact(g, "EndOfLine", "\n") == true); REQUIRE(exact(g, "EndOfLine", "\r") == true); REQUIRE(exact(g, "EndOfLine", " ") == false); REQUIRE(exact(g, "EndOfLine", "") == false); REQUIRE(exact(g, "EndOfLine", "a") == false); } TEST_CASE("PEG EndOfFile", "[peg]") { Grammar g = make_peg_grammar(); REQUIRE(exact(g, "EndOfFile", "") == true); REQUIRE(exact(g, "EndOfFile", " ") == false); } // vim: et ts=4 sw=4 cin cino={1s ff=unix