#include #include #include //////////////////////////////////////////////////////////////////////////////////////////////////// TEST_CASE("[tokenizer] Simple strings are tokenized correctly", "[tokenizer]") { std::stringstream s(" identifier 5 \n-51\t 0 1 100 200 -300 -400"); tokenize::Tokenizer<> p("input", s); REQUIRE(p.get() == "identifier"); REQUIRE(p.get() == 5u); REQUIRE(p.get() == -51); REQUIRE(p.get() == false); REQUIRE(p.get() == true); REQUIRE(p.get() == 100); REQUIRE(p.get() == 200u); REQUIRE(p.get() == -300); REQUIRE_THROWS_AS(p.get(), tokenize::TokenizerException); } //////////////////////////////////////////////////////////////////////////////////////////////////// TEST_CASE("[tokenizer] Tokenizing exceptions are correctly reported", "[tokenizer]") { std::stringstream s(" identifier 5 \n-51\t 0 1 100 200 -300 -400"); tokenize::Tokenizer<> p("input", s); REQUIRE_NOTHROW(p.expect("identifier")); REQUIRE_NOTHROW(p.expect(5u)); REQUIRE_NOTHROW(p.expect(-51)); REQUIRE_NOTHROW(p.expect(false)); REQUIRE_NOTHROW(p.expect(true)); REQUIRE_NOTHROW(p.expect(100)); REQUIRE_NOTHROW(p.expect(200u)); REQUIRE_NOTHROW(p.expect(-300)); REQUIRE_THROWS_AS(p.expect(-400), tokenize::TokenizerException); p.seek(0); REQUIRE_THROWS_AS(p.expect("error"), tokenize::TokenizerException); p.seek(14); REQUIRE_THROWS_AS(p.expect(6u), tokenize::TokenizerException); p.seek(17); REQUIRE_THROWS_AS(p.expect(-50), tokenize::TokenizerException); p.seek(24); REQUIRE_THROWS_AS(p.expect(true), tokenize::TokenizerException); p.seek(26); REQUIRE_THROWS_AS(p.expect(false), tokenize::TokenizerException); p.seek(28); REQUIRE_THROWS_AS(p.expect(101), tokenize::TokenizerException); p.seek(31); REQUIRE_THROWS_AS(p.expect(201), tokenize::TokenizerException); p.seek(34); REQUIRE_THROWS_AS(p.expect(-299), tokenize::TokenizerException); } //////////////////////////////////////////////////////////////////////////////////////////////////// TEST_CASE("[tokenizer] While tokenizing, the cursor position is as expected", "[tokenizer]") { std::stringstream s(" identifier 5 \n-51\t 0 1"); tokenize::Tokenizer<> p("input", s); tokenize::StreamPosition pos; pos = p.position(); REQUIRE(p.testAndReturn("error") == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndReturn("identifier") == true); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip("error") == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip("identifier") == true); REQUIRE(p.position() == 12); pos = p.position(); REQUIRE(p.testAndReturn(6u) == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndReturn(5u) == true); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip(6u) == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip(5u) == true); REQUIRE(p.position() == 15); pos = p.position(); REQUIRE(p.testAndReturn(-50) == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndReturn(-51) == true); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip(-50) == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip(-51) == true); REQUIRE(p.position() == 22); pos = p.position(); REQUIRE(p.testAndReturn(true) == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndReturn(false) == true); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip(true) == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip(false) == true); REQUIRE(p.position() == 25); pos = p.position(); REQUIRE(p.testAndReturn(false) == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndReturn(true) == true); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip(false) == false); REQUIRE(p.position() == pos); REQUIRE(p.testAndSkip(true) == true); REQUIRE(p.position() == 27); } //////////////////////////////////////////////////////////////////////////////////////////////////// TEST_CASE("[tokenizer] The end of the input stream is correctly handled", "[tokenizer]") { std::stringstream s1("test"); tokenize::Tokenizer<> p1("input", s1); REQUIRE_NOTHROW(p1.expect("test")); REQUIRE_THROWS_AS(p1.get(), tokenize::TokenizerException); std::stringstream s2("test1 test2 test3"); tokenize::Tokenizer<> p2("input", s2); REQUIRE_NOTHROW(p2.expect("test1")); REQUIRE_NOTHROW(p2.expect("test2")); REQUIRE_NOTHROW(p2.expect("test3")); REQUIRE_THROWS_AS(p2.get(), tokenize::TokenizerException); std::stringstream s3("-127"); tokenize::Tokenizer<> p3("input", s3); p3.expect(-127); REQUIRE_THROWS_AS(p3.get(), tokenize::TokenizerException); std::stringstream s4("128 -1023 -4095"); tokenize::Tokenizer<> p4("input", s4); REQUIRE_NOTHROW(p4.expect(128)); REQUIRE_NOTHROW(p4.expect(-1023)); REQUIRE_NOTHROW(p4.expect(-4095)); REQUIRE_THROWS_AS(p4.get(), tokenize::TokenizerException); std::stringstream s5("0"); tokenize::Tokenizer<> p5("input", s5); p5.expect(false); REQUIRE_THROWS_AS(p5.get(), tokenize::TokenizerException); std::stringstream s6("0 1 0"); tokenize::Tokenizer<> p6("input", s6); REQUIRE_NOTHROW(p6.expect(false)); REQUIRE_NOTHROW(p6.expect(true)); REQUIRE_NOTHROW(p6.expect(false)); REQUIRE_THROWS_AS(p6.get(), tokenize::TokenizerException); } //////////////////////////////////////////////////////////////////////////////////////////////////// TEST_CASE("[tokenizer] While tokenizing, the cursor location is as expcected", "[tokenizer]") { std::stringstream s("123 \n4\ntest1\n test2\ntest3 \ntest4\n\n\n\n"); tokenize::Tokenizer<> p("input", s); const auto startPosition = p.position(); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 1u); REQUIRE(l.columnStart() == 1u); REQUIRE(p.currentCharacter() == '1'); } REQUIRE_NOTHROW(p.advance()); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 1u); REQUIRE(l.columnStart() == 2u); REQUIRE(p.currentCharacter() == '2'); } REQUIRE_NOTHROW(p.advance()); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 1u); REQUIRE(l.columnStart() == 3u); REQUIRE(p.currentCharacter() == '3'); } REQUIRE_NOTHROW(p.advance()); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 1u); REQUIRE(l.columnStart() == 4u); REQUIRE(p.currentCharacter() == ' '); } REQUIRE_NOTHROW(p.advance()); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 1u); REQUIRE(l.columnStart() == 5u); REQUIRE(p.currentCharacter() == '\n'); } REQUIRE_NOTHROW(p.advance()); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 2u); REQUIRE(l.columnStart() == 1u); REQUIRE(p.currentCharacter() == '4'); } REQUIRE_NOTHROW(p.advance()); REQUIRE_NOTHROW(p.expect("test1")); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 3u); REQUIRE(l.columnStart() == 6u); } REQUIRE_NOTHROW(p.expect("test2")); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 4u); REQUIRE(l.columnStart() == 7u); } REQUIRE_NOTHROW(p.expect("test3")); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 5u); REQUIRE(l.columnStart() == 6u); } REQUIRE_NOTHROW(p.skipLine()); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 6u); REQUIRE(l.columnStart() == 1u); } REQUIRE_NOTHROW(p.skipLine()); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 7u); REQUIRE(l.columnStart() == 1u); } REQUIRE_NOTHROW(p.skipWhiteSpace()); { auto l = tokenize::Location(p); REQUIRE(l.rowStart() == 10u); REQUIRE(l.columnStart() == 1u); REQUIRE(p.atEnd()); } p.reset(); REQUIRE(p.position() == startPosition); REQUIRE_FALSE(p.atEnd()); for (size_t i = 0; i < 5; i++) p.advance(); REQUIRE(p.position() == static_cast(5)); p.seek(static_cast(7)); REQUIRE(p.position() == static_cast(7)); REQUIRE_NOTHROW(p.expect("test1")); // TODO: test tokenizer with multiple sections } //////////////////////////////////////////////////////////////////////////////////////////////////// TEST_CASE("[tokenizer] Comments are correctly removed", "[tokenizer]") { std::stringstream s1("; comment at beginning\ntest1; comment in between\ntest2; comment at end"); tokenize::Tokenizer<> p1("input", s1); p1.removeComments(";", "\n", false); REQUIRE_NOTHROW(p1.expect("test1")); { auto l = tokenize::Location(p1); REQUIRE(l.rowStart() == 2u); REQUIRE(l.columnStart() == 6u); } REQUIRE_NOTHROW(p1.expect("test2")); { auto l = tokenize::Location(p1); REQUIRE(l.rowStart() == 3u); REQUIRE(l.columnStart() == 6u); } p1.skipWhiteSpace(); REQUIRE(p1.atEnd()); std::stringstream s2("test;"); tokenize::Tokenizer<> p2("input", s2); p2.removeComments(";", "\n", false); REQUIRE_NOTHROW(p2.expect("test")); p2.skipWhiteSpace(); REQUIRE(p2.atEnd()); std::stringstream s3("/* comment at start */ test1 /* comment in between */ test2 /*"); tokenize::Tokenizer<> p3("input", s3); p3.removeComments("/*", "*/", true); REQUIRE_NOTHROW(p3.expect("test1")); REQUIRE_NOTHROW(p3.expect("test2")); p3.skipWhiteSpace(); REQUIRE(p3.atEnd()); // Check that if there are no comments, the end is not accidentally truncated std::stringstream s4("test foo bar"); tokenize::Tokenizer<> p4("input", s4); p4.removeComments(";", "\n", false); REQUIRE_NOTHROW(p4.expect("test")); REQUIRE_NOTHROW(p4.expect("foo")); REQUIRE_NOTHROW(p4.expect("bar")); REQUIRE(p4.atEnd()); }