|
@@ -30,8 +30,7 @@ class MasterLexerStateTest : public ::testing::Test {
|
|
|
protected:
|
|
|
MasterLexerStateTest() : common_options(MasterLexer::INITIAL_WS),
|
|
|
s_null(NULL),
|
|
|
- s_start(*State::getStartInstance(
|
|
|
- lexer, common_options)),
|
|
|
+ s_start(State::getInstance(State::Start)),
|
|
|
s_crlf(State::getInstance(State::CRLF)),
|
|
|
s_string(State::getInstance(State::String)),
|
|
|
options(MasterLexer::NONE),
|
|
@@ -65,18 +64,18 @@ eofCheck(const State& state, MasterLexer& lexer) {
|
|
|
TEST_F(MasterLexerStateTest, startAndEnd) {
|
|
|
// A simple case: the input is empty, so we begin with start and
|
|
|
// are immediately done.
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
eofCheck(s_start, lexer);
|
|
|
}
|
|
|
|
|
|
TEST_F(MasterLexerStateTest, startToEOL) {
|
|
|
ss << "\n";
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
EXPECT_TRUE(s_start.wasLastEOL(lexer));
|
|
|
EXPECT_EQ(Token::END_OF_LINE, s_start.getToken(lexer).getType());
|
|
|
|
|
|
// The next lexer session will reach EOF. Same eof check should pass.
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
eofCheck(s_start, lexer);
|
|
|
}
|
|
|
|
|
@@ -85,20 +84,17 @@ TEST_F(MasterLexerStateTest, space) {
|
|
|
// twice; at the second iteration, it's a white space at the beginning
|
|
|
// of line, but since we don't specify INITIAL_WS option, it's treated as
|
|
|
// normal space and ignored.
|
|
|
- State::getStartInstance(lexer, MasterLexer::NONE);
|
|
|
for (size_t i = 0; i < 2; ++i) {
|
|
|
ss << " \t\n";
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, MasterLexer::NONE));
|
|
|
EXPECT_TRUE(s_start.wasLastEOL(lexer));
|
|
|
EXPECT_EQ(Token::END_OF_LINE, s_start.getToken(lexer).getType());
|
|
|
}
|
|
|
|
|
|
// Now we specify the INITIAL_WS option. It will be recognized and the
|
|
|
// corresponding token will be returned.
|
|
|
- State::getStartInstance(lexer, common_options);
|
|
|
ss << " ";
|
|
|
- options = MasterLexer::INITIAL_WS;
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, MasterLexer::INITIAL_WS));
|
|
|
EXPECT_FALSE(s_start.wasLastEOL(lexer));
|
|
|
EXPECT_EQ(Token::INITIAL_WS, s_start.getToken(lexer).getType());
|
|
|
}
|
|
@@ -106,55 +102,55 @@ TEST_F(MasterLexerStateTest, space) {
|
|
|
TEST_F(MasterLexerStateTest, parentheses) {
|
|
|
ss << "\n(\na\n )\n "; // 1st \n is to check if 'was EOL' is set to false
|
|
|
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer)); // handle \n
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options)); // handle \n
|
|
|
|
|
|
// Now handle '('. It skips \n and recognize 'a' as string
|
|
|
EXPECT_EQ(0, s_start.getParenCount(lexer)); // check pre condition
|
|
|
- EXPECT_EQ(&s_string, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(&s_string, s_start.handle(lexer, common_options));
|
|
|
EXPECT_EQ(1, s_start.getParenCount(lexer)); // check post condition
|
|
|
EXPECT_FALSE(s_start.wasLastEOL(lexer));
|
|
|
|
|
|
// skip 'a' (note: until #2373 it's actually skipped as part of the '('
|
|
|
// handling)
|
|
|
- s_string.handle(lexer);
|
|
|
+ s_string.handle(lexer, common_options);
|
|
|
|
|
|
// Then handle ')'. '\n' before ')' isn't recognized because
|
|
|
// it's canceled due to the '('. Likewise, the space after the '\n'
|
|
|
// shouldn't be recognized but should be just ignored.
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
EXPECT_EQ(0, s_start.getParenCount(lexer));
|
|
|
|
|
|
// Now, temporarily disabled options are restored: Both EOL and the
|
|
|
// initial WS are recognized
|
|
|
EXPECT_EQ(Token::END_OF_LINE, s_start.getToken(lexer).getType());
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
EXPECT_EQ(Token::INITIAL_WS, s_start.getToken(lexer).getType());
|
|
|
}
|
|
|
|
|
|
TEST_F(MasterLexerStateTest, nestedParentheses) {
|
|
|
// This is an unusual, but allowed (in this implementation) case.
|
|
|
ss << "(a(b)\n c)\n ";
|
|
|
- EXPECT_EQ(&s_string, s_start.handle(lexer)); // consume '('
|
|
|
- s_string.handle(lexer); // consume 'a'
|
|
|
- EXPECT_EQ(&s_string, s_start.handle(lexer)); // consume '('
|
|
|
- s_string.handle(lexer); // consume 'b'
|
|
|
+ EXPECT_EQ(&s_string, s_start.handle(lexer, common_options)); // consume '('
|
|
|
+ s_string.handle(lexer, common_options); // consume 'a'
|
|
|
+ EXPECT_EQ(&s_string, s_start.handle(lexer, common_options)); // consume '('
|
|
|
+ s_string.handle(lexer, common_options); // consume 'b'
|
|
|
EXPECT_EQ(2, s_start.getParenCount(lexer)); // now the count is 2
|
|
|
|
|
|
// Close the inner most parentheses. count will be decreased, but option
|
|
|
// shouldn't be restored yet, so the intermediate EOL or initial WS won't
|
|
|
// be recognized.
|
|
|
- EXPECT_EQ(&s_string, s_start.handle(lexer)); // consume ')'
|
|
|
- s_string.handle(lexer); // consume 'c'
|
|
|
+ EXPECT_EQ(&s_string, s_start.handle(lexer, common_options)); // consume ')'
|
|
|
+ s_string.handle(lexer, common_options); // consume 'c'
|
|
|
EXPECT_EQ(1, s_start.getParenCount(lexer));
|
|
|
|
|
|
// Close the outermost parentheses. count will be reset to 0, and original
|
|
|
// options are restored.
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
|
|
|
// Now, temporarily disabled options are restored: Both EOL and the
|
|
|
// initial WS are recognized
|
|
|
EXPECT_EQ(Token::END_OF_LINE, s_start.getToken(lexer).getType());
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
EXPECT_EQ(Token::INITIAL_WS, s_start.getToken(lexer).getType());
|
|
|
}
|
|
|
|
|
@@ -163,13 +159,13 @@ TEST_F(MasterLexerStateTest, unbalancedParentheses) {
|
|
|
// correctly canceled after detecting the error.
|
|
|
ss << "\n)";
|
|
|
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer)); // consume '\n'
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options)); // consume '\n'
|
|
|
EXPECT_TRUE(s_start.wasLastEOL(lexer)); // this \n was remembered
|
|
|
|
|
|
// Now checking ')'. The result should be error, count shouldn't be
|
|
|
// changed. "last EOL" should be canceled.
|
|
|
EXPECT_EQ(0, s_start.getParenCount(lexer));
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
EXPECT_EQ(0, s_start.getParenCount(lexer));
|
|
|
ASSERT_EQ(Token::ERROR, s_start.getToken(lexer).getType());
|
|
|
EXPECT_EQ(Token::UNBALANCED_PAREN, s_start.getToken(lexer).getErrorCode());
|
|
@@ -177,10 +173,10 @@ TEST_F(MasterLexerStateTest, unbalancedParentheses) {
|
|
|
|
|
|
// Reach EOF with a dangling open parenthesis.
|
|
|
ss << "(a";
|
|
|
- EXPECT_EQ(&s_string, s_start.handle(lexer)); // consume '('
|
|
|
- s_string.handle(lexer); // consume 'a'
|
|
|
+ EXPECT_EQ(&s_string, s_start.handle(lexer, common_options)); // consume '('
|
|
|
+ s_string.handle(lexer, common_options); // consume 'a'
|
|
|
EXPECT_EQ(1, s_start.getParenCount(lexer));
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer)); // reach EOF
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options)); // reach EOF
|
|
|
ASSERT_EQ(Token::ERROR, s_start.getToken(lexer).getType());
|
|
|
EXPECT_EQ(Token::UNBALANCED_PAREN, s_start.getToken(lexer).getErrorCode());
|
|
|
EXPECT_EQ(0, s_start.getParenCount(lexer)); // should be reset to 0
|
|
@@ -191,12 +187,12 @@ TEST_F(MasterLexerStateTest, startToComment) {
|
|
|
// the rest of the line, and recognize the new line. Note that the
|
|
|
// second ';' is simply ignored.
|
|
|
ss << " ;a;\n";
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
EXPECT_EQ(Token::END_OF_LINE, s_start.getToken(lexer).getType());
|
|
|
|
|
|
// Likewise, but the comment ends with EOF.
|
|
|
ss << ";a;";
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
EXPECT_EQ(Token::END_OF_FILE, s_start.getToken(lexer).getType());
|
|
|
}
|
|
|
|
|
@@ -205,39 +201,42 @@ TEST_F(MasterLexerStateTest, commentAfterParen) {
|
|
|
// other tests should also ensure that it works correctly, but we
|
|
|
// check it explicitly.
|
|
|
ss << "( ;this is a comment\na)\n";
|
|
|
- EXPECT_EQ(&s_string, s_start.handle(lexer)); // consume '(', skip comments
|
|
|
- s_string.handle(lexer); // consume 'a'
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer)); // consume ')', see '\n'
|
|
|
+ // consume '(', skip comments, consume 'a', then consume ')'
|
|
|
+ EXPECT_EQ(&s_string, s_start.handle(lexer, common_options));
|
|
|
+ s_string.handle(lexer, common_options);
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options));
|
|
|
EXPECT_EQ(Token::END_OF_LINE, s_start.getToken(lexer).getType());
|
|
|
}
|
|
|
|
|
|
TEST_F(MasterLexerStateTest, crlf) {
|
|
|
// A sequence of \r, \n is recognized as a single 'end-of-line'
|
|
|
ss << "\r\n";
|
|
|
- EXPECT_EQ(&s_crlf, s_start.handle(lexer)); // recognize '\r'
|
|
|
- EXPECT_EQ(s_null, s_crlf.handle(lexer)); // recognize '\n'
|
|
|
+ EXPECT_EQ(&s_crlf, s_start.handle(lexer, common_options)); // recognize '\r'
|
|
|
+ EXPECT_EQ(s_null, s_crlf.handle(lexer, common_options)); // recognize '\n'
|
|
|
EXPECT_EQ(Token::END_OF_LINE, s_start.getToken(lexer).getType());
|
|
|
EXPECT_TRUE(s_start.wasLastEOL(lexer));
|
|
|
|
|
|
// Single '\r' (not followed by \n) is recognized as a single 'end-of-line'
|
|
|
ss << "\r "; // then there will be "initial WS"
|
|
|
- State::getStartInstance(lexer, common_options); // specify usual options
|
|
|
- EXPECT_EQ(&s_crlf, s_start.handle(lexer)); // recognize '\r'
|
|
|
- EXPECT_EQ(s_null, s_crlf.handle(lexer)); // recognize ' ', "unget" it
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer)); // re-recognize ' '
|
|
|
+ EXPECT_EQ(&s_crlf, s_start.handle(lexer, common_options)); // recognize '\r'
|
|
|
+ // see ' ', "unget" it
|
|
|
+ EXPECT_EQ(s_null, s_crlf.handle(lexer, common_options));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options)); // recognize ' '
|
|
|
EXPECT_EQ(Token::INITIAL_WS, s_start.getToken(lexer).getType());
|
|
|
|
|
|
ss << "\r;comment\na";
|
|
|
- EXPECT_EQ(&s_crlf, s_start.handle(lexer)); // recognize '\r'
|
|
|
- EXPECT_EQ(s_null, s_crlf.handle(lexer)); // skip comments, recognize '\n'
|
|
|
+ EXPECT_EQ(&s_crlf, s_start.handle(lexer, common_options)); // recognize '\r'
|
|
|
+ // skip comments, recognize '\n'
|
|
|
+ EXPECT_EQ(s_null, s_crlf.handle(lexer, common_options));
|
|
|
EXPECT_EQ(Token::END_OF_LINE, s_start.getToken(lexer).getType());
|
|
|
- EXPECT_EQ(&s_string, s_start.handle(lexer));
|
|
|
+ EXPECT_EQ(&s_string, s_start.handle(lexer, common_options));
|
|
|
|
|
|
// \r then EOF
|
|
|
ss << "\r";
|
|
|
- EXPECT_EQ(&s_crlf, s_start.handle(lexer)); // recognize '\r'
|
|
|
- EXPECT_EQ(s_null, s_crlf.handle(lexer)); // see EOF, then "unget" it
|
|
|
- EXPECT_EQ(s_null, s_start.handle(lexer)); // re-recognize EOF
|
|
|
+ EXPECT_EQ(&s_crlf, s_start.handle(lexer, common_options)); // recognize '\r'
|
|
|
+ // see EOF, then "unget" it
|
|
|
+ EXPECT_EQ(s_null, s_crlf.handle(lexer, common_options));
|
|
|
+ EXPECT_EQ(s_null, s_start.handle(lexer, common_options)); // recognize EOF
|
|
|
EXPECT_EQ(Token::END_OF_FILE, s_start.getToken(lexer).getType());
|
|
|
}
|
|
|
|