mirror of
				https://github.com/ethereum/solidity
				synced 2023-10-03 13:03:40 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			996 lines
		
	
	
		
			39 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			996 lines
		
	
	
		
			39 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
|     This file is part of solidity.
 | |
| 
 | |
|     solidity is free software: you can redistribute it and/or modify
 | |
|     it under the terms of the GNU General Public License as published by
 | |
|     the Free Software Foundation, either version 3 of the License, or
 | |
|     (at your option) any later version.
 | |
| 
 | |
|     solidity is distributed in the hope that it will be useful,
 | |
|     but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|     GNU General Public License for more details.
 | |
| 
 | |
|     You should have received a copy of the GNU General Public License
 | |
|     along with solidity.  If not, see <http://www.gnu.org/licenses/>.
 | |
| */
 | |
| /**
 | |
|  * @author Christian <c@ethdev.com>
 | |
|  * @date 2014
 | |
|  * Unit tests for the solidity scanner.
 | |
|  */
 | |
| 
 | |
| #include <liblangutil/Scanner.h>
 | |
| 
 | |
| #include <boost/test/unit_test.hpp>
 | |
| 
 | |
| using namespace std;
 | |
| using namespace solidity::langutil;
 | |
| 
 | |
| namespace solidity::langutil::test
 | |
| {
 | |
| 
 | |
| BOOST_AUTO_TEST_SUITE(ScannerTest)
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(test_empty)
 | |
| {
 | |
| 	Scanner scanner(CharStream{});
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(smoke_test)
 | |
| {
 | |
| 	Scanner scanner(CharStream("function break;765  \t  \"string1\",'string2'\nidentifier1", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Break);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Semicolon);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "765");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "string1");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "string2");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "identifier1");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(assembly_assign)
 | |
| {
 | |
| 	Scanner scanner(CharStream("let a := 1", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Let);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::AssemblyAssign);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "1");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(assembly_multiple_assign)
 | |
| {
 | |
| 	Scanner scanner(CharStream("let a, b, c := 1", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Let);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::AssemblyAssign);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "1");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(string_printable)
 | |
| {
 | |
| 	for (unsigned v = 0x20; v < 0x7e; v++) {
 | |
| 		string lit{static_cast<char>(v)};
 | |
| 		// Escape \ and " (since we are quoting with ")
 | |
| 		if (v == '\\' || v == '"')
 | |
| 			lit = string{'\\'} + lit;
 | |
| 		Scanner scanner(CharStream("  { \"" + lit + "\"", ""));
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentLiteral(), string{static_cast<char>(v)});
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	}
 | |
| 	// Special case of unescaped " for strings quoted with '
 | |
| 	Scanner scanner(CharStream("  { '\"'", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "\"");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(string_nonprintable)
 | |
| {
 | |
| 	for (unsigned v = 0; v < 0xff; v++) {
 | |
| 		// Skip the valid ones
 | |
| 		if (v >= 0x20 && v <= 0x7e)
 | |
| 			continue;
 | |
| 		string lit{static_cast<char>(v)};
 | |
| 		Scanner scanner(CharStream("  { \"" + lit + "\"", ""));
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 		if (v == '\n' || v == '\v' || v == '\f' || v == '\r')
 | |
| 			BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalStringEndQuote);
 | |
| 		else
 | |
| 			BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalCharacterInString);
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "");
 | |
| 	}
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(string_escapes)
 | |
| {
 | |
| 	Scanner scanner(CharStream("  { \"a\\x61\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "aa");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(string_escapes_all)
 | |
| {
 | |
| 	Scanner scanner(CharStream("  { \"a\\x61\\n\\r\\t\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "aa\n\r\t");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(string_escapes_legal_before_080)
 | |
| {
 | |
| 	Scanner scanner(CharStream("  { \"a\\b", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalEscapeSequence);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "");
 | |
| 	scanner.reset(CharStream("  { \"a\\f", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalEscapeSequence);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "");
 | |
| 	scanner.reset(CharStream("  { \"a\\v", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalEscapeSequence);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(string_escapes_with_zero)
 | |
| {
 | |
| 	Scanner scanner(CharStream("  { \"a\\x61\\x00abc\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), std::string("aa\0abc", 6));
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(string_escape_illegal)
 | |
| {
 | |
| 	Scanner scanner(CharStream(" bla \"\\x6rf\" (illegalescape)", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalEscapeSequence);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "");
 | |
| 	// TODO recovery from illegal tokens should be improved
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(hex_numbers)
 | |
| {
 | |
| 	Scanner scanner(CharStream("var x = 0x765432536763762734623472346;", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Var);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Assign);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "0x765432536763762734623472346");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Semicolon);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream("0x1234", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "0x1234");
 | |
| 	scanner.reset(CharStream("0X1234", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(octal_numbers)
 | |
| {
 | |
| 	Scanner scanner(CharStream("07", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 	scanner.reset(CharStream("007", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 	scanner.reset(CharStream("-07", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Sub);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	scanner.reset(CharStream("-.07", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Sub);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	scanner.reset(CharStream("0", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	scanner.reset(CharStream("0.1", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(scientific_notation)
 | |
| {
 | |
| 	Scanner scanner(CharStream("var x = 2e10;", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Var);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Assign);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "2e10");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Semicolon);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(leading_dot_in_identifier)
 | |
| {
 | |
| 	Scanner scanner(CharStream("function .a(", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Period);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream("function .a(", ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Period);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(middle_dot_in_identifier)
 | |
| {
 | |
| 	Scanner scanner(CharStream("function a..a(", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Period);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Period);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream("function a...a(", ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(trailing_dot_in_identifier)
 | |
| {
 | |
| 	Scanner scanner(CharStream("function a.(", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Period);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream("function a.(", ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(trailing_dot_in_numbers)
 | |
| {
 | |
| 	Scanner scanner(CharStream("2.5", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream("2.5e10", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream(".5", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream(".5e10", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream("2.", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Period);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(leading_underscore_decimal_is_identifier)
 | |
| {
 | |
| 	// Actual error is cought by SyntaxChecker.
 | |
| 	Scanner scanner(CharStream("_1.2", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(leading_underscore_decimal_after_dot_illegal)
 | |
| {
 | |
| 	// Actual error is cought by SyntaxChecker.
 | |
| 	Scanner scanner(CharStream("1._2", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 
 | |
| 	scanner.reset(CharStream("1._", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(leading_underscore_exp_are_identifier)
 | |
| {
 | |
| 	// Actual error is cought by SyntaxChecker.
 | |
| 	Scanner scanner(CharStream("_1e2", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(leading_underscore_exp_after_e_illegal)
 | |
| {
 | |
| 	// Actual error is cought by SyntaxChecker.
 | |
| 	Scanner scanner(CharStream("1e_2", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "1e_2");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(leading_underscore_hex_illegal)
 | |
| {
 | |
| 	Scanner scanner(CharStream("0x_abc", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(fixed_number_invalid_underscore_front)
 | |
| {
 | |
| 	// Actual error is cought by SyntaxChecker.
 | |
| 	Scanner scanner(CharStream("12._1234_1234", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(number_literals_with_trailing_underscore_at_eos)
 | |
| {
 | |
| 	// Actual error is cought by SyntaxChecker.
 | |
| 	Scanner scanner(CharStream("0x123_", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 
 | |
| 	scanner.reset(CharStream("123_", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 
 | |
| 	scanner.reset(CharStream("12.34_", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(negative_numbers)
 | |
| {
 | |
| 	Scanner scanner(CharStream("var x = -.2 + -0x78 + -7.3 + 8.9 + 2e-2;", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Var);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Assign);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Sub);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), ".2");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Add);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Sub);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "0x78");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Add);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Sub);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "7.3");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Add);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "8.9");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Add);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "2e-2");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Semicolon);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(locations)
 | |
| {
 | |
| 	Scanner scanner(CharStream("function_identifier has ; -0x743/*comment*/\n ident //comment", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().start, 0);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().end, 19);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().start, 20);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().end, 23);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Semicolon);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().start, 24);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().end, 25);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Sub);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().start, 27);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().end, 32);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().start, 45);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLocation().end, 50);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(ambiguities)
 | |
| {
 | |
| 	// test scanning of some operators which need look-ahead
 | |
| 	Scanner scanner(CharStream("<=" "<" "+ +=a++ =>" "<<" ">>" " >>=" ">>>" ">>>=" " >>>>>=><<=", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LessThanOrEqual);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LessThan);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Add);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::AssignAdd);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Inc);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::DoubleArrow);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SHL);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SAR);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::AssignSar);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SHR);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::AssignShr);
 | |
| 	// the last "monster" token combination
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SHR);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::AssignSar);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::GreaterThan);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::AssignShl);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(documentation_comments_parsed_begin)
 | |
| {
 | |
| 	Scanner scanner(CharStream("/// Send $(value / 1000) chocolates to the user", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "Send $(value / 1000) chocolates to the user");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(multiline_documentation_comments_parsed_begin)
 | |
| {
 | |
| 	Scanner scanner(CharStream("/** Send $(value / 1000) chocolates to the user*/", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "Send $(value / 1000) chocolates to the user");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(documentation_comments_parsed)
 | |
| {
 | |
| 	Scanner scanner(CharStream("some other tokens /// Send $(value / 1000) chocolates to the user", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "Send $(value / 1000) chocolates to the user");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(multiline_documentation_comments_parsed)
 | |
| {
 | |
| 	Scanner scanner(CharStream("some other tokens /**\n"
 | |
| 							   "* Send $(value / 1000) chocolates to the user\n"
 | |
| 							   "*/", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), " Send $(value / 1000) chocolates to the user");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(multiline_documentation_no_stars)
 | |
| {
 | |
| 	Scanner scanner(CharStream("some other tokens /**\n"
 | |
| 							   " Send $(value / 1000) chocolates to the user\n"
 | |
| 							   "*/", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "Send $(value / 1000) chocolates to the user");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(multiline_documentation_whitespace_hell)
 | |
| {
 | |
| 	Scanner scanner(CharStream("some other tokens /** \t \r \n"
 | |
| 							   "\t \r  * Send $(value / 1000) chocolates to the user\n"
 | |
| 							   "*/", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), " Send $(value / 1000) chocolates to the user");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(comment_before_eos)
 | |
| {
 | |
| 	Scanner scanner(CharStream("//", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(documentation_comment_before_eos)
 | |
| {
 | |
| 	Scanner scanner(CharStream("///", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(empty_multiline_comment)
 | |
| {
 | |
| 	Scanner scanner(CharStream("/**/", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(empty_multiline_documentation_comment_before_eos)
 | |
| {
 | |
| 	Scanner scanner(CharStream("/***/", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::EOS);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(comments_mixed_in_sequence)
 | |
| {
 | |
| 	Scanner scanner(CharStream("hello_world ///documentation comment \n"
 | |
| 							   "//simple comment \n"
 | |
| 							   "<<", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SHL);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "documentation comment ");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(ether_subdenominations)
 | |
| {
 | |
| 	Scanner scanner(CharStream("wei gwei ether", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::SubWei);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SubGwei);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SubEther);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(time_subdenominations)
 | |
| {
 | |
| 	Scanner scanner(CharStream("seconds minutes hours days weeks years", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::SubSecond);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SubMinute);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SubHour);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SubDay);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SubWeek);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::SubYear);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(empty_comment)
 | |
| {
 | |
| 	Scanner scanner(CharStream("//\ncontract{}", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "");
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Contract);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::RBrace);
 | |
| 
 | |
| }
 | |
| 
 | |
| // Unicode string escapes
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(valid_unicode_string_escape)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ \"\\u00DAnicode\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), std::string("\xC3\x9Anicode", 8));
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(valid_unicode_string_escape_7f)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ \"\\u007Fnicode\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), std::string("\x7Fnicode", 7));
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(valid_unicode_string_escape_7ff)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ \"\\u07FFnicode\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), std::string("\xDF\xBFnicode", 8));
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(valid_unicode_string_escape_ffff)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ \"\\uFFFFnicode\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), std::string("\xEF\xBF\xBFnicode", 9));
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(invalid_short_unicode_string_escape)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ \"\\uFFnicode\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| }
 | |
| 
 | |
| // Unicode string literal
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(unicode_prefix_only)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ unicode", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);
 | |
| 	scanner.reset(CharStream("{ unicode", ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "unicode");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(unicode_invalid_space)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ unicode ", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(unicode_invalid_token)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ unicode test", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);
 | |
| 	scanner.reset(CharStream("{ unicode test", ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "unicode");
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "test");
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(valid_unicode_literal)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ unicode\"Hello 😃\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::UnicodeStringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), std::string("Hello \xf0\x9f\x98\x83", 10));
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(valid_nonprintable_in_unicode_literal)
 | |
| {
 | |
| 	// Non-printable characters are allowed in unicode strings...
 | |
| 	Scanner scanner(CharStream("{ unicode\"Hello \007😃\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::UnicodeStringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), std::string("Hello \x07\xf0\x9f\x98\x83", 11));
 | |
| }
 | |
| 
 | |
| // Hex string literal
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(hex_prefix_only)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ hex", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);
 | |
| 	scanner.reset(CharStream("{ hex", ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(hex_invalid_space)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ hex ", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(hex_invalid_token)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ hex test", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);
 | |
| 	scanner.reset(CharStream("{ hex test", ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(valid_hex_literal)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ hex\"00112233FF\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::HexStringLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentLiteral(), std::string("\x00\x11\x22\x33\xFF", 5));
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(invalid_short_hex_literal)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ hex\"00112233F\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalHexString);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(invalid_hex_literal_with_space)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ hex\"00112233FF \"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalHexString);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(invalid_hex_literal_with_wrong_quotes)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ hex\"00112233FF'", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalHexString);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(invalid_hex_literal_nonhex_string)
 | |
| {
 | |
| 	Scanner scanner(CharStream("{ hex\"hello\"", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalHexString);
 | |
| }
 | |
| 
 | |
| // Comments
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(invalid_multiline_comment_close)
 | |
| {
 | |
| 	// This used to parse as "comment", "identifier"
 | |
| 	Scanner scanner(CharStream("/** / x", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(multiline_doc_comment_at_eos)
 | |
| {
 | |
| 	// This used to parse as "whitespace"
 | |
| 	Scanner scanner(CharStream("/**", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(multiline_comment_at_eos)
 | |
| {
 | |
| 	Scanner scanner(CharStream("/*", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(regular_line_break_in_single_line_comment)
 | |
| {
 | |
| 	for (auto const& nl: {"\r", "\n", "\r\n"})
 | |
| 	{
 | |
| 		Scanner scanner(CharStream("// abc " + string(nl) + " def ", ""));
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "");
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(irregular_line_breaks_in_single_line_comment)
 | |
| {
 | |
| 	for (auto const& nl: {"\v", "\f", "\xE2\x80\xA8", "\xE2\x80\xA9"})
 | |
| 	{
 | |
| 		Scanner scanner(CharStream("// abc " + string(nl) + " def ", ""));
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "");
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 		for (size_t i = 0; i < string(nl).size() - 1; i++)
 | |
| 			BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(regular_line_breaks_in_single_line_doc_comment)
 | |
| {
 | |
| 	for (auto const& nl: {"\r", "\n", "\r\n"})
 | |
| 	{
 | |
| 		Scanner scanner(CharStream("/// abc " + string(nl) + " def ", ""));
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "abc ");
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(regular_line_breaks_in_multiline_doc_comment)
 | |
| {
 | |
| 	// Test CR, LF, CRLF as line valid terminators for code comments.
 | |
| 	// Any accepted non-LF is being canonicalized to LF.
 | |
| 	for (auto const& nl : {"\r"s, "\n"s, "\r\n"s})
 | |
| 	{
 | |
| 		Scanner scanner{CharStream{"/// Hello" + nl + "/// World" + nl + "ident", ""}};
 | |
| 		auto const& lit = scanner.currentCommentLiteral();
 | |
| 		BOOST_CHECK_EQUAL(lit, "Hello\n World");
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "Hello\n World");
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "ident");
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(irregular_line_breaks_in_single_line_doc_comment)
 | |
| {
 | |
| 	for (auto const& nl: {"\v", "\f", "\xE2\x80\xA8", "\xE2\x80\xA9"})
 | |
| 	{
 | |
| 		Scanner scanner(CharStream("/// abc " + string(nl) + " def ", ""));
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "abc ");
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 		for (size_t i = 0; i < string(nl).size() - 1; i++)
 | |
| 			BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(regular_line_breaks_in_strings)
 | |
| {
 | |
| 	for (auto const& nl: {"\r"s, "\n"s, "\r\n"s})
 | |
| 	{
 | |
| 		Scanner scanner(CharStream("\"abc " + nl + " def\"", ""));
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(irregular_line_breaks_in_strings)
 | |
| {
 | |
| 	for (auto const& nl: {"\v", "\f", "\xE2\x80\xA8", "\xE2\x80\xA9"})
 | |
| 	{
 | |
| 		Scanner scanner(CharStream("\"abc " + string(nl) + " def\"", ""));
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
 | |
| 		for (size_t i = 0; i < string(nl).size(); i++)
 | |
| 			BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
 | |
| 		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(solidity_keywords)
 | |
| {
 | |
| 	// These are tokens which have a different meaning in Yul.
 | |
| 	string keywords = "return byte bool address var in true false leave switch case default";
 | |
| 	Scanner scanner(CharStream(keywords, ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Return);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Byte);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Bool);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Address);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Var);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::In);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::TrueLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::FalseLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Switch);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Case);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Default);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream(keywords, ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::TrueLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::FalseLiteral);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Leave);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Switch);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Case);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Default);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(yul_keyword_like)
 | |
| {
 | |
| 	Scanner scanner(CharStream("leave.function", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Period);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream("leave.function", ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(yul_identifier_with_dots)
 | |
| {
 | |
| 	Scanner scanner(CharStream("mystorage.slot := 1", ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Period);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::AssemblyAssign);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream("mystorage.slot := 1", ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::AssemblyAssign);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Number);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(yul_function)
 | |
| {
 | |
| 	string sig = "function f(a, b) -> x, y";
 | |
| 	Scanner scanner(CharStream(sig, ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::RParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::RightArrow);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream(sig, ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::RParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::RightArrow);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_CASE(yul_function_with_whitespace)
 | |
| {
 | |
| 	string sig = "function f (a, b) - > x, y";
 | |
| 	Scanner scanner(CharStream(sig, ""));
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::RParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Sub);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::GreaterThan);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| 	scanner.reset(CharStream(sig, ""));
 | |
| 	scanner.setScannerMode(ScannerKind::Yul);
 | |
| 	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::LParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::RParen);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Sub);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::GreaterThan);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Comma);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
 | |
| 	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
 | |
| }
 | |
| 
 | |
| BOOST_AUTO_TEST_SUITE_END()
 | |
| 
 | |
| } // end namespaces
 |