mirror of
https://github.com/ethereum/solidity
synced 2023-10-03 13:03:40 +00:00
c21265f9f8
Co-authored-by: Kamil Śliwak <cameel2@gmail.com>
1032 lines
39 KiB
C++
1032 lines
39 KiB
C++
/*
|
|
This file is part of solidity.
|
|
|
|
solidity is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
solidity is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with solidity. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
/**
|
|
* @author Christian <c@ethdev.com>
|
|
* @date 2014
|
|
* Unit tests for the solidity scanner.
|
|
*/
|
|
|
|
#include <liblangutil/Scanner.h>
|
|
|
|
#include <boost/test/unit_test.hpp>
|
|
|
|
using namespace std;
|
|
using namespace solidity::langutil;
|
|
|
|
namespace solidity::langutil::test
|
|
{
|
|
|
|
BOOST_AUTO_TEST_SUITE(ScannerTest)
|
|
|
|
// A scanner over a value-initialised (empty) stream is expected to sit on EOS right away.
BOOST_AUTO_TEST_CASE(test_empty)
{
	CharStream emptyInput{};
	Scanner lexer(emptyInput);
	auto const firstToken = lexer.currentToken();
	BOOST_CHECK_EQUAL(firstToken, Token::EOS);
}
|
|
|
|
// Walks one input that mixes keywords, punctuation, a number, both string quote styles
// and an identifier, checking token kinds and the literals attached to them.
BOOST_AUTO_TEST_CASE(smoke_test)
{
	std::string const source = "function break;765 \t \"string1\",'string2'\nidentifier1";
	CharStream input(source, "");
	Scanner lexer(input);

	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::Function);
	for (Token const expected: {Token::Break, Token::Semicolon, Token::Number})
		BOOST_CHECK_EQUAL(lexer.next(), expected);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), "765");

	// Double-quoted and single-quoted strings, separated by a comma.
	BOOST_CHECK_EQUAL(lexer.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), "string1");
	BOOST_CHECK_EQUAL(lexer.next(), Token::Comma);
	BOOST_CHECK_EQUAL(lexer.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), "string2");

	// The identifier sits on the second input line.
	BOOST_CHECK_EQUAL(lexer.next(), Token::Identifier);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), "identifier1");
	BOOST_CHECK_EQUAL(lexer.next(), Token::EOS);
}
|
|
|
|
// ":=" is expected to be scanned as one AssemblyAssign token.
BOOST_AUTO_TEST_CASE(assembly_assign)
{
	std::string const source = "let a := 1";
	CharStream input(source, "");
	Scanner lexer(input);

	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::Let);
	for (Token const expected: {Token::Identifier, Token::AssemblyAssign, Token::Number})
		BOOST_CHECK_EQUAL(lexer.next(), expected);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), "1");
	BOOST_CHECK_EQUAL(lexer.next(), Token::EOS);
}
|
|
|
|
// Same as assembly_assign, but with a comma-separated list of targets left of ":=".
BOOST_AUTO_TEST_CASE(assembly_multiple_assign)
{
	std::string const source = "let a, b, c := 1";
	CharStream input(source, "");
	Scanner lexer(input);

	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::Let);
	for (Token const expected: {
		Token::Identifier,
		Token::Comma,
		Token::Identifier,
		Token::Comma,
		Token::Identifier,
		Token::AssemblyAssign,
		Token::Number
	})
		BOOST_CHECK_EQUAL(lexer.next(), expected);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), "1");
	BOOST_CHECK_EQUAL(lexer.next(), Token::EOS);
}
|
|
|
|
// Every printable ASCII character, 0x20 (space) through 0x7e ('~') inclusive, is expected to
// be accepted inside a double-quoted string literal and to show up unchanged in the literal.
BOOST_AUTO_TEST_CASE(string_printable)
{
	// The upper bound is inclusive: string_nonprintable skips exactly 0x20..0x7e, so an
	// exclusive bound here would leave '~' untested by both cases.
	for (unsigned v = 0x20; v <= 0x7e; v++)
	{
		string lit{static_cast<char>(v)};
		// Escape \ and " (since we are quoting with ")
		if (v == '\\' || v == '"')
			lit = string{'\\'} + lit;
		CharStream stream(" { \"" + lit + "\"", "");
		Scanner scanner(stream);
		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
		BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
		// The scanned literal holds the raw character, without the escaping backslash.
		BOOST_CHECK_EQUAL(scanner.currentLiteral(), string{static_cast<char>(v)});
		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
	}

	// Special case of unescaped " for strings quoted with '
	CharStream stream(" { '\"'", "");
	Scanner scanner(stream);
	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(scanner.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(scanner.currentLiteral(), "\"");
	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
}
|
|
|
|
// Every byte value outside the printable ASCII range 0x20..0x7e is expected to make a
// regular (non-unicode) string literal illegal.
BOOST_AUTO_TEST_CASE(string_nonprintable)
{
	// The bound is inclusive so that the last byte value, 0xff, is exercised as well.
	for (unsigned v = 0; v <= 0xff; v++)
	{
		// Skip the valid ones
		if (v >= 0x20 && v <= 0x7e)
			continue;
		string lit{static_cast<char>(v)};
		CharStream stream(" { \"" + lit + "\"", "");
		Scanner scanner(stream);
		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
		BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
		// Line feed, vertical tab, form feed and carriage return are reported as a bad
		// closing quote; all other bytes are reported as a character not allowed here.
		if (v == '\n' || v == '\v' || v == '\f' || v == '\r')
			BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalStringEndQuote);
		else
			BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::UnicodeCharacterInNonUnicodeString);
		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "");
	}
}
|
|
|
|
// The hex escape \x61 inside a string is expected to decode to 'a'.
BOOST_AUTO_TEST_CASE(string_escapes)
{
	std::string const source = " { \"a\\x61\"";
	CharStream input(source, "");
	Scanner lexer(input);

	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), "aa");
}
|
|
|
|
// A hex escape followed by \n, \r and \t is expected to decode to the matching characters.
BOOST_AUTO_TEST_CASE(string_escapes_all)
{
	std::string const source = " { \"a\\x61\\n\\r\\t\"";
	CharStream input(source, "");
	Scanner lexer(input);

	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), "aa\n\r\t");
}
|
|
|
|
struct TestScanner
|
|
{
|
|
unique_ptr<CharStream> stream;
|
|
unique_ptr<Scanner> scanner;
|
|
explicit TestScanner(string _text) { reset(move(_text)); }
|
|
|
|
void reset(std::string _text)
|
|
{
|
|
stream = make_unique<CharStream>(move(_text), "");
|
|
scanner = make_unique<Scanner>(*stream);
|
|
}
|
|
|
|
decltype(auto) currentToken() { return scanner->currentToken(); }
|
|
decltype(auto) next() { return scanner->next(); }
|
|
decltype(auto) currentError() { return scanner->currentError(); }
|
|
decltype(auto) currentLiteral() { return scanner->currentLiteral(); }
|
|
decltype(auto) currentCommentLiteral() { return scanner->currentCommentLiteral(); }
|
|
decltype(auto) currentLocation() { return scanner->currentLocation(); }
|
|
};
|
|
|
|
// The escapes \b, \f and \v are each expected to be rejected as illegal escape sequences,
// leaving an empty literal behind.
BOOST_AUTO_TEST_CASE(string_escapes_legal_before_080)
{
	for (char const* source: {" { \"a\\b", " { \"a\\f", " { \"a\\v"})
	{
		TestScanner fixture(source);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::LBrace);
		BOOST_CHECK_EQUAL(fixture.next(), Token::Illegal);
		BOOST_CHECK_EQUAL(fixture.currentError(), ScannerError::IllegalEscapeSequence);
		BOOST_CHECK_EQUAL(fixture.currentLiteral(), "");
	}
}
|
|
|
|
// An escaped NUL byte (\x00) is expected to be kept inside the literal rather than ending it.
BOOST_AUTO_TEST_CASE(string_escapes_with_zero)
{
	// Built with an explicit length because the expected value contains an embedded NUL.
	std::string const expectedLiteral("aa\0abc", 6);

	CharStream input(" { \"a\\x61\\x00abc\"", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), expectedLiteral);
}
|
|
|
|
// A malformed hex escape (\x6r) is expected to yield an Illegal token with an
// IllegalEscapeSequence error and an empty literal.
BOOST_AUTO_TEST_CASE(string_escape_illegal)
{
	TestScanner fixture(" bla \"\\x6rf\" (illegalescape)");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Identifier);
	BOOST_CHECK_EQUAL(fixture.next(), Token::Illegal);
	BOOST_CHECK_EQUAL(fixture.currentError(), ScannerError::IllegalEscapeSequence);
	BOOST_CHECK_EQUAL(fixture.currentLiteral(), "");

	// TODO recovery from illegal tokens should be improved
	for (Token const expected: {Token::Illegal, Token::Identifier, Token::Illegal, Token::EOS})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
}
|
|
|
|
// Hex literals with a lowercase "0x" prefix are expected to scan as numbers; "0X" is not.
BOOST_AUTO_TEST_CASE(hex_numbers)
{
	// A long hex literal inside a declaration.
	{
		TestScanner fixture("var x = 0x765432536763762734623472346;");
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Var);
		for (Token const expected: {Token::Identifier, Token::Assign, Token::Number})
			BOOST_CHECK_EQUAL(fixture.next(), expected);
		BOOST_CHECK_EQUAL(fixture.currentLiteral(), "0x765432536763762734623472346");
		for (Token const expected: {Token::Semicolon, Token::EOS})
			BOOST_CHECK_EQUAL(fixture.next(), expected);
	}
	// A bare hex literal keeps its prefix in the literal text.
	{
		TestScanner fixture("0x1234");
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Number);
		BOOST_CHECK_EQUAL(fixture.currentLiteral(), "0x1234");
	}
	// An uppercase prefix is expected to be rejected.
	{
		TestScanner fixture("0X1234");
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Illegal);
	}
}
|
|
|
|
// Integer literals with leading zeros (octal look-alikes) are expected to be illegal,
// while "0" itself and zeros next to a decimal point are fine.
BOOST_AUTO_TEST_CASE(octal_numbers)
{
	for (char const* source: {"07", "007"})
	{
		TestScanner fixture(source);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Illegal);
	}

	// The minus sign is its own token; the digits after it are judged on their own.
	{
		TestScanner fixture("-07");
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Sub);
		BOOST_CHECK_EQUAL(fixture.next(), Token::Illegal);
	}
	{
		TestScanner fixture("-.07");
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Sub);
		BOOST_CHECK_EQUAL(fixture.next(), Token::Number);
	}

	for (char const* source: {"0", "0.1"})
	{
		TestScanner fixture(source);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Number);
	}
}
|
|
|
|
// A literal with an exponent ("2e10") is expected to be one Number token.
BOOST_AUTO_TEST_CASE(scientific_notation)
{
	TestScanner fixture("var x = 2e10;");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Var);
	for (Token const expected: {Token::Identifier, Token::Assign, Token::Number})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentLiteral(), "2e10");
	for (Token const expected: {Token::Semicolon, Token::EOS})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
}
|
|
|
|
// A dot in front of an identifier is expected to be a separate Period token, both in the
// default scanner mode and in Yul mode.
BOOST_AUTO_TEST_CASE(leading_dot_in_identifier)
{
	for (bool const yulMode: {false, true})
	{
		TestScanner fixture("function .a(");
		if (yulMode)
			fixture.scanner->setScannerMode(ScannerKind::Yul);

		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Function);
		for (Token const expected: {Token::Period, Token::Identifier, Token::LParen, Token::EOS})
			BOOST_CHECK_EQUAL(fixture.next(), expected);
	}
}
|
|
|
|
// Dots between identifier characters: separate Period tokens in the default mode, but
// expected to be part of a single identifier in Yul mode.
BOOST_AUTO_TEST_CASE(middle_dot_in_identifier)
{
	// Default mode, two dots.
	{
		TestScanner fixture("function a..a(");
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Function);
		for (Token const expected: {
			Token::Identifier,
			Token::Period,
			Token::Period,
			Token::Identifier,
			Token::LParen,
			Token::EOS
		})
			BOOST_CHECK_EQUAL(fixture.next(), expected);
	}
	// Yul mode, three dots.
	{
		TestScanner fixture("function a...a(");
		fixture.scanner->setScannerMode(ScannerKind::Yul);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Function);
		for (Token const expected: {Token::Identifier, Token::LParen, Token::EOS})
			BOOST_CHECK_EQUAL(fixture.next(), expected);
	}
}
|
|
|
|
// A dot right after an identifier: a separate Period token in the default mode, expected
// to be absorbed into the identifier in Yul mode.
BOOST_AUTO_TEST_CASE(trailing_dot_in_identifier)
{
	std::string const source = "function a.(";

	// Default mode.
	{
		TestScanner fixture(source);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Function);
		for (Token const expected: {Token::Identifier, Token::Period, Token::LParen, Token::EOS})
			BOOST_CHECK_EQUAL(fixture.next(), expected);
	}
	// Yul mode.
	{
		TestScanner fixture(source);
		fixture.scanner->setScannerMode(ScannerKind::Yul);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Function);
		for (Token const expected: {Token::Identifier, Token::LParen, Token::EOS})
			BOOST_CHECK_EQUAL(fixture.next(), expected);
	}
}
|
|
|
|
// Decimal points inside or in front of a number belong to the number; a dot with nothing
// after it is expected to be a separate Period token.
BOOST_AUTO_TEST_CASE(trailing_dot_in_numbers)
{
	// Each of these is expected to be exactly one Number token.
	for (char const* source: {"2.5", "2.5e10", ".5", ".5e10"})
	{
		TestScanner fixture(source);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Number);
		BOOST_CHECK_EQUAL(fixture.next(), Token::EOS);
	}

	TestScanner fixture("2.");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Number);
	BOOST_CHECK_EQUAL(fixture.next(), Token::Period);
	BOOST_CHECK_EQUAL(fixture.next(), Token::EOS);
}
|
|
|
|
// "_1.2" is expected to split into an identifier followed by a number.
BOOST_AUTO_TEST_CASE(leading_underscore_decimal_is_identifier)
{
	// The actual error is caught by the SyntaxChecker.
	TestScanner fixture("_1.2");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Identifier);
	for (Token const expected: {Token::Number, Token::EOS})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
}
|
|
|
|
// An underscore right after the decimal point is still expected to scan as a single Number.
BOOST_AUTO_TEST_CASE(leading_underscore_decimal_after_dot_illegal)
{
	// The actual error is caught by the SyntaxChecker.
	for (char const* source: {"1._2", "1._"})
	{
		TestScanner fixture(source);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Number);
		BOOST_CHECK_EQUAL(fixture.next(), Token::EOS);
	}
}
|
|
|
|
// "_1e2" is expected to be a single identifier.
BOOST_AUTO_TEST_CASE(leading_underscore_exp_are_identifier)
{
	// The actual error is caught by the SyntaxChecker.
	TestScanner fixture("_1e2");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Identifier);
	BOOST_CHECK_EQUAL(fixture.next(), Token::EOS);
}
|
|
|
|
// "1e_2" is expected to scan as one Number whose literal keeps the underscore.
BOOST_AUTO_TEST_CASE(leading_underscore_exp_after_e_illegal)
{
	// The actual error is caught by the SyntaxChecker.
	std::string const source = "1e_2";
	TestScanner fixture(source);
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Number);
	BOOST_CHECK_EQUAL(fixture.currentLiteral(), "1e_2");
	BOOST_CHECK_EQUAL(fixture.next(), Token::EOS);
}
|
|
|
|
// "0x_abc" is expected to produce an Illegal token followed by an identifier.
BOOST_AUTO_TEST_CASE(leading_underscore_hex_illegal)
{
	TestScanner fixture("0x_abc");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Illegal);
	for (Token const expected: {Token::Identifier, Token::EOS})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
}
|
|
|
|
// A fractional part that starts with an underscore is still expected to scan as one Number.
BOOST_AUTO_TEST_CASE(fixed_number_invalid_underscore_front)
{
	// The actual error is caught by the SyntaxChecker.
	TestScanner fixture("12._1234_1234");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Number);
	BOOST_CHECK_EQUAL(fixture.next(), Token::EOS);
}
|
|
|
|
// Hex, decimal and fixed-point literals ending in an underscore at end of input are each
// expected to scan as a single Number.
BOOST_AUTO_TEST_CASE(number_literals_with_trailing_underscore_at_eos)
{
	// The actual error is caught by the SyntaxChecker.
	for (char const* source: {"0x123_", "123_", "12.34_"})
	{
		TestScanner fixture(source);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Number);
		BOOST_CHECK_EQUAL(fixture.next(), Token::EOS);
	}
}
|
|
|
|
// A leading minus is always its own Sub token; the literal never includes the sign.
// Inside an exponent ("2e-2"), however, the minus is expected to be part of the number.
BOOST_AUTO_TEST_CASE(negative_numbers)
{
	TestScanner fixture("var x = -.2 + -0x78 + -7.3 + 8.9 + 2e-2;");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Var);

	// -.2
	for (Token const expected: {Token::Identifier, Token::Assign, Token::Sub, Token::Number})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentLiteral(), ".2");

	// + -0x78
	for (Token const expected: {Token::Add, Token::Sub, Token::Number})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentLiteral(), "0x78");

	// + -7.3
	for (Token const expected: {Token::Add, Token::Sub, Token::Number})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentLiteral(), "7.3");

	// + 8.9
	for (Token const expected: {Token::Add, Token::Number})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentLiteral(), "8.9");

	// + 2e-2
	for (Token const expected: {Token::Add, Token::Number})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentLiteral(), "2e-2");

	for (Token const expected: {Token::Semicolon, Token::EOS})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
}
|
|
|
|
// Checks the start/end offsets reported for tokens, including tokens that follow comments.
BOOST_AUTO_TEST_CASE(locations)
{
	TestScanner fixture("function_identifier has ; -0x743/*comment*/\n ident //comment");

	// Compares the current token's location against the expected offsets.
	auto const expectSpan = [&](int _start, int _end)
	{
		BOOST_CHECK_EQUAL(fixture.currentLocation().start, _start);
		BOOST_CHECK_EQUAL(fixture.currentLocation().end, _end);
	};

	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Identifier);
	expectSpan(0, 19);

	BOOST_CHECK_EQUAL(fixture.next(), Token::Identifier);
	expectSpan(20, 23);

	BOOST_CHECK_EQUAL(fixture.next(), Token::Semicolon);
	expectSpan(24, 25);

	// The minus sign is a token of its own; only the number's span is checked.
	BOOST_CHECK_EQUAL(fixture.next(), Token::Sub);
	BOOST_CHECK_EQUAL(fixture.next(), Token::Number);
	expectSpan(27, 32);

	// "ident" comes after the block comment and the line break.
	BOOST_CHECK_EQUAL(fixture.next(), Token::Identifier);
	expectSpan(45, 50);

	BOOST_CHECK_EQUAL(fixture.next(), Token::EOS);
}
|
|
|
|
// Operators that share prefixes need look-ahead; this checks how a run of them is split.
BOOST_AUTO_TEST_CASE(ambiguities)
{
	TestScanner fixture(
		"<="
		"<"
		"+ +=a++ =>"
		"<<"
		">>"
		" >>="
		">>>"
		">>>="
		" >>>>>=><<="
	);
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::LessThanOrEqual);

	for (Token const expected: {
		Token::LessThan,
		Token::Add,
		Token::AssignAdd,
		Token::Identifier,
		Token::Inc,
		Token::DoubleArrow,
		Token::SHL,
		Token::SAR,
		Token::AssignSar,
		Token::SHR,
		Token::AssignShr
	})
		BOOST_CHECK_EQUAL(fixture.next(), expected);

	// the last "monster" token combination
	for (Token const expected: {Token::SHR, Token::AssignSar, Token::GreaterThan, Token::AssignShl})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
}
|
|
|
|
// A "///" comment at the very start of the input: no tokens, but the comment text is kept.
BOOST_AUTO_TEST_CASE(documentation_comments_parsed_begin)
{
	std::string const source = "/// Send $(value / 1000) chocolates to the user";
	CharStream input(source, "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::EOS);
	BOOST_CHECK_EQUAL(lexer.currentCommentLiteral(), "Send $(value / 1000) chocolates to the user");
}
|
|
|
|
// A "/** ... */" comment at the very start of the input: no tokens, comment text is kept.
BOOST_AUTO_TEST_CASE(multiline_documentation_comments_parsed_begin)
{
	std::string const source = "/** Send $(value / 1000) chocolates to the user*/";
	CharStream input(source, "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::EOS);
	BOOST_CHECK_EQUAL(lexer.currentCommentLiteral(), "Send $(value / 1000) chocolates to the user");
}
|
|
|
|
// A "///" comment after ordinary tokens: the comment text is available once EOS is reached.
BOOST_AUTO_TEST_CASE(documentation_comments_parsed)
{
	TestScanner fixture("some other tokens /// Send $(value / 1000) chocolates to the user");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Identifier);
	for (Token const expected: {Token::Identifier, Token::Identifier, Token::EOS})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentCommentLiteral(), "Send $(value / 1000) chocolates to the user");
}
|
|
|
|
// A multi-line doc comment whose content line starts with '*': the expected comment text
// keeps the space that followed the star.
BOOST_AUTO_TEST_CASE(multiline_documentation_comments_parsed)
{
	TestScanner fixture(
		"some other tokens /**\n"
		"* Send $(value / 1000) chocolates to the user\n"
		"*/"
	);
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Identifier);
	for (Token const expected: {Token::Identifier, Token::Identifier, Token::EOS})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentCommentLiteral(), " Send $(value / 1000) chocolates to the user");
}
|
|
|
|
// A multi-line doc comment whose content line has no leading '*': the expected comment
// text starts directly with the first word.
BOOST_AUTO_TEST_CASE(multiline_documentation_no_stars)
{
	TestScanner fixture(
		"some other tokens /**\n"
		" Send $(value / 1000) chocolates to the user\n"
		"*/"
	);
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Identifier);
	for (Token const expected: {Token::Identifier, Token::Identifier, Token::EOS})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentCommentLiteral(), "Send $(value / 1000) chocolates to the user");
}
|
|
|
|
// A multi-line doc comment padded with tabs, spaces and carriage returns around the star:
// the expected comment text is the same as without the padding.
BOOST_AUTO_TEST_CASE(multiline_documentation_whitespace_hell)
{
	TestScanner fixture(
		"some other tokens /** \t \r \n"
		"\t \r * Send $(value / 1000) chocolates to the user\n"
		"*/"
	);
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Identifier);
	for (Token const expected: {Token::Identifier, Token::Identifier, Token::EOS})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
	BOOST_CHECK_EQUAL(fixture.currentCommentLiteral(), " Send $(value / 1000) chocolates to the user");
}
|
|
|
|
// An empty "//" comment at end of input: EOS, and no comment literal.
BOOST_AUTO_TEST_CASE(comment_before_eos)
{
	CharStream input("//", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::EOS);
	BOOST_CHECK_EQUAL(lexer.currentCommentLiteral(), "");
}
|
|
|
|
// An empty "///" doc comment at end of input: EOS, and an empty comment literal.
BOOST_AUTO_TEST_CASE(documentation_comment_before_eos)
{
	CharStream input("///", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::EOS);
	BOOST_CHECK_EQUAL(lexer.currentCommentLiteral(), "");
}
|
|
|
|
// "/**/" is expected to be consumed as an empty comment: EOS, and no comment literal.
BOOST_AUTO_TEST_CASE(empty_multiline_comment)
{
	CharStream input("/**/", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::EOS);
	BOOST_CHECK_EQUAL(lexer.currentCommentLiteral(), "");
}
|
|
|
|
// "/***/" is expected to be consumed as an empty doc comment: EOS, empty comment literal.
BOOST_AUTO_TEST_CASE(empty_multiline_documentation_comment_before_eos)
{
	CharStream input("/***/", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::EOS);
	BOOST_CHECK_EQUAL(lexer.currentCommentLiteral(), "");
}
|
|
|
|
// A doc comment followed by a plain comment: the doc comment's text is expected to still be
// attached to the next token.
BOOST_AUTO_TEST_CASE(comments_mixed_in_sequence)
{
	std::string const source =
		"hello_world ///documentation comment \n"
		"//simple comment \n"
		"<<";
	TestScanner fixture(source);
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Identifier);
	BOOST_CHECK_EQUAL(fixture.next(), Token::SHL);
	BOOST_CHECK_EQUAL(fixture.currentCommentLiteral(), "documentation comment ");
}
|
|
|
|
// The ether unit keywords each map to their own token.
BOOST_AUTO_TEST_CASE(ether_subdenominations)
{
	TestScanner fixture("wei gwei ether");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::SubWei);
	for (Token const expected: {Token::SubGwei, Token::SubEther})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
}
|
|
|
|
// The time unit keywords each map to their own token.
BOOST_AUTO_TEST_CASE(time_subdenominations)
{
	TestScanner fixture("seconds minutes hours days weeks years");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::SubSecond);
	for (Token const expected: {
		Token::SubMinute,
		Token::SubHour,
		Token::SubDay,
		Token::SubWeek,
		Token::SubYear
	})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
}
|
|
|
|
// An empty "//" line in front of code leaves no comment literal and does not disturb the
// tokens that follow.
BOOST_AUTO_TEST_CASE(empty_comment)
{
	std::string const source = "//\ncontract{}";
	TestScanner fixture(source);
	BOOST_CHECK_EQUAL(fixture.currentCommentLiteral(), "");
	BOOST_CHECK_EQUAL(fixture.currentToken(), Token::Contract);
	for (Token const expected: {Token::LBrace, Token::RBrace})
		BOOST_CHECK_EQUAL(fixture.next(), expected);
}
|
|
|
|
// Unicode string escapes
|
|
|
|
// \u00DA is expected to be stored as the two bytes C3 9A.
BOOST_AUTO_TEST_CASE(valid_unicode_string_escape)
{
	std::string const expectedLiteral("\xC3\x9Anicode", 8);

	CharStream input("{ \"\\u00DAnicode\"", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), expectedLiteral);
}
|
|
|
|
// \u007F is expected to be stored as the single byte 7F.
BOOST_AUTO_TEST_CASE(valid_unicode_string_escape_7f)
{
	std::string const expectedLiteral("\x7Fnicode", 7);

	CharStream input("{ \"\\u007Fnicode\"", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), expectedLiteral);
}
|
|
|
|
// \u07FF is expected to be stored as the two bytes DF BF.
BOOST_AUTO_TEST_CASE(valid_unicode_string_escape_7ff)
{
	std::string const expectedLiteral("\xDF\xBFnicode", 8);

	CharStream input("{ \"\\u07FFnicode\"", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), expectedLiteral);
}
|
|
|
|
// \uFFFF is expected to be stored as the three bytes EF BF BF.
BOOST_AUTO_TEST_CASE(valid_unicode_string_escape_ffff)
{
	std::string const expectedLiteral("\xEF\xBF\xBFnicode", 9);

	CharStream input("{ \"\\uFFFFnicode\"", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::StringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), expectedLiteral);
}
|
|
|
|
// A \u escape with only two hex digits is expected to make the string illegal.
BOOST_AUTO_TEST_CASE(invalid_short_unicode_string_escape)
{
	std::string const source = "{ \"\\uFFnicode\"";
	CharStream input(source, "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::Illegal);
}
|
|
|
|
// Unicode string literal
|
|
|
|
// The bare word "unicode" without a string after it: an illegal token in the default mode,
// an ordinary identifier in Yul mode.
BOOST_AUTO_TEST_CASE(unicode_prefix_only)
{
	std::string const source = "{ unicode";

	// Default mode.
	{
		TestScanner fixture(source);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::LBrace);
		BOOST_CHECK_EQUAL(fixture.next(), Token::Illegal);
		BOOST_CHECK_EQUAL(fixture.currentError(), ScannerError::IllegalToken);
	}
	// Yul mode.
	{
		TestScanner fixture(source);
		fixture.scanner->setScannerMode(ScannerKind::Yul);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::LBrace);
		BOOST_CHECK_EQUAL(fixture.next(), Token::Identifier);
		BOOST_CHECK_EQUAL(fixture.currentLiteral(), "unicode");
	}
}
|
|
|
|
// "unicode" followed by a space instead of a quote is expected to be an illegal token.
BOOST_AUTO_TEST_CASE(unicode_invalid_space)
{
	CharStream input("{ unicode ", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::Illegal);
	BOOST_CHECK_EQUAL(lexer.currentError(), ScannerError::IllegalToken);
}
|
|
|
|
// "unicode" followed by another word: an illegal token in the default mode, two plain
// identifiers in Yul mode.
BOOST_AUTO_TEST_CASE(unicode_invalid_token)
{
	std::string const source = "{ unicode test";

	// Default mode.
	{
		TestScanner fixture(source);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::LBrace);
		BOOST_CHECK_EQUAL(fixture.next(), Token::Illegal);
		BOOST_CHECK_EQUAL(fixture.currentError(), ScannerError::IllegalToken);
	}
	// Yul mode.
	{
		TestScanner fixture(source);
		fixture.scanner->setScannerMode(ScannerKind::Yul);
		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::LBrace);
		BOOST_CHECK_EQUAL(fixture.next(), Token::Identifier);
		BOOST_CHECK_EQUAL(fixture.currentLiteral(), "unicode");
		BOOST_CHECK_EQUAL(fixture.next(), Token::Identifier);
		BOOST_CHECK_EQUAL(fixture.currentLiteral(), "test");
	}
}
|
|
|
|
// A unicode"..." literal containing an emoji: the literal is expected to hold the emoji's
// raw four bytes.
BOOST_AUTO_TEST_CASE(valid_unicode_literal)
{
	std::string const expectedLiteral("Hello \xf0\x9f\x98\x83", 10);

	CharStream input("{ unicode\"Hello 😃\"", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::UnicodeStringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), expectedLiteral);
}
|
|
|
|
// Non-printable characters (here byte 0x07) are allowed in unicode strings...
BOOST_AUTO_TEST_CASE(valid_nonprintable_in_unicode_literal)
{
	std::string const expectedLiteral("Hello \x07\xf0\x9f\x98\x83", 11);

	CharStream input("{ unicode\"Hello \007😃\"", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::UnicodeStringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), expectedLiteral);
}
|
|
|
|
// Hex string literal
|
|
|
|
// The bare word "hex" without a string after it is expected to be an illegal token, both
// in the default scanner mode and in Yul mode.
BOOST_AUTO_TEST_CASE(hex_prefix_only)
{
	TestScanner scanner("{ hex");
	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);

	scanner.reset("{ hex");
	scanner.scanner->setScannerMode(ScannerKind::Yul);
	// Confirm the starting position after the mode switch, as the other Yul-mode tests do,
	// so that the next() below is known to be looking at "hex".
	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
	BOOST_CHECK_EQUAL(scanner.currentError(), ScannerError::IllegalToken);
}
|
|
|
|
// "hex" followed by a space instead of a quote is expected to be an illegal token.
BOOST_AUTO_TEST_CASE(hex_invalid_space)
{
	CharStream input("{ hex ", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::Illegal);
	BOOST_CHECK_EQUAL(lexer.currentError(), ScannerError::IllegalToken);
}
|
|
|
|
// "hex" followed by another word is expected to be an illegal token in the default mode
// and in Yul mode alike.
BOOST_AUTO_TEST_CASE(hex_invalid_token)
{
	for (bool const yulMode: {false, true})
	{
		TestScanner fixture("{ hex test");
		if (yulMode)
			fixture.scanner->setScannerMode(ScannerKind::Yul);

		BOOST_CHECK_EQUAL(fixture.currentToken(), Token::LBrace);
		BOOST_CHECK_EQUAL(fixture.next(), Token::Illegal);
		BOOST_CHECK_EQUAL(fixture.currentError(), ScannerError::IllegalToken);
	}
}
|
|
|
|
// A hex"..." literal is expected to decode each pair of hex digits into one byte.
BOOST_AUTO_TEST_CASE(valid_hex_literal)
{
	// Explicit length: the expected bytes start with NUL.
	std::string const expectedBytes("\x00\x11\x22\x33\xFF", 5);

	CharStream input("{ hex\"00112233FF\"", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::HexStringLiteral);
	BOOST_CHECK_EQUAL(lexer.currentLiteral(), expectedBytes);
}
|
|
|
|
// A hex string with an odd number of digits is expected to be rejected.
BOOST_AUTO_TEST_CASE(invalid_short_hex_literal)
{
	std::string const source = "{ hex\"00112233F\"";
	CharStream input(source, "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::Illegal);
	BOOST_CHECK_EQUAL(lexer.currentError(), ScannerError::IllegalHexString);
}
|
|
|
|
// A space inside a hex string is expected to be rejected.
BOOST_AUTO_TEST_CASE(invalid_hex_literal_with_space)
{
	std::string const source = "{ hex\"00112233FF \"";
	CharStream input(source, "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::Illegal);
	BOOST_CHECK_EQUAL(lexer.currentError(), ScannerError::IllegalHexString);
}
|
|
|
|
// A hex string opened with " but closed with ' is expected to be rejected.
BOOST_AUTO_TEST_CASE(invalid_hex_literal_with_wrong_quotes)
{
	std::string const source = "{ hex\"00112233FF'";
	CharStream input(source, "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::Illegal);
	BOOST_CHECK_EQUAL(lexer.currentError(), ScannerError::IllegalHexString);
}
|
|
|
|
// A hex string containing characters that are not hex digits is expected to be rejected.
BOOST_AUTO_TEST_CASE(invalid_hex_literal_nonhex_string)
{
	std::string const source = "{ hex\"hello\"";
	CharStream input(source, "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::LBrace);
	BOOST_CHECK_EQUAL(lexer.next(), Token::Illegal);
	BOOST_CHECK_EQUAL(lexer.currentError(), ScannerError::IllegalHexString);
}
|
|
|
|
// Comments
|
|
|
|
// "* /" (with a space) does not close a comment, so the comment is unterminated.
BOOST_AUTO_TEST_CASE(invalid_multiline_comment_close)
{
	// This used to parse as "comment", "identifier"
	CharStream input("/** / x", "");
	Scanner lexer(input);
	BOOST_CHECK_EQUAL(lexer.currentToken(), Token::Illegal);
	BOOST_CHECK_EQUAL(lexer.next(), Token::EOS);
}
|
|
|
|
BOOST_AUTO_TEST_CASE(multiline_doc_comment_at_eos)
{
	// Regression check: the input consists solely of a doc comment opener.
	// It used to be scanned as "whitespace"; the expected result is an Illegal
	// token followed by EOS.
	string const source = "/**";
	TestScanner scanner(source);

	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
}
|
|
|
|
BOOST_AUTO_TEST_CASE(multiline_comment_at_eos)
{
	// The input consists solely of a multi-line comment opener; the expected
	// result is an Illegal token followed by EOS.
	string const source = "/*";
	TestScanner scanner(source);

	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
}
|
|
|
|
BOOST_AUTO_TEST_CASE(regular_line_break_in_single_line_comment)
{
	// For each of CR, LF and CRLF: the text after the line break is expected to
	// be scanned as a regular identifier, and the "//" comment must not show up
	// in the comment literal.
	for (string const lineBreak: {"\r", "\n", "\r\n"})
	{
		string const source = "// abc " + lineBreak + " def ";
		TestScanner scanner(source);

		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "");
		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
	}
}
|
|
|
|
BOOST_AUTO_TEST_CASE(irregular_line_breaks_in_single_line_comment)
{
	// Candidates: vertical tab, form feed, and the UTF-8 encodings of
	// U+2028 and U+2029.
	for (string const lineBreak: {"\v", "\f", "\xE2\x80\xA8", "\xE2\x80\xA9"})
	{
		string const source = "// abc " + lineBreak + " def ";
		TestScanner scanner(source);

		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "");

		// One Illegal token is expected per byte of the line break sequence.
		// The first one is the current token, the rest are fetched via next().
		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
		size_t const remainingIllegalTokens = lineBreak.size() - 1;
		for (size_t seen = 0; seen < remainingIllegalTokens; ++seen)
			BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);

		BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
	}
}
|
|
|
|
BOOST_AUTO_TEST_CASE(regular_line_breaks_in_single_line_doc_comment)
{
	// For each of CR, LF and CRLF: the "///" comment text up to the line break
	// is expected as the comment literal, and the text after the break is
	// expected to be scanned as a regular identifier.
	for (string const lineBreak: {"\r", "\n", "\r\n"})
	{
		string const source = "/// abc " + lineBreak + " def ";
		TestScanner scanner(source);

		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "abc ");
		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
	}
}
|
|
|
|
BOOST_AUTO_TEST_CASE(regular_line_breaks_in_multiline_doc_comment)
{
	// CR, LF and CRLF are all checked as valid line terminators for code comments.
	// Whichever terminator is used, the comment literal is expected to contain
	// a plain LF between the two comment lines.
	for (string const& lineBreak: {"\r"s, "\n"s, "\r\n"s})
	{
		string const source = "/// Hello" + lineBreak + "/// World" + lineBreak + "ident";
		TestScanner scanner{source};

		// The literal is checked both through a held reference and through a
		// second call to the accessor.
		auto const& commentLiteral = scanner.currentCommentLiteral();
		BOOST_CHECK_EQUAL(commentLiteral, "Hello\n World");
		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "Hello\n World");

		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "ident");
		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
	}
}
|
|
|
|
BOOST_AUTO_TEST_CASE(irregular_line_breaks_in_single_line_doc_comment)
{
	// Candidates: vertical tab, form feed, and the UTF-8 encodings of
	// U+2028 and U+2029.
	for (string const lineBreak: {"\v", "\f", "\xE2\x80\xA8", "\xE2\x80\xA9"})
	{
		string const source = "/// abc " + lineBreak + " def ";
		TestScanner scanner(source);

		// The doc comment text before the line break is still expected as the
		// comment literal.
		BOOST_CHECK_EQUAL(scanner.currentCommentLiteral(), "abc ");

		// One Illegal token is expected per byte of the line break sequence.
		// The first one is the current token, the rest are fetched via next().
		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
		size_t const remainingIllegalTokens = lineBreak.size() - 1;
		for (size_t seen = 0; seen < remainingIllegalTokens; ++seen)
			BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);

		BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");
		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
	}
}
|
|
|
|
BOOST_AUTO_TEST_CASE(regular_line_breaks_in_strings)
{
	// A CR, LF or CRLF is placed inside a double-quoted string.
	// Expected token stream: Illegal, Identifier "def", Illegal, EOS.
	for (string const& lineBreak: {"\r"s, "\n"s, "\r\n"s})
	{
		string const source = "\"abc " + lineBreak + " def\"";
		TestScanner scanner(source);

		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);

		BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");

		BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
	}
}
|
|
|
|
BOOST_AUTO_TEST_CASE(irregular_line_breaks_in_strings)
{
	// Candidates: vertical tab, form feed, and the UTF-8 encodings of
	// U+2028 and U+2029, each placed inside a double-quoted string.
	for (string const lineBreak: {"\v", "\f", "\xE2\x80\xA8", "\xE2\x80\xA9"})
	{
		string const source = "\"abc " + lineBreak + " def\"";
		TestScanner scanner(source);

		// After the initial Illegal token, one further Illegal token is
		// expected for every byte of the line break sequence.
		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Illegal);
		size_t const lineBreakBytes = lineBreak.size();
		for (size_t seen = 0; seen < lineBreakBytes; ++seen)
			BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);

		BOOST_CHECK_EQUAL(scanner.next(), Token::Identifier);
		BOOST_CHECK_EQUAL(scanner.currentLiteral(), "def");

		BOOST_CHECK_EQUAL(scanner.next(), Token::Illegal);
		BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
	}
}
|
|
|
|
BOOST_AUTO_TEST_CASE(solidity_keywords)
{
	// Words whose token kind differs between the scanner as constructed and
	// the scanner after switching to ScannerKind::Yul.
	string const source = "return byte bool address var in true false leave switch case default";

	// Tokens expected from next() before the mode switch; the very first
	// token is checked separately through currentToken().
	Token const expectedBeforeSwitch[] = {
		Token::Byte,
		Token::Bool,
		Token::Address,
		Token::Var,
		Token::In,
		Token::TrueLiteral,
		Token::FalseLiteral,
		Token::Identifier, // "leave"
		Token::Switch,
		Token::Case,
		Token::Default,
		Token::EOS
	};

	// Tokens expected from next() in Yul mode, again excluding the first token.
	Token const expectedInYulMode[] = {
		Token::Identifier, // "byte"
		Token::Identifier, // "bool"
		Token::Identifier, // "address"
		Token::Identifier, // "var"
		Token::Identifier, // "in"
		Token::TrueLiteral,
		Token::FalseLiteral,
		Token::Leave,
		Token::Switch,
		Token::Case,
		Token::Default,
		Token::EOS
	};

	TestScanner scanner(source);
	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Return);
	for (Token const expected: expectedBeforeSwitch)
		BOOST_CHECK_EQUAL(scanner.next(), expected);

	// Rescan the same text in Yul mode.
	scanner.reset(source);
	scanner.scanner->setScannerMode(ScannerKind::Yul);
	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier); // "return"
	for (Token const expected: expectedInYulMode)
		BOOST_CHECK_EQUAL(scanner.next(), expected);
}
|
|
|
|
BOOST_AUTO_TEST_CASE(yul_keyword_like)
{
	string const source = "leave.function";

	// Before the mode switch the text is expected to split at the dot into
	// three tokens.
	TestScanner scanner(source);
	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
	for (Token const expected: {Token::Period, Token::Function, Token::EOS})
		BOOST_CHECK_EQUAL(scanner.next(), expected);

	// In Yul mode the whole text is expected to form one identifier.
	scanner.reset(source);
	scanner.scanner->setScannerMode(ScannerKind::Yul);
	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
	BOOST_CHECK_EQUAL(scanner.next(), Token::EOS);
}
|
|
|
|
BOOST_AUTO_TEST_CASE(yul_identifier_with_dots)
{
	string const source = "mystorage.slot := 1";

	// Before the mode switch the dotted name is expected to split into
	// identifier, period, identifier.
	TestScanner scanner(source);
	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
	for (Token const expected: {
		Token::Period,
		Token::Identifier,
		Token::AssemblyAssign,
		Token::Number,
		Token::EOS
	})
		BOOST_CHECK_EQUAL(scanner.next(), expected);

	// In Yul mode the dotted name is expected to be a single identifier.
	scanner.reset(source);
	scanner.scanner->setScannerMode(ScannerKind::Yul);
	BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Identifier);
	for (Token const expected: {Token::AssemblyAssign, Token::Number, Token::EOS})
		BOOST_CHECK_EQUAL(scanner.next(), expected);
}
|
|
|
|
BOOST_AUTO_TEST_CASE(yul_function)
{
	string const signature = "function f(a, b) -> x, y";
	TestScanner scanner(signature);

	// The same token stream is expected before and after switching to Yul
	// mode, so the checks are shared between both passes.
	auto const checkSignatureTokens = [&scanner]()
	{
		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
		for (Token const expected: {
			Token::Identifier, // f
			Token::LParen,
			Token::Identifier, // a
			Token::Comma,
			Token::Identifier, // b
			Token::RParen,
			Token::RightArrow,
			Token::Identifier, // x
			Token::Comma,
			Token::Identifier, // y
			Token::EOS
		})
			BOOST_CHECK_EQUAL(scanner.next(), expected);
	};

	// First pass: scanner as constructed.
	checkSignatureTokens();

	// Second pass: same text, Yul mode.
	scanner.reset(signature);
	scanner.scanner->setScannerMode(ScannerKind::Yul);
	checkSignatureTokens();
}
|
|
|
|
BOOST_AUTO_TEST_CASE(yul_function_with_whitespace)
{
	// The arrow is written as "- >", i.e. with a space between its two
	// characters; it is expected to be scanned as Sub followed by GreaterThan.
	string const signature = "function f (a, b) - > x, y";
	TestScanner scanner(signature);

	// The same token stream is expected before and after switching to Yul
	// mode, so the checks are shared between both passes.
	auto const checkSignatureTokens = [&scanner]()
	{
		BOOST_CHECK_EQUAL(scanner.currentToken(), Token::Function);
		for (Token const expected: {
			Token::Identifier, // f
			Token::LParen,
			Token::Identifier, // a
			Token::Comma,
			Token::Identifier, // b
			Token::RParen,
			Token::Sub,
			Token::GreaterThan,
			Token::Identifier, // x
			Token::Comma,
			Token::Identifier, // y
			Token::EOS
		})
			BOOST_CHECK_EQUAL(scanner.next(), expected);
	};

	// First pass: scanner as constructed.
	checkSignatureTokens();

	// Second pass: same text, Yul mode.
	scanner.reset(signature);
	scanner.scanner->setScannerMode(ScannerKind::Yul);
	checkSignatureTokens();
}
|
|
|
|
BOOST_AUTO_TEST_SUITE_END()
|
|
|
|
} // end namespaces
|