2014-10-20 14:37:04 +00:00
|
|
|
/*
This file is part of cpp-ethereum.

cpp-ethereum is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.

cpp-ethereum is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with cpp-ethereum. If not, see <http://www.gnu.org/licenses/>.

This file is derived from the file "scanner.h", which was part of the
V8 project. The original copyright header follows:

Copyright 2006-2012, the V8 project authors. All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are
met:

* Redistributions of source code must retain the above copyright
  notice, this list of conditions and the following disclaimer.
* Redistributions in binary form must reproduce the above
  copyright notice, this list of conditions and the following
  disclaimer in the documentation and/or other materials provided
  with the distribution.
* Neither the name of Google Inc. nor the names of its
  contributors may be used to endorse or promote products derived
  from this software without specific prior written permission.

THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
|
|
|
|
/**
 * @author Christian <c@ethdev.com>
 * @date 2014
 * Solidity scanner.
 */
|
2014-10-06 15:13:52 +00:00
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include <libdevcore/Common.h>
|
|
|
|
#include <libdevcore/Log.h>
|
|
|
|
#include <libdevcore/CommonData.h>
|
2014-10-07 16:25:04 +00:00
|
|
|
#include <libsolidity/BaseTypes.h>
|
2014-10-06 15:13:52 +00:00
|
|
|
#include <libsolidity/Token.h>
|
|
|
|
|
2014-10-16 12:08:54 +00:00
|
|
|
namespace dev
|
|
|
|
{
|
|
|
|
namespace solidity
|
|
|
|
{
|
2014-10-06 15:13:52 +00:00
|
|
|
|
|
|
|
|
|
|
|
class AstRawString;
|
|
|
|
class AstValueFactory;
|
|
|
|
class ParserRecorder;
|
|
|
|
|
2014-10-16 12:08:54 +00:00
|
|
|
/// Random-access character source used by the scanner: owns a copy of the
/// source text together with a read position into it.
class CharStream
{
public:
	/// Creates an empty stream positioned at offset 0.
	CharStream(): m_pos(0) {}
	/// Creates a stream over a copy of @a _source, positioned at offset 0.
	explicit CharStream(std::string const& _source): m_source(_source), m_pos(0) {}

	/// @returns the current read position as an offset into the source.
	int getPos() const { return static_cast<int>(m_pos); }
	/// @returns true if the position @a _charsForward characters ahead of the
	/// current one lies at or beyond the end of the source.
	bool isPastEndOfInput(size_t _charsForward = 0) const { return (m_pos + _charsForward) >= m_source.size(); }
	/// @returns the character @a _charsForward characters ahead of the current
	/// position, or 0 if that position is at or beyond the end of the source.
	/// The explicit check keeps look-ahead past the end from indexing outside
	/// the string.
	char get(size_t _charsForward = 0) const
	{
		return isPastEndOfInput(_charsForward) ? 0 : m_source[m_pos + _charsForward];
	}
	/// Defined out of line; judging by the name, moves forward by @a _chars and
	/// returns the character at the new position (confirm in the implementation).
	char advanceAndGet(size_t _chars = 1);
	/// Defined out of line; judging by the name, moves back by @a _amount and
	/// returns the character at the new position (confirm in the implementation).
	char rollback(size_t _amount);

	/// Moves the read position back to the start of the source.
	void reset() { m_pos = 0; }

	///@{
	///@name Error printing helper functions
	/// Functions that help pretty-printing parse errors
	/// Do only use in error cases, they are quite expensive.
	std::string getLineAtPosition(int _position) const;
	std::tuple<int, int> translatePositionToLineColumn(int _position) const;
	///@}

private:
	/// The complete source text.
	std::string m_source;
	/// Current read offset into m_source.
	size_t m_pos;
};
|
|
|
|
|
|
|
|
|
2014-11-27 17:57:50 +00:00
|
|
|
|
2014-10-16 12:08:54 +00:00
|
|
|
class Scanner
|
|
|
|
{
|
2014-11-30 22:25:42 +00:00
|
|
|
friend class LiteralScope;
|
2014-10-06 15:13:52 +00:00
|
|
|
public:
|
2014-11-27 17:57:50 +00:00
|
|
|
|
2014-12-03 16:45:12 +00:00
|
|
|
explicit Scanner(CharStream const& _source = CharStream(), std::string const& _sourceName = "") { reset(_source, _sourceName); }
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-12-03 16:45:12 +00:00
|
|
|
/// Resets the scanner as if newly constructed with _source and _sourceName as input.
|
|
|
|
void reset(CharStream const& _source, std::string const& _sourceName);
|
|
|
|
/// Resets scanner to the start of input.
|
|
|
|
void reset();
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-11-20 22:56:24 +00:00
|
|
|
/// Returns the next token and advances input
|
|
|
|
Token::Value next();
|
2014-10-16 21:49:45 +00:00
|
|
|
|
2014-10-22 18:35:35 +00:00
|
|
|
///@{
|
|
|
|
///@name Information about the current token
|
2014-10-16 21:49:45 +00:00
|
|
|
|
|
|
|
/// Returns the current token
|
2014-11-19 15:21:42 +00:00
|
|
|
Token::Value getCurrentToken()
|
2014-11-18 17:50:40 +00:00
|
|
|
{
|
2014-11-21 16:08:35 +00:00
|
|
|
return m_currentToken.token;
|
2014-11-18 17:50:40 +00:00
|
|
|
}
|
2015-01-05 15:37:43 +00:00
|
|
|
|
2014-11-21 16:08:35 +00:00
|
|
|
Location getCurrentLocation() const { return m_currentToken.location; }
|
|
|
|
std::string const& getCurrentLiteral() const { return m_currentToken.literal; }
|
2014-10-22 18:35:35 +00:00
|
|
|
///@}
|
|
|
|
|
2014-11-19 15:21:42 +00:00
|
|
|
///@{
|
|
|
|
///@name Information about the current comment token
|
2014-11-27 17:57:50 +00:00
|
|
|
|
2014-11-21 16:08:35 +00:00
|
|
|
Location getCurrentCommentLocation() const { return m_skippedComment.location; }
|
|
|
|
std::string const& getCurrentCommentLiteral() const { return m_skippedComment.literal; }
|
2014-11-27 17:57:50 +00:00
|
|
|
/// Called by the parser during FunctionDefinition parsing to clear the current comment
|
|
|
|
void clearCurrentCommentLiteral() { m_skippedComment.literal.clear(); }
|
|
|
|
|
2014-11-19 15:21:42 +00:00
|
|
|
///@}
|
|
|
|
|
2014-10-22 18:35:35 +00:00
|
|
|
///@{
|
|
|
|
///@name Information about the next token
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-10-16 21:49:45 +00:00
|
|
|
/// Returns the next token without advancing input.
|
2014-11-21 16:08:35 +00:00
|
|
|
Token::Value peekNextToken() const { return m_nextToken.token; }
|
|
|
|
Location peekLocation() const { return m_nextToken.location; }
|
|
|
|
std::string const& peekLiteral() const { return m_nextToken.literal; }
|
2014-10-22 18:35:35 +00:00
|
|
|
///@}
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-12-03 17:52:28 +00:00
|
|
|
std::shared_ptr<std::string const> const& getSourceName() const { return m_sourceName; }
|
|
|
|
|
2014-10-22 18:35:35 +00:00
|
|
|
///@{
|
|
|
|
///@name Error printing helper functions
|
|
|
|
/// Functions that help pretty-printing parse errors
|
2014-10-09 10:28:37 +00:00
|
|
|
/// Do only use in error cases, they are quite expensive.
|
2014-10-16 21:49:45 +00:00
|
|
|
std::string getLineAtPosition(int _position) const { return m_source.getLineAtPosition(_position); }
|
|
|
|
std::tuple<int, int> translatePositionToLineColumn(int _position) const { return m_source.translatePositionToLineColumn(_position); }
|
2014-10-22 18:35:35 +00:00
|
|
|
///@}
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-10-06 15:13:52 +00:00
|
|
|
private:
|
2014-11-20 21:08:16 +00:00
|
|
|
/// Used for the current and look-ahead token and comments
|
2014-10-16 12:08:54 +00:00
|
|
|
struct TokenDesc
|
|
|
|
{
|
2014-10-09 10:28:37 +00:00
|
|
|
Token::Value token;
|
|
|
|
Location location;
|
|
|
|
std::string literal;
|
|
|
|
};
|
|
|
|
|
2014-10-22 18:35:35 +00:00
|
|
|
///@{
|
|
|
|
///@name Literal buffer support
|
2014-11-21 16:08:35 +00:00
|
|
|
inline void addLiteralChar(char c) { m_nextToken.literal.push_back(c); }
|
|
|
|
inline void addCommentLiteralChar(char c) { m_nextSkippedComment.literal.push_back(c); }
|
2014-10-16 12:08:54 +00:00
|
|
|
inline void addLiteralCharAndAdvance() { addLiteralChar(m_char); advance(); }
|
2014-10-22 18:35:35 +00:00
|
|
|
///@}
|
2014-10-09 10:28:37 +00:00
|
|
|
|
|
|
|
bool advance() { m_char = m_source.advanceAndGet(); return !m_source.isPastEndOfInput(); }
|
2014-10-16 21:49:45 +00:00
|
|
|
void rollback(int _amount) { m_char = m_source.rollback(_amount); }
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-10-16 21:49:45 +00:00
|
|
|
inline Token::Value selectToken(Token::Value _tok) { advance(); return _tok; }
|
|
|
|
/// If the next character is _next, advance and return _then, otherwise return _else.
|
|
|
|
inline Token::Value selectToken(char _next, Token::Value _then, Token::Value _else);
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-11-05 13:20:56 +00:00
|
|
|
bool scanHexByte(char& o_scannedByte);
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-11-30 21:43:40 +00:00
|
|
|
/// Scans a single Solidity token.
|
|
|
|
void scanToken();
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-10-22 18:35:35 +00:00
|
|
|
/// Skips all whitespace and @returns true if something was skipped.
|
2014-10-09 10:28:37 +00:00
|
|
|
bool skipWhitespace();
|
2014-12-18 12:27:25 +00:00
|
|
|
/// Skips all whitespace except Line feeds and returns true if something was skipped
|
|
|
|
bool skipWhitespaceExceptLF();
|
2014-10-09 10:28:37 +00:00
|
|
|
Token::Value skipSingleLineComment();
|
|
|
|
Token::Value skipMultiLineComment();
|
|
|
|
|
|
|
|
void scanDecimalDigits();
|
2014-11-05 07:40:21 +00:00
|
|
|
Token::Value scanNumber(char _charSeen = 0);
|
2014-10-09 10:28:37 +00:00
|
|
|
Token::Value scanIdentifierOrKeyword();
|
|
|
|
|
|
|
|
Token::Value scanString();
|
2014-12-17 17:53:18 +00:00
|
|
|
Token::Value scanSingleLineDocComment();
|
|
|
|
Token::Value scanMultiLineDocComment();
|
2014-12-18 16:30:10 +00:00
|
|
|
/// Scans a slash '/' and depending on the characters returns the appropriate token
|
|
|
|
Token::Value scanSlash();
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-10-16 21:49:45 +00:00
|
|
|
/// Scans an escape-sequence which is part of a string and adds the
|
|
|
|
/// decoded character to the current literal. Returns true if a pattern
|
|
|
|
/// is scanned.
|
2014-10-09 10:28:37 +00:00
|
|
|
bool scanEscape();
|
|
|
|
|
2014-10-16 21:49:45 +00:00
|
|
|
/// Return the current source position.
|
2014-10-16 12:08:54 +00:00
|
|
|
int getSourcePos() { return m_source.getPos(); }
|
|
|
|
bool isSourcePastEndOfInput() { return m_source.isPastEndOfInput(); }
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-11-21 16:08:35 +00:00
|
|
|
TokenDesc m_skippedComment; // desc for current skipped comment
|
|
|
|
TokenDesc m_nextSkippedComment; // desc for next skiped comment
|
2014-11-19 15:21:42 +00:00
|
|
|
|
2014-11-21 16:08:35 +00:00
|
|
|
TokenDesc m_currentToken; // desc for current token (as returned by Next())
|
|
|
|
TokenDesc m_nextToken; // desc for next token (one token look-ahead)
|
2014-10-09 10:28:37 +00:00
|
|
|
|
|
|
|
CharStream m_source;
|
2014-12-03 17:52:28 +00:00
|
|
|
std::shared_ptr<std::string const> m_sourceName;
|
2014-10-09 10:28:37 +00:00
|
|
|
|
2014-10-16 21:49:45 +00:00
|
|
|
/// one character look-ahead, equals 0 at end of input
|
2014-10-09 10:28:37 +00:00
|
|
|
char m_char;
|
2014-10-06 15:13:52 +00:00
|
|
|
};
|
|
|
|
|
2014-10-16 12:08:54 +00:00
|
|
|
}
|
|
|
|
}
|