/* This file is part of solidity. solidity is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. solidity is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with solidity. If not, see . */ /** * Yul interpreter module that evaluates EVM instructions. */ #include #include #include #include #include using namespace std; using namespace dev; using namespace yul; using namespace yul::test; namespace { u256 exp256(u256 _base, u256 _exponent) { using boost::multiprecision::limb_type; u256 result = 1; while (_exponent) { if (boost::multiprecision::bit_test(_exponent, 0)) result *= _base; _base *= _base; _exponent >>= 1; } return result; } /// Reads 32 bytes from @a _data at position @a _offset bytes while /// interpreting @a _data to be padded with an infinite number of zero /// bytes beyond its end. u256 readZeroExtended(bytes const& _data, u256 const& _offset) { if (_offset >= _data.size()) return 0; else if (_offset + 32 <= _data.size()) return *reinterpret_cast(_data.data() + size_t(_offset)); else { size_t off = size_t(_offset); u256 val; for (size_t i = 0; i < 32; ++i) { val <<= 8; if (off + i < _data.size()) val += _data[off + i]; } return val; } } /// Copy @a _size bytes of @a _source at offset @a _sourceOffset to /// @a _target at offset @a _targetOffset. Behaves as if @a _source would /// continue with an infinite sequence of zero bytes beyond its end. /// Asserts the target is large enough to hold the copied segment. void copyZeroExtended( bytes& _target, bytes const& _source, size_t _targetOffset, size_t _sourceOffset, size_t _size ) { yulAssert(_targetOffset + _size <= _target.size(), ""); for (size_t i = 0; i < _size; ++i) _target[_targetOffset + i] = _sourceOffset + i < _source.size() ? _source[_sourceOffset + i] : 0; } } using u512 = boost::multiprecision::number>; u256 EVMInstructionInterpreter::eval( dev::eth::Instruction _instruction, vector const& _arguments ) { using namespace dev::eth; using dev::eth::Instruction; auto info = instructionInfo(_instruction); yulAssert(size_t(info.args) == _arguments.size(), ""); auto const& arg = _arguments; switch (_instruction) { case Instruction::STOP: throw ExplicitlyTerminated(); // --------------- arithmetic --------------- case Instruction::ADD: return arg[0] + arg[1]; case Instruction::MUL: return arg[0] * arg[1]; case Instruction::SUB: return arg[0] - arg[1]; case Instruction::DIV: return arg[1] == 0 ? 0 : arg[0] / arg[1]; case Instruction::SDIV: return arg[1] == 0 ? 0 : s2u(u2s(arg[0]) / u2s(arg[1])); case Instruction::MOD: return arg[1] == 0 ? 0 : arg[0] % arg[1]; case Instruction::SMOD: return arg[1] == 0 ? 0 : s2u(u2s(arg[0]) % u2s(arg[1])); case Instruction::EXP: return exp256(arg[0], arg[1]); case Instruction::NOT: return ~arg[0]; case Instruction::LT: return arg[0] < arg[1] ? 1 : 0; case Instruction::GT: return arg[0] > arg[1] ? 1 : 0; case Instruction::SLT: return u2s(arg[0]) < u2s(arg[1]) ? 1 : 0; case Instruction::SGT: return u2s(arg[0]) > u2s(arg[1]) ? 1 : 0; case Instruction::EQ: return arg[0] == arg[1] ? 1 : 0; case Instruction::ISZERO: return arg[0] == 0 ? 1 : 0; case Instruction::AND: return arg[0] & arg[1]; case Instruction::OR: return arg[0] | arg[1]; case Instruction::XOR: return arg[0] ^ arg[1]; case Instruction::BYTE: return arg[0] >= 32 ? 0 : (arg[1] >> unsigned(8 * (31 - arg[0]))) & 0xff; case Instruction::SHL: return arg[0] > 255 ? 0 : (arg[1] << unsigned(arg[0])); case Instruction::SHR: return arg[0] > 255 ? 0 : (arg[1] >> unsigned(arg[0])); case Instruction::SAR: { static u256 const hibit = u256(1) << 255; if (arg[0] >= 256) return arg[1] & hibit ? u256(-1) : 0; else { unsigned amount = unsigned(arg[0]); u256 v = arg[1] >> amount; if (arg[1] & hibit) v |= u256(-1) << (256 - amount); return v; } } case Instruction::ADDMOD: return arg[2] == 0 ? 0 : u256((u512(arg[0]) + u512(arg[1])) % arg[2]); case Instruction::MULMOD: return arg[2] == 0 ? 0 : u256((u512(arg[0]) * u512(arg[1])) % arg[2]); case Instruction::SIGNEXTEND: if (arg[0] >= 31) return arg[1]; else { unsigned testBit = unsigned(arg[0]) * 8 + 7; u256 ret = arg[1]; u256 mask = ((u256(1) << testBit) - 1); if (boost::multiprecision::bit_test(ret, testBit)) ret |= ~mask; else ret &= mask; return ret; } // --------------- blockchain stuff --------------- case Instruction::KECCAK256: { if (!logMemoryRead(arg[0], arg[1])) return u256("0x1234cafe1234cafe1234cafe") + arg[0]; uint64_t offset = uint64_t(arg[0] & uint64_t(-1)); uint64_t size = uint64_t(arg[1] & uint64_t(-1)); return u256(keccak256(bytesConstRef(m_state.memory.data() + offset, size))); } case Instruction::ADDRESS: return m_state.address; case Instruction::BALANCE: return m_state.balance; case Instruction::ORIGIN: return m_state.origin; case Instruction::CALLER: return m_state.caller; case Instruction::CALLVALUE: return m_state.callvalue; case Instruction::CALLDATALOAD: return readZeroExtended(m_state.calldata, arg[0]); case Instruction::CALLDATASIZE: return m_state.calldata.size(); case Instruction::CALLDATACOPY: if (logMemoryWrite(arg[0], arg[2])) copyZeroExtended( m_state.memory, m_state.calldata, size_t(arg[0]), size_t(arg[1]), size_t(arg[2]) ); return 0; case Instruction::CODESIZE: return m_state.code.size(); case Instruction::CODECOPY: if (logMemoryWrite(arg[0], arg[2])) copyZeroExtended( m_state.memory, m_state.code, size_t(arg[0]), size_t(arg[1]), size_t(arg[2]) ); return 0; case Instruction::GASPRICE: return m_state.gasprice; case Instruction::EXTCODESIZE: logTrace(_instruction, arg); return u256(keccak256(h256(arg[0]))) & 0xffffff; case Instruction::EXTCODEHASH: logTrace(_instruction, arg); return u256(keccak256(h256(arg[0] + 1))); case Instruction::EXTCODECOPY: logTrace(_instruction, arg); if (logMemoryWrite(arg[1], arg[3])) // TODO this way extcodecopy and codecopy do the same thing. copyZeroExtended( m_state.memory, m_state.code, size_t(arg[1]), size_t(arg[2]), size_t(arg[3]) ); return 0; case Instruction::RETURNDATASIZE: logTrace(_instruction, arg); return m_state.returndata.size(); case Instruction::RETURNDATACOPY: logTrace(_instruction, arg); if (logMemoryWrite(arg[0], arg[2])) copyZeroExtended( m_state.memory, m_state.returndata, size_t(arg[0]), size_t(arg[1]), size_t(arg[2]) ); return 0; case Instruction::BLOCKHASH: if (arg[0] >= m_state.blockNumber || arg[0] + 256 < m_state.blockNumber) return 0; else return 0xaaaaaaaa + (arg[0] - m_state.blockNumber - 256); case Instruction::COINBASE: return m_state.coinbase; case Instruction::TIMESTAMP: return m_state.timestamp; case Instruction::NUMBER: return m_state.blockNumber; case Instruction::DIFFICULTY: return m_state.difficulty; case Instruction::GASLIMIT: return m_state.gaslimit; // --------------- memory / storage / logs --------------- case Instruction::MLOAD: if (logMemoryRead(arg[0], 0x20)) return u256(*reinterpret_cast(m_state.memory.data() + size_t(arg[0]))); else return 0x1234 + arg[0]; case Instruction::MSTORE: if (logMemoryWrite(arg[0], 0x20, h256(arg[1]).asBytes())) *reinterpret_cast(m_state.memory.data() + size_t(arg[0])) = h256(arg[1]); return 0; case Instruction::MSTORE8: if (logMemoryWrite(arg[0], 1, bytes{1, uint8_t(arg[1] & 0xff)})) m_state.memory[size_t(arg[0])] = uint8_t(arg[1] & 0xff); return 0; case Instruction::SLOAD: logTrace(_instruction, arg); return m_state.storage[h256(arg[0])]; case Instruction::SSTORE: logTrace(Instruction::SSTORE, arg); m_state.storage[h256(arg[0])] = h256(arg[1]); return 0; case Instruction::PC: logTrace(_instruction); return 0x77; case Instruction::MSIZE: logTrace(_instruction); return m_state.msize; case Instruction::GAS: logTrace(_instruction); return 0x99; case Instruction::LOG0: logMemoryRead(arg[0], arg[1]); logTrace(_instruction, arg); return 0; case Instruction::LOG1: logMemoryRead(arg[0], arg[1]); logTrace(_instruction, arg); return 0; case Instruction::LOG2: logMemoryRead(arg[0], arg[1]); logTrace(_instruction, arg); return 0; case Instruction::LOG3: logMemoryRead(arg[0], arg[1]); logTrace(_instruction, arg); return 0; case Instruction::LOG4: logMemoryRead(arg[0], arg[1]); logTrace(_instruction, arg); return 0; // --------------- calls --------------- case Instruction::CREATE: logMemoryRead(arg[1], arg[2]); logTrace(_instruction, arg); return 0xcccccc + arg[1]; case Instruction::CREATE2: logMemoryRead(arg[2], arg[3]); logTrace(_instruction, arg); return 0xdddddd + arg[1]; case Instruction::CALL: case Instruction::CALLCODE: // TODO assign returndata logMemoryRead(arg[3], arg[4]); logMemoryWrite(arg[5], arg[6]); logTrace(_instruction, arg); return arg[0] & 1; case Instruction::DELEGATECALL: case Instruction::STATICCALL: logMemoryRead(arg[2], arg[3]); logMemoryWrite(arg[4], arg[5]); logTrace(_instruction, arg); return 0; case Instruction::RETURN: { bytes data; if (logMemoryRead(arg[0], arg[1])) data = bytesConstRef(m_state.memory.data() + size_t(arg[0]), size_t(arg[1])).toBytes(); logTrace(_instruction, arg, data); throw ExplicitlyTerminated(); } case Instruction::REVERT: logMemoryRead(arg[0], arg[1]); logTrace(_instruction, arg); throw ExplicitlyTerminated(); case Instruction::INVALID: logTrace(_instruction); throw ExplicitlyTerminated(); case Instruction::SELFDESTRUCT: logTrace(_instruction, arg); throw ExplicitlyTerminated(); case Instruction::POP: break; // --------------- invalid in strict assembly --------------- case Instruction::JUMP: case Instruction::JUMPI: case Instruction::JUMPDEST: case Instruction::PUSH1: case Instruction::PUSH2: case Instruction::PUSH3: case Instruction::PUSH4: case Instruction::PUSH5: case Instruction::PUSH6: case Instruction::PUSH7: case Instruction::PUSH8: case Instruction::PUSH9: case Instruction::PUSH10: case Instruction::PUSH11: case Instruction::PUSH12: case Instruction::PUSH13: case Instruction::PUSH14: case Instruction::PUSH15: case Instruction::PUSH16: case Instruction::PUSH17: case Instruction::PUSH18: case Instruction::PUSH19: case Instruction::PUSH20: case Instruction::PUSH21: case Instruction::PUSH22: case Instruction::PUSH23: case Instruction::PUSH24: case Instruction::PUSH25: case Instruction::PUSH26: case Instruction::PUSH27: case Instruction::PUSH28: case Instruction::PUSH29: case Instruction::PUSH30: case Instruction::PUSH31: case Instruction::PUSH32: case Instruction::DUP1: case Instruction::DUP2: case Instruction::DUP3: case Instruction::DUP4: case Instruction::DUP5: case Instruction::DUP6: case Instruction::DUP7: case Instruction::DUP8: case Instruction::DUP9: case Instruction::DUP10: case Instruction::DUP11: case Instruction::DUP12: case Instruction::DUP13: case Instruction::DUP14: case Instruction::DUP15: case Instruction::DUP16: case Instruction::SWAP1: case Instruction::SWAP2: case Instruction::SWAP3: case Instruction::SWAP4: case Instruction::SWAP5: case Instruction::SWAP6: case Instruction::SWAP7: case Instruction::SWAP8: case Instruction::SWAP9: case Instruction::SWAP10: case Instruction::SWAP11: case Instruction::SWAP12: case Instruction::SWAP13: case Instruction::SWAP14: case Instruction::SWAP15: case Instruction::SWAP16: // --------------- EVM 2.0 --------------- case Instruction::JUMPTO: case Instruction::JUMPIF: case Instruction::JUMPV: case Instruction::JUMPSUB: case Instruction::JUMPSUBV: case Instruction::BEGINSUB: case Instruction::BEGINDATA: case Instruction::RETURNSUB: case Instruction::PUTLOCAL: case Instruction::GETLOCAL: { yulAssert(false, ""); return 0; } } return 0; } u256 EVMInstructionInterpreter::evalBuiltin(YulString _name, const std::vector& _arguments) { if (_name == "datasize"_yulstring) return u256(keccak256(h256(_arguments.at(0)))) & 0xfff; else if (_name == "dataoffset"_yulstring) return u256(keccak256(h256(_arguments.at(0) + 2))) & 0xfff; else if (_name == "datacopy"_yulstring) { // This is identical to codecopy. if (logMemoryWrite(_arguments.at(0), _arguments.at(2))) copyZeroExtended( m_state.memory, m_state.code, size_t(_arguments.at(0)), size_t(_arguments.at(1) & size_t(-1)), size_t(_arguments.at(2)) ); } else yulAssert(false, "Unknown builtin: " + _name.str()); return 0; } bool EVMInstructionInterpreter::logMemoryRead(u256 const& _offset, u256 const& _size) { return logMemory(false, _offset, _size); } bool EVMInstructionInterpreter::logMemoryWrite(u256 const& _offset, u256 const& _size, bytes const& _data) { return logMemory(true, _offset, _size, _data); } bool EVMInstructionInterpreter::logMemory(bool _write, u256 const& _offset, u256 const& _size, bytes const& _data) { logTrace(_write ? "MSTORE_AT_SIZE" : "MLOAD_FROM_SIZE", {_offset, _size}, _data); if (((_offset + _size) >= _offset) && ((_offset + _size + 0x1f) >= (_offset + _size))) { u256 newSize = (_offset + _size + 0x1f) & ~u256(0x1f); m_state.msize = max(m_state.msize, newSize); if (newSize < m_state.maxMemSize) { if (m_state.memory.size() < newSize) m_state.memory.resize(size_t(newSize)); return true; } } else m_state.msize = u256(-1); return false; } void EVMInstructionInterpreter::logTrace(dev::eth::Instruction _instruction, std::vector const& _arguments, bytes const& _data) { logTrace(dev::eth::instructionInfo(_instruction).name, _arguments, _data); } void EVMInstructionInterpreter::logTrace(std::string const& _pseudoInstruction, std::vector const& _arguments, bytes const& _data) { string message = _pseudoInstruction + "("; for (size_t i = 0; i < _arguments.size(); ++i) message += (i > 0 ? ", " : "") + formatNumber(_arguments[i]); message += ")"; if (!_data.empty()) message += " [" + toHex(_data) + "]"; m_state.trace.emplace_back(std::move(message)); if (m_state.maxTraceSize > 0 && m_state.trace.size() >= m_state.maxTraceSize) { m_state.trace.emplace_back("Trace size limit reached."); throw TraceLimitReached(); } }