solidity/libyul/optimiser/DataFlowAnalyzer.cpp

444 lines
13 KiB
C++
Raw Normal View History

/*
This file is part of solidity.
solidity is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
solidity is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with solidity. If not, see <http://www.gnu.org/licenses/>.
*/
/**
 * Base class to perform data flow analysis during AST walks.
 * Tracks assignments and is used as base class for both Rematerialiser and
 * Common Subexpression Eliminator.
 */
2018-10-15 09:52:35 +00:00
#include <libyul/optimiser/DataFlowAnalyzer.h>
2018-10-15 09:52:35 +00:00
#include <libyul/optimiser/NameCollector.h>
#include <libyul/optimiser/Semantics.h>
#include <libyul/AST.h>
2018-10-15 09:52:35 +00:00
#include <libyul/Exceptions.h>
2019-05-21 13:52:15 +00:00
#include <libyul/backends/evm/EVMDialect.h>
#include <libsolutil/CommonData.h>
#include <boost/range/adaptor/reversed.hpp>
2019-05-21 13:52:15 +00:00
#include <boost/range/algorithm_ext/erase.hpp>
#include <variant>
using namespace std;
2019-12-11 16:31:36 +00:00
using namespace solidity;
using namespace solidity::util;
using namespace solidity::yul;
2019-05-21 13:52:15 +00:00
/// Visits an expression statement and updates the tracked storage / memory knowledge.
///
/// If the statement is recognised by isSimpleStore() as an SSTORE or MSTORE whose two
/// arguments are plain identifiers, entries that can no longer be trusted are removed
/// from the respective map and the new `key -> value` pair is recorded.
/// For every other statement, the maps are cleared according to the side effects of
/// the expression before it is visited.
void DataFlowAnalyzer::operator()(ExpressionStatement& _statement)
{
    if (auto sstoreArgs = isSimpleStore(evmasm::Instruction::SSTORE, _statement))
    {
        ASTModifier::operator()(_statement);
        // An existing entry is kept only if its key is known to differ from the
        // written key or its value is known to equal the written value.
        // Keys are collected first and erased in a second pass.
        set<YulString> keysToErase;
        for (auto const& item: m_storage.values)
            if (!(
                m_knowledgeBase.knownToBeDifferent(sstoreArgs->first, item.first) ||
                m_knowledgeBase.knownToBeEqual(sstoreArgs->second, item.second)
            ))
                keysToErase.insert(item.first);
        for (YulString const& key: keysToErase)
            m_storage.eraseKey(key);
        m_storage.set(sstoreArgs->first, sstoreArgs->second);
    }
    else if (auto mstoreArgs = isSimpleStore(evmasm::Instruction::MSTORE, _statement))
    {
        ASTModifier::operator()(_statement);
        // An existing entry is kept only if its key is known to differ from the
        // written key by at least 32.
        set<YulString> keysToErase;
        for (auto const& item: m_memory.values)
            if (!m_knowledgeBase.knownToBeDifferentByAtLeast32(mstoreArgs->first, item.first))
                keysToErase.insert(item.first);
        for (YulString const& key: keysToErase)
            m_memory.eraseKey(key);
        m_memory.set(mstoreArgs->first, mstoreArgs->second);
    }
    else
    {
        clearKnowledgeIfInvalidated(_statement.expression);
        ASTModifier::operator()(_statement);
    }
}
/// Visits an assignment: clears storage / memory knowledge invalidated by the
/// right-hand side, visits the right-hand side and then registers the assignment
/// for all assigned variables via handleAssignment().
/// Throws OptimizerException (through assertThrow) if the assignment has no value.
void DataFlowAnalyzer::operator()(Assignment& _assignment)
{
    set<YulString> names;
    for (auto const& var: _assignment.variableNames)
        names.emplace(var.name);

    assertThrow(_assignment.value, OptimizerException, "");
    clearKnowledgeIfInvalidated(*_assignment.value);
    visit(*_assignment.value);
    handleAssignment(names, _assignment.value.get(), false);
}
/// Visits a variable declaration: adds the declared names to the innermost scope,
/// processes the initial value (if there is one) and registers the declaration via
/// handleAssignment(). A declaration without value passes a null value pointer.
void DataFlowAnalyzer::operator()(VariableDeclaration& _varDecl)
{
    set<YulString> names;
    for (auto const& var: _varDecl.variables)
        names.emplace(var.name);
    m_variableScopes.back().variables += names;

    if (_varDecl.value)
    {
        clearKnowledgeIfInvalidated(*_varDecl.value);
        visit(*_varDecl.value);
    }

    handleAssignment(names, _varDecl.value.get(), true);
}
/// Visits an `if` statement.
///
/// Storage / memory knowledge is snapshotted after accounting for the condition and
/// joined with the knowledge present after the visit, so that only entries that are
/// identical in both survive. Values of all variables assigned in the body are cleared.
void DataFlowAnalyzer::operator()(If& _if)
{
    clearKnowledgeIfInvalidated(*_if.condition);
    // Snapshots of the knowledge before the `if` is visited.
    InvertibleMap<YulString, YulString> storage = m_storage;
    InvertibleMap<YulString, YulString> memory = m_memory;

    ASTModifier::operator()(_if);

    joinKnowledge(storage, memory);

    Assignments assignments;
    assignments(_if.body);
    clearValues(assignments.names());
}
/// Visits a `switch` statement.
///
/// Each case body is visited starting from the knowledge that is current when the
/// case is reached; afterwards the storage / memory knowledge is joined with the
/// snapshot taken before that case. Values of variables assigned in any case are
/// cleared, and knowledge invalidated by any case body is cleared once more after
/// all cases have been processed.
void DataFlowAnalyzer::operator()(Switch& _switch)
{
    clearKnowledgeIfInvalidated(*_switch.expression);
    visit(*_switch.expression);

    set<YulString> assignedVariables;
    for (auto& _case: _switch.cases)
    {
        // Snapshots of the knowledge before this case body is visited.
        InvertibleMap<YulString, YulString> storage = m_storage;
        InvertibleMap<YulString, YulString> memory = m_memory;
        (*this)(_case.body);
        joinKnowledge(storage, memory);

        Assignments assignments;
        assignments(_case.body);
        assignedVariables += assignments.names();
        // This is a little too destructive, we could retain the old values.
        clearValues(assignments.names());
        clearKnowledgeIfInvalidated(_case.body);
    }

    for (auto& _case: _switch.cases)
        clearKnowledgeIfInvalidated(_case.body);
    clearValues(assignedVariables);
}
/// Visits a function definition with fresh analysis state.
///
/// The current values, loop depth, references, storage and memory knowledge are
/// swapped out for empty / zero state while the function is processed and swapped
/// back in afterwards. Parameters and return variables are added to a new function
/// scope; return variables are additionally registered as declarations without value.
void DataFlowAnalyzer::operator()(FunctionDefinition& _fun)
{
    // Save all information. We might rather reinstantiate this class,
    // but this could be difficult if it is subclassed.
    map<YulString, AssignedValue> outerValue;
    size_t outerLoopDepth{0};
    InvertibleRelation<YulString> outerReferences;
    InvertibleMap<YulString, YulString> outerStorage;
    InvertibleMap<YulString, YulString> outerMemory;
    swap(m_value, outerValue);
    swap(m_loopDepth, outerLoopDepth);
    swap(m_references, outerReferences);
    swap(m_storage, outerStorage);
    swap(m_memory, outerMemory);

    pushScope(true);
    for (auto const& parameter: _fun.parameters)
        m_variableScopes.back().variables.emplace(parameter.name);
    for (auto const& var: _fun.returnVariables)
    {
        m_variableScopes.back().variables.emplace(var.name);
        handleAssignment({var.name}, nullptr, true);
    }

    ASTModifier::operator()(_fun);

    // Note that the contents of return variables, storage and memory at this point
    // might be incorrect due to the fact that the DataFlowAnalyzer ignores the ``leave``
    // statement.

    popScope();

    // Restore the state of the enclosing context.
    swap(m_value, outerValue);
    swap(m_loopDepth, outerLoopDepth);
    swap(m_references, outerReferences);
    swap(m_storage, outerStorage);
    swap(m_memory, outerMemory);
}
/// Visits a `for` loop whose pre block is empty.
///
/// Values of all variables assigned in the body or post block are cleared before the
/// loop is entered and again after it has been processed; storage / memory knowledge
/// invalidated by the condition, post block or body is cleared at the same points.
/// The loop depth is incremented for the duration of the visit.
/// Throws OptimizerException (through assertThrow) if the pre block is not empty.
void DataFlowAnalyzer::operator()(ForLoop& _for)
{
    // If the pre block was not empty,
    // we would have to deal with more complicated scoping rules.
    assertThrow(_for.pre.statements.empty(), OptimizerException, "");

    ++m_loopDepth;

    AssignmentsSinceContinue assignmentsSinceCont;
    assignmentsSinceCont(_for.body);

    Assignments assignments;
    assignments(_for.body);
    assignments(_for.post);
    clearValues(assignments.names());

    // break/continue are tricky for storage and thus we almost always clear here.
    clearKnowledgeIfInvalidated(*_for.condition);
    clearKnowledgeIfInvalidated(_for.post);
    clearKnowledgeIfInvalidated(_for.body);

    visit(*_for.condition);
    (*this)(_for.body);
    // Clear the variables collected by AssignmentsSinceContinue before the post block is visited.
    clearValues(assignmentsSinceCont.names());
    clearKnowledgeIfInvalidated(_for.body);
    (*this)(_for.post);

    clearValues(assignments.names());
    clearKnowledgeIfInvalidated(*_for.condition);
    clearKnowledgeIfInvalidated(_for.post);
    clearKnowledgeIfInvalidated(_for.body);

    --m_loopDepth;
}
/// Visits a block inside its own (non-function) variable scope.
/// Throws OptimizerException (through assertThrow) if the number of open scopes
/// after the visit differs from the number before it.
void DataFlowAnalyzer::operator()(Block& _block)
{
    size_t numScopes = m_variableScopes.size();
    pushScope(false);
    ASTModifier::operator()(_block);
    popScope();
    assertThrow(numScopes == m_variableScopes.size(), OptimizerException, "");
}
2020-11-26 17:07:12 +00:00
/// Registers an assignment to or a declaration of `_variables`.
///
/// @param _variables the variables being assigned or declared.
/// @param _value the assigned expression; if null, every variable is assigned `m_zero`.
/// @param _isDeclaration if false, existing knowledge about the variables is cleared first.
///
/// The value is only recorded when a single variable is assigned, the expression is
/// movable and it does not reference the variable itself. If the value is a simple
/// MLOAD / SLOAD of an identifier, the loaded slot is recorded as holding the variable.
void DataFlowAnalyzer::handleAssignment(set<YulString> const& _variables, Expression* _value, bool _isDeclaration)
{
    if (!_isDeclaration)
        clearValues(_variables);

    MovableChecker movableChecker{m_dialect, &m_functionSideEffects};
    if (_value)
        movableChecker.visit(*_value);
    else
        for (auto const& var: _variables)
            assignValue(var, &m_zero);

    if (_value && _variables.size() == 1)
    {
        YulString name = *_variables.begin();
        // Expression has to be movable and cannot contain a reference
        // to the variable that will be assigned to.
        if (movableChecker.movable() && !movableChecker.referencedVariables().count(name))
            assignValue(name, _value);
    }

    auto const& referencedVariables = movableChecker.referencedVariables();
    for (auto const& name: _variables)
    {
        m_references.set(name, referencedVariables);
        if (!_isDeclaration)
        {
            // assignment to slot denoted by "name"
            m_storage.eraseKey(name);
            // assignment to slot contents denoted by "name"
            m_storage.eraseValue(name);
            // assignment to slot denoted by "name"
            m_memory.eraseKey(name);
            // assignment to slot contents denoted by "name"
            m_memory.eraseValue(name);
        }
    }

    if (_value && _variables.size() == 1)
    {
        YulString variable = *_variables.begin();
        if (!movableChecker.referencedVariables().count(variable))
        {
            // This might erase additional knowledge about the slot.
            // On the other hand, if we knew the value in the slot
            // already, then the sload() / mload() would have been replaced by a variable anyway.
            if (auto memoryKey = isSimpleLoad(evmasm::Instruction::MLOAD, *_value))
                m_memory.set(*memoryKey, variable);
            else if (auto storageKey = isSimpleLoad(evmasm::Instruction::SLOAD, *_value))
                m_storage.set(*storageKey, variable);
        }
    }
}
/// Opens a new innermost variable scope. `_functionScope` is passed on to the
/// constructor of the new scope entry.
void DataFlowAnalyzer::pushScope(bool _functionScope)
{
m_variableScopes.emplace_back(_functionScope);
}
/// Closes the innermost variable scope: the knowledge about every variable that was
/// registered in it is cleared, then the scope itself is removed.
void DataFlowAnalyzer::popScope()
{
    auto& innermostScope = m_variableScopes.back();
    clearValues(std::move(innermostScope.variables));
    m_variableScopes.pop_back();
}
/// Clears all knowledge about `_variables`.
///
/// Storage and memory entries that use one of the variables as key or as value are
/// erased. The recorded values and reference relations are erased for the variables
/// themselves and for every variable that directly references one of them.
void DataFlowAnalyzer::clearValues(set<YulString> _variables)
{
    // All variables that reference variables to be cleared also have to be
    // cleared, but not recursively, since only the value of the original
    // variables changes. Example:
    // let a := 1
    // let b := a
    // let c := b
    // a := 2
    // add(b, c)
    // In the last line, we can replace c by b, but not b by a.
    //
    // This cannot be easily tested since the substitutions will be done
    // one by one on the fly, and the last line will just be add(1, 1)

    // First clear storage knowledge, because we do not have to clear
    // storage knowledge of variables whose expression has changed,
    // since the value is still unchanged.
    for (auto const& name: _variables)
    {
        // clear slot denoted by "name"
        m_storage.eraseKey(name);
        // clear slot contents denoted by "name"
        m_storage.eraseValue(name);
        // clear slot denoted by "name"
        m_memory.eraseKey(name);
        // clear slot contents denoted by "name"
        m_memory.eraseValue(name);
    }

    // Also clear variables that reference variables to be cleared.
    // The direct referrers are gathered into a separate set: inserting into
    // `_variables` while iterating over it would also visit those newly inserted
    // names that sort after the current element, making the closure partially
    // recursive and dependent on the ordering of the names.
    set<YulString> referencingVariables;
    for (auto const& name: _variables)
        for (auto const& ref: m_references.backward[name])
            referencingVariables.emplace(ref);
    _variables.insert(referencingVariables.begin(), referencingVariables.end());

    // Clear the value and update the reference relation.
    for (auto const& name: _variables)
        m_value.erase(name);
    for (auto const& name: _variables)
        m_references.eraseKey(name);
}
2019-11-27 09:44:40 +00:00
/// Records `_value` as the current value of `_variable`, together with the loop
/// depth at which the assignment was seen. An existing entry is overwritten.
void DataFlowAnalyzer::assignValue(YulString _variable, Expression const* _value)
{
    m_value[_variable] = {_value, m_loopDepth};
}
2019-05-27 22:14:01 +00:00
/// Clears the storage knowledge if the side effects collected for `_block` invalidate
/// storage, and the memory knowledge if they invalidate memory.
void DataFlowAnalyzer::clearKnowledgeIfInvalidated(Block const& _block)
{
    SideEffectsCollector sideEffects(m_dialect, _block, &m_functionSideEffects);
    if (sideEffects.invalidatesStorage())
        m_storage.clear();
    if (sideEffects.invalidatesMemory())
        m_memory.clear();
}
2019-05-27 22:14:01 +00:00
/// Clears the storage knowledge if the side effects collected for `_expr` invalidate
/// storage, and the memory knowledge if they invalidate memory.
void DataFlowAnalyzer::clearKnowledgeIfInvalidated(Expression const& _expr)
{
    SideEffectsCollector sideEffects(m_dialect, _expr, &m_functionSideEffects);
    if (sideEffects.invalidatesStorage())
        m_storage.clear();
    if (sideEffects.invalidatesMemory())
        m_memory.clear();
}
/// Joins the current storage and memory knowledge with the given older snapshots by
/// applying joinKnowledgeHelper() to each of the two maps.
void DataFlowAnalyzer::joinKnowledge(
    InvertibleMap<YulString, YulString> const& _olderStorage,
    InvertibleMap<YulString, YulString> const& _olderMemory
)
{
    joinKnowledgeHelper(m_storage, _olderStorage);
    joinKnowledgeHelper(m_memory, _olderMemory);
}
2019-05-27 22:14:01 +00:00
/// Removes from `_this` every entry that is not present with the same value in
/// `_older`, so that `_this` ends up containing only knowledge common to both.
void DataFlowAnalyzer::joinKnowledgeHelper(
    InvertibleMap<YulString, YulString>& _this,
    InvertibleMap<YulString, YulString> const& _older
)
{
    // We clear if the key does not exist in the older map or if the value is different.
    // This also works for memory because _older is an "older version"
    // of m_memory and thus any overlapping write would have cleared the keys
    // that are not known to be different inside m_memory already.
    set<YulString> keysToErase;
    for (auto const& item: _this.values)
    {
        auto it = _older.values.find(item.first);
        if (it == _older.values.end() || it->second != item.second)
            keysToErase.insert(item.first);
    }
    // Erase in a second pass, after the iteration over `_this.values` has finished.
    for (auto const& key: keysToErase)
        _this.eraseKey(key);
}
/// @returns true if `_variableName` is registered in one of the open scopes, searching
/// from the innermost scope outwards. The search stops after the first scope that is
/// marked as a function scope.
bool DataFlowAnalyzer::inScope(YulString _variableName) const
{
    for (auto const& scope: m_variableScopes | boost::adaptors::reversed)
    {
        if (scope.variables.count(_variableName))
            return true;
        if (scope.isFunction)
            return false;
    }
    return false;
}
2019-05-21 13:52:15 +00:00
/// Checks whether `_statement` is a call to the builtin for `_store` (MSTORE or SSTORE)
/// in an EVM dialect whose first two arguments are both identifiers.
///
/// @returns the pair (name of first argument, name of second argument) if so,
/// and an empty optional otherwise.
/// Asserts (yulAssert) that `_store` is MSTORE or SSTORE.
std::optional<pair<YulString, YulString>> DataFlowAnalyzer::isSimpleStore(
    evmasm::Instruction _store,
    ExpressionStatement const& _statement
) const
{
    yulAssert(
        _store == evmasm::Instruction::MSTORE ||
        _store == evmasm::Instruction::SSTORE,
        ""
    );

    if (!holds_alternative<FunctionCall>(_statement.expression))
        return {};
    FunctionCall const& funCall = std::get<FunctionCall>(_statement.expression);

    EVMDialect const* dialect = dynamic_cast<EVMDialect const*>(&m_dialect);
    if (!dialect)
        return {};

    auto const* builtin = dialect->builtin(funCall.functionName.name);
    if (!builtin || builtin->instruction != _store)
        return {};

    if (
        !holds_alternative<Identifier>(funCall.arguments.at(0)) ||
        !holds_alternative<Identifier>(funCall.arguments.at(1))
    )
        return {};

    YulString key = std::get<Identifier>(funCall.arguments.at(0)).name;
    YulString value = std::get<Identifier>(funCall.arguments.at(1)).name;
    return make_pair(key, value);
}
/// Checks whether `_expression` is a call to the builtin for `_load` (MLOAD or SLOAD)
/// in an EVM dialect whose first argument is an identifier.
///
/// @returns the name of that identifier if so, and an empty optional otherwise.
/// Asserts (yulAssert) that `_load` is MLOAD or SLOAD.
std::optional<YulString> DataFlowAnalyzer::isSimpleLoad(
    evmasm::Instruction _load,
    Expression const& _expression
) const
{
    yulAssert(
        _load == evmasm::Instruction::MLOAD ||
        _load == evmasm::Instruction::SLOAD,
        ""
    );

    if (!holds_alternative<FunctionCall>(_expression))
        return {};
    FunctionCall const& call = std::get<FunctionCall>(_expression);

    EVMDialect const* evmDialect = dynamic_cast<EVMDialect const*>(&m_dialect);
    if (!evmDialect)
        return {};

    auto const* builtinFunction = evmDialect->builtin(call.functionName.name);
    if (!builtinFunction)
        return {};
    if (!(builtinFunction->instruction == _load))
        return {};

    if (!holds_alternative<Identifier>(call.arguments.at(0)))
        return {};
    return std::get<Identifier>(call.arguments.at(0)).name;
}