New full inliner.

This commit is contained in:
chriseth 2018-10-02 10:46:59 +02:00
parent 72b1bb00bd
commit e2e4a9fe81
12 changed files with 227 additions and 254 deletions

View File

@ -23,12 +23,13 @@
#include <libyul/optimiser/ASTCopier.h> #include <libyul/optimiser/ASTCopier.h>
#include <libyul/optimiser/ASTWalker.h> #include <libyul/optimiser/ASTWalker.h>
#include <libyul/optimiser/NameCollector.h> #include <libyul/optimiser/NameCollector.h>
#include <libyul/optimiser/Semantics.h> #include <libyul/optimiser/Utilities.h>
#include <libyul/Exceptions.h> #include <libyul/Exceptions.h>
#include <libsolidity/inlineasm/AsmData.h> #include <libsolidity/inlineasm/AsmData.h>
#include <libdevcore/CommonData.h> #include <libdevcore/CommonData.h>
#include <libdevcore/Visitor.h>
#include <boost/range/adaptor/reversed.hpp> #include <boost/range/adaptor/reversed.hpp>
@ -56,7 +57,8 @@ FullInliner::FullInliner(Block& _ast):
void FullInliner::run() void FullInliner::run()
{ {
assertThrow(m_ast.statements[0].type() == typeid(Block), OptimizerException, ""); assertThrow(m_ast.statements[0].type() == typeid(Block), OptimizerException, "");
InlineModifier(*this, m_nameDispenser, "").visit(m_ast.statements[0]);
handleBlock("", boost::get<Block>(m_ast.statements[0]));
while (!m_functionsToVisit.empty()) while (!m_functionsToVisit.empty())
handleFunction(**m_functionsToVisit.begin()); handleFunction(**m_functionsToVisit.begin());
} }
@ -66,168 +68,105 @@ void FullInliner::handleFunction(FunctionDefinition& _fun)
if (!m_functionsToVisit.count(&_fun)) if (!m_functionsToVisit.count(&_fun))
return; return;
m_functionsToVisit.erase(&_fun); m_functionsToVisit.erase(&_fun);
(InlineModifier(*this, m_nameDispenser, _fun.name))(_fun.body);
handleBlock(_fun.name, _fun.body);
} }
void InlineModifier::operator()(FunctionalInstruction& _instruction) void FullInliner::handleBlock(string const& _currentFunctionName, Block& _block)
{ {
visitArguments(_instruction.arguments); InlineModifier{*this, m_nameDispenser, _currentFunctionName}(_block);
}
void InlineModifier::operator()(FunctionCall&)
{
assertThrow(false, OptimizerException, "Should be handled in visit() instead.");
}
void InlineModifier::operator()(ForLoop& _loop)
{
(*this)(_loop.pre);
// Do not visit the condition because we cannot inline there.
(*this)(_loop.post);
(*this)(_loop.body);
} }
void InlineModifier::operator()(Block& _block) void InlineModifier::operator()(Block& _block)
{ {
vector<Statement> saved; function<boost::optional<vector<Statement>>(Statement&)> f = [&](Statement& _statement) -> boost::optional<vector<Statement>> {
saved.swap(m_statementsToPrefix); visit(_statement);
return tryInlineStatement(_statement);
// This is only used if needed to minimize the number of move operations. };
vector<Statement> modifiedStatements; iterateReplacing(_block.statements, f);
for (size_t i = 0; i < _block.statements.size(); ++i)
{
visit(_block.statements.at(i));
if (!m_statementsToPrefix.empty())
{
if (modifiedStatements.empty())
std::move(
_block.statements.begin(),
_block.statements.begin() + i,
back_inserter(modifiedStatements)
);
modifiedStatements += std::move(m_statementsToPrefix);
m_statementsToPrefix.clear();
}
if (!modifiedStatements.empty())
modifiedStatements.emplace_back(std::move(_block.statements[i]));
}
if (!modifiedStatements.empty())
_block.statements = std::move(modifiedStatements);
saved.swap(m_statementsToPrefix);
} }
void InlineModifier::visit(Expression& _expression) boost::optional<vector<Statement>> InlineModifier::tryInlineStatement(Statement& _statement)
{ {
if (_expression.type() != typeid(FunctionCall)) // Only inline for expression statements, assignments and variable declarations.
return ASTModifier::visit(_expression); Expression* e = boost::apply_visitor(GenericFallbackReturnsVisitor<Expression*, ExpressionStatement, Assignment, VariableDeclaration>(
[](ExpressionStatement& _s) { return &_s.expression; },
FunctionCall& funCall = boost::get<FunctionCall>(_expression); [](Assignment& _s) { return _s.value.get(); },
FunctionDefinition& fun = m_driver.function(funCall.functionName.name); [](VariableDeclaration& _s) { return _s.value.get(); }
), _statement);
m_driver.handleFunction(fun); if (e)
// TODO: Insert good heuristic here. Perhaps implement that inside the driver.
bool doInline = funCall.functionName.name != m_currentFunction;
if (fun.returnVariables.size() > 1)
doInline = false;
{ {
vector<string> argNames; // Only inline direct function calls.
vector<string> argTypes; FunctionCall* funCall = boost::apply_visitor(GenericFallbackReturnsVisitor<FunctionCall*, FunctionCall&>(
for (auto const& arg: fun.parameters) [](FunctionCall& _e) { return &_e; }
), *e);
if (funCall)
{ {
argNames.push_back(fun.name + "_" + arg.name); FunctionDefinition& fun = m_driver.function(funCall->functionName.name);
argTypes.push_back(arg.type); m_driver.handleFunction(fun);
// TODO: Insert good heuristic here. Perhaps implement that inside the driver.
bool doInline = funCall->functionName.name != m_currentFunction;
if (doInline)
return performInline(_statement, *funCall, fun);
} }
visitArguments(funCall.arguments, argNames, argTypes, doInline);
} }
return {};
}
if (!doInline) vector<Statement> InlineModifier::performInline(Statement& _statement, FunctionCall& _funCall, FunctionDefinition& _function)
return; {
vector<Statement> newStatements;
map<string, string> variableReplacements; map<string, string> variableReplacements;
for (size_t i = 0; i < funCall.arguments.size(); ++i)
variableReplacements[fun.parameters[i].name] = boost::get<Identifier>(funCall.arguments[i]).name;
if (fun.returnVariables.empty())
_expression = noop(funCall.location);
else
{
string returnVariable = fun.returnVariables[0].name;
variableReplacements[returnVariable] = newName(fun.name + "_" + returnVariable);
m_statementsToPrefix.emplace_back(VariableDeclaration{ // helper function to create a new variable that is supposed to model
funCall.location, // an existing variable.
{{funCall.location, variableReplacements[returnVariable], fun.returnVariables[0].type}}, auto newVariable = [&](TypedName const& _existingVariable, Expression* _value) {
{} string newName = m_nameDispenser.newName(_function.name + "_" + _existingVariable.name);
}); variableReplacements[_existingVariable.name] = newName;
_expression = Identifier{funCall.location, variableReplacements[returnVariable]}; VariableDeclaration varDecl{_funCall.location, {{_funCall.location, newName, _existingVariable.type}}, {}};
} if (_value)
m_statementsToPrefix.emplace_back(BodyCopier(m_nameDispenser, fun.name + "_", variableReplacements)(fun.body)); varDecl.value = make_shared<Expression>(std::move(*_value));
} newStatements.emplace_back(std::move(varDecl));
};
void InlineModifier::visit(Statement& _statement) for (size_t i = 0; i < _funCall.arguments.size(); ++i)
{ newVariable(_function.parameters[i], &_funCall.arguments[i]);
ASTModifier::visit(_statement); for (auto const& var: _function.returnVariables)
// Replace pop(0) expression statemets (and others) by empty blocks. newVariable(var, nullptr);
if (_statement.type() == typeid(ExpressionStatement))
{ Statement newBody = BodyCopier(m_nameDispenser, _function.name + "_", variableReplacements)(_function.body);
ExpressionStatement& expSt = boost::get<ExpressionStatement>(_statement); newStatements += std::move(boost::get<Block>(newBody).statements);
if (expSt.expression.type() == typeid(FunctionalInstruction))
boost::apply_visitor(GenericFallbackVisitor<Assignment, VariableDeclaration>{
[&](Assignment& _assignment)
{ {
FunctionalInstruction& funInstr = boost::get<FunctionalInstruction>(expSt.expression); for (size_t i = 0; i < _assignment.variableNames.size(); ++i)
if (funInstr.instruction == solidity::Instruction::POP) newStatements.emplace_back(Assignment{
if (MovableChecker(funInstr.arguments.at(0)).movable()) _assignment.location,
_statement = Block{expSt.location, {}}; {_assignment.variableNames[i]},
} make_shared<Expression>(Identifier{
} _assignment.location,
} variableReplacements.at(_function.returnVariables[i].name)
})
void InlineModifier::visitArguments( });
vector<Expression>& _arguments, },
vector<string> const& _nameHints, [&](VariableDeclaration& _varDecl)
vector<string> const& _types,
bool _moveToFront
)
{
// If one of the elements moves parts to the front, all other elements right of it
// also have to be moved to the front to keep the order of evaluation.
vector<Statement> prefix;
for (size_t i = 0; i < _arguments.size(); ++i)
{
auto& arg = _arguments[i];
// TODO optimize vector operations, check that it actually moves
auto internalPrefix = visitRecursively(arg);
if (!internalPrefix.empty())
{ {
_moveToFront = true; for (size_t i = 0; i < _varDecl.variables.size(); ++i)
// We go through the arguments left to right, so we have to invert newStatements.emplace_back(VariableDeclaration{
// the prefixes. _varDecl.location,
prefix = std::move(internalPrefix) + std::move(prefix); {std::move(_varDecl.variables[i])},
make_shared<Expression>(Identifier{
_varDecl.location,
variableReplacements.at(_function.returnVariables[i].name)
})
});
} }
else if (_moveToFront) // nothing to be done for expression statement
{ }, _statement);
auto location = locationOf(arg); return newStatements;
string var = newName(i < _nameHints.size() ? _nameHints[i] : "");
prefix.emplace(prefix.begin(), VariableDeclaration{
location,
{{TypedName{location, var, i < _types.size() ? _types[i] : ""}}},
make_shared<Expression>(std::move(arg))
});
arg = Identifier{location, var};
}
}
m_statementsToPrefix += std::move(prefix);
}
vector<Statement> InlineModifier::visitRecursively(Expression& _expression)
{
vector<Statement> saved;
saved.swap(m_statementsToPrefix);
visit(_expression);
saved.swap(m_statementsToPrefix);
return saved;
} }
string InlineModifier::newName(string const& _prefix) string InlineModifier::newName(string const& _prefix)
@ -235,13 +174,6 @@ string InlineModifier::newName(string const& _prefix)
return m_nameDispenser.newName(_prefix); return m_nameDispenser.newName(_prefix);
} }
Expression InlineModifier::noop(SourceLocation const& _location)
{
return FunctionalInstruction{_location, solidity::Instruction::POP, {
Literal{_location, assembly::LiteralKind::Number, "0", ""}
}};
}
Statement BodyCopier::operator()(VariableDeclaration const& _varDecl) Statement BodyCopier::operator()(VariableDeclaration const& _varDecl)
{ {
for (auto const& var: _varDecl.variables) for (auto const& var: _varDecl.variables)

View File

@ -42,29 +42,31 @@ class NameCollector;
/** /**
* Optimiser component that modifies an AST in place, inlining arbitrary functions. * Optimiser component that modifies an AST in place, inlining functions.
* Expressions are expected to be split, i.e. the component will only inline
* function calls that are at the root of the expression and that only contains
* variables as arguments. More specifically, it will inline
* - let x1, ..., xn := f(a1, ..., am)
* - x1, ..., xn := f(a1, ..., am)
* f(a1, ..., am)
* *
* Code of the form * The transform changes code of the form
* *
* function f(a, b) -> c { ... } * function f(a, b) -> c { ... }
* h(g(x(...), f(arg1(...), arg2(...)), y(...)), z(...)) * let z := f(x, y)
* *
* is transformed into * into
* *
* function f(a, b) -> c { ... } * function f(a, b) -> c { ... }
* *
* let z1 := z(...) let y1 := y(...) let a2 := arg2(...) let a1 := arg1(...) * let f_a := x
* let c1 := 0 * let f_b := y
* { code of f, with replacements: a -> a1, b -> a2, c -> c1, d -> d1 } * let f_c
* h(g(x(...), c1, y1), z1) * code of f, with replacements: a -> f_a, b -> f_b, c -> f_c
* let z := f_c
* *
* No temporary variable is created for expressions that are "movable" * Prerequisites: Disambiguator, Function Hoister
* (i.e. they are "pure", have no side-effects and also do not depend on other code * More efficient if run after: Expression Splitter
* that might have side-effects).
*
* This component can only be used on sources with unique names and with hoisted functions,
* i.e. the root node has to be a block that itself contains a single block followed by all
* function definitions.
*/ */
class FullInliner: public ASTModifier class FullInliner: public ASTModifier
{ {
@ -79,6 +81,8 @@ public:
FunctionDefinition& function(std::string _name) { return *m_functions.at(_name); } FunctionDefinition& function(std::string _name) { return *m_functions.at(_name); }
private: private:
void handleBlock(std::string const& _currentFunctionName, Block& _block);
/// The AST to be modified. The root block itself will not be modified, because /// The AST to be modified. The root block itself will not be modified, because
/// we store pointers to functions. /// we store pointers to functions.
Block& m_ast; Block& m_ast;
@ -99,46 +103,15 @@ public:
m_driver(_driver), m_driver(_driver),
m_nameDispenser(_nameDispenser) m_nameDispenser(_nameDispenser)
{ } { }
~InlineModifier()
{
assertThrow(m_statementsToPrefix.empty(), OptimizerException, "");
}
virtual void operator()(FunctionalInstruction&) override;
virtual void operator()(FunctionCall&) override;
virtual void operator()(ForLoop&) override;
virtual void operator()(Block& _block) override; virtual void operator()(Block& _block) override;
using ASTModifier::visit;
virtual void visit(Expression& _expression) override;
virtual void visit(Statement& _st) override;
private: private:
boost::optional<std::vector<Statement>> tryInlineStatement(Statement& _statement);
/// Visits a list of expressions (usually an argument list to a function call) and tries std::vector<Statement> performInline(Statement& _statement, FunctionCall& _funCall, FunctionDefinition& _function);
/// to inline them. If one of them is inlined, all right of it have to be moved to the front
/// (to keep the order of evaluation). If @a _moveToFront is true, all elements are moved
/// to the front. @a _nameHints and @_types are used for the newly created variables, but
/// both can be empty.
void visitArguments(
std::vector<Expression>& _arguments,
std::vector<std::string> const& _nameHints = {},
std::vector<std::string> const& _types = {},
bool _moveToFront = false
);
/// Visits an expression, but saves and restores the current statements to prefix and returns
/// the statements that should be prefixed for @a _expression.
std::vector<Statement> visitRecursively(Expression& _expression);
std::string newName(std::string const& _prefix); std::string newName(std::string const& _prefix);
/// @returns an expression returning nothing.
Expression noop(SourceLocation const& _location);
/// List of statements that should go in front of the currently visited AST element,
/// at the statement level.
std::vector<Statement> m_statementsToPrefix;
std::string m_currentFunction; std::string m_currentFunction;
FullInliner& m_driver; FullInliner& m_driver;
NameDispenser& m_nameDispenser; NameDispenser& m_nameDispenser;

View File

@ -130,7 +130,11 @@ bool YulOptimizerTest::run(ostream& _stream, string const& _linePrefix, bool con
disambiguate(); disambiguate();
(FunctionHoister{})(*m_ast); (FunctionHoister{})(*m_ast);
(FunctionGrouper{})(*m_ast); (FunctionGrouper{})(*m_ast);
NameDispenser nameDispenser;
nameDispenser.m_usedNames = NameCollector(*m_ast).names();
ExpressionSplitter{nameDispenser}(*m_ast);
FullInliner(*m_ast).run(); FullInliner(*m_ast).run();
ExpressionJoiner::run(*m_ast);
} }
else if (m_optimizerStep == "mainFunction") else if (m_optimizerStep == "mainFunction")
{ {

View File

@ -0,0 +1,30 @@
{
function f(a) -> b, c { let x := mload(a) b := sload(x) c := 3 }
let a1 := calldataload(0)
let b3, c3 := f(a1)
let b4, c4 := f(c3)
}
// ----
// fullInliner
// {
// {
// let f_a := calldataload(0)
// let f_b
// let f_c
// f_b := sload(mload(f_a))
// f_c := 3
// let b3 := f_b
// let f_a_1 := f_c
// let f_b_1
// let f_c_1
// f_b_1 := sload(mload(f_a_1))
// f_c_1 := 3
// let b4 := f_b_1
// let c4 := f_c_1
// }
// function f(a) -> b, c
// {
// b := sload(mload(a))
// c := 3
// }
// }

View File

@ -12,14 +12,12 @@
// fullInliner // fullInliner
// { // {
// { // {
// let _1 := mload(0) // let _2 := mload(0)
// let f_a := mload(1) // let f_a := mload(1)
// let f_r // let f_r
// { // f_a := mload(f_a)
// f_a := mload(f_a) // f_r := add(f_a, calldatasize())
// f_r := add(f_a, calldatasize()) // if gt(f_r, _2)
// }
// if gt(f_r, _1)
// { // {
// sstore(0, 2) // sstore(0, 2)
// } // }

View File

@ -9,16 +9,17 @@
// fullInliner // fullInliner
// { // {
// { // {
// let _1 := mload(5) // let _2 := mload(5)
// let f_c := mload(4) // let _4 := mload(4)
// let f_b := mload(3) // let _6 := mload(3)
// let f_a := mload(2) // let f_a := mload(2)
// let f_b := _6
// let f_c := _4
// let f_x // let f_x
// { // f_x := add(f_a, f_b)
// f_x := add(f_a, f_b) // f_x := mul(f_x, f_c)
// f_x := mul(f_x, f_c) // let _10 := add(f_x, _2)
// } // let y := add(mload(1), _10)
// let y := add(mload(1), add(f_x, _1))
// } // }
// function f(a, b, c) -> x // function f(a, b, c) -> x
// { // {

View File

@ -7,21 +7,17 @@
// fullInliner // fullInliner
// { // {
// { // {
// let g_c := 7 // let _1 := 7
// let f_a_1 := 3 // let f_a := 3
// let f_x_1 // let f_x
// { // f_x := add(f_a, f_a)
// f_x_1 := add(f_a_1, f_a_1) // let g_b := f_x
// } // let g_c := _1
// let g_y // let g_y
// { // let g_f_a_1 := g_b
// let g_f_a := f_x_1 // let g_f_x_1
// let g_f_x // g_f_x_1 := add(g_f_a_1, g_f_a_1)
// { // g_y := mul(mload(g_c), g_f_x_1)
// g_f_x := add(g_f_a, g_f_a)
// }
// g_y := mul(mload(g_c), g_f_x)
// }
// let y_1 := g_y // let y_1 := g_y
// } // }
// function f(a) -> x // function f(a) -> x
@ -30,11 +26,9 @@
// } // }
// function g(b, c) -> y // function g(b, c) -> y
// { // {
// let f_a := b // let f_a_1 := b
// let f_x // let f_x_1
// { // f_x_1 := add(f_a_1, f_a_1)
// f_x := add(f_a, f_a) // y := mul(mload(c), f_x_1)
// }
// y := mul(mload(c), f_x)
// } // }
// } // }

View File

@ -1,17 +1,22 @@
// The full inliner currently does not work with
// functions returning multiple values.
{ {
function f(a) -> x, y { function f(a) -> x, y {
x := mul(a, a) x := mul(a, a)
y := add(a, x) y := add(a, x)
} }
let a, b := f(mload(0)) let r, s := f(mload(0))
mstore(r, s)
} }
// ---- // ----
// fullInliner // fullInliner
// { // {
// { // {
// let a_1, b := f(mload(0)) // let f_a := mload(0)
// let f_x
// let f_y
// f_x := mul(f_a, f_a)
// f_y := add(f_a, f_x)
// let r := f_x
// mstore(r, f_y)
// } // }
// function f(a) -> x, y // function f(a) -> x, y
// { // {

View File

@ -9,11 +9,7 @@
// { // {
// { // {
// let f_a := mload(0) // let f_a := mload(0)
// { // sstore(f_a, f_a)
// sstore(f_a, f_a)
// }
// {
// }
// } // }
// function f(a) // function f(a)
// { // {

View File

@ -0,0 +1,43 @@
{
for { let x := f(0) } f(x) { x := f(x) }
{
let t := f(x)
}
function f(a) -> r {
sstore(a, 0)
r := a
}
}
// ----
// fullInliner
// {
// {
// for {
// let f_a := 0
// let f_r
// sstore(f_a, 0)
// f_r := f_a
// let x := f_r
// }
// f(x)
// {
// let f_a_1 := x
// let f_r_1
// sstore(f_a_1, 0)
// f_r_1 := f_a_1
// x := f_r_1
// }
// {
// let f_a_2 := x
// let f_r_2
// sstore(f_a_2, 0)
// f_r_2 := f_a_2
// let t := f_r_2
// }
// }
// function f(a) -> r
// {
// sstore(a, 0)
// r := a
// }
// }

View File

@ -1,4 +1,6 @@
// This tests that `pop(r)` is removed. // An earlier version of the inliner produced
// pop(...) statements and explicitly removed them.
// This used to test that they are removed.
{ {
function f(a) -> x { function f(a) -> x {
let r := mul(a, a) let r := mul(a, a)
@ -13,12 +15,9 @@
// let _1 := 2 // let _1 := 2
// let f_a := 7 // let f_a := 7
// let f_x // let f_x
// { // let f_r := mul(f_a, f_a)
// let f_r := mul(f_a, f_a) // f_x := add(f_r, f_r)
// f_x := add(f_r, f_r) // pop(add(f_x, _1))
// }
// {
// }
// } // }
// function f(a) -> x // function f(a) -> x
// { // {

View File

@ -9,14 +9,12 @@
// fullInliner // fullInliner
// { // {
// { // {
// let _1 := mload(7) // let _2 := mload(7)
// let f_a := sload(mload(2)) // let f_a := sload(mload(2))
// let f_x // let f_x
// { // let f_r := mul(f_a, f_a)
// let f_r := mul(f_a, f_a) // f_x := add(f_r, f_r)
// f_x := add(f_r, f_r) // let y := add(f_x, _2)
// }
// let y := add(f_x, _1)
// } // }
// function f(a) -> x // function f(a) -> x
// { // {