// solidity/libyul/optimiser/DataFlowAnalyzer.h

/*
This file is part of solidity.
solidity is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
solidity is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with solidity. If not, see <http://www.gnu.org/licenses/>.
*/
// SPDX-License-Identifier: GPL-3.0
/**
* Base class to perform data flow analysis during AST walks.
* Tracks assignments and is used as base class for both Rematerialiser and
* Common Subexpression Eliminator.
*/
#pragma once
#include <libyul/optimiser/ASTWalker.h>
#include <libyul/optimiser/KnowledgeBase.h>
#include <libyul/YulString.h>
#include <libyul/AST.h> // Needed for m_zero below.
#include <libyul/SideEffects.h>

#include <libsolutil/Numeric.h>
#include <libsolutil/Common.h>

#include <cstddef>
#include <map>
#include <optional>
#include <set>
#include <unordered_map>
#include <utility>
#include <vector>

namespace solidity::yul
{
// Forward declarations of types that appear in the interfaces below.
// Dialect is only used by reference in this header, so no definition is needed for it here.
struct Dialect;
struct SideEffects;
class KnowledgeBase;

/// Describes the value that is currently assigned to a variable.
struct AssignedValue
{
	/// The assigned expression (not owned); defaults to nullptr.
	Expression const* value = nullptr;
	/// Nesting depth of loops at the point where the variable was defined.
	size_t loopDepth = 0;
};
/**
 * Base class to perform data flow analysis during AST walks.
 * Tracks assignments and is used as base class for both Rematerialiser and
 * Common Subexpression Eliminator.
 *
 * A special zero constant expression is used for the default value of variables.
 *
 * The class also tracks contents in storage and memory. Both keys and values
 * are names of variables. Whenever such a variable is re-assigned, the knowledge
 * is cleared.
 *
 * For elementary statements, we check if it is an SSTORE(x, y) / MSTORE(x, y).
 * If yes, visit the statement. Then record that fact and clear all storage slots t
 * where we cannot prove x != t or y == storage[t] (the tracked content of slot t)
 * using the current values of the variables x and t.
 * Otherwise, determine if the statement invalidates storage/memory. If yes, clear all knowledge
 * about storage/memory before visiting the statement. Then visit the statement.
 *
 * For forward-joining control flow, storage/memory information from the branches is combined.
 * If the keys or values are different or non-existent in one branch, the key is deleted.
 * This works also for memory (where addresses overlap) because one branch is always an
 * older version of the other and thus overlapping contents would have been deleted already
 * at the point of assignment.
 *
 * The DataFlowAnalyzer currently does not deal with the ``leave`` statement. This is because
 * it only matters at the end of a function body, which is a point in the code a derived class
 * cannot easily deal with.
 *
 * Prerequisite: Disambiguator, ForLoopInitRewriter.
 */
class DataFlowAnalyzer: public ASTModifier
{
public:
enum class MemoryAndStorage { Analyze, Ignore };
/// @param _functionSideEffects
/// Side-effects of user-defined functions. Worst-case side-effects are assumed
/// if this is not provided or the function is not found.
/// The parameter is mostly used to determine movability of expressions.
explicit DataFlowAnalyzer(
Dialect const& _dialect,
MemoryAndStorage _analyzeStores,
std::map<YulString, SideEffects> _functionSideEffects = {}
);
2018-12-20 17:55:32 +00:00
using ASTModifier::operator();
2019-05-21 13:52:15 +00:00
void operator()(ExpressionStatement& _statement) override;
void operator()(Assignment& _assignment) override;
void operator()(VariableDeclaration& _varDecl) override;
void operator()(If& _if) override;
void operator()(Switch& _switch) override;
void operator()(FunctionDefinition&) override;
void operator()(ForLoop&) override;
void operator()(Block& _block) override;
/// @returns the current value of the given variable, if known - always movable.
2022-03-10 18:35:58 +00:00
AssignedValue const* variableValue(YulString _variable) const { return util::valueOrNullptr(m_state.value, _variable); }
std::set<YulString> const* references(YulString _variable) const { return util::valueOrNullptr(m_state.references, _variable); }
std::map<YulString, AssignedValue> const& allValues() const { return m_state.value; }
std::optional<YulString> storageValue(YulString _key) const;
std::optional<YulString> memoryValue(YulString _key) const;
std::optional<YulString> keccakValue(YulString _start, YulString _length) const;
protected:
/// Registers the assignment.
2020-11-26 17:07:12 +00:00
void handleAssignment(std::set<YulString> const& _names, Expression* _value, bool _isDeclaration);
/// Creates a new inner scope.
void pushScope(bool _functionScope);
/// Removes the innermost scope and clears all variables in it.
void popScope();
/// Clears information about the values assigned to the given variables,
/// for example at points where control flow is merged.
void clearValues(std::set<YulString> _names);
2022-11-07 15:13:05 +00:00
virtual void assignValue(YulString _variable, Expression const* _value);
2019-11-27 09:44:40 +00:00
2019-05-27 22:14:01 +00:00
/// Clears knowledge about storage or memory if they may be modified inside the block.
void clearKnowledgeIfInvalidated(Block const& _block);
/// Clears knowledge about storage or memory if they may be modified inside the expression.
void clearKnowledgeIfInvalidated(Expression const& _expression);
2019-05-21 13:52:15 +00:00
/// Returns true iff the variable is in scope.
bool inScope(YulString _variableName) const;
/// Returns the literal value of the identifier, if it exists.
std::optional<u256> valueOfIdentifier(YulString const& _name) const;
enum class StoreLoadLocation {
Memory = 0,
Storage = 1,
Last = Storage
};
/// Checks if the statement is sstore(a, b) / mstore(a, b)
/// where a and b are variables and returns these variables in that case.
std::optional<std::pair<YulString, YulString>> isSimpleStore(
StoreLoadLocation _location,
2019-05-27 22:14:01 +00:00
ExpressionStatement const& _statement
) const;
2019-05-21 13:52:15 +00:00
/// Checks if the expression is sload(a) / mload(a)
/// where a is a variable and returns the variable in that case.
std::optional<YulString> isSimpleLoad(
StoreLoadLocation _location,
Expression const& _expression
) const;
/// Checks if the expression is keccak256(s, l)
/// where s and l are variables and returns these variables in that case.
std::optional<std::pair<YulString, YulString>> isKeccak(Expression const& _expression) const;
2019-05-21 13:52:15 +00:00
Dialect const& m_dialect;
/// Side-effects of user-defined functions. Worst-case side-effects are assumed
/// if this is not provided or the function is not found.
std::map<YulString, SideEffects> m_functionSideEffects;
2019-05-21 13:52:15 +00:00
2022-03-10 18:35:58 +00:00
private:
2022-03-17 18:04:00 +00:00
struct Environment
{
std::unordered_map<YulString, YulString> storage;
std::unordered_map<YulString, YulString> memory;
/// If keccak[s, l] = y then y := keccak256(s, l) occurs in the code.
std::map<std::pair<YulString, YulString>, YulString> keccak;
2022-03-17 18:04:00 +00:00
};
2022-03-10 18:35:58 +00:00
struct State
{
/// Current values of variables, always movable.
std::map<YulString, AssignedValue> value;
/// m_references[a].contains(b) <=> the current expression assigned to a references b
std::unordered_map<YulString, std::set<YulString>> references;
2018-02-05 17:02:32 +00:00
2022-03-17 18:04:00 +00:00
Environment environment;
2022-03-10 18:35:58 +00:00
};
2022-03-17 18:04:00 +00:00
/// Joins knowledge about storage and memory with an older point in the control-flow.
/// This only works if the current state is a direct successor of the older point,
/// i.e. `_olderState.storage` and `_olderState.memory` cannot have additional changes.
/// Does nothing if memory and storage analysis is disabled / ignored.
void joinKnowledge(Environment const& _olderEnvironment);
static void joinKnowledgeHelper(
std::unordered_map<YulString, YulString>& _thisData,
std::unordered_map<YulString, YulString> const& _olderData
);
2022-03-10 18:35:58 +00:00
State m_state;
2019-05-21 13:52:15 +00:00
2022-03-10 18:35:58 +00:00
protected:
2019-05-21 13:52:15 +00:00
KnowledgeBase m_knowledgeBase;
/// If true, analyzes memory and storage content via mload/mstore and sload/sstore.
bool m_analyzeStores = true;
YulString m_storeFunctionName[static_cast<unsigned>(StoreLoadLocation::Last) + 1];
YulString m_loadFunctionName[static_cast<unsigned>(StoreLoadLocation::Last) + 1];
2019-11-27 09:44:40 +00:00
/// Current nesting depth of loops.
size_t m_loopDepth{0};
2018-02-05 17:02:32 +00:00
struct Scope
{
explicit Scope(bool _isFunction): isFunction(_isFunction) {}
std::set<YulString> variables;
2018-02-05 17:02:32 +00:00
bool isFunction;
};
/// Special expression whose address will be used in m_value.
/// YulString does not need to be reset because DataFlowAnalyzer is short-lived.
Expression const m_zero{Literal{{}, LiteralKind::Number, YulString{"0"}, {}}};
2018-02-05 17:02:32 +00:00
/// List of scopes.
std::vector<Scope> m_variableScopes;
};
}