/* This file is part of solidity. solidity is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. solidity is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with solidity. If not, see . */ /** * Base class to perform data flow analysis during AST walks. * Tracks assignments and is used as base class for both Rematerialiser and * Common Subexpression Eliminator. */ #pragma once #include #include #include #include #include // TODO avoid #include #include #include #include namespace solidity::yul { struct Dialect; struct SideEffects; /** * Base class to perform data flow analysis during AST walks. * Tracks assignments and is used as base class for both Rematerialiser and * Common Subexpression Eliminator. * * A special zero constant expression is used for the default value of variables. * * The class also tracks contents in storage and memory. Both keys and values * are names of variables. Whenever such a variable is re-assigned, the knowledge * is cleared. * * For elementary statements, we check if it is an SSTORE(x, y) / MSTORE(x, y) * If yes, visit the statement. Then record that fact and clear all storage slots t * where we cannot prove x != t or y == m_storage[t] using the current values of the variables x and t. * Otherwise, determine if the statement invalidates storage/memory. If yes, clear all knowledge * about storage/memory before visiting the statement. Then visit the statement. * * For forward-joining control flow, storage/memory information from the branches is combined. * If the keys or values are different or non-existent in one branch, the key is deleted. * This works also for memory (where addresses overlap) because one branch is always an * older version of the other and thus overlapping contents would have been deleted already * at the point of assignment. * * The DataFlowAnalyzer currently does not deal with the ``leave`` statement. This is because * it only matters at the end of a function body, which is a point in the code a derived class * can not easily deal with. * * Prerequisite: Disambiguator, ForLoopInitRewriter. */ class DataFlowAnalyzer: public ASTModifier { public: /// @param _functionSideEffects /// Side-effects of user-defined functions. Worst-case side-effects are assumed /// if this is not provided or the function is not found. /// The parameter is mostly used to determine movability of expressions. explicit DataFlowAnalyzer( Dialect const& _dialect, std::map _functionSideEffects = {} ): m_dialect(_dialect), m_functionSideEffects(std::move(_functionSideEffects)), m_knowledgeBase(_dialect, m_value) {} using ASTModifier::operator(); void operator()(ExpressionStatement& _statement) override; void operator()(Assignment& _assignment) override; void operator()(VariableDeclaration& _varDecl) override; void operator()(If& _if) override; void operator()(Switch& _switch) override; void operator()(FunctionDefinition&) override; void operator()(ForLoop&) override; void operator()(Block& _block) override; protected: /// Registers the assignment. void handleAssignment(std::set const& _names, Expression* _value); /// Creates a new inner scope. void pushScope(bool _functionScope); /// Removes the innermost scope and clears all variables in it. void popScope(); /// Clears information about the values assigned to the given variables, /// for example at points where control flow is merged. void clearValues(std::set _names); void assignValue(YulString _variable, Expression const* _value); /// Clears knowledge about storage or memory if they may be modified inside the block. void clearKnowledgeIfInvalidated(Block const& _block); /// Clears knowledge about storage or memory if they may be modified inside the expression. void clearKnowledgeIfInvalidated(Expression const& _expression); /// Joins knowledge about storage and memory with an older point in the control-flow. /// This only works if the current state is a direct successor of the older point, /// i.e. `_otherStorage` and `_otherMemory` cannot have additional changes. void joinKnowledge( InvertibleMap const& _olderStorage, InvertibleMap const& _olderMemory ); static void joinKnowledgeHelper( InvertibleMap& _thisData, InvertibleMap const& _olderData ); /// Returns true iff the variable is in scope. bool inScope(YulString _variableName) const; std::optional> isSimpleStore( evmasm::Instruction _store, ExpressionStatement const& _statement ) const; Dialect const& m_dialect; /// Side-effects of user-defined functions. Worst-case side-effects are assumed /// if this is not provided or the function is not found. std::map m_functionSideEffects; /// Current values of variables, always movable. std::map m_value; /// The loop nesting depth of the definition of variables (those used in m_value). std::map m_variableLoopDepth; /// m_references.forward[a].contains(b) <=> the current expression assigned to a references b /// m_references.backward[b].contains(a) <=> the current expression assigned to a references b InvertibleRelation m_references; InvertibleMap m_storage; InvertibleMap m_memory; KnowledgeBase m_knowledgeBase; /// Current nesting depth of loops. size_t m_loopDepth{0}; struct Scope { explicit Scope(bool _isFunction): isFunction(_isFunction) {} std::set variables; bool isFunction; }; /// Special expression whose address will be used in m_value. /// YulString does not need to be reset because DataFlowAnalyzer is short-lived. Expression const m_zero{Literal{{}, LiteralKind::Number, YulString{"0"}, {}}}; /// List of scopes. std::vector m_variableScopes; }; }