mirror of
				https://github.com/ethereum/solidity
				synced 2023-10-03 13:03:40 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			183 lines
		
	
	
		
			6.6 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			183 lines
		
	
	
		
			6.6 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
| 	This file is part of solidity.
 | |
| 
 | |
| 	solidity is free software: you can redistribute it and/or modify
 | |
| 	it under the terms of the GNU General Public License as published by
 | |
| 	the Free Software Foundation, either version 3 of the License, or
 | |
| 	(at your option) any later version.
 | |
| 
 | |
| 	solidity is distributed in the hope that it will be useful,
 | |
| 	but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
| 	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
| 	GNU General Public License for more details.
 | |
| 
 | |
| 	You should have received a copy of the GNU General Public License
 | |
| 	along with solidity.  If not, see <http://www.gnu.org/licenses/>.
 | |
| */
 | |
| /**
 | |
|  * Base class to perform data flow analysis during AST walks.
 | |
|  * Tracks assignments and is used as base class for both Rematerialiser and
 | |
|  * Common Subexpression Eliminator.
 | |
|  */
 | |
| 
 | |
| #pragma once
 | |
| 
 | |
| #include <libyul/optimiser/ASTWalker.h>
 | |
| #include <libyul/optimiser/KnowledgeBase.h>
 | |
| #include <libyul/YulString.h>
 | |
| #include <libyul/AsmData.h>
 | |
| #include <libyul/SideEffects.h>
 | |
| 
 | |
| // TODO avoid
 | |
| #include <libevmasm/Instruction.h>
 | |
| 
 | |
| #include <libsolutil/InvertibleMap.h>
 | |
| 
 | |
| #include <map>
 | |
| #include <set>
 | |
| 
 | |
| namespace solidity::yul
 | |
| {
 | |
| struct Dialect;
 | |
| struct SideEffects;
 | |
| 
 | |
| /// Value assigned to a variable.
 | |
| struct AssignedValue
 | |
| {
 | |
| 	Expression const* value{nullptr};
 | |
| 	/// Loop nesting depth of the definition of the variable.
 | |
| 	size_t loopDepth{0};
 | |
| };
 | |
| 
 | |
| /**
 | |
|  * Base class to perform data flow analysis during AST walks.
 | |
|  * Tracks assignments and is used as base class for both Rematerialiser and
 | |
|  * Common Subexpression Eliminator.
 | |
|  *
 | |
|  * A special zero constant expression is used for the default value of variables.
 | |
|  *
 | |
|  * The class also tracks contents in storage and memory. Both keys and values
 | |
|  * are names of variables. Whenever such a variable is re-assigned, the knowledge
 | |
|  * is cleared.
 | |
|  *
 | |
|  * For elementary statements, we check if it is an SSTORE(x, y) / MSTORE(x, y)
 | |
|  * If yes, visit the statement. Then record that fact and clear all storage slots t
 | |
|  *   where we cannot prove x != t or y == m_storage[t] using the current values of the variables x and t.
 | |
|  * Otherwise, determine if the statement invalidates storage/memory. If yes, clear all knowledge
 | |
|  * about storage/memory before visiting the statement. Then visit the statement.
 | |
|  *
 | |
|  * For forward-joining control flow, storage/memory information from the branches is combined.
 | |
|  * If the keys or values are different or non-existent in one branch, the key is deleted.
 | |
|  * This works also for memory (where addresses overlap) because one branch is always an
 | |
|  * older version of the other and thus overlapping contents would have been deleted already
 | |
|  * at the point of assignment.
 | |
|  *
 | |
|  * The DataFlowAnalyzer currently does not deal with the ``leave`` statement. This is because
 | |
|  * it only matters at the end of a function body, which is a point in the code a derived class
 | |
|  * can not easily deal with.
 | |
|  *
 | |
|  * Prerequisite: Disambiguator, ForLoopInitRewriter.
 | |
|  */
 | |
| class DataFlowAnalyzer: public ASTModifier
 | |
| {
 | |
| public:
 | |
| 	/// @param _functionSideEffects
 | |
| 	///            Side-effects of user-defined functions. Worst-case side-effects are assumed
 | |
| 	///            if this is not provided or the function is not found.
 | |
| 	///            The parameter is mostly used to determine movability of expressions.
 | |
| 	explicit DataFlowAnalyzer(
 | |
| 		Dialect const& _dialect,
 | |
| 		std::map<YulString, SideEffects> _functionSideEffects = {}
 | |
| 	):
 | |
| 		m_dialect(_dialect),
 | |
| 		m_functionSideEffects(std::move(_functionSideEffects)),
 | |
| 		m_knowledgeBase(_dialect, m_value)
 | |
| 	{}
 | |
| 
 | |
| 	using ASTModifier::operator();
 | |
| 	void operator()(ExpressionStatement& _statement) override;
 | |
| 	void operator()(Assignment& _assignment) override;
 | |
| 	void operator()(VariableDeclaration& _varDecl) override;
 | |
| 	void operator()(If& _if) override;
 | |
| 	void operator()(Switch& _switch) override;
 | |
| 	void operator()(FunctionDefinition&) override;
 | |
| 	void operator()(ForLoop&) override;
 | |
| 	void operator()(Block& _block) override;
 | |
| 
 | |
| protected:
 | |
| 	/// Registers the assignment.
 | |
| 	void handleAssignment(std::set<YulString> const& _names, Expression* _value);
 | |
| 
 | |
| 	/// Creates a new inner scope.
 | |
| 	void pushScope(bool _functionScope);
 | |
| 
 | |
| 	/// Removes the innermost scope and clears all variables in it.
 | |
| 	void popScope();
 | |
| 
 | |
| 	/// Clears information about the values assigned to the given variables,
 | |
| 	/// for example at points where control flow is merged.
 | |
| 	void clearValues(std::set<YulString> _names);
 | |
| 
 | |
| 	void assignValue(YulString _variable, Expression const* _value);
 | |
| 
 | |
| 	/// Clears knowledge about storage or memory if they may be modified inside the block.
 | |
| 	void clearKnowledgeIfInvalidated(Block const& _block);
 | |
| 
 | |
| 	/// Clears knowledge about storage or memory if they may be modified inside the expression.
 | |
| 	void clearKnowledgeIfInvalidated(Expression const& _expression);
 | |
| 
 | |
| 	/// Joins knowledge about storage and memory with an older point in the control-flow.
 | |
| 	/// This only works if the current state is a direct successor of the older point,
 | |
| 	/// i.e. `_otherStorage` and `_otherMemory` cannot have additional changes.
 | |
| 	void joinKnowledge(
 | |
| 		InvertibleMap<YulString, YulString> const& _olderStorage,
 | |
| 		InvertibleMap<YulString, YulString> const& _olderMemory
 | |
| 	);
 | |
| 
 | |
| 	static void joinKnowledgeHelper(
 | |
| 		InvertibleMap<YulString, YulString>& _thisData,
 | |
| 		InvertibleMap<YulString, YulString> const& _olderData
 | |
| 	);
 | |
| 
 | |
| 	/// Returns true iff the variable is in scope.
 | |
| 	bool inScope(YulString _variableName) const;
 | |
| 
 | |
| 	std::optional<std::pair<YulString, YulString>> isSimpleStore(
 | |
| 		evmasm::Instruction _store,
 | |
| 		ExpressionStatement const& _statement
 | |
| 	) const;
 | |
| 
 | |
| 	Dialect const& m_dialect;
 | |
| 	/// Side-effects of user-defined functions. Worst-case side-effects are assumed
 | |
| 	/// if this is not provided or the function is not found.
 | |
| 	std::map<YulString, SideEffects> m_functionSideEffects;
 | |
| 
 | |
| 	/// Current values of variables, always movable.
 | |
| 	std::map<YulString, AssignedValue> m_value;
 | |
| 	/// m_references.forward[a].contains(b) <=> the current expression assigned to a references b
 | |
| 	/// m_references.backward[b].contains(a) <=> the current expression assigned to a references b
 | |
| 	InvertibleRelation<YulString> m_references;
 | |
| 
 | |
| 	InvertibleMap<YulString, YulString> m_storage;
 | |
| 	InvertibleMap<YulString, YulString> m_memory;
 | |
| 
 | |
| 	KnowledgeBase m_knowledgeBase;
 | |
| 
 | |
| 	/// Current nesting depth of loops.
 | |
| 	size_t m_loopDepth{0};
 | |
| 
 | |
| 	struct Scope
 | |
| 	{
 | |
| 		explicit Scope(bool _isFunction): isFunction(_isFunction) {}
 | |
| 		std::set<YulString> variables;
 | |
| 		bool isFunction;
 | |
| 	};
 | |
| 	/// Special expression whose address will be used in m_value.
 | |
| 	/// YulString does not need to be reset because DataFlowAnalyzer is short-lived.
 | |
| 	Expression const m_zero{Literal{{}, LiteralKind::Number, YulString{"0"}, {}}};
 | |
| 	/// List of scopes.
 | |
| 	std::vector<Scope> m_variableScopes;
 | |
| };
 | |
| 
 | |
| }
 |