mirror of
				https://github.com/ethereum/solidity
				synced 2023-10-03 13:03:40 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			393 lines
		
	
	
		
			15 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
			
		
		
	
	
			393 lines
		
	
	
		
			15 KiB
		
	
	
	
		
			C++
		
	
	
	
	
	
| /*
 | |
| 	This file is part of solidity.
 | |
| 
 | |
| 	solidity is free software: you can redistribute it and/or modify
 | |
| 	it under the terms of the GNU General Public License as published by
 | |
| 	the Free Software Foundation, either version 3 of the License, or
 | |
| 	(at your option) any later version.
 | |
| 
 | |
| 	solidity is distributed in the hope that it will be useful,
 | |
| 	but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
| 	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
| 	GNU General Public License for more details.
 | |
| 
 | |
| 	You should have received a copy of the GNU General Public License
 | |
| 	along with solidity.  If not, see <http://www.gnu.org/licenses/>.
 | |
| */
 | |
| // SPDX-License-Identifier: GPL-3.0
 | |
| #include <libsolidity/interface/FileReader.h>
 | |
| 
 | |
| #include <liblangutil/Exceptions.h>
 | |
| 
 | |
| #include <libsolutil/CommonIO.h>
 | |
| #include <libsolutil/Exceptions.h>
 | |
| #include <libsolutil/StringUtils.h>
 | |
| 
 | |
| #include <boost/algorithm/string/predicate.hpp>
 | |
| #include <range/v3/view/transform.hpp>
 | |
| 
 | |
| #include <range/v3/range/conversion.hpp>
 | |
| 
 | |
| #include <functional>
 | |
| 
 | |
| using solidity::frontend::ReadCallback;
 | |
| using solidity::langutil::InternalCompilerError;
 | |
| using solidity::util::errinfo_comment;
 | |
| using solidity::util::readFileAsString;
 | |
| using solidity::util::joinHumanReadable;
 | |
| 
 | |
| namespace solidity::frontend
 | |
| {
 | |
| 
 | |
| FileReader::FileReader(
 | |
| 	boost::filesystem::path _basePath,
 | |
| 	std::vector<boost::filesystem::path> const& _includePaths,
 | |
| 	FileSystemPathSet _allowedDirectories
 | |
| ):
 | |
| 	m_allowedDirectories(std::move(_allowedDirectories)),
 | |
| 	m_sourceCodes()
 | |
| {
 | |
| 	setBasePath(_basePath);
 | |
| 	for (boost::filesystem::path const& includePath: _includePaths)
 | |
| 		addIncludePath(includePath);
 | |
| 
 | |
| 	for (boost::filesystem::path const& allowedDir: m_allowedDirectories)
 | |
| 		solAssert(!allowedDir.empty(), "");
 | |
| }
 | |
| 
 | |
| void FileReader::setBasePath(boost::filesystem::path const& _path)
 | |
| {
 | |
| 	if (_path.empty())
 | |
| 	{
 | |
| 		// Empty base path is a special case that does not make sense when include paths are used.
 | |
| 		solAssert(m_includePaths.empty(), "");
 | |
| 		m_basePath = "";
 | |
| 	}
 | |
| 	else
 | |
| 		m_basePath = normalizeCLIPathForVFS(_path);
 | |
| }
 | |
| 
 | |
| void FileReader::addIncludePath(boost::filesystem::path const& _path)
 | |
| {
 | |
| 	solAssert(!m_basePath.empty(), "");
 | |
| 	solAssert(!_path.empty(), "");
 | |
| 	m_includePaths.push_back(normalizeCLIPathForVFS(_path));
 | |
| }
 | |
| 
 | |
| void FileReader::allowDirectory(boost::filesystem::path _path)
 | |
| {
 | |
| 	solAssert(!_path.empty(), "");
 | |
| 	m_allowedDirectories.insert(std::move(_path));
 | |
| }
 | |
| 
 | |
| void FileReader::addOrUpdateFile(boost::filesystem::path const& _path, SourceCode _source)
 | |
| {
 | |
| 	m_sourceCodes[cliPathToSourceUnitName(_path)] = std::move(_source);
 | |
| }
 | |
| 
 | |
| void FileReader::setStdin(SourceCode _source)
 | |
| {
 | |
| 	m_sourceCodes["<stdin>"] = std::move(_source);
 | |
| }
 | |
| 
 | |
| void FileReader::setSourceUnits(StringMap _sources)
 | |
| {
 | |
| 	m_sourceCodes = std::move(_sources);
 | |
| }
 | |
| 
 | |
| ReadCallback::Result FileReader::readFile(std::string const& _kind, std::string const& _sourceUnitName)
 | |
| {
 | |
| 	try
 | |
| 	{
 | |
| 		if (_kind != ReadCallback::kindString(ReadCallback::Kind::ReadFile))
 | |
| 			solAssert(false, "ReadFile callback used as callback kind " + _kind);
 | |
| 		std::string strippedSourceUnitName = _sourceUnitName;
 | |
| 		if (strippedSourceUnitName.find("file://") == 0)
 | |
| 			strippedSourceUnitName.erase(0, 7);
 | |
| 
 | |
| 		std::vector<boost::filesystem::path> candidates;
 | |
| 		std::vector<std::reference_wrapper<boost::filesystem::path>> prefixes = {m_basePath};
 | |
| 		prefixes += (m_includePaths | ranges::to<std::vector<std::reference_wrapper<boost::filesystem::path>>>);
 | |
| 
 | |
| 		for (auto const& prefix: prefixes)
 | |
| 		{
 | |
| 			boost::filesystem::path canonicalPath = normalizeCLIPathForVFS(prefix / strippedSourceUnitName, SymlinkResolution::Enabled);
 | |
| 			if (boost::filesystem::exists(canonicalPath))
 | |
| 				candidates.push_back(std::move(canonicalPath));
 | |
| 		}
 | |
| 
 | |
| 		auto pathToQuotedString = [](boost::filesystem::path const& _path){ return "\"" + _path.string() + "\""; };
 | |
| 
 | |
| 		if (candidates.empty())
 | |
| 			return ReadCallback::Result{
 | |
| 				false,
 | |
| 				"File not found. Searched the following locations: " +
 | |
| 				joinHumanReadable(prefixes | ranges::views::transform(pathToQuotedString), ", ") +
 | |
| 				"."
 | |
| 			};
 | |
| 
 | |
| 		if (candidates.size() >= 2)
 | |
| 			return ReadCallback::Result{
 | |
| 				false,
 | |
| 				"Ambiguous import. "
 | |
| 				"Multiple matching files found inside base path and/or include paths: " +
 | |
| 				joinHumanReadable(candidates | ranges::views::transform(pathToQuotedString), ", ") +
 | |
| 				"."
 | |
| 			};
 | |
| 
 | |
| 		FileSystemPathSet allowedPaths =
 | |
| 			m_allowedDirectories +
 | |
| 			decltype(allowedPaths){m_basePath.empty() ? "." : m_basePath} +
 | |
| 			m_includePaths;
 | |
| 
 | |
| 		bool isAllowed = false;
 | |
| 		for (boost::filesystem::path const& allowedDir: allowedPaths)
 | |
| 			if (isPathPrefix(normalizeCLIPathForVFS(allowedDir, SymlinkResolution::Enabled), candidates[0]))
 | |
| 			{
 | |
| 				isAllowed = true;
 | |
| 				break;
 | |
| 			}
 | |
| 
 | |
| 		if (!isAllowed)
 | |
| 			return ReadCallback::Result{
 | |
| 				false,
 | |
| 				"File outside of allowed directories. The following are allowed: " +
 | |
| 				joinHumanReadable(allowedPaths | ranges::views::transform(pathToQuotedString), ", ") +
 | |
| 				"."
 | |
| 			};
 | |
| 
 | |
| 		if (!boost::filesystem::is_regular_file(candidates[0]))
 | |
| 			return ReadCallback::Result{false, "Not a valid file."};
 | |
| 
 | |
| 		// NOTE: we ignore the FileNotFound exception as we manually check above
 | |
| 		auto contents = readFileAsString(candidates[0]);
 | |
| 		solAssert(m_sourceCodes.count(_sourceUnitName) == 0, "");
 | |
| 		m_sourceCodes[_sourceUnitName] = contents;
 | |
| 		return ReadCallback::Result{true, contents};
 | |
| 	}
 | |
| 	catch (util::Exception const& _exception)
 | |
| 	{
 | |
| 		return ReadCallback::Result{false, "Exception in read callback: " + boost::diagnostic_information(_exception)};
 | |
| 	}
 | |
| 	catch (std::exception const& _exception)
 | |
| 	{
 | |
| 		return ReadCallback::Result{false, "Exception in read callback: " + boost::diagnostic_information(_exception)};
 | |
| 	}
 | |
| 	catch (...)
 | |
| 	{
 | |
| 		return ReadCallback::Result{false, "Unknown exception in read callback: " + boost::current_exception_diagnostic_information()};
 | |
| 	}
 | |
| }
 | |
| 
 | |
| std::string FileReader::cliPathToSourceUnitName(boost::filesystem::path const& _cliPath) const
 | |
| {
 | |
| 	std::vector<boost::filesystem::path> prefixes = {m_basePath.empty() ? normalizeCLIPathForVFS(".") : m_basePath};
 | |
| 	prefixes += m_includePaths;
 | |
| 
 | |
| 	boost::filesystem::path normalizedPath = normalizeCLIPathForVFS(_cliPath);
 | |
| 	for (boost::filesystem::path const& prefix: prefixes)
 | |
| 		if (isPathPrefix(prefix, normalizedPath))
 | |
| 		{
 | |
| 			// Multiple prefixes can potentially match the path. We take the first one.
 | |
| 			normalizedPath = stripPrefixIfPresent(prefix, normalizedPath);
 | |
| 			break;
 | |
| 		}
 | |
| 
 | |
| 	return normalizedPath.generic_string();
 | |
| }
 | |
| 
 | |
| std::map<std::string, FileReader::FileSystemPathSet> FileReader::detectSourceUnitNameCollisions(FileSystemPathSet const& _cliPaths) const
 | |
| {
 | |
| 	std::map<std::string, FileReader::FileSystemPathSet> nameToPaths;
 | |
| 	for (boost::filesystem::path const& cliPath: _cliPaths)
 | |
| 	{
 | |
| 		std::string sourceUnitName = cliPathToSourceUnitName(cliPath);
 | |
| 		boost::filesystem::path normalizedPath = normalizeCLIPathForVFS(cliPath);
 | |
| 		nameToPaths[sourceUnitName].insert(normalizedPath);
 | |
| 	}
 | |
| 
 | |
| 	std::map<std::string, FileReader::FileSystemPathSet> collisions;
 | |
| 	for (auto&& [sourceUnitName, cliPaths]: nameToPaths)
 | |
| 		if (cliPaths.size() >= 2)
 | |
| 			collisions[sourceUnitName] = std::move(cliPaths);
 | |
| 
 | |
| 	return collisions;
 | |
| }
 | |
| 
 | |
| boost::filesystem::path FileReader::normalizeCLIPathForVFS(
 | |
| 	boost::filesystem::path const& _path,
 | |
| 	SymlinkResolution _symlinkResolution
 | |
| )
 | |
| {
 | |
| 	// Detailed normalization rules:
 | |
| 	// - Makes the path either be absolute or have slash as root (note that on Windows paths with
 | |
| 	//   slash as root are not considered absolute by Boost). If it is empty, it becomes
 | |
| 	//   the current working directory.
 | |
| 	// - Collapses redundant . and .. segments.
 | |
| 	// - Removes leading .. segments from an absolute path (i.e. /../../ becomes just /).
 | |
| 	// - Squashes sequences of multiple path separators into one.
 | |
| 	// - Ensures that forward slashes are used as path separators on all platforms.
 | |
| 	// - Removes the root name (e.g. drive letter on Windows) when it matches the root name in the
 | |
| 	//   path to the current working directory.
 | |
| 	//
 | |
| 	// Also note that this function:
 | |
| 	// - Does NOT resolve symlinks (except for symlinks in the path to the current working directory)
 | |
| 	//   unless explicitly requested.
 | |
| 	// - Does NOT check if the path refers to a file or a directory. If the path ends with a slash,
 | |
| 	//   the slash is preserved even if it's a file.
 | |
| 	//   - The only exception are paths where the file name is a dot (e.g. '.' or 'a/b/.'). These
 | |
| 	//     always have a trailing slash after normalization.
 | |
| 	// - Preserves case. Even if the filesystem is case-insensitive but case-preserving and the
 | |
| 	//   case differs, the actual case from disk is NOT detected.
 | |
| 
 | |
| 	boost::filesystem::path canonicalWorkDir = boost::filesystem::weakly_canonical(boost::filesystem::current_path());
 | |
| 
 | |
| 	// NOTE: On UNIX systems the path returned from current_path() has symlinks resolved while on
 | |
| 	// Windows it does not. To get consistent results we resolve them on all platforms.
 | |
| 	boost::filesystem::path absolutePath = boost::filesystem::absolute(_path, canonicalWorkDir);
 | |
| 
 | |
| 	boost::filesystem::path normalizedPath;
 | |
| 	if (_symlinkResolution == SymlinkResolution::Enabled)
 | |
| 	{
 | |
| 		// NOTE: weakly_canonical() will not convert a relative path into an absolute one if no
 | |
| 		// directory included in the path actually exists.
 | |
| 		normalizedPath = boost::filesystem::weakly_canonical(absolutePath);
 | |
| 
 | |
| 		// The three corner cases in which lexically_normal() includes a trailing slash in the
 | |
| 		// normalized path but weakly_canonical() does not. Note that the trailing slash is not
 | |
| 		// ignored when comparing paths with ==.
 | |
| 		if ((_path == "." || _path == "./" || _path == "../") && !boost::ends_with(normalizedPath.generic_string(), "/"))
 | |
| 			normalizedPath = normalizedPath.parent_path() / (normalizedPath.filename().string() + "/");
 | |
| 	}
 | |
| 	else
 | |
| 	{
 | |
| 		solAssert(_symlinkResolution == SymlinkResolution::Disabled, "");
 | |
| 
 | |
| 		// NOTE: boost path preserves certain differences that are ignored by its operator ==.
 | |
| 		// E.g. "a//b" vs "a/b" or "a/b/" vs "a/b/.". lexically_normal() does remove these differences.
 | |
| 		normalizedPath = absolutePath.lexically_normal();
 | |
| 	}
 | |
| 	solAssert(normalizedPath.is_absolute() || normalizedPath.root_path() == "/", "");
 | |
| 
 | |
| 	// If the path is on the same drive as the working dir, for portability we prefer not to
 | |
| 	// include the root name. Do this only for non-UNC paths - my experiments show that on Windows
 | |
| 	// when the working dir is an UNC path, / does not not actually refer to the root of the UNC path.
 | |
| 
 | |
| 	boost::filesystem::path normalizedRootPath = normalizeCLIRootPathForVFS(normalizedPath, canonicalWorkDir);
 | |
| 
 | |
| 	// lexically_normal() will not squash paths like "/../../" into "/". We have to do it manually.
 | |
| 	boost::filesystem::path dotDotPrefix = absoluteDotDotPrefix(normalizedPath);
 | |
| 
 | |
| 	boost::filesystem::path normalizedPathNoDotDot = normalizedPath;
 | |
| 	if (dotDotPrefix.empty())
 | |
| 		normalizedPathNoDotDot = normalizedRootPath / normalizedPath.relative_path();
 | |
| 	else
 | |
| 		normalizedPathNoDotDot = normalizedRootPath / normalizedPath.lexically_relative(normalizedPath.root_path() / dotDotPrefix);
 | |
| 	solAssert(!hasDotDotSegments(normalizedPathNoDotDot), "");
 | |
| 
 | |
| 	// NOTE: On Windows lexically_normal() converts all separators to forward slashes. Convert them back.
 | |
| 	// Separators do not affect path comparison but remain in internal representation returned by native().
 | |
| 	// This will also normalize the root name to start with // in UNC paths.
 | |
| 	normalizedPathNoDotDot = normalizedPathNoDotDot.generic_string();
 | |
| 
 | |
| 	// For some reason boost considers "/." different than "/" even though for other directories
 | |
| 	// the trailing dot is ignored.
 | |
| 	if (normalizedPathNoDotDot == "/.")
 | |
| 		return "/";
 | |
| 
 | |
| 	return normalizedPathNoDotDot;
 | |
| }
 | |
| 
 | |
| boost::filesystem::path FileReader::normalizeCLIRootPathForVFS(
 | |
| 	boost::filesystem::path const& _path,
 | |
| 	boost::filesystem::path const& _workDir
 | |
| )
 | |
| {
 | |
| 	solAssert(_workDir.is_absolute(), "");
 | |
| 
 | |
| 	boost::filesystem::path absolutePath = boost::filesystem::absolute(_path, _workDir);
 | |
| 	boost::filesystem::path rootPath = absolutePath.root_path();
 | |
| 	boost::filesystem::path baseRootPath = _workDir.root_path();
 | |
| 
 | |
| 	if (isUNCPath(absolutePath))
 | |
| 		return rootPath;
 | |
| 
 | |
| 	// Ignore drive letter case on Windows (C:\ <=> c:\).
 | |
| 	if (boost::filesystem::equivalent(rootPath, baseRootPath))
 | |
| 		return "/";
 | |
| 
 | |
| 	return rootPath;
 | |
| }
 | |
| 
 | |
| bool FileReader::isPathPrefix(boost::filesystem::path const& _prefix, boost::filesystem::path const& _path)
 | |
| {
 | |
| 	solAssert(!_prefix.empty() && !_path.empty(), "");
 | |
| 	// NOTE: On Windows paths starting with a slash (rather than a drive letter) are considered relative by boost.
 | |
| 	solAssert(_prefix.is_absolute() || isUNCPath(_prefix) || _prefix.root_path() == "/", "");
 | |
| 	solAssert(_path.is_absolute() || isUNCPath(_path) || _path.root_path() == "/", "");
 | |
| 	// NOTE: On Windows before Boost 1.78 lexically_normal() would not replace the `//` UNC prefix with `\\\\`.
 | |
| 	// Later versions do. Use generic_path() to normalize all slashes to `/` and ignore that difference.
 | |
| 	// This does not make the assert weaker because == ignores slash type anyway.
 | |
| 	solAssert(_prefix == _prefix.lexically_normal().generic_string() && _path == _path.lexically_normal().generic_string(), "");
 | |
| 	solAssert(!hasDotDotSegments(_prefix) && !hasDotDotSegments(_path), "");
 | |
| 
 | |
| 	boost::filesystem::path strippedPath = _path.lexically_relative(
 | |
| 		// Before 1.72.0 lexically_relative() was not handling paths with empty, dot and dot dot segments
 | |
| 		// correctly (see https://github.com/boostorg/filesystem/issues/76). The only case where this
 | |
| 		// is possible after our normalization is a directory name ending in a slash (filename is a dot).
 | |
| 		_prefix.filename_is_dot() ? _prefix.parent_path() : _prefix
 | |
| 	);
 | |
| 	return !strippedPath.empty() && *strippedPath.begin() != "..";
 | |
| }
 | |
| 
 | |
| boost::filesystem::path FileReader::stripPrefixIfPresent(boost::filesystem::path const& _prefix, boost::filesystem::path const& _path)
 | |
| {
 | |
| 	if (!isPathPrefix(_prefix, _path))
 | |
| 		return _path;
 | |
| 
 | |
| 	boost::filesystem::path strippedPath = _path.lexically_relative(
 | |
| 		_prefix.filename_is_dot() ? _prefix.parent_path() : _prefix
 | |
| 	);
 | |
| 	solAssert(strippedPath.empty() || *strippedPath.begin() != "..", "");
 | |
| 	return strippedPath;
 | |
| }
 | |
| 
 | |
| boost::filesystem::path FileReader::absoluteDotDotPrefix(boost::filesystem::path const& _path)
 | |
| {
 | |
| 	solAssert(_path.is_absolute() || _path.root_path() == "/", "");
 | |
| 
 | |
| 	boost::filesystem::path _pathWithoutRoot = _path.relative_path();
 | |
| 	boost::filesystem::path prefix;
 | |
| 	for (boost::filesystem::path const& segment: _pathWithoutRoot)
 | |
| 		if (segment.filename_is_dot_dot())
 | |
| 			prefix /= segment;
 | |
| 
 | |
| 	return prefix;
 | |
| }
 | |
| 
 | |
| bool FileReader::hasDotDotSegments(boost::filesystem::path const& _path)
 | |
| {
 | |
| 	for (boost::filesystem::path const& segment: _path)
 | |
| 		if (segment.filename_is_dot_dot())
 | |
| 			return true;
 | |
| 
 | |
| 	return false;
 | |
| }
 | |
| 
 | |
| bool FileReader::isUNCPath(boost::filesystem::path const& _path)
 | |
| {
 | |
| 	std::string rootName = _path.root_name().string();
 | |
| 
 | |
| 	return (
 | |
| 		rootName.size() == 2 ||
 | |
| 		(rootName.size() > 2 && rootName[2] != rootName[1])
 | |
| 	) && (
 | |
| 		(rootName[0] == '/' && rootName[1] == '/')
 | |
| #if defined(_WIN32)
 | |
| 		|| (rootName[0] == '\\' && rootName[1] == '\\')
 | |
| #endif
 | |
| 	);
 | |
| }
 | |
| 
 | |
| }
 |