// VulcanizeDB
// Copyright © 2020 Vulcanize

// This program is free software: you can redistribute it and/or modify
// it under the terms of the GNU Affero General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.

// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Affero General Public License for more details.

// You should have received a copy of the GNU Affero General Public License
// along with this program. If not, see <http://www.gnu.org/licenses/>.

package validator
|
|
|
|
|
|
|
|
import (
|
2022-08-08 23:28:13 +00:00
|
|
|
"bytes"
|
2022-08-24 19:09:46 +00:00
|
|
|
"context"
|
2022-08-08 23:28:13 +00:00
|
|
|
"fmt"
|
2021-08-25 08:20:31 +00:00
|
|
|
"time"
|
|
|
|
|
2020-06-25 20:11:50 +00:00
|
|
|
"github.com/ethereum/go-ethereum/common"
|
|
|
|
"github.com/ethereum/go-ethereum/core/state"
|
2022-08-08 23:28:13 +00:00
|
|
|
"github.com/ethereum/go-ethereum/core/types"
|
2020-06-26 18:11:30 +00:00
|
|
|
"github.com/ethereum/go-ethereum/crypto"
|
2020-06-25 20:11:50 +00:00
|
|
|
"github.com/ethereum/go-ethereum/ethdb"
|
2022-08-08 23:28:13 +00:00
|
|
|
"github.com/ethereum/go-ethereum/rlp"
|
2020-06-25 20:11:50 +00:00
|
|
|
"github.com/ethereum/go-ethereum/trie"
|
2020-07-13 00:57:47 +00:00
|
|
|
"github.com/ipfs/go-blockservice"
|
2020-06-25 20:11:50 +00:00
|
|
|
"github.com/jmoiron/sqlx"
|
2021-08-25 08:20:31 +00:00
|
|
|
"github.com/mailgun/groupcache/v2"
|
2022-08-24 19:09:46 +00:00
|
|
|
log "github.com/sirupsen/logrus"
|
|
|
|
"golang.org/x/sync/errgroup"
|
2020-06-25 20:11:50 +00:00
|
|
|
|
2022-09-14 19:01:21 +00:00
|
|
|
nodeiter "github.com/cerc-io/go-eth-state-node-iterator"
|
|
|
|
"github.com/cerc-io/go-eth-state-node-iterator/tracker"
|
|
|
|
ipfsethdb "github.com/cerc-io/ipfs-ethdb/v4"
|
|
|
|
pgipfsethdb "github.com/cerc-io/ipfs-ethdb/v4/postgres"
|
2020-06-25 20:11:50 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
// Validator is used for validating Ethereum state and storage tries on PG-IPFS
|
|
|
|
type Validator struct {
|
|
|
|
kvs ethdb.KeyValueStore
|
|
|
|
trieDB *trie.Database
|
|
|
|
stateDatabase state.Database
|
2021-08-25 08:20:31 +00:00
|
|
|
db *pgipfsethdb.Database
|
2022-08-08 23:28:13 +00:00
|
|
|
|
2022-08-24 19:09:46 +00:00
|
|
|
params Params
|
2020-06-25 20:11:50 +00:00
|
|
|
}
|
|
|
|
|
2022-08-24 19:09:46 +00:00
|
|
|
// Params holds the tunable settings of a Validator.
type Params struct {
	// Workers is the number of iterators a traversal is split into.
	// normalizeParams replaces a value of 0 with 1.
	Workers uint
	// RecoveryFormat is the format string used to build the recovery file
	// name; its %s verb is substituted with the traversal type.
	// normalizeParams replaces an empty value with DefaultRecoveryFormat.
	RecoveryFormat string
}
|
|
|
|
|
|
|
|
var (
|
|
|
|
DefaultRecoveryFormat = "./recover_validate_%s"
|
|
|
|
emptyCodeHash = crypto.Keccak256(nil)
|
|
|
|
)
|
2022-08-08 23:28:13 +00:00
|
|
|
|
2020-07-13 00:57:47 +00:00
|
|
|
// NewPGIPFSValidator returns a new trie validator ontop of a connection pool for an IPFS backing Postgres database
|
2022-08-24 19:09:46 +00:00
|
|
|
func NewPGIPFSValidator(db *sqlx.DB, par Params) *Validator {
|
2021-08-25 08:20:31 +00:00
|
|
|
kvs := pgipfsethdb.NewKeyValueStore(db, pgipfsethdb.CacheConfig{
|
|
|
|
Name: "kv",
|
|
|
|
Size: 16 * 1000 * 1000, // 16MB
|
|
|
|
ExpiryDuration: time.Hour * 8, // 8 hours
|
|
|
|
})
|
|
|
|
|
|
|
|
database := pgipfsethdb.NewDatabase(db, pgipfsethdb.CacheConfig{
|
|
|
|
Name: "db",
|
|
|
|
Size: 16 * 1000 * 1000, // 16MB
|
|
|
|
ExpiryDuration: time.Hour * 8, // 8 hours
|
|
|
|
})
|
|
|
|
|
2022-08-24 19:09:46 +00:00
|
|
|
normalizeParams(&par)
|
2020-07-13 00:57:47 +00:00
|
|
|
return &Validator{
|
|
|
|
kvs: kvs,
|
|
|
|
trieDB: trie.NewDatabase(kvs),
|
|
|
|
stateDatabase: state.NewDatabase(database),
|
2021-12-29 19:44:32 +00:00
|
|
|
db: database.(*pgipfsethdb.Database),
|
2022-08-24 19:09:46 +00:00
|
|
|
params: par,
|
2020-07-13 00:57:47 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-08-25 08:20:31 +00:00
|
|
|
func (v *Validator) GetCacheStats() groupcache.Stats {
|
|
|
|
return v.db.GetCacheStats()
|
|
|
|
}
|
|
|
|
|
2020-07-13 00:57:47 +00:00
|
|
|
// NewIPFSValidator returns a new trie validator ontop of an IPFS blockservice
|
2022-08-24 19:09:46 +00:00
|
|
|
func NewIPFSValidator(bs blockservice.BlockService, par Params) *Validator {
|
2020-07-13 00:57:47 +00:00
|
|
|
kvs := ipfsethdb.NewKeyValueStore(bs)
|
|
|
|
database := ipfsethdb.NewDatabase(bs)
|
2022-08-24 19:09:46 +00:00
|
|
|
normalizeParams(&par)
|
2020-07-13 00:57:47 +00:00
|
|
|
return &Validator{
|
|
|
|
kvs: kvs,
|
|
|
|
trieDB: trie.NewDatabase(kvs),
|
|
|
|
stateDatabase: state.NewDatabase(database),
|
2022-08-24 19:09:46 +00:00
|
|
|
params: par,
|
2020-07-13 00:57:47 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-25 20:11:50 +00:00
|
|
|
// NewValidator returns a new trie validator
|
2020-06-26 18:11:30 +00:00
|
|
|
// Validating the completeness of a modified merkle patricia tries requires traversing the entire trie and verifying that
|
|
|
|
// every node is present, this is an expensive operation
|
2020-07-13 00:57:47 +00:00
|
|
|
func NewValidator(kvs ethdb.KeyValueStore, database ethdb.Database) *Validator {
|
2020-06-25 20:11:50 +00:00
|
|
|
return &Validator{
|
|
|
|
kvs: kvs,
|
|
|
|
trieDB: trie.NewDatabase(kvs),
|
|
|
|
stateDatabase: state.NewDatabase(database),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-08-24 19:09:46 +00:00
|
|
|
// Ensure params are valid
|
|
|
|
func normalizeParams(p *Params) {
|
|
|
|
if p.Workers == 0 {
|
|
|
|
p.Workers = 1
|
2022-08-08 23:28:13 +00:00
|
|
|
}
|
2022-08-24 19:09:46 +00:00
|
|
|
if len(p.RecoveryFormat) == 0 {
|
|
|
|
p.RecoveryFormat = DefaultRecoveryFormat
|
2022-08-08 23:28:13 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-26 18:11:30 +00:00
|
|
|
// ValidateTrie returns an error if the state and storage tries for the provided state root cannot be confirmed as complete
|
|
|
|
// This does consider child storage tries
|
|
|
|
func (v *Validator) ValidateTrie(stateRoot common.Hash) error {
|
2022-08-08 23:28:13 +00:00
|
|
|
t, err := v.stateDatabase.OpenTrie(stateRoot)
|
2020-06-25 20:11:50 +00:00
|
|
|
if err != nil {
|
2020-06-26 18:11:30 +00:00
|
|
|
return err
|
2020-06-25 20:11:50 +00:00
|
|
|
}
|
2022-08-24 19:09:46 +00:00
|
|
|
iterate := func(it trie.NodeIterator) error { return v.iterate(it, true) }
|
|
|
|
return iterateTracked(t, fmt.Sprintf(v.params.RecoveryFormat, fullTraversal), v.params.Workers, iterate)
|
2020-06-26 18:11:30 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// ValidateStateTrie returns an error if the state trie for the provided state root cannot be confirmed as complete
|
|
|
|
// This does not consider child storage tries
|
|
|
|
func (v *Validator) ValidateStateTrie(stateRoot common.Hash) error {
|
|
|
|
// Generate the trie.NodeIterator for this root
|
|
|
|
t, err := v.stateDatabase.OpenTrie(stateRoot)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2022-08-24 19:09:46 +00:00
|
|
|
iterate := func(it trie.NodeIterator) error { return v.iterate(it, false) }
|
|
|
|
return iterateTracked(t, fmt.Sprintf(v.params.RecoveryFormat, stateTraversal), v.params.Workers, iterate)
|
2020-06-26 18:11:30 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// ValidateStorageTrie returns an error if the storage trie for the provided storage root and contract address cannot be confirmed as complete
|
|
|
|
func (v *Validator) ValidateStorageTrie(address common.Address, storageRoot common.Hash) error {
|
|
|
|
// Generate the state.NodeIterator for this root
|
|
|
|
addrHash := crypto.Keccak256Hash(address.Bytes())
|
|
|
|
t, err := v.stateDatabase.OpenStorageTrie(addrHash, storageRoot)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2022-08-24 19:09:46 +00:00
|
|
|
iterate := func(it trie.NodeIterator) error { return v.iterate(it, false) }
|
|
|
|
return iterateTracked(t, fmt.Sprintf(v.params.RecoveryFormat, storageTraversal), v.params.Workers, iterate)
|
2020-06-25 20:11:50 +00:00
|
|
|
}
|
2021-10-11 15:18:45 +00:00
|
|
|
|
|
|
|
// Close implements io.Closer
|
|
|
|
// it deregisters the groupcache name
|
|
|
|
func (v *Validator) Close() error {
|
|
|
|
groupcache.DeregisterGroup("kv")
|
|
|
|
groupcache.DeregisterGroup("db")
|
|
|
|
return nil
|
|
|
|
}
|
2022-08-24 19:09:46 +00:00
|
|
|
|
2022-08-30 14:48:12 +00:00
|
|
|
// Traverses one iterator fully
|
2022-08-24 19:09:46 +00:00
|
|
|
// If storage = true, also traverse storage tries for each leaf.
|
|
|
|
func (v *Validator) iterate(it trie.NodeIterator, storage bool) error {
|
|
|
|
// Iterate through entire state trie. it.Next() will return false when we have
|
|
|
|
// either completed iteration of the entire trie or run into an error (e.g. a
|
|
|
|
// missing node). If we are able to iterate through the entire trie without error
|
|
|
|
// then the trie is complete.
|
|
|
|
for it.Next(true) {
|
|
|
|
// This block adapted from geth - core/state/iterator.go
|
|
|
|
// If storage is not requested, or the state trie node is an internal entry, skip
|
|
|
|
if !storage || !it.Leaf() {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
// Otherwise we've reached an account node, initiate data iteration
|
|
|
|
var account types.StateAccount
|
|
|
|
if err := rlp.Decode(bytes.NewReader(it.LeafBlob()), &account); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
dataTrie, err := v.stateDatabase.OpenStorageTrie(common.BytesToHash(it.LeafKey()), account.Root)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
dataIt := dataTrie.NodeIterator(nil)
|
|
|
|
if !bytes.Equal(account.CodeHash, emptyCodeHash) {
|
|
|
|
addrHash := common.BytesToHash(it.LeafKey())
|
|
|
|
_, err := v.stateDatabase.ContractCode(addrHash, common.BytesToHash(account.CodeHash))
|
|
|
|
if err != nil {
|
2022-08-30 14:48:12 +00:00
|
|
|
return fmt.Errorf("code %x: %w (path %x)", account.CodeHash, err, nodeiter.HexToKeyBytes(it.Path()))
|
2022-08-24 19:09:46 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
for dataIt.Next(true) {
|
|
|
|
}
|
|
|
|
if dataIt.Error() != nil {
|
2022-08-30 14:48:12 +00:00
|
|
|
return fmt.Errorf("data iterator error (path %x): %w", nodeiter.HexToKeyBytes(dataIt.Path()), dataIt.Error())
|
2022-08-24 19:09:46 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return it.Error()
|
|
|
|
}
|
|
|
|
|
2022-08-30 14:48:12 +00:00
|
|
|
// Traverses each iterator in a separate goroutine, dumping to a recovery file on failure. Handles signals
|
2022-08-24 19:09:46 +00:00
|
|
|
func iterateTracked(tree state.Trie, recoveryFile string, iterCount uint, fn func(trie.NodeIterator) error) error {
|
|
|
|
ctx, cancelCtx := context.WithCancel(context.Background())
|
|
|
|
tracker := tracker.New(recoveryFile, iterCount)
|
|
|
|
tracker.CaptureSignal(cancelCtx)
|
|
|
|
halt := func() {
|
|
|
|
if err := tracker.HaltAndDump(); err != nil {
|
|
|
|
log.Errorf("failed to write recovery file: %v", err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// attempt to restore from recovery file if it exists
|
|
|
|
iters, err := tracker.Restore(tree)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
if iterCount < uint(len(iters)) {
|
|
|
|
return fmt.Errorf("recovered too many iterators: got %d, expected %d", len(iters), iterCount)
|
|
|
|
}
|
|
|
|
|
|
|
|
if iters == nil { // nothing restored
|
|
|
|
iters = nodeiter.SubtrieIterators(tree, iterCount)
|
|
|
|
for i, it := range iters {
|
|
|
|
iters[i] = tracker.Tracked(it, nil)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
g, ctx := errgroup.WithContext(ctx)
|
|
|
|
defer halt()
|
|
|
|
|
|
|
|
for _, it := range iters {
|
|
|
|
func(it trie.NodeIterator) {
|
|
|
|
g.Go(func() error { return fn(it) })
|
|
|
|
}(it)
|
|
|
|
}
|
|
|
|
return g.Wait()
|
|
|
|
}
|