bc1ec69008
In this pull request, the state iterator is implemented. It's mostly a copy-paste from the original state snapshot package, but still has some important changes to highlight here: (a) The iterator for the disk layer consists of a diff iterator and a disk iterator. Originally, the disk layer in the state snapshot was a wrapper around the disk, and its corresponding iterator was also a wrapper around the disk iterator. However, due to structural differences, the disk layer iterator is divided into two parts: - The disk iterator, which traverses the content stored on disk. - The diff iterator, which traverses the aggregated state buffer. Checkout `BinaryIterator` and `FastIterator` for more details. (b) The staleness management is improved in the diffAccountIterator and diffStorageIterator Originally, in the `diffAccountIterator`, the layer’s staleness had to be checked within the Next function to ensure the iterator remained usable. Additionally, a read lock on the associated diff layer was required to first retrieve the account blob. This read lock protection is essential to prevent concurrent map read/write. Afterward, a staleness check was performed to ensure the retrieved data was not outdated. The entire logic can be simplified as follows: a loadAccount callback is provided to retrieve account data. If the corresponding state is immutable (e.g., diff layers in the path database), the staleness check can be skipped, and a single account data retrieval is sufficient. However, if the corresponding state is mutable (e.g., the disk layer in the path database), the callback can operate as follows: ```go func(hash common.Hash) ([]byte, error) { dl.lock.RLock() defer dl.lock.RUnlock() if dl.stale { return nil, errSnapshotStale } return dl.buffer.states.mustAccount(hash) } ``` The callback solution can eliminate the complexity for managing concurrency with the read lock for atomic operation.
151 lines
5.2 KiB
Go
151 lines
5.2 KiB
Go
// Copyright 2024 The go-ethereum Authors
|
|
// This file is part of the go-ethereum library.
|
|
//
|
|
// The go-ethereum library is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Lesser General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
//
|
|
// The go-ethereum library is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Lesser General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Lesser General Public License
|
|
// along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>
|
|
|
|
package pathdb
|
|
|
|
import (
|
|
"fmt"
|
|
|
|
"github.com/ethereum/go-ethereum/common"
|
|
"github.com/ethereum/go-ethereum/common/hexutil"
|
|
"github.com/ethereum/go-ethereum/core/types"
|
|
"github.com/ethereum/go-ethereum/log"
|
|
"github.com/ethereum/go-ethereum/rlp"
|
|
"github.com/ethereum/go-ethereum/triedb/database"
|
|
)
|
|
|
|
// The types of locations where the node is found.
|
|
const (
|
|
locDirtyCache = "dirty" // dirty cache
|
|
locCleanCache = "clean" // clean cache
|
|
locDiskLayer = "disk" // persistent state
|
|
locDiffLayer = "diff" // diff layers
|
|
)
|
|
|
|
// nodeLoc is a helpful structure that contains the location where the node
|
|
// is found, as it's useful for debugging purposes.
|
|
type nodeLoc struct {
|
|
loc string
|
|
depth int
|
|
}
|
|
|
|
// string returns the string representation of node location.
|
|
func (loc *nodeLoc) string() string {
|
|
return fmt.Sprintf("loc: %s, depth: %d", loc.loc, loc.depth)
|
|
}
|
|
|
|
// reader implements the database.NodeReader interface, providing the functionalities to
|
|
// retrieve trie nodes by wrapping the internal state layer.
|
|
type reader struct {
|
|
layer layer
|
|
noHashCheck bool
|
|
}
|
|
|
|
// Node implements database.NodeReader interface, retrieving the node with specified
|
|
// node info. Don't modify the returned byte slice since it's not deep-copied
|
|
// and still be referenced by database.
|
|
func (r *reader) Node(owner common.Hash, path []byte, hash common.Hash) ([]byte, error) {
|
|
blob, got, loc, err := r.layer.node(owner, path, 0)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
// Error out if the local one is inconsistent with the target.
|
|
if !r.noHashCheck && got != hash {
|
|
// Location is always available even if the node
|
|
// is not found.
|
|
switch loc.loc {
|
|
case locCleanCache:
|
|
nodeCleanFalseMeter.Mark(1)
|
|
case locDirtyCache:
|
|
nodeDirtyFalseMeter.Mark(1)
|
|
case locDiffLayer:
|
|
nodeDiffFalseMeter.Mark(1)
|
|
case locDiskLayer:
|
|
nodeDiskFalseMeter.Mark(1)
|
|
}
|
|
blobHex := "nil"
|
|
if len(blob) > 0 {
|
|
blobHex = hexutil.Encode(blob)
|
|
}
|
|
log.Error("Unexpected trie node", "location", loc.loc, "owner", owner.Hex(), "path", path, "expect", hash.Hex(), "got", got.Hex(), "blob", blobHex)
|
|
return nil, fmt.Errorf("unexpected node: (%x %v), %x!=%x, %s, blob: %s", owner, path, hash, got, loc.string(), blobHex)
|
|
}
|
|
return blob, nil
|
|
}
|
|
|
|
// AccountRLP directly retrieves the account associated with a particular hash.
|
|
// An error will be returned if the read operation exits abnormally. Specifically,
|
|
// if the layer is already stale.
|
|
//
|
|
// Note:
|
|
// - the returned account data is not a copy, please don't modify it
|
|
// - no error will be returned if the requested account is not found in database
|
|
func (r *reader) AccountRLP(hash common.Hash) ([]byte, error) {
|
|
return r.layer.account(hash, 0)
|
|
}
|
|
|
|
// Account directly retrieves the account associated with a particular hash in
|
|
// the slim data format. An error will be returned if the read operation exits
|
|
// abnormally. Specifically, if the layer is already stale.
|
|
//
|
|
// Note:
|
|
// - the returned account object is safe to modify
|
|
// - no error will be returned if the requested account is not found in database
|
|
func (r *reader) Account(hash common.Hash) (*types.SlimAccount, error) {
|
|
blob, err := r.layer.account(hash, 0)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
if len(blob) == 0 {
|
|
return nil, nil
|
|
}
|
|
account := new(types.SlimAccount)
|
|
if err := rlp.DecodeBytes(blob, account); err != nil {
|
|
panic(err)
|
|
}
|
|
return account, nil
|
|
}
|
|
|
|
// Storage directly retrieves the storage data associated with a particular hash,
|
|
// within a particular account. An error will be returned if the read operation
|
|
// exits abnormally. Specifically, if the layer is already stale.
|
|
//
|
|
// Note:
|
|
// - the returned storage data is not a copy, please don't modify it
|
|
// - no error will be returned if the requested slot is not found in database
|
|
func (r *reader) Storage(accountHash, storageHash common.Hash) ([]byte, error) {
|
|
return r.layer.storage(accountHash, storageHash, 0)
|
|
}
|
|
|
|
// NodeReader retrieves a layer belonging to the given state root.
|
|
func (db *Database) NodeReader(root common.Hash) (database.NodeReader, error) {
|
|
layer := db.tree.get(root)
|
|
if layer == nil {
|
|
return nil, fmt.Errorf("state %#x is not available", root)
|
|
}
|
|
return &reader{layer: layer, noHashCheck: db.isVerkle}, nil
|
|
}
|
|
|
|
// StateReader returns a reader that allows access to the state data associated
|
|
// with the specified state.
|
|
func (db *Database) StateReader(root common.Hash) (database.StateReader, error) {
|
|
layer := db.tree.get(root)
|
|
if layer == nil {
|
|
return nil, fmt.Errorf("state %#x is not available", root)
|
|
}
|
|
return &reader{layer: layer}, nil
|
|
}
|