go-ethereum/core/state/partial/state.go
CPerezz fc2d55dd58
core/state/partial: only write modified accounts to trie
Match upstream BALStateTransition behavior: only call UpdateAccount for
accounts that were actually modified (balance, nonce, code, or storage
changes). Previously, all accounts in the BAL (including read-only ones)
were written back to the trie, which could cause root mismatches if the
re-encoded RLP differed from the original encoding.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-04-17 12:13:05 +02:00

465 lines
16 KiB
Go

// Copyright 2025 The go-ethereum Authors
// This file is part of the go-ethereum library.
//
// The go-ethereum library is free software: you can redistribute it and/or modify
// it under the terms of the GNU Lesser General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// The go-ethereum library is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Lesser General Public License for more details.
//
// You should have received a copy of the GNU Lesser General Public License
// along with the go-ethereum library. If not, see <http://www.gnu.org/licenses/>.
package partial
import (
"bytes"
"fmt"
"sync/atomic"
"github.com/ethereum/go-ethereum/common"
"github.com/ethereum/go-ethereum/core/rawdb"
"github.com/ethereum/go-ethereum/core/types"
"github.com/ethereum/go-ethereum/core/types/bal"
"github.com/ethereum/go-ethereum/crypto"
"github.com/ethereum/go-ethereum/ethdb"
"github.com/ethereum/go-ethereum/log"
"github.com/ethereum/go-ethereum/rlp"
"github.com/ethereum/go-ethereum/trie"
"github.com/ethereum/go-ethereum/trie/trienode"
"github.com/ethereum/go-ethereum/triedb"
"github.com/holiman/uint256"
)
// StorageRootResolver fetches new storage roots for untracked accounts from peers.
// Parameters: stateRoot (block's expected root), addrs (untracked addresses with
// storage changes), oldRoots (their current storage roots — used to detect stale
// peer responses). Returns: map of address → new storage root for resolved addresses.
type StorageRootResolver func(stateRoot common.Hash, addrs []common.Address, oldRoots map[common.Address]common.Hash) (map[common.Address]common.Hash, error)
// PartialState manages state for partial stateful nodes.
// It applies BAL diffs to update state without re-executing transactions.
type PartialState struct {
db ethdb.Database
trieDB *triedb.Database
filter ContractFilter
history *BALHistory
resolver StorageRootResolver // optional, for resolving untracked storage roots
stateRoot atomic.Pointer[common.Hash] // computed root (may differ from header root)
lastProcessedNum uint64 // last block successfully processed via BAL
}
// SetResolver sets the storage root resolver used to fetch updated storage roots
// for untracked contracts from snap-capable peers.
func (s *PartialState) SetResolver(r StorageRootResolver) {
s.resolver = r
}
// NewPartialState creates a new partial state manager.
func NewPartialState(db ethdb.Database, trieDB *triedb.Database, filter ContractFilter, balRetention uint64) *PartialState {
return &PartialState{
db: db,
trieDB: trieDB,
filter: filter,
history: NewBALHistory(db, balRetention),
}
}
// Filter returns the contract filter used by this partial state.
func (s *PartialState) Filter() ContractFilter {
return s.filter
}
// SetRoot atomically sets the current computed state root.
func (s *PartialState) SetRoot(root common.Hash) {
s.stateRoot.Store(&root)
}
// Root atomically returns the current computed state root.
func (s *PartialState) Root() common.Hash {
if p := s.stateRoot.Load(); p != nil {
return *p
}
return common.Hash{}
}
// History returns the BAL history manager.
func (s *PartialState) History() *BALHistory {
return s.history
}
// LastProcessedBlock returns the number of the last block processed via BAL.
func (s *PartialState) LastProcessedBlock() uint64 {
return s.lastProcessedNum
}
// SetLastProcessedBlock records the last block successfully processed via BAL.
func (s *PartialState) SetLastProcessedBlock(num uint64) {
s.lastProcessedNum = num
}
// accountState tracks an account being processed with origin info for PathDB StateSet.
type accountState struct {
account *types.StateAccount
origin *types.StateAccount // Original state (for PathDB StateSet)
addr common.Address
existed bool // true if account existed before this block
modified bool // true if any field was changed
storageRoot common.Hash // updated after storage trie commit
}
// ApplyBALAndComputeRoot applies BAL diffs and returns the new state root.
// This is the core method for partial state block processing.
//
// The expectedRoot parameter is the block header's declared state root. It is used
// in two ways: (1) to query peers for untracked contracts' storage roots, and
// (2) as a fallback PathDB layer label if peer resolution fails. Pass common.Hash{}
// to skip resolution and fallback (used in tests).
//
// Commit ordering (critical for correct state root):
// Phase 1: For each account, apply storage changes and commit storage trie
// Phase 1.5: Resolve storage roots for untracked contracts with storage changes
// Phase 2: Update account Root fields with committed storage roots
// Phase 3: Commit account trie to get final state root
func (s *PartialState) ApplyBALAndComputeRoot(parentRoot common.Hash, expectedRoot common.Hash, accessList *bal.BlockAccessList) (common.Hash, int, error) {
// Open state trie at parent root
tr, err := trie.NewStateTrie(trie.StateTrieID(parentRoot), s.trieDB)
if err != nil {
return common.Hash{}, 0, fmt.Errorf("failed to open state trie: %w", err)
}
// Collect all account states with origin tracking
accounts := make([]*accountState, 0, len(*accessList))
// Collect all trie nodes for batched update
allNodes := trienode.NewMergedNodeSet()
// Phase 1: Process each account's changes from BAL
for _, access := range *accessList {
addr := common.BytesToAddress(access.Address[:])
// Get current account state with origin tracking
data, err := tr.GetAccount(addr)
if err != nil {
return common.Hash{}, 0, fmt.Errorf("failed to get account %s: %w", addr.Hex(), err)
}
existed := data != nil
var account *types.StateAccount
if existed {
account = data
} else {
// New account - create with defaults
account = &types.StateAccount{
Balance: new(uint256.Int),
Root: types.EmptyRootHash,
CodeHash: types.EmptyCodeHash.Bytes(),
}
}
// Copy original state for PathDB StateSet
var origin *types.StateAccount
if existed {
origin = &types.StateAccount{
Nonce: account.Nonce,
Balance: new(uint256.Int).Set(account.Balance),
Root: account.Root,
CodeHash: common.CopyBytes(account.CodeHash),
}
}
state := &accountState{
account: account,
origin: origin,
addr: addr,
existed: existed,
modified: false,
storageRoot: account.Root,
}
// Apply balance changes (use final value from last tx)
if len(access.BalanceChanges) > 0 {
lastChange := access.BalanceChanges[len(access.BalanceChanges)-1]
account.Balance = new(uint256.Int).Set(lastChange.Balance)
state.modified = true
}
// Apply nonce changes
if len(access.NonceChanges) > 0 {
lastNonce := access.NonceChanges[len(access.NonceChanges)-1]
account.Nonce = lastNonce.Nonce
state.modified = true
}
// Apply code changes
if len(access.CodeChanges) > 0 {
lastCode := access.CodeChanges[len(access.CodeChanges)-1]
codeHash := crypto.Keccak256Hash(lastCode.Code)
account.CodeHash = codeHash.Bytes()
state.modified = true
// Only store code bytes for tracked contracts
if s.filter.IsTracked(addr) {
rawdb.WriteCode(s.db, codeHash, lastCode.Code)
}
}
// Apply storage changes (only for tracked contracts)
// CRITICAL: Commit storage trie HERE, before account trie
if len(access.StorageChanges) > 0 && s.filter.IsTracked(addr) {
newStorageRoot, storageNodes, err := s.applyStorageChanges(
addr, parentRoot, account.Root, &access)
if err != nil {
return common.Hash{}, 0, fmt.Errorf("failed to apply storage for %s: %w",
addr.Hex(), err)
}
state.storageRoot = newStorageRoot
state.modified = true
// Merge storage nodes
if storageNodes != nil {
if err := allNodes.Merge(storageNodes); err != nil {
return common.Hash{}, 0, err
}
}
}
accounts = append(accounts, state)
}
// Phase 1.5: Resolve storage roots for untracked contracts with storage changes.
// These contracts had storage modifications in the BAL but we skipped applying them
// (no local storage trie). We need their new storage roots to compute the correct
// state root. Query snap peers, or fall back to using expectedRoot as the layer label.
var untrackedAddrs []common.Address
oldRoots := make(map[common.Address]common.Hash)
for _, access := range *accessList {
addr := common.BytesToAddress(access.Address[:])
if !s.filter.IsTracked(addr) && len(access.StorageChanges) > 0 {
untrackedAddrs = append(untrackedAddrs, addr)
// Look up the current storage root from the account we already loaded
for _, state := range accounts {
if state.addr == addr {
oldRoots[addr] = state.storageRoot
break
}
}
}
}
var resolved map[common.Address]common.Hash
if len(untrackedAddrs) > 0 && s.resolver != nil {
var err error
resolved, err = s.resolver(expectedRoot, untrackedAddrs, oldRoots)
if err != nil {
log.Warn("Storage root resolution failed", "unresolved", len(untrackedAddrs), "err", err)
} else {
// Apply resolved storage roots
for _, state := range accounts {
if newRoot, ok := resolved[state.addr]; ok {
state.storageRoot = newRoot
state.modified = true
}
}
}
}
// Phase 2: Update account Root fields and write to account trie
for _, state := range accounts {
// Update storage root (may have changed in Phase 1)
state.account.Root = state.storageRoot
// Only consider deletion if modified AND now empty (EIP-161)
if state.modified && s.isEmptyAccount(state.account) {
// Only delete if it existed before (don't delete never-existed accounts)
if state.existed {
if err := tr.DeleteAccount(state.addr); err != nil {
return common.Hash{}, 0, fmt.Errorf("failed to delete account %s: %w",
state.addr.Hex(), err)
}
}
// Skip update for accounts that didn't exist and are still empty
continue
}
// Only write accounts that were actually modified to the trie.
// Upstream BALStateTransition only processes ModifiedAccounts().
if !state.modified {
continue
}
if err := tr.UpdateAccount(state.addr, state.account, 0); err != nil {
return common.Hash{}, 0, fmt.Errorf("failed to update account %s: %w",
state.addr.Hex(), err)
}
}
// Phase 3: Commit account trie
root, accountNodes := tr.Commit(false)
// Merge account nodes
if accountNodes != nil {
if err := allNodes.Merge(accountNodes); err != nil {
return common.Hash{}, 0, err
}
}
// Build StateSet for PathDB compatibility
stateSet := s.buildStateSet(accounts, accessList)
// Compute unresolved count for caller to decide root mismatch severity.
// The computed root may differ from the header root when untracked contracts
// have unresolved storage roots. Subsequent blocks must chain off the
// computed root (via partialState.Root()), not the header root.
unresolvedCount := 0
if len(untrackedAddrs) > 0 {
unresolvedCount = len(untrackedAddrs)
if resolved != nil {
for _, addr := range untrackedAddrs {
if _, ok := resolved[addr]; ok {
unresolvedCount--
}
}
}
if unresolvedCount > 0 {
log.Debug("Unresolved untracked storage roots",
"unresolved", unresolvedCount, "total", len(untrackedAddrs),
"expectedRoot", expectedRoot, "computedRoot", root)
}
}
// Write all trie nodes and state to database
if err := s.trieDB.Update(root, parentRoot, 0, allNodes, stateSet); err != nil {
return common.Hash{}, 0, fmt.Errorf("failed to update trie db: %w", err)
}
s.stateRoot.Store(&root)
return root, unresolvedCount, nil
}
// buildStateSet constructs StateSet for trieDB.Update() (required for PathDB).
// The StateSet tracks account and storage changes along with their original values,
// which PathDB uses for efficient state diff tracking.
func (s *PartialState) buildStateSet(accounts []*accountState, accessList *bal.BlockAccessList) *triedb.StateSet {
stateSet := triedb.NewStateSet()
for _, state := range accounts {
addrHash := crypto.Keccak256Hash(state.addr.Bytes())
// Add account data (slim RLP encoding)
if s.isEmptyAccount(state.account) && state.existed {
stateSet.Accounts[addrHash] = nil // nil = deletion
} else if state.modified {
stateSet.Accounts[addrHash] = types.SlimAccountRLP(*state.account)
}
// Add account origin (original state before this block)
if state.origin != nil {
stateSet.AccountsOrigin[state.addr] = types.SlimAccountRLP(*state.origin)
}
// Add storage changes for tracked contracts
if s.filter.IsTracked(state.addr) {
s.addStorageToStateSet(stateSet, state.addr, addrHash, accessList)
}
}
return stateSet
}
// addStorageToStateSet finds storage writes for the given address and adds them to the StateSet.
func (s *PartialState) addStorageToStateSet(stateSet *triedb.StateSet, addr common.Address, addrHash common.Hash, accessList *bal.BlockAccessList) {
// Find this account's storage writes in BAL
for _, access := range *accessList {
accessAddr := access.Address
if accessAddr != addr {
continue
}
if len(access.StorageChanges) == 0 {
break
}
storageMap := make(map[common.Hash][]byte)
for _, slotWrite := range access.StorageChanges {
slotKey := slotWrite.Slot.ToHash()
slotHash := crypto.Keccak256Hash(slotKey[:])
if len(slotWrite.Accesses) > 0 {
lastWrite := slotWrite.Accesses[len(slotWrite.Accesses)-1]
value := lastWrite.ValueAfter.ToHash()
if value == (common.Hash{}) {
storageMap[slotHash] = nil // nil = deletion
} else {
// Prefix-zero-trimmed RLP encoding
blob, err := rlp.EncodeToBytes(common.TrimLeftZeroes(value[:]))
if err != nil {
panic(fmt.Sprintf("failed to RLP-encode storage value: %v", err))
}
storageMap[slotHash] = blob
}
}
}
stateSet.Storages[addrHash] = storageMap
break
}
}
// isEmptyAccount checks if account is empty per EIP-161.
// An account is empty if it has zero nonce, zero balance, empty storage root,
// and empty code hash.
func (s *PartialState) isEmptyAccount(account *types.StateAccount) bool {
return account.Balance.IsZero() &&
account.Nonce == 0 &&
account.Root == types.EmptyRootHash &&
bytes.Equal(account.CodeHash, types.EmptyCodeHash.Bytes())
}
// applyStorageChanges applies storage writes and returns new root + nodes.
// Note: Does NOT write to trieDB - caller batches all writes.
func (s *PartialState) applyStorageChanges(
addr common.Address,
stateRoot common.Hash,
currentStorageRoot common.Hash,
access *bal.AccountAccess,
) (common.Hash, *trienode.NodeSet, error) {
// Open storage trie (use parent state root for ID, not current)
addrHash := crypto.Keccak256Hash(addr.Bytes())
storageID := trie.StorageTrieID(stateRoot, addrHash, currentStorageRoot)
storageTrie, err := trie.NewStateTrie(storageID, s.trieDB)
if err != nil {
return common.Hash{}, nil, err
}
// Apply each storage write (use final value)
for _, slotWrite := range access.StorageChanges {
slot := slotWrite.Slot.ToHash()
// Get final value (last write wins)
if len(slotWrite.Accesses) == 0 {
continue
}
lastWrite := slotWrite.Accesses[len(slotWrite.Accesses)-1]
value := lastWrite.ValueAfter.ToHash()
if value == (common.Hash{}) {
// Delete slot
if err := storageTrie.DeleteStorage(addr, slot.Bytes()); err != nil {
return common.Hash{}, nil, err
}
} else {
// Update slot — trim leading zeros to match how the EVM stores
// values (as big integers). UpdateStorage RLP-encodes the value,
// so [0,0,...,5] vs [5] produce different trie nodes.
if err := storageTrie.UpdateStorage(addr, slot.Bytes(), common.TrimLeftZeroes(value.Bytes())); err != nil {
return common.Hash{}, nil, err
}
}
}
// Commit storage trie (collect nodes, don't write to DB yet)
storageRoot, nodes := storageTrie.Commit(false)
return storageRoot, nodes, nil
}