-
Notifications
You must be signed in to change notification settings - Fork 13
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Include base -> overlay key-values migration logic #199
Changes from 4 commits
5aea81b
4896b69
db97f14
c9a85f6
b505401
55ca4c3
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -18,8 +18,10 @@ package core | |
|
||
import ( | ||
"bytes" | ||
"encoding/binary" | ||
"fmt" | ||
"math/big" | ||
"time" | ||
|
||
"github.com/ethereum/go-ethereum/common" | ||
"github.com/ethereum/go-ethereum/consensus" | ||
|
@@ -33,6 +35,9 @@ import ( | |
"github.com/ethereum/go-ethereum/log" | ||
"github.com/ethereum/go-ethereum/params" | ||
"github.com/ethereum/go-ethereum/trie" | ||
tutils "github.com/ethereum/go-ethereum/trie/utils" | ||
"github.com/gballet/go-verkle" | ||
"github.com/holiman/uint256" | ||
) | ||
|
||
// StateProcessor is a basic Processor, which takes care of transitioning | ||
|
@@ -96,6 +101,7 @@ func (p *StateProcessor) Process(block *types.Block, statedb *state.StateDB, cfg | |
// N values from the MPT into the verkle tree. | ||
if fdb, ok := statedb.Database().(*state.ForkingDB); ok { | ||
if fdb.InTransition() { | ||
now := time.Now() | ||
// XXX overkill, just save the parent root in the forking db | ||
tt := statedb.GetTrie().(*trie.TransitionTrie) | ||
mpt := tt.Base() | ||
|
@@ -109,17 +115,22 @@ func (p *StateProcessor) Process(block *types.Block, statedb *state.StateDB, cfg | |
return nil, nil, 0, err | ||
} | ||
|
||
// move N=500 accounts into the verkle tree, starting with the | ||
const maxMovedCount = 500 | ||
// mkv will be assiting in the collection of up to maxMovedCount key values to be migrated to the VKT. | ||
// It has internal caches to do efficient MPT->VKT key calculations, which will be discarded after | ||
// this function. | ||
mkv := &keyValueMigrator{} | ||
Comment on lines
+119
to
+122
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. This |
||
// move maxCount accounts into the verkle tree, starting with the | ||
// slots from the previous account. | ||
count := 0 | ||
for ; stIt.Next() && count < 500; count++ { | ||
addr := rawdb.ReadPreimage(statedb.Database().DiskDB(), accIt.Hash()) | ||
for ; stIt.Next() && count < maxMovedCount; count++ { | ||
slotnr := rawdb.ReadPreimage(statedb.Database().DiskDB(), stIt.Hash()) | ||
|
||
// @jsign: do your magic here adding the slot `slotnr` | ||
mkv.addStorageSlot(addr, slotnr, stIt.Slot()) | ||
} | ||
|
||
// if less than 500 slots were moved, move to the next account | ||
for count < 500 { | ||
// if less than maxCount slots were moved, move to the next account | ||
for count < maxMovedCount { | ||
if accIt.Next() { | ||
acc, err := snapshot.FullAccount(accIt.Account()) | ||
if err != nil { | ||
|
@@ -128,21 +139,21 @@ func (p *StateProcessor) Process(block *types.Block, statedb *state.StateDB, cfg | |
} | ||
addr := rawdb.ReadPreimage(statedb.Database().DiskDB(), accIt.Hash()) | ||
|
||
// @jsign: do your magic here adding the account at `addr | ||
mkv.addAccount(addr, acc) | ||
|
||
// Store the account code if present | ||
if !bytes.Equal(acc.CodeHash, emptyCode) { | ||
code := rawdb.ReadCode(statedb.Database().DiskDB(), common.BytesToHash(acc.CodeHash)) | ||
chunks := trie.ChunkifyCode(code) | ||
|
||
// @jsign: do your magic here with the code chunks | ||
mkv.addAccountCode(addr, uint64(len(code)), chunks) | ||
} | ||
|
||
if !bytes.Equal(acc.Root, emptyRoot[:]) { | ||
for ; stIt.Next() && count < 500; count++ { | ||
for ; stIt.Next() && count < maxMovedCount; count++ { | ||
slotnr := rawdb.ReadPreimage(statedb.Database().DiskDB(), stIt.Hash()) | ||
|
||
// @jsign do your magic here with extra slots | ||
mkv.addStorageSlot(addr, slotnr, stIt.Slot()) | ||
} | ||
Comment on lines
-131
to
157
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. TL;DR: we simply "collect" the key values and let mkv capture them. |
||
} | ||
} | ||
|
@@ -157,6 +168,13 @@ func (p *StateProcessor) Process(block *types.Block, statedb *state.StateDB, cfg | |
fdb.LastAccHash = accIt.Hash() | ||
fdb.LastSlotHash = stIt.Hash() | ||
} | ||
log.Info("Collected and prepared key values from base tree", "count", count, "duration", time.Since(now)) | ||
|
||
now = time.Now() | ||
if err := mkv.migrateCollectedKeyValues(tt.Overlay()); err != nil { | ||
return nil, nil, 0, fmt.Errorf("could not migrate key values: %w", err) | ||
} | ||
Comment on lines
+174
to
+176
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. After we finish collecting them, we let the component do the go-verkle use of new APIS: batch create leaf nodes, and insert into the tree. More about this below. |
||
log.Info("Inserted key values in overlay tree", "count", count, "duration", time.Since(now)) | ||
} | ||
} | ||
|
||
|
@@ -232,3 +250,114 @@ func ApplyTransaction(config *params.ChainConfig, bc ChainContext, author *commo | |
vmenv := vm.NewEVM(blockContext, vm.TxContext{}, statedb, config, cfg) | ||
return applyTransaction(msg, config, author, gp, statedb, header.Number, header.Hash(), tx, usedGas, vmenv) | ||
} | ||
|
||
// keyValueMigrator is a helper struct that collects key-values from the base tree. | ||
// The walk is done in account order, so **we assume** the APIs hold this invariant. This is | ||
// useful to be smart about caching banderwagon.Points to make VKT key calculations faster. | ||
type keyValueMigrator struct { | ||
currAddr []byte | ||
currAddrPoint *verkle.Point | ||
|
||
vktLeafData map[string]*verkle.BatchNewLeafNodeData | ||
} | ||
Comment on lines
+254
to
+262
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. There shouldn't be much surprises here. We keep collecting stuff in the vktLeafData which we use at the end to batch create leaf nodes and insert into the tree. The method implementations shouldn't be surprising. They're doing something similar to what we did in the full tree conversion. Note that I'm sharing as soon as I finished writing the code, so might be something missing, so please double check. I tried to use as many defined constants as possible to avoid magic indexes or sizes, etc. (As mentioned in the PR description, there're some potential changes to make this faster. But I think this is reasonable and quite clear/clean to have a decent starting point; we can see later if we need to push limits a bit more that can justify a more complex version). |
||
|
||
func (kvm *keyValueMigrator) addStorageSlot(addr []byte, slotNumber []byte, slotValue []byte) { | ||
addrPoint := kvm.getAddrPoint(addr) | ||
|
||
vktKey := tutils.GetTreeKeyStorageSlotWithEvaluatedAddress(addrPoint, slotNumber) | ||
leafNodeData := kvm.getOrInitLeafNodeData(vktKey) | ||
|
||
leafNodeData.Values[vktKey[verkle.StemSize]] = slotValue | ||
} | ||
|
||
func (kvm *keyValueMigrator) addAccount(addr []byte, acc snapshot.Account) { | ||
addrPoint := kvm.getAddrPoint(addr) | ||
|
||
vktKey := tutils.GetTreeKeyVersionWithEvaluatedAddress(addrPoint) | ||
leafNodeData := kvm.getOrInitLeafNodeData(vktKey) | ||
|
||
var version [verkle.LeafValueSize]byte | ||
leafNodeData.Values[tutils.VersionLeafKey] = version[:] | ||
|
||
var balance [verkle.LeafValueSize]byte | ||
for i, b := range acc.Balance.Bytes() { | ||
balance[len(acc.Balance.Bytes())-1-i] = b | ||
} | ||
leafNodeData.Values[tutils.BalanceLeafKey] = balance[:] | ||
|
||
var nonce [verkle.LeafValueSize]byte | ||
binary.LittleEndian.PutUint64(nonce[:8], acc.Nonce) | ||
leafNodeData.Values[tutils.NonceLeafKey] = balance[:] | ||
|
||
leafNodeData.Values[tutils.CodeKeccakLeafKey] = acc.CodeHash[:] | ||
|
||
// Code size is ignored here. If this isn't an EOA, the tree-walk will call | ||
// addAccountCode with this information. | ||
} | ||
|
||
func (kvm *keyValueMigrator) addAccountCode(addr []byte, codeSize uint64, chunks []byte) { | ||
addrPoint := kvm.getAddrPoint(addr) | ||
|
||
vktKey := tutils.GetTreeKeyVersionWithEvaluatedAddress(addrPoint) | ||
leafNodeData := kvm.getOrInitLeafNodeData(vktKey) | ||
|
||
// Save the code size. | ||
var codeSizeBytes [verkle.LeafValueSize]byte | ||
binary.LittleEndian.PutUint64(codeSizeBytes[:8], codeSize) | ||
leafNodeData.Values[tutils.CodeSizeLeafKey] = codeSizeBytes[:] | ||
|
||
// The first 128 chunks are stored in the account header leaf. | ||
for i := 0; i < 128 && i < len(chunks)/32; i++ { | ||
leafNodeData.Values[byte(128+i)] = chunks[32*i : 32*(i+1)] | ||
} | ||
|
||
// Potential further chunks, have their own leaf nodes. | ||
for i := 128; i < len(chunks)/32; { | ||
vktKey := tutils.GetTreeKeyCodeChunkWithEvaluatedAddress(addrPoint, uint256.NewInt(uint64(i))) | ||
leafNodeData := kvm.getOrInitLeafNodeData(vktKey) | ||
|
||
j := i | ||
for ; (j-i) < 256 && j < len(chunks)/32; j++ { | ||
leafNodeData.Values[byte((j-128)%256)] = chunks[32*j : 32*(j+1)] | ||
} | ||
i = j | ||
} | ||
} | ||
|
||
func (kvm *keyValueMigrator) getAddrPoint(addr []byte) *verkle.Point { | ||
if bytes.Equal(addr, kvm.currAddr) { | ||
return kvm.currAddrPoint | ||
} | ||
kvm.currAddr = addr | ||
kvm.currAddrPoint = tutils.EvaluateAddressPoint(addr) | ||
return kvm.currAddrPoint | ||
} | ||
|
||
func (kvm *keyValueMigrator) getOrInitLeafNodeData(stem []byte) *verkle.BatchNewLeafNodeData { | ||
stemStr := string(stem) | ||
if _, ok := kvm.vktLeafData[stemStr]; !ok { | ||
kvm.vktLeafData[stemStr] = &verkle.BatchNewLeafNodeData{ | ||
Stem: stem, | ||
Values: make(map[byte][]byte), | ||
} | ||
} | ||
return kvm.vktLeafData[stemStr] | ||
} | ||
|
||
func (kvm *keyValueMigrator) migrateCollectedKeyValues(tree *trie.VerkleTrie) error { | ||
// Transform the map into a slice. | ||
nodeValues := make([]verkle.BatchNewLeafNodeData, 0, len(kvm.vktLeafData)) | ||
for _, vld := range kvm.vktLeafData { | ||
nodeValues = append(nodeValues, *vld) | ||
} | ||
|
||
// Create all leaves in batch mode so we can optimize cryptography operations. | ||
newLeaves := verkle.BatchNewLeafNode(nodeValues) | ||
|
||
// Insert into the tree. | ||
if err := tree.InsertMigratedLeaves(newLeaves); err != nil { | ||
return fmt.Errorf("failed to insert migrated leaves: %w", err) | ||
} | ||
|
||
return nil | ||
} | ||
Comment on lines
+347
to
+363
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. This is what we called in L173. Basically, we use the new APIs to efficiently create leaves and insert into the tree. |
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -23,7 +23,7 @@ require ( | |
github.com/fjl/gencodec v0.0.0-20220412091415-8bb9e558978c | ||
github.com/fjl/memsize v0.0.0-20190710130421-bcb5799ab5e5 | ||
github.com/gballet/go-libpcsclite v0.0.0-20190607065134-2772fd86a8ff | ||
github.com/gballet/go-verkle v0.0.0-20230414192453-2838510d5ee0 | ||
github.com/gballet/go-verkle v0.0.0-20230420192103-fe912821ad59 | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Pointing to last commit of ethereum/go-verkle#343 There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. is there any reason that PR is still in draft, btw? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Mostly to have some extra information after seeing how would fit "this side" of the story. After that, I can update |
||
github.com/go-stack/stack v1.8.0 | ||
github.com/golang-jwt/jwt/v4 v4.3.0 | ||
github.com/golang/protobuf v1.5.2 | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -38,6 +38,10 @@ func (t *TransitionTrie) Base() *SecureTrie { | |
return t.base | ||
} | ||
|
||
func (t *TransitionTrie) Overlay() *VerkleTrie { | ||
return t.overlay | ||
} | ||
Comment on lines
+42
to
+44
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Needed for There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. is it needed? We could also just implement all the required functions on top of There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I guess it's simpler to do for now, could you just please add a TODO in a comment so that we remember to check that when we merge the final PR ? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. The "problem" with making it an API in I'll add the TODO to remember about this, yes. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Done. |
||
|
||
// GetKey returns the sha3 preimage of a hashed key that was previously used | ||
// to store a value. | ||
// | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -50,6 +50,12 @@ func NewVerkleTrie(root verkle.VerkleNode, db *Database, pointCache *utils.Point | |
} | ||
} | ||
|
||
func (trie *VerkleTrie) InsertMigratedLeaves(leaves []verkle.LeafNode) error { | ||
return trie.root.(*verkle.InternalNode).InsertMigratedLeaves(leaves, func(hash []byte) ([]byte, error) { | ||
return trie.db.diskdb.Get(hash) | ||
}) | ||
} | ||
Comment on lines
+53
to
+57
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Just a trampoline to use the new API to avoid magic castings and skipping layers. For now should be fine... whenever we reconsider ethereum/go-verkle#314 maybe this method will go away if it can be as fast as the new API. |
||
|
||
var errInvalidProof = errors.New("invalid proof") | ||
|
||
// GetKey returns the sha3 preimage of a hashed key that was previously used | ||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Only this offtopic nit.