From 5444cd1ef57e68088853f47d2b2f0f3ab3ca2ed4 Mon Sep 17 00:00:00 2001 From: Guillaume Ballet <3272758+gballet@users.noreply.github.com> Date: Wed, 11 Sep 2024 12:51:34 +0200 Subject: [PATCH 1/8] use skiplists to compress leave storage --- encoding.go | 55 +++++++++++++++++++----- encoding_test.go | 109 ++++++++++++++++++++++++++++++++++++++--------- tree.go | 54 +++++++++++++++++------ 3 files changed, 173 insertions(+), 45 deletions(-) diff --git a/encoding.go b/encoding.go index d5e27d17..0f64e682 100644 --- a/encoding.go +++ b/encoding.go @@ -56,12 +56,11 @@ const ( leafC1CommitmentOffset = leafCommitmentOffset + banderwagon.UncompressedSize leafC2CommitmentOffset = leafC1CommitmentOffset + banderwagon.UncompressedSize leafChildrenOffset = leafC2CommitmentOffset + banderwagon.UncompressedSize - leafBalanceSize = 32 - leafNonceSize = 8 + leafBasicDataSize = 32 leafSlotSize = 32 leafValueIndexSize = 1 singleSlotLeafSize = nodeTypeSize + StemSize + 2*banderwagon.UncompressedSize + leafValueIndexSize + leafSlotSize - eoaLeafSize = nodeTypeSize + StemSize + 2*banderwagon.UncompressedSize + leafBalanceSize + leafNonceSize + eoaLeafSize = nodeTypeSize + StemSize + 2*banderwagon.UncompressedSize + leafBasicDataSize ) func bit(bitlist []byte, nr int) bool { @@ -94,6 +93,8 @@ func ParseNode(serializedNode []byte, depth byte) (VerkleNode, error) { return parseEoAccountNode(serializedNode, depth) case singleSlotType: return parseSingleSlotNode(serializedNode, depth) + case skipListType: + return parseSkipList(serializedNode, depth) default: return nil, ErrInvalidNodeEncoding } @@ -135,17 +136,49 @@ func parseLeafNode(serialized []byte, depth byte) (VerkleNode, error) { return ln, nil } +func parseSkipList(serialized []byte, depth byte) (VerkleNode, error) { + var values [NodeWidth][]byte + offset := leafStemOffset + StemSize + 3*banderwagon.UncompressedSize // offset in the serialized payload + valueIdx := 0 // Index of the value being deserialized + for valueIdx < NodeWidth { + rangecount := serialized[offset+1] + gapsize := serialized[offset] + valueIdx += int(gapsize) + offset += 2 + for i := 0; i < int(rangecount); i++ { + values[valueIdx] = serialized[offset : offset+leafSlotSize] + offset += leafSlotSize + valueIdx++ + } + } + ln := NewLeafNodeWithNoComms(serialized[leafStemOffset:leafStemOffset+StemSize], values[:]) + ln.setDepth(depth) + ln.c1 = new(Point) + + // Sanity check that we have at least 3*banderwagon.UncompressedSize bytes left in the serialized payload. + if len(serialized[leafCommitmentOffset:]) < 3*banderwagon.UncompressedSize { + return nil, fmt.Errorf("leaf node commitments are not the correct size, expected at least %d, got %d", 3*banderwagon.UncompressedSize, len(serialized[leafC1CommitmentOffset:])) + } + + if err := ln.c1.SetBytesUncompressed(serialized[leafC1CommitmentOffset:leafC1CommitmentOffset+banderwagon.UncompressedSize], true); err != nil { + return nil, fmt.Errorf("setting c1 commitment: %w", err) + } + ln.c2 = new(Point) + if err := ln.c2.SetBytesUncompressed(serialized[leafC2CommitmentOffset:leafC2CommitmentOffset+banderwagon.UncompressedSize], true); err != nil { + return nil, fmt.Errorf("setting c2 commitment: %w", err) + } + ln.commitment = new(Point) + if err := ln.commitment.SetBytesUncompressed(serialized[leafCommitmentOffset:leafC1CommitmentOffset], true); err != nil { + return nil, fmt.Errorf("setting commitment: %w", err) + } + return ln, nil +} + func parseEoAccountNode(serialized []byte, depth byte) (VerkleNode, error) { var values [NodeWidth][]byte offset := leafStemOffset + StemSize + 2*banderwagon.UncompressedSize - values[0] = zero32[:] // 0 version - values[1] = serialized[offset : offset+leafBalanceSize] // balance - var nonce [32]byte - offset += leafBalanceSize - copy(nonce[:leafNonceSize], serialized[offset:offset+leafNonceSize]) - values[2] = nonce[:] // nonce - values[3] = EmptyCodeHash[:] - values[4] = zero32[:] // 0 code size + values[0] = serialized[offset : offset+leafBasicDataSize] // basic data + values[1] = EmptyCodeHash[:] ln := NewLeafNodeWithNoComms(serialized[leafStemOffset:leafStemOffset+StemSize], values[:]) ln.setDepth(depth) ln.c1 = new(Point) diff --git a/encoding_test.go b/encoding_test.go index c7eb53d6..3f6ed4bd 100644 --- a/encoding_test.go +++ b/encoding_test.go @@ -2,6 +2,7 @@ package verkle import ( "bytes" + "encoding/binary" "testing" "github.com/crate-crypto/go-ipa/banderwagon" @@ -22,7 +23,9 @@ func TestLeafStemLength(t *testing.T) { // Serialize a leaf with no values, but whose stem is 32 bytes. The // serialization should trim the extra byte. toolong := make([]byte, 32) - leaf, err := NewLeafNode(toolong, make([][]byte, NodeWidth)) + values := make([][]byte, NodeWidth) + values[42] = zero32[:] + leaf, err := NewLeafNode(toolong, values) if err != nil { t.Fatal(err) } @@ -30,8 +33,8 @@ func TestLeafStemLength(t *testing.T) { if err != nil { t.Fatal(err) } - if len(ser) != nodeTypeSize+StemSize+bitlistSize+3*banderwagon.UncompressedSize { - t.Fatalf("invalid serialization when the stem is longer than 31 bytes: %x (%d bytes != %d)", ser, len(ser), nodeTypeSize+StemSize+bitlistSize+2*banderwagon.UncompressedSize) + if len(ser) != singleSlotLeafSize { + t.Fatalf("invalid serialization when the stem is longer than 31 bytes: %x (%d bytes != %d)", ser, len(ser), singleSlotLeafSize) } } @@ -61,12 +64,11 @@ func TestInvalidNodeEncoding(t *testing.T) { } func TestParseNodeEoA(t *testing.T) { + var basicdata [32]byte values := make([][]byte, 256) - values[0] = zero32[:] + values[0] = basicdata[:] + binary.BigEndian.PutUint64(values[0][8:], 0xde) values[1] = EmptyCodeHash[:] // set empty code hash as balance, because why not - values[2] = fourtyKeyTest[:] // set nonce to 64 - values[3] = EmptyCodeHash[:] // set empty code hash - values[4] = zero32[:] // zero-size ln, err := NewLeafNode(ffx32KeyTest[:31], values) if err != nil { t.Fatalf("error creating leaf node: %v", err) @@ -99,26 +101,15 @@ func TestParseNodeEoA(t *testing.T) { t.Fatalf("invalid stem, got %x, expected %x", lnd.stem, ffx32KeyTest[:31]) } - if !bytes.Equal(lnd.values[0], zero32[:]) { - t.Fatalf("invalid version, got %x, expected %x", lnd.values[0], zero32[:]) + nonce := binary.BigEndian.Uint64(lnd.values[0][8:]) + if nonce != 0xde { + t.Fatalf("invalid version, got %x, expected %x", nonce, 0xde) } if !bytes.Equal(lnd.values[1], EmptyCodeHash[:]) { t.Fatalf("invalid balance, got %x, expected %x", lnd.values[1], EmptyCodeHash[:]) } - if !bytes.Equal(lnd.values[2], fourtyKeyTest[:]) { - t.Fatalf("invalid nonce, got %x, expected %x", lnd.values[2], fourtyKeyTest[:]) - } - - if !bytes.Equal(lnd.values[3], EmptyCodeHash[:]) { - t.Fatalf("invalid code hash, got %x, expected %x", lnd.values[3], EmptyCodeHash[:]) - } - - if !bytes.Equal(lnd.values[4], zero32[:]) { - t.Fatalf("invalid code size, got %x, expected %x", lnd.values[4], zero32[:]) - } - if !lnd.c2.Equal(&banderwagon.Identity) { t.Fatalf("invalid c2, got %x, expected %x", lnd.c2, banderwagon.Identity) } @@ -190,3 +181,79 @@ func TestParseNodeSingleSlot(t *testing.T) { t.Fatalf("invalid commitment, got %x, expected %x", lnd.commitment, ln.commitment) } } + +func TestSerializeWithSkipLists(t *testing.T) { + t.Parallel() + + values := make([][]byte, NodeWidth) + values[42] = zero32[:] + values[57] = fourtyKeyTest[:] + leaf, err := NewLeafNode(ffx32KeyTest, values) + if err != nil { + t.Fatal(err) + } + ser, err := leaf.Serialize() + if err != nil { + t.Fatal(err) + } + if len(ser) == 0 { + t.Fatal("empty serialization buffer") + } + if ser[0] != skipListType { + t.Fatalf("invalid serialization type, got %d, expected %d", ser[0], skipListType) + } + if !bytes.Equal(ser[1:32], ffx32KeyTest[:31]) { + t.Fatalf("stem didn't serialize properly, got %x, want %x", ser[1:32], ffx32KeyTest[:31]) + } + expectedSize := nodeTypeSize + StemSize + 3*banderwagon.UncompressedSize + 4 + 2*leafSlotSize + if len(ser) != expectedSize { + t.Fatalf("invalid skiplist serialization: %x (%d bytes != %d)", ser, len(ser), expectedSize) + } + if ser[nodeTypeSize+StemSize+3*banderwagon.UncompressedSize] != 42 { + t.Fatalf("invalid amount of leaves skipped, got %d, want %d", ser[nodeTypeSize+StemSize+3*banderwagon.UncompressedSize], 42) + } + if ser[nodeTypeSize+StemSize+3*banderwagon.UncompressedSize+1] != 1 { + t.Fatalf("invalid amount of leaves skipped, got %d, want %d", ser[nodeTypeSize+StemSize+3*banderwagon.UncompressedSize+1], 42) + } + if ser[nodeTypeSize+StemSize+3*banderwagon.UncompressedSize+2+leafSlotSize] != 14 { + t.Fatalf("invalid amount of leaves skipped, got %d, want %d", ser[nodeTypeSize+StemSize+3*banderwagon.UncompressedSize+2+leafSlotSize], 14) + } + + // add a last value to check that the final gap is properly handled + values[255] = ffx32KeyTest + ser, err = leaf.Serialize() + if err != nil { + t.Fatal(err) + } + expectedSize = nodeTypeSize + StemSize + 3*banderwagon.UncompressedSize + 6 + 3*leafSlotSize + if len(ser) != expectedSize { + t.Fatalf("invalid skiplist serialization: %x (%d bytes != %d)", ser, len(ser), expectedSize) + } + + deser, err := ParseNode(ser, 5) + if err != nil { + t.Fatal(err) + } + vals := deser.(*LeafNode).values + for i, val := range vals { + + switch i { + case 42: + if !bytes.Equal(val, zero32[:]) { + t.Fatalf("invalid deserialized skiplist value at %d: got %x, want %x", i, val, zero32) + } + case 57: + if !bytes.Equal(val, fourtyKeyTest[:]) { + t.Fatalf("invalid deserialized skiplist value at %d: got %x, want %x", i, val, fourtyKeyTest) + } + case 255: + if !bytes.Equal(val, ffx32KeyTest[:]) { + t.Fatalf("invalid deserialized skiplist value at %d: got %x, want %x", i, val, ffx32KeyTest) + } + default: + if val != nil { + t.Fatalf("invalid deserialized skiplist value at %d: got %x, want nil", i, val) + } + } + } +} diff --git a/tree.go b/tree.go index f0788164..b35305ec 100644 --- a/tree.go +++ b/tree.go @@ -170,6 +170,7 @@ const ( leafType byte = 2 eoAccountType byte = 3 singleSlotType byte = 4 + skipListType byte = 8 ) type ( @@ -1775,35 +1776,42 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B bitlist [bitlistSize]byte isEoA = true count, lastIdx int + gapcount int + gaps [32]struct { + Skip byte // How many slots to skip before the next range + Count byte // Size of the next range + } ) for i, v := range n.values { if v != nil { count++ lastIdx = i + gaps[gapcount].Count++ + setBit(bitlist[:], i) children = append(children, v...) if padding := emptyValue[:LeafValueSize-len(v)]; len(padding) != 0 { children = append(children, padding...) } + } else { + if gaps[gapcount].Skip == 255 { + panic("empty leaf node") + } + if i > 0 && n.values[i-1] != nil { + gapcount++ + } + gaps[gapcount].Skip++ } + // Check for an EOA if isEoA { switch i { case 0: - // Version should be 0 - isEoA = v != nil && bytes.Equal(v, zero32[:]) - case 1: - // Balance should not be nil + // Basic data should not be nil isEoA = v != nil - case 2: - // Nonce should have its last 24 bytes set to 0 - isEoA = v != nil && bytes.Equal(v[leafNonceSize:], zero24[:]) - case 3: + case 1: // Code hash should be the empty code hash isEoA = v != nil && bytes.Equal(v, EmptyCodeHash[:]) - case 4: - // Code size must be 0 - isEoA = v != nil && bytes.Equal(v, zero32[:]) default: // All other values must be nil isEoA = v == nil @@ -1830,8 +1838,28 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B copy(result[leafStemOffset:], n.stem[:StemSize]) copy(result[leafStemOffset+StemSize:], c1Bytes[:]) copy(result[leafStemOffset+StemSize+banderwagon.UncompressedSize:], cBytes[:]) - copy(result[leafStemOffset+StemSize+2*banderwagon.UncompressedSize:], n.values[1]) // copy balance - copy(result[leafStemOffset+StemSize+2*banderwagon.UncompressedSize+leafBalanceSize:], n.values[2][:leafNonceSize]) // copy nonce + copy(result[leafStemOffset+StemSize+2*banderwagon.UncompressedSize:], n.values[0]) // copy basic data + case gapcount < 16: + // If there are less than 16 gaps, it's worth using skiplists + result = make([]byte, 1, nodeTypeSize+StemSize+bitlistSize+3*banderwagon.UncompressedSize+len(children)) + result[0] = skipListType + result = append(result, n.stem[:StemSize]...) + result = append(result, cBytes[:]...) + result = append(result, c1Bytes[:]...) + result = append(result, c2Bytes[:]...) + var leafIdx int + for _, gap := range gaps { + if gap.Count == 0 { + break // skip the last gap as nothing follows + } + result = append(result, gap.Skip) + leafIdx += int(gap.Skip) + result = append(result, gap.Count) + for i := 0; i < int(gap.Count); i++ { + result = append(result, n.values[leafIdx]...) + leafIdx++ + } + } default: result = make([]byte, nodeTypeSize+StemSize+bitlistSize+3*banderwagon.UncompressedSize+len(children)) result[0] = leafType From f40bb5a3da4da431927f46c168fd56d6c9032b32 Mon Sep 17 00:00:00 2001 From: Guillaume Ballet <3272758+gballet@users.noreply.github.com> Date: Wed, 11 Sep 2024 18:08:50 +0200 Subject: [PATCH 2/8] fix: copy slice instead of reusing buffer --- go.mod | 2 +- proof_ipa.go | 5 +++-- 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/go.mod b/go.mod index 088ca77e..426a329a 100644 --- a/go.mod +++ b/go.mod @@ -1,6 +1,6 @@ module github.com/ethereum/go-verkle -go 1.19 +go 1.21 require ( github.com/crate-crypto/go-ipa v0.0.0-20240223125850-b1e8a79f509c diff --git a/proof_ipa.go b/proof_ipa.go index 2afcfbda..3aef2c82 100644 --- a/proof_ipa.go +++ b/proof_ipa.go @@ -29,6 +29,7 @@ import ( "bytes" "errors" "fmt" + "slices" "sort" ipa "github.com/crate-crypto/go-ipa" @@ -399,14 +400,14 @@ func DeserializeProof(vp *VerkleProof, statediff StateDiff) (*Proof, error) { k[StemSize] = ins.Suffix keys = append(keys, k[:]) prevalues = append(prevalues, nil) - postvalues = append(postvalues, ins.New[:]) + postvalues = append(postvalues, slices.Clone(ins.New[:])) } for _, rd := range stemdiff.Reads { var k [32]byte copy(k[:StemSize], stemdiff.Stem[:]) k[StemSize] = rd.Suffix keys = append(keys, k[:]) - prevalues = append(prevalues, rd.Current[:]) + prevalues = append(prevalues, slices.Clone(rd.Current[:])) postvalues = append(postvalues, nil) } for _, mi := range stemdiff.Missing { From 3b15f7845f5b3d184027e0779ffe7ed8959d6351 Mon Sep 17 00:00:00 2001 From: Guillaume Ballet <3272758+gballet@users.noreply.github.com> Date: Thu, 12 Sep 2024 11:47:27 +0200 Subject: [PATCH 3/8] some fixes found while replaying --- encoding.go | 2 +- encoding_test.go | 13 +++++++++++++ tree.go | 3 +++ 3 files changed, 17 insertions(+), 1 deletion(-) diff --git a/encoding.go b/encoding.go index 0f64e682..d5b28dcb 100644 --- a/encoding.go +++ b/encoding.go @@ -140,7 +140,7 @@ func parseSkipList(serialized []byte, depth byte) (VerkleNode, error) { var values [NodeWidth][]byte offset := leafStemOffset + StemSize + 3*banderwagon.UncompressedSize // offset in the serialized payload valueIdx := 0 // Index of the value being deserialized - for valueIdx < NodeWidth { + for valueIdx < NodeWidth && offset < len(serialized) { rangecount := serialized[offset+1] gapsize := serialized[offset] valueIdx += int(gapsize) diff --git a/encoding_test.go b/encoding_test.go index 3f6ed4bd..1b773aad 100644 --- a/encoding_test.go +++ b/encoding_test.go @@ -3,6 +3,7 @@ package verkle import ( "bytes" "encoding/binary" + "encoding/hex" "testing" "github.com/crate-crypto/go-ipa/banderwagon" @@ -257,3 +258,15 @@ func TestSerializeWithSkipLists(t *testing.T) { } } } + +// TestParseSkipList covers all issues found while replaying the chain +func TestParseSkipList(t *testing.T) { + serialized, err := hex.DecodeString("085b5fdfedd6a0e932da408ac7d772a36513d1eee9b9926e52620c43a433aad7647a5ec9f2a10159bb602a63e71b35640124f533abd866cfad4c9cd2675acf34201f98dae9b3f4e3b3f3813f9a954e4195d93a50ff52c0aa30b2ef0b07c9cc035d6c07a8ec8b3cd63a5c7b8d698c02717fd12d8fc0bf6fc5d19d050dadaf739d191941c23a791e54873be2c1f3762fda13decd4758917a7bd4e813eba8e28d760000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000100020000000000000000000000000000000000000000000000000000000000000000c5d2460186f7233c927e7db2dcc703c0e500b653ca82273b7bfad8045d85a4703e40406ffec31e8a0a13180b8ef3e6a64eabc5c7dc117821a64faa8a9b2060e89eb6e3a8e684ceba600c8594165403eb24a0749ea7e54d4152ed6902006ebdc03f1d9330bba1a48ea6212977b09864ee55be4b8a75a9ee5f55952eea95fd7bc7ab5eb18b8a87cf4320d6c8c463ce03a9c7743ad677e98cc5f56f531d57e6cd0e53ef950c3958a9a97ad744fb7c2e98bfa415f0b7054fd7d226fcbbe49cb0c12d42be4c07dcaf41f3d6f06c46aead9e3ec8829dee4630bed78fd9b6c274e61829a2de4bf7fb1761f92a729ddcdd1d27b2c97e2e1b914e5906a00adeac9c3b6b8bf17f98fe45640ce21ff0e4a3c53296f85c6269644451bfdf67a52c9e312d7ba49dd04f43e893705e9b90455bf98891ae1bff460d9fc1f53134d41c6344cad10dd383fe54f3e74e31e8f1d859ab53de3f736a47d352a7f28b234433a301f0bf05fec728928d85e79ee9e660cb7fe6b303640ffd22d45933f1f81780fbb18e8828e0231bd5908d303339aea3661482c5345f90ad4a113532adac36f2a645be770f9e20f266a9e76bb01913565f91838d02d5b337529ead171976c78b6403b9b55f9bd181fc82186665f5756d3b9e101b4ea9e4c08ce4ff79d69ec2c849bfd0a42d03fc223f33fc43fa0db89c404f60b9b6316b61ac57807d2cb773b7ade5e8789a7797c8636a27195e4a838b482094cac9ee0a52a1a18a883072ee0f92de08e7581095840c35509a33ae2e847fed729974533dd1d22a929e180ebef69d598421368572936811b8cc0828b3fbcef40e7b99720526823a297b22b0c25c038237e0bd5f54668677e6ad909f562373e3a269c926718f4b9b5f8de9266420f7f3ca0bb51925c09fb01574cc7f032f12528ee6a9ee0325d72d08aa6240d289bcfa100f3bf79a5edeaa6fb5ac6ded0f3b3f86ccde4c297309e029c54372a74424539b907173692e1bdfca37a90cf1a1d2f96e2a6d3edbfd978520d29284e5130e4dddb4146907167fabd1bfe00622ac2c0698b990c184a402b30c7ab85e3ba8b284dfb9314b6cda37808f000dcfcce110d6bb28cf7672894ef5775d9c5a5cd7f4d1403b74481c5a4c4fe573d5eac0d12ec953b4706a77791d55d0dea3f642f3d3ad36adb0bda2714d9e3f993a61f75e8cea53f589ed349175097dabca20e944944dae7869d592b6b787b05bd46a3891a6129f8e70bfc7ac5757fe5833e2619e829f3ece2cc1057faa2daee516878adc9a46f7ce81d66d22e427a984480f63fe3ca6898a9a075de8ba39dd63aa8cba28cf47dbc27787d07c541eb2fb681fb500b01ccd5dd7a20ff2a629c9ceba5fdb23b1df64ef5b7133367d66dd01d868d500e38fbe56c2831cb36e70fbcad3f304a2fa563f4aaa7e302dc6a074ad3c6fd6d32308ed5a4b3fab189e26fca6bb169f690e2ab217f74a994b53fee24a6fd58eb040a9b11f1abcba3dd1d7f2c41f17dcf38ee033a3e157dbd3028c4fed9d26764eebaca90475c6c58d0ada387e1f8cdf25bccb770d50df3648245460117db188a40886d19df697e257cf708219dd1d3c39a696d01df594102f3cf4920d8af965f3f0f63d73b5e447f94fec97f1d8ca3c06e5084b61c67fe2a47cc9a632615a4d4701e26cab319a8a1cf559e57f250d0c2aecf85bd14827e9ef205fe3b02b55cce3ec02f7154411e475c7a6d9c5ec01553e4c4521b1f047b900a20780c85a237bd78dafe02b173af8c9f381add39abc410d0ab37bf9f5d0bd2e8eaf4d9ee7473a7479ea0d3220974257e731ac12604f7baf868d6b53596567d2b1be635bf877a5002abeea50cf85de8c3ab6a23d052c8f31dbb033d4e1ef34a11f8ca432b116e6c80e91000269522b93a24625c2af00b6cf0456063195c0e3c0f315cd2a1270d5fc64c0216344f365c6a683949716c68222ba838875a5416d6ff16ade3b7ea89fe52f8e3a4151be03a79f8afa08df75f17461854826d47f44bd96729dabf64a801abd0436fd138305dc5567c2faa8310aa92532bf41d415cb36a0c1853ff3b6d6375f3ad8133b016d4ac298b99716a10beeba0fa89af5ffbcb6e10a52d4f10af81f21ae0b7de926d6aa2d1a1810aff426bd912d2084864f71dbc859d670d02eb235905f0551988a22d851268b391bb4e7f57a655fde10238135fae197ff7a65152931fbd73a6163e4f8ae7732cd777484a8eb5fa2b580f9683c4f4563ef0719ebb4fb53b5a9bf3112d35a5877f6bcd6eac543686d606b5431eeb413c9f8a01fb5b7f3a9eac53f1233c2f1b1536486c450c14ac97bc08ce190fcc84538ed51647b1e6700809ed2a31cfe7f6507417b42d1187f073050a771683144331da40bdd5dc1d5c7739a3d5476d4e2d766a7a93bdc1155bfcbe794d0c6fa7bf77993cf8eb82a7efbde68a09d8ffa8813e5f2142bd62b70d8f4e9ac3a69b7cd02a8bad4331bbc9c98177e49b198293bba6ce1477a3b2482a537f94196f4b9cbb038dca5b33192ecdeea3c3885548b3ea4fc8329b4f49b47d55cc70090e34038ba69e8ce9e3bfee4e5719f3b15f2ca26b668c5403e9d6341158227545986f7dacabadcf16b5dbcad6ee862054bdf3d404ef9538541c94849fd959ead548be2b805038e0bc43fdb33942e5bff590140e91a19ee1601f4e4464f71726ecf98167fdda3b61a1e233f2afdec63b3ddb97e7966c34305bb99e21dbdbd0c16a026a4d55611afa59d3cba784aa480e1a028797dd655924e9545978c00272fa81a9b86d5241146beafc6bd40eac2661abb99b0265046bfbe909fd961da57f9bd8e88814482d5a6095ce9a01cb085e24b504d3a9706667e20acd37225178a348d53f1736636363448d4e9d685e11d650499c368f821c3ce0ea2d0621918301f9d40afd44fba31bac401a89462fc889c6b5b34") + if err != nil { + panic(err) + } + if len(serialized) != 2340 { + t.Fatalf("invalid range %d", len(serialized)) + } + parseSkipList(serialized, 5) +} diff --git a/tree.go b/tree.go index b35305ec..89f613d0 100644 --- a/tree.go +++ b/tree.go @@ -1856,6 +1856,9 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B leafIdx += int(gap.Skip) result = append(result, gap.Count) for i := 0; i < int(gap.Count); i++ { + if len(n.values[leafIdx]) != 32 { + panic(fmt.Sprintf("%x", n.values[leafIdx])) + } result = append(result, n.values[leafIdx]...) leafIdx++ } From fe8246c9adb042aa6633dc77ce582954fb5e6ff3 Mon Sep 17 00:00:00 2001 From: Guillaume Ballet <3272758+gballet@users.noreply.github.com> Date: Thu, 12 Sep 2024 19:23:48 +0200 Subject: [PATCH 4/8] fix: support full leaves --- encoding.go | 38 +++++++++++++++++++++++++------------- tree.go | 6 +++--- 2 files changed, 28 insertions(+), 16 deletions(-) diff --git a/encoding.go b/encoding.go index d5b28dcb..6d83d0cc 100644 --- a/encoding.go +++ b/encoding.go @@ -56,6 +56,9 @@ const ( leafC1CommitmentOffset = leafCommitmentOffset + banderwagon.UncompressedSize leafC2CommitmentOffset = leafC1CommitmentOffset + banderwagon.UncompressedSize leafChildrenOffset = leafC2CommitmentOffset + banderwagon.UncompressedSize + leafSkipListCOffset = nodeTypeSize + StemSize + leafSkipListC1Offset = leafSkipListCOffset + banderwagon.UncompressedSize + leafSkipListC2Offset = leafSkipListC1Offset + banderwagon.UncompressedSize leafBasicDataSize = 32 leafSlotSize = 32 leafValueIndexSize = 1 @@ -140,15 +143,24 @@ func parseSkipList(serialized []byte, depth byte) (VerkleNode, error) { var values [NodeWidth][]byte offset := leafStemOffset + StemSize + 3*banderwagon.UncompressedSize // offset in the serialized payload valueIdx := 0 // Index of the value being deserialized - for valueIdx < NodeWidth && offset < len(serialized) { - rangecount := serialized[offset+1] - gapsize := serialized[offset] - valueIdx += int(gapsize) - offset += 2 - for i := 0; i < int(rangecount); i++ { - values[valueIdx] = serialized[offset : offset+leafSlotSize] + + // shortcut: the leaf is full and so both values are 0. + if serialized[offset] == 0 && serialized[offset+1] == 0 { + for i := 0; i < 256; i++ { + values[i] = serialized[offset : offset+leafSlotSize] offset += leafSlotSize - valueIdx++ + } + } else { + for valueIdx < NodeWidth && offset < len(serialized) { + rangecount := serialized[offset+1] + gapsize := serialized[offset] + valueIdx += int(gapsize) + offset += 2 + for i := 0; i < int(rangecount); i++ { + values[valueIdx] = serialized[offset : offset+leafSlotSize] + offset += leafSlotSize + valueIdx++ + } } } ln := NewLeafNodeWithNoComms(serialized[leafStemOffset:leafStemOffset+StemSize], values[:]) @@ -156,19 +168,19 @@ func parseSkipList(serialized []byte, depth byte) (VerkleNode, error) { ln.c1 = new(Point) // Sanity check that we have at least 3*banderwagon.UncompressedSize bytes left in the serialized payload. - if len(serialized[leafCommitmentOffset:]) < 3*banderwagon.UncompressedSize { - return nil, fmt.Errorf("leaf node commitments are not the correct size, expected at least %d, got %d", 3*banderwagon.UncompressedSize, len(serialized[leafC1CommitmentOffset:])) + if len(serialized[leafSkipListCOffset:]) < 3*banderwagon.UncompressedSize { + return nil, fmt.Errorf("leaf node commitments are not the correct size, expected at least %d, got %d", 3*banderwagon.UncompressedSize, len(serialized[leafSkipListCOffset:])) } - if err := ln.c1.SetBytesUncompressed(serialized[leafC1CommitmentOffset:leafC1CommitmentOffset+banderwagon.UncompressedSize], true); err != nil { + if err := ln.c1.SetBytesUncompressed(serialized[leafC1CommitmentOffset:leafSkipListC2Offset], true); err != nil { return nil, fmt.Errorf("setting c1 commitment: %w", err) } ln.c2 = new(Point) - if err := ln.c2.SetBytesUncompressed(serialized[leafC2CommitmentOffset:leafC2CommitmentOffset+banderwagon.UncompressedSize], true); err != nil { + if err := ln.c2.SetBytesUncompressed(serialized[leafSkipListC2Offset:leafSkipListC2Offset+banderwagon.UncompressedSize], true); err != nil { return nil, fmt.Errorf("setting c2 commitment: %w", err) } ln.commitment = new(Point) - if err := ln.commitment.SetBytesUncompressed(serialized[leafCommitmentOffset:leafC1CommitmentOffset], true); err != nil { + if err := ln.commitment.SetBytesUncompressed(serialized[leafSkipListCOffset:leafSkipListC1Offset], true); err != nil { return nil, fmt.Errorf("setting commitment: %w", err) } return ln, nil diff --git a/tree.go b/tree.go index 89f613d0..af160a4c 100644 --- a/tree.go +++ b/tree.go @@ -1779,7 +1779,7 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B gapcount int gaps [32]struct { Skip byte // How many slots to skip before the next range - Count byte // Size of the next range + Count int // Size of the next range } ) for i, v := range n.values { @@ -1854,8 +1854,8 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B } result = append(result, gap.Skip) leafIdx += int(gap.Skip) - result = append(result, gap.Count) - for i := 0; i < int(gap.Count); i++ { + result = append(result, byte(gap.Count)) + for i := 0; i < gap.Count; i++ { if len(n.values[leafIdx]) != 32 { panic(fmt.Sprintf("%x", n.values[leafIdx])) } From ee9413f5dce6a3148e24062ef1ca44c7d1bc13a9 Mon Sep 17 00:00:00 2001 From: Guillaume Ballet <3272758+gballet@users.noreply.github.com> Date: Thu, 12 Sep 2024 20:45:52 +0200 Subject: [PATCH 5/8] improve Count comment --- tree.go | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tree.go b/tree.go index af160a4c..a25b0f01 100644 --- a/tree.go +++ b/tree.go @@ -1779,7 +1779,7 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B gapcount int gaps [32]struct { Skip byte // How many slots to skip before the next range - Count int // Size of the next range + Count int // Size of the next range. `int` because a full leaf has 256 entries } ) for i, v := range n.values { From 4deabaa892f8ae660d10e047ef37265117c2a396 Mon Sep 17 00:00:00 2001 From: Guillaume Ballet <3272758+gballet@users.noreply.github.com> Date: Fri, 13 Sep 2024 13:51:11 +0200 Subject: [PATCH 6/8] replay fixes Signed-off-by: Guillaume Ballet <3272758+gballet@users.noreply.github.com> --- encoding.go | 2 +- tree.go | 16 ++++++++++++---- 2 files changed, 13 insertions(+), 5 deletions(-) diff --git a/encoding.go b/encoding.go index 6d83d0cc..13dc864f 100644 --- a/encoding.go +++ b/encoding.go @@ -172,7 +172,7 @@ func parseSkipList(serialized []byte, depth byte) (VerkleNode, error) { return nil, fmt.Errorf("leaf node commitments are not the correct size, expected at least %d, got %d", 3*banderwagon.UncompressedSize, len(serialized[leafSkipListCOffset:])) } - if err := ln.c1.SetBytesUncompressed(serialized[leafC1CommitmentOffset:leafSkipListC2Offset], true); err != nil { + if err := ln.c1.SetBytesUncompressed(serialized[leafSkipListC1Offset:leafSkipListC2Offset], true); err != nil { return nil, fmt.Errorf("setting c1 commitment: %w", err) } ln.c2 = new(Point) diff --git a/tree.go b/tree.go index a25b0f01..cb1295c2 100644 --- a/tree.go +++ b/tree.go @@ -1766,6 +1766,10 @@ var ( EmptyCodeHash, _ = hex.DecodeString("c5d2460186f7233c927e7db2dcc703c0e500b653ca82273b7bfad8045d85a470") ) +// skipListMaxGapCount is the maximum allowed number of +// gaps before one has to fall back to the bitmap. +const skipListMaxGapCount = 16 + func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2Bytes [banderwagon.UncompressedSize]byte) []byte { // Empty value in LeafNode used for padding. var emptyValue [LeafValueSize]byte @@ -1777,7 +1781,7 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B isEoA = true count, lastIdx int gapcount int - gaps [32]struct { + gaps [skipListMaxGapCount]struct { Skip byte // How many slots to skip before the next range Count int // Size of the next range. `int` because a full leaf has 256 entries } @@ -1786,14 +1790,18 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B if v != nil { count++ lastIdx = i - gaps[gapcount].Count++ + if gapcount < skipListMaxGapCount { + gaps[gapcount].Count++ + } setBit(bitlist[:], i) children = append(children, v...) if padding := emptyValue[:LeafValueSize-len(v)]; len(padding) != 0 { children = append(children, padding...) } - } else { + } else if gapcount < skipListMaxGapCount { + // If we reach the 256th empty leaf in the node, this means + // that the whole node is empty, which should not happen. if gaps[gapcount].Skip == 255 { panic("empty leaf node") } @@ -1839,7 +1847,7 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B copy(result[leafStemOffset+StemSize:], c1Bytes[:]) copy(result[leafStemOffset+StemSize+banderwagon.UncompressedSize:], cBytes[:]) copy(result[leafStemOffset+StemSize+2*banderwagon.UncompressedSize:], n.values[0]) // copy basic data - case gapcount < 16: + case gapcount < skipListMaxGapCount: // If there are less than 16 gaps, it's worth using skiplists result = make([]byte, 1, nodeTypeSize+StemSize+bitlistSize+3*banderwagon.UncompressedSize+len(children)) result[0] = skipListType From a41ce0842c997ac3796efdc0fc392b2cc6ed5cf9 Mon Sep 17 00:00:00 2001 From: Guillaume Ballet <3272758+gballet@users.noreply.github.com> Date: Fri, 13 Sep 2024 14:26:42 +0200 Subject: [PATCH 7/8] more replay fixes Signed-off-by: Guillaume Ballet <3272758+gballet@users.noreply.github.com> --- tree.go | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/tree.go b/tree.go index cb1295c2..921508cf 100644 --- a/tree.go +++ b/tree.go @@ -1805,10 +1805,14 @@ func (n *LeafNode) serializeLeafWithUncompressedCommitments(cBytes, c1Bytes, c2B if gaps[gapcount].Skip == 255 { panic("empty leaf node") } + // If the previous value wasn't nil, a new + // gap is starting. if i > 0 && n.values[i-1] != nil { gapcount++ } - gaps[gapcount].Skip++ + if gapcount < skipListMaxGapCount { + gaps[gapcount].Skip++ + } } // Check for an EOA From 12343ee9aba2166f43472b678ce0494d8db552e8 Mon Sep 17 00:00:00 2001 From: Guillaume Ballet <3272758+gballet@users.noreply.github.com> Date: Mon, 16 Sep 2024 22:47:44 +0200 Subject: [PATCH 8/8] fix: +2 offset in no-gap encoding Signed-off-by: Guillaume Ballet <3272758+gballet@users.noreply.github.com> --- encoding.go | 1 + 1 file changed, 1 insertion(+) diff --git a/encoding.go b/encoding.go index 13dc864f..25f7151d 100644 --- a/encoding.go +++ b/encoding.go @@ -146,6 +146,7 @@ func parseSkipList(serialized []byte, depth byte) (VerkleNode, error) { // shortcut: the leaf is full and so both values are 0. if serialized[offset] == 0 && serialized[offset+1] == 0 { + offset += 2 // skip single header for i := 0; i < 256; i++ { values[i] = serialized[offset : offset+leafSlotSize] offset += leafSlotSize