Skip to content

Commit 4dfec7e

Browse files
authored
trie: optimize memory allocation (#30932)
This pull request removes the node copy operation to reduce memory allocation. Key Changes as below: **(a) Use `decodeNodeUnsafe` for decoding nodes retrieved from the trie node reader** In the current implementation of the MPT, once a trie node blob is retrieved, it is passed to `decodeNode` for decoding. However, `decodeNode` assumes the supplied byte slice might be mutated later, so it performs a deep copy internally before parsing the node. Given that the node reader is implemented by the path database and the hash database, both of which guarantee the immutability of the returned byte slice. By restricting the node reader interface to explicitly guarantee that the returned byte slice will not be modified, we can safely replace `decodeNode` with `decodeNodeUnsafe`. This eliminates the need for a redundant byte copy during each node resolution. **(b) Modify the trie in place** In the current implementation of the MPT, a copy of a trie node is created before any modifications are made. These modifications include: - Node resolution: Converting the value from a hash to the actual node. - Node hashing: Tagging the hash into its cache. - Node commit: Replacing the children with its hash. - Structural changes: For example, adding a new child to a fullNode or replacing a child of a shortNode. This mechanism ensures that modifications only affect the live tree, leaving all previously created copies unaffected. Unfortunately, this property leads to a huge memory allocation requirement. For example, if we want to modify the fullNode for n times, the node will be copied for n times. In this pull request, all the trie modifications are made in place. In order to make sure all previously created copies are unaffected, the `Copy` function now will deep-copy all the live nodes rather than the root node itself. With this change, while the `Copy` function becomes more expensive, it's totally acceptable as it's not a frequently used one. For the normal trie operations (Get, GetNode, Hash, Commit, Insert, Delete), the node copy is not required anymore.
1 parent 4ff5093 commit 4dfec7e

File tree

6 files changed

+279
-96
lines changed

6 files changed

+279
-96
lines changed

trie/committer.go

+13-26
Original file line numberDiff line numberDiff line change
@@ -57,32 +57,26 @@ func (c *committer) commit(path []byte, n node, parallel bool) node {
5757
// Commit children, then parent, and remove the dirty flag.
5858
switch cn := n.(type) {
5959
case *shortNode:
60-
// Commit child
61-
collapsed := cn.copy()
62-
6360
// If the child is fullNode, recursively commit,
6461
// otherwise it can only be hashNode or valueNode.
6562
if _, ok := cn.Val.(*fullNode); ok {
66-
collapsed.Val = c.commit(append(path, cn.Key...), cn.Val, false)
63+
cn.Val = c.commit(append(path, cn.Key...), cn.Val, false)
6764
}
6865
// The key needs to be copied, since we're adding it to the
6966
// modified nodeset.
70-
collapsed.Key = hexToCompact(cn.Key)
71-
hashedNode := c.store(path, collapsed)
67+
cn.Key = hexToCompact(cn.Key)
68+
hashedNode := c.store(path, cn)
7269
if hn, ok := hashedNode.(hashNode); ok {
7370
return hn
7471
}
75-
return collapsed
72+
return cn
7673
case *fullNode:
77-
hashedKids := c.commitChildren(path, cn, parallel)
78-
collapsed := cn.copy()
79-
collapsed.Children = hashedKids
80-
81-
hashedNode := c.store(path, collapsed)
74+
c.commitChildren(path, cn, parallel)
75+
hashedNode := c.store(path, cn)
8276
if hn, ok := hashedNode.(hashNode); ok {
8377
return hn
8478
}
85-
return collapsed
79+
return cn
8680
case hashNode:
8781
return cn
8882
default:
@@ -92,11 +86,10 @@ func (c *committer) commit(path []byte, n node, parallel bool) node {
9286
}
9387

9488
// commitChildren commits the children of the given fullnode
95-
func (c *committer) commitChildren(path []byte, n *fullNode, parallel bool) [17]node {
89+
func (c *committer) commitChildren(path []byte, n *fullNode, parallel bool) {
9690
var (
97-
wg sync.WaitGroup
98-
nodesMu sync.Mutex
99-
children [17]node
91+
wg sync.WaitGroup
92+
nodesMu sync.Mutex
10093
)
10194
for i := 0; i < 16; i++ {
10295
child := n.Children[i]
@@ -106,22 +99,21 @@ func (c *committer) commitChildren(path []byte, n *fullNode, parallel bool) [17]
10699
// If it's the hashed child, save the hash value directly.
107100
// Note: it's impossible that the child in range [0, 15]
108101
// is a valueNode.
109-
if hn, ok := child.(hashNode); ok {
110-
children[i] = hn
102+
if _, ok := child.(hashNode); ok {
111103
continue
112104
}
113105
// Commit the child recursively and store the "hashed" value.
114106
// Note the returned node can be some embedded nodes, so it's
115107
// possible the type is not hashNode.
116108
if !parallel {
117-
children[i] = c.commit(append(path, byte(i)), child, false)
109+
n.Children[i] = c.commit(append(path, byte(i)), child, false)
118110
} else {
119111
wg.Add(1)
120112
go func(index int) {
121113
p := append(path, byte(index))
122114
childSet := trienode.NewNodeSet(c.nodes.Owner)
123115
childCommitter := newCommitter(childSet, c.tracer, c.collectLeaf)
124-
children[index] = childCommitter.commit(p, child, false)
116+
n.Children[index] = childCommitter.commit(p, child, false)
125117
nodesMu.Lock()
126118
c.nodes.MergeSet(childSet)
127119
nodesMu.Unlock()
@@ -132,11 +124,6 @@ func (c *committer) commitChildren(path []byte, n *fullNode, parallel bool) [17]
132124
if parallel {
133125
wg.Wait()
134126
}
135-
// For the 17th child, it's possible the type is valuenode.
136-
if n.Children[16] != nil {
137-
children[16] = n.Children[16]
138-
}
139-
return children
140127
}
141128

142129
// store hashes the node n and adds it to the modified nodeset. If leaf collection

trie/hasher.go

+40-44
Original file line numberDiff line numberDiff line change
@@ -53,72 +53,66 @@ func returnHasherToPool(h *hasher) {
5353
hasherPool.Put(h)
5454
}
5555

56-
// hash collapses a node down into a hash node, also returning a copy of the
57-
// original node initialized with the computed hash to replace the original one.
58-
func (h *hasher) hash(n node, force bool) (hashed node, cached node) {
56+
// hash collapses a node down into a hash node.
57+
func (h *hasher) hash(n node, force bool) node {
5958
// Return the cached hash if it's available
6059
if hash, _ := n.cache(); hash != nil {
61-
return hash, n
60+
return hash
6261
}
6362
// Trie not processed yet, walk the children
6463
switch n := n.(type) {
6564
case *shortNode:
66-
collapsed, cached := h.hashShortNodeChildren(n)
65+
collapsed := h.hashShortNodeChildren(n)
6766
hashed := h.shortnodeToHash(collapsed, force)
68-
// We need to retain the possibly _not_ hashed node, in case it was too
69-
// small to be hashed
7067
if hn, ok := hashed.(hashNode); ok {
71-
cached.flags.hash = hn
68+
n.flags.hash = hn
7269
} else {
73-
cached.flags.hash = nil
70+
n.flags.hash = nil
7471
}
75-
return hashed, cached
72+
return hashed
7673
case *fullNode:
77-
collapsed, cached := h.hashFullNodeChildren(n)
78-
hashed = h.fullnodeToHash(collapsed, force)
74+
collapsed := h.hashFullNodeChildren(n)
75+
hashed := h.fullnodeToHash(collapsed, force)
7976
if hn, ok := hashed.(hashNode); ok {
80-
cached.flags.hash = hn
77+
n.flags.hash = hn
8178
} else {
82-
cached.flags.hash = nil
79+
n.flags.hash = nil
8380
}
84-
return hashed, cached
81+
return hashed
8582
default:
8683
// Value and hash nodes don't have children, so they're left as were
87-
return n, n
84+
return n
8885
}
8986
}
9087

91-
// hashShortNodeChildren collapses the short node. The returned collapsed node
92-
// holds a live reference to the Key, and must not be modified.
93-
func (h *hasher) hashShortNodeChildren(n *shortNode) (collapsed, cached *shortNode) {
94-
// Hash the short node's child, caching the newly hashed subtree
95-
collapsed, cached = n.copy(), n.copy()
96-
// Previously, we did copy this one. We don't seem to need to actually
97-
// do that, since we don't overwrite/reuse keys
98-
// cached.Key = common.CopyBytes(n.Key)
88+
// hashShortNodeChildren returns a copy of the supplied shortNode, with its child
89+
// being replaced by either the hash or an embedded node if the child is small.
90+
func (h *hasher) hashShortNodeChildren(n *shortNode) *shortNode {
91+
var collapsed shortNode
9992
collapsed.Key = hexToCompact(n.Key)
100-
// Unless the child is a valuenode or hashnode, hash it
10193
switch n.Val.(type) {
10294
case *fullNode, *shortNode:
103-
collapsed.Val, cached.Val = h.hash(n.Val, false)
95+
collapsed.Val = h.hash(n.Val, false)
96+
default:
97+
collapsed.Val = n.Val
10498
}
105-
return collapsed, cached
99+
return &collapsed
106100
}
107101

108-
func (h *hasher) hashFullNodeChildren(n *fullNode) (collapsed *fullNode, cached *fullNode) {
109-
// Hash the full node's children, caching the newly hashed subtrees
110-
cached = n.copy()
111-
collapsed = n.copy()
102+
// hashFullNodeChildren returns a copy of the supplied fullNode, with its child
103+
// being replaced by either the hash or an embedded node if the child is small.
104+
func (h *hasher) hashFullNodeChildren(n *fullNode) *fullNode {
105+
var children [17]node
112106
if h.parallel {
113107
var wg sync.WaitGroup
114108
wg.Add(16)
115109
for i := 0; i < 16; i++ {
116110
go func(i int) {
117111
hasher := newHasher(false)
118112
if child := n.Children[i]; child != nil {
119-
collapsed.Children[i], cached.Children[i] = hasher.hash(child, false)
113+
children[i] = hasher.hash(child, false)
120114
} else {
121-
collapsed.Children[i] = nilValueNode
115+
children[i] = nilValueNode
122116
}
123117
returnHasherToPool(hasher)
124118
wg.Done()
@@ -128,19 +122,21 @@ func (h *hasher) hashFullNodeChildren(n *fullNode) (collapsed *fullNode, cached
128122
} else {
129123
for i := 0; i < 16; i++ {
130124
if child := n.Children[i]; child != nil {
131-
collapsed.Children[i], cached.Children[i] = h.hash(child, false)
125+
children[i] = h.hash(child, false)
132126
} else {
133-
collapsed.Children[i] = nilValueNode
127+
children[i] = nilValueNode
134128
}
135129
}
136130
}
137-
return collapsed, cached
131+
if n.Children[16] != nil {
132+
children[16] = n.Children[16]
133+
}
134+
return &fullNode{flags: nodeFlag{}, Children: children}
138135
}
139136

140-
// shortnodeToHash creates a hashNode from a shortNode. The supplied shortnode
141-
// should have hex-type Key, which will be converted (without modification)
142-
// into compact form for RLP encoding.
143-
// If the rlp data is smaller than 32 bytes, `nil` is returned.
137+
// shortNodeToHash computes the hash of the given shortNode. The shortNode must
138+
// first be collapsed, with its key converted to compact form. If the RLP-encoded
139+
// node data is smaller than 32 bytes, the node itself is returned.
144140
func (h *hasher) shortnodeToHash(n *shortNode, force bool) node {
145141
n.encode(h.encbuf)
146142
enc := h.encodedBytes()
@@ -151,8 +147,8 @@ func (h *hasher) shortnodeToHash(n *shortNode, force bool) node {
151147
return h.hashData(enc)
152148
}
153149

154-
// fullnodeToHash is used to create a hashNode from a fullNode, (which
155-
// may contain nil values)
150+
// fullnodeToHash computes the hash of the given fullNode. If the RLP-encoded
151+
// node data is smaller than 32 bytes, the node itself is returned.
156152
func (h *hasher) fullnodeToHash(n *fullNode, force bool) node {
157153
n.encode(h.encbuf)
158154
enc := h.encodedBytes()
@@ -203,10 +199,10 @@ func (h *hasher) hashDataTo(dst, data []byte) {
203199
func (h *hasher) proofHash(original node) (collapsed, hashed node) {
204200
switch n := original.(type) {
205201
case *shortNode:
206-
sn, _ := h.hashShortNodeChildren(n)
202+
sn := h.hashShortNodeChildren(n)
207203
return sn, h.shortnodeToHash(sn, false)
208204
case *fullNode:
209-
fn, _ := h.hashFullNodeChildren(n)
205+
fn := h.hashFullNodeChildren(n)
210206
return fn, h.fullnodeToHash(fn, false)
211207
default:
212208
// Value and hash nodes don't have children, so they're left as were

trie/node.go

+10-4
Original file line numberDiff line numberDiff line change
@@ -79,15 +79,19 @@ func (n *fullNode) EncodeRLP(w io.Writer) error {
7979
return eb.Flush()
8080
}
8181

82-
func (n *fullNode) copy() *fullNode { copy := *n; return &copy }
83-
func (n *shortNode) copy() *shortNode { copy := *n; return &copy }
84-
8582
// nodeFlag contains caching-related metadata about a node.
8683
type nodeFlag struct {
8784
hash hashNode // cached hash of the node (may be nil)
8885
dirty bool // whether the node has changes that must be written to the database
8986
}
9087

88+
func (n nodeFlag) copy() nodeFlag {
89+
return nodeFlag{
90+
hash: common.CopyBytes(n.hash),
91+
dirty: n.dirty,
92+
}
93+
}
94+
9195
func (n *fullNode) cache() (hashNode, bool) { return n.flags.hash, n.flags.dirty }
9296
func (n *shortNode) cache() (hashNode, bool) { return n.flags.hash, n.flags.dirty }
9397
func (n hashNode) cache() (hashNode, bool) { return nil, true }
@@ -228,7 +232,9 @@ func decodeRef(buf []byte) (node, []byte, error) {
228232
err := fmt.Errorf("oversized embedded node (size is %d bytes, want size < %d)", size, hashLen)
229233
return nil, buf, err
230234
}
231-
n, err := decodeNode(nil, buf)
235+
// The buffer content has already been copied or is safe to use;
236+
// no additional copy is required.
237+
n, err := decodeNodeUnsafe(nil, buf)
232238
return n, rest, err
233239
case kind == rlp.String && len(val) == 0:
234240
// empty node

0 commit comments

Comments
 (0)