From ef1bab0802d764b87f7b7dd51b0d34c1721c0905 Mon Sep 17 00:00:00 2001
From: Jacek Sieka <jacek@status.im>
Date: Mon, 2 Sep 2024 16:03:10 +0200
Subject: [PATCH] avoid some trivial memory allocations (#2587)

* pre-allocate `blobify` data and remove redundant error handling
(cannot fail on correct data)
* use threadvar for temporary storage when decoding rdb, avoiding
closure env
* speed up database walkers by avoiding many temporaries

~5% perf improvement on block import, 100x on database iteration (useful
for building analysis tooling)
---
 nimbus/db/aristo/aristo_blobify.nim           | 50 ++++++++++---------
 nimbus/db/aristo/aristo_compute.nim           |  4 +-
 nimbus/db/aristo/aristo_desc/desc_nibbles.nim | 31 +++++++-----
 nimbus/db/aristo/aristo_init/memory_db.nim    |  9 +---
 nimbus/db/aristo/aristo_init/rocks_db.nim     |  6 +--
 .../aristo/aristo_init/rocks_db/rdb_get.nim   | 20 ++++----
 .../aristo/aristo_init/rocks_db/rdb_put.nim   |  7 +--
 .../aristo/aristo_init/rocks_db/rdb_walk.nim  | 36 ++++++++++---
 nimbus/db/aristo/aristo_serialise.nim         |  8 +--
 tests/test_aristo/test_blobify.nim            | 10 ++--
 tests/test_aristo/test_portal_proof.nim       |  2 +-
 vendor/nim-stew                               |  2 +-
 12 files changed, 100 insertions(+), 85 deletions(-)

diff --git a/nimbus/db/aristo/aristo_blobify.nim b/nimbus/db/aristo/aristo_blobify.nim
index 493a11497..7245a6ceb 100644
--- a/nimbus/db/aristo/aristo_blobify.nim
+++ b/nimbus/db/aristo/aristo_blobify.nim
@@ -203,12 +203,12 @@ proc blobifyTo*(vtx: VertexRef; data: var Blob): Result[void,AristoError] =
         if vtx.ePfx.len > 0:
           vtx.ePfx.toHexPrefix(isleaf = false)
         else:
-          @[]
+          default(HexPrefixBuf)
       psLen = pSegm.len.byte
     if 33 < psLen:
       return err(BlobifyExtPathOverflow)
 
-    data &= pSegm
+    data &= pSegm.data()
     data &= lens.toBytesBE
     data &= [0x80u8 or psLen]
 
@@ -219,16 +219,16 @@ proc blobifyTo*(vtx: VertexRef; data: var Blob): Result[void,AristoError] =
     if psLen == 0 or 33 < psLen:
       return err(BlobifyLeafPathOverflow)
     vtx.lData.blobifyTo(data)
-    data &= pSegm
+    data &= pSegm.data()
     data &= [0xC0u8 or psLen]
 
   ok()
 
-proc blobify*(vtx: VertexRef): Result[Blob, AristoError] =
+proc blobify*(vtx: VertexRef): Blob =
   ## Variant of `blobify()`
-  var data: Blob
-  ? vtx.blobifyTo data
-  ok(move(data))
+  result = newSeqOfCap[byte](128)
+  if vtx.blobifyTo(result).isErr:
+    result.setLen(0) # blobify only fails on invalid verticies
 
 proc blobifyTo*(lSst: SavedState; data: var Blob): Result[void,AristoError] =
   ## Serialise a last saved state record
@@ -246,45 +246,48 @@ proc blobify*(lSst: SavedState): Result[Blob,AristoError] =
 # -------------
 proc deblobify(
     data: openArray[byte];
-    T: type LeafPayload;
-      ): Result[LeafPayload,AristoError] =
+    pyl: var LeafPayload;
+      ): Result[void,AristoError] =
   if data.len == 0:
-    return ok LeafPayload(pType: RawData)
+    pyl = LeafPayload(pType: RawData)
+    return ok()
 
   let mask = data[^1]
   if (mask and 0x10) > 0: # unstructured payload
-    return ok LeafPayload(pType: RawData, rawBlob: data[0 .. ^2])
+    pyl = LeafPayload(pType: RawData, rawBlob: data[0 .. ^2])
+    return ok()
 
   if (mask and 0x20) > 0: # Slot storage data
-    return ok LeafPayload(
+    pyl = LeafPayload(
       pType: StoData,
       stoData: ?deblobify(data.toOpenArray(0, data.len - 2), UInt256))
+    return ok()
 
+  pyl = LeafPayload(pType: AccountData)
   var
-    pAcc = LeafPayload(pType: AccountData)
     start = 0
     lens = uint16.fromBytesBE(data.toOpenArray(data.len - 3, data.len - 2))
 
   if (mask and 0x01) > 0:
     let len = lens and 0b111
-    pAcc.account.nonce = ? load64(data, start, int(len + 1))
+    pyl.account.nonce = ? load64(data, start, int(len + 1))
 
   if (mask and 0x02) > 0:
     let len = (lens shr 3) and 0b11111
-    pAcc.account.balance = ? load256(data, start, int(len + 1))
+    pyl.account.balance = ? load256(data, start, int(len + 1))
 
   if (mask and 0x04) > 0:
     let len = (lens shr 8) and 0b111
-    pAcc.stoID = (true, VertexID(? load64(data, start, int(len + 1))))
+    pyl.stoID = (true, VertexID(? load64(data, start, int(len + 1))))
 
   if (mask and 0x08) > 0:
     if data.len() < start + 32:
       return err(DeblobCodeLenUnsupported)
-    discard pAcc.account.codeHash.data.copyFrom(data.toOpenArray(start, start + 31))
+    discard pyl.account.codeHash.data.copyFrom(data.toOpenArray(start, start + 31))
   else:
-    pAcc.account.codeHash = EMPTY_CODE_HASH
+    pyl.account.codeHash = EMPTY_CODE_HASH
 
-  ok(pAcc)
+  ok()
 
 proc deblobify*(
     record: openArray[byte];
@@ -336,11 +339,12 @@ proc deblobify*(
       NibblesBuf.fromHexPrefix record.toOpenArray(pLen, rLen-1)
     if not isLeaf:
       return err(DeblobLeafGotExtPrefix)
-    let pyl = ? record.toOpenArray(0, pLen - 1).deblobify(LeafPayload)
-    VertexRef(
+    let vtx = VertexRef(
       vType: Leaf,
-      lPfx:  pathSegment,
-      lData: pyl)
+      lPfx:  pathSegment)
+
+    ? record.toOpenArray(0, pLen - 1).deblobify(vtx.lData)
+    vtx
 
   else:
     return err(DeblobUnknown)
diff --git a/nimbus/db/aristo/aristo_compute.nim b/nimbus/db/aristo/aristo_compute.nim
index e3c26d3f6..46a02f1c9 100644
--- a/nimbus/db/aristo/aristo_compute.nim
+++ b/nimbus/db/aristo/aristo_compute.nim
@@ -68,7 +68,7 @@ proc computeKeyImpl(
   case vtx.vType:
   of Leaf:
     writer.startList(2)
-    writer.append(vtx.lPfx.toHexPrefix(isLeaf = true))
+    writer.append(vtx.lPfx.toHexPrefix(isLeaf = true).data())
 
     case vtx.lData.pType
     of AccountData:
@@ -111,7 +111,7 @@ proc computeKeyImpl(
       writeBranch(bwriter)
 
       writer.startList(2)
-      writer.append(vtx.ePfx.toHexPrefix(isleaf = false))
+      writer.append(vtx.ePfx.toHexPrefix(isleaf = false).data())
       writer.append(bwriter.finish().digestTo(HashKey))
     else:
       writeBranch(writer)
diff --git a/nimbus/db/aristo/aristo_desc/desc_nibbles.nim b/nimbus/db/aristo/aristo_desc/desc_nibbles.nim
index 58ecc9708..48f67633d 100644
--- a/nimbus/db/aristo/aristo_desc/desc_nibbles.nim
+++ b/nimbus/db/aristo/aristo_desc/desc_nibbles.nim
@@ -8,15 +8,20 @@
 # at your option. This file may not be copied, modified, or distributed
 # except according to those terms.
 
-import stew/arrayops
+import stew/[arraybuf, arrayops]
 
-type NibblesBuf* = object
-  ## Allocation-free type for storing up to 64 4-bit nibbles, as seen in the
-  ## Ethereum MPT
-  bytes: array[32, byte]
-  ibegin, iend: int8
-    # Where valid nibbles can be found - we use indices here to avoid copies
-    # wen slicing - iend not inclusive
+export arraybuf
+
+type
+  NibblesBuf* = object
+    ## Allocation-free type for storing up to 64 4-bit nibbles, as seen in the
+    ## Ethereum MPT
+    bytes: array[32, byte]
+    ibegin, iend: int8
+      # Where valid nibbles can be found - we use indices here to avoid copies
+      # wen slicing - iend not inclusive
+
+  HexPrefixBuf* = ArrayBuf[33, byte]
 
 func high*(T: type NibblesBuf): int =
   63
@@ -61,7 +66,7 @@ func `$`*(r: NibblesBuf): string =
     const chars = "0123456789abcdef"
     result.add chars[r[i]]
 
-func slice*(r: NibblesBuf, ibegin: int, iend = -1): NibblesBuf =
+func slice*(r: NibblesBuf, ibegin: int, iend = -1): NibblesBuf {.noinit.} =
   result.bytes = r.bytes
   result.ibegin = r.ibegin + ibegin.int8
   let e =
@@ -75,7 +80,7 @@ func slice*(r: NibblesBuf, ibegin: int, iend = -1): NibblesBuf =
 template writeFirstByte(nibbleCountExpr) {.dirty.} =
   let nibbleCount = nibbleCountExpr
   var oddnessFlag = (nibbleCount and 1) != 0
-  newSeq(result, (nibbleCount div 2) + 1)
+  result.setLen((nibbleCount div 2) + 1)
   result[0] = byte((int(isLeaf) * 2 + int(oddnessFlag)) shl 4)
   var writeHead = 0
 
@@ -89,11 +94,11 @@ template writeNibbles(r) {.dirty.} =
       result[writeHead] = nextNibble shl 4
     oddnessFlag = not oddnessFlag
 
-func toHexPrefix*(r: NibblesBuf, isLeaf = false): seq[byte] =
+func toHexPrefix*(r: NibblesBuf, isLeaf = false): HexPrefixBuf =
   writeFirstByte(r.len)
   writeNibbles(r)
 
-func toHexPrefix*(r1, r2: NibblesBuf, isLeaf = false): seq[byte] =
+func toHexPrefix*(r1, r2: NibblesBuf, isLeaf = false): HexPrefixBuf =
   writeFirstByte(r1.len + r2.len)
   writeNibbles(r1)
   writeNibbles(r2)
@@ -131,7 +136,7 @@ func fromHexPrefix*(
   else:
     result.isLeaf = false
 
-func `&`*(a, b: NibblesBuf): NibblesBuf =
+func `&`*(a, b: NibblesBuf): NibblesBuf {.noinit.} =
   for i in 0 ..< a.len:
     result[i] = a[i]
 
diff --git a/nimbus/db/aristo/aristo_init/memory_db.nim b/nimbus/db/aristo/aristo_init/memory_db.nim
index a90773ceb..2e7c95a7a 100644
--- a/nimbus/db/aristo/aristo_init/memory_db.nim
+++ b/nimbus/db/aristo/aristo_init/memory_db.nim
@@ -133,14 +133,7 @@ proc putVtxFn(db: MemBackendRef): PutVtxFn =
       let hdl = hdl.getSession db
       if hdl.error.isNil:
         if vtx.isValid:
-          let rc = vtx.blobify()
-          if rc.isErr:
-            hdl.error = TypedPutHdlErrRef(
-              pfx:  VtxPfx,
-              vid:  rvid.vid,
-              code: rc.error)
-            return
-          hdl.sTab[rvid] = rc.value
+          hdl.sTab[rvid] = vtx.blobify()
         else:
           hdl.sTab[rvid] = EmptyBlob
 
diff --git a/nimbus/db/aristo/aristo_init/rocks_db.nim b/nimbus/db/aristo/aristo_init/rocks_db.nim
index 702d359f1..15c51c054 100644
--- a/nimbus/db/aristo/aristo_init/rocks_db.nim
+++ b/nimbus/db/aristo/aristo_init/rocks_db.nim
@@ -312,10 +312,8 @@ iterator walkVtx*(
     be: RdbBackendRef;
       ): tuple[evid: RootedVertexID, vtx: VertexRef] =
   ## Variant of `walk()` iteration over the vertex sub-table.
-  for (rvid, data) in be.rdb.walkVtx:
-    let rc = data.deblobify VertexRef
-    if rc.isOk:
-      yield (rvid, rc.value)
+  for (rvid, vtx) in be.rdb.walkVtx:
+    yield (rvid, vtx)
 
 iterator walkKey*(
     be: RdbBackendRef;
diff --git a/nimbus/db/aristo/aristo_init/rocks_db/rdb_get.nim b/nimbus/db/aristo/aristo_init/rocks_db/rdb_get.nim
index b36a279e2..f3fad1f54 100644
--- a/nimbus/db/aristo/aristo_init/rocks_db/rdb_get.nim
+++ b/nimbus/db/aristo/aristo_init/rocks_db/rdb_get.nim
@@ -63,10 +63,10 @@ proc getKey*(
     return ok(move(rc.value))
 
   # Otherwise fetch from backend database
-  var res: Result[HashKey,(AristoError,string)]
+  # A threadvar is used to avoid allocating an environment for onData
+  var res{.threadvar.}: Opt[HashKey]
   let onData = proc(data: openArray[byte]) =
-    res = HashKey.fromBytes(data).mapErr(proc(): auto =
-      (RdbHashKeyExpected,""))
+    res = HashKey.fromBytes(data)
 
   let gotData = rdb.keyCol.get(rvid.blobify().data(), onData).valueOr:
      const errSym = RdbBeDriverGetKeyError
@@ -76,9 +76,9 @@ proc getKey*(
 
   # Correct result if needed
   if not gotData:
-    res = ok(VOID_HASH_KEY)
+    res.ok(VOID_HASH_KEY)
   elif res.isErr():
-    return res # Parsing failed
+    return err((RdbHashKeyExpected,"")) # Parsing failed
 
   # Update cache and return
   ok rdb.rdKeyLru.lruAppend(rvid.vid, res.value(), RdKeyLruMaxSize)
@@ -93,10 +93,10 @@ proc getVtx*(
     return ok(move(rc.value))
 
   # Otherwise fetch from backend database
-  var res: Result[VertexRef,(AristoError,string)]
+  # A threadvar is used to avoid allocating an environment for onData
+  var res {.threadvar.}: Result[VertexRef,AristoError]
   let onData = proc(data: openArray[byte]) =
-    res = data.deblobify(VertexRef).mapErr(proc(error: AristoError): auto =
-      (error,""))
+    res = data.deblobify(VertexRef)
 
   let gotData = rdb.vtxCol.get(rvid.blobify().data(), onData).valueOr:
     const errSym = RdbBeDriverGetVtxError
@@ -105,9 +105,9 @@ proc getVtx*(
     return err((errSym,error))
 
   if not gotData:
-    res = ok(VertexRef(nil))
+    res.ok(VertexRef(nil))
   elif res.isErr():
-    return res # Parsing failed
+    return err((res.error(), "Parsing failed")) # Parsing failed
 
   # Update cache and return
   ok rdb.rdVtxLru.lruAppend(rvid.vid, res.value(), RdVtxLruMaxSize)
diff --git a/nimbus/db/aristo/aristo_init/rocks_db/rdb_put.nim b/nimbus/db/aristo/aristo_init/rocks_db/rdb_put.nim
index 640097b9e..f30319164 100644
--- a/nimbus/db/aristo/aristo_init/rocks_db/rdb_put.nim
+++ b/nimbus/db/aristo/aristo_init/rocks_db/rdb_put.nim
@@ -122,12 +122,7 @@ proc putVtx*(
       ): Result[void,(VertexID,AristoError,string)] =
   let dsc = rdb.session
   if vtx.isValid:
-    let rc = vtx.blobify()
-    if rc.isErr:
-      # Caller must `rollback()` which will flush the `rdVtxLru` cache
-      return err((rvid.vid,rc.error,""))
-
-    dsc.put(rvid.blobify().data(), rc.value, rdb.vtxCol.handle()).isOkOr:
+    dsc.put(rvid.blobify().data(), vtx.blobify(), rdb.vtxCol.handle()).isOkOr:
       # Caller must `rollback()` which will flush the `rdVtxLru` cache
       const errSym = RdbBeDriverPutVtxError
       when extraTraceMessages:
diff --git a/nimbus/db/aristo/aristo_init/rocks_db/rdb_walk.nim b/nimbus/db/aristo/aristo_init/rocks_db/rdb_walk.nim
index 637c6272d..ab57dd9a2 100644
--- a/nimbus/db/aristo/aristo_init/rocks_db/rdb_walk.nim
+++ b/nimbus/db/aristo/aristo_init/rocks_db/rdb_walk.nim
@@ -72,8 +72,8 @@ iterator walkKey*(rdb: RdbInst): tuple[rvid: RootedVertexID, data: Blob] =
         yield (rvid, val)
 
 
-iterator walkVtx*(rdb: RdbInst): tuple[rvid: RootedVertexID, data: Blob] =
-  ## Walk over key-value pairs of the hash key column of the database.
+iterator walkVtx*(rdb: RdbInst): tuple[rvid: RootedVertexID, data: VertexRef] =
+  ## Walk over key-value pairs of the vertex column of the database.
   ##
   ## Non-decodable entries are are ignored.
   ##
@@ -84,12 +84,32 @@ iterator walkVtx*(rdb: RdbInst): tuple[rvid: RootedVertexID, data: Blob] =
       break walkBody
     defer: rit.close()
 
-    for (key,val) in rit.pairs:
-      if val.len != 0:
-        let rvid = key.deblobify(RootedVertexID).valueOr:
-          continue
-
-        yield (rvid, val)
+    rit.seekToFirst()
+    var key: RootedVertexID
+    var value: VertexRef
+    while rit.isValid():
+      var valid = true
+      rit.key(
+        proc(data: openArray[byte]) =
+          key = deblobify(data, RootedVertexID).valueOr:
+            valid = false
+            default(RootedVertexID)
+      )
+      if not valid:
+        continue
+
+      rit.value(
+        proc(data: openArray[byte]) =
+          value = deblobify(data, VertexRef).valueOr:
+            valid = false
+            default(VertexRef)
+      )
+      if not valid:
+        continue
+
+      rit.next()
+      yield (key, value)
+    rit.close()
 
 # ------------------------------------------------------------------------------
 # End
diff --git a/nimbus/db/aristo/aristo_serialise.nim b/nimbus/db/aristo/aristo_serialise.nim
index 77b1b9a9c..13f2810f1 100644
--- a/nimbus/db/aristo/aristo_serialise.nim
+++ b/nimbus/db/aristo/aristo_serialise.nim
@@ -86,7 +86,7 @@ proc to*(node: NodeRef; T: type seq[Blob]): T =
 
       var wrx = initRlpWriter()
       wrx.startList(2)
-      wrx.append node.ePfx.toHexPrefix(isleaf = false)
+      wrx.append node.ePfx.toHexPrefix(isleaf = false).data()
       wrx.append brHash
 
       result.add wrx.finish()
@@ -104,7 +104,7 @@ proc to*(node: NodeRef; T: type seq[Blob]): T =
 
     var wr = initRlpWriter()
     wr.startList(2)
-    wr.append node.lPfx.toHexPrefix(isleaf = true)
+    wr.append node.lPfx.toHexPrefix(isleaf = true).data()
     wr.append node.lData.serialise(getKey0).value
 
     result.add (wr.finish())
@@ -127,7 +127,7 @@ proc digestTo*(node: NodeRef; T: type HashKey): T =
       let brHash = wr.finish().digestTo(HashKey)
       wr = initRlpWriter()
       wr.startList(2)
-      wr.append node.ePfx.toHexPrefix(isleaf = false)
+      wr.append node.ePfx.toHexPrefix(isleaf = false).data()
       wr.append brHash
 
   of Leaf:
@@ -138,7 +138,7 @@ proc digestTo*(node: NodeRef; T: type HashKey): T =
       ok(node.key[0]) # always succeeds
 
     wr.startList(2)
-    wr.append node.lPfx.toHexPrefix(isleaf = true)
+    wr.append node.lPfx.toHexPrefix(isleaf = true).data()
     wr.append node.lData.serialise(getKey0).value
 
   wr.finish().digestTo(HashKey)
diff --git a/tests/test_aristo/test_blobify.nim b/tests/test_aristo/test_blobify.nim
index b94ee8dfa..03d39b1c9 100644
--- a/tests/test_aristo/test_blobify.nim
+++ b/tests/test_aristo/test_blobify.nim
@@ -65,8 +65,8 @@ suite "Aristo blobify":
       )
 
     check:
-      deblobify(blobify(leafRawData)[], VertexRef)[] == leafRawData
-      deblobify(blobify(leafAccount)[], VertexRef)[] == leafAccount
-      deblobify(blobify(leafStoData)[], VertexRef)[] == leafStoData
-      deblobify(blobify(branch)[], VertexRef)[] == branch
-      deblobify(blobify(extension)[], VertexRef)[] == extension
+      deblobify(blobify(leafRawData), VertexRef)[] == leafRawData
+      deblobify(blobify(leafAccount), VertexRef)[] == leafAccount
+      deblobify(blobify(leafStoData), VertexRef)[] == leafStoData
+      deblobify(blobify(branch), VertexRef)[] == branch
+      deblobify(blobify(extension), VertexRef)[] == extension
diff --git a/tests/test_aristo/test_portal_proof.nim b/tests/test_aristo/test_portal_proof.nim
index 4d6b5db70..8af4e39b0 100644
--- a/tests/test_aristo/test_portal_proof.nim
+++ b/tests/test_aristo/test_portal_proof.nim
@@ -115,7 +115,7 @@ func asExtension(b: Blob; path: Hash256): Blob =
     var wr = initRlpWriter()
 
     wr.startList(2)
-    wr.append NibblesBuf.fromBytes(@[nibble]).slice(1).toHexPrefix(isleaf=false)
+    wr.append NibblesBuf.fromBytes(@[nibble]).slice(1).toHexPrefix(isleaf=false).data()
     wr.append node.listElem(nibble.int).toBytes
     wr.finish()
 
diff --git a/vendor/nim-stew b/vendor/nim-stew
index 54cc67cbb..fc09b2e02 160000
--- a/vendor/nim-stew
+++ b/vendor/nim-stew
@@ -1 +1 @@
-Subproject commit 54cc67cbb83f61b6e3168b09701758c5b805120a
+Subproject commit fc09b2e023ab2d73e425f7d15cf94871c7867868