cleanup manifest (#44)

* cleanup manifest

* Attach decode to `Manifest`

* move manifest container to it's own file

* rebase main

* update header license year
This commit is contained in:
Dmitriy Ryajov 2022-01-12 19:55:51 -06:00 committed by GitHub
parent 68a45d8f57
commit 5f48de6a44
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
5 changed files with 196 additions and 167 deletions

158
dagger/blocksmanifest.nim Normal file
View File

@ -0,0 +1,158 @@
## Nim-Dagger
## Copyright (c) 2022 Status Research & Development GmbH
## Licensed under either of
## * Apache License, version 2.0, ([LICENSE-APACHE](LICENSE-APACHE))
## * MIT license ([LICENSE-MIT](LICENSE-MIT))
## at your option.
## This file may not be copied, modified, or distributed except according to
## those terms.
{.push raises: [Defect].}
import std/tables
import pkg/libp2p
import pkg/questionable
import pkg/questionable/results
import pkg/chronicles
import pkg/chronos
import ./manifest
import ./errors
export manifest
const
ManifestCodec* = multiCodec("dag-pb")
var
emptyDigests {.threadvar.}: array[CIDv0..CIDv1, Table[MultiCodec, MultiHash]]
once {.threadvar.}: bool
template EmptyDigests: untyped =
if not once:
emptyDigests = [
CIDv0: {
multiCodec("sha2-256"): Cid
.init("bafybeihdwdcefgh4dqkjv67uzcmw7ojee6xedzdetojuzjevtenxquvyku")
.get()
.mhash
.get()
}.toTable,
CIDv1: {
multiCodec("sha2-256"): Cid.init("QmdfTbBqBPQ7VNxZEYEj14VmRuZBkqFbiwReogJgS1zR1n")
.get()
.mhash
.get()
}.toTable,
]
once = true
emptyDigests
type
BlocksManifest* = object
manifest: Manifest
version*: CidVersion
hcodec*: MultiCodec
codec*: MultiCodec
proc len*(b: BlocksManifest): int = b.manifest.blocks.len
iterator items*(b: BlocksManifest): Cid =
for b in b.manifest.blocks:
yield b
template hashBytes(mh: MultiHash): seq[byte] =
## get the hash bytes of a multihash object
##
mh.data.buffer[mh.dpos..(mh.dpos + mh.size - 1)]
proc cid*(b: var BlocksManifest): ?!Cid =
## Generate a root hash using the treehash algorithm
##
if htree =? b.manifest.cid:
return htree.success
var
stack: seq[MultiHash]
for cid in b.manifest.blocks:
stack.add(? cid.mhash.mapFailure)
while stack.len > 1:
let
(b1, b2) = (stack.pop(), stack.pop())
mh = ? MultiHash.digest(
$b.hcodec,
(b1.hashBytes() & b2.hashBytes()))
.mapFailure
stack.add(mh)
if stack.len == 1:
let cid = ? Cid.init(
b.version,
b.codec,
(? EmptyDigests[b.version][b.hcodec].catch))
.mapFailure
b.manifest.cid = cid.some
return cid.success
proc put*(b: var BlocksManifest, cid: Cid) =
b.manifest.cid = Cid.none
trace "Adding cid to manifest", cid
b.manifest.blocks.add(cid)
proc contains*(b: BlocksManifest, cid: Cid): bool =
cid in b.manifest.blocks
proc encode*(b: var BlocksManifest): ?!seq[byte] =
if b.manifest.cid.isNone:
b.manifest.cid = (? b.cid).some
b.manifest.encode()
proc init*(
T: type BlocksManifest,
blocks: openArray[Cid] = [],
version = CIDv1,
hcodec = multiCodec("sha2-256"),
codec = multiCodec("raw")): ?!T =
## Create a manifest using array of `Cid`s
##
if hcodec notin EmptyDigests[version]:
return failure("Unsupported manifest hash codec!")
T(
manifest: Manifest(blocks: @blocks),
version: version,
codec: codec,
hcodec: hcodec,
).success
proc init*(
T: type BlocksManifest,
data: openArray[byte]): ?!T =
## Create manifest from a raw data blob
## (in dag-pb for for now)
##
let
manifest = ? Manifest.decode(data)
cid = !manifest.cid
mhash = ? cid.mhash.mapFailure
var blockManifest = ? BlocksManifest.init(
manifest.blocks,
cid.version,
mhash.mcodec,
cid.mcodec)
if cid != ? blockManifest.cid:
return failure("Decoded content hash doesn't match!")
blockManifest.success

View File

@ -1,5 +1,5 @@
## Nim-Dagger ## Nim-Dagger
## Copyright (c) 2021 Status Research & Development GmbH ## Copyright (c) 2022 Status Research & Development GmbH
## Licensed under either of ## Licensed under either of
## * Apache License, version 2.0, ([LICENSE-APACHE](LICENSE-APACHE)) ## * Apache License, version 2.0, ([LICENSE-APACHE](LICENSE-APACHE))
## * MIT license ([LICENSE-MIT](LICENSE-MIT)) ## * MIT license ([LICENSE-MIT](LICENSE-MIT))
@ -7,110 +7,23 @@
## This file may not be copied, modified, or distributed except according to ## This file may not be copied, modified, or distributed except according to
## those terms. ## those terms.
{.push raises: [Defect].}
import std/tables
import pkg/libp2p
import pkg/libp2p/protobuf/minprotobuf import pkg/libp2p/protobuf/minprotobuf
import pkg/libp2p
import pkg/questionable import pkg/questionable
import pkg/questionable/results import pkg/questionable/results
import pkg/chronicles
import pkg/chronos
import ./blocktype
import ./errors import ./errors
const
ManifestCodec* = multiCodec("dag-pb")
var
emptyDigests {.threadvar.}: array[CIDv0..CIDv1, Table[MultiCodec, MultiHash]]
once {.threadvar.}: bool
template EmptyDigests: untyped =
if not once:
emptyDigests = [
CIDv0: {
multiCodec("sha2-256"): Cid
.init("bafybeihdwdcefgh4dqkjv67uzcmw7ojee6xedzdetojuzjevtenxquvyku")
.get()
.mhash
.get()
}.toTable,
CIDv1: {
multiCodec("sha2-256"): Cid.init("QmdfTbBqBPQ7VNxZEYEj14VmRuZBkqFbiwReogJgS1zR1n")
.get()
.mhash
.get()
}.toTable,
]
once = true
emptyDigests
type type
BlocksManifest* = object Manifest* = object
blocks: seq[Cid] cid*: ?Cid
htree: ?Cid blocks*: seq[Cid]
version*: CidVersion
hcodec*: MultiCodec
codec*: MultiCodec
proc len*(b: BlocksManifest): int = b.blocks.len proc encode*(b: var Manifest): ?!seq[byte] =
iterator items*(b: BlocksManifest): Cid =
for b in b.blocks:
yield b
proc hashBytes(mh: MultiHash): seq[byte] =
## get the hash bytes of a multihash object
##
mh.data.buffer[mh.dpos..(mh.dpos + mh.size - 1)]
proc cid*(b: var BlocksManifest): ?!Cid =
## Generate a root hash using the treehash algorithm
##
if htree =? b.htree:
return htree.success
var
stack: seq[MultiHash]
for cid in b.blocks:
stack.add(? cid.mhash.mapFailure)
while stack.len > 1:
let
(b1, b2) = (stack.pop(), stack.pop())
mh = ? MultiHash.digest(
$b.hcodec,
(b1.hashBytes() & b2.hashBytes()))
.mapFailure
stack.add(mh)
if stack.len == 1:
let cid = ? Cid.init(
b.version,
b.codec,
(? EmptyDigests[b.version][b.hcodec].catch))
.mapFailure
b.htree = cid.some
return cid.success
proc put*(b: var BlocksManifest, cid: Cid) =
b.htree = Cid.none
trace "Adding cid to manifest", cid
b.blocks.add(cid)
proc contains*(b: BlocksManifest, cid: Cid): bool =
cid in b.blocks
proc encode*(b: var BlocksManifest): ?!seq[byte] =
## Encode the manifest into a ``ManifestCodec`` ## Encode the manifest into a ``ManifestCodec``
## multicodec container (Dag-pb) for now ## multicodec container (Dag-pb) for now
##
var pbNode = initProtoBuffer() var pbNode = initProtoBuffer()
for c in b.blocks: for c in b.blocks:
@ -119,75 +32,34 @@ proc encode*(b: var BlocksManifest): ?!seq[byte] =
pbLink.finish() pbLink.finish()
pbNode.write(2, pbLink) pbNode.write(2, pbLink)
let cid = ? b.cid let cid = !b.cid
pbNode.write(1, cid.data.buffer) # set the treeHash Cid as the data field pbNode.write(1, cid.data.buffer) # set the treeHash Cid as the data field
pbNode.finish() pbNode.finish()
return pbNode.buffer.success return pbNode.buffer.success
proc decode*(_: type BlocksManifest, data: seq[byte]): ?!(Cid, seq[Cid]) = proc decode*(_: type Manifest, data: openArray[byte]): ?!Manifest =
## Decode a manifest from a byte seq ## Decode a manifest from a data blob
## ##
var var
pbNode = initProtoBuffer(data) pbNode = initProtoBuffer(data)
cidBuf: seq[byte] cidBuf: seq[byte]
blocks: seq[Cid] blocks: seq[Cid]
if pbNode.getField(1, cidBuf).isOk: if pbNode.getField(1, cidBuf).isErr:
let cid = ? Cid.init(cidBuf).mapFailure return failure("Unable to decode Cid from manifest!")
var linksBuf: seq[seq[byte]]
if pbNode.getRepeatedField(2, linksBuf).isOk:
for pbLinkBuf in linksBuf:
var
blocksBuf: seq[seq[byte]]
blockBuf: seq[byte]
pbLink = initProtoBuffer(pbLinkBuf)
if pbLink.getField(1, blockBuf).isOk: let cid = ? Cid.init(cidBuf).mapFailure
let cidRes = Cid.init(blockBuf) var linksBuf: seq[seq[byte]]
if cidRes.isOk: if pbNode.getRepeatedField(2, linksBuf).isOk:
blocks.add(cidRes.get()) for pbLinkBuf in linksBuf:
var
blocksBuf: seq[seq[byte]]
blockBuf: seq[byte]
pbLink = initProtoBuffer(pbLinkBuf)
return (cid, blocks).success if pbLink.getField(1, blockBuf).isOk:
blocks.add(? Cid.init(blockBuf).mapFailure)
proc init*( Manifest(cid: cid.some, blocks: blocks).success
T: type BlocksManifest,
blocks: openArray[Cid] = [],
version = CIDv1,
hcodec = multiCodec("sha2-256"),
codec = multiCodec("raw")): ?!T =
## Create a manifest using array of `Cid`s
##
if hcodec notin EmptyDigests[version]:
return failure("Unsuported manifest hash codec!")
T(
blocks: @blocks,
version: version,
codec: codec,
hcodec: hcodec,
).success
proc init*(
T: type BlocksManifest,
blk: Block): ?!T =
## Create manifest from a raw manifest block
## (in dag-pb for for now)
##
let
(cid, blocks) = ? BlocksManifest.decode(blk.data)
mhash = ? cid.mhash.mapFailure
var
manifest = ? BlocksManifest.init(
blocks,
cid.version,
mhash.mcodec,
cid.mcodec)
if cid != (? manifest.cid):
return failure("Content hashes don't match!")
return manifest.success

View File

@ -21,7 +21,7 @@ import pkg/libp2p/signed_envelope
import ./chunker import ./chunker
import ./blocktype as bt import ./blocktype as bt
import ./manifest import ./blocksmanifest
import ./stores/blockstore import ./stores/blockstore
import ./blockexchange import ./blockexchange
@ -99,11 +99,10 @@ proc retrieve*(
if mc == ManifestCodec: if mc == ManifestCodec:
trace "Retrieving data set", cid, mc trace "Retrieving data set", cid, mc
let res = BlocksManifest.init(blk) without blockManifest =? BlocksManifest.init(blk.data):
if (res.isErr): return failure("Unable to construct manifest!")
return failure(res.error.msg)
asyncSpawn node.streamBlocks(stream, res.get()) asyncSpawn node.streamBlocks(stream, blockManifest)
else: else:
asyncSpawn (proc(): Future[void] {.async.} = asyncSpawn (proc(): Future[void] {.async.} =
try: try:
@ -168,8 +167,8 @@ proc store*(
return failure(cid.error.msg) return failure(cid.error.msg)
trace "Stored data", manifestCid = manifest.cid, trace "Stored data", manifestCid = manifest.cid,
contentCid = !cid, contentCid = !cid,
blocks = blockManifest.len blocks = blockManifest.len
return manifest.cid.success return manifest.cid.success

View File

@ -9,7 +9,7 @@ import pkg/stew/byteutils
import pkg/dagger/chunker import pkg/dagger/chunker
import pkg/dagger/blocktype as bt import pkg/dagger/blocktype as bt
import pkg/dagger/manifest import pkg/dagger/blocksmanifest
import ./helpers import ./helpers
@ -47,10 +47,10 @@ suite "Manifest":
) )
var var
manifest = BlocksManifest.init(blocks).tryGet() blocksManifest = BlocksManifest.init(blocks).tryGet()
let let
e = manifest.encode().tryGet() e = blocksManifest.encode().tryGet()
(cid, decoded) = BlocksManifest.decode(e).tryGet() manifest = Manifest.decode(e).tryGet()
check decoded == blocks check manifest.blocks == blocks

View File

@ -12,7 +12,7 @@ import pkg/dagger/stores
import pkg/dagger/blockexchange import pkg/dagger/blockexchange
import pkg/dagger/chunker import pkg/dagger/chunker
import pkg/dagger/node import pkg/dagger/node
import pkg/dagger/manifest import pkg/dagger/blocksmanifest
import pkg/dagger/blocktype as bt import pkg/dagger/blocktype as bt
import ./helpers import ./helpers
@ -75,7 +75,7 @@ suite "Test Node":
var var
manifestBlock = (await localStore.getBlock(manifestCid)).tryGet() manifestBlock = (await localStore.getBlock(manifestCid)).tryGet()
localManifest = BlocksManifest.init(manifestBlock).tryGet() localManifest = BlocksManifest.init(manifestBlock.data).tryGet()
check: check:
manifest.len == localManifest.len manifest.len == localManifest.len