mirror of
https://github.com/logos-storage/constantine.git
synced 2026-01-02 13:13:07 +00:00
* unoptimized msm * MSM: reorder loops * add a signed windowed recoding technique * improve wNAF table access * use batchAffine * revamp EC tests * MSM signed digit support * refactor MSM: recode signed ahead of time * missing test vector * refactor allocs and Alloca sideeffect * add an endomorphism threshold * Add Jacobian extended coordinates * refactor recodings, prepare for parallelizable on-the-fly signed recoding * recoding changes, introduce proper NAF for pairings * more pairings refactoring, introduce miller accumulator for EVM * some optim to the addchain miller loop * start optimizing multi-pairing * finish multi-miller loop refactoring * minor tuning * MSM: signed encoding suitable for parallelism (no precompute) * cleanup signed window encoding * add prefetching * add metering * properly init result to infinity * comment on prefetching * introduce vartime inversion for batch additions * fix JacExt infinity conversion * add batchAffine for MSM, though slower than JacExtended at the moment * add a batch affine scheduler for MSM * Add Multi-Scalar-Multiplication endomorphism acceleration * some tuning * signed integer fixes + 32-bit + tuning * Some more tuning * common msm bench + don't use affine for c < 9 * nit
114 lines
4.2 KiB
Nim
114 lines
4.2 KiB
Nim
# Constantine
|
|
# Copyright (c) 2018-2019 Status Research & Development GmbH
|
|
# Copyright (c) 2020-Present Mamy André-Ratsimbazafy
|
|
# Licensed and distributed under either of
|
|
# * MIT license (license terms in the root directory or at http://opensource.org/licenses/MIT).
|
|
# * Apache v2 license (license terms in the root directory or at http://www.apache.org/licenses/LICENSE-2.0).
|
|
# at your option. This file may not be copied, modified, or distributed except according to those terms.
|
|
|
|
import
|
|
# Internals
|
|
../constantine/math/config/curves,
|
|
../constantine/math/arithmetic,
|
|
../constantine/math/elliptic/[
|
|
ec_shortweierstrass_affine,
|
|
ec_shortweierstrass_projective,
|
|
ec_shortweierstrass_jacobian,
|
|
ec_shortweierstrass_jacobian_extended,
|
|
ec_shortweierstrass_batch_ops_parallel],
|
|
../constantine/platforms/threadpool/threadpool,
|
|
# Helpers
|
|
../helpers/prng_unsafe,
|
|
./bench_elliptic_template,
|
|
./bench_blueprint
|
|
|
|
# ############################################################
|
|
#
|
|
# Parallel Benchmark definitions
|
|
#
|
|
# ############################################################
|
|
|
|
proc multiAddParallelBench*(EC: typedesc, numPoints: int, iters: int) =
  ## Times the threadpool-based summation of `numPoints` affine points
  ## into a single point of type `EC`.
  ##
  ## * `EC`        - elliptic curve point type receiving the sum
  ## * `numPoints` - how many random affine input points are generated
  ## * `iters`     - iteration count forwarded to `bench`
  var inputs = newSeq[ECP_ShortW_Aff[EC.F, EC.G]](numPoints)
  for pt in inputs.mitems:
    # One `random_unsafe` draw per slot, in index order.
    pt = rng.random_unsafe(ECP_ShortW_Aff[EC.F, EC.G])

  # Left uninitialized on purpose; presumably fully overwritten by the
  # reduction below - TODO confirm against `sum_reduce_vartime_parallel`.
  var acc {.noInit.}: EC

  var tp = Threadpool.new()

  # Label shown in the report: thread count, subgroup and input size.
  let label =
    "EC parallel batch add (" & align($tp.numThreads, 2) & " threads) " &
    $EC.G & " (" & $numPoints & " points)"

  bench(label, EC, iters):
    tp.sum_reduce_vartime_parallel(acc, inputs)

  # Shut the pool down once the measurement is over.
  tp.shutdown()
|
|
|
|
# ############################################################
|
|
#
|
|
# Benchmark of the G1 group of
|
|
# Short Weierstrass elliptic curves
|
|
# in projective, Jacobian and extended Jacobian coordinates
|
|
#
|
|
# ############################################################
|
|
|
|
|
|
const
  # Iteration count for the single-operation benchmarks; `main` also uses
  # it as the budget from which per-size iteration counts are derived.
  Iters = 10_000

  # Curves to benchmark; `main` unrolls over this array at compile time.
  AvailableCurves = [
    # BN254_Snarks,
    BLS12_381,
  ]

  # Input sizes (number of points) for the multi-point addition benchmarks.
  # Alternative set: [10, 100, 1000, 10000, 100000]
  testNumPoints = [
    4, 8, 16, 32, 64, 128, 256, 512, 1024, 2048, 4096, 8192,
    65536, 131072,
  ]
|
|
|
|
proc main() =
  ## Benchmark driver. For each curve in `AvailableCurves` it times the G1
  ## single-point operations (add, doubling, mixed add) for the projective,
  ## Jacobian and extended Jacobian types, then the multi-point additions
  ## for every size in `testNumPoints`.
  separator()
  staticFor i, 0, AvailableCurves.len:
    const curve = AvailableCurves[i]

    # --- Single operations: projective
    addBench(ECP_ShortW_Prj[Fp[curve], G1], Iters)
    doublingBench(ECP_ShortW_Prj[Fp[curve], G1], Iters)
    mixedAddBench(ECP_ShortW_Prj[Fp[curve], G1], Iters)

    # --- Single operations: Jacobian
    addBench(ECP_ShortW_Jac[Fp[curve], G1], Iters)
    doublingBench(ECP_ShortW_Jac[Fp[curve], G1], Iters)
    mixedAddBench(ECP_ShortW_Jac[Fp[curve], G1], Iters)

    # --- Single operations: extended Jacobian
    addBench(ECP_ShortW_JacExt[Fp[curve], G1], Iters)
    doublingBench(ECP_ShortW_JacExt[Fp[curve], G1], Iters)
    mixedAddBench(ECP_ShortW_JacExt[Fp[curve], G1], Iters)
    separator()

    # In every sweep below the iteration count is `Iters div numPoints`,
    # clamped to at least one run.

    # --- Projective sums: without batching, with batching, parallel
    for numPoints in testNumPoints:
      let itersForSize = max(1, Iters div numPoints)
      multiAddBench(ECP_ShortW_Prj[Fp[curve], G1], numPoints, useBatching = false, itersForSize)
    separator()
    for numPoints in testNumPoints:
      let itersForSize = max(1, Iters div numPoints)
      multiAddBench(ECP_ShortW_Prj[Fp[curve], G1], numPoints, useBatching = true, itersForSize)
    separator()
    for numPoints in testNumPoints:
      let itersForSize = max(1, Iters div numPoints)
      multiAddParallelBench(ECP_ShortW_Prj[Fp[curve], G1], numPoints, itersForSize)
    separator()

    # --- Jacobian sums: without batching, with batching, parallel
    for numPoints in testNumPoints:
      let itersForSize = max(1, Iters div numPoints)
      multiAddBench(ECP_ShortW_Jac[Fp[curve], G1], numPoints, useBatching = false, itersForSize)
    separator()
    for numPoints in testNumPoints:
      let itersForSize = max(1, Iters div numPoints)
      multiAddBench(ECP_ShortW_Jac[Fp[curve], G1], numPoints, useBatching = true, itersForSize)
    separator()
    for numPoints in testNumPoints:
      let itersForSize = max(1, Iters div numPoints)
      multiAddParallelBench(ECP_ShortW_Jac[Fp[curve], G1], numPoints, itersForSize)
    separator()

    # --- Extended Jacobian sums: without batching, with batching
    for numPoints in testNumPoints:
      let itersForSize = max(1, Iters div numPoints)
      multiAddBench(ECP_ShortW_JacExt[Fp[curve], G1], numPoints, useBatching = false, itersForSize)
    separator()
    for numPoints in testNumPoints:
      let itersForSize = max(1, Iters div numPoints)
      multiAddBench(ECP_ShortW_JacExt[Fp[curve], G1], numPoints, useBatching = true, itersForSize)
    separator()
  separator()
|
|
|
|
# Entry point: run every benchmark, then call `notes()`
# (not defined in this file; presumably from the imported bench helpers).
main()
notes()
|