From cc52064cde33dfa157697d94cce421379eb9d074 Mon Sep 17 00:00:00 2001
From: mratsim <mamy.ratsimbazafy_dev@gadz.org>
Date: Sun, 25 Feb 2018 15:55:42 +0100
Subject: [PATCH] Add BigEndian + Refactoring: remove U512, mapArray, modular
 arithmetics

---
 src/ethash.nim             | 66 +++++++++++++++-----------------------
 src/private/casting.nim    | 34 ++------------------
 src/private/functional.nim | 19 -----------
 src/private/intmath.nim    | 50 ++---------------------------
 tests/all_tests.nim        |  2 +-
 5 files changed, 32 insertions(+), 139 deletions(-)

diff --git a/src/ethash.nim b/src/ethash.nim
index da9c0a1..dc5453b 100644
--- a/src/ethash.nim
+++ b/src/ethash.nim
@@ -1,17 +1,13 @@
 # Copyright (c) 2018 Status Research & Development GmbH
 # Distributed under the Apache v2 License (license terms are at http://www.apache.org/licenses/LICENSE-2.0).
 
-import  math, sequtils, algorithm,
+import  math, endians,
         keccak_tiny
 
 import  ./private/[primes, casting, functional, intmath]
-export toHex, hexToByteArrayBE, hexToSeqBytesBE, toByteArrayBE
+export toHex, hexToByteArrayBE, hexToSeqBytesBE, toByteArrayBE # debug functions
 export keccak_tiny
 
-# TODO: Switching from default int to uint64
-# Note: array/seq indexing requires an Ordinal, uint64 are not.
-# So to index arrays/seq we would need to cast uint64 to int anyway ...
-
 # ###############################################################################
 # Definitions
 
@@ -22,7 +18,7 @@ const
   DATASET_BYTES_GROWTH* = 2'u^23     # dataset growth per epoch
   CACHE_BYTES_INIT* = 2'u^24         # bytes in cache at genesis
   CACHE_BYTES_GROWTH* = 2'u^17       # cache growth per epoch
-  CACHE_MULTIPLIER=1024              # Size of the DAG relative to the cache
+  CACHE_MULTIPLIER = 1024            # Size of the DAG relative to the cache
   EPOCH_LENGTH* = 30000              # blocks per epoch
   MIX_BYTES* = 128                   # width of mix
   HASH_BYTES* = 64                   # hash length in bytes
@@ -30,9 +26,6 @@ const
   CACHE_ROUNDS* = 3                  # number of rounds in cache production
   ACCESSES* = 64                     # number of accesses in hashimoto loop
 
-  # MAGIC_NUM ?
-  # MAGIC_NUM_SIZE ?
-
 # ###############################################################################
 # Parameters
 
@@ -67,24 +60,23 @@ proc get_cachesize_lut*(block_number: Natural): uint64 {.noSideEffect, inline.}
 
 proc mkcache*(cache_size: uint64, seed: Hash[256]): seq[Hash[512]] {.noSideEffect.}=
 
-  # The starting cache size is a set of 524288 64-byte values
-
+  # Number of HASH_BYTES-sized items in the cache
   let n = int(cache_size div HASH_BYTES)
 
   # Sequentially produce the initial dataset
   result = newSeq[Hash[512]](n)
-  result[0] = keccak512 seed.toByteArrayBE
+  result[0] = keccak512 seed.data
 
   for i in 1 ..< n:
-    result[i] = keccak512 result[i-1].toU512
+    result[i] = keccak512 result[i-1].data
 
   # Use a low-round version of randmemohash
   for _ in 0 ..< CACHE_ROUNDS:
     for i in 0 ..< n:
       let
-        v = result[i].toU512[0] mod n.uint32
-        a = result[(i-1+n) mod n].toU512
-        b = result[v.int].toU512
+        v = result[i].as_u32_words[0] mod n.uint32
+        a = result[(i-1+n) mod n].data
+        b = result[v.int].data
       result[i] = keccak512 zipMap(a, b, x xor y)
 
 # ###############################################################################
@@ -106,9 +98,7 @@ proc fnv*[T: SomeUnsignedInt or Natural](v1, v2: T): uint32 {.inline, noSideEffe
   #   - for powers of 2: a mod 2^p == a and (2^p - 1)
   #   - 2^32 - 1 == high(uint32)
 
-
-  # # mulmod(v1 and mask, FNV_PRIME.T, (2^32).T) xor (v2 and mask)
-  # Casting to uint32 should do the modulo and masking just fine
+  # So casting to uint32 should do the modulo and masking just fine
 
   (v1.uint32 * FNV_PRIME) xor v2.uint32
 
@@ -116,26 +106,25 @@ proc fnv*[T: SomeUnsignedInt or Natural](v1, v2: T): uint32 {.inline, noSideEffe
 # Full dataset calculation
 
 proc calc_dataset_item*(cache: seq[Hash[512]], i: Natural): Hash[512] {.noSideEffect, noInit.} =
-  # TODO review WORD_BYTES
-  # TODO use uint32 instead of uint64
-  # and mix[0] should be uint32
-
   let n = cache.len
   const r: uint32 = HASH_BYTES div WORD_BYTES
 
-  var mix = cast[U512](cache[i mod n])
+  # Pointer alias onto result's storage, viewed as 16 uint32 words (use mix[] for whole-array operations)
+  var mix = cast[ptr array[16, uint32]](addr result)
+
+  mix[] = cache[i mod n].as_u32_words
   when system.cpuEndian == littleEndian:
     mix[0] = mix[0] xor i.uint32
   else:
-    mix[high(mix)] = mix[high(0)] xor i.uint32
-  mix = toU512 keccak512 mix
+    mix[high(mix[])] = mix[high(mix[])] xor i.uint32
+  result = keccak512 mix[]
 
   # FNV with a lots of random cache nodes based on i
   for j in 0'u32 ..< DATASET_PARENTS:
     let cache_index = fnv(i.uint32 xor j, mix[j mod r])
-    mix = zipMap(mix, cache[cache_index.int mod n].toU512, fnv(x, y))
+    mix[] = zipMap(mix[], cache[cache_index.int mod n].as_u32_words, fnv(x, y))
 
-  result = keccak512 mix
+  result = keccak512 mix[]
 
 proc calc_dataset*(full_size: Natural, cache: seq[Hash[512]]): seq[Hash[512]] {.noSideEffect.} =
 
@@ -148,7 +137,6 @@ proc calc_dataset*(full_size: Natural, cache: seq[Hash[512]]): seq[Hash[512]] {.
 # Main loop
 
 type HashimotoHash = tuple[mix_digest: Hash[256], value: Hash[256]]
-  # TODO use Hash as a result type
 type DatasetLookup = proc(i: Natural): Hash[512] {.noSideEffect.}
 
 proc hashimoto(header: Hash[256],
@@ -169,12 +157,11 @@ proc hashimoto(header: Hash[256],
   let s_bytes = cast[ptr array[64, byte]](addr s)   # Alias for to interpret s as a byte array
   let s_words = cast[ptr array[16, uint32]](addr s) # Alias for to interpret s as an uint32 array
 
-  s_bytes[0..<32] = header.toByteArrayBE            # We first populate the first 40 bytes of s with the concatenation
+  s_bytes[0..<32] = header.data                     # We first populate the first 40 bytes of s with the concatenation of header and nonce
 
-  when system.cpuEndian == littleEndian:            # ⚠⚠ Warning ⚠⚠, the spec is WRONG compared to tests here
-    s_bytes[32..<40] = cast[array[8,byte]](nonce)   # the nonce should be concatenated with its LITTLE ENDIAN representation
-  else:
-    raise newException(ValueError, "Big endian system not supported yet")
+  var nonceLE{.noInit.}: array[8, byte]             # the nonce should be concatenated with its LITTLE ENDIAN representation
+  littleEndian64(addr nonceLE, unsafeAddr nonce)
+  s_bytes[32..<40] = cast[array[8,byte]](nonceLE)
 
   s = keccak_512 s_bytes[0..<40]                    # TODO: Does this allocate a seq?
 
@@ -200,10 +187,8 @@ proc hashimoto(header: Hash[256],
   for i in countup(0, mix.len - 1, 4):
     cmix[i div 4] = mix[i].fnv(mix[i+1]).fnv(mix[i+2]).fnv(mix[i+3])
 
-  # ⚠⚠ Warning ⚠⚠: Another big endian little endian issue?
-  # result.mix_digest = cast[Hash[256]](
-  #   mapArray(cmix, x.toByteArrayBE) # Each uint32 must be changed to Big endian
-  #   )
+  # ⚠⚠ Warning ⚠⚠: Another bigEndian littleEndian issue?
+  # It doesn't seem like the uint32 in cmix need to be changed to big endian
   result.mix_digest = cast[Hash[256]](cmix)
 
   var concat{.noInit.}: array[64 + 32, byte]
@@ -233,6 +218,5 @@ proc hashimoto_full*(full_size:Natural, dataset: seq[Hash[512]],
 # Defining the seed hash
 
 proc get_seedhash*(block_number: uint64): Hash[256] {.noSideEffect.} =
-  # uint64 are not Ordinal :/
   for i in 0 ..< int(block_number div EPOCH_LENGTH):
-    result = keccak256 result.toByteArrayBE
\ No newline at end of file
+    result = keccak256 result.data
\ No newline at end of file
diff --git a/src/private/casting.nim b/src/private/casting.nim
index 320eafc..3f46f49 100644
--- a/src/private/casting.nim
+++ b/src/private/casting.nim
@@ -3,33 +3,10 @@
 
 import keccak_tiny
 
-type U512* = array[16, uint32]
-  ## A very simple type alias to `xor` Hash[512] with normal integers
-  ## and be able to do sha3_512 which only accepts arrays
-
-  # TODO delete this
-
-proc toU512*(x: Natural): U512 {.inline, noSideEffect.}=
-  when system.cpuEndian == littleEndian:
-    result[0] = x.uint32
-  else:
-    result[result.high] = x.uint32
-
-proc toU512*(x: Hash[512]): U512 {.inline, noSideEffect, noInit.}=
+proc as_u32_words*[N: static[int]](x: Hash[N]): array[N div 32, uint32] {.inline, noSideEffect, noInit.}=
+  # Reinterpret a hash as an array of uint32 words (plain cast: native byte order, no byte swapping)
   cast[type result](x)
 
-proc `xor`*(x, y: U512): U512 {.inline, noSideEffect, noInit.}=
-  for i in 0 ..< result.len:
-    {.unroll: 4.}
-    result[i] = x[i] xor y[i]
-
-proc toHash512*(x: U512): Hash[512] {.inline, noSideEffect, noInit.}=
-  cast[type result](x)
-
-
-# ### Hex conversion
-
-
 type ByteArrayBE*[N: static[int]] = array[N, byte]
   ## A byte array that stores bytes in big-endian order
 
@@ -70,7 +47,6 @@ proc hexToSeqBytesBE*(hexStr: string): seq[byte] {.noSideEffect.}=
 proc toHex*[N: static[int]](ba: ByteArrayBE[N]): string {.noSideEffect.}=
   ## Convert a big-endian byte array to its hex representation
   ## Output is in lowercase
-  ##
 
   const hexChars = "0123456789abcdef"
 
@@ -82,7 +58,6 @@ proc toHex*[N: static[int]](ba: ByteArrayBE[N]): string {.noSideEffect.}=
 proc toHex*(ba: seq[byte]): string {.noSideEffect, noInit.}=
   ## Convert a big-endian byte sequence to its hex representation
   ## Output is in lowercase
-  ##
 
   let N = ba.len
   const hexChars = "0123456789abcdef"
@@ -106,8 +81,5 @@ proc toByteArrayBE*[T: SomeInteger](num: T): ByteArrayBE[T.sizeof] {.noSideEffec
     for i in 0 ..< N:
       result[i] = byte(num shr T((N-1-i) * 8))
 
-proc toByteArrayBE*(x: U512): ByteArrayBE[64] {.inline, noSideEffect, noInit.}=
-  cast[type result](x)
-
 proc toByteArrayBE*[N: static[int]](x: Hash[N]): ByteArrayBE[N div 8] {.inline, noSideEffect, noInit.}=
-  cast[type result](x)
\ No newline at end of file
+  cast[type result](x.data)
\ No newline at end of file
diff --git a/src/private/functional.nim b/src/private/functional.nim
index e99ca10..31dbb48 100644
--- a/src/private/functional.nim
+++ b/src/private/functional.nim
@@ -35,22 +35,3 @@ template zipMap*[N: static[int], T, U](
     result[i] = op
 
   result
-
-
-template mapArray*[N: static[int], T](
-  a: array[N, T],
-  op: untyped): untyped =
-  ## inline map operation
-
-  type outType = type((
-    block:
-      var x{.inject.}: T;
-      op
-  ))
-
-  var result: array[N, outType]
-
-  for i, x {.inject.} in a:
-    {.unroll: 4.}
-    result[i] = op
-  result
\ No newline at end of file
diff --git a/src/private/intmath.nim b/src/private/intmath.nim
index 5cbc0f8..043c3c0 100644
--- a/src/private/intmath.nim
+++ b/src/private/intmath.nim
@@ -28,12 +28,8 @@ proc bit_length*[T: SomeInteger](n: T): T =
       x = x shr 1
       inc(result)
 
-
 # ########### Integer math
 
-proc isOdd*[T: SomeInteger](i: T): bool {.inline, noSideEffect.} =
-  (i and 1.T) != 0
-
 proc isqrt*[T: SomeInteger](n: T):  T =
   ## Integer square root, return the biggest squarable number under n
   ## Computation via Newton method
@@ -58,56 +54,16 @@ type
 proc ldiv(a, b: clong): ldiv_t {.importc: "ldiv", header: "<stdlib.h>".}
 proc lldiv(a, b: clonglong): lldiv_t {.importc: "lldiv", header: "<stdlib.h>".}
 
-proc divmod*(a, b: int32): tuple[quot, rem: clong] {.inline.}=
+proc divmod*(a, b: int32): tuple[quot, rem: clong] {.inline, noSideEffect, noInit.}=
   ## Compute quotient and reminder of integer division in a single intrinsics operation
   # TODO: changing clong to int32 poses an issue for some reason
   cast[type result](ldiv(a,b))
 
-proc divmod*(a, b: int64): tuple[quot, rem: int64] {.inline.}=
+proc divmod*(a, b: int64): tuple[quot, rem: int64] {.inline, noSideEffect, noInit.}=
   ## Compute quotient and reminder of integer division in a single intrinsicsoperation
   cast[type result](lldiv(a,b))
 
-proc divmod*[T: SomeUnsignedInt](a, b: T): tuple[quot, rem: T] {.inline.}=
+proc divmod*[T: SomeUnsignedInt](a, b: T): tuple[quot, rem: T] {.inline, noSideEffect, noInit.}=
   # There is no single instruction for unsigned ints
   # Hopefully the compiler does its work properly
   (a div b, a mod b)
-
-# ############ Modular arithmetics
-
-proc addmod*[T: SomeInteger](a, b, m: T): T =
-  ## Modular addition
-
-  let a_m = if a < m: a
-            else: a mod m
-  if b == 0.T:
-    return a_m
-  let b_m = if b < m: b
-            else: b mod m
-
-  # We don't do a + b to avoid overflows
-  # But we know that m at least is inferior to biggest T
-
-  let b_from_m = m - b_m
-  if a_m >= b_from_m:
-    return a_m - b_from_m
-  return m - b_from_m + a_m
-
-proc doublemod[T: SomeInteger](a, m: T): T {.inline.}=
-  ## double a modulo m. assume a < m
-  result = a
-  if a >= m - a:
-    result -= m
-  result += a
-
-proc mulmod*[T: SomeInteger](a, b, m: T): T =
-  ## Modular multiplication
-
-  var a_m = a mod m
-  var b_m = b mod m
-  if b_m > a_m:
-    swap(a_m, b_m)
-  while b_m > 0.T:
-    if b_m.isOdd:
-      result = addmod(result, a_m, m)
-    a_m = doublemod(a_m, m)
-    b_m = b_m shr 1
\ No newline at end of file
diff --git a/tests/all_tests.nim b/tests/all_tests.nim
index 3602f31..b3c63b7 100644
--- a/tests/all_tests.nim
+++ b/tests/all_tests.nim
@@ -139,7 +139,7 @@ suite "Seed hash":
     var expected: Hash[256]
     for i in countup(0'u32, 30000 * 2048, 30000):
       check: get_seedhash(i) == expected
-      expected = keccak_256(expected.toByteArrayBE)
+      expected = keccak_256(expected.data)
 
 suite "Dagger hashimoto computation":
     # We can't replicate Python's dynamic typing here