mirror of
https://github.com/codex-storage/nim-leopard.git
synced 2025-01-18 07:01:13 +00:00
41cd86df5b
* initial implementation and tests * [wip] refactor checking of RS code validity * [wip] point GHA badge link to main branch instead of initial_impl * [wip] delete leftover echo at bottom of test_leopard.nim * [wip] add basic usage info to README * [wip] more basic info added to README re: requirements, installation, usage * [wip] add config.nims with --tlsEmulation:off to check if it helps with perf on Windows * [wip] use `object` instead of `object of CatchableError` for LeopardError workaround for edge case encountered in context of nimbus-build-system project * [wip] clarify wording in README re: stability * [wip] can use `object of CatchableError` for LeopardError with workaround * Initial implementation * make Leo a case object * initial test * cleanup * remove echo * use `func` where possible * comments, misc * make construction more convenient * add more tests * more tests * unused warnings * remove sideeffects pragma * fix importc pragma on unix * fix windows build * fix ci * better warning * adding more comprehensive tests * moar tests * add TODO for usage * Update leopard/leopard.nim Co-authored-by: Michael Bradley <michaelsbradleyjr@gmail.com> * Update leopard/wrapper.nim Co-authored-by: Michael Bradley <michaelsbradleyjr@gmail.com> * add tests to reuse same encoder/decoder * check that parity and data buffers are < 65536 * test that data+parity isn't > 65536 Co-authored-by: Michael Bradley, Jr <michaelsbradleyjr@gmail.com>
290 lines
11 KiB
Nim
290 lines
11 KiB
Nim
## Copyright (c) 2017 Christopher A. Taylor. All rights reserved.
|
|
##
|
|
## Redistribution and use in source and binary forms, with or without
|
|
## modification, are permitted provided that the following conditions are met:
|
|
##
|
|
## * Redistributions of source code must retain the above copyright notice,
|
|
## this list of conditions and the following disclaimer.
|
|
## * Redistributions in binary form must reproduce the above copyright notice,
|
|
## this list of conditions and the following disclaimer in the documentation
|
|
## and/or other materials provided with the distribution.
|
|
## * Neither the name of Leopard-RS nor the names of its contributors may be
|
|
## used to endorse or promote products derived from this software without
|
|
## specific prior written permission.
|
|
##
|
|
## THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
## AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
## IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
## ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
|
|
## LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
## CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
## SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
## INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
## CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
## ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
## POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
|
|
## Leopard-RS
|
|
## MDS Reed-Solomon Erasure Correction Codes for Large Data in C
|
|
##
|
|
## Algorithms are described in LeopardCommon.h
|
|
##
|
|
##
|
|
## Inspired by discussion with:
|
|
##
|
|
## Sian-Jhen Lin <sjhenglin@gmail.com> : Author of {1} {3}, basis for Leopard
|
|
## Bulat Ziganshin <bulat.ziganshin@gmail.com> : Author of FastECC
|
|
## Yutaka Sawada <tenfon@outlook.jp> : Author of MultiPar
|
|
##
|
|
##
|
|
## References:
|
|
##
|
|
## {1} S.-J. Lin, T. Y. Al-Naffouri, Y. S. Han, and W.-H. Chung,
|
|
## "Novel Polynomial Basis with Fast Fourier Transform
|
|
## and Its Application to Reed-Solomon Erasure Codes"
|
|
## IEEE Trans. on Information Theory, pp. 6284-6299, November, 2016.
|
|
##
|
|
## {2} D. G. Cantor, "On arithmetical algorithms over finite fields",
|
|
## Journal of Combinatorial Theory, Series A, vol. 50, no. 2, pp. 285-300, 1989.
|
|
##
|
|
## {3} Sian-Jheng Lin, Wei-Ho Chung, "An Efficient (n, k) Information
|
|
## Dispersal Algorithm for High Code Rate System over Fermat Fields,"
|
|
## IEEE Commun. Lett., vol.16, no.12, pp. 2036-2039, Dec. 2012.
|
|
##
|
|
## {4} Plank, J. S., Greenan, K. M., Miller, E. L., "Screaming fast Galois Field
|
|
## arithmetic using Intel SIMD instructions." In: FAST-2013: 11th Usenix
|
|
## Conference on File and Storage Technologies, San Jose, 2013
|
|
|
|
|
|
import pkg/upraises
|
|
push: {.upraises: [].}
|
|
|
|
## -----------------------------------------------------------------------------
|
|
## Build configuration
|
|
|
|
import std/compilesettings
|
|
import std/os
|
|
import std/strutils
|
|
|
|
const
|
|
LeopardCmakeFlags {.strdefine.} =
|
|
when defined(macosx):
|
|
"-DCMAKE_BUILD_TYPE=Release -DENABLE_OPENMP=off"
|
|
elif defined(windows):
|
|
"-G\"MSYS Makefiles\" -DCMAKE_BUILD_TYPE=Release"
|
|
else:
|
|
"-DCMAKE_BUILD_TYPE=Release"
|
|
|
|
LeopardDir {.strdefine.} =
|
|
joinPath(currentSourcePath.parentDir.parentDir, "vendor", "leopard")
|
|
|
|
buildDir = joinPath(querySetting(nimcacheDir), "vendor_leopard")
|
|
|
|
LeopardHeader {.strdefine.} = "leopard.h"
|
|
|
|
LeopardLib {.strdefine.} = joinPath(buildDir, "liblibleopard.a")
|
|
|
|
LeopardCompilerFlags {.strdefine.} =
|
|
when defined(macosx):
|
|
"-I" & LeopardDir
|
|
else:
|
|
"-I" & LeopardDir & " -fopenmp"
|
|
|
|
LeopardLinkerFlags {.strdefine.} =
|
|
when defined(macosx):
|
|
LeopardLib
|
|
else:
|
|
LeopardLib & " -fopenmp"
|
|
|
|
LeopardExtraCompilerFlags {.strdefine.} = ""
|
|
|
|
LeopardExtraLinkerFlags {.strdefine.} = ""
|
|
|
|
static:
|
|
if defined(windows):
|
|
func pathUnix2Win(path: string): string =
|
|
gorge("cygpath -w " & path.strip).strip
|
|
|
|
func pathWin2Unix(path: string): string =
|
|
gorge("cygpath " & path.strip).strip
|
|
|
|
proc bash(cmd: varargs[string]): string =
|
|
gorge(gorge("which bash").pathUnix2Win & " -c '" & cmd.join(" ") & "'")
|
|
|
|
proc bashEx(cmd: varargs[string]): tuple[output: string, exitCode: int] =
|
|
gorgeEx(gorge("which bash").pathUnix2Win & " -c '" & cmd.join(" ") & "'")
|
|
|
|
let
|
|
buildDirUnix = buildDir.pathWin2Unix
|
|
leopardDirUnix = LeopardDir.pathWin2Unix
|
|
if defined(LeopardRebuild): discard bash("rm -rf", buildDirUnix)
|
|
if (bashEx("ls", LeopardLib.pathWin2Unix)).exitCode != 0:
|
|
discard bash("mkdir -p", buildDirUnix)
|
|
let cmd =
|
|
@["cd", buildDirUnix, "&& cmake", leopardDirUnix, LeopardCmakeFlags,
|
|
"&& make"]
|
|
echo "\nBuilding Leopard-RS: " & cmd.join(" ")
|
|
let (output, exitCode) = bashEx cmd
|
|
echo output
|
|
if exitCode != 0:
|
|
discard bash("rm -rf", buildDirUnix)
|
|
raise (ref Defect)(msg: "Failed to build Leopard-RS")
|
|
else:
|
|
if defined(LeopardRebuild): discard gorge "rm -rf " & buildDir
|
|
if gorgeEx("ls " & LeopardLib).exitCode != 0:
|
|
discard gorge "mkdir -p " & buildDir
|
|
let cmd =
|
|
"cd " & buildDir & " && cmake " & LeopardDir & " " & LeopardCmakeFlags &
|
|
" && make"
|
|
echo "\nBuilding Leopard-RS: " & cmd
|
|
let (output, exitCode) = gorgeEx cmd
|
|
echo output
|
|
if exitCode != 0:
|
|
discard gorge "rm -rf " & buildDir
|
|
raise (ref Defect)(msg: "Failed to build Leopard-RS")
|
|
|
|
{.passC: LeopardCompilerFlags & " " & LeopardExtraCompilerFlags.}
|
|
{.passL: LeopardLinkerFlags & " " & LeopardExtraLinkerFlags.}
|
|
|
|
{.pragma: leo, cdecl, header: LeopardHeader.}
|
|
|
|
proc leoInit*(): cint {.leo, importcpp: "leo_init".}
|
|
|
|
## ------------------------------------------------------------------------------
|
|
## Shared Constants / Datatypes
|
|
## Results
|
|
|
|
# TODO: For some reason it's only possibly to use the enum with `ord`
|
|
type
|
|
LeopardResult* = enum
|
|
LeopardCallInitialize = -7, ## Call leo_init() first
|
|
LeopardPlatform = -6, ## Platform is unsupported
|
|
LeopardInvalidInput = -5, ## A function parameter was invalid
|
|
LeopardInvalidCounts = -4, ## Invalid counts provided
|
|
LeopardInvalidSize = -3, ## Buffer size must be a multiple of 64 bytes
|
|
LeopardTooMuchData = -2, ## Buffer counts are too high
|
|
LeopardNeedMoreData = -1, ## Not enough recovery data received
|
|
LeopardSuccess = 0 ## Operation succeeded
|
|
|
|
|
|
## Convert Leopard result to string
|
|
|
|
proc leoResultString*(result: LeopardResult): cstring {.leo, importc: "leo_result_string".}
|
|
## ------------------------------------------------------------------------------
|
|
## Encoder API
|
|
##
|
|
## leo_encode_work_count()
|
|
##
|
|
## Calculate the number of work_data buffers to provide to leo_encode().
|
|
##
|
|
## The sum of original_count + recovery_count must not exceed 65536.
|
|
##
|
|
## Returns the work_count value to pass into leo_encode().
|
|
## Returns 0 on invalid input.
|
|
##
|
|
|
|
proc leoEncodeWorkCount*(originalCount: cuint; recoveryCount: cuint): cuint
|
|
{.leo, importc: "leo_encode_work_count".}
|
|
##
|
|
## leo_encode()
|
|
##
|
|
## Generate recovery data.
|
|
##
|
|
## original_count: Number of original_data[] buffers provided.
|
|
## recovery_count: Number of desired recovery data buffers.
|
|
## buffer_bytes: Number of bytes in each data buffer.
|
|
## original_data: Array of pointers to original data buffers.
|
|
## work_count: Number of work_data[] buffers, from leo_encode_work_count().
|
|
## work_data: Array of pointers to work data buffers.
|
|
##
|
|
## The sum of original_count + recovery_count must not exceed 65536.
|
|
## The recovery_count <= original_count.
|
|
##
|
|
## The buffer_bytes must be a multiple of 64.
|
|
## Each buffer should have the same number of bytes.
|
|
## Even the last piece must be rounded up to the block size.
|
|
##
|
|
## Let buffer_bytes = The number of bytes in each buffer:
|
|
##
|
|
## original_count = static_cast<unsigned>(
|
|
## ((uint64_t)total_bytes + buffer_bytes - 1) / buffer_bytes);
|
|
##
|
|
## Or if the number of pieces is known:
|
|
##
|
|
## buffer_bytes = static_cast<unsigned>(
|
|
## ((uint64_t)total_bytes + original_count - 1) / original_count);
|
|
##
|
|
## Returns Leopard_Success on success.
|
|
## The first set of recovery_count buffers in work_data will be the result.
|
|
## Returns other values on errors.
|
|
##
|
|
|
|
proc leoEncode*(
|
|
bufferBytes: uint64;
|
|
originalCount: cuint;
|
|
recoveryCount: cuint;
|
|
workCount: cuint;
|
|
originalData: ptr pointer;
|
|
workData: ptr pointer): LeopardResult {.leo, importc: "leo_encode".}
|
|
## Number of bytes in each data buffer
|
|
## Number of original_data[] buffer pointers
|
|
## Number of recovery_data[] buffer pointers
|
|
## Number of work_data[] buffer pointers, from leo_encode_work_count()
|
|
## Array of pointers to original data buffers
|
|
##
|
|
|
|
## Array of work buffers
|
|
## ------------------------------------------------------------------------------
|
|
## Decoder API
|
|
##
|
|
## leo_decode_work_count()
|
|
##
|
|
## Calculate the number of work_data buffers to provide to leo_decode().
|
|
##
|
|
## The sum of original_count + recovery_count must not exceed 65536.
|
|
##
|
|
## Returns the work_count value to pass into leo_encode().
|
|
## Returns 0 on invalid input.
|
|
##
|
|
|
|
proc leoDecodeWorkCount*(originalCount: cuint; recoveryCount: cuint): cuint
|
|
{.leo, importc: "leo_decode_work_count".}
|
|
##
|
|
## leo_decode()
|
|
##
|
|
## Decode original data from recovery data.
|
|
##
|
|
## buffer_bytes: Number of bytes in each data buffer.
|
|
## original_count: Number of original_data[] buffers provided.
|
|
## original_data: Array of pointers to original data buffers.
|
|
## recovery_count: Number of recovery_data[] buffers provided.
|
|
## recovery_data: Array of pointers to recovery data buffers.
|
|
## work_count: Number of work_data[] buffers, from leo_decode_work_count().
|
|
## work_data: Array of pointers to recovery data buffers.
|
|
##
|
|
## Lost original/recovery data should be set to NULL.
|
|
##
|
|
## The sum of recovery_count + the number of non-NULL original data must be at
|
|
## least original_count in order to perform recovery.
|
|
##
|
|
## Returns Leopard_Success on success.
|
|
## Returns other values on errors.
|
|
##
|
|
|
|
proc leoDecode*(
|
|
bufferBytes: uint64;
|
|
originalCount: cuint;
|
|
recoveryCount: cuint;
|
|
workCount: cuint;
|
|
originalData: ptr pointer;
|
|
recoveryData: ptr pointer;
|
|
workData: ptr pointer): LeopardResult {.leo, importc: "leo_decode".}
|
|
## Number of bytes in each data buffer
|
|
## Number of original_data[] buffer pointers
|
|
## Number of recovery_data[] buffer pointers
|
|
## Number of buffer pointers in work_data[]
|
|
## Array of original data buffers
|
|
## Array of recovery data buffers
|
|
## Array of work data buffers
|