leopard/LeopardFF8.h

201 lines
5.7 KiB
C
Raw Normal View History

2017-05-25 09:24:15 +00:00
/*
Copyright (c) 2017 Christopher A. Taylor. All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:
* Redistributions of source code must retain the above copyright notice,
this list of conditions and the following disclaimer.
* Redistributions in binary form must reproduce the above copyright notice,
this list of conditions and the following disclaimer in the documentation
and/or other materials provided with the distribution.
* Neither the name of Leopard-RS nor the names of its contributors may be
used to endorse or promote products derived from this software without
specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
POSSIBILITY OF SUCH DAMAGE.
*/
#pragma once
#include "LeopardCommon.h"
2017-05-27 03:10:53 +00:00
#ifdef LEO_HAS_FF8
2017-05-25 09:24:15 +00:00
/*
    8-bit Finite Field Math

    This finite field contains 256 elements and so each element is one byte.
    This library is designed for data that is a multiple of 64 bytes in size.

    Algorithms are described in LeopardCommon.h
*/
namespace leopard { namespace ff8 {
//------------------------------------------------------------------------------
// Datatypes and Constants
// Finite field element type: each element occupies exactly one byte
typedef uint8_t ffe_t;

// Number of bits per element
static const unsigned kBits = 8;

// Finite field order: Number of elements in the field (2^kBits)
static const unsigned kOrder = 256;

// Modulus for field operations (kOrder - 1).
// The butterfly declarations in this header single out log_m == kModulus
// as a special case.
static const ffe_t kModulus = 255;

// LFSR Polynomial that generates the field elements:
// 0x11D = x^8 + x^4 + x^3 + x^2 + 1
static const unsigned kPolynomial = 0x11D;
//------------------------------------------------------------------------------
// Fast Walsh-Hadamard Transform (FWHT) (mod kModulus)
// Transform for a variable number of bits (up to kOrder)
// Operates on the array `data`; results are taken mod kModulus per the
// section heading.
// NOTE(review): `bits` presumably is log2 of the number of elements that are
// transformed, so the element count would be at most kOrder (i.e. bits is at
// most kBits) - confirm against the definition.
void FWHT(ffe_t* data, const unsigned bits);
// Transform specialized for the finite field order
// The [kOrder] bound documents the expected element count only: an array
// parameter is adjusted to a plain ffe_t*, so the size is not enforced by
// the compiler.
void FWHT(ffe_t data[kOrder]);
//------------------------------------------------------------------------------
// Multiplies
2017-05-28 01:44:06 +00:00
// x[] = exp(log(y[]) + log_m)
void mul_mem(
2017-05-25 09:24:15 +00:00
void * LEO_RESTRICT x, const void * LEO_RESTRICT y,
2017-05-28 01:44:06 +00:00
ffe_t log_m, uint64_t bytes);
2017-05-25 09:24:15 +00:00
//------------------------------------------------------------------------------
// FFT Operations
2017-05-28 01:44:06 +00:00
/*
2017-05-28 20:50:32 +00:00
Precondition: log_m != kModulus
x[] ^= exp(log(y[]) + log_m)
2017-05-28 01:44:06 +00:00
y[] ^= x[]
*/
2017-05-27 02:51:30 +00:00
void fft_butterfly(
2017-05-25 09:24:15 +00:00
void * LEO_RESTRICT x, void * LEO_RESTRICT y,
2017-05-28 01:44:06 +00:00
ffe_t log_m, uint64_t bytes);
2017-05-25 09:24:15 +00:00
2017-05-28 08:23:03 +00:00
#ifdef LEO_USE_VECTOR4_OPT

/*
    fft_butterfly4

    Unroll 4 rows at a time

    Takes four (x_i, y_i) buffer pairs together with a single log_m and a
    single byte count.  Presumably applies the same operation as
    fft_butterfly() to each pair - confirm against the definition.

    Only declared when LEO_USE_VECTOR4_OPT is defined.
*/
void fft_butterfly4(
    void * LEO_RESTRICT x_0, void * LEO_RESTRICT y_0,
    void * LEO_RESTRICT x_1, void * LEO_RESTRICT y_1,
    void * LEO_RESTRICT x_2, void * LEO_RESTRICT y_2,
    void * LEO_RESTRICT x_3, void * LEO_RESTRICT y_3,
    ffe_t log_m, uint64_t bytes);

#endif // LEO_USE_VECTOR4_OPT
//------------------------------------------------------------------------------
// IFFT Operations
2017-05-28 01:44:06 +00:00
/*
2017-05-28 20:50:32 +00:00
Precondition: log_m != kModulus
2017-05-28 01:44:06 +00:00
y[] ^= x[]
2017-05-28 20:50:32 +00:00
x[] ^= exp(log(y[]) + log_m)
2017-05-28 01:44:06 +00:00
*/
2017-05-27 02:51:30 +00:00
void ifft_butterfly(
2017-05-25 09:24:15 +00:00
void * LEO_RESTRICT x, void * LEO_RESTRICT y,
2017-05-28 01:44:06 +00:00
ffe_t log_m, uint64_t bytes);
2017-05-25 09:24:15 +00:00
2017-05-28 08:23:03 +00:00
#ifdef LEO_USE_VECTOR4_OPT

/*
    ifft_butterfly4

    Unroll 4 rows at a time

    Takes four (x_i, y_i) buffer pairs together with a single log_m and a
    single byte count.  Presumably applies the same operation as
    ifft_butterfly() to each pair - confirm against the definition.

    Only declared when LEO_USE_VECTOR4_OPT is defined.
*/
void ifft_butterfly4(
    void * LEO_RESTRICT x_0, void * LEO_RESTRICT y_0,
    void * LEO_RESTRICT x_1, void * LEO_RESTRICT y_1,
    void * LEO_RESTRICT x_2, void * LEO_RESTRICT y_2,
    void * LEO_RESTRICT x_3, void * LEO_RESTRICT y_3,
    ffe_t log_m, uint64_t bytes);

#endif // LEO_USE_VECTOR4_OPT
//------------------------------------------------------------------------------
// FFT
2017-05-28 20:50:32 +00:00
/*
if (log_m != kModulus)
x[] ^= exp(log(y[]) + log_m)
y[] ^= x[]
*/
2017-05-28 02:39:38 +00:00
void VectorFFTButterfly(
const uint64_t bytes,
unsigned count,
void** x,
void** y,
2017-05-28 20:50:32 +00:00
const ffe_t log_m);
2017-05-28 02:39:38 +00:00
2017-05-28 20:50:32 +00:00
/*
y[] ^= x[]
if (log_m != kModulus)
x[] ^= exp(log(y[]) + log_m)
*/
2017-05-28 02:39:38 +00:00
void VectorIFFTButterfly(
const uint64_t bytes,
unsigned count,
void** x,
void** y,
2017-05-28 20:50:32 +00:00
const ffe_t log_m);
2017-05-28 02:39:38 +00:00
2017-05-27 02:51:30 +00:00
//------------------------------------------------------------------------------
// Reed-Solomon Encode

/*
    ReedSolomonEncode

    buffer_bytes   : Size in bytes (presumably of every buffer - confirm)
    original_count : Number of original buffers (presumably the number of
                     entries in data - confirm)
    recovery_count : Number of recovery buffers
    m              : Caller-computed work size, see the note on the parameter
    data           : Array of input buffer pointers; the array itself is not
                     modified through this parameter
    work           : Array of work buffer pointers

    NOTE(review): m is documented here as including the factor of 2, whereas
    the m parameter of ReedSolomonDecode() is documented without it - confirm
    that the two meanings are intentional.
*/
void ReedSolomonEncode(
    uint64_t buffer_bytes,
    unsigned original_count,
    unsigned recovery_count,
    unsigned m, // = NextPow2(recovery_count) * 2 = work_count
    void* const * const data,
    void** work); // Size of GetEncodeWorkCount()
//------------------------------------------------------------------------------
// Reed-Solomon Decode

/*
    ReedSolomonDecode

    buffer_bytes   : Size in bytes (presumably of every buffer - confirm)
    original_count : Number of entries in original
    recovery_count : Number of entries in recovery
    m, n           : Caller-computed sizes, see the notes on the parameters
    original       : Array of original buffer pointers; the array itself is
                     not modified through this parameter
    recovery       : Array of recovery buffer pointers; the array itself is
                     not modified through this parameter
    work           : Array of n work buffer pointers

    NOTE(review): how missing buffers are marked in original / recovery is
    not stated in this header - confirm against the definition.
*/
void ReedSolomonDecode(
    uint64_t buffer_bytes,
    unsigned original_count,
    unsigned recovery_count,
    unsigned m, // = NextPow2(recovery_count)
    unsigned n, // = NextPow2(m + original_count) = work_count
    void* const * const original, // original_count entries
    void* const * const recovery, // recovery_count entries
    void** work); // n entries
//------------------------------------------------------------------------------
// API
// Runs a self-test of the 8-bit field code.
// Returns false if the self-test fails
// NOTE(review): presumably this also sets up the state used by the other
// ff8 routines and must be called before them - confirm against the
// definition.
bool Initialize();
}} // namespace leopard::ff8
2017-05-27 03:10:53 +00:00
#endif // LEO_HAS_FF8