1
1
mirror of https://github.com/henrydcase/pqc.git synced 2024-11-24 00:11:27 +00:00
pqcrypto/crypto_kem/hqc-rmrs-128/avx2/reed_solomon.c

352 lines
12 KiB
C
Raw Normal View History

2020-09-07 19:23:34 +01:00
#include "fft.h"
#include "gf.h"
#include "parameters.h"
#include "parsing.h"
2020-09-07 19:23:34 +01:00
#include "reed_solomon.h"
#include <stdint.h>
#include <stdio.h>
#include <string.h>
/**
* @file reed_solomon.c
* Constant time implementation of Reed-Solomon codes
*/
static void compute_syndromes(uint16_t *syndromes, uint8_t *cdw);
2020-09-11 23:19:10 +01:00
static uint16_t compute_elp(uint16_t *sigma, const uint16_t *syndromes);
2020-09-07 19:23:34 +01:00
static void compute_roots(uint8_t *error, uint16_t *sigma);
2020-09-11 23:19:10 +01:00
static void compute_z_poly(uint16_t *z, const uint16_t *sigma, uint16_t degree, const uint16_t *syndromes);
2020-09-07 19:23:34 +01:00
static void compute_error_values(uint16_t *error_values, const uint16_t *z, const uint8_t *error);
static void correct_errors(uint8_t *cdw, const uint16_t *error_values);
/**
* @brief Encodes a message message of PARAM_K bits to a Reed-Solomon codeword codeword of PARAM_N1 bytes
*
* Following @cite lin1983error (Chapter 4 - Cyclic Codes),
* We perform a systematic encoding using a linear (PARAM_N1 - PARAM_K)-stage shift register
* with feedback connections based on the generator polynomial PARAM_RS_POLY of the Reed-Solomon code.
*
* @param[out] cdw Array of size VEC_N1_SIZE_64 receiving the encoded message
* @param[in] msg Array of size VEC_K_SIZE_64 storing the message
*/
void PQCLEAN_HQCRMRS128_AVX2_reed_solomon_encode(uint8_t *cdw, const uint8_t *msg) {
2020-09-14 20:45:24 +01:00
size_t i, j, k;
2020-09-07 19:23:34 +01:00
uint8_t gate_value = 0;
uint16_t tmp[PARAM_G] = {0};
uint16_t PARAM_RS_POLY [] = {RS_POLY_COEFS};
2020-09-14 20:45:24 +01:00
uint8_t prev, x;
2020-09-07 19:23:34 +01:00
2020-09-14 20:45:24 +01:00
for (i = 0; i < PARAM_N1; ++i) {
cdw[i] = 0;
2020-09-07 19:23:34 +01:00
}
2020-09-14 20:45:24 +01:00
for (i = 0; i < PARAM_K; ++i) {
2020-09-14 21:45:04 +01:00
gate_value = (uint8_t) (msg[PARAM_K - 1 - i] ^ cdw[PARAM_N1 - PARAM_K - 1]);
2020-09-07 19:23:34 +01:00
2020-09-14 20:45:24 +01:00
for (j = 0; j < PARAM_G; ++j) {
2020-09-07 19:23:34 +01:00
tmp[j] = PQCLEAN_HQCRMRS128_AVX2_gf_mul(gate_value, PARAM_RS_POLY[j]);
}
2020-09-14 20:45:24 +01:00
prev = 0;
for (k = 0; k < PARAM_N1 - PARAM_K; k++) {
x = cdw[k];
2020-09-14 22:11:08 +01:00
cdw[k] = (uint8_t) (prev ^ tmp[k]);
2020-09-14 20:45:24 +01:00
prev = x;
2020-09-07 19:23:34 +01:00
}
}
memcpy(cdw + PARAM_N1 - PARAM_K, msg, PARAM_K);
2020-09-07 19:23:34 +01:00
}
/**
* @brief Computes 2 * PARAM_DELTA syndromes
*
* @param[out] syndromes Array of size 2 * PARAM_DELTA receiving the computed syndromes
* @param[in] cdw Array of size PARAM_N1 storing the received vector
*/
void compute_syndromes(uint16_t *syndromes, uint8_t *cdw) {
2020-09-10 21:36:42 +01:00
for (size_t i = 0; i < 2 * PARAM_DELTA; ++i) {
for (size_t j = 1; j < PARAM_N1; ++j) {
2020-09-07 19:23:34 +01:00
syndromes[i] ^= PQCLEAN_HQCRMRS128_AVX2_gf_mul(cdw[j], alpha_ij_pow[i][j - 1]);
}
syndromes[i] ^= cdw[0];
}
}
/**
* @brief Computes the error locator polynomial (ELP) sigma
*
* This is a constant time implementation of Berlekamp's simplified algorithm (see @cite lin1983error (Chapter 6 - BCH Codes). <br>
* We use the letter p for rho which is initialized at -1. <br>
* The array X_sigma_p represents the polynomial X^(mu-rho)*sigma_p(X). <br>
* Instead of maintaining a list of sigmas, we update in place both sigma and X_sigma_p. <br>
* sigma_copy serves as a temporary save of sigma in case X_sigma_p needs to be updated. <br>
* We can properly correct only if the degree of sigma does not exceed PARAM_DELTA.
* This means only the first PARAM_DELTA + 1 coefficients of sigma are of value
* and we only need to save its first PARAM_DELTA - 1 coefficients.
*
* @returns the degree of the ELP sigma
* @param[out] sigma Array of size (at least) PARAM_DELTA receiving the ELP
* @param[in] syndromes Array of size (at least) 2*PARAM_DELTA storing the syndromes
*/
2020-09-11 23:19:10 +01:00
static uint16_t compute_elp(uint16_t *sigma, const uint16_t *syndromes) {
uint16_t deg_sigma = 0;
uint16_t deg_sigma_p = 0;
uint16_t deg_sigma_copy = 0;
2020-09-07 19:23:34 +01:00
uint16_t sigma_copy[PARAM_DELTA + 1] = {0};
uint16_t X_sigma_p[PARAM_DELTA + 1] = {0, 1};
2020-09-14 20:45:24 +01:00
uint16_t pp = (uint16_t) -1; // 2*rho
2020-09-07 19:23:34 +01:00
uint16_t d_p = 1;
uint16_t d = syndromes[0];
2020-09-11 23:19:10 +01:00
uint16_t mask1, mask2, mask12;
uint16_t deg_X, deg_X_sigma_p;
uint16_t dd;
uint16_t mu;
uint16_t i;
sigma[0] = 1;
for (mu = 0; (mu < (2 * PARAM_DELTA)); ++mu) {
2020-09-07 19:23:34 +01:00
// Save sigma in case we need it to update X_sigma_p
memcpy(sigma_copy, sigma, 2 * (PARAM_DELTA));
deg_sigma_copy = deg_sigma;
2020-09-11 23:19:10 +01:00
dd = PQCLEAN_HQCRMRS128_AVX2_gf_mul(d, PQCLEAN_HQCRMRS128_AVX2_gf_inverse(d_p));
2020-09-07 19:23:34 +01:00
2020-09-11 23:19:10 +01:00
for (i = 1; (i <= mu + 1) && (i <= PARAM_DELTA); ++i) {
2020-09-07 19:23:34 +01:00
sigma[i] ^= PQCLEAN_HQCRMRS128_AVX2_gf_mul(dd, X_sigma_p[i]);
}
2020-09-11 23:19:10 +01:00
deg_X = mu - pp;
deg_X_sigma_p = deg_X + deg_sigma_p;
2020-09-07 19:23:34 +01:00
// mask1 = 0xffff if(d != 0) and 0 otherwise
2020-09-11 23:19:10 +01:00
mask1 = -((uint16_t) - d >> 15);
2020-09-07 19:23:34 +01:00
// mask2 = 0xffff if(deg_X_sigma_p > deg_sigma) and 0 otherwise
2020-09-11 23:19:10 +01:00
mask2 = -((uint16_t) (deg_sigma - deg_X_sigma_p) >> 15);
2020-09-07 19:23:34 +01:00
// mask12 = 0xffff if the deg_sigma increased and 0 otherwise
2020-09-11 23:19:10 +01:00
mask12 = mask1 & mask2;
deg_sigma ^= mask12 & (deg_X_sigma_p ^ deg_sigma);
2020-09-07 19:23:34 +01:00
if (mu == (2 * PARAM_DELTA - 1)) {
break;
}
2020-09-11 23:19:10 +01:00
pp ^= mask12 & (mu ^ pp);
d_p ^= mask12 & (d ^ d_p);
for (i = PARAM_DELTA; i; --i) {
2020-09-07 19:23:34 +01:00
X_sigma_p[i] = (mask12 & sigma_copy[i - 1]) ^ (~mask12 & X_sigma_p[i - 1]);
}
2020-09-11 23:19:10 +01:00
deg_sigma_p ^= mask12 & (deg_sigma_copy ^ deg_sigma_p);
2020-09-07 19:23:34 +01:00
d = syndromes[mu + 1];
2020-09-11 23:19:10 +01:00
for (i = 1; (i <= mu + 1) && (i <= PARAM_DELTA); ++i) {
2020-09-07 19:23:34 +01:00
d ^= PQCLEAN_HQCRMRS128_AVX2_gf_mul(sigma[i], syndromes[mu + 1 - i]);
}
}
return deg_sigma;
}
/**
* @brief Computes the error polynomial error from the error locator polynomial sigma
*
* See function PQCLEAN_HQCRMRS128_AVX2_fft for more details.
*
* @param[out] error Array of 2^PARAM_M elements receiving the error polynomial
* @param[out] error_compact Array of PARAM_DELTA + PARAM_N1 elements receiving a compact representation of the vector error
* @param[in] sigma Array of 2^PARAM_FFT elements storing the error locator polynomial
*/
static void compute_roots(uint8_t *error, uint16_t *sigma) {
uint16_t w[1 << PARAM_M] = {0};
PQCLEAN_HQCRMRS128_AVX2_fft(w, sigma, PARAM_DELTA + 1);
PQCLEAN_HQCRMRS128_AVX2_fft_retrieve_error_poly(error, w);
}
/**
* @brief Computes the polynomial z(x)
*
* See @cite lin1983error (Chapter 6 - BCH Codes) for more details.
*
* @param[out] z Array of PARAM_DELTA + 1 elements receiving the polynomial z(x)
* @param[in] sigma Array of 2^PARAM_FFT elements storing the error locator polynomial
* @param[in] degree Integer that is the degree of polynomial sigma
* @param[in] syndromes Array of 2 * PARAM_DELTA storing the syndromes
*/
2020-09-11 23:19:10 +01:00
static void compute_z_poly(uint16_t *z, const uint16_t *sigma, uint16_t degree, const uint16_t *syndromes) {
size_t i, j;
uint16_t mask;
2020-09-07 19:23:34 +01:00
z[0] = 1;
2020-09-11 23:19:10 +01:00
for (i = 1; i < PARAM_DELTA + 1; ++i) {
mask = -((uint16_t) (i - degree - 1) >> 15);
z[i] = mask & sigma[i];
2020-09-07 19:23:34 +01:00
}
z[1] ^= syndromes[0];
2020-09-11 23:19:10 +01:00
for (i = 2; i <= PARAM_DELTA; ++i) {
mask = -((uint16_t) (i - degree - 1) >> 15);
z[i] ^= mask & syndromes[i - 1];
2020-09-07 19:23:34 +01:00
2020-09-11 23:19:10 +01:00
for (j = 1; j < i; ++j) {
z[i] ^= mask & PQCLEAN_HQCRMRS128_AVX2_gf_mul(sigma[j], syndromes[i - j - 1]);
2020-09-07 19:23:34 +01:00
}
}
}
/**
* @brief Computes the error values
*
* See @cite lin1983error (Chapter 6 - BCH Codes) for more details.
*
* @param[out] error_values Array of PARAM_DELTA elements receiving the error values
* @param[in] z Array of PARAM_DELTA + 1 elements storing the polynomial z(x)
* @param[in] z_degree Integer that is the degree of polynomial z(x)
* @param[in] error_compact Array of PARAM_DELTA + PARAM_N1 storing compact representation of the error
*/
static void compute_error_values(uint16_t *error_values, const uint16_t *z, const uint8_t *error) {
uint16_t beta_j[PARAM_DELTA] = {0};
uint16_t e_j[PARAM_DELTA] = {0};
2020-09-15 15:33:06 +01:00
uint16_t delta_counter;
2020-09-07 19:23:34 +01:00
uint16_t delta_real_value;
2020-09-15 15:33:06 +01:00
uint16_t found;
uint16_t mask1;
uint16_t mask2;
uint16_t tmp1;
uint16_t tmp2;
uint16_t inverse;
uint16_t inverse_power_j;
2020-09-07 19:23:34 +01:00
// Compute the beta_{j_i} page 31 of the documentation
2020-09-15 15:33:06 +01:00
delta_counter = 0;
2020-09-10 21:36:42 +01:00
for (size_t i = 0; i < PARAM_N1; i++) {
2020-09-15 15:33:06 +01:00
found = 0;
mask1 = (uint16_t) (-((int32_t)error[i]) >> 31); // error[i] != 0
for (size_t j = 0; j < PARAM_DELTA; j++) {
mask2 = ~((uint16_t) (-((int32_t) j ^ delta_counter) >> 31)); // j == delta_counter
beta_j[j] += mask1 & mask2 & gf_exp[i];
found += mask1 & mask2 & 1;
2020-09-07 19:23:34 +01:00
}
delta_counter += found;
}
delta_real_value = delta_counter;
// Compute the e_{j_i} page 31 of the documentation
2020-09-10 21:36:42 +01:00
for (size_t i = 0; i < PARAM_DELTA; ++i) {
2020-09-15 15:33:06 +01:00
tmp1 = 1;
tmp2 = 1;
inverse = PQCLEAN_HQCRMRS128_AVX2_gf_inverse(beta_j[i]);
inverse_power_j = 1;
2020-09-07 19:23:34 +01:00
2020-09-10 21:36:42 +01:00
for (size_t j = 1; j <= PARAM_DELTA; ++j) {
2020-09-07 19:23:34 +01:00
inverse_power_j = PQCLEAN_HQCRMRS128_AVX2_gf_mul(inverse_power_j, inverse);
tmp1 ^= PQCLEAN_HQCRMRS128_AVX2_gf_mul(inverse_power_j, z[j]);
}
2020-09-10 21:36:42 +01:00
for (size_t k = 1; k < PARAM_DELTA; ++k) {
2020-09-07 19:23:34 +01:00
tmp2 = PQCLEAN_HQCRMRS128_AVX2_gf_mul(tmp2, (1 ^ PQCLEAN_HQCRMRS128_AVX2_gf_mul(inverse, beta_j[(i + k) % PARAM_DELTA])));
}
2020-09-15 15:33:06 +01:00
mask1 = (uint16_t) (((int16_t) i - delta_real_value) >> 15); // i < delta_real_value
e_j[i] = mask1 & PQCLEAN_HQCRMRS128_AVX2_gf_mul(tmp1, PQCLEAN_HQCRMRS128_AVX2_gf_inverse(tmp2));
2020-09-07 19:23:34 +01:00
}
// Place the delta e_{j_i} values at the right coordinates of the output vector
delta_counter = 0;
2020-09-10 21:36:42 +01:00
for (size_t i = 0; i < PARAM_N1; ++i) {
2020-09-15 15:33:06 +01:00
found = 0;
mask1 = (uint16_t) (-((int32_t)error[i]) >> 31); // error[i] != 0
2020-09-10 21:36:42 +01:00
for (size_t j = 0; j < PARAM_DELTA; j++) {
2020-09-15 15:33:06 +01:00
mask2 = ~((uint16_t) (-((int32_t) j ^ delta_counter) >> 31)); // j == delta_counter
error_values[i] += mask1 & mask2 & e_j[j];
found += mask1 & mask2 & 1;
2020-09-07 19:23:34 +01:00
}
delta_counter += found;
}
}
/**
* @brief Correct the errors
*
* @param[out] cdw Array of PARAM_N1 elements receiving the corrected vector
* @param[in] error Array of the error vector
* @param[in] error_values Array of PARAM_DELTA elements storing the error values
*/
static void correct_errors(uint8_t *cdw, const uint16_t *error_values) {
2020-09-10 21:36:42 +01:00
for (size_t i = 0; i < PARAM_N1; ++i) {
2020-09-07 19:23:34 +01:00
cdw[i] ^= error_values[i];
}
}
/**
* @brief Decodes the received word
*
* This function relies on six steps:
* <ol>
* <li> The first step, is the computation of the 2*PARAM_DELTA syndromes.
* <li> The second step is the computation of the error-locator polynomial sigma.
* <li> The third step, done by additive FFT, is finding the error-locator numbers by calculating the roots of the polynomial sigma and takings their inverses.
* <li> The fourth step, is the polynomial z(x).
* <li> The fifth step, is the computation of the error values.
* <li> The sixth step is the correction of the errors in the received polynomial.
* </ol>
* For a more complete picture on Reed-Solomon decoding, see Shu. Lin and Daniel J. Costello in Error Control Coding: Fundamentals and Applications @cite lin1983error
*
* @param[out] msg Array of size VEC_K_SIZE_64 receiving the decoded message
* @param[in] cdw Array of size VEC_N1_SIZE_64 storing the received word
*/
void PQCLEAN_HQCRMRS128_AVX2_reed_solomon_decode(uint8_t *msg, uint8_t *cdw) {
2020-09-07 19:23:34 +01:00
uint16_t syndromes[2 * PARAM_DELTA] = {0};
uint16_t sigma[1 << PARAM_FFT] = {0};
uint8_t error[1 << PARAM_M] = {0};
uint16_t z[PARAM_N1] = {0};
uint16_t error_values[PARAM_N1] = {0};
2020-09-11 23:19:10 +01:00
uint16_t deg;
2020-09-07 19:23:34 +01:00
// Calculate the 2*PARAM_DELTA syndromes
compute_syndromes(syndromes, cdw);
2020-09-07 19:23:34 +01:00
// Compute the error locator polynomial sigma
// Sigma's degree is at most PARAM_DELTA but the FFT requires the extra room
2020-09-11 23:19:10 +01:00
deg = compute_elp(sigma, syndromes);
2020-09-07 19:23:34 +01:00
// Compute the error polynomial error
compute_roots(error, sigma);
// Compute the polynomial z(x)
compute_z_poly(z, sigma, deg, syndromes);
// Compute the error values
compute_error_values(error_values, z, error);
// Correct the errors
correct_errors(cdw, error_values);
2020-09-07 19:23:34 +01:00
// Retrieve the message from the decoded codeword
memcpy(msg, cdw + (PARAM_G - 1), PARAM_K);
2020-09-07 19:23:34 +01:00
}