@@ -1,3 +1,8 @@ | |||
from collections import namedtuple | |||
comb_config = namedtuple("comb_config",["n","t","s"]) | |||
wnaf_config = namedtuple("wnaf_config",["fixed","var"]) | |||
field_data = { | |||
"p25519" : { | |||
"gf_desc" : "2^255 - 19", | |||
@@ -22,7 +27,11 @@ curve_data = { | |||
"scalar_bits" : 253, | |||
"d": -121665, | |||
"trace": -0xa6f7cef517bce6b2c09318d2e7ae9f7a, | |||
"mont_base": 9 | |||
"mont_base": 9, | |||
"combs":comb_config(3,5,17), | |||
"wnaf":wnaf_config(5,3), | |||
"window_bits":4 | |||
}, | |||
"ed448goldilocks" : { | |||
"name" : "Ed448-Goldilocks", | |||
@@ -31,7 +40,11 @@ curve_data = { | |||
"scalar_bits" : 446, | |||
"d": -39081, | |||
"trace": 0x10cd77058eec492d944a725bf7a4cf635c8e9c2ab721cf5b5529eec34, | |||
"mont_base": 5 | |||
"mont_base": 5, | |||
"combs":comb_config(5,5,18), | |||
"wnaf":wnaf_config(5,3), | |||
"window_bits":5 | |||
} | |||
} | |||
@@ -1,50 +0,0 @@ | |||
/** | |||
* @file decaf_config.h | |||
* @author Mike Hamburg | |||
* | |||
* @copyright | |||
* Copyright (c) 2015 Cryptography Research, Inc. \n | |||
* Released under the MIT License. See LICENSE.txt for license information. | |||
* | |||
* @brief Configuration for decaf_fast.c | |||
*/ | |||
#ifndef __DECAF_CONFIG_H__ | |||
#define __DECAF_CONFIG_H__ 1 | |||
/** | |||
* Use the Montgomery ladder for direct scalarmul. | |||
* | |||
* The Montgomery ladder is faster than Edwards scalarmul, but providing | |||
* the features Decaf supports (cofactor elimination, twist rejection) | |||
* makes it complicated and adds code. Removing the ladder saves a few | |||
* kilobytes at the cost of perhaps 5-10% overhead in direct scalarmul | |||
* time. | |||
*/ | |||
#define DECAF_USE_MONTGOMERY_LADDER 0 /* FUTURE */ | |||
/** The number of comb tables for fixed base scalarmul. */ | |||
#define DECAF_COMBS_N 3 | |||
/** The number of teeth per comb for fixed base scalarmul. */ | |||
#define DECAF_COMBS_T 5 | |||
/** The comb spacing fixed base scalarmul. */ | |||
#define DECAF_COMBS_S 17 | |||
/** Performance tuning: the width of the fixed window for scalar mul. */ | |||
#define DECAF_WINDOW_BITS 4 | |||
/** | |||
* The number of bits used for the precomputed table in variable-time | |||
* double scalarmul. | |||
*/ | |||
#define DECAF_WNAF_FIXED_TABLE_BITS 5 | |||
/** | |||
* Performance tuning: bits used for the variable table in variable-time | |||
* double scalarmul. | |||
*/ | |||
#define DECAF_WNAF_VAR_TABLE_BITS 3 | |||
#endif /* __DECAF_CONFIG_H__ */ |
@@ -1,50 +0,0 @@ | |||
/** | |||
* @file decaf_config.h | |||
* @author Mike Hamburg | |||
* | |||
* @copyright | |||
* Copyright (c) 2015 Cryptography Research, Inc. \n | |||
* Released under the MIT License. See LICENSE.txt for license information. | |||
* | |||
* @brief Configuration for decaf_fast.c | |||
*/ | |||
#ifndef __DECAF_CONFIG_H__ | |||
#define __DECAF_CONFIG_H__ 1 | |||
/** | |||
* Use the Montgomery ladder for direct scalarmul. | |||
* | |||
* The Montgomery ladder is faster than Edwards scalarmul, but providing | |||
* the features Decaf supports (cofactor elimination, twist rejection) | |||
* makes it complicated and adds code. Removing the ladder saves a few | |||
* kilobytes at the cost of perhaps 5-10% overhead in direct scalarmul | |||
* time. | |||
*/ | |||
#define DECAF_USE_MONTGOMERY_LADDER 1 | |||
/** The number of comb tables for fixed base scalarmul. */ | |||
#define DECAF_COMBS_N 5 | |||
/** The number of teeth per comb for fixed base scalarmul. */ | |||
#define DECAF_COMBS_T 5 | |||
/** The comb spacing fixed base scalarmul. */ | |||
#define DECAF_COMBS_S 18 | |||
/** Performance tuning: the width of the fixed window for scalar mul. */ | |||
#define DECAF_WINDOW_BITS 5 | |||
/** | |||
* The number of bits used for the precomputed table in variable-time | |||
* double scalarmul. | |||
*/ | |||
#define DECAF_WNAF_FIXED_TABLE_BITS 5 | |||
/** | |||
* Performance tuning: bits used for the variable table in variable-time | |||
* double scalarmul. | |||
*/ | |||
#define DECAF_WNAF_VAR_TABLE_BITS 3 | |||
#endif /* __DECAF_CONFIG_H__ */ |
@@ -6,7 +6,6 @@ | |||
#include "word.h" | |||
#include "field.h" | |||
#include "decaf_config.h" | |||
#include <decaf.h> | |||
@@ -20,19 +19,38 @@ | |||
#define IMAGINE_TWIST $(imagine_twist) | |||
#define COFACTOR $(cofactor) | |||
/** Comb config: number of combs, n, t, s. */ | |||
#define COMBS_N $(combs.n) | |||
#define COMBS_T $(combs.t) | |||
#define COMBS_S $(combs.s) | |||
#define DECAF_WINDOW_BITS $(window_bits) | |||
#define DECAF_WNAF_FIXED_TABLE_BITS $(wnaf.fixed) | |||
#define DECAF_WNAF_VAR_TABLE_BITS $(wnaf.var) | |||
static const int EDWARDS_D = $(d); | |||
static const scalar_t sc_p = {{{ $(ser(q,64,"SC_LIMB")) }}}; | |||
static const scalar_t sc_r2 = {{{ $(ser(((2**128)**((scalar_bits+63)/64))%q,64,"SC_LIMB")) }}}; | |||
extern const scalar_t API_NS(point_scalarmul_adjustment); /* TODO: auto template these too. */ | |||
extern const scalar_t API_NS(precomputed_scalarmul_adjustment); | |||
static const scalar_t sc_p = {{{ | |||
$(ser(q,64,"SC_LIMB")) | |||
}}}, sc_r2 = {{{ | |||
$(ser(((2**128)**((scalar_bits+63)/64))%q,64,"SC_LIMB")) | |||
}}}, point_scalarmul_adjustment = {{{ | |||
$(ser((2**(scalar_bits-1+window_bits - ((scalar_bits-1)%window_bits)) - 1) % q,64,"SC_LIMB")) | |||
}}}, precomputed_scalarmul_adjustment = {{{ | |||
$(ser((2**(combs.n*combs.t*combs.s) - 1) % q,64,"SC_LIMB")) | |||
}}}; | |||
static const decaf_word_t MONTGOMERY_FACTOR = (decaf_word_t)0x$("%x" % pow(-q,2**64-1,2**64))ull; | |||
const uint8_t API_NS(x_base_point)[SER_BYTES] /* TODO */ = { | |||
$(ser(mont_base,8)) | |||
}; | |||
#if COFACTOR==8 | |||
static const gf SQRT_ONE_MINUS_D = {FIELD_LITERAL( | |||
$(sqrt_one_minus_d) | |||
)}; | |||
#endif | |||
/* End of template stuff */ | |||
#if (COFACTOR == 8) && !IMAGINE_TWIST | |||
/* FUTURE: Curve41417 doesn't have these properties. */ | |||
@@ -62,7 +80,7 @@ typedef struct { niels_t n; gf z; } __attribute__((aligned(sizeof(big_register_t | |||
pniels_s, pniels_t[1]; | |||
/* Precomputed base */ | |||
struct precomputed_s { niels_t table [DECAF_COMBS_N<<(DECAF_COMBS_T-1)]; }; | |||
struct precomputed_s { niels_t table [COMBS_N<<(COMBS_T-1)]; }; | |||
extern const gf API_NS(precomputed_base_as_fe)[]; | |||
const precomputed_s *API_NS(precomputed_base) = | |||
@@ -916,7 +934,7 @@ void API_NS(point_scalarmul) ( | |||
NTABLE = 1<<(WINDOW-1); | |||
scalar_t scalar1x; | |||
API_NS(scalar_add)(scalar1x, scalar, API_NS(point_scalarmul_adjustment)); | |||
API_NS(scalar_add)(scalar1x, scalar, point_scalarmul_adjustment); | |||
sc_halve(scalar1x,scalar1x,sc_p); | |||
/* Set up a precomputed table with odd multiples of b. */ | |||
@@ -978,9 +996,9 @@ void API_NS(point_double_scalarmul) ( | |||
NTABLE = 1<<(WINDOW-1); | |||
scalar_t scalar1x, scalar2x; | |||
API_NS(scalar_add)(scalar1x, scalarb, API_NS(point_scalarmul_adjustment)); | |||
API_NS(scalar_add)(scalar1x, scalarb, point_scalarmul_adjustment); | |||
sc_halve(scalar1x,scalar1x,sc_p); | |||
API_NS(scalar_add)(scalar2x, scalarc, API_NS(point_scalarmul_adjustment)); | |||
API_NS(scalar_add)(scalar2x, scalarc, point_scalarmul_adjustment); | |||
sc_halve(scalar2x,scalar2x,sc_p); | |||
/* Set up a precomputed table with odd multiples of b. */ | |||
@@ -1054,9 +1072,9 @@ void API_NS(point_dual_scalarmul) ( | |||
NTABLE = 1<<(WINDOW-1); | |||
scalar_t scalar1x, scalar2x; | |||
API_NS(scalar_add)(scalar1x, scalar1, API_NS(point_scalarmul_adjustment)); | |||
API_NS(scalar_add)(scalar1x, scalar1, point_scalarmul_adjustment); | |||
sc_halve(scalar1x,scalar1x,sc_p); | |||
API_NS(scalar_add)(scalar2x, scalar2, API_NS(point_scalarmul_adjustment)); | |||
API_NS(scalar_add)(scalar2x, scalar2, point_scalarmul_adjustment); | |||
sc_halve(scalar2x,scalar2x,sc_p); | |||
/* Set up a precomputed table with odd multiples of b. */ | |||
@@ -1417,7 +1435,7 @@ void API_NS(precompute) ( | |||
precomputed_s *table, | |||
const point_t base | |||
) { | |||
const unsigned int n = DECAF_COMBS_N, t = DECAF_COMBS_T, s = DECAF_COMBS_S; | |||
const unsigned int n = COMBS_N, t = COMBS_T, s = COMBS_S; | |||
assert(n*t*s >= SCALAR_BITS); | |||
point_t working, start, doubles[t-1]; | |||
@@ -1495,10 +1513,10 @@ void API_NS(precomputed_scalarmul) ( | |||
) { | |||
int i; | |||
unsigned j,k; | |||
const unsigned int n = DECAF_COMBS_N, t = DECAF_COMBS_T, s = DECAF_COMBS_S; | |||
const unsigned int n = COMBS_N, t = COMBS_T, s = COMBS_S; | |||
scalar_t scalar1x; | |||
API_NS(scalar_add)(scalar1x, scalar, API_NS(precomputed_scalarmul_adjustment)); | |||
API_NS(scalar_add)(scalar1x, scalar, precomputed_scalarmul_adjustment); | |||
sc_halve(scalar1x,scalar1x,sc_p); | |||
niels_t ni; | |||
@@ -7,21 +7,15 @@ | |||
#include "field.h" | |||
#include "f_field.h" | |||
#include "decaf.h" | |||
#include "decaf_config.h" | |||
#define API_NS(_id) $(c_ns)_##_id | |||
#define SCALAR_BITS $(C_NS)_SCALAR_BITS | |||
static const unsigned char base_point_ser_for_pregen[SER_BYTES] = { | |||
$(decaf_base) | |||
}; | |||
/* To satisfy linker. */ | |||
const gf API_NS(precomputed_base_as_fe)[1]; | |||
const API_NS(scalar_t) API_NS(precomputed_scalarmul_adjustment); | |||
const API_NS(scalar_t) API_NS(point_scalarmul_adjustment); | |||
const API_NS(point_t) API_NS(point_base); | |||
const uint8_t API_NS(x_base_point)[X_PUBLIC_BYTES] = {0}; | |||
struct niels_s; | |||
const gf_s *API_NS(precomputed_wnaf_as_fe); | |||
@@ -31,28 +25,6 @@ void API_NS(precompute_wnafs) ( | |||
struct niels_s *out, | |||
const API_NS(point_t) base | |||
); | |||
static void scalar_print(const char *name, const API_NS(scalar_t) sc) { /* UNIFY */ | |||
printf("const API_NS(scalar_t) %s = {{{\n", name); | |||
const int SCALAR_BYTES = (SCALAR_BITS + 7) / 8; | |||
unsigned char ser[SCALAR_BYTES]; | |||
API_NS(scalar_encode)(ser,sc); | |||
int b=0, i, comma=0; | |||
unsigned long long limb = 0; | |||
for (i=0; i<SCALAR_BYTES; i++) { | |||
limb |= ((uint64_t)ser[i])<<b; | |||
b += 8; | |||
if (b == 64 || i==SCALAR_BYTES-1) { | |||
b = 0; | |||
if (comma) printf(","); | |||
comma = 1; | |||
printf("SC_LIMB(0x%016llx)", limb); | |||
limb = ((uint64_t)ser[i])>>(8-b); | |||
} | |||
} | |||
printf("}}};\n\n"); | |||
} | |||
static void field_print(const gf f) { /* UNIFY */ | |||
unsigned char ser[SER_BYTES]; | |||
gf_serialize(ser,f); | |||
@@ -129,38 +101,5 @@ int main(int argc, char **argv) { | |||
} | |||
printf("\n};\n"); | |||
API_NS(scalar_t) smadj; | |||
API_NS(scalar_copy)(smadj,API_NS(scalar_one)); | |||
for (i=0; i<DECAF_COMBS_N*DECAF_COMBS_T*DECAF_COMBS_S; i++) { | |||
API_NS(scalar_add)(smadj,smadj,smadj); | |||
} | |||
API_NS(scalar_sub)(smadj, smadj, API_NS(scalar_one)); | |||
scalar_print("API_NS(precomputed_scalarmul_adjustment)", smadj); | |||
API_NS(scalar_copy)(smadj,API_NS(scalar_one)); | |||
for (i=0; i<SCALAR_BITS-1 + DECAF_WINDOW_BITS | |||
- ((SCALAR_BITS-1) % DECAF_WINDOW_BITS); i++) { | |||
API_NS(scalar_add)(smadj,smadj,smadj); | |||
} | |||
API_NS(scalar_sub)(smadj, smadj, API_NS(scalar_one)); | |||
scalar_print("API_NS(point_scalarmul_adjustment)", smadj); | |||
API_NS(scalar_sub)(smadj,API_NS(scalar_zero),API_NS(scalar_one)); /* get p-1 */ | |||
/* Generate the Montgomery ladder version of the base point */ | |||
gf base1,base2; | |||
ret = gf_deserialize(base1,base_point_ser_for_pregen); | |||
if (ret != DECAF_SUCCESS) return 1; | |||
gf_sqr(base2,base1); | |||
uint8_t x_ser[X_PUBLIC_BYTES] = {0}; | |||
gf_serialize(x_ser, base2); | |||
printf("const uint8_t API_NS(x_base_point)[%d] = {", X_PUBLIC_BYTES); | |||
for (i=0; i<X_PUBLIC_BYTES; i++) { | |||
printf("%s%s%d",i?",":"",(i%32==0)?"\n ":"",x_ser[i]); | |||
} | |||
printf("\n};\n"); | |||
return 0; | |||
} |