13status_t hardened_memcpy(uint32_t *restrict dest,
const uint32_t *restrict src,
16 random_order_init(&order, word_len);
23 uintptr_t src_addr = (uintptr_t)src;
24 uintptr_t dest_addr = (uintptr_t)dest;
28 for (; launderw(count) < word_len; count = launderw(count) + 1) {
34 size_t byte_idx = launderw(random_order_advance(&order)) *
sizeof(uint32_t);
41 void *src = (
void *)launderw(src_addr + byte_idx);
42 void *dest = (
void *)launderw(dest_addr + byte_idx);
45 write_32(read_32(src), dest);
50 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
53status_t hardened_memshred(uint32_t *dest,
size_t word_len) {
55 random_order_init(&order, word_len);
59 uintptr_t data_addr = (uintptr_t)dest;
61 for (; count < word_len; count = launderw(count) + 1) {
62 size_t byte_idx = launderw(random_order_advance(&order)) *
sizeof(uint32_t);
66 void *data = (
void *)launderw(data_addr + byte_idx);
75 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
81 random_order_init(&order, word_len);
85 uintptr_t lhs_addr = (uintptr_t)lhs;
86 uintptr_t rhs_addr = (uintptr_t)rhs;
89 uint32_t ones = UINT32_MAX;
93 for (; count < word_len; count = launderw(count) + 1) {
94 size_t byte_idx = launderw(random_order_advance(&order)) *
sizeof(uint32_t);
98 void *av = (
void *)launderw(lhs_addr + byte_idx);
99 void *bv = (
void *)launderw(rhs_addr + byte_idx);
101 uint32_t a = read_32(av);
102 uint32_t b = read_32(bv);
109 zeros = launder32(zeros) | (launder32(a) ^ b);
113 ones = launder32(ones) & (launder32(a) ^ ~b);
118 if (launder32(zeros) == 0) {
123 HARDENED_CHECK_NE(ones, UINT32_MAX);
130 uint32_t ones = UINT32_MAX;
133 random_order_init(&order, len);
137 uintptr_t lhs_addr = (uintptr_t)lhs;
138 uintptr_t rhs_addr = (uintptr_t)rhs;
140 for (; launderw(count) < len; count = launderw(count) + 1) {
141 size_t byte_idx = launderw(random_order_advance(&order));
144 uint8_t *a = (uint8_t *)launderw(lhs_addr + byte_idx);
145 uint8_t *b = (uint8_t *)launderw(rhs_addr + byte_idx);
152 zeros = launder32(zeros) | (launder32((uint32_t)*a) ^ *b);
156 ones = launder32(ones) & (launder32((uint32_t)*a) ^ ~(uint32_t)*b);
161 if (launder32(zeros) == 0) {
166 HARDENED_CHECK_NE(ones, UINT32_MAX);
170status_t hardened_xor(
const uint32_t *restrict x,
const uint32_t *restrict y,
171 size_t word_len, uint32_t *restrict dest) {
173 hardened_memshred(dest, word_len);
176 uint32_t rand[word_len];
177 hardened_memshred(rand, word_len);
180 uintptr_t x_addr = (uintptr_t)x;
181 uintptr_t y_addr = (uintptr_t)y;
182 uintptr_t dest_addr = (uintptr_t)dest;
183 uintptr_t rand_addr = (uintptr_t)&rand;
187 random_order_init(&order, word_len);
192 for (; launderw(count) < word_len; count = launderw(count) + 1) {
193 size_t byte_idx = launderw(random_order_advance(&order)) *
sizeof(uint32_t);
199 uintptr_t xp = x_addr + byte_idx;
200 uintptr_t yp = y_addr + byte_idx;
201 uintptr_t destp = dest_addr + byte_idx;
202 uintptr_t randp = rand_addr + byte_idx;
205 void *xv = (
void *)launderw(xp);
206 void *yv = (
void *)launderw(yp);
207 void *destv = (
void *)launderw(destp);
208 void *randv = (
void *)launderw(randp);
211 write_32(read_32(xv) ^ read_32(randv), destv);
212 write_32(read_32(destv) ^ read_32(yv), destv);
213 write_32(read_32(destv) ^ read_32(randv), destv);
218 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
221status_t hardened_xor_in_place(uint32_t *restrict x,
const uint32_t *restrict y,
225 random_order_init(&order, word_len);
229 uintptr_t x_addr = (uintptr_t)x;
230 uintptr_t y_addr = (uintptr_t)y;
234 for (; launderw(count) < word_len; count = launderw(count) + 1) {
235 size_t byte_idx = launderw(random_order_advance(&order)) *
sizeof(uint32_t);
241 void *xv = (
void *)launderw(x_addr + byte_idx);
242 void *yv = (
void *)launderw(y_addr + byte_idx);
245 write_32(read_32(xv) ^ read_32(yv), xv);
250 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
253status_t randomized_bytecopy(
void *restrict dest,
const void *restrict src,
256 random_order_init(&order, byte_len);
260 uintptr_t src_addr = (uintptr_t)src;
261 uintptr_t dest_addr = (uintptr_t)dest;
263 for (; launderw(count) < byte_len; count = launderw(count) + 1) {
264 size_t byte_idx = launderw(random_order_advance(&order));
267 uint8_t *src_byte_idx = (uint8_t *)launderw(src_addr + byte_idx);
268 uint8_t *dest_byte_idx = (uint8_t *)launderw(dest_addr + byte_idx);
270 *(dest_byte_idx) = *(src_byte_idx);
275 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
278status_t randomized_bytexor_in_place(
void *restrict x,
const void *restrict y,
281 random_order_init(&order, byte_len);
285 uintptr_t x_addr = (uintptr_t)x;
286 uintptr_t y_addr = (uintptr_t)y;
288 for (; launderw(count) < byte_len; count = launderw(count) + 1) {
289 size_t byte_idx = launderw(random_order_advance(&order));
293 uint8_t *x_byte_idx = (uint8_t *)launderw(x_addr + byte_idx);
294 uint8_t *y_byte_idx = (uint8_t *)launderw(y_addr + byte_idx);
296 *(x_byte_idx) = *(x_byte_idx) ^ *(y_byte_idx);
301 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
304#ifdef OT_PLATFORM_RV32
313static inline uint32_t rv32_addc(uint32_t x, uint32_t y, uint32_t *carry) {
314 uint32_t res, next_carry, c1, c2;
315 __asm__ __volatile__(
316 "add %[res], %[x], %[c_in]\n\t"
317 "sltu %[c1], %[res], %[c_in]\n\t"
318 "add %[res], %[res], %[y]\n\t"
319 "sltu %[c2], %[res], %[y]\n\t"
320 "or %[next_c], %[c1], %[c2]"
321 : [res]
"=&r"(res), [next_c]
"=&r"(next_carry), [c1]
"=&r"(c1),
323 : [x]
"r"(x), [y]
"r"(y), [c_in]
"r"(*carry));
336static inline uint32_t rv32_subc(uint32_t x, uint32_t y, uint32_t *borrow) {
337 uint32_t res, next_borrow, b1, b2;
338 __asm__ __volatile__(
339 "sltu %[b1], %[x], %[b_in]\n\t"
340 "sub %[res], %[x], %[b_in]\n\t"
341 "sltu %[b2], %[res], %[y]\n\t"
342 "sub %[res], %[res], %[y]\n\t"
343 "or %[next_b], %[b1], %[b2]"
344 : [res]
"=&r"(res), [next_b]
"=&r"(next_borrow), [b1]
"=&r"(b1),
346 : [x]
"r"(x), [y]
"r"(y), [b_in]
"r"(*borrow));
347 *borrow = next_borrow;
360static inline uint32_t rv32_sel(uint32_t cond, uint32_t a, uint32_t b) {
361 uint32_t res, mask, tmp;
362 __asm__ __volatile__(
363 "neg %[mask], %[cond]\n\t"
365 "xor %[tmp], %[a], %[b]\n\t"
366 "and %[tmp], %[tmp], %[mask]\n\t"
367 "xor %[res], %[b], %[tmp]"
368 : [res]
"=r"(res), [mask]
"=&r"(mask), [tmp]
"=&r"(tmp)
369 : [cond]
"r"(cond), [a]
"r"(a), [b]
"r"(b));
374status_t hardened_add(
const uint32_t *restrict x,
const uint32_t *restrict y,
375 size_t word_len, uint32_t *restrict dest) {
377 hardened_memshred(dest, word_len);
382 for (; launderw(count) < word_len; count = launderw(count) + 1) {
383#ifdef OT_PLATFORM_RV32
384 dest[count] = rv32_addc(x[count], y[count], &carry);
386 uint32_t x_val = x[count];
387 uint32_t y_val = y[count];
389 uint32_t res = x_val + carry;
390 uint32_t next_carry = (res < carry);
393 next_carry += (res < y_val);
401 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
404status_t hardened_sub(
const uint32_t *restrict x,
const uint32_t *restrict y,
405 size_t word_len, uint32_t *restrict dest) {
407 hardened_memshred(dest, word_len);
412 for (; launderw(count) < word_len; count = launderw(count) + 1) {
413#ifdef OT_PLATFORM_RV32
414 dest[count] = rv32_subc(x[count], y[count], &borrow);
416 uint32_t x_val = x[count];
417 uint32_t y_val = y[count];
419 uint32_t res = x_val - borrow;
421 uint32_t next_borrow = (x_val < borrow);
423 next_borrow += (res < y_val);
427 borrow = next_borrow;
432 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
435status_t hardened_sub_mod(
const uint32_t *restrict x,
436 const uint32_t *restrict y,
437 const uint32_t *restrict n,
size_t word_len,
438 uint32_t *restrict dest) {
440 hardened_memshred(dest, word_len);
443 uint32_t temp_sub[word_len];
446 for (; launderw(count) < word_len; count = launderw(count) + 1) {
447#ifdef OT_PLATFORM_RV32
448 temp_sub[count] = rv32_subc(x[count], y[count], &borrow);
450 uint32_t x_val = x[count];
451 uint32_t y_val = y[count];
452 uint32_t res = x_val - borrow;
453 uint32_t next_borrow = (x_val < borrow);
454 next_borrow += (res < y_val);
456 temp_sub[count] = res;
457 borrow = next_borrow;
463 uint32_t temp_add[word_len];
466 for (; launderw(count) < word_len; count = launderw(count) + 1) {
467#ifdef OT_PLATFORM_RV32
468 temp_add[count] = rv32_addc(temp_sub[count], n[count], &carry);
470 uint32_t x_val = temp_sub[count];
471 uint32_t y_val = n[count];
472 uint32_t res = x_val + carry;
473 uint32_t next_carry = (res < carry);
475 next_carry += (res < y_val);
476 temp_add[count] = res;
483 uint32_t is_borrow = launder32(borrow);
486 for (; launderw(count) < word_len; count = launderw(count) + 1) {
487#ifdef OT_PLATFORM_RV32
488 dest[count] = rv32_sel(is_borrow, temp_add[count], temp_sub[count]);
491 uint32_t mask = ~(is_borrow - 1);
493 mask = launder32(mask);
494 dest[count] = (temp_add[count] & launder32(mask)) |
495 (temp_sub[count] & launder32(~mask));
500 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
503status_t hardened_add_mod(
const uint32_t *restrict x,
504 const uint32_t *restrict y,
505 const uint32_t *restrict n,
size_t word_len,
506 uint32_t *restrict dest) {
508 hardened_memshred(dest, word_len);
511 uint32_t temp_add[word_len];
514 for (; launderw(count) < word_len; count = launderw(count) + 1) {
515#ifdef OT_PLATFORM_RV32
516 temp_add[count] = rv32_addc(x[count], y[count], &carry);
518 uint32_t x_val = x[count];
519 uint32_t y_val = y[count];
520 uint32_t res = x_val + carry;
521 uint32_t next_carry = (res < carry);
523 next_carry += (res < y_val);
524 temp_add[count] = res;
531 uint32_t temp_sub[word_len];
534 for (; launderw(count) < word_len; count = launderw(count) + 1) {
535#ifdef OT_PLATFORM_RV32
536 temp_sub[count] = rv32_subc(temp_add[count], n[count], &borrow);
538 uint32_t x_val = temp_add[count];
539 uint32_t y_val = n[count];
540 uint32_t res = x_val - borrow;
541 uint32_t next_borrow = (x_val < borrow);
542 next_borrow += (res < y_val);
544 temp_sub[count] = res;
545 borrow = next_borrow;
550 uint32_t is_ge = launder32(carry) | (1 - launder32(borrow));
553 for (; launderw(count) < word_len; count = launderw(count) + 1) {
554#ifdef OT_PLATFORM_RV32
555 dest[count] = rv32_sel(is_ge, temp_sub[count], temp_add[count]);
557 uint32_t mask = ~(is_ge - 1);
559 mask = launder32(mask);
560 dest[count] = (temp_sub[count] & launder32(mask)) |
561 (temp_add[count] & launder32(~mask));
566 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
569status_t hardened_range_check(
const uint32_t *value,
const uint32_t *N,
572 uint32_t is_zero_acc = 0;
575 for (; launderw(count) < word_len; count = launderw(count) + 1) {
576 uint32_t val_word = value[count];
577 uint32_t n_word = N[count];
580 is_zero_acc = launder32(is_zero_acc) | launder32(val_word);
582#ifdef OT_PLATFORM_RV32
583 (void)rv32_subc(val_word, n_word, &borrow);
586 uint32_t res = val_word - borrow;
587 uint32_t next_borrow = (val_word < borrow);
588 next_borrow += (res < n_word);
590 borrow = next_borrow;
595 uint32_t is_zero = (launder32(is_zero_acc) == 0);
596 uint32_t is_greater_or_eq = (launder32(borrow) == 0);
597 uint32_t is_bad = launder32(is_zero) | launder32(is_greater_or_eq);
599 if (launder32(is_bad) != 0) {
601 .value = (int32_t)launder32((uint32_t)OTCRYPTO_BAD_ARGS.value)};
605 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};
608status_t hardened_mod_reduce(
const uint32_t *value,
const uint32_t *n,
609 size_t word_len, uint32_t *result) {
616 uint32_t r[2 * word_len];
618 uint32_t r_sub[2 * word_len];
623 for (; launderw(i) < 2 * word_len; i = launderw(i) + 1) {
631 for (; launderw(i) > 0; i = launderw(i) - 1) {
632 size_t bit_idx = i - 1;
633 size_t word_idx = bit_idx >> 5;
634 size_t bit_in_word = bit_idx % 32;
639 for (; launderw(j) < 2 * word_len; j = launderw(j) + 1) {
640 uint32_t next_carry = (r[j] >> 31);
641 r[j] = (r[j] << 1) | carry;
647 uint32_t bit = (value[word_idx] >> bit_in_word) & 1;
648 r[0] = r[0] ^ ((r[0] ^ bit) & 1);
653 for (; launderw(j) < word_len; j = launderw(j) + 1) {
654#ifdef OT_PLATFORM_RV32
655 r_sub[j] = rv32_subc(r[j], n[j], &borrow);
657 uint32_t r_word = r[j];
658 uint32_t n_word = n[j];
659 uint32_t res = r_word - borrow;
660 uint32_t next_borrow = (r_word < borrow);
661 next_borrow |= (res < n_word);
664 borrow = next_borrow;
671 for (; launderw(j) < 2 * word_len; j = launderw(j) + 1) {
672#ifdef OT_PLATFORM_RV32
673 r_sub[j] = rv32_subc(r[j], 0, &borrow);
675 uint32_t res = r[j] - borrow;
676 borrow = (r[j] < borrow);
684#ifdef OT_PLATFORM_RV32
685 uint32_t cond = launder32(1 - launder32(borrow));
687 uint32_t mask = borrow - 1;
689 mask = launder32(mask);
693 for (; launderw(j) < 2 * word_len; j = launderw(j) + 1) {
694#ifdef OT_PLATFORM_RV32
695 r[j] = rv32_sel(cond, r_sub[j], r[j]);
697 r[j] = (r_sub[j] & launder32(mask)) | (r[j] & launder32(~mask));
706 TRY(hardened_memcpy(result, r, word_len));
708 return (status_t){.value = (int32_t)launder32((uint32_t)OTCRYPTO_OK.value)};