| // Copyright 2016 Google Inc. |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| #include <assert.h> |
| #include <stdint.h> |
| #include <string.h> |
| |
| #include "cryptoc/p256.h" |
| |
| const p256_int SECP256r1_n = // curve order |
| {{0xfc632551, 0xf3b9cac2, 0xa7179e84, 0xbce6faad, -1, -1, 0, -1}}; |
| |
| const p256_int SECP256r1_nMin2 = // curve order - 2 |
| {{0xfc632551 - 2, 0xf3b9cac2, 0xa7179e84, 0xbce6faad, -1, -1, 0, -1}}; |
| |
| const p256_int SECP256r1_p = // curve field size |
| {{-1, -1, -1, 0, 0, 0, 1, -1 }}; |
| |
| const p256_int SECP256r1_b = // curve b |
| {{0x27d2604b, 0x3bce3c3e, 0xcc53b0f6, 0x651d06b0, |
| 0x769886bc, 0xb3ebbd55, 0xaa3a93e7, 0x5ac635d8}}; |
| |
| static const p256_int p256_one = P256_ONE; |
| |
| |
| void p256_init(p256_int* a) { |
| memset(a, 0, sizeof(*a)); |
| } |
| |
| void p256_clear(p256_int* a) { p256_init(a); } |
| |
| int p256_get_bit(const p256_int* scalar, int bit) { |
| return (P256_DIGIT(scalar, bit / P256_BITSPERDIGIT) |
| >> (bit & (P256_BITSPERDIGIT - 1))) & 1; |
| } |
| |
| int p256_is_zero(const p256_int* a) { |
| int i, result = 0; |
| for (i = 0; i < P256_NDIGITS; ++i) result |= P256_DIGIT(a, i); |
| return !result; |
| } |
| |
| // top, c[] += a[] * b |
| // Returns new top |
| static p256_digit mulAdd(const p256_int* a, |
| p256_digit b, |
| p256_digit top, |
| p256_digit* c) { |
| int i; |
| p256_ddigit carry = 0; |
| |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| carry += *c; |
| carry += (p256_ddigit)P256_DIGIT(a, i) * b; |
| *c++ = (p256_digit)carry; |
| carry >>= P256_BITSPERDIGIT; |
| } |
| return top + (p256_digit)carry; |
| } |
| |
| // top, c[] -= top_a, a[] |
| static p256_digit subTop(p256_digit top_a, |
| const p256_digit* a, |
| p256_digit top_c, |
| p256_digit* c) { |
| int i; |
| p256_sddigit borrow = 0; |
| |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| borrow += *c; |
| borrow -= *a++; |
| *c++ = (p256_digit)borrow; |
| borrow >>= P256_BITSPERDIGIT; |
| } |
| borrow += top_c; |
| borrow -= top_a; |
| top_c = (p256_digit)borrow; |
| assert((borrow >> P256_BITSPERDIGIT) == 0); |
| return top_c; |
| } |
| |
| // top, c[] -= MOD[] & mask (0 or -1) |
| // returns new top. |
| static p256_digit subM(const p256_int* MOD, |
| p256_digit top, |
| p256_digit* c, |
| p256_digit mask) { |
| int i; |
| p256_sddigit borrow = 0; |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| borrow += *c; |
| borrow -= P256_DIGIT(MOD, i) & mask; |
| *c++ = (p256_digit)borrow; |
| borrow >>= P256_BITSPERDIGIT; |
| } |
| return top + (p256_digit)borrow; |
| } |
| |
| // top, c[] += MOD[] & mask (0 or -1) |
| // returns new top. |
| static p256_digit addM(const p256_int* MOD, |
| p256_digit top, |
| p256_digit* c, |
| p256_digit mask) { |
| int i; |
| p256_ddigit carry = 0; |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| carry += *c; |
| carry += P256_DIGIT(MOD, i) & mask; |
| *c++ = (p256_digit)carry; |
| carry >>= P256_BITSPERDIGIT; |
| } |
| return top + (p256_digit)carry; |
| } |
| |
| // c = a * b mod MOD. c can be a and/or b. |
| void p256_modmul(const p256_int* MOD, |
| const p256_int* a, |
| const p256_digit top_b, |
| const p256_int* b, |
| p256_int* c) { |
| p256_digit tmp[P256_NDIGITS * 2 + 1] = { 0 }; |
| p256_digit top = 0; |
| int i; |
| |
| // Multiply/add into tmp. |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| if (i) tmp[i + P256_NDIGITS - 1] = top; |
| top = mulAdd(a, P256_DIGIT(b, i), 0, tmp + i); |
| } |
| |
| // Multiply/add top digit |
| tmp[i + P256_NDIGITS - 1] = top; |
| top = mulAdd(a, top_b, 0, tmp + i); |
| |
| // Reduce tmp, digit by digit. |
| for (; i >= 0; --i) { |
| p256_digit reducer[P256_NDIGITS] = { 0 }; |
| p256_digit top_reducer; |
| |
| // top can be any value at this point. |
| // Guestimate reducer as top * MOD, since msw of MOD is -1. |
| top_reducer = mulAdd(MOD, top, 0, reducer); |
| |
| // Subtract reducer from top | tmp. |
| top = subTop(top_reducer, reducer, top, tmp + i); |
| |
| // top is now either 0 or 1. Make it 0, fixed-timing. |
| assert(top <= 1); |
| |
| top = subM(MOD, top, tmp + i, ~(top - 1)); |
| |
| assert(top == 0); |
| |
| // We have now reduced the top digit off tmp. Fetch new top digit. |
| top = tmp[i + P256_NDIGITS - 1]; |
| } |
| |
| // tmp might still be larger than MOD, yet same bit length. |
| // Make sure it is less, fixed-timing. |
| addM(MOD, 0, tmp, subM(MOD, 0, tmp, -1)); |
| |
| memcpy(c, tmp, P256_NBYTES); |
| } |
| |
| int p256_is_odd(const p256_int* a) { return P256_DIGIT(a, 0) & 1; } |
| int p256_is_even(const p256_int* a) { return !(P256_DIGIT(a, 0) & 1); } |
| |
| p256_digit p256_shl(const p256_int* a, int n, p256_int* b) { |
| int i; |
| p256_digit top = P256_DIGIT(a, P256_NDIGITS - 1); |
| |
| n %= P256_BITSPERDIGIT; |
| for (i = P256_NDIGITS - 1; i > 0; --i) { |
| p256_digit accu = (P256_DIGIT(a, i) << n); |
| accu |= (P256_DIGIT(a, i - 1) >> (P256_BITSPERDIGIT - n)); |
| P256_DIGIT(b, i) = accu; |
| } |
| P256_DIGIT(b, i) = (P256_DIGIT(a, i) << n); |
| |
| top >>= (P256_BITSPERDIGIT - n); |
| |
| return top; |
| } |
| |
| void p256_shr(const p256_int* a, int n, p256_int* b) { |
| int i; |
| |
| n %= P256_BITSPERDIGIT; |
| for (i = 0; i < P256_NDIGITS - 1; ++i) { |
| p256_digit accu = (P256_DIGIT(a, i) >> n); |
| accu |= (P256_DIGIT(a, i + 1) << (P256_BITSPERDIGIT - n)); |
| P256_DIGIT(b, i) = accu; |
| } |
| P256_DIGIT(b, i) = (P256_DIGIT(a, i) >> n); |
| } |
| |
| static void p256_shr1(const p256_int* a, int highbit, p256_int* b) { |
| int i; |
| |
| for (i = 0; i < P256_NDIGITS - 1; ++i) { |
| p256_digit accu = (P256_DIGIT(a, i) >> 1); |
| accu |= (P256_DIGIT(a, i + 1) << (P256_BITSPERDIGIT - 1)); |
| P256_DIGIT(b, i) = accu; |
| } |
| P256_DIGIT(b, i) = (P256_DIGIT(a, i) >> 1) | |
| (highbit << (P256_BITSPERDIGIT - 1)); |
| } |
| |
| // Return -1, 0, 1 for a < b, a == b or a > b respectively. |
| int p256_cmp(const p256_int* a, const p256_int* b) { |
| int i; |
| p256_sddigit borrow = 0; |
| p256_digit notzero = 0; |
| |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| borrow += (p256_sddigit)P256_DIGIT(a, i) - P256_DIGIT(b, i); |
| // Track whether any result digit is ever not zero. |
| // Relies on !!(non-zero) evaluating to 1, e.g., !!(-1) evaluating to 1. |
| notzero |= !!((p256_digit)borrow); |
| borrow >>= P256_BITSPERDIGIT; |
| } |
| return (int)borrow | notzero; |
| } |
| |
| // c = a - b. Returns borrow: 0 or -1. |
| int p256_sub(const p256_int* a, const p256_int* b, p256_int* c) { |
| int i; |
| p256_sddigit borrow = 0; |
| |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| borrow += (p256_sddigit)P256_DIGIT(a, i) - P256_DIGIT(b, i); |
| if (c) P256_DIGIT(c, i) = (p256_digit)borrow; |
| borrow >>= P256_BITSPERDIGIT; |
| } |
| return (int)borrow; |
| } |
| |
| // c = a + b. Returns carry: 0 or 1. |
| int p256_add(const p256_int* a, const p256_int* b, p256_int* c) { |
| int i; |
| p256_ddigit carry = 0; |
| |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| carry += (p256_ddigit)P256_DIGIT(a, i) + P256_DIGIT(b, i); |
| if (c) P256_DIGIT(c, i) = (p256_digit)carry; |
| carry >>= P256_BITSPERDIGIT; |
| } |
| return (int)carry; |
| } |
| |
| // b = a + d. Returns carry, 0 or 1. |
| int p256_add_d(const p256_int* a, p256_digit d, p256_int* b) { |
| int i; |
| p256_ddigit carry = d; |
| |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| carry += (p256_ddigit)P256_DIGIT(a, i); |
| if (b) P256_DIGIT(b, i) = (p256_digit)carry; |
| carry >>= P256_BITSPERDIGIT; |
| } |
| return (int)carry; |
| } |
| |
| // if (mask) dst = src, fixed-timing style. |
| static void copyConditional(const p256_int* src, |
| p256_int* dst, |
| int mask) { |
| int i; |
| for (i = 0; i < P256_NDIGITS; ++i) { |
| p256_digit b = P256_DIGIT(src, i) & mask; // 0 or src[i] |
| b |= P256_DIGIT(dst, i) & ~mask; // dst[i] or 0 |
| P256_DIGIT(dst, i) = b; |
| } |
| } |
| |
// Evaluates to -1 (all bits set) when the low four bits of x are zero, and
// to 0 otherwise.  ((x & 15) - 1) is negative only when (x & 15) == 0; the
// right shift by 31 then spreads the sign bit over the whole word, which
// relies on >> of a negative value being an arithmetic shift.
#define ZEROtoONES(x) (((int32_t)(((x) & 15) - 1)) >> 31)
| |
| // tbl[0] = tbl[idx], fixed-timing style. |
| static void set0ToIdx(p256_int tbl[16], int idx) { |
| int32_t i; |
| tbl[0] = p256_one; |
| for (i = 1; i < 16; ++i) { |
| copyConditional(&tbl[i], &tbl[0], ZEROtoONES(i-idx)); |
| } |
| } |
| |
| // b = 1/a mod MOD, fixed timing, Fermat's little theorem. |
| void p256_modinv(const p256_int* MOD, |
| const p256_int* a, |
| p256_int* b) { |
| p256_int tbl[16]; |
| int i; |
| |
| // tbl[i] = a**i, tbl[0] unused. |
| tbl[1] = *a; |
| for (i = 2; i < 16; ++i) { |
| p256_modmul(MOD, &tbl[i-1], 0, a, &tbl[i]); |
| } |
| |
| *b = p256_one; |
| for (i = 256; i > 0; i -= 4) { |
| int32_t idx = 0; |
| p256_modmul(MOD, b, 0, b, b); |
| p256_modmul(MOD, b, 0, b, b); |
| p256_modmul(MOD, b, 0, b, b); |
| p256_modmul(MOD, b, 0, b, b); |
| idx |= p256_get_bit(&SECP256r1_nMin2, i - 1) << 3; |
| idx |= p256_get_bit(&SECP256r1_nMin2, i - 2) << 2; |
| idx |= p256_get_bit(&SECP256r1_nMin2, i - 3) << 1; |
| idx |= p256_get_bit(&SECP256r1_nMin2, i - 4) << 0; |
| set0ToIdx(tbl, idx); // tbl[0] = tbl[idx] |
| p256_modmul(MOD, b, 0, &tbl[0], &tbl[0]); |
| copyConditional(&tbl[0], b, ~ZEROtoONES(idx)); |
| } |
| } |
| |
| // b = 1/a mod MOD, binary euclid. |
| void p256_modinv_vartime(const p256_int* MOD, |
| const p256_int* a, |
| p256_int* b) { |
| p256_int R = P256_ZERO; |
| p256_int S = P256_ONE; |
| p256_int U = *MOD; |
| p256_int V = *a; |
| |
| for (;;) { |
| if (p256_is_even(&U)) { |
| p256_shr1(&U, 0, &U); |
| if (p256_is_even(&R)) { |
| p256_shr1(&R, 0, &R); |
| } else { |
| // R = (R+MOD)/2 |
| p256_shr1(&R, p256_add(&R, MOD, &R), &R); |
| } |
| } else if (p256_is_even(&V)) { |
| p256_shr1(&V, 0, &V); |
| if (p256_is_even(&S)) { |
| p256_shr1(&S, 0, &S); |
| } else { |
| // S = (S+MOD)/2 |
| p256_shr1(&S, p256_add(&S, MOD, &S) , &S); |
| } |
| } else { // U,V both odd. |
| if (!p256_sub(&V, &U, NULL)) { |
| p256_sub(&V, &U, &V); |
| if (p256_sub(&S, &R, &S)) p256_add(&S, MOD, &S); |
| if (p256_is_zero(&V)) break; // done. |
| } else { |
| p256_sub(&U, &V, &U); |
| if (p256_sub(&R, &S, &R)) p256_add(&R, MOD, &R); |
| } |
| } |
| } |
| |
| p256_mod(MOD, &R, b); |
| } |
| |
| void p256_mod(const p256_int* MOD, |
| const p256_int* in, |
| p256_int* out) { |
| if (out != in) *out = *in; |
| addM(MOD, 0, P256_DIGITS(out), subM(MOD, 0, P256_DIGITS(out), -1)); |
| } |
| |
| // Verify y^2 == x^3 - 3x + b mod p |
| // and 0 < x < p and 0 < y < p |
| int p256_is_valid_point(const p256_int* x, const p256_int* y) { |
| p256_int y2, x3; |
| |
| if (p256_cmp(&SECP256r1_p, x) <= 0 || |
| p256_cmp(&SECP256r1_p, y) <= 0 || |
| p256_is_zero(x) || |
| p256_is_zero(y)) return 0; |
| |
| p256_modmul(&SECP256r1_p, y, 0, y, &y2); // y^2 |
| |
| p256_modmul(&SECP256r1_p, x, 0, x, &x3); // x^2 |
| p256_modmul(&SECP256r1_p, x, 0, &x3, &x3); // x^3 |
| if (p256_sub(&x3, x, &x3)) p256_add(&x3, &SECP256r1_p, &x3); // x^3 - x |
| if (p256_sub(&x3, x, &x3)) p256_add(&x3, &SECP256r1_p, &x3); // x^3 - 2x |
| if (p256_sub(&x3, x, &x3)) p256_add(&x3, &SECP256r1_p, &x3); // x^3 - 3x |
| if (p256_add(&x3, &SECP256r1_b, &x3)) // x^3 - 3x + b |
| p256_sub(&x3, &SECP256r1_p, &x3); |
| if (p256_sub(&x3, &SECP256r1_p, &x3)) // make sure 0 <= x3 < p |
| p256_add(&x3, &SECP256r1_p, &x3); |
| |
| return p256_cmp(&y2, &x3) == 0; |
| } |
| |
| void p256_from_bin(const uint8_t src[P256_NBYTES], p256_int* dst) { |
| int i; |
| const uint8_t* p = &src[0]; |
| |
| for (i = P256_NDIGITS - 1; i >= 0; --i) { |
| P256_DIGIT(dst, i) = |
| (p[0] << 24) | |
| (p[1] << 16) | |
| (p[2] << 8) | |
| p[3]; |
| p += 4; |
| } |
| } |
| |
| void p256_to_bin(const p256_int* src, uint8_t dst[P256_NBYTES]) { |
| int i; |
| uint8_t* p = &dst[0]; |
| |
| for (i = P256_NDIGITS - 1; i >= 0; --i) { |
| p256_digit digit = P256_DIGIT(src, i); |
| p[0] = (uint8_t)(digit >> 24); |
| p[1] = (uint8_t)(digit >> 16); |
| p[2] = (uint8_t)(digit >> 8); |
| p[3] = (uint8_t)(digit); |
| p += 4; |
| } |
| } |