Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 1 | /* |
Janos Follath | a95f204 | 2022-08-19 12:09:17 +0100 | [diff] [blame] | 2 | * Core bignum functions |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 3 | * |
| 4 | * Copyright The Mbed TLS Contributors |
| 5 | * SPDX-License-Identifier: Apache-2.0 |
| 6 | * |
| 7 | * Licensed under the Apache License, Version 2.0 (the "License"); you may |
| 8 | * not use this file except in compliance with the License. |
| 9 | * You may obtain a copy of the License at |
| 10 | * |
| 11 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 12 | * |
| 13 | * Unless required by applicable law or agreed to in writing, software |
| 14 | * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT |
| 15 | * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 16 | * See the License for the specific language governing permissions and |
| 17 | * limitations under the License. |
| 18 | */ |
| 19 | |
| 20 | #include "common.h" |
| 21 | |
| 22 | #if defined(MBEDTLS_BIGNUM_C) |
| 23 | |
| 24 | #include <string.h> |
| 25 | |
| 26 | #include "mbedtls/error.h" |
| 27 | #include "mbedtls/platform_util.h" |
Gabor Mezei | e1d31c4 | 2022-09-12 16:25:24 +0200 | [diff] [blame] | 28 | #include "constant_time_internal.h" |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 29 | |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 30 | #include "mbedtls/platform.h" |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 31 | |
| 32 | #include "bignum_core.h" |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 33 | #include "bn_mul.h" |
| 34 | #include "constant_time_internal.h" |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 35 | |
Dave Rodgman | 914347b | 2023-04-27 14:20:30 +0100 | [diff] [blame] | 36 | size_t mbedtls_mpi_core_clz(mbedtls_mpi_uint a) |
| 37 | { |
| 38 | #if defined(__has_builtin) |
Agathiyan Bragadeesh | e55a1e1 | 2023-07-17 15:00:19 +0100 | [diff] [blame] | 39 | #if (MBEDTLS_MPI_UINT_MAX == UINT_MAX) && __has_builtin(__builtin_clz) |
| 40 | #define core_clz __builtin_clz |
| 41 | #elif (MBEDTLS_MPI_UINT_MAX == ULONG_MAX) && __has_builtin(__builtin_clzl) |
| 42 | #define core_clz __builtin_clzl |
| 43 | #elif (MBEDTLS_MPI_UINT_MAX == ULLONG_MAX) && __has_builtin(__builtin_clzll) |
| 44 | #define core_clz __builtin_clzll |
Dave Rodgman | 914347b | 2023-04-27 14:20:30 +0100 | [diff] [blame] | 45 | #endif |
| 46 | #endif |
Agathiyan Bragadeesh | e55a1e1 | 2023-07-17 15:00:19 +0100 | [diff] [blame] | 47 | #if defined(core_clz) |
| 48 | return (size_t) core_clz(a); |
Agathiyan Bragadeesh | 271a953 | 2023-07-12 11:15:17 +0100 | [diff] [blame] | 49 | #else |
Dave Rodgman | 914347b | 2023-04-27 14:20:30 +0100 | [diff] [blame] | 50 | size_t j; |
| 51 | mbedtls_mpi_uint mask = (mbedtls_mpi_uint) 1 << (biL - 1); |
| 52 | |
| 53 | for (j = 0; j < biL; j++) { |
| 54 | if (a & mask) { |
| 55 | break; |
| 56 | } |
| 57 | |
| 58 | mask >>= 1; |
| 59 | } |
| 60 | |
| 61 | return j; |
Agathiyan Bragadeesh | 271a953 | 2023-07-12 11:15:17 +0100 | [diff] [blame] | 62 | #endif |
Dave Rodgman | 914347b | 2023-04-27 14:20:30 +0100 | [diff] [blame] | 63 | } |
| 64 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 65 | size_t mbedtls_mpi_core_bitlen(const mbedtls_mpi_uint *A, size_t A_limbs) |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 66 | { |
Dave Rodgman | 880a6b3 | 2023-04-20 09:50:31 +0100 | [diff] [blame] | 67 | int i; |
| 68 | size_t j; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 69 | |
Dave Rodgman | 2e863ec | 2023-04-25 17:34:59 +0100 | [diff] [blame] | 70 | for (i = ((int) A_limbs) - 1; i >= 0; i--) { |
| 71 | if (A[i] != 0) { |
| 72 | j = biL - mbedtls_mpi_core_clz(A[i]); |
| 73 | return (i * biL) + j; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 74 | } |
| 75 | } |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 76 | |
Dave Rodgman | 880a6b3 | 2023-04-20 09:50:31 +0100 | [diff] [blame] | 77 | return 0; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 78 | } |
| 79 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 80 | static mbedtls_mpi_uint mpi_bigendian_to_host(mbedtls_mpi_uint a) |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 81 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 82 | if (MBEDTLS_IS_BIG_ENDIAN) { |
Dave Rodgman | 6d23ff6 | 2022-11-28 14:38:53 +0000 | [diff] [blame] | 83 | /* Nothing to do on bigendian systems. */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 84 | return a; |
| 85 | } else { |
Dave Rodgman | 7e1e7be | 2023-09-05 18:12:33 +0100 | [diff] [blame] | 86 | #if defined(MBEDTLS_HAVE_INT32) |
Dave Rodgman | b7b8c09 | 2023-09-05 20:35:19 +0100 | [diff] [blame] | 87 | return (mbedtls_mpi_uint) MBEDTLS_BSWAP32(a); |
Dave Rodgman | 7e1e7be | 2023-09-05 18:12:33 +0100 | [diff] [blame] | 88 | #elif defined(MBEDTLS_HAVE_INT64) |
Dave Rodgman | b7b8c09 | 2023-09-05 20:35:19 +0100 | [diff] [blame] | 89 | return (mbedtls_mpi_uint) MBEDTLS_BSWAP64(a); |
Dave Rodgman | 7e1e7be | 2023-09-05 18:12:33 +0100 | [diff] [blame] | 90 | #endif |
Dave Rodgman | 6d23ff6 | 2022-11-28 14:38:53 +0000 | [diff] [blame] | 91 | } |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 92 | } |
| 93 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 94 | void mbedtls_mpi_core_bigendian_to_host(mbedtls_mpi_uint *A, |
| 95 | size_t A_limbs) |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 96 | { |
| 97 | mbedtls_mpi_uint *cur_limb_left; |
| 98 | mbedtls_mpi_uint *cur_limb_right; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 99 | if (A_limbs == 0) { |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 100 | return; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 101 | } |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 102 | |
| 103 | /* |
| 104 | * Traverse limbs and |
| 105 | * - adapt byte-order in each limb |
| 106 | * - swap the limbs themselves. |
| 107 | * For that, simultaneously traverse the limbs from left to right |
| 108 | * and from right to left, as long as the left index is not bigger |
| 109 | * than the right index (it's not a problem if limbs is odd and the |
| 110 | * indices coincide in the last iteration). |
| 111 | */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 112 | for (cur_limb_left = A, cur_limb_right = A + (A_limbs - 1); |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 113 | cur_limb_left <= cur_limb_right; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 114 | cur_limb_left++, cur_limb_right--) { |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 115 | mbedtls_mpi_uint tmp; |
| 116 | /* Note that if cur_limb_left == cur_limb_right, |
| 117 | * this code effectively swaps the bytes only once. */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 118 | tmp = mpi_bigendian_to_host(*cur_limb_left); |
| 119 | *cur_limb_left = mpi_bigendian_to_host(*cur_limb_right); |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 120 | *cur_limb_right = tmp; |
| 121 | } |
| 122 | } |
| 123 | |
Gilles Peskine | 6f949ea | 2022-09-20 18:38:35 +0200 | [diff] [blame] | 124 | /* Whether min <= A, in constant time. |
| 125 | * A_limbs must be at least 1. */ |
Dave Rodgman | fd7fab4 | 2023-05-17 14:00:39 +0100 | [diff] [blame] | 126 | mbedtls_ct_condition_t mbedtls_mpi_core_uint_le_mpi(mbedtls_mpi_uint min, |
| 127 | const mbedtls_mpi_uint *A, |
| 128 | size_t A_limbs) |
Gilles Peskine | 6f949ea | 2022-09-20 18:38:35 +0200 | [diff] [blame] | 129 | { |
| 130 | /* min <= least significant limb? */ |
Dave Rodgman | b7825ce | 2023-08-10 11:58:18 +0100 | [diff] [blame] | 131 | mbedtls_ct_condition_t min_le_lsl = mbedtls_ct_uint_ge(A[0], min); |
Gilles Peskine | 6f949ea | 2022-09-20 18:38:35 +0200 | [diff] [blame] | 132 | |
Gilles Peskine | 6b7ce96 | 2022-12-15 15:04:33 +0100 | [diff] [blame] | 133 | /* limbs other than the least significant one are all zero? */ |
Dave Rodgman | fd7fab4 | 2023-05-17 14:00:39 +0100 | [diff] [blame] | 134 | mbedtls_ct_condition_t msll_mask = MBEDTLS_CT_FALSE; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 135 | for (size_t i = 1; i < A_limbs; i++) { |
Dave Rodgman | fd7fab4 | 2023-05-17 14:00:39 +0100 | [diff] [blame] | 136 | msll_mask = mbedtls_ct_bool_or(msll_mask, mbedtls_ct_bool(A[i])); |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 137 | } |
Gilles Peskine | 6f949ea | 2022-09-20 18:38:35 +0200 | [diff] [blame] | 138 | |
| 139 | /* min <= A iff the lowest limb of A is >= min or the other limbs |
| 140 | * are not all zero. */ |
Dave Rodgman | fd7fab4 | 2023-05-17 14:00:39 +0100 | [diff] [blame] | 141 | return mbedtls_ct_bool_or(msll_mask, min_le_lsl); |
Gilles Peskine | 6f949ea | 2022-09-20 18:38:35 +0200 | [diff] [blame] | 142 | } |
| 143 | |
Dave Rodgman | 8ac9a1d | 2023-05-17 15:16:22 +0100 | [diff] [blame] | 144 | mbedtls_ct_condition_t mbedtls_mpi_core_lt_ct(const mbedtls_mpi_uint *A, |
| 145 | const mbedtls_mpi_uint *B, |
| 146 | size_t limbs) |
Dave Rodgman | 7d4f019 | 2023-05-09 14:01:05 +0100 | [diff] [blame] | 147 | { |
Dave Rodgman | 8ac9a1d | 2023-05-17 15:16:22 +0100 | [diff] [blame] | 148 | mbedtls_ct_condition_t ret = MBEDTLS_CT_FALSE, cond = MBEDTLS_CT_FALSE, done = MBEDTLS_CT_FALSE; |
Dave Rodgman | 7d4f019 | 2023-05-09 14:01:05 +0100 | [diff] [blame] | 149 | |
| 150 | for (size_t i = limbs; i > 0; i--) { |
| 151 | /* |
| 152 | * If B[i - 1] < A[i - 1] then A < B is false and the result must |
| 153 | * remain 0. |
| 154 | * |
| 155 | * Again even if we can make a decision, we just mark the result and |
| 156 | * the fact that we are done and continue looping. |
| 157 | */ |
Dave Rodgman | b7825ce | 2023-08-10 11:58:18 +0100 | [diff] [blame] | 158 | cond = mbedtls_ct_uint_lt(B[i - 1], A[i - 1]); |
Dave Rodgman | 8ac9a1d | 2023-05-17 15:16:22 +0100 | [diff] [blame] | 159 | done = mbedtls_ct_bool_or(done, cond); |
Dave Rodgman | 7d4f019 | 2023-05-09 14:01:05 +0100 | [diff] [blame] | 160 | |
| 161 | /* |
| 162 | * If A[i - 1] < B[i - 1] then A < B is true. |
| 163 | * |
| 164 | * Again even if we can make a decision, we just mark the result and |
| 165 | * the fact that we are done and continue looping. |
| 166 | */ |
Dave Rodgman | b7825ce | 2023-08-10 11:58:18 +0100 | [diff] [blame] | 167 | cond = mbedtls_ct_uint_lt(A[i - 1], B[i - 1]); |
Dave Rodgman | 8ac9a1d | 2023-05-17 15:16:22 +0100 | [diff] [blame] | 168 | ret = mbedtls_ct_bool_or(ret, mbedtls_ct_bool_and(cond, mbedtls_ct_bool_not(done))); |
| 169 | done = mbedtls_ct_bool_or(done, cond); |
Dave Rodgman | 7d4f019 | 2023-05-09 14:01:05 +0100 | [diff] [blame] | 170 | } |
| 171 | |
| 172 | /* |
| 173 | * If all the limbs were equal, then the numbers are equal, A < B is false |
| 174 | * and leaving the result 0 is correct. |
| 175 | */ |
| 176 | |
| 177 | return ret; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 178 | } |
| 179 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 180 | void mbedtls_mpi_core_cond_assign(mbedtls_mpi_uint *X, |
| 181 | const mbedtls_mpi_uint *A, |
| 182 | size_t limbs, |
Dave Rodgman | cd2e38b | 2023-05-17 13:31:55 +0100 | [diff] [blame] | 183 | mbedtls_ct_condition_t assign) |
Gabor Mezei | e1d31c4 | 2022-09-12 16:25:24 +0200 | [diff] [blame] | 184 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 185 | if (X == A) { |
Gabor Mezei | e9c013c | 2022-10-10 14:26:57 +0200 | [diff] [blame] | 186 | return; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 187 | } |
Gabor Mezei | e9c013c | 2022-10-10 14:26:57 +0200 | [diff] [blame] | 188 | |
Dave Rodgman | 3b25c40 | 2023-05-18 14:41:06 +0100 | [diff] [blame] | 189 | /* This function is very performance-sensitive for RSA. For this reason |
| 190 | * we have the loop below, instead of calling mbedtls_ct_memcpy_if |
| 191 | * (this is more optimal since here we don't have to handle the case where |
| 192 | * we copy awkwardly sized data). |
| 193 | */ |
| 194 | for (size_t i = 0; i < limbs; i++) { |
| 195 | X[i] = mbedtls_ct_mpi_uint_if(assign, A[i], X[i]); |
| 196 | } |
Gabor Mezei | e1d31c4 | 2022-09-12 16:25:24 +0200 | [diff] [blame] | 197 | } |
| 198 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 199 | void mbedtls_mpi_core_cond_swap(mbedtls_mpi_uint *X, |
| 200 | mbedtls_mpi_uint *Y, |
| 201 | size_t limbs, |
Dave Rodgman | cd2e38b | 2023-05-17 13:31:55 +0100 | [diff] [blame] | 202 | mbedtls_ct_condition_t swap) |
Gabor Mezei | e1d31c4 | 2022-09-12 16:25:24 +0200 | [diff] [blame] | 203 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 204 | if (X == Y) { |
Gabor Mezei | e9c013c | 2022-10-10 14:26:57 +0200 | [diff] [blame] | 205 | return; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 206 | } |
Gabor Mezei | e9c013c | 2022-10-10 14:26:57 +0200 | [diff] [blame] | 207 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 208 | for (size_t i = 0; i < limbs; i++) { |
Gabor Mezei | e5b8585 | 2022-09-30 13:54:02 +0200 | [diff] [blame] | 209 | mbedtls_mpi_uint tmp = X[i]; |
Dave Rodgman | cd2e38b | 2023-05-17 13:31:55 +0100 | [diff] [blame] | 210 | X[i] = mbedtls_ct_mpi_uint_if(swap, Y[i], X[i]); |
| 211 | Y[i] = mbedtls_ct_mpi_uint_if(swap, tmp, Y[i]); |
Gabor Mezei | e1d31c4 | 2022-09-12 16:25:24 +0200 | [diff] [blame] | 212 | } |
Gabor Mezei | e1d31c4 | 2022-09-12 16:25:24 +0200 | [diff] [blame] | 213 | } |
| 214 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 215 | int mbedtls_mpi_core_read_le(mbedtls_mpi_uint *X, |
| 216 | size_t X_limbs, |
| 217 | const unsigned char *input, |
| 218 | size_t input_length) |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 219 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 220 | const size_t limbs = CHARS_TO_LIMBS(input_length); |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 221 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 222 | if (X_limbs < limbs) { |
| 223 | return MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL; |
| 224 | } |
Janos Follath | 2ab2d3e | 2022-08-11 16:13:53 +0100 | [diff] [blame] | 225 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 226 | if (X != NULL) { |
| 227 | memset(X, 0, X_limbs * ciL); |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 228 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 229 | for (size_t i = 0; i < input_length; i++) { |
| 230 | size_t offset = ((i % ciL) << 3); |
| 231 | X[i / ciL] |= ((mbedtls_mpi_uint) input[i]) << offset; |
Janos Follath | ca5688e | 2022-08-19 12:05:28 +0100 | [diff] [blame] | 232 | } |
Gabor Mezei | bf9da1d | 2022-08-12 14:11:56 +0200 | [diff] [blame] | 233 | } |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 234 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 235 | return 0; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 236 | } |
| 237 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 238 | int mbedtls_mpi_core_read_be(mbedtls_mpi_uint *X, |
| 239 | size_t X_limbs, |
| 240 | const unsigned char *input, |
| 241 | size_t input_length) |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 242 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 243 | const size_t limbs = CHARS_TO_LIMBS(input_length); |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 244 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 245 | if (X_limbs < limbs) { |
| 246 | return MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL; |
| 247 | } |
Janos Follath | 2ab2d3e | 2022-08-11 16:13:53 +0100 | [diff] [blame] | 248 | |
Janos Follath | b7a88ec | 2022-08-19 12:24:40 +0100 | [diff] [blame] | 249 | /* If X_limbs is 0, input_length must also be 0 (from previous test). |
| 250 | * Nothing to do. */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 251 | if (X_limbs == 0) { |
| 252 | return 0; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 253 | } |
| 254 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 255 | memset(X, 0, X_limbs * ciL); |
Gabor Mezei | c414ba3 | 2022-08-12 17:47:39 +0200 | [diff] [blame] | 256 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 257 | /* memcpy() with (NULL, 0) is undefined behaviour */ |
| 258 | if (input_length != 0) { |
| 259 | size_t overhead = (X_limbs * ciL) - input_length; |
| 260 | unsigned char *Xp = (unsigned char *) X; |
| 261 | memcpy(Xp + overhead, input, input_length); |
| 262 | } |
| 263 | |
| 264 | mbedtls_mpi_core_bigendian_to_host(X, X_limbs); |
| 265 | |
| 266 | return 0; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 267 | } |
| 268 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 269 | int mbedtls_mpi_core_write_le(const mbedtls_mpi_uint *A, |
| 270 | size_t A_limbs, |
| 271 | unsigned char *output, |
| 272 | size_t output_length) |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 273 | { |
Janos Follath | b7a88ec | 2022-08-19 12:24:40 +0100 | [diff] [blame] | 274 | size_t stored_bytes = A_limbs * ciL; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 275 | size_t bytes_to_copy; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 276 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 277 | if (stored_bytes < output_length) { |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 278 | bytes_to_copy = stored_bytes; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 279 | } else { |
Janos Follath | b7a88ec | 2022-08-19 12:24:40 +0100 | [diff] [blame] | 280 | bytes_to_copy = output_length; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 281 | |
Janos Follath | af3f39c | 2022-08-22 09:06:32 +0100 | [diff] [blame] | 282 | /* The output buffer is smaller than the allocated size of A. |
Janos Follath | b7a88ec | 2022-08-19 12:24:40 +0100 | [diff] [blame] | 283 | * However A may fit if its leading bytes are zero. */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 284 | for (size_t i = bytes_to_copy; i < stored_bytes; i++) { |
| 285 | if (GET_BYTE(A, i) != 0) { |
| 286 | return MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL; |
| 287 | } |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 288 | } |
| 289 | } |
| 290 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 291 | for (size_t i = 0; i < bytes_to_copy; i++) { |
| 292 | output[i] = GET_BYTE(A, i); |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 293 | } |
| 294 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 295 | if (stored_bytes < output_length) { |
| 296 | /* Write trailing 0 bytes */ |
| 297 | memset(output + stored_bytes, 0, output_length - stored_bytes); |
| 298 | } |
| 299 | |
| 300 | return 0; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 301 | } |
| 302 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 303 | int mbedtls_mpi_core_write_be(const mbedtls_mpi_uint *X, |
| 304 | size_t X_limbs, |
| 305 | unsigned char *output, |
| 306 | size_t output_length) |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 307 | { |
| 308 | size_t stored_bytes; |
| 309 | size_t bytes_to_copy; |
| 310 | unsigned char *p; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 311 | |
Janos Follath | b7a88ec | 2022-08-19 12:24:40 +0100 | [diff] [blame] | 312 | stored_bytes = X_limbs * ciL; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 313 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 314 | if (stored_bytes < output_length) { |
Janos Follath | af3f39c | 2022-08-22 09:06:32 +0100 | [diff] [blame] | 315 | /* There is enough space in the output buffer. Write initial |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 316 | * null bytes and record the position at which to start |
| 317 | * writing the significant bytes. In this case, the execution |
| 318 | * trace of this function does not depend on the value of the |
| 319 | * number. */ |
| 320 | bytes_to_copy = stored_bytes; |
Janos Follath | b7a88ec | 2022-08-19 12:24:40 +0100 | [diff] [blame] | 321 | p = output + output_length - stored_bytes; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 322 | memset(output, 0, output_length - stored_bytes); |
| 323 | } else { |
Janos Follath | af3f39c | 2022-08-22 09:06:32 +0100 | [diff] [blame] | 324 | /* The output buffer is smaller than the allocated size of X. |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 325 | * However X may fit if its leading bytes are zero. */ |
Janos Follath | b7a88ec | 2022-08-19 12:24:40 +0100 | [diff] [blame] | 326 | bytes_to_copy = output_length; |
| 327 | p = output; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 328 | for (size_t i = bytes_to_copy; i < stored_bytes; i++) { |
| 329 | if (GET_BYTE(X, i) != 0) { |
| 330 | return MBEDTLS_ERR_MPI_BUFFER_TOO_SMALL; |
| 331 | } |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 332 | } |
| 333 | } |
| 334 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 335 | for (size_t i = 0; i < bytes_to_copy; i++) { |
| 336 | p[bytes_to_copy - i - 1] = GET_BYTE(X, i); |
| 337 | } |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 338 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 339 | return 0; |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 340 | } |
| 341 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 342 | void mbedtls_mpi_core_shift_r(mbedtls_mpi_uint *X, size_t limbs, |
| 343 | size_t count) |
Gilles Peskine | c279b2f | 2022-09-21 15:38:38 +0200 | [diff] [blame] | 344 | { |
| 345 | size_t i, v0, v1; |
| 346 | mbedtls_mpi_uint r0 = 0, r1; |
| 347 | |
| 348 | v0 = count / biL; |
| 349 | v1 = count & (biL - 1); |
| 350 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 351 | if (v0 > limbs || (v0 == limbs && v1 > 0)) { |
| 352 | memset(X, 0, limbs * ciL); |
Gilles Peskine | c279b2f | 2022-09-21 15:38:38 +0200 | [diff] [blame] | 353 | return; |
| 354 | } |
| 355 | |
| 356 | /* |
| 357 | * shift by count / limb_size |
| 358 | */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 359 | if (v0 > 0) { |
| 360 | for (i = 0; i < limbs - v0; i++) { |
Gilles Peskine | c279b2f | 2022-09-21 15:38:38 +0200 | [diff] [blame] | 361 | X[i] = X[i + v0]; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 362 | } |
Gilles Peskine | c279b2f | 2022-09-21 15:38:38 +0200 | [diff] [blame] | 363 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 364 | for (; i < limbs; i++) { |
Gilles Peskine | c279b2f | 2022-09-21 15:38:38 +0200 | [diff] [blame] | 365 | X[i] = 0; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 366 | } |
Gilles Peskine | c279b2f | 2022-09-21 15:38:38 +0200 | [diff] [blame] | 367 | } |
| 368 | |
| 369 | /* |
| 370 | * shift by count % limb_size |
| 371 | */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 372 | if (v1 > 0) { |
| 373 | for (i = limbs; i > 0; i--) { |
Gilles Peskine | c279b2f | 2022-09-21 15:38:38 +0200 | [diff] [blame] | 374 | r1 = X[i - 1] << (biL - v1); |
| 375 | X[i - 1] >>= v1; |
| 376 | X[i - 1] |= r0; |
| 377 | r0 = r1; |
| 378 | } |
| 379 | } |
| 380 | } |
| 381 | |
Minos Galanakis | ec09e25 | 2023-04-20 14:22:16 +0100 | [diff] [blame] | 382 | void mbedtls_mpi_core_shift_l(mbedtls_mpi_uint *X, size_t limbs, |
| 383 | size_t count) |
Minos Galanakis | ad808dd | 2023-04-20 12:18:41 +0100 | [diff] [blame] | 384 | { |
Minos Galanakis | ec09e25 | 2023-04-20 14:22:16 +0100 | [diff] [blame] | 385 | size_t i, v0, v1; |
Minos Galanakis | ad808dd | 2023-04-20 12:18:41 +0100 | [diff] [blame] | 386 | mbedtls_mpi_uint r0 = 0, r1; |
Minos Galanakis | ad808dd | 2023-04-20 12:18:41 +0100 | [diff] [blame] | 387 | |
Minos Galanakis | ec09e25 | 2023-04-20 14:22:16 +0100 | [diff] [blame] | 388 | v0 = count / (biL); |
| 389 | v1 = count & (biL - 1); |
Minos Galanakis | ad808dd | 2023-04-20 12:18:41 +0100 | [diff] [blame] | 390 | |
Minos Galanakis | ad808dd | 2023-04-20 12:18:41 +0100 | [diff] [blame] | 391 | /* |
| 392 | * shift by count / limb_size |
| 393 | */ |
Minos Galanakis | ec09e25 | 2023-04-20 14:22:16 +0100 | [diff] [blame] | 394 | if (v0 > 0) { |
| 395 | for (i = limbs; i > v0; i--) { |
| 396 | X[i - 1] = X[i - v0 - 1]; |
| 397 | } |
Minos Galanakis | ad808dd | 2023-04-20 12:18:41 +0100 | [diff] [blame] | 398 | |
Minos Galanakis | ec09e25 | 2023-04-20 14:22:16 +0100 | [diff] [blame] | 399 | for (; i > 0; i--) { |
| 400 | X[i - 1] = 0; |
| 401 | } |
Minos Galanakis | ad808dd | 2023-04-20 12:18:41 +0100 | [diff] [blame] | 402 | } |
| 403 | |
| 404 | /* |
| 405 | * shift by count % limb_size |
| 406 | */ |
Minos Galanakis | ec09e25 | 2023-04-20 14:22:16 +0100 | [diff] [blame] | 407 | if (v1 > 0) { |
| 408 | for (i = v0; i < limbs; i++) { |
| 409 | r1 = X[i] >> (biL - v1); |
| 410 | X[i] <<= v1; |
| 411 | X[i] |= r0; |
Minos Galanakis | ad808dd | 2023-04-20 12:18:41 +0100 | [diff] [blame] | 412 | r0 = r1; |
| 413 | } |
| 414 | } |
Minos Galanakis | ad808dd | 2023-04-20 12:18:41 +0100 | [diff] [blame] | 415 | } |
| 416 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 417 | mbedtls_mpi_uint mbedtls_mpi_core_add(mbedtls_mpi_uint *X, |
| 418 | const mbedtls_mpi_uint *A, |
| 419 | const mbedtls_mpi_uint *B, |
| 420 | size_t limbs) |
Hanno Becker | c988713 | 2022-08-24 12:54:36 +0100 | [diff] [blame] | 421 | { |
Tom Cosgrove | af7d44b | 2022-08-24 14:05:26 +0100 | [diff] [blame] | 422 | mbedtls_mpi_uint c = 0; |
Gilles Peskine | c279b2f | 2022-09-21 15:38:38 +0200 | [diff] [blame] | 423 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 424 | for (size_t i = 0; i < limbs; i++) { |
Tom Cosgrove | af7d44b | 2022-08-24 14:05:26 +0100 | [diff] [blame] | 425 | mbedtls_mpi_uint t = c + A[i]; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 426 | c = (t < A[i]); |
Tom Cosgrove | af7d44b | 2022-08-24 14:05:26 +0100 | [diff] [blame] | 427 | t += B[i]; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 428 | c += (t < B[i]); |
Tom Cosgrove | af7d44b | 2022-08-24 14:05:26 +0100 | [diff] [blame] | 429 | X[i] = t; |
Hanno Becker | c988713 | 2022-08-24 12:54:36 +0100 | [diff] [blame] | 430 | } |
Tom Cosgrove | af7d44b | 2022-08-24 14:05:26 +0100 | [diff] [blame] | 431 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 432 | return c; |
Hanno Becker | c988713 | 2022-08-24 12:54:36 +0100 | [diff] [blame] | 433 | } |
Gilles Peskine | c279b2f | 2022-09-21 15:38:38 +0200 | [diff] [blame] | 434 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 435 | mbedtls_mpi_uint mbedtls_mpi_core_add_if(mbedtls_mpi_uint *X, |
| 436 | const mbedtls_mpi_uint *A, |
| 437 | size_t limbs, |
| 438 | unsigned cond) |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 439 | { |
Tom Cosgrove | f0c8a8c | 2022-08-30 15:15:02 +0100 | [diff] [blame] | 440 | mbedtls_mpi_uint c = 0; |
| 441 | |
Dave Rodgman | b59b73e | 2023-05-17 15:17:12 +0100 | [diff] [blame] | 442 | mbedtls_ct_condition_t do_add = mbedtls_ct_bool(cond); |
Tom Cosgrove | 9354990 | 2022-08-30 17:41:23 +0100 | [diff] [blame] | 443 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 444 | for (size_t i = 0; i < limbs; i++) { |
Dave Rodgman | 98ddc01 | 2023-08-10 12:11:31 +0100 | [diff] [blame] | 445 | mbedtls_mpi_uint add = mbedtls_ct_mpi_uint_if_else_0(do_add, A[i]); |
Tom Cosgrove | 3bd7bc3 | 2022-09-15 15:55:07 +0100 | [diff] [blame] | 446 | mbedtls_mpi_uint t = c + X[i]; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 447 | c = (t < X[i]); |
Tom Cosgrove | f0c8a8c | 2022-08-30 15:15:02 +0100 | [diff] [blame] | 448 | t += add; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 449 | c += (t < add); |
Tom Cosgrove | 3bd7bc3 | 2022-09-15 15:55:07 +0100 | [diff] [blame] | 450 | X[i] = t; |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 451 | } |
Tom Cosgrove | f0c8a8c | 2022-08-30 15:15:02 +0100 | [diff] [blame] | 452 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 453 | return c; |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 454 | } |
| 455 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 456 | mbedtls_mpi_uint mbedtls_mpi_core_sub(mbedtls_mpi_uint *X, |
| 457 | const mbedtls_mpi_uint *A, |
| 458 | const mbedtls_mpi_uint *B, |
| 459 | size_t limbs) |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 460 | { |
| 461 | mbedtls_mpi_uint c = 0; |
| 462 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 463 | for (size_t i = 0; i < limbs; i++) { |
| 464 | mbedtls_mpi_uint z = (A[i] < c); |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 465 | mbedtls_mpi_uint t = A[i] - c; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 466 | c = (t < B[i]) + z; |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 467 | X[i] = t - B[i]; |
| 468 | } |
| 469 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 470 | return c; |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 471 | } |
| 472 | |
/*
 * Multiply-accumulate step driven by the MULADDC_* macros from bn_mul.h.
 *
 * NOTE(review): judging by the name and the macros used, this presumably
 * computes d += s * b over s_len limbs -- confirm against bn_mul.h.
 *
 * d, d_len: accumulator limb array and its length; updated in place.
 * s, s_len: source limb array and its length.
 * b:        scalar limb handed to the MULADDC_* macros.
 *
 * Returns the carry c left over once all d_len limbs of d have been
 * processed.
 */
mbedtls_mpi_uint mbedtls_mpi_core_mla(mbedtls_mpi_uint *d, size_t d_len,
                                      const mbedtls_mpi_uint *s, size_t s_len,
                                      mbedtls_mpi_uint b)
{
    mbedtls_mpi_uint c = 0; /* carry */
    /*
     * It is a documented precondition of this function that d_len >= s_len.
     * If that's not the case, s_len is clamped down to d_len: this turns
     * what would be a buffer overflow into an incorrect result.
     */
    if (d_len < s_len) {
        s_len = d_len;
    }
    /* Limbs of d beyond the (possibly clamped) length of s; they only take
     * part in the carry propagation at the end. */
    size_t excess_len = d_len - s_len;
    /* Split s_len into blocks of 8 limbs plus a remainder of 0..7 limbs. */
    size_t steps_x8 = s_len / 8;
    size_t steps_x1 = s_len & 7;

    /* NOTE(review): the MULADDC_* macros presumably refer to the locals
     * d, s, c and b by name and advance d and s themselves -- confirm in
     * bn_mul.h before renaming or reordering anything here. */
    while (steps_x8--) {
        MULADDC_X8_INIT
        MULADDC_X8_CORE
        MULADDC_X8_STOP
    }

    while (steps_x1--) {
        MULADDC_X1_INIT
        MULADDC_X1_CORE
        MULADDC_X1_STOP
    }

    /* Ripple the remaining carry through the excess limbs of d. After the
     * addition, *d < c means the limb wrapped around, so a carry of 1 is
     * passed on to the next limb. */
    while (excess_len--) {
        *d += c;
        c = (*d < c);
        d++;
    }

    return c;
}
| 510 | |
Tom Cosgrove | 6af26f3 | 2022-08-24 16:40:55 +0100 | [diff] [blame] | 511 | void mbedtls_mpi_core_mul(mbedtls_mpi_uint *X, |
| 512 | const mbedtls_mpi_uint *A, size_t A_limbs, |
| 513 | const mbedtls_mpi_uint *B, size_t B_limbs) |
Hanno Becker | 4ae890b | 2022-08-24 16:17:52 +0100 | [diff] [blame] | 514 | { |
Tom Cosgrove | 6af26f3 | 2022-08-24 16:40:55 +0100 | [diff] [blame] | 515 | memset(X, 0, (A_limbs + B_limbs) * ciL); |
| 516 | |
| 517 | for (size_t i = 0; i < B_limbs; i++) { |
| 518 | (void) mbedtls_mpi_core_mla(X + i, A_limbs + 1, A, A_limbs, B[i]); |
| 519 | } |
Hanno Becker | 4ae890b | 2022-08-24 16:17:52 +0100 | [diff] [blame] | 520 | } |
| 521 | |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 522 | /* |
| 523 | * Fast Montgomery initialization (thanks to Tom St Denis). |
| 524 | */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 525 | mbedtls_mpi_uint mbedtls_mpi_core_montmul_init(const mbedtls_mpi_uint *N) |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 526 | { |
| 527 | mbedtls_mpi_uint x = N[0]; |
| 528 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 529 | x += ((N[0] + 2) & 4) << 1; |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 530 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 531 | for (unsigned int i = biL; i >= 8; i /= 2) { |
| 532 | x *= (2 - (N[0] * x)); |
| 533 | } |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 534 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 535 | return ~x + 1; |
Tom Cosgrove | b496486 | 2022-08-30 11:57:22 +0100 | [diff] [blame] | 536 | } |
| 537 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 538 | void mbedtls_mpi_core_montmul(mbedtls_mpi_uint *X, |
| 539 | const mbedtls_mpi_uint *A, |
| 540 | const mbedtls_mpi_uint *B, |
| 541 | size_t B_limbs, |
| 542 | const mbedtls_mpi_uint *N, |
| 543 | size_t AN_limbs, |
| 544 | mbedtls_mpi_uint mm, |
| 545 | mbedtls_mpi_uint *T) |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 546 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 547 | memset(T, 0, (2 * AN_limbs + 1) * ciL); |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 548 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 549 | for (size_t i = 0; i < AN_limbs; i++) { |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 550 | /* T = (T + u0*B + u1*N) / 2^biL */ |
Tom Cosgrove | f0b2231 | 2022-08-31 17:57:34 +0100 | [diff] [blame] | 551 | mbedtls_mpi_uint u0 = A[i]; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 552 | mbedtls_mpi_uint u1 = (T[0] + u0 * B[0]) * mm; |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 553 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 554 | (void) mbedtls_mpi_core_mla(T, AN_limbs + 2, B, B_limbs, u0); |
| 555 | (void) mbedtls_mpi_core_mla(T, AN_limbs + 2, N, AN_limbs, u1); |
Tom Cosgrove | 67c9247 | 2022-09-02 13:28:59 +0100 | [diff] [blame] | 556 | |
| 557 | T++; |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 558 | } |
| 559 | |
Tom Cosgrove | f0b2231 | 2022-08-31 17:57:34 +0100 | [diff] [blame] | 560 | /* |
| 561 | * The result we want is (T >= N) ? T - N : T. |
| 562 | * |
| 563 | * For better constant-time properties in this function, we always do the |
| 564 | * subtraction, with the result in X. |
| 565 | * |
| 566 | * We also look to see if there was any carry in the final additions in the |
| 567 | * loop above. |
| 568 | */ |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 569 | |
Tom Cosgrove | 7259463 | 2022-08-24 11:51:58 +0100 | [diff] [blame] | 570 | mbedtls_mpi_uint carry = T[AN_limbs]; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 571 | mbedtls_mpi_uint borrow = mbedtls_mpi_core_sub(X, T, N, AN_limbs); |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 572 | |
| 573 | /* |
Tom Cosgrove | f0b2231 | 2022-08-31 17:57:34 +0100 | [diff] [blame] | 574 | * Using R as the Montgomery radix (auxiliary modulus) i.e. 2^(biL*AN_limbs): |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 575 | * |
Tom Cosgrove | f0b2231 | 2022-08-31 17:57:34 +0100 | [diff] [blame] | 576 | * T can be in one of 3 ranges: |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 577 | * |
Tom Cosgrove | f0b2231 | 2022-08-31 17:57:34 +0100 | [diff] [blame] | 578 | * 1) T < N : (carry, borrow) = (0, 1): we want T |
| 579 | * 2) N <= T < R : (carry, borrow) = (0, 0): we want X |
| 580 | * 3) T >= R : (carry, borrow) = (1, 1): we want X |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 581 | * |
Tom Cosgrove | f0b2231 | 2022-08-31 17:57:34 +0100 | [diff] [blame] | 582 | * and (carry, borrow) = (1, 0) can't happen. |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 583 | * |
| 584 | * So the correct return value is already in X if (carry ^ borrow) = 0, |
Tom Cosgrove | 7259463 | 2022-08-24 11:51:58 +0100 | [diff] [blame] | 585 | * but is in (the lower AN_limbs limbs of) T if (carry ^ borrow) = 1. |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 586 | */ |
Dave Rodgman | 231a516 | 2023-05-17 15:13:14 +0100 | [diff] [blame] | 587 | mbedtls_ct_memcpy_if(mbedtls_ct_bool(carry ^ borrow), |
| 588 | (unsigned char *) X, |
| 589 | (unsigned char *) T, |
| 590 | NULL, |
| 591 | AN_limbs * sizeof(mbedtls_mpi_uint)); |
Tom Cosgrove | 958fd3d | 2022-08-24 11:08:51 +0100 | [diff] [blame] | 592 | } |
| 593 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 594 | int mbedtls_mpi_core_get_mont_r2_unsafe(mbedtls_mpi *X, |
| 595 | const mbedtls_mpi *N) |
Hanno Becker | ec440f2 | 2022-08-11 17:29:32 +0100 | [diff] [blame] | 596 | { |
| 597 | int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED; |
| 598 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 599 | MBEDTLS_MPI_CHK(mbedtls_mpi_lset(X, 1)); |
| 600 | MBEDTLS_MPI_CHK(mbedtls_mpi_shift_l(X, N->n * 2 * biL)); |
| 601 | MBEDTLS_MPI_CHK(mbedtls_mpi_mod_mpi(X, X, N)); |
| 602 | MBEDTLS_MPI_CHK(mbedtls_mpi_shrink(X, N->n)); |
Hanno Becker | ec440f2 | 2022-08-11 17:29:32 +0100 | [diff] [blame] | 603 | |
| 604 | cleanup: |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 605 | return ret; |
Hanno Becker | ec440f2 | 2022-08-11 17:29:32 +0100 | [diff] [blame] | 606 | } |
| 607 | |
Janos Follath | 59cbd1b | 2022-10-28 18:13:43 +0100 | [diff] [blame] | 608 | MBEDTLS_STATIC_TESTABLE |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 609 | void mbedtls_mpi_core_ct_uint_table_lookup(mbedtls_mpi_uint *dest, |
| 610 | const mbedtls_mpi_uint *table, |
| 611 | size_t limbs, |
| 612 | size_t count, |
| 613 | size_t index) |
Janos Follath | e50f2f1 | 2022-10-26 15:14:33 +0100 | [diff] [blame] | 614 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 615 | for (size_t i = 0; i < count; i++, table += limbs) { |
Dave Rodgman | b7825ce | 2023-08-10 11:58:18 +0100 | [diff] [blame] | 616 | mbedtls_ct_condition_t assign = mbedtls_ct_uint_eq(i, index); |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 617 | mbedtls_mpi_core_cond_assign(dest, table, limbs, assign); |
Janos Follath | e50f2f1 | 2022-10-26 15:14:33 +0100 | [diff] [blame] | 618 | } |
| 619 | } |
| 620 | |
Gilles Peskine | 009d195 | 2022-09-09 21:00:00 +0200 | [diff] [blame] | 621 | /* Fill X with n_bytes random bytes. |
| 622 | * X must already have room for those bytes. |
| 623 | * The ordering of the bytes returned from the RNG is suitable for |
Gilles Peskine | 22cdd0c | 2022-10-27 20:15:13 +0200 | [diff] [blame] | 624 | * deterministic ECDSA (see RFC 6979 §3.3 and the specification of |
| 625 | * mbedtls_mpi_core_random()). |
Gilles Peskine | 009d195 | 2022-09-09 21:00:00 +0200 | [diff] [blame] | 626 | */ |
| 627 | int mbedtls_mpi_core_fill_random( |
| 628 | mbedtls_mpi_uint *X, size_t X_limbs, |
| 629 | size_t n_bytes, |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 630 | int (*f_rng)(void *, unsigned char *, size_t), void *p_rng) |
Gilles Peskine | 009d195 | 2022-09-09 21:00:00 +0200 | [diff] [blame] | 631 | { |
| 632 | int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 633 | const size_t limbs = CHARS_TO_LIMBS(n_bytes); |
| 634 | const size_t overhead = (limbs * ciL) - n_bytes; |
Gilles Peskine | 009d195 | 2022-09-09 21:00:00 +0200 | [diff] [blame] | 635 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 636 | if (X_limbs < limbs) { |
| 637 | return MBEDTLS_ERR_MPI_BAD_INPUT_DATA; |
| 638 | } |
Gilles Peskine | 009d195 | 2022-09-09 21:00:00 +0200 | [diff] [blame] | 639 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 640 | memset(X, 0, overhead); |
| 641 | memset((unsigned char *) X + limbs * ciL, 0, (X_limbs - limbs) * ciL); |
| 642 | MBEDTLS_MPI_CHK(f_rng(p_rng, (unsigned char *) X + overhead, n_bytes)); |
| 643 | mbedtls_mpi_core_bigendian_to_host(X, limbs); |
Gilles Peskine | 009d195 | 2022-09-09 21:00:00 +0200 | [diff] [blame] | 644 | |
| 645 | cleanup: |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 646 | return ret; |
Gilles Peskine | 009d195 | 2022-09-09 21:00:00 +0200 | [diff] [blame] | 647 | } |
| 648 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 649 | int mbedtls_mpi_core_random(mbedtls_mpi_uint *X, |
| 650 | mbedtls_mpi_uint min, |
| 651 | const mbedtls_mpi_uint *N, |
| 652 | size_t limbs, |
| 653 | int (*f_rng)(void *, unsigned char *, size_t), |
| 654 | void *p_rng) |
Gilles Peskine | 70375b2 | 2022-09-21 15:47:23 +0200 | [diff] [blame] | 655 | { |
Dave Rodgman | fd492ab | 2023-05-17 15:17:29 +0100 | [diff] [blame] | 656 | mbedtls_ct_condition_t ge_lower = MBEDTLS_CT_TRUE, lt_upper = MBEDTLS_CT_FALSE; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 657 | size_t n_bits = mbedtls_mpi_core_bitlen(N, limbs); |
| 658 | size_t n_bytes = (n_bits + 7) / 8; |
Gilles Peskine | 70375b2 | 2022-09-21 15:47:23 +0200 | [diff] [blame] | 659 | int ret = MBEDTLS_ERR_ERROR_CORRUPTION_DETECTED; |
| 660 | |
| 661 | /* |
| 662 | * When min == 0, each try has at worst a probability 1/2 of failing |
| 663 | * (the msb has a probability 1/2 of being 0, and then the result will |
| 664 | * be < N), so after 30 tries failure probability is a most 2**(-30). |
| 665 | * |
| 666 | * When N is just below a power of 2, as is the case when generating |
| 667 | * a random scalar on most elliptic curves, 1 try is enough with |
| 668 | * overwhelming probability. When N is just above a power of 2, |
| 669 | * as when generating a random scalar on secp224k1, each try has |
| 670 | * a probability of failing that is almost 1/2. |
| 671 | * |
| 672 | * The probabilities are almost the same if min is nonzero but negligible |
| 673 | * compared to N. This is always the case when N is crypto-sized, but |
| 674 | * it's convenient to support small N for testing purposes. When N |
| 675 | * is small, use a higher repeat count, otherwise the probability of |
| 676 | * failure is macroscopic. |
| 677 | */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 678 | int count = (n_bytes > 4 ? 30 : 250); |
Gilles Peskine | 70375b2 | 2022-09-21 15:47:23 +0200 | [diff] [blame] | 679 | |
| 680 | /* |
| 681 | * Match the procedure given in RFC 6979 §3.3 (deterministic ECDSA) |
| 682 | * when f_rng is a suitably parametrized instance of HMAC_DRBG: |
| 683 | * - use the same byte ordering; |
| 684 | * - keep the leftmost n_bits bits of the generated octet string; |
| 685 | * - try until result is in the desired range. |
| 686 | * This also avoids any bias, which is especially important for ECDSA. |
| 687 | */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 688 | do { |
| 689 | MBEDTLS_MPI_CHK(mbedtls_mpi_core_fill_random(X, limbs, |
| 690 | n_bytes, |
| 691 | f_rng, p_rng)); |
| 692 | mbedtls_mpi_core_shift_r(X, limbs, 8 * n_bytes - n_bits); |
Gilles Peskine | 70375b2 | 2022-09-21 15:47:23 +0200 | [diff] [blame] | 693 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 694 | if (--count == 0) { |
Gilles Peskine | 70375b2 | 2022-09-21 15:47:23 +0200 | [diff] [blame] | 695 | ret = MBEDTLS_ERR_MPI_NOT_ACCEPTABLE; |
| 696 | goto cleanup; |
| 697 | } |
| 698 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 699 | ge_lower = mbedtls_mpi_core_uint_le_mpi(min, X, limbs); |
| 700 | lt_upper = mbedtls_mpi_core_lt_ct(X, N, limbs); |
Dave Rodgman | fd492ab | 2023-05-17 15:17:29 +0100 | [diff] [blame] | 701 | } while (mbedtls_ct_bool_and(ge_lower, lt_upper) == MBEDTLS_CT_FALSE); |
Gilles Peskine | 70375b2 | 2022-09-21 15:47:23 +0200 | [diff] [blame] | 702 | |
| 703 | cleanup: |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 704 | return ret; |
Gilles Peskine | 70375b2 | 2022-09-21 15:47:23 +0200 | [diff] [blame] | 705 | } |
| 706 | |
/*
 * Choose the exponentiation window size (in bits) for an exponent of
 * Ebits bits.
 *
 * Larger exponents get larger windows, capped by the compile-time setting
 * MBEDTLS_MPI_WINDOW_SIZE. Exponents of 79 bits or fewer always get a
 * window size of 1.
 */
static size_t exp_mod_get_window_size(size_t Ebits)
{
#if MBEDTLS_MPI_WINDOW_SIZE >= 6
    if (Ebits > 671) {
        return 6;
    }
    if (Ebits > 239) {
        return 5;
    }
    if (Ebits > 79) {
        return 4;
    }
    return 1;
#elif MBEDTLS_MPI_WINDOW_SIZE == 5
    if (Ebits > 239) {
        return 5;
    }
    if (Ebits > 79) {
        return 4;
    }
    return 1;
#elif MBEDTLS_MPI_WINDOW_SIZE > 1
    if (Ebits > 79) {
        return MBEDTLS_MPI_WINDOW_SIZE;
    }
    return 1;
#else
    /* Windowing disabled by configuration. */
    (void) Ebits;
    return 1;
#endif
}
| 720 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 721 | size_t mbedtls_mpi_core_exp_mod_working_limbs(size_t AN_limbs, size_t E_limbs) |
Tom Cosgrove | 0a0dded | 2022-12-06 14:37:18 +0000 | [diff] [blame] | 722 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 723 | const size_t wsize = exp_mod_get_window_size(E_limbs * biL); |
| 724 | const size_t welem = ((size_t) 1) << wsize; |
Tom Cosgrove | 0a0dded | 2022-12-06 14:37:18 +0000 | [diff] [blame] | 725 | |
| 726 | /* How big does each part of the working memory pool need to be? */ |
| 727 | const size_t table_limbs = welem * AN_limbs; |
| 728 | const size_t select_limbs = AN_limbs; |
| 729 | const size_t temp_limbs = 2 * AN_limbs + 1; |
| 730 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 731 | return table_limbs + select_limbs + temp_limbs; |
Tom Cosgrove | 0a0dded | 2022-12-06 14:37:18 +0000 | [diff] [blame] | 732 | } |
| 733 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 734 | static void exp_mod_precompute_window(const mbedtls_mpi_uint *A, |
| 735 | const mbedtls_mpi_uint *N, |
| 736 | size_t AN_limbs, |
| 737 | mbedtls_mpi_uint mm, |
| 738 | const mbedtls_mpi_uint *RR, |
| 739 | size_t welem, |
| 740 | mbedtls_mpi_uint *Wtable, |
| 741 | mbedtls_mpi_uint *temp) |
Gilles Peskine | 0de0a04 | 2022-11-16 20:12:49 +0100 | [diff] [blame] | 742 | { |
Gilles Peskine | 0de0a04 | 2022-11-16 20:12:49 +0100 | [diff] [blame] | 743 | /* W[0] = 1 (in Montgomery presentation) */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 744 | memset(Wtable, 0, AN_limbs * ciL); |
Gilles Peskine | 0de0a04 | 2022-11-16 20:12:49 +0100 | [diff] [blame] | 745 | Wtable[0] = 1; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 746 | mbedtls_mpi_core_montmul(Wtable, Wtable, RR, AN_limbs, N, AN_limbs, mm, temp); |
Gilles Peskine | d83b5cb | 2022-11-16 20:26:14 +0100 | [diff] [blame] | 747 | |
Tom Cosgrove | ecda186 | 2022-12-06 10:46:30 +0000 | [diff] [blame] | 748 | /* W[1] = A (already in Montgomery presentation) */ |
Gilles Peskine | d83b5cb | 2022-11-16 20:26:14 +0100 | [diff] [blame] | 749 | mbedtls_mpi_uint *W1 = Wtable + AN_limbs; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 750 | memcpy(W1, A, AN_limbs * ciL); |
Gilles Peskine | d83b5cb | 2022-11-16 20:26:14 +0100 | [diff] [blame] | 751 | |
Gilles Peskine | 0de0a04 | 2022-11-16 20:12:49 +0100 | [diff] [blame] | 752 | /* W[i+1] = W[i] * W[1], i >= 2 */ |
Gilles Peskine | d83b5cb | 2022-11-16 20:26:14 +0100 | [diff] [blame] | 753 | mbedtls_mpi_uint *Wprev = W1; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 754 | for (size_t i = 2; i < welem; i++) { |
Gilles Peskine | d83b5cb | 2022-11-16 20:26:14 +0100 | [diff] [blame] | 755 | mbedtls_mpi_uint *Wcur = Wprev + AN_limbs; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 756 | mbedtls_mpi_core_montmul(Wcur, Wprev, W1, AN_limbs, N, AN_limbs, mm, temp); |
Gilles Peskine | d83b5cb | 2022-11-16 20:26:14 +0100 | [diff] [blame] | 757 | Wprev = Wcur; |
| 758 | } |
Gilles Peskine | 0de0a04 | 2022-11-16 20:12:49 +0100 | [diff] [blame] | 759 | } |
| 760 | |
Gilles Peskine | 7d89d35 | 2022-11-16 22:54:14 +0100 | [diff] [blame] | 761 | /* Exponentiation: X := A^E mod N. |
| 762 | * |
Tom Cosgrove | ecda186 | 2022-12-06 10:46:30 +0000 | [diff] [blame] | 763 | * A must already be in Montgomery form. |
| 764 | * |
Gilles Peskine | 7d89d35 | 2022-11-16 22:54:14 +0100 | [diff] [blame] | 765 | * As in other bignum functions, assume that AN_limbs and E_limbs are nonzero. |
| 766 | * |
| 767 | * RR must contain 2^{2*biL} mod N. |
Janos Follath | 3321b58 | 2022-11-22 21:08:33 +0000 | [diff] [blame] | 768 | * |
| 769 | * The algorithm is a variant of Left-to-right k-ary exponentiation: HAC 14.82 |
| 770 | * (The difference is that the body in our loop processes a single bit instead |
| 771 | * of a full window.) |
Gilles Peskine | 7d89d35 | 2022-11-16 22:54:14 +0100 | [diff] [blame] | 772 | */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 773 | void mbedtls_mpi_core_exp_mod(mbedtls_mpi_uint *X, |
| 774 | const mbedtls_mpi_uint *A, |
| 775 | const mbedtls_mpi_uint *N, |
| 776 | size_t AN_limbs, |
| 777 | const mbedtls_mpi_uint *E, |
| 778 | size_t E_limbs, |
| 779 | const mbedtls_mpi_uint *RR, |
| 780 | mbedtls_mpi_uint *T) |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 781 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 782 | const size_t wsize = exp_mod_get_window_size(E_limbs * biL); |
| 783 | const size_t welem = ((size_t) 1) << wsize; |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 784 | |
Tom Cosgrove | 0a0dded | 2022-12-06 14:37:18 +0000 | [diff] [blame] | 785 | /* This is how we will use the temporary storage T, which must have space |
| 786 | * for table_limbs, select_limbs and (2 * AN_limbs + 1) for montmul. */ |
| 787 | const size_t table_limbs = welem * AN_limbs; |
| 788 | const size_t select_limbs = AN_limbs; |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 789 | |
Tom Cosgrove | 0a0dded | 2022-12-06 14:37:18 +0000 | [diff] [blame] | 790 | /* Pointers to specific parts of the temporary working memory pool */ |
| 791 | mbedtls_mpi_uint *const Wtable = T; |
| 792 | mbedtls_mpi_uint *const Wselect = Wtable + table_limbs; |
| 793 | mbedtls_mpi_uint *const temp = Wselect + select_limbs; |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 794 | |
| 795 | /* |
| 796 | * Window precomputation |
| 797 | */ |
| 798 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 799 | const mbedtls_mpi_uint mm = mbedtls_mpi_core_montmul_init(N); |
Gilles Peskine | cf979b0 | 2022-11-16 20:04:00 +0100 | [diff] [blame] | 800 | |
Gilles Peskine | 0de0a04 | 2022-11-16 20:12:49 +0100 | [diff] [blame] | 801 | /* Set Wtable[i] = A^(2^i) (in Montgomery representation) */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 802 | exp_mod_precompute_window(A, N, AN_limbs, |
| 803 | mm, RR, |
| 804 | welem, Wtable, temp); |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 805 | |
| 806 | /* |
Janos Follath | 0ec6e3f | 2022-11-14 12:52:08 +0000 | [diff] [blame] | 807 | * Fixed window exponentiation |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 808 | */ |
| 809 | |
| 810 | /* X = 1 (in Montgomery presentation) initially */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 811 | memcpy(X, Wtable, AN_limbs * ciL); |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 812 | |
Gilles Peskine | c718a3c | 2022-11-16 20:42:09 +0100 | [diff] [blame] | 813 | /* We'll process the bits of E from most significant |
| 814 | * (limb_index=E_limbs-1, E_bit_index=biL-1) to least significant |
| 815 | * (limb_index=0, E_bit_index=0). */ |
| 816 | size_t E_limb_index = E_limbs; |
| 817 | size_t E_bit_index = 0; |
Gilles Peskine | 0b270a5 | 2022-11-16 22:54:03 +0100 | [diff] [blame] | 818 | /* At any given time, window contains window_bits bits from E. |
| 819 | * window_bits can go up to wsize. */ |
Janos Follath | bad42c4 | 2022-11-09 14:30:44 +0000 | [diff] [blame] | 820 | size_t window_bits = 0; |
Gilles Peskine | 0b270a5 | 2022-11-16 22:54:03 +0100 | [diff] [blame] | 821 | mbedtls_mpi_uint window = 0; |
Gilles Peskine | cf979b0 | 2022-11-16 20:04:00 +0100 | [diff] [blame] | 822 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 823 | do { |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 824 | /* Square */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 825 | mbedtls_mpi_core_montmul(X, X, X, AN_limbs, N, AN_limbs, mm, temp); |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 826 | |
Janos Follath | 3321b58 | 2022-11-22 21:08:33 +0000 | [diff] [blame] | 827 | /* Move to the next bit of the exponent */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 828 | if (E_bit_index == 0) { |
Gilles Peskine | c718a3c | 2022-11-16 20:42:09 +0100 | [diff] [blame] | 829 | --E_limb_index; |
| 830 | E_bit_index = biL - 1; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 831 | } else { |
Gilles Peskine | c718a3c | 2022-11-16 20:42:09 +0100 | [diff] [blame] | 832 | --E_bit_index; |
| 833 | } |
Janos Follath | 3321b58 | 2022-11-22 21:08:33 +0000 | [diff] [blame] | 834 | /* Insert next exponent bit into window */ |
Gilles Peskine | d83b5cb | 2022-11-16 20:26:14 +0100 | [diff] [blame] | 835 | ++window_bits; |
Gilles Peskine | c718a3c | 2022-11-16 20:42:09 +0100 | [diff] [blame] | 836 | window <<= 1; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 837 | window |= (E[E_limb_index] >> E_bit_index) & 1; |
Gilles Peskine | 3b63d09 | 2022-11-16 22:06:18 +0100 | [diff] [blame] | 838 | |
| 839 | /* Clear window if it's full. Also clear the window at the end, |
| 840 | * when we've finished processing the exponent. */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 841 | if (window_bits == wsize || |
| 842 | (E_bit_index == 0 && E_limb_index == 0)) { |
Gilles Peskine | 0b270a5 | 2022-11-16 22:54:03 +0100 | [diff] [blame] | 843 | /* Select Wtable[window] without leaking window through |
| 844 | * memory access patterns. */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 845 | mbedtls_mpi_core_ct_uint_table_lookup(Wselect, Wtable, |
| 846 | AN_limbs, welem, window); |
Gilles Peskine | 0b270a5 | 2022-11-16 22:54:03 +0100 | [diff] [blame] | 847 | /* Multiply X by the selected element. */ |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 848 | mbedtls_mpi_core_montmul(X, X, Wselect, AN_limbs, N, AN_limbs, mm, |
| 849 | temp); |
Gilles Peskine | 3b63d09 | 2022-11-16 22:06:18 +0100 | [diff] [blame] | 850 | window = 0; |
| 851 | window_bits = 0; |
| 852 | } |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 853 | } while (!(E_bit_index == 0 && E_limb_index == 0)); |
Janos Follath | b6673f0 | 2022-09-30 14:13:14 +0100 | [diff] [blame] | 854 | } |
| 855 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 856 | mbedtls_mpi_uint mbedtls_mpi_core_sub_int(mbedtls_mpi_uint *X, |
| 857 | const mbedtls_mpi_uint *A, |
| 858 | mbedtls_mpi_uint c, /* doubles as carry */ |
| 859 | size_t limbs) |
Hanno Becker | d9b2348 | 2022-08-25 08:25:19 +0100 | [diff] [blame] | 860 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 861 | for (size_t i = 0; i < limbs; i++) { |
Tom Cosgrove | f7ff4c9 | 2022-08-25 08:39:07 +0100 | [diff] [blame] | 862 | mbedtls_mpi_uint s = A[i]; |
| 863 | mbedtls_mpi_uint t = s - c; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 864 | c = (t > s); |
Tom Cosgrove | f7ff4c9 | 2022-08-25 08:39:07 +0100 | [diff] [blame] | 865 | X[i] = t; |
Hanno Becker | d9b2348 | 2022-08-25 08:25:19 +0100 | [diff] [blame] | 866 | } |
| 867 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 868 | return c; |
Hanno Becker | d9b2348 | 2022-08-25 08:25:19 +0100 | [diff] [blame] | 869 | } |
| 870 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 871 | mbedtls_mpi_uint mbedtls_mpi_core_check_zero_ct(const mbedtls_mpi_uint *A, |
| 872 | size_t limbs) |
Tom Cosgrove | 30f3b4d | 2022-12-12 16:54:57 +0000 | [diff] [blame] | 873 | { |
| 874 | mbedtls_mpi_uint bits = 0; |
| 875 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 876 | for (size_t i = 0; i < limbs; i++) { |
Tom Cosgrove | 30f3b4d | 2022-12-12 16:54:57 +0000 | [diff] [blame] | 877 | bits |= A[i]; |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 878 | } |
Tom Cosgrove | 30f3b4d | 2022-12-12 16:54:57 +0000 | [diff] [blame] | 879 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 880 | return bits; |
Tom Cosgrove | 30f3b4d | 2022-12-12 16:54:57 +0000 | [diff] [blame] | 881 | } |
| 882 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 883 | void mbedtls_mpi_core_to_mont_rep(mbedtls_mpi_uint *X, |
| 884 | const mbedtls_mpi_uint *A, |
| 885 | const mbedtls_mpi_uint *N, |
| 886 | size_t AN_limbs, |
| 887 | mbedtls_mpi_uint mm, |
| 888 | const mbedtls_mpi_uint *rr, |
| 889 | mbedtls_mpi_uint *T) |
Tom Cosgrove | 786848b | 2022-12-13 10:45:19 +0000 | [diff] [blame] | 890 | { |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 891 | mbedtls_mpi_core_montmul(X, A, rr, AN_limbs, N, AN_limbs, mm, T); |
Tom Cosgrove | 786848b | 2022-12-13 10:45:19 +0000 | [diff] [blame] | 892 | } |
| 893 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 894 | void mbedtls_mpi_core_from_mont_rep(mbedtls_mpi_uint *X, |
| 895 | const mbedtls_mpi_uint *A, |
| 896 | const mbedtls_mpi_uint *N, |
| 897 | size_t AN_limbs, |
| 898 | mbedtls_mpi_uint mm, |
| 899 | mbedtls_mpi_uint *T) |
Tom Cosgrove | 786848b | 2022-12-13 10:45:19 +0000 | [diff] [blame] | 900 | { |
| 901 | const mbedtls_mpi_uint Rinv = 1; /* 1/R in Mont. rep => 1 */ |
| 902 | |
Gilles Peskine | 449bd83 | 2023-01-11 14:50:10 +0100 | [diff] [blame] | 903 | mbedtls_mpi_core_montmul(X, A, &Rinv, 1, N, AN_limbs, mm, T); |
Tom Cosgrove | 786848b | 2022-12-13 10:45:19 +0000 | [diff] [blame] | 904 | } |
| 905 | |
Janos Follath | 3ca0775 | 2022-08-09 11:45:47 +0100 | [diff] [blame] | 906 | #endif /* MBEDTLS_BIGNUM_C */ |