|
6 | 6 | /* high level multiplication (handles sign) */
|
7 | 7 | mp_err mp_mul(const mp_int *a, const mp_int *b, mp_int *c)
|
8 | 8 | {
|
9 |
| - mp_err err; |
10 |
| - mp_sign neg; |
11 |
| -#ifdef BN_S_MP_BALANCE_MUL_C |
12 |
| - int len_b, len_a; |
13 |
| -#endif |
14 |
| - neg = (a->sign == b->sign) ? MP_ZPOS : MP_NEG; |
15 |
| -#ifdef BN_S_MP_BALANCE_MUL_C |
16 |
| - len_a = a->used; |
17 |
| - len_b = b->used; |
18 |
| - |
19 |
| - if (len_a == len_b) { |
20 |
| - goto GO_ON; |
21 |
| - } |
22 |
| - /* |
23 |
| - * Check sizes. The smaller one needs to be larger than the Karatsuba cut-off. |
24 |
| - * The bigger one needs to be at least about one KARATSUBA_MUL_CUTOFF bigger |
25 |
| - * to make some sense, but it depends on architecture, OS, position of the |
26 |
| - * stars... so YMMV. |
27 |
| - * Using it to cut the input into slices small enough for fast_s_mp_mul_digs |
28 |
| - * was actually slower on the author's machine, but YMMV. |
29 |
| - */ |
30 |
| - if ((MP_MIN(len_a, len_b) < MP_KARATSUBA_MUL_CUTOFF) |
31 |
| - || ((MP_MAX(len_a, len_b) / 2) < MP_KARATSUBA_MUL_CUTOFF)) { |
32 |
| - goto GO_ON; |
33 |
| - } |
34 |
| - /* |
35 |
| - * Not much effect was observed below a ratio of 1:2, but again: YMMV. |
36 |
| - */ |
37 |
| - if ((MP_MAX(len_a, len_b) / MP_MIN(len_a, len_b)) < 2) { |
38 |
| - goto GO_ON; |
39 |
| - } |
40 |
| - |
41 |
| - err = s_mp_balance_mul(a,b,c); |
42 |
| - goto END; |
43 |
| - |
44 |
| -GO_ON: |
45 |
| -#endif |
| 9 | + mp_err err; |
| 10 | + int min_len = MP_MIN(a->used, b->used), |
| 11 | + max_len = MP_MAX(a->used, b->used), |
| 12 | + digs = a->used + b->used + 1; |
| 13 | + mp_sign neg = (a->sign == b->sign) ? MP_ZPOS : MP_NEG; |
46 | 14 |
|
47 |
| - /* use Toom-Cook? */ |
48 |
| -#ifdef BN_S_MP_TOOM_MUL_C |
49 |
| - if (MP_MIN(a->used, b->used) >= MP_TOOM_MUL_CUTOFF) { |
| 15 | + if (MP_HAS(S_MP_BALANCE_MUL) && |
| 16 | + /* Check sizes. The smaller one needs to be larger than the Karatsuba cut-off. |
| 17 | + * The bigger one needs to be at least about one MP_KARATSUBA_MUL_CUTOFF bigger |
| 18 | + * to make some sense, but it depends on architecture, OS, position of the |
| 19 | + * stars... so YMMV. |
| 20 | + * Using it to cut the input into slices small enough for fast_s_mp_mul_digs |
| 21 | + * was actually slower on the author's machine, but YMMV. |
| 22 | + */ |
| 23 | + (min_len >= MP_KARATSUBA_MUL_CUTOFF) && |
| 24 | + (max_len / 2 >= MP_KARATSUBA_MUL_CUTOFF) && |
| 25 | + /* Not much effect was observed below a ratio of 1:2, but again: YMMV. */ |
| 26 | + (max_len >= (2 * min_len))) { |
| 27 | + err = s_mp_balance_mul(a,b,c); |
| 28 | + } else if (MP_HAS(S_MP_TOOM_MUL) && |
| 29 | + (min_len >= MP_TOOM_MUL_CUTOFF)) { |
50 | 30 | err = s_mp_toom_mul(a, b, c);
|
51 |
| - } else |
52 |
| -#endif |
53 |
| -#ifdef BN_S_MP_KARATSUBA_MUL_C |
54 |
| - /* use Karatsuba? */ |
55 |
| - if (MP_MIN(a->used, b->used) >= MP_KARATSUBA_MUL_CUTOFF) { |
56 |
| - err = s_mp_karatsuba_mul(a, b, c); |
57 |
| - } else |
58 |
| -#endif |
59 |
| - { |
60 |
| - /* can we use the fast multiplier? |
61 |
| - * |
62 |
| - * The fast multiplier can be used if the output will |
63 |
| - * have less than MP_WARRAY digits and the number of |
64 |
| - * digits won't affect carry propagation |
65 |
| - */ |
66 |
| - int digs = a->used + b->used + 1; |
67 |
| - |
68 |
| -#ifdef BN_S_MP_MUL_DIGS_FAST_C |
69 |
| - if ((digs < MP_WARRAY) && |
70 |
| - (MP_MIN(a->used, b->used) <= MP_MAXFAST)) { |
71 |
| - err = s_mp_mul_digs_fast(a, b, c, digs); |
72 |
| - } else |
73 |
| -#endif |
74 |
| - { |
75 |
| -#ifdef BN_S_MP_MUL_DIGS_C |
76 |
| - err = s_mp_mul_digs(a, b, c, a->used + b->used + 1); |
77 |
| -#else |
78 |
| - err = MP_VAL; |
79 |
| -#endif |
80 |
| - } |
81 |
| - } |
82 |
| -END: |
| 31 | + } else if (MP_HAS(S_MP_KARATSUBA_MUL) && |
| 32 | + (min_len >= MP_KARATSUBA_MUL_CUTOFF)) { |
| 33 | + err = s_mp_karatsuba_mul(a, b, c); |
| 34 | + } else if (MP_HAS(S_MP_MUL_DIGS_FAST) && |
| 35 | + /* can we use the fast multiplier? |
| 36 | + * |
| 37 | + * The fast multiplier can be used if the output will |
| 38 | + * have less than MP_WARRAY digits and the number of |
| 39 | + * digits won't affect carry propagation |
| 40 | + */ |
| 41 | + (digs < MP_WARRAY) && |
| 42 | + (min_len <= MP_MAXFAST)) { |
| 43 | + err = s_mp_mul_digs_fast(a, b, c, digs); |
| 44 | + } else if (MP_HAS(S_MP_MUL_DIGS)) { |
| 45 | + err = s_mp_mul_digs(a, b, c, digs); |
| 46 | + } else { |
| 47 | + err = MP_VAL; |
| 48 | + } |
83 | 49 | c->sign = (c->used > 0) ? neg : MP_ZPOS;
|
84 | 50 | return err;
|
85 | 51 | }
|
|
0 commit comments