1 2 3(* Copyright (c) 2011-2020 Stefan Krah. All rights reserved. *) 4 5 6======================================================================== 7 Calculate (a * b) % p using the 80-bit x87 FPU 8======================================================================== 9 10A description of the algorithm can be found in the apfloat manual by 11Tommila [1]. 12 13The proof follows an argument made by Granlund/Montgomery in [2]. 14 15 16Definitions and assumptions: 17---------------------------- 18 19The 80-bit extended precision format uses 64 bits for the significand: 20 21 (1) F = 64 22 23The modulus is prime and less than 2**31: 24 25 (2) 2 <= p < 2**31 26 27The factors are less than p: 28 29 (3) 0 <= a < p 30 (4) 0 <= b < p 31 32The product a * b is less than 2**62 and is thus exact in 64 bits: 33 34 (5) n = a * b 35 36The product can be represented in terms of quotient and remainder: 37 38 (6) n = q * p + r 39 40Using (3), (4) and the fact that p is prime, the remainder is always 41greater than zero: 42 43 (7) 0 <= q < p /\ 1 <= r < p 44 45 46Strategy: 47--------- 48 49Precalculate the 80-bit long double inverse of p, with a maximum 50relative error of 2**(1-F): 51 52 (8) pinv = (long double)1.0 / p 53 54Calculate an estimate for q = floor(n/p). The multiplication has another 55maximum relative error of 2**(1-F): 56 57 (9) qest = n * pinv 58 59If we can show that q < qest < q+1, then trunc(qest) = q. It is then 60easy to recover the remainder r. The complete algorithm is: 61 62 a) Set the control word to 64-bit precision and truncation mode. 63 64 b) n = a * b # Calculate exact product. 65 66 c) qest = n * pinv # Calculate estimate for the quotient. 67 68 d) q = (qest+2**63)-2**63 # Truncate qest to the exact quotient. 69 70 f) r = n - q * p # Calculate remainder. 71 72 73Proof for q < qest < q+1: 74------------------------- 75 76Using the cumulative error, the error bounds for qest are: 77 78 n n * (1 + 2**(1-F))**2 79 (9) --------------------- <= qest <= --------------------- 80 p * (1 + 2**(1-F))**2 p 81 82 83 Lemma 1: 84 -------- 85 n q * p + r 86 (10) q < --------------------- = --------------------- 87 p * (1 + 2**(1-F))**2 p * (1 + 2**(1-F))**2 88 89 90 Proof: 91 ~~~~~~ 92 93 (I) q * p * (1 + 2**(1-F))**2 < q * p + r 94 95 (II) q * p * 2**(2-F) + q * p * 2**(2-2*F) < r 96 97 Using (1) and (7), it is sufficient to show that: 98 99 (III) q * p * 2**(-62) + q * p * 2**(-126) < 1 <= r 100 101 (III) can easily be verified by substituting the largest possible 102 values p = 2**31-1 and q = 2**31-2. 103 104 The critical cases occur when r = 1, n = m * p + 1. These cases 105 can be exhaustively verified with a test program. 106 107 108 Lemma 2: 109 -------- 110 111 n * (1 + 2**(1-F))**2 (q * p + r) * (1 + 2**(1-F))**2 112 (11) --------------------- = ------------------------------- < q + 1 113 p p 114 115 Proof: 116 ~~~~~~ 117 118 (I) (q * p + r) + (q * p + r) * 2**(2-F) + (q * p + r) * 2**(2-2*F) < q * p + p 119 120 (II) (q * p + r) * 2**(2-F) + (q * p + r) * 2**(2-2*F) < p - r 121 122 Using (1) and (7), it is sufficient to show that: 123 124 (III) (q * p + r) * 2**(-62) + (q * p + r) * 2**(-126) < 1 <= p - r 125 126 (III) can easily be verified by substituting the largest possible 127 values p = 2**31-1, q = 2**31-2 and r = 2**31-2. 128 129 The critical cases occur when r = (p - 1), n = m * p - 1. These cases 130 can be exhaustively verified with a test program. 131 132 133[1] http://www.apfloat.org/apfloat/2.40/apfloat.pdf 134[2] http://gmplib.org/~tege/divcnst-pldi94.pdf 135 [Section 7: "Use of floating point"] 136 137 138 139(* Coq proof for (10) and (11) *) 140 141Require Import ZArith. 142Require Import QArith. 143Require Import Qpower. 144Require Import Qabs. 145Require Import Psatz. 146 147Open Scope Q_scope. 148 149 150Ltac qreduce T := 151 rewrite <- (Qred_correct (T)); simpl (Qred (T)). 152 153Theorem Qlt_move_right : 154 forall x y z:Q, x + z < y <-> x < y - z. 155Proof. 156 intros. 157 split. 158 intros. 159 psatzl Q. 160 intros. 161 psatzl Q. 162Qed. 163 164Theorem Qlt_mult_by_z : 165 forall x y z:Q, 0 < z -> (x < y <-> x * z < y * z). 166Proof. 167 intros. 168 split. 169 intros. 170 apply Qmult_lt_compat_r. trivial. trivial. 171 intros. 172 rewrite <- (Qdiv_mult_l x z). rewrite <- (Qdiv_mult_l y z). 173 apply Qmult_lt_compat_r. 174 apply Qlt_shift_inv_l. 175 trivial. psatzl Q. trivial. psatzl Q. psatzl Q. 176Qed. 177 178Theorem Qle_mult_quad : 179 forall (a b c d:Q), 180 0 <= a -> a <= c -> 181 0 <= b -> b <= d -> 182 a * b <= c * d. 183 intros. 184 psatz Q. 185Qed. 186 187 188Theorem q_lt_qest: 189 forall (p q r:Q), 190 (0 < p) -> (p <= (2#1)^31 - 1) -> 191 (0 <= q) -> (q <= p - 1) -> 192 (1 <= r) -> (r <= p - 1) -> 193 q < (q * p + r) / (p * (1 + (2#1)^(-63))^2). 194Proof. 195 intros. 196 rewrite Qlt_mult_by_z with (z := (p * (1 + (2#1)^(-63))^2)). 197 198 unfold Qdiv. 199 rewrite <- Qmult_assoc. 200 rewrite (Qmult_comm (/ (p * (1 + (2 # 1) ^ (-63)) ^ 2)) (p * (1 + (2 # 1) ^ (-63)) ^ 2)). 201 rewrite Qmult_inv_r. 202 rewrite Qmult_1_r. 203 204 assert (q * (p * (1 + (2 # 1) ^ (-63)) ^ 2) == q * p + (q * p) * ((2 # 1) ^ (-62) + (2 # 1) ^ (-126))). 205 qreduce ((1 + (2 # 1) ^ (-63)) ^ 2). 206 qreduce ((2 # 1) ^ (-62) + (2 # 1) ^ (-126)). 207 ring_simplify. 208 reflexivity. 209 rewrite H5. 210 211 rewrite Qplus_comm. 212 rewrite Qlt_move_right. 213 ring_simplify (q * p + r - q * p). 214 qreduce ((2 # 1) ^ (-62) + (2 # 1) ^ (-126)). 215 216 apply Qlt_le_trans with (y := 1). 217 rewrite Qlt_mult_by_z with (z := 85070591730234615865843651857942052864 # 18446744073709551617). 218 ring_simplify. 219 220 apply Qle_lt_trans with (y := ((2 # 1) ^ 31 - (2#1)) * ((2 # 1) ^ 31 - 1)). 221 apply Qle_mult_quad. 222 assumption. psatzl Q. psatzl Q. psatzl Q. psatzl Q. psatzl Q. assumption. psatzl Q. psatzl Q. 223Qed. 224 225Theorem qest_lt_qplus1: 226 forall (p q r:Q), 227 (0 < p) -> (p <= (2#1)^31 - 1) -> 228 (0 <= q) -> (q <= p - 1) -> 229 (1 <= r) -> (r <= p - 1) -> 230 ((q * p + r) * (1 + (2#1)^(-63))^2) / p < q + 1. 231Proof. 232 intros. 233 rewrite Qlt_mult_by_z with (z := p). 234 235 unfold Qdiv. 236 rewrite <- Qmult_assoc. 237 rewrite (Qmult_comm (/ p) p). 238 rewrite Qmult_inv_r. 239 rewrite Qmult_1_r. 240 241 assert ((q * p + r) * (1 + (2 # 1) ^ (-63)) ^ 2 == q * p + r + (q * p + r) * ((2 # 1) ^ (-62) + (2 # 1) ^ (-126))). 242 qreduce ((1 + (2 # 1) ^ (-63)) ^ 2). 243 qreduce ((2 # 1) ^ (-62) + (2 # 1) ^ (-126)). 244 ring_simplify. reflexivity. 245 rewrite H5. 246 247 rewrite <- Qplus_assoc. rewrite <- Qplus_comm. rewrite Qlt_move_right. 248 ring_simplify ((q + 1) * p - q * p). 249 250 rewrite <- Qplus_comm. rewrite Qlt_move_right. 251 252 apply Qlt_le_trans with (y := 1). 253 qreduce ((2 # 1) ^ (-62) + (2 # 1) ^ (-126)). 254 255 rewrite Qlt_mult_by_z with (z := 85070591730234615865843651857942052864 # 18446744073709551617). 256 ring_simplify. 257 258 ring_simplify in H0. 259 apply Qle_lt_trans with (y := (2147483646 # 1) * (2147483647 # 1) + (2147483646 # 1)). 260 261 apply Qplus_le_compat. 262 apply Qle_mult_quad. 263 assumption. psatzl Q. auto with qarith. assumption. psatzl Q. 264 auto with qarith. auto with qarith. 265 psatzl Q. psatzl Q. assumption. 266Qed. 267 268 269 270