1 // Copyright 2011 The Chromium Authors
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 // The original file was copied from sqlite, and was in the public domain.
6
7 /*
8 * This code implements the MD5 message-digest algorithm.
9 * The algorithm is due to Ron Rivest. This code was
10 * written by Colin Plumb in 1993, no copyright is claimed.
11 * This code is in the public domain; do with it what you wish.
12 *
13 * Equivalent code is available from RSA Data Security, Inc.
14 * This code has been tested against that, and is equivalent,
15 * except that you don't need to include two pages of legalese
16 * with every copy.
17 *
18 * To compute the message digest of a chunk of bytes, declare an
19 * MD5Context structure, pass it to MD5Init, call MD5Update as
20 * needed on buffers full of bytes, and then call MD5Final, which
21 * will fill a supplied 16-byte array with the digest.
22 */
23
24 #include "base/hash/md5.h"
25
26 #include <stddef.h>
27 #include <string.h>
28
29 #include <string_view>
30
31 #include "base/containers/span.h"
32 #include "base/strings/string_number_conversions.h"
33
34 namespace {
35
36 struct Context {
37 uint32_t buf[4];
38 uint32_t bits[2];
39 uint8_t in[64];
40 };
41
42 /*
43 * Note: this code is harmless on little-endian machines.
44 */
byteReverse(uint8_t * buf,unsigned longs)45 void byteReverse(uint8_t* buf, unsigned longs) {
46 do {
47 uint32_t temp =
48 static_cast<uint32_t>(static_cast<unsigned>(buf[3]) << 8 | buf[2])
49 << 16 |
50 (static_cast<unsigned>(buf[1]) << 8 | buf[0]);
51 *reinterpret_cast<uint32_t*>(buf) = temp;
52 buf += 4;
53 } while (--longs);
54 }
55
56 /* The four core functions - F1 is optimized somewhat */
57
58 /* #define F1(x, y, z) (x & y | ~x & z) */
59 #define F1(x, y, z) (z ^ (x & (y ^ z)))
60 #define F2(x, y, z) F1(z, x, y)
61 #define F3(x, y, z) (x ^ y ^ z)
62 #define F4(x, y, z) (y ^ (x | ~z))
63
64 /* This is the central step in the MD5 algorithm. */
65 #define MD5STEP(f, w, x, y, z, data, s) \
66 (w += f(x, y, z) + data, w = w << s | w >> (32 - s), w += x)
67
68 /*
69 * The core of the MD5 algorithm, this alters an existing MD5 hash to
70 * reflect the addition of 16 longwords of new data. MD5Update blocks
71 * the data and converts bytes into longwords for this routine.
72 */
MD5Transform(uint32_t buf[4],const uint32_t in[16])73 void MD5Transform(uint32_t buf[4], const uint32_t in[16]) {
74 uint32_t a, b, c, d;
75
76 a = buf[0];
77 b = buf[1];
78 c = buf[2];
79 d = buf[3];
80
81 MD5STEP(F1, a, b, c, d, in[0] + 0xd76aa478, 7);
82 MD5STEP(F1, d, a, b, c, in[1] + 0xe8c7b756, 12);
83 MD5STEP(F1, c, d, a, b, in[2] + 0x242070db, 17);
84 MD5STEP(F1, b, c, d, a, in[3] + 0xc1bdceee, 22);
85 MD5STEP(F1, a, b, c, d, in[4] + 0xf57c0faf, 7);
86 MD5STEP(F1, d, a, b, c, in[5] + 0x4787c62a, 12);
87 MD5STEP(F1, c, d, a, b, in[6] + 0xa8304613, 17);
88 MD5STEP(F1, b, c, d, a, in[7] + 0xfd469501, 22);
89 MD5STEP(F1, a, b, c, d, in[8] + 0x698098d8, 7);
90 MD5STEP(F1, d, a, b, c, in[9] + 0x8b44f7af, 12);
91 MD5STEP(F1, c, d, a, b, in[10] + 0xffff5bb1, 17);
92 MD5STEP(F1, b, c, d, a, in[11] + 0x895cd7be, 22);
93 MD5STEP(F1, a, b, c, d, in[12] + 0x6b901122, 7);
94 MD5STEP(F1, d, a, b, c, in[13] + 0xfd987193, 12);
95 MD5STEP(F1, c, d, a, b, in[14] + 0xa679438e, 17);
96 MD5STEP(F1, b, c, d, a, in[15] + 0x49b40821, 22);
97
98 MD5STEP(F2, a, b, c, d, in[1] + 0xf61e2562, 5);
99 MD5STEP(F2, d, a, b, c, in[6] + 0xc040b340, 9);
100 MD5STEP(F2, c, d, a, b, in[11] + 0x265e5a51, 14);
101 MD5STEP(F2, b, c, d, a, in[0] + 0xe9b6c7aa, 20);
102 MD5STEP(F2, a, b, c, d, in[5] + 0xd62f105d, 5);
103 MD5STEP(F2, d, a, b, c, in[10] + 0x02441453, 9);
104 MD5STEP(F2, c, d, a, b, in[15] + 0xd8a1e681, 14);
105 MD5STEP(F2, b, c, d, a, in[4] + 0xe7d3fbc8, 20);
106 MD5STEP(F2, a, b, c, d, in[9] + 0x21e1cde6, 5);
107 MD5STEP(F2, d, a, b, c, in[14] + 0xc33707d6, 9);
108 MD5STEP(F2, c, d, a, b, in[3] + 0xf4d50d87, 14);
109 MD5STEP(F2, b, c, d, a, in[8] + 0x455a14ed, 20);
110 MD5STEP(F2, a, b, c, d, in[13] + 0xa9e3e905, 5);
111 MD5STEP(F2, d, a, b, c, in[2] + 0xfcefa3f8, 9);
112 MD5STEP(F2, c, d, a, b, in[7] + 0x676f02d9, 14);
113 MD5STEP(F2, b, c, d, a, in[12] + 0x8d2a4c8a, 20);
114
115 MD5STEP(F3, a, b, c, d, in[5] + 0xfffa3942, 4);
116 MD5STEP(F3, d, a, b, c, in[8] + 0x8771f681, 11);
117 MD5STEP(F3, c, d, a, b, in[11] + 0x6d9d6122, 16);
118 MD5STEP(F3, b, c, d, a, in[14] + 0xfde5380c, 23);
119 MD5STEP(F3, a, b, c, d, in[1] + 0xa4beea44, 4);
120 MD5STEP(F3, d, a, b, c, in[4] + 0x4bdecfa9, 11);
121 MD5STEP(F3, c, d, a, b, in[7] + 0xf6bb4b60, 16);
122 MD5STEP(F3, b, c, d, a, in[10] + 0xbebfbc70, 23);
123 MD5STEP(F3, a, b, c, d, in[13] + 0x289b7ec6, 4);
124 MD5STEP(F3, d, a, b, c, in[0] + 0xeaa127fa, 11);
125 MD5STEP(F3, c, d, a, b, in[3] + 0xd4ef3085, 16);
126 MD5STEP(F3, b, c, d, a, in[6] + 0x04881d05, 23);
127 MD5STEP(F3, a, b, c, d, in[9] + 0xd9d4d039, 4);
128 MD5STEP(F3, d, a, b, c, in[12] + 0xe6db99e5, 11);
129 MD5STEP(F3, c, d, a, b, in[15] + 0x1fa27cf8, 16);
130 MD5STEP(F3, b, c, d, a, in[2] + 0xc4ac5665, 23);
131
132 MD5STEP(F4, a, b, c, d, in[0] + 0xf4292244, 6);
133 MD5STEP(F4, d, a, b, c, in[7] + 0x432aff97, 10);
134 MD5STEP(F4, c, d, a, b, in[14] + 0xab9423a7, 15);
135 MD5STEP(F4, b, c, d, a, in[5] + 0xfc93a039, 21);
136 MD5STEP(F4, a, b, c, d, in[12] + 0x655b59c3, 6);
137 MD5STEP(F4, d, a, b, c, in[3] + 0x8f0ccc92, 10);
138 MD5STEP(F4, c, d, a, b, in[10] + 0xffeff47d, 15);
139 MD5STEP(F4, b, c, d, a, in[1] + 0x85845dd1, 21);
140 MD5STEP(F4, a, b, c, d, in[8] + 0x6fa87e4f, 6);
141 MD5STEP(F4, d, a, b, c, in[15] + 0xfe2ce6e0, 10);
142 MD5STEP(F4, c, d, a, b, in[6] + 0xa3014314, 15);
143 MD5STEP(F4, b, c, d, a, in[13] + 0x4e0811a1, 21);
144 MD5STEP(F4, a, b, c, d, in[4] + 0xf7537e82, 6);
145 MD5STEP(F4, d, a, b, c, in[11] + 0xbd3af235, 10);
146 MD5STEP(F4, c, d, a, b, in[2] + 0x2ad7d2bb, 15);
147 MD5STEP(F4, b, c, d, a, in[9] + 0xeb86d391, 21);
148
149 buf[0] += a;
150 buf[1] += b;
151 buf[2] += c;
152 buf[3] += d;
153 }
154
155 } // namespace
156
157 namespace base {
158
159 /*
160 * Start MD5 accumulation. Set bit count to 0 and buffer to mysterious
161 * initialization constants.
162 */
MD5Init(MD5Context * context)163 void MD5Init(MD5Context* context) {
164 struct Context* ctx = reinterpret_cast<struct Context*>(context);
165 ctx->buf[0] = 0x67452301;
166 ctx->buf[1] = 0xefcdab89;
167 ctx->buf[2] = 0x98badcfe;
168 ctx->buf[3] = 0x10325476;
169 ctx->bits[0] = 0;
170 ctx->bits[1] = 0;
171 }
172
173 /*
174 * Update context to reflect the concatenation of another buffer full
175 * of bytes.
176 */
MD5Update(MD5Context * context,std::string_view data)177 void MD5Update(MD5Context* context, std::string_view data) {
178 MD5Update(context, base::as_byte_span(data));
179 }
180
MD5Update(MD5Context * context,base::span<const uint8_t> data)181 void MD5Update(MD5Context* context, base::span<const uint8_t> data) {
182 struct Context* ctx = reinterpret_cast<struct Context*>(context);
183 const uint8_t* buf = data.data();
184 size_t len = data.size();
185
186 /* Update bitcount */
187
188 uint32_t t = ctx->bits[0];
189 if ((ctx->bits[0] = t + (static_cast<uint32_t>(len) << 3)) < t)
190 ctx->bits[1]++; /* Carry from low to high */
191 ctx->bits[1] += static_cast<uint32_t>(len >> 29);
192
193 t = (t >> 3) & 0x3f; /* Bytes already in shsInfo->data */
194
195 /* Handle any leading odd-sized chunks */
196
197 if (t) {
198 uint8_t* p = static_cast<uint8_t*>(ctx->in + t);
199
200 t = 64 - t;
201 if (len < t) {
202 memcpy(p, buf, len);
203 return;
204 }
205 memcpy(p, buf, t);
206 byteReverse(ctx->in, 16);
207 MD5Transform(ctx->buf, reinterpret_cast<uint32_t*>(ctx->in));
208 buf += t;
209 len -= t;
210 }
211
212 /* Process data in 64-byte chunks */
213
214 while (len >= 64) {
215 memcpy(ctx->in, buf, 64);
216 byteReverse(ctx->in, 16);
217 MD5Transform(ctx->buf, reinterpret_cast<uint32_t*>(ctx->in));
218 buf += 64;
219 len -= 64;
220 }
221
222 /* Handle any remaining bytes of data. */
223
224 memcpy(ctx->in, buf, len);
225 }
226
227 /*
228 * Final wrapup - pad to 64-byte boundary with the bit pattern
229 * 1 0* (64-bit count of bits processed, MSB-first)
230 */
MD5Final(MD5Digest * digest,MD5Context * context)231 void MD5Final(MD5Digest* digest, MD5Context* context) {
232 struct Context* ctx = reinterpret_cast<struct Context*>(context);
233 unsigned count;
234 uint8_t* p;
235
236 /* Compute number of bytes mod 64 */
237 count = (ctx->bits[0] >> 3) & 0x3F;
238
239 /* Set the first char of padding to 0x80. This is safe since there is
240 always at least one byte free */
241 p = ctx->in + count;
242 *p++ = 0x80;
243
244 /* Bytes of padding needed to make 64 bytes */
245 count = 64 - 1 - count;
246
247 /* Pad out to 56 mod 64 */
248 if (count < 8) {
249 /* Two lots of padding: Pad the first block to 64 bytes */
250 memset(p, 0, count);
251 byteReverse(ctx->in, 16);
252 MD5Transform(ctx->buf, reinterpret_cast<uint32_t*>(ctx->in));
253
254 /* Now fill the next block with 56 bytes */
255 memset(ctx->in, 0, 56);
256 } else {
257 /* Pad block to 56 bytes */
258 memset(p, 0, count - 8);
259 }
260 byteReverse(ctx->in, 14);
261
262 /* Append length in bits and transform */
263 memcpy(&ctx->in[14 * sizeof(ctx->bits[0])], &ctx->bits[0],
264 sizeof(ctx->bits[0]));
265 memcpy(&ctx->in[15 * sizeof(ctx->bits[1])], &ctx->bits[1],
266 sizeof(ctx->bits[1]));
267
268 MD5Transform(ctx->buf, reinterpret_cast<uint32_t*>(ctx->in));
269 byteReverse(reinterpret_cast<uint8_t*>(ctx->buf), 4);
270 span(digest->a).copy_from(as_byte_span(ctx->buf));
271 std::ranges::fill(byte_span_from_ref(*ctx), 0u); /* In case it's sensitive */
272 }
273
MD5DigestToBase16(const MD5Digest & digest)274 std::string MD5DigestToBase16(const MD5Digest& digest) {
275 std::string ret;
276 ret.reserve(32);
277 for (uint8_t byte : digest.a) {
278 base::AppendHexEncodedByte(byte, ret, false);
279 }
280 return ret;
281 }
282
MD5Sum(span<const uint8_t> data,MD5Digest * digest)283 void MD5Sum(span<const uint8_t> data, MD5Digest* digest) {
284 MD5Context ctx;
285 MD5Init(&ctx);
286 MD5Update(&ctx, data);
287 MD5Final(digest, &ctx);
288 }
289
MD5String(std::string_view str)290 std::string MD5String(std::string_view str) {
291 MD5Digest digest;
292 MD5Sum(as_byte_span(str), &digest);
293 return MD5DigestToBase16(digest);
294 }
295
296 } // namespace base
297