2 * Copyright (c) 2017 Thomas Pornin <pornin@bolet.org>
4 * Permission is hereby granted, free of charge, to any person obtaining
5 * a copy of this software and associated documentation files (the
6 * "Software"), to deal in the Software without restriction, including
7 * without limitation the rights to use, copy, modify, merge, publish,
8 * distribute, sublicense, and/or sell copies of the Software, and to
9 * permit persons to whom the Software is furnished to do so, subject to
10 * the following conditions:
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
28 * This is a "reference" implementation of Poly1305 that uses the
29 * generic "i15" code for big integers. It is slow, but it handles all
30 * big-integer operations with generic code, thereby avoiding most
31 * tricky situations with carry propagation and modular reduction.
37 static const uint16_t P1305
[] = {
39 0x7FFB, 0x7FFF, 0x7FFF, 0x7FFF, 0x7FFF, 0x7FFF, 0x7FFF, 0x7FFF, 0x03FF
48 * R^2 mod p, for conversion to Montgomery representation (R = 2^135,
49 * since we use 9 words of 15 bits each, and 15*9 = 135).
51 static const uint16_t R2
[] = {
53 0x6400, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000
57 * Perform the inner processing of blocks for Poly1305. The "r" array
58 * is in Montgomery representation, while the "a" array is not.
61 poly1305_inner(uint16_t *a
, const uint16_t *r
, const void *data
, size_t len
)
63 const unsigned char *buf
;
67 unsigned char tmp
[16], rev
[16];
73 * If there is a partial block, right-pad it with zeros.
76 memset(tmp
, 0, sizeof tmp
);
77 memcpy(tmp
, buf
, len
);
83 * Decode next block and apply the "high bit". Since
84 * decoding is little-endian, we must byte-swap the buffer.
86 for (i
= 0; i
< 16; i
++) {
89 br_i15_decode_mod(b
, rev
, sizeof rev
, P1305
);
93 * Add the accumulator to the decoded block (modular
96 ctl
= br_i15_add(b
, a
, 1);
97 ctl
|= NOT(br_i15_sub(b
, P1305
, 0));
98 br_i15_sub(b
, P1305
, ctl
);
101 * Multiply by r, result is the new accumulator value.
103 br_i15_montymul(a
, b
, r
, P1305
, P0I
);
111 * Byteswap a 16-byte value.
114 byteswap16(unsigned char *buf
)
118 for (i
= 0; i
< 8; i
++) {
122 buf
[i
] = buf
[15 - i
];
127 /* see bearssl_block.h */
129 br_poly1305_i15_run(const void *key
, const void *iv
,
130 void *data
, size_t len
, const void *aad
, size_t aad_len
,
131 void *tag
, br_chacha20_run ichacha
, int encrypt
)
133 unsigned char pkey
[32], foot
[16];
134 uint16_t t
[10], r
[10], acc
[10];
137 * Compute the MAC key. The 'r' value is the first 16 bytes of
140 memset(pkey
, 0, sizeof pkey
);
141 ichacha(key
, iv
, 0, pkey
, sizeof pkey
);
144 * If encrypting, ChaCha20 must run first, followed by Poly1305.
145 * When decrypting, the operations are reversed.
148 ichacha(key
, iv
, 1, data
, len
);
152 * Run Poly1305. We must process the AAD, then ciphertext, then
153 * the footer (with the lengths). Note that the AAD and ciphertext
154 * are meant to be padded with zeros up to the next multiple of 16,
155 * and the length of the footer is 16 bytes as well.
159 * Apply the "clamping" operation on the encoded 'r' value.
170 * Decode the clamped 'r' value. Decoding should use little-endian
171 * so we must byteswap the value first.
174 br_i15_decode_mod(t
, pkey
, 16, P1305
);
177 * Convert 'r' to Montgomery representation.
179 br_i15_montymul(r
, t
, R2
, P1305
, P0I
);
184 br_i15_zero(acc
, 0x8A);
187 * Process the additional authenticated data, ciphertext, and
188 * footer in due order.
190 br_enc64le(foot
, (uint64_t)aad_len
);
191 br_enc64le(foot
+ 8, (uint64_t)len
);
192 poly1305_inner(acc
, r
, aad
, aad_len
);
193 poly1305_inner(acc
, r
, data
, len
);
194 poly1305_inner(acc
, r
, foot
, sizeof foot
);
197 * Decode the value 's'. Again, a byteswap is needed.
199 byteswap16(pkey
+ 16);
200 br_i15_decode_mod(t
, pkey
+ 16, 16, P1305
);
203 * Add the value 's' to the accumulator. That addition is done
204 * modulo 2^128, so we just ignore the carry.
206 br_i15_add(acc
, t
, 1);
209 * Encode the result (128 low bits) to the tag. Encoding should
212 br_i15_encode(tag
, 16, acc
);
216 * If decrypting, then ChaCha20 runs _after_ Poly1305.
219 ichacha(key
, iv
, 1, data
, len
);