/*
 * Poly1305 authenticator algorithm, RFC7539
 *
 * Copyright (C) 2015 Martin Willi
 *
 * Based on public domain code by Andrew Moon and Daniel J. Bernstein.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 */
14 #include <crypto/algapi.h>
15 #include <crypto/internal/hash.h>
16 #include <crypto/poly1305.h>
17 #include <linux/crypto.h>
18 #include <linux/kernel.h>
19 #include <linux/module.h>
20 #include <asm/unaligned.h>
/*
 * mlt() - helper taking two u64 operands and returning a u64.
 *
 * NOTE(review): the function body is not present in this extract.
 * poly1305_blocks() sums mlt(h, r)-style terms into its u64 d0..d4
 * accumulators, so this is presumably a 64-bit multiply -- confirm
 * against the complete file.
 */
22 static inline u64
mlt(u64 a
, u64 b
)
/*
 * sr() - helper taking a u64 value and a u_char count, returning a u32.
 *
 * NOTE(review): the function body is not present in this extract.
 * Callers use sr(d, 26) to obtain the carry out of a limb, so this is
 * presumably "v >> n" narrowed to 32 bits -- confirm against the
 * complete file.
 */
27 static inline u32
sr(u64 v
, u_char n
)
/*
 * and() - helper taking a u32 value and a u32 mask, returning a u32.
 *
 * NOTE(review): the function body is not present in this extract.
 * Callers pass a u64 accumulator (implicitly narrowed to u32 by the
 * parameter type) together with 0x3ffffff, so this is presumably
 * "v & mask" -- confirm against the complete file.
 */
32 static inline u32
and(u32 v
, u32 mask
)
/*
 * crypto_poly1305_init() - begin a new Poly1305 computation.
 * @desc: shash descriptor; its context area is used as a
 *        struct poly1305_desc_ctx
 *
 * Clears the accumulator dctx->h.  The symbol is exported (GPL-only).
 *
 * NOTE(review): the lines between the memset() and the export are missing
 * from this extract, including the return statement of this int function.
 * Whether the buflen/rset/sset fields that other functions in this file
 * test are also reset here cannot be seen -- confirm against the complete
 * file.
 */
37 int crypto_poly1305_init(struct shash_desc
*desc
)
39 struct poly1305_desc_ctx
*dctx
= shash_desc_ctx(desc
);
/* start from a zero accumulator */
41 memset(dctx
->h
, 0, sizeof(dctx
->h
));
48 EXPORT_SYMBOL_GPL(crypto_poly1305_init
);
50 static void poly1305_setrkey(struct poly1305_desc_ctx
*dctx
, const u8
*key
)
52 /* r &= 0xffffffc0ffffffc0ffffffc0fffffff */
53 dctx
->r
[0] = (get_unaligned_le32(key
+ 0) >> 0) & 0x3ffffff;
54 dctx
->r
[1] = (get_unaligned_le32(key
+ 3) >> 2) & 0x3ffff03;
55 dctx
->r
[2] = (get_unaligned_le32(key
+ 6) >> 4) & 0x3ffc0ff;
56 dctx
->r
[3] = (get_unaligned_le32(key
+ 9) >> 6) & 0x3f03fff;
57 dctx
->r
[4] = (get_unaligned_le32(key
+ 12) >> 8) & 0x00fffff;
60 static void poly1305_setskey(struct poly1305_desc_ctx
*dctx
, const u8
*key
)
62 dctx
->s
[0] = get_unaligned_le32(key
+ 0);
63 dctx
->s
[1] = get_unaligned_le32(key
+ 4);
64 dctx
->s
[2] = get_unaligned_le32(key
+ 8);
65 dctx
->s
[3] = get_unaligned_le32(key
+ 12);
/*
 * Poly1305 requires a unique key for each tag, which implies that we can't set
 * it on the tfm that gets accessed by multiple users simultaneously. Instead we
 * expect the key as the first 32 bytes in the update() call.
 */
/*
 * crypto_poly1305_setdesckey() - take key material from the front of @src.
 * @dctx:   descriptor context receiving the key
 * @src:    input bytes
 * @srclen: number of bytes available at @src
 *
 * Each key half is POLY1305_BLOCK_SIZE bytes long and is only consumed
 * when that many bytes are available.  The symbol is exported (GPL-only).
 *
 * NOTE(review): several lines are missing from this extract (braces, any
 * updates of the rset/sset flags, and the return statement).  The caller
 * in poly1305_blocks() treats the result as the number of bytes left
 * after the key was taken, so the function presumably returns the
 * decremented srclen -- confirm against the complete file.
 */
73 unsigned int crypto_poly1305_setdesckey(struct poly1305_desc_ctx
*dctx
,
74 const u8
*src
, unsigned int srclen
)
/* first key half: "r", only if not already set and a full block is there */
77 if (!dctx
->rset
&& srclen
>= POLY1305_BLOCK_SIZE
) {
78 poly1305_setrkey(dctx
, src
);
79 src
+= POLY1305_BLOCK_SIZE
;
80 srclen
-= POLY1305_BLOCK_SIZE
;
/* second key half: "s", taken from whatever follows */
83 if (srclen
>= POLY1305_BLOCK_SIZE
) {
84 poly1305_setskey(dctx
, src
);
85 src
+= POLY1305_BLOCK_SIZE
;
86 srclen
-= POLY1305_BLOCK_SIZE
;
92 EXPORT_SYMBOL_GPL(crypto_poly1305_setdesckey
);
/*
 * poly1305_blocks() - absorb whole POLY1305_BLOCK_SIZE-byte blocks.
 * @dctx:   descriptor context
 * @src:    input bytes
 * @srclen: number of bytes available at @src
 *
 * If the key is not yet complete (sset clear), key material is first
 * taken from the front of the input via crypto_poly1305_setdesckey().
 * Then, for every full block: the block is added to the accumulator h as
 * five 26-bit limbs, h is multiplied by r, and the result is partially
 * reduced by propagating carries between limbs.
 *
 * NOTE(review): this extract is incomplete.  The remaining parameter(s)
 * (callers pass a fourth argument, and "hibit" is used below), the
 * declaration and setup of s1..s4, the loading of r0..r4 / h0..h4 from
 * the context, the write-back of h and the return statement are not
 * visible.  Callers use the return value as the count of unprocessed
 * bytes -- confirm against the complete file.
 */
94 static unsigned int poly1305_blocks(struct poly1305_desc_ctx
*dctx
,
95 const u8
*src
, unsigned int srclen
,
98 u32 r0
, r1
, r2
, r3
, r4
;
100 u32 h0
, h1
, h2
, h3
, h4
;
101 u64 d0
, d1
, d2
, d3
, d4
;
102 unsigned int datalen
;
/* key not fully set yet: the leading input bytes are key material */
104 if (unlikely(!dctx
->sset
)) {
105 datalen
= crypto_poly1305_setdesckey(dctx
, src
, srclen
);
/* skip the bytes that were consumed as key */
106 src
+= srclen
- datalen
;
127 while (likely(srclen
>= POLY1305_BLOCK_SIZE
)) {
/*
 * Add the block to h: overlapping unaligned 32-bit loads at byte
 * offsets 0/3/6/9/12 are shifted and masked down to 26-bit limbs;
 * hibit is ORed into the top limb.
 */
130 h0
+= (get_unaligned_le32(src
+ 0) >> 0) & 0x3ffffff;
131 h1
+= (get_unaligned_le32(src
+ 3) >> 2) & 0x3ffffff;
132 h2
+= (get_unaligned_le32(src
+ 6) >> 4) & 0x3ffffff;
133 h3
+= (get_unaligned_le32(src
+ 9) >> 6) & 0x3ffffff;
134 h4
+= (get_unaligned_le32(src
+ 12) >> 8) | hibit
;
/*
 * Multiply h by r limb-wise into the 64-bit accumulators d0..d4.
 * Terms that would land above the top limb use s1..s4 instead of
 * r1..r4.  NOTE(review): the definition of s1..s4 is not visible in
 * this extract; presumably r[i] * 5 (folding through 2^130 = 5 mod p)
 * -- confirm.
 */
137 d0
= mlt(h0
, r0
) + mlt(h1
, s4
) + mlt(h2
, s3
) +
138 mlt(h3
, s2
) + mlt(h4
, s1
);
139 d1
= mlt(h0
, r1
) + mlt(h1
, r0
) + mlt(h2
, s4
) +
140 mlt(h3
, s3
) + mlt(h4
, s2
);
141 d2
= mlt(h0
, r2
) + mlt(h1
, r1
) + mlt(h2
, r0
) +
142 mlt(h3
, s4
) + mlt(h4
, s3
);
143 d3
= mlt(h0
, r3
) + mlt(h1
, r2
) + mlt(h2
, r1
) +
144 mlt(h3
, r0
) + mlt(h4
, s4
);
145 d4
= mlt(h0
, r4
) + mlt(h1
, r3
) + mlt(h2
, r2
) +
146 mlt(h3
, r1
) + mlt(h4
, r0
);
/*
 * Carry chain: each limb keeps its low 26 bits and hands the rest to
 * the next limb; the carry out of the top limb re-enters limb 0
 * multiplied by 5, followed by one more carry from h0 into h1.
 */
148 /* (partial) h %= p */
149 d1
+= sr(d0
, 26); h0
= and(d0
, 0x3ffffff);
150 d2
+= sr(d1
, 26); h1
= and(d1
, 0x3ffffff);
151 d3
+= sr(d2
, 26); h2
= and(d2
, 0x3ffffff);
152 d4
+= sr(d3
, 26); h3
= and(d3
, 0x3ffffff);
153 h0
+= sr(d4
, 26) * 5; h4
= and(d4
, 0x3ffffff);
154 h1
+= h0
>> 26; h0
= h0
& 0x3ffffff;
/* advance to the next block */
156 src
+= POLY1305_BLOCK_SIZE
;
157 srclen
-= POLY1305_BLOCK_SIZE
;
/*
 * crypto_poly1305_update() - feed more input into the computation.
 * @desc:   shash descriptor; its context is a struct poly1305_desc_ctx
 * @src:    input bytes
 * @srclen: number of input bytes
 *
 * Input is processed in POLY1305_BLOCK_SIZE-byte blocks; a trailing
 * partial block is kept in dctx->buf until more data arrives.  Blocks
 * processed here are passed to poly1305_blocks() with 1 << 24 as the last
 * argument.  The symbol is exported (GPL-only).
 *
 * NOTE(review): this extract is incomplete.  The declaration of "bytes",
 * the advancing of src/srclen after the buffer top-up, the reset of
 * buflen after a buffered block is processed, the update of srclen after
 * the bulk call, closing braces and the return statement are not
 * visible -- confirm against the complete file.
 */
169 int crypto_poly1305_update(struct shash_desc
*desc
,
170 const u8
*src
, unsigned int srclen
)
172 struct poly1305_desc_ctx
*dctx
= shash_desc_ctx(desc
);
/* a partial block is pending: top it up from the new input first */
175 if (unlikely(dctx
->buflen
)) {
176 bytes
= min(srclen
, POLY1305_BLOCK_SIZE
- dctx
->buflen
);
177 memcpy(dctx
->buf
+ dctx
->buflen
, src
, bytes
);
180 dctx
->buflen
+= bytes
;
/* the buffer now holds a complete block: process it */
182 if (dctx
->buflen
== POLY1305_BLOCK_SIZE
) {
183 poly1305_blocks(dctx
, dctx
->buf
,
184 POLY1305_BLOCK_SIZE
, 1 << 24);
/* bulk path: hand all full blocks straight from the caller's buffer */
189 if (likely(srclen
>= POLY1305_BLOCK_SIZE
)) {
190 bytes
= poly1305_blocks(dctx
, src
, srclen
, 1 << 24);
/* "bytes" is what poly1305_blocks() left over; skip what it consumed */
191 src
+= srclen
- bytes
;
/* stash the remaining tail for the next update()/final() call */
195 if (unlikely(srclen
)) {
196 dctx
->buflen
= srclen
;
197 memcpy(dctx
->buf
, src
, srclen
);
202 EXPORT_SYMBOL_GPL(crypto_poly1305_update
);
/*
 * crypto_poly1305_final() - finish the computation and write the tag.
 * @desc: shash descriptor; its context is a struct poly1305_desc_ctx
 * @dst:  output buffer, written as four little-endian 32-bit words
 *        through a __le32 pointer
 *
 * Steps visible here: pad and process any buffered partial block, fully
 * carry the accumulator h, compute the candidate g = h - p, choose
 * between h and g with a mask instead of a branch, repack the 26-bit
 * limbs into 32-bit words, and add the key words dctx->s[] with carry
 * propagation.  The symbol is exported (GPL-only).
 *
 * NOTE(review): this extract is incomplete.  The declarations of "mask"
 * and "f", the statement guarded by the !sset check, the loading of
 * h0..h4 from the context, the computation of g0, the application of
 * the mask to g0..g4, closing braces and the return statement are not
 * visible -- confirm against the complete file.
 */
204 int crypto_poly1305_final(struct shash_desc
*desc
, u8
*dst
)
206 struct poly1305_desc_ctx
*dctx
= shash_desc_ctx(desc
);
207 __le32
*mac
= (__le32
*)dst
;
208 u32 h0
, h1
, h2
, h3
, h4
;
209 u32 g0
, g1
, g2
, g3
, g4
;
/* NOTE(review): the statement controlled by this check is missing here */
213 if (unlikely(!dctx
->sset
))
/*
 * Final partial block: append a single 1 byte, zero-fill the rest of the
 * buffer and process it with 0 as the last argument (full blocks in
 * update() pass 1 << 24 instead).
 */
216 if (unlikely(dctx
->buflen
)) {
217 dctx
->buf
[dctx
->buflen
++] = 1;
218 memset(dctx
->buf
+ dctx
->buflen
, 0,
219 POLY1305_BLOCK_SIZE
- dctx
->buflen
);
220 poly1305_blocks(dctx
, dctx
->buf
, POLY1305_BLOCK_SIZE
, 0);
/*
 * Full carry pass so every limb fits in 26 bits; the carry out of the
 * top limb re-enters limb 0 multiplied by 5.
 */
230 h2
+= (h1
>> 26); h1
= h1
& 0x3ffffff;
231 h3
+= (h2
>> 26); h2
= h2
& 0x3ffffff;
232 h4
+= (h3
>> 26); h3
= h3
& 0x3ffffff;
233 h0
+= (h4
>> 26) * 5; h4
= h4
& 0x3ffffff;
234 h1
+= (h0
>> 26); h0
= h0
& 0x3ffffff;
/*
 * Candidate g = h + -p, carried limb by limb.  Subtracting 1 << 26 from
 * the top limb makes g4 wrap (top bit set) when h < p.
 */
238 g1
= h1
+ (g0
>> 26); g0
&= 0x3ffffff;
239 g2
= h2
+ (g1
>> 26); g1
&= 0x3ffffff;
240 g3
= h3
+ (g2
>> 26); g2
&= 0x3ffffff;
241 g4
= h4
+ (g3
>> 26) - (1 << 26); g3
&= 0x3ffffff;
/* mask is derived from the top bit of g4, so the selection is branch-free */
243 /* select h if h < p, or h + -p if h >= p */
244 mask
= (g4
>> ((sizeof(u32
) * 8) - 1)) - 1;
251 h0
= (h0
& mask
) | g0
;
252 h1
= (h1
& mask
) | g1
;
253 h2
= (h2
& mask
) | g2
;
254 h3
= (h3
& mask
) | g3
;
255 h4
= (h4
& mask
) | g4
;
/* repack five 26-bit limbs into four 32-bit words (bits above 128 drop out) */
257 /* h = h % (2^128) */
258 h0
= (h0
>> 0) | (h1
<< 26);
259 h1
= (h1
>> 6) | (h2
<< 20);
260 h2
= (h2
>> 12) | (h3
<< 14);
261 h3
= (h3
>> 18) | (h4
<< 8);
/*
 * Add s word by word; the bits of f above 32 carry into the next word.
 * NOTE(review): the first step also shifts f, so it relies on f starting
 * at 0; the declaration/initialisation of f is not visible -- confirm.
 */
263 /* mac = (h + s) % (2^128) */
264 f
= (f
>> 32) + h0
+ dctx
->s
[0]; mac
[0] = cpu_to_le32(f
);
265 f
= (f
>> 32) + h1
+ dctx
->s
[1]; mac
[1] = cpu_to_le32(f
);
266 f
= (f
>> 32) + h2
+ dctx
->s
[2]; mac
[2] = cpu_to_le32(f
);
267 f
= (f
>> 32) + h3
+ dctx
->s
[3]; mac
[3] = cpu_to_le32(f
);
271 EXPORT_SYMBOL_GPL(crypto_poly1305_final
);
/*
 * Algorithm descriptor for the generic Poly1305 implementation.  It wires
 * the init/update/final entry points defined in this file into a
 * struct shash_alg and sizes the per-request context as
 * struct poly1305_desc_ctx.  It is registered as "poly1305" with driver
 * name "poly1305-generic".
 *
 * NOTE(review): some initializer lines are missing from this extract (the
 * opening and closing of the nested member holding the cra_* fields, the
 * closing of the initializer, and possibly further fields) -- confirm
 * against the complete file.
 */
273 static struct shash_alg poly1305_alg
= {
274 .digestsize
= POLY1305_DIGEST_SIZE
,
275 .init
= crypto_poly1305_init
,
276 .update
= crypto_poly1305_update
,
277 .final
= crypto_poly1305_final
,
278 .descsize
= sizeof(struct poly1305_desc_ctx
),
280 .cra_name
= "poly1305",
281 .cra_driver_name
= "poly1305-generic",
283 .cra_flags
= CRYPTO_ALG_TYPE_SHASH
,
/* alignment mask for 32-bit alignment */
284 .cra_alignmask
= sizeof(u32
) - 1,
285 .cra_blocksize
= POLY1305_BLOCK_SIZE
,
286 .cra_module
= THIS_MODULE
,
290 static int __init
poly1305_mod_init(void)
292 return crypto_register_shash(&poly1305_alg
);
295 static void __exit
poly1305_mod_exit(void)
297 crypto_unregister_shash(&poly1305_alg
);
300 module_init(poly1305_mod_init
);
301 module_exit(poly1305_mod_exit
);
303 MODULE_LICENSE("GPL");
304 MODULE_AUTHOR("Martin Willi <martin@strongswan.org>");
305 MODULE_DESCRIPTION("Poly1305 authenticator");
306 MODULE_ALIAS_CRYPTO("poly1305");
307 MODULE_ALIAS_CRYPTO("poly1305-generic");