blob: 8536008e3e356511460acbb818dead4bf1d62340 [file] [log] [blame]
Thomas Gleixnerd2912cb2019-06-04 10:11:33 +02001// SPDX-License-Identifier: GPL-2.0-only
Ard Biesheuvelfdd23892014-03-26 20:53:05 +01002/*
3 * Accelerated GHASH implementation with ARMv8 PMULL instructions.
4 *
Ard Biesheuvel30f1a9f2018-07-30 23:06:42 +02005 * Copyright (C) 2014 - 2018 Linaro Ltd. <ard.biesheuvel@linaro.org>
Ard Biesheuvelfdd23892014-03-26 20:53:05 +01006 */
7
8#include <asm/neon.h>
Ard Biesheuvel6d6254d2017-07-24 11:28:05 +01009#include <asm/simd.h>
Ard Biesheuvelfdd23892014-03-26 20:53:05 +010010#include <asm/unaligned.h>
Ard Biesheuvel537c1442017-07-24 11:28:16 +010011#include <crypto/aes.h>
12#include <crypto/algapi.h>
13#include <crypto/b128ops.h>
Ard Biesheuvel6d6254d2017-07-24 11:28:05 +010014#include <crypto/gf128mul.h>
Ard Biesheuvel537c1442017-07-24 11:28:16 +010015#include <crypto/internal/aead.h>
Ard Biesheuvelfdd23892014-03-26 20:53:05 +010016#include <crypto/internal/hash.h>
Eric Biggerse52b7022019-03-12 22:12:50 -070017#include <crypto/internal/simd.h>
Ard Biesheuvel537c1442017-07-24 11:28:16 +010018#include <crypto/internal/skcipher.h>
19#include <crypto/scatterwalk.h>
Ard Biesheuvelfdd23892014-03-26 20:53:05 +010020#include <linux/cpufeature.h>
21#include <linux/crypto.h>
22#include <linux/module.h>
23
Ard Biesheuvel537c1442017-07-24 11:28:16 +010024MODULE_DESCRIPTION("GHASH and AES-GCM using ARMv8 Crypto Extensions");
Ard Biesheuvelfdd23892014-03-26 20:53:05 +010025MODULE_AUTHOR("Ard Biesheuvel <ard.biesheuvel@linaro.org>");
26MODULE_LICENSE("GPL v2");
Ard Biesheuvel03c9a332017-07-24 11:28:18 +010027MODULE_ALIAS_CRYPTO("ghash");
Ard Biesheuvelfdd23892014-03-26 20:53:05 +010028
29#define GHASH_BLOCK_SIZE 16
30#define GHASH_DIGEST_SIZE 16
Ard Biesheuvel537c1442017-07-24 11:28:16 +010031#define GCM_IV_SIZE 12
Ard Biesheuvelfdd23892014-03-26 20:53:05 +010032
33struct ghash_key {
Ard Biesheuvel22240df72018-08-04 20:46:25 +020034 be128 k;
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +020035 u64 h[][2];
Ard Biesheuvelfdd23892014-03-26 20:53:05 +010036};
37
38struct ghash_desc_ctx {
39 u64 digest[GHASH_DIGEST_SIZE/sizeof(u64)];
40 u8 buf[GHASH_BLOCK_SIZE];
41 u32 count;
42};
43
Ard Biesheuvel537c1442017-07-24 11:28:16 +010044struct gcm_aes_ctx {
45 struct crypto_aes_ctx aes_key;
46 struct ghash_key ghash_key;
47};
48
Ard Biesheuvel03c9a332017-07-24 11:28:18 +010049asmlinkage void pmull_ghash_update_p64(int blocks, u64 dg[], const char *src,
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +020050 u64 const h[][2], const char *head);
Ard Biesheuvel03c9a332017-07-24 11:28:18 +010051
52asmlinkage void pmull_ghash_update_p8(int blocks, u64 dg[], const char *src,
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +020053 u64 const h[][2], const char *head);
Ard Biesheuvel03c9a332017-07-24 11:28:18 +010054
Ard Biesheuvel11031c02019-09-11 00:19:00 +010055asmlinkage void pmull_gcm_encrypt(int bytes, u8 dst[], const u8 src[],
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +020056 u64 const h[][2], u64 dg[], u8 ctr[],
57 u32 const rk[], int rounds, u8 tag[]);
Ard Biesheuvel537c1442017-07-24 11:28:16 +010058
Ard Biesheuvel11031c02019-09-11 00:19:00 +010059asmlinkage void pmull_gcm_decrypt(int bytes, u8 dst[], const u8 src[],
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +020060 u64 const h[][2], u64 dg[], u8 ctr[],
61 u32 const rk[], int rounds, u8 tag[]);
Ard Biesheuvel537c1442017-07-24 11:28:16 +010062
Ard Biesheuvelfdd23892014-03-26 20:53:05 +010063static int ghash_init(struct shash_desc *desc)
64{
65 struct ghash_desc_ctx *ctx = shash_desc_ctx(desc);
66
67 *ctx = (struct ghash_desc_ctx){};
68 return 0;
69}
70
Ard Biesheuvel6d6254d2017-07-24 11:28:05 +010071static void ghash_do_update(int blocks, u64 dg[], const char *src,
Ard Biesheuvele4f87482020-06-29 09:39:24 +020072 struct ghash_key *key, const char *head)
Ard Biesheuvel6d6254d2017-07-24 11:28:05 +010073{
Ard Biesheuvele4f87482020-06-29 09:39:24 +020074 be128 dst = { cpu_to_be64(dg[1]), cpu_to_be64(dg[0]) };
75
76 do {
77 const u8 *in = src;
78
79 if (head) {
80 in = head;
81 blocks++;
82 head = NULL;
83 } else {
84 src += GHASH_BLOCK_SIZE;
85 }
86
87 crypto_xor((u8 *)&dst, in, GHASH_BLOCK_SIZE);
88 gf128mul_lle(&dst, &key->k);
89 } while (--blocks);
90
91 dg[0] = be64_to_cpu(dst.b);
92 dg[1] = be64_to_cpu(dst.a);
93}
94
95static __always_inline
96void ghash_do_simd_update(int blocks, u64 dg[], const char *src,
97 struct ghash_key *key, const char *head,
98 void (*simd_update)(int blocks, u64 dg[],
99 const char *src,
100 u64 const h[][2],
101 const char *head))
102{
103 if (likely(crypto_simd_usable())) {
Ard Biesheuvel6d6254d2017-07-24 11:28:05 +0100104 kernel_neon_begin();
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200105 simd_update(blocks, dg, src, key->h, head);
Ard Biesheuvel6d6254d2017-07-24 11:28:05 +0100106 kernel_neon_end();
107 } else {
Ard Biesheuvele4f87482020-06-29 09:39:24 +0200108 ghash_do_update(blocks, dg, src, key, head);
Ard Biesheuvel6d6254d2017-07-24 11:28:05 +0100109 }
110}
111
Ard Biesheuvel8e492ef2018-08-04 20:46:24 +0200112/* avoid hogging the CPU for too long */
113#define MAX_BLOCKS (SZ_64K / GHASH_BLOCK_SIZE)
114
Ard Biesheuvel37b6aab2020-06-29 09:39:21 +0200115static int ghash_update(struct shash_desc *desc, const u8 *src,
116 unsigned int len)
Ard Biesheuvelfdd23892014-03-26 20:53:05 +0100117{
118 struct ghash_desc_ctx *ctx = shash_desc_ctx(desc);
119 unsigned int partial = ctx->count % GHASH_BLOCK_SIZE;
120
121 ctx->count += len;
122
123 if ((partial + len) >= GHASH_BLOCK_SIZE) {
124 struct ghash_key *key = crypto_shash_ctx(desc->tfm);
125 int blocks;
126
127 if (partial) {
128 int p = GHASH_BLOCK_SIZE - partial;
129
130 memcpy(ctx->buf + partial, src, p);
131 src += p;
132 len -= p;
133 }
134
135 blocks = len / GHASH_BLOCK_SIZE;
136 len %= GHASH_BLOCK_SIZE;
137
Ard Biesheuvel8e492ef2018-08-04 20:46:24 +0200138 do {
139 int chunk = min(blocks, MAX_BLOCKS);
Ard Biesheuvel6d6254d2017-07-24 11:28:05 +0100140
Ard Biesheuvele4f87482020-06-29 09:39:24 +0200141 ghash_do_simd_update(chunk, ctx->digest, src, key,
142 partial ? ctx->buf : NULL,
143 pmull_ghash_update_p8);
Ard Biesheuvel8e492ef2018-08-04 20:46:24 +0200144
145 blocks -= chunk;
146 src += chunk * GHASH_BLOCK_SIZE;
147 partial = 0;
148 } while (unlikely(blocks > 0));
Ard Biesheuvelfdd23892014-03-26 20:53:05 +0100149 }
150 if (len)
151 memcpy(ctx->buf + partial, src, len);
152 return 0;
153}
154
Ard Biesheuvel37b6aab2020-06-29 09:39:21 +0200155static int ghash_final(struct shash_desc *desc, u8 *dst)
Ard Biesheuvelfdd23892014-03-26 20:53:05 +0100156{
157 struct ghash_desc_ctx *ctx = shash_desc_ctx(desc);
158 unsigned int partial = ctx->count % GHASH_BLOCK_SIZE;
159
160 if (partial) {
161 struct ghash_key *key = crypto_shash_ctx(desc->tfm);
162
163 memset(ctx->buf + partial, 0, GHASH_BLOCK_SIZE - partial);
164
Ard Biesheuvele4f87482020-06-29 09:39:24 +0200165 ghash_do_simd_update(1, ctx->digest, ctx->buf, key, NULL,
166 pmull_ghash_update_p8);
Ard Biesheuvel5a22b1982019-01-25 10:36:27 +0100167 }
168 put_unaligned_be64(ctx->digest[1], dst);
169 put_unaligned_be64(ctx->digest[0], dst + 8);
170
171 *ctx = (struct ghash_desc_ctx){};
172 return 0;
173}
174
Ard Biesheuvel22240df72018-08-04 20:46:25 +0200175static void ghash_reflect(u64 h[], const be128 *k)
176{
177 u64 carry = be64_to_cpu(k->a) & BIT(63) ? 1 : 0;
178
179 h[0] = (be64_to_cpu(k->b) << 1) | carry;
180 h[1] = (be64_to_cpu(k->a) << 1) | (be64_to_cpu(k->b) >> 63);
181
182 if (carry)
183 h[1] ^= 0xc200000000000000UL;
184}
185
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100186static int ghash_setkey(struct crypto_shash *tfm,
187 const u8 *inkey, unsigned int keylen)
188{
189 struct ghash_key *key = crypto_shash_ctx(tfm);
190
Eric Biggers674f3682019-12-30 21:19:36 -0600191 if (keylen != GHASH_BLOCK_SIZE)
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100192 return -EINVAL;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100193
Ard Biesheuvel94fe4502020-06-29 09:39:22 +0200194 /* needed for the fallback */
195 memcpy(&key->k, inkey, GHASH_BLOCK_SIZE);
196
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200197 ghash_reflect(key->h[0], &key->k);
Ard Biesheuvel94fe4502020-06-29 09:39:22 +0200198 return 0;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100199}
200
Ard Biesheuvel37b6aab2020-06-29 09:39:21 +0200201static struct shash_alg ghash_alg = {
Ard Biesheuvel5a22b1982019-01-25 10:36:27 +0100202 .base.cra_name = "ghash",
203 .base.cra_driver_name = "ghash-neon",
Ard Biesheuvel5441c652019-11-28 13:55:31 +0100204 .base.cra_priority = 150,
Ard Biesheuvel5a22b1982019-01-25 10:36:27 +0100205 .base.cra_blocksize = GHASH_BLOCK_SIZE,
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200206 .base.cra_ctxsize = sizeof(struct ghash_key) + sizeof(u64[2]),
Ard Biesheuvel5a22b1982019-01-25 10:36:27 +0100207 .base.cra_module = THIS_MODULE,
208
209 .digestsize = GHASH_DIGEST_SIZE,
210 .init = ghash_init,
Ard Biesheuvel37b6aab2020-06-29 09:39:21 +0200211 .update = ghash_update,
212 .final = ghash_final,
Ard Biesheuvel5a22b1982019-01-25 10:36:27 +0100213 .setkey = ghash_setkey,
214 .descsize = sizeof(struct ghash_desc_ctx),
Ard Biesheuvel37b6aab2020-06-29 09:39:21 +0200215};
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100216
217static int num_rounds(struct crypto_aes_ctx *ctx)
218{
219 /*
220 * # of rounds specified by AES:
221 * 128 bit key 10 rounds
222 * 192 bit key 12 rounds
223 * 256 bit key 14 rounds
224 * => n byte key => 6 + (n/4) rounds
225 */
226 return 6 + ctx->key_length / 4;
227}
228
229static int gcm_setkey(struct crypto_aead *tfm, const u8 *inkey,
230 unsigned int keylen)
231{
232 struct gcm_aes_ctx *ctx = crypto_aead_ctx(tfm);
Ard Biesheuvel22240df72018-08-04 20:46:25 +0200233 u8 key[GHASH_BLOCK_SIZE];
Ard Biesheuvel94fe4502020-06-29 09:39:22 +0200234 be128 h;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100235 int ret;
236
Ard Biesheuvelfe3b99b2019-07-02 21:41:28 +0200237 ret = aes_expandkey(&ctx->aes_key, inkey, keylen);
Eric Biggers674f3682019-12-30 21:19:36 -0600238 if (ret)
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100239 return -EINVAL;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100240
Ard Biesheuvelfe3b99b2019-07-02 21:41:28 +0200241 aes_encrypt(&ctx->aes_key, key, (u8[AES_BLOCK_SIZE]){});
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100242
Ard Biesheuvel94fe4502020-06-29 09:39:22 +0200243 /* needed for the fallback */
244 memcpy(&ctx->ghash_key.k, key, GHASH_BLOCK_SIZE);
245
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200246 ghash_reflect(ctx->ghash_key.h[0], &ctx->ghash_key.k);
Ard Biesheuvel94fe4502020-06-29 09:39:22 +0200247
248 h = ctx->ghash_key.k;
249 gf128mul_lle(&h, &ctx->ghash_key.k);
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200250 ghash_reflect(ctx->ghash_key.h[1], &h);
Ard Biesheuvel94fe4502020-06-29 09:39:22 +0200251
252 gf128mul_lle(&h, &ctx->ghash_key.k);
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200253 ghash_reflect(ctx->ghash_key.h[2], &h);
Ard Biesheuvel94fe4502020-06-29 09:39:22 +0200254
255 gf128mul_lle(&h, &ctx->ghash_key.k);
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200256 ghash_reflect(ctx->ghash_key.h[3], &h);
Ard Biesheuvel94fe4502020-06-29 09:39:22 +0200257
258 return 0;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100259}
260
261static int gcm_setauthsize(struct crypto_aead *tfm, unsigned int authsize)
262{
263 switch (authsize) {
264 case 4:
265 case 8:
266 case 12 ... 16:
267 break;
268 default:
269 return -EINVAL;
270 }
271 return 0;
272}
273
274static void gcm_update_mac(u64 dg[], const u8 *src, int count, u8 buf[],
275 int *buf_count, struct gcm_aes_ctx *ctx)
276{
277 if (*buf_count > 0) {
278 int buf_added = min(count, GHASH_BLOCK_SIZE - *buf_count);
279
280 memcpy(&buf[*buf_count], src, buf_added);
281
282 *buf_count += buf_added;
283 src += buf_added;
284 count -= buf_added;
285 }
286
287 if (count >= GHASH_BLOCK_SIZE || *buf_count == GHASH_BLOCK_SIZE) {
288 int blocks = count / GHASH_BLOCK_SIZE;
289
Ard Biesheuvele4f87482020-06-29 09:39:24 +0200290 ghash_do_simd_update(blocks, dg, src, &ctx->ghash_key,
291 *buf_count ? buf : NULL,
292 pmull_ghash_update_p64);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100293
294 src += blocks * GHASH_BLOCK_SIZE;
295 count %= GHASH_BLOCK_SIZE;
296 *buf_count = 0;
297 }
298
299 if (count > 0) {
300 memcpy(buf, src, count);
301 *buf_count = count;
302 }
303}
304
305static void gcm_calculate_auth_mac(struct aead_request *req, u64 dg[])
306{
307 struct crypto_aead *aead = crypto_aead_reqtfm(req);
308 struct gcm_aes_ctx *ctx = crypto_aead_ctx(aead);
309 u8 buf[GHASH_BLOCK_SIZE];
310 struct scatter_walk walk;
311 u32 len = req->assoclen;
312 int buf_count = 0;
313
314 scatterwalk_start(&walk, req->src);
315
316 do {
317 u32 n = scatterwalk_clamp(&walk, len);
318 u8 *p;
319
320 if (!n) {
321 scatterwalk_start(&walk, sg_next(walk.sg));
322 n = scatterwalk_clamp(&walk, len);
323 }
324 p = scatterwalk_map(&walk);
325
326 gcm_update_mac(dg, p, n, buf, &buf_count, ctx);
327 len -= n;
328
329 scatterwalk_unmap(p);
330 scatterwalk_advance(&walk, n);
331 scatterwalk_done(&walk, 0, len);
332 } while (len);
333
334 if (buf_count) {
335 memset(&buf[buf_count], 0, GHASH_BLOCK_SIZE - buf_count);
Ard Biesheuvele4f87482020-06-29 09:39:24 +0200336 ghash_do_simd_update(1, dg, buf, &ctx->ghash_key, NULL,
337 pmull_ghash_update_p64);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100338 }
339}
340
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100341static int gcm_encrypt(struct aead_request *req)
342{
343 struct crypto_aead *aead = crypto_aead_reqtfm(req);
344 struct gcm_aes_ctx *ctx = crypto_aead_ctx(aead);
Ard Biesheuvel71e52c272018-07-30 23:06:40 +0200345 int nrounds = num_rounds(&ctx->aes_key);
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100346 struct skcipher_walk walk;
347 u8 buf[AES_BLOCK_SIZE];
348 u8 iv[AES_BLOCK_SIZE];
349 u64 dg[2] = {};
Herbert Xua4cb40f2020-08-25 11:38:01 +1000350 be128 lengths;
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100351 u8 *tag;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100352 int err;
353
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100354 lengths.a = cpu_to_be64(req->assoclen * 8);
355 lengths.b = cpu_to_be64(req->cryptlen * 8);
356
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100357 if (req->assoclen)
358 gcm_calculate_auth_mac(req, dg);
359
360 memcpy(iv, req->iv, GCM_IV_SIZE);
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100361 put_unaligned_be32(2, iv + GCM_IV_SIZE);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100362
Ard Biesheuvel30f1a9f2018-07-30 23:06:42 +0200363 err = skcipher_walk_aead_encrypt(&walk, req, false);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100364
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100365 if (likely(crypto_simd_usable())) {
Ard Biesheuvel30f1a9f2018-07-30 23:06:42 +0200366 do {
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100367 const u8 *src = walk.src.virt.addr;
368 u8 *dst = walk.dst.virt.addr;
369 int nbytes = walk.nbytes;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100370
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100371 tag = (u8 *)&lengths;
Ard Biesheuvel30f1a9f2018-07-30 23:06:42 +0200372
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100373 if (unlikely(nbytes > 0 && nbytes < AES_BLOCK_SIZE)) {
374 src = dst = memcpy(buf + sizeof(buf) - nbytes,
375 src, nbytes);
376 } else if (nbytes < walk.total) {
377 nbytes &= ~(AES_BLOCK_SIZE - 1);
378 tag = NULL;
379 }
380
381 kernel_neon_begin();
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200382 pmull_gcm_encrypt(nbytes, dst, src, ctx->ghash_key.h,
383 dg, iv, ctx->aes_key.key_enc, nrounds,
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100384 tag);
Ard Biesheuvel7c501362018-04-30 18:18:26 +0200385 kernel_neon_end();
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100386
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100387 if (unlikely(!nbytes))
388 break;
Ard Biesheuvel30f1a9f2018-07-30 23:06:42 +0200389
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100390 if (unlikely(nbytes > 0 && nbytes < AES_BLOCK_SIZE))
391 memcpy(walk.dst.virt.addr,
392 buf + sizeof(buf) - nbytes, nbytes);
393
394 err = skcipher_walk_done(&walk, walk.nbytes - nbytes);
395 } while (walk.nbytes);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100396 } else {
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100397 while (walk.nbytes >= AES_BLOCK_SIZE) {
398 int blocks = walk.nbytes / AES_BLOCK_SIZE;
399 const u8 *src = walk.src.virt.addr;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100400 u8 *dst = walk.dst.virt.addr;
Eric Biggers580e2952019-03-12 22:12:46 -0700401 int remaining = blocks;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100402
403 do {
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100404 aes_encrypt(&ctx->aes_key, buf, iv);
405 crypto_xor_cpy(dst, src, buf, AES_BLOCK_SIZE);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100406 crypto_inc(iv, AES_BLOCK_SIZE);
407
408 dst += AES_BLOCK_SIZE;
409 src += AES_BLOCK_SIZE;
Eric Biggers580e2952019-03-12 22:12:46 -0700410 } while (--remaining > 0);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100411
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100412 ghash_do_update(blocks, dg, walk.dst.virt.addr,
Ard Biesheuvele4f87482020-06-29 09:39:24 +0200413 &ctx->ghash_key, NULL);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100414
415 err = skcipher_walk_done(&walk,
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100416 walk.nbytes % AES_BLOCK_SIZE);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100417 }
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100418
419 /* handle the tail */
Ard Biesheuvelc2b24c32018-08-20 16:58:34 +0200420 if (walk.nbytes) {
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100421 aes_encrypt(&ctx->aes_key, buf, iv);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100422
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100423 crypto_xor_cpy(walk.dst.virt.addr, walk.src.virt.addr,
424 buf, walk.nbytes);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100425
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100426 memcpy(buf, walk.dst.virt.addr, walk.nbytes);
427 memset(buf + walk.nbytes, 0, sizeof(buf) - walk.nbytes);
Ard Biesheuvel71e52c272018-07-30 23:06:40 +0200428 }
429
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100430 tag = (u8 *)&lengths;
431 ghash_do_update(1, dg, tag, &ctx->ghash_key,
Ard Biesheuvele4f87482020-06-29 09:39:24 +0200432 walk.nbytes ? buf : NULL);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100433
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100434 if (walk.nbytes)
435 err = skcipher_walk_done(&walk, 0);
436
437 put_unaligned_be64(dg[1], tag);
438 put_unaligned_be64(dg[0], tag + 8);
439 put_unaligned_be32(1, iv + GCM_IV_SIZE);
440 aes_encrypt(&ctx->aes_key, iv, iv);
441 crypto_xor(tag, iv, AES_BLOCK_SIZE);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100442 }
443
444 if (err)
445 return err;
446
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100447 /* copy authtag to end of dst */
448 scatterwalk_map_and_copy(tag, req->dst, req->assoclen + req->cryptlen,
449 crypto_aead_authsize(aead), 1);
450
451 return 0;
452}
453
454static int gcm_decrypt(struct aead_request *req)
455{
456 struct crypto_aead *aead = crypto_aead_reqtfm(req);
457 struct gcm_aes_ctx *ctx = crypto_aead_ctx(aead);
458 unsigned int authsize = crypto_aead_authsize(aead);
Ard Biesheuvel71e52c272018-07-30 23:06:40 +0200459 int nrounds = num_rounds(&ctx->aes_key);
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100460 struct skcipher_walk walk;
461 u8 buf[AES_BLOCK_SIZE];
462 u8 iv[AES_BLOCK_SIZE];
463 u64 dg[2] = {};
Herbert Xua4cb40f2020-08-25 11:38:01 +1000464 be128 lengths;
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100465 u8 *tag;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100466 int err;
467
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100468 lengths.a = cpu_to_be64(req->assoclen * 8);
469 lengths.b = cpu_to_be64((req->cryptlen - authsize) * 8);
470
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100471 if (req->assoclen)
472 gcm_calculate_auth_mac(req, dg);
473
474 memcpy(iv, req->iv, GCM_IV_SIZE);
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100475 put_unaligned_be32(2, iv + GCM_IV_SIZE);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100476
Ard Biesheuvel30f1a9f2018-07-30 23:06:42 +0200477 err = skcipher_walk_aead_decrypt(&walk, req, false);
478
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100479 if (likely(crypto_simd_usable())) {
Ard Biesheuvel30f1a9f2018-07-30 23:06:42 +0200480 do {
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100481 const u8 *src = walk.src.virt.addr;
482 u8 *dst = walk.dst.virt.addr;
483 int nbytes = walk.nbytes;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100484
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100485 tag = (u8 *)&lengths;
Ard Biesheuvel30f1a9f2018-07-30 23:06:42 +0200486
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100487 if (unlikely(nbytes > 0 && nbytes < AES_BLOCK_SIZE)) {
488 src = dst = memcpy(buf + sizeof(buf) - nbytes,
489 src, nbytes);
490 } else if (nbytes < walk.total) {
491 nbytes &= ~(AES_BLOCK_SIZE - 1);
492 tag = NULL;
Ard Biesheuvel30f1a9f2018-07-30 23:06:42 +0200493 }
494
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100495 kernel_neon_begin();
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200496 pmull_gcm_decrypt(nbytes, dst, src, ctx->ghash_key.h,
497 dg, iv, ctx->aes_key.key_enc, nrounds,
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100498 tag);
Ard Biesheuvel7c501362018-04-30 18:18:26 +0200499 kernel_neon_end();
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100500
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100501 if (unlikely(!nbytes))
502 break;
Ard Biesheuvelc7513c22018-07-27 14:59:15 +0200503
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100504 if (unlikely(nbytes > 0 && nbytes < AES_BLOCK_SIZE))
505 memcpy(walk.dst.virt.addr,
506 buf + sizeof(buf) - nbytes, nbytes);
507
508 err = skcipher_walk_done(&walk, walk.nbytes - nbytes);
509 } while (walk.nbytes);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100510 } else {
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100511 while (walk.nbytes >= AES_BLOCK_SIZE) {
512 int blocks = walk.nbytes / AES_BLOCK_SIZE;
513 const u8 *src = walk.src.virt.addr;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100514 u8 *dst = walk.dst.virt.addr;
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100515
516 ghash_do_update(blocks, dg, walk.src.virt.addr,
Ard Biesheuvele4f87482020-06-29 09:39:24 +0200517 &ctx->ghash_key, NULL);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100518
519 do {
Ard Biesheuvelfe3b99b2019-07-02 21:41:28 +0200520 aes_encrypt(&ctx->aes_key, buf, iv);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100521 crypto_xor_cpy(dst, src, buf, AES_BLOCK_SIZE);
522 crypto_inc(iv, AES_BLOCK_SIZE);
523
524 dst += AES_BLOCK_SIZE;
525 src += AES_BLOCK_SIZE;
526 } while (--blocks > 0);
527
528 err = skcipher_walk_done(&walk,
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100529 walk.nbytes % AES_BLOCK_SIZE);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100530 }
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100531
532 /* handle the tail */
Ard Biesheuvelc2b24c32018-08-20 16:58:34 +0200533 if (walk.nbytes) {
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100534 memcpy(buf, walk.src.virt.addr, walk.nbytes);
535 memset(buf + walk.nbytes, 0, sizeof(buf) - walk.nbytes);
Ard Biesheuvel71e52c272018-07-30 23:06:40 +0200536 }
537
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100538 tag = (u8 *)&lengths;
539 ghash_do_update(1, dg, tag, &ctx->ghash_key,
Ard Biesheuvele4f87482020-06-29 09:39:24 +0200540 walk.nbytes ? buf : NULL);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100541
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100542 if (walk.nbytes) {
543 aes_encrypt(&ctx->aes_key, buf, iv);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100544
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100545 crypto_xor_cpy(walk.dst.virt.addr, walk.src.virt.addr,
546 buf, walk.nbytes);
547
548 err = skcipher_walk_done(&walk, 0);
549 }
550
551 put_unaligned_be64(dg[1], tag);
552 put_unaligned_be64(dg[0], tag + 8);
553 put_unaligned_be32(1, iv + GCM_IV_SIZE);
554 aes_encrypt(&ctx->aes_key, iv, iv);
555 crypto_xor(tag, iv, AES_BLOCK_SIZE);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100556 }
557
558 if (err)
559 return err;
560
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100561 /* compare calculated auth tag with the stored one */
562 scatterwalk_map_and_copy(buf, req->src,
563 req->assoclen + req->cryptlen - authsize,
564 authsize, 0);
565
566 if (crypto_memneq(tag, buf, authsize))
567 return -EBADMSG;
568 return 0;
569}
570
571static struct aead_alg gcm_aes_alg = {
572 .ivsize = GCM_IV_SIZE,
Ard Biesheuvel11031c02019-09-11 00:19:00 +0100573 .chunksize = AES_BLOCK_SIZE,
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100574 .maxauthsize = AES_BLOCK_SIZE,
575 .setkey = gcm_setkey,
576 .setauthsize = gcm_setauthsize,
577 .encrypt = gcm_encrypt,
578 .decrypt = gcm_decrypt,
579
580 .base.cra_name = "gcm(aes)",
581 .base.cra_driver_name = "gcm-aes-ce",
582 .base.cra_priority = 300,
583 .base.cra_blocksize = 1,
Ard Biesheuvel17d0fb1f2020-06-29 09:39:23 +0200584 .base.cra_ctxsize = sizeof(struct gcm_aes_ctx) +
585 4 * sizeof(u64[2]),
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100586 .base.cra_module = THIS_MODULE,
Ard Biesheuvelfdd23892014-03-26 20:53:05 +0100587};
588
589static int __init ghash_ce_mod_init(void)
590{
Andrew Murrayaaba0982019-04-09 10:52:40 +0100591 if (!cpu_have_named_feature(ASIMD))
Ard Biesheuvel03c9a332017-07-24 11:28:18 +0100592 return -ENODEV;
593
Andrew Murrayaaba0982019-04-09 10:52:40 +0100594 if (cpu_have_named_feature(PMULL))
Ard Biesheuvel37b6aab2020-06-29 09:39:21 +0200595 return crypto_register_aead(&gcm_aes_alg);
Ard Biesheuvel537c1442017-07-24 11:28:16 +0100596
Ard Biesheuvel37b6aab2020-06-29 09:39:21 +0200597 return crypto_register_shash(&ghash_alg);
Ard Biesheuvelfdd23892014-03-26 20:53:05 +0100598}
599
600static void __exit ghash_ce_mod_exit(void)
601{
Andrew Murrayaaba0982019-04-09 10:52:40 +0100602 if (cpu_have_named_feature(PMULL))
Ard Biesheuvel37b6aab2020-06-29 09:39:21 +0200603 crypto_unregister_aead(&gcm_aes_alg);
Ard Biesheuvel5a22b1982019-01-25 10:36:27 +0100604 else
Ard Biesheuvel37b6aab2020-06-29 09:39:21 +0200605 crypto_unregister_shash(&ghash_alg);
Ard Biesheuvelfdd23892014-03-26 20:53:05 +0100606}
607
Ard Biesheuvel03c9a332017-07-24 11:28:18 +0100608static const struct cpu_feature ghash_cpu_feature[] = {
609 { cpu_feature(PMULL) }, { }
610};
611MODULE_DEVICE_TABLE(cpu, ghash_cpu_feature);
612
613module_init(ghash_ce_mod_init);
Ard Biesheuvelfdd23892014-03-26 20:53:05 +0100614module_exit(ghash_ce_mod_exit);