Linux Audio

Check our new training course

Loading...
v6.13.7
  1/*
  2 * Cryptographic API.
  3 *
  4 * Glue code for the SHA256 Secure Hash Algorithm assembler implementations
  5 * using SSSE3, AVX, AVX2, and SHA-NI instructions.
  6 *
  7 * This file is based on sha256_generic.c
  8 *
  9 * Copyright (C) 2013 Intel Corporation.
 10 *
 11 * Author:
 12 *     Tim Chen <tim.c.chen@linux.intel.com>
 13 *
 14 * This program is free software; you can redistribute it and/or modify it
 15 * under the terms of the GNU General Public License as published by the Free
 16 * Software Foundation; either version 2 of the License, or (at your option)
 17 * any later version.
 18 *
 19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 20 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 22 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 23 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 24 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 25 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 26 * SOFTWARE.
 27 */
 28
 29
 30#define pr_fmt(fmt)	KBUILD_MODNAME ": " fmt
 31
 32#include <crypto/internal/hash.h>
 33#include <crypto/internal/simd.h>
 34#include <linux/init.h>
 35#include <linux/module.h>
 36#include <linux/mm.h>
 
 37#include <linux/types.h>
 38#include <crypto/sha2.h>
 39#include <crypto/sha256_base.h>
 
 
 
 40#include <linux/string.h>
 41#include <asm/cpu_device_id.h>
 42#include <asm/simd.h>
 43
 44asmlinkage void sha256_transform_ssse3(struct sha256_state *state,
 45				       const u8 *data, int blocks);
 46
 47static const struct x86_cpu_id module_cpu_ids[] = {
 48#ifdef CONFIG_AS_SHA256_NI
 49	X86_MATCH_FEATURE(X86_FEATURE_SHA_NI, NULL),
 
 
 
 50#endif
 51	X86_MATCH_FEATURE(X86_FEATURE_AVX2, NULL),
 52	X86_MATCH_FEATURE(X86_FEATURE_AVX, NULL),
 53	X86_MATCH_FEATURE(X86_FEATURE_SSSE3, NULL),
 54	{}
 55};
 56MODULE_DEVICE_TABLE(x86cpu, module_cpu_ids);
 57
 58static int _sha256_update(struct shash_desc *desc, const u8 *data,
 59			  unsigned int len, sha256_block_fn *sha256_xform)
 60{
 61	struct sha256_state *sctx = shash_desc_ctx(desc);
 62
 63	if (!crypto_simd_usable() ||
 64	    (sctx->count % SHA256_BLOCK_SIZE) + len < SHA256_BLOCK_SIZE)
 65		return crypto_sha256_update(desc, data, len);
 66
 67	/*
 68	 * Make sure struct sha256_state begins directly with the SHA256
 69	 * 256-bit internal state, as this is what the asm functions expect.
 70	 */
 71	BUILD_BUG_ON(offsetof(struct sha256_state, state) != 0);
 72
 73	kernel_fpu_begin();
 74	sha256_base_do_update(desc, data, len, sha256_xform);
 75	kernel_fpu_end();
 76
 77	return 0;
 78}
 79
 80static int sha256_finup(struct shash_desc *desc, const u8 *data,
 81	      unsigned int len, u8 *out, sha256_block_fn *sha256_xform)
 82{
 83	if (!crypto_simd_usable())
 84		return crypto_sha256_finup(desc, data, len, out);
 85
 86	kernel_fpu_begin();
 87	if (len)
 88		sha256_base_do_update(desc, data, len, sha256_xform);
 89	sha256_base_do_finalize(desc, sha256_xform);
 90	kernel_fpu_end();
 91
 92	return sha256_base_finish(desc, out);
 93}
 94
 95static int sha256_ssse3_update(struct shash_desc *desc, const u8 *data,
 96			 unsigned int len)
 97{
 98	return _sha256_update(desc, data, len, sha256_transform_ssse3);
 99}
 
 
 
 
100
101static int sha256_ssse3_finup(struct shash_desc *desc, const u8 *data,
102	      unsigned int len, u8 *out)
103{
104	return sha256_finup(desc, data, len, out, sha256_transform_ssse3);
105}
106
107/* Add padding and return the message digest. */
108static int sha256_ssse3_final(struct shash_desc *desc, u8 *out)
109{
110	return sha256_ssse3_finup(desc, NULL, 0, out);
111}
112
113static int sha256_ssse3_digest(struct shash_desc *desc, const u8 *data,
114	      unsigned int len, u8 *out)
115{
116	return sha256_base_init(desc) ?:
117	       sha256_ssse3_finup(desc, data, len, out);
118}
119
120static struct shash_alg sha256_ssse3_algs[] = { {
121	.digestsize	=	SHA256_DIGEST_SIZE,
122	.init		=	sha256_base_init,
123	.update		=	sha256_ssse3_update,
124	.final		=	sha256_ssse3_final,
125	.finup		=	sha256_ssse3_finup,
126	.digest		=	sha256_ssse3_digest,
127	.descsize	=	sizeof(struct sha256_state),
128	.base		=	{
129		.cra_name	=	"sha256",
130		.cra_driver_name =	"sha256-ssse3",
131		.cra_priority	=	150,
132		.cra_blocksize	=	SHA256_BLOCK_SIZE,
133		.cra_module	=	THIS_MODULE,
134	}
135}, {
136	.digestsize	=	SHA224_DIGEST_SIZE,
137	.init		=	sha224_base_init,
138	.update		=	sha256_ssse3_update,
139	.final		=	sha256_ssse3_final,
140	.finup		=	sha256_ssse3_finup,
141	.descsize	=	sizeof(struct sha256_state),
142	.base		=	{
143		.cra_name	=	"sha224",
144		.cra_driver_name =	"sha224-ssse3",
145		.cra_priority	=	150,
146		.cra_blocksize	=	SHA224_BLOCK_SIZE,
147		.cra_module	=	THIS_MODULE,
148	}
149} };
150
151static int register_sha256_ssse3(void)
152{
153	if (boot_cpu_has(X86_FEATURE_SSSE3))
154		return crypto_register_shashes(sha256_ssse3_algs,
155				ARRAY_SIZE(sha256_ssse3_algs));
156	return 0;
157}
158
159static void unregister_sha256_ssse3(void)
160{
161	if (boot_cpu_has(X86_FEATURE_SSSE3))
162		crypto_unregister_shashes(sha256_ssse3_algs,
163				ARRAY_SIZE(sha256_ssse3_algs));
164}
165
166asmlinkage void sha256_transform_avx(struct sha256_state *state,
167				     const u8 *data, int blocks);
168
169static int sha256_avx_update(struct shash_desc *desc, const u8 *data,
170			 unsigned int len)
171{
172	return _sha256_update(desc, data, len, sha256_transform_avx);
173}
174
175static int sha256_avx_finup(struct shash_desc *desc, const u8 *data,
176		      unsigned int len, u8 *out)
177{
178	return sha256_finup(desc, data, len, out, sha256_transform_avx);
179}
180
181static int sha256_avx_final(struct shash_desc *desc, u8 *out)
 
182{
183	return sha256_avx_finup(desc, NULL, 0, out);
184}
 
185
186static int sha256_avx_digest(struct shash_desc *desc, const u8 *data,
187		      unsigned int len, u8 *out)
188{
189	return sha256_base_init(desc) ?:
190	       sha256_avx_finup(desc, data, len, out);
191}
192
193static struct shash_alg sha256_avx_algs[] = { {
194	.digestsize	=	SHA256_DIGEST_SIZE,
195	.init		=	sha256_base_init,
196	.update		=	sha256_avx_update,
197	.final		=	sha256_avx_final,
198	.finup		=	sha256_avx_finup,
199	.digest		=	sha256_avx_digest,
200	.descsize	=	sizeof(struct sha256_state),
201	.base		=	{
202		.cra_name	=	"sha256",
203		.cra_driver_name =	"sha256-avx",
204		.cra_priority	=	160,
205		.cra_blocksize	=	SHA256_BLOCK_SIZE,
206		.cra_module	=	THIS_MODULE,
207	}
208}, {
209	.digestsize	=	SHA224_DIGEST_SIZE,
210	.init		=	sha224_base_init,
211	.update		=	sha256_avx_update,
212	.final		=	sha256_avx_final,
213	.finup		=	sha256_avx_finup,
214	.descsize	=	sizeof(struct sha256_state),
215	.base		=	{
216		.cra_name	=	"sha224",
217		.cra_driver_name =	"sha224-avx",
218		.cra_priority	=	160,
219		.cra_blocksize	=	SHA224_BLOCK_SIZE,
220		.cra_module	=	THIS_MODULE,
221	}
222} };
223
224static bool avx_usable(void)
225{
226	if (!cpu_has_xfeatures(XFEATURE_MASK_SSE | XFEATURE_MASK_YMM, NULL)) {
227		if (boot_cpu_has(X86_FEATURE_AVX))
228			pr_info("AVX detected but unusable.\n");
229		return false;
230	}
231
232	return true;
233}
234
235static int register_sha256_avx(void)
236{
237	if (avx_usable())
238		return crypto_register_shashes(sha256_avx_algs,
239				ARRAY_SIZE(sha256_avx_algs));
240	return 0;
241}
242
243static void unregister_sha256_avx(void)
 
244{
245	if (avx_usable())
246		crypto_unregister_shashes(sha256_avx_algs,
247				ARRAY_SIZE(sha256_avx_algs));
248}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
249
250asmlinkage void sha256_transform_rorx(struct sha256_state *state,
251				      const u8 *data, int blocks);
252
253static int sha256_avx2_update(struct shash_desc *desc, const u8 *data,
254			 unsigned int len)
255{
256	return _sha256_update(desc, data, len, sha256_transform_rorx);
257}
258
259static int sha256_avx2_finup(struct shash_desc *desc, const u8 *data,
260		      unsigned int len, u8 *out)
261{
262	return sha256_finup(desc, data, len, out, sha256_transform_rorx);
263}
264
265static int sha256_avx2_final(struct shash_desc *desc, u8 *out)
266{
267	return sha256_avx2_finup(desc, NULL, 0, out);
268}
269
270static int sha256_avx2_digest(struct shash_desc *desc, const u8 *data,
271		      unsigned int len, u8 *out)
272{
273	return sha256_base_init(desc) ?:
274	       sha256_avx2_finup(desc, data, len, out);
275}
276
277static struct shash_alg sha256_avx2_algs[] = { {
278	.digestsize	=	SHA256_DIGEST_SIZE,
279	.init		=	sha256_base_init,
280	.update		=	sha256_avx2_update,
281	.final		=	sha256_avx2_final,
282	.finup		=	sha256_avx2_finup,
283	.digest		=	sha256_avx2_digest,
284	.descsize	=	sizeof(struct sha256_state),
285	.base		=	{
286		.cra_name	=	"sha256",
287		.cra_driver_name =	"sha256-avx2",
288		.cra_priority	=	170,
289		.cra_blocksize	=	SHA256_BLOCK_SIZE,
290		.cra_module	=	THIS_MODULE,
291	}
292}, {
293	.digestsize	=	SHA224_DIGEST_SIZE,
294	.init		=	sha224_base_init,
295	.update		=	sha256_avx2_update,
296	.final		=	sha256_avx2_final,
297	.finup		=	sha256_avx2_finup,
298	.descsize	=	sizeof(struct sha256_state),
299	.base		=	{
300		.cra_name	=	"sha224",
301		.cra_driver_name =	"sha224-avx2",
302		.cra_priority	=	170,
303		.cra_blocksize	=	SHA224_BLOCK_SIZE,
304		.cra_module	=	THIS_MODULE,
305	}
306} };
307
308static bool avx2_usable(void)
309{
310	if (avx_usable() && boot_cpu_has(X86_FEATURE_AVX2) &&
311		    boot_cpu_has(X86_FEATURE_BMI2))
312		return true;
313
314	return false;
315}
316
317static int register_sha256_avx2(void)
318{
319	if (avx2_usable())
320		return crypto_register_shashes(sha256_avx2_algs,
321				ARRAY_SIZE(sha256_avx2_algs));
322	return 0;
323}
324
325static void unregister_sha256_avx2(void)
326{
327	if (avx2_usable())
328		crypto_unregister_shashes(sha256_avx2_algs,
329				ARRAY_SIZE(sha256_avx2_algs));
330}
331
332#ifdef CONFIG_AS_SHA256_NI
333asmlinkage void sha256_ni_transform(struct sha256_state *digest,
334				    const u8 *data, int rounds);
 
 
 
 
 
 
335
336static int sha256_ni_update(struct shash_desc *desc, const u8 *data,
337			 unsigned int len)
338{
339	return _sha256_update(desc, data, len, sha256_ni_transform);
340}
341
342static int sha256_ni_finup(struct shash_desc *desc, const u8 *data,
343		      unsigned int len, u8 *out)
344{
345	return sha256_finup(desc, data, len, out, sha256_ni_transform);
346}
347
348static int sha256_ni_final(struct shash_desc *desc, u8 *out)
349{
350	return sha256_ni_finup(desc, NULL, 0, out);
351}
352
353static int sha256_ni_digest(struct shash_desc *desc, const u8 *data,
354		      unsigned int len, u8 *out)
355{
356	return sha256_base_init(desc) ?:
357	       sha256_ni_finup(desc, data, len, out);
358}
359
360static struct shash_alg sha256_ni_algs[] = { {
361	.digestsize	=	SHA256_DIGEST_SIZE,
362	.init		=	sha256_base_init,
363	.update		=	sha256_ni_update,
364	.final		=	sha256_ni_final,
365	.finup		=	sha256_ni_finup,
366	.digest		=	sha256_ni_digest,
367	.descsize	=	sizeof(struct sha256_state),
 
368	.base		=	{
369		.cra_name	=	"sha256",
370		.cra_driver_name =	"sha256-ni",
371		.cra_priority	=	250,
 
372		.cra_blocksize	=	SHA256_BLOCK_SIZE,
373		.cra_module	=	THIS_MODULE,
374	}
375}, {
376	.digestsize	=	SHA224_DIGEST_SIZE,
377	.init		=	sha224_base_init,
378	.update		=	sha256_ni_update,
379	.final		=	sha256_ni_final,
380	.finup		=	sha256_ni_finup,
 
381	.descsize	=	sizeof(struct sha256_state),
 
382	.base		=	{
383		.cra_name	=	"sha224",
384		.cra_driver_name =	"sha224-ni",
385		.cra_priority	=	250,
 
386		.cra_blocksize	=	SHA224_BLOCK_SIZE,
387		.cra_module	=	THIS_MODULE,
388	}
389} };
390
391static int register_sha256_ni(void)
 
392{
393	if (boot_cpu_has(X86_FEATURE_SHA_NI))
394		return crypto_register_shashes(sha256_ni_algs,
395				ARRAY_SIZE(sha256_ni_algs));
396	return 0;
397}
398
399static void unregister_sha256_ni(void)
400{
401	if (boot_cpu_has(X86_FEATURE_SHA_NI))
402		crypto_unregister_shashes(sha256_ni_algs,
403				ARRAY_SIZE(sha256_ni_algs));
404}
405
406#else
407static inline int register_sha256_ni(void) { return 0; }
408static inline void unregister_sha256_ni(void) { }
 
 
409#endif
410
411static int __init sha256_ssse3_mod_init(void)
412{
413	if (!x86_match_cpu(module_cpu_ids))
414		return -ENODEV;
415
416	if (register_sha256_ssse3())
417		goto fail;
418
419	if (register_sha256_avx()) {
420		unregister_sha256_ssse3();
421		goto fail;
422	}
423
424	if (register_sha256_avx2()) {
425		unregister_sha256_avx();
426		unregister_sha256_ssse3();
427		goto fail;
428	}
 
429
430	if (register_sha256_ni()) {
431		unregister_sha256_avx2();
432		unregister_sha256_avx();
433		unregister_sha256_ssse3();
434		goto fail;
 
 
 
 
 
 
 
435	}
 
436
437	return 0;
438fail:
439	return -ENODEV;
440}
441
442static void __exit sha256_ssse3_mod_fini(void)
443{
444	unregister_sha256_ni();
445	unregister_sha256_avx2();
446	unregister_sha256_avx();
447	unregister_sha256_ssse3();
448}
449
450module_init(sha256_ssse3_mod_init);
451module_exit(sha256_ssse3_mod_fini);
452
453MODULE_LICENSE("GPL");
454MODULE_DESCRIPTION("SHA256 Secure Hash Algorithm, Supplemental SSE3 accelerated");
455
456MODULE_ALIAS_CRYPTO("sha256");
457MODULE_ALIAS_CRYPTO("sha256-ssse3");
458MODULE_ALIAS_CRYPTO("sha256-avx");
459MODULE_ALIAS_CRYPTO("sha256-avx2");
460MODULE_ALIAS_CRYPTO("sha224");
461MODULE_ALIAS_CRYPTO("sha224-ssse3");
462MODULE_ALIAS_CRYPTO("sha224-avx");
463MODULE_ALIAS_CRYPTO("sha224-avx2");
464#ifdef CONFIG_AS_SHA256_NI
465MODULE_ALIAS_CRYPTO("sha256-ni");
466MODULE_ALIAS_CRYPTO("sha224-ni");
467#endif
v3.15
  1/*
  2 * Cryptographic API.
  3 *
  4 * Glue code for the SHA256 Secure Hash Algorithm assembler
  5 * implementation using supplemental SSE3 / AVX / AVX2 instructions.
  6 *
  7 * This file is based on sha256_generic.c
  8 *
  9 * Copyright (C) 2013 Intel Corporation.
 10 *
 11 * Author:
 12 *     Tim Chen <tim.c.chen@linux.intel.com>
 13 *
 14 * This program is free software; you can redistribute it and/or modify it
 15 * under the terms of the GNU General Public License as published by the Free
 16 * Software Foundation; either version 2 of the License, or (at your option)
 17 * any later version.
 18 *
 19 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 20 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 21 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 22 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 23 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 24 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 25 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 26 * SOFTWARE.
 27 */
 28
 29
 30#define pr_fmt(fmt)	KBUILD_MODNAME ": " fmt
 31
 32#include <crypto/internal/hash.h>
 
 33#include <linux/init.h>
 34#include <linux/module.h>
 35#include <linux/mm.h>
 36#include <linux/cryptohash.h>
 37#include <linux/types.h>
 38#include <crypto/sha.h>
 39#include <asm/byteorder.h>
 40#include <asm/i387.h>
 41#include <asm/xcr.h>
 42#include <asm/xsave.h>
 43#include <linux/string.h>
 
 
 44
 45asmlinkage void sha256_transform_ssse3(const char *data, u32 *digest,
 46				     u64 rounds);
 47#ifdef CONFIG_AS_AVX
 48asmlinkage void sha256_transform_avx(const char *data, u32 *digest,
 49				     u64 rounds);
 50#endif
 51#ifdef CONFIG_AS_AVX2
 52asmlinkage void sha256_transform_rorx(const char *data, u32 *digest,
 53				     u64 rounds);
 54#endif
 
 
 
 
 
 
 
 
 
 
 
 55
 56static asmlinkage void (*sha256_transform_asm)(const char *, u32 *, u64);
 
 
 
 
 
 
 
 
 
 
 
 
 57
 
 
 58
 59static int sha256_ssse3_init(struct shash_desc *desc)
 
 60{
 61	struct sha256_state *sctx = shash_desc_ctx(desc);
 
 
 
 
 
 
 
 
 
 
 62
 63	sctx->state[0] = SHA256_H0;
 64	sctx->state[1] = SHA256_H1;
 65	sctx->state[2] = SHA256_H2;
 66	sctx->state[3] = SHA256_H3;
 67	sctx->state[4] = SHA256_H4;
 68	sctx->state[5] = SHA256_H5;
 69	sctx->state[6] = SHA256_H6;
 70	sctx->state[7] = SHA256_H7;
 71	sctx->count = 0;
 72
 73	return 0;
 
 
 
 74}
 75
 76static int __sha256_ssse3_update(struct shash_desc *desc, const u8 *data,
 77			       unsigned int len, unsigned int partial)
 78{
 79	struct sha256_state *sctx = shash_desc_ctx(desc);
 80	unsigned int done = 0;
 81
 82	sctx->count += len;
 
 
 
 
 
 83
 84	if (partial) {
 85		done = SHA256_BLOCK_SIZE - partial;
 86		memcpy(sctx->buf + partial, data, done);
 87		sha256_transform_asm(sctx->buf, sctx->state, 1);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 88	}
 
 89
 90	if (len - done >= SHA256_BLOCK_SIZE) {
 91		const unsigned int rounds = (len - done) / SHA256_BLOCK_SIZE;
 
 
 
 
 
 92
 93		sha256_transform_asm(data + done, sctx->state, (u64) rounds);
 
 
 
 
 
 94
 95		done += rounds * SHA256_BLOCK_SIZE;
 96	}
 97
 98	memcpy(sctx->buf, data + done, len - done);
 
 
 
 
 99
100	return 0;
 
 
 
101}
102
103static int sha256_ssse3_update(struct shash_desc *desc, const u8 *data,
104			     unsigned int len)
105{
106	struct sha256_state *sctx = shash_desc_ctx(desc);
107	unsigned int partial = sctx->count % SHA256_BLOCK_SIZE;
108	int res;
109
110	/* Handle the fast case right here */
111	if (partial + len < SHA256_BLOCK_SIZE) {
112		sctx->count += len;
113		memcpy(sctx->buf + partial, data, len);
 
 
114
115		return 0;
 
 
 
 
 
 
 
 
 
 
 
 
 
116	}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
117
118	if (!irq_fpu_usable()) {
119		res = crypto_sha256_update(desc, data, len);
120	} else {
121		kernel_fpu_begin();
122		res = __sha256_ssse3_update(desc, data, len, partial);
123		kernel_fpu_end();
124	}
125
126	return res;
127}
128
 
 
 
 
 
 
 
129
130/* Add padding and return the message digest. */
131static int sha256_ssse3_final(struct shash_desc *desc, u8 *out)
132{
133	struct sha256_state *sctx = shash_desc_ctx(desc);
134	unsigned int i, index, padlen;
135	__be32 *dst = (__be32 *)out;
136	__be64 bits;
137	static const u8 padding[SHA256_BLOCK_SIZE] = { 0x80, };
138
139	bits = cpu_to_be64(sctx->count << 3);
140
141	/* Pad out to 56 mod 64 and append length */
142	index = sctx->count % SHA256_BLOCK_SIZE;
143	padlen = (index < 56) ? (56 - index) : ((SHA256_BLOCK_SIZE+56)-index);
144
145	if (!irq_fpu_usable()) {
146		crypto_sha256_update(desc, padding, padlen);
147		crypto_sha256_update(desc, (const u8 *)&bits, sizeof(bits));
148	} else {
149		kernel_fpu_begin();
150		/* We need to fill a whole block for __sha256_ssse3_update() */
151		if (padlen <= 56) {
152			sctx->count += padlen;
153			memcpy(sctx->buf + index, padding, padlen);
154		} else {
155			__sha256_ssse3_update(desc, padding, padlen, index);
156		}
157		__sha256_ssse3_update(desc, (const u8 *)&bits,
158					sizeof(bits), 56);
159		kernel_fpu_end();
160	}
161
162	/* Store state in digest */
163	for (i = 0; i < 8; i++)
164		dst[i] = cpu_to_be32(sctx->state[i]);
165
166	/* Wipe context */
167	memset(sctx, 0, sizeof(*sctx));
168
169	return 0;
 
 
 
170}
171
172static int sha256_ssse3_export(struct shash_desc *desc, void *out)
 
173{
174	struct sha256_state *sctx = shash_desc_ctx(desc);
 
175
176	memcpy(out, sctx, sizeof(*sctx));
 
 
 
177
178	return 0;
 
 
 
 
179}
180
181static int sha256_ssse3_import(struct shash_desc *desc, const void *in)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
182{
183	struct sha256_state *sctx = shash_desc_ctx(desc);
 
 
184
185	memcpy(sctx, in, sizeof(*sctx));
 
186
 
 
 
 
 
187	return 0;
188}
189
190static int sha224_ssse3_init(struct shash_desc *desc)
191{
192	struct sha256_state *sctx = shash_desc_ctx(desc);
 
 
 
193
194	sctx->state[0] = SHA224_H0;
195	sctx->state[1] = SHA224_H1;
196	sctx->state[2] = SHA224_H2;
197	sctx->state[3] = SHA224_H3;
198	sctx->state[4] = SHA224_H4;
199	sctx->state[5] = SHA224_H5;
200	sctx->state[6] = SHA224_H6;
201	sctx->state[7] = SHA224_H7;
202	sctx->count = 0;
203
204	return 0;
 
 
 
205}
206
207static int sha224_ssse3_final(struct shash_desc *desc, u8 *hash)
 
208{
209	u8 D[SHA256_DIGEST_SIZE];
 
210
211	sha256_ssse3_final(desc, D);
 
 
 
212
213	memcpy(hash, D, SHA224_DIGEST_SIZE);
214	memset(D, 0, SHA256_DIGEST_SIZE);
215
216	return 0;
 
217}
218
219static struct shash_alg algs[] = { {
220	.digestsize	=	SHA256_DIGEST_SIZE,
221	.init		=	sha256_ssse3_init,
222	.update		=	sha256_ssse3_update,
223	.final		=	sha256_ssse3_final,
224	.export		=	sha256_ssse3_export,
225	.import		=	sha256_ssse3_import,
226	.descsize	=	sizeof(struct sha256_state),
227	.statesize	=	sizeof(struct sha256_state),
228	.base		=	{
229		.cra_name	=	"sha256",
230		.cra_driver_name =	"sha256-ssse3",
231		.cra_priority	=	150,
232		.cra_flags	=	CRYPTO_ALG_TYPE_SHASH,
233		.cra_blocksize	=	SHA256_BLOCK_SIZE,
234		.cra_module	=	THIS_MODULE,
235	}
236}, {
237	.digestsize	=	SHA224_DIGEST_SIZE,
238	.init		=	sha224_ssse3_init,
239	.update		=	sha256_ssse3_update,
240	.final		=	sha224_ssse3_final,
241	.export		=	sha256_ssse3_export,
242	.import		=	sha256_ssse3_import,
243	.descsize	=	sizeof(struct sha256_state),
244	.statesize	=	sizeof(struct sha256_state),
245	.base		=	{
246		.cra_name	=	"sha224",
247		.cra_driver_name =	"sha224-ssse3",
248		.cra_priority	=	150,
249		.cra_flags	=	CRYPTO_ALG_TYPE_SHASH,
250		.cra_blocksize	=	SHA224_BLOCK_SIZE,
251		.cra_module	=	THIS_MODULE,
252	}
253} };
254
255#ifdef CONFIG_AS_AVX
256static bool __init avx_usable(void)
257{
258	u64 xcr0;
 
 
 
 
259
260	if (!cpu_has_avx || !cpu_has_osxsave)
261		return false;
262
263	xcr0 = xgetbv(XCR_XFEATURE_ENABLED_MASK);
264	if ((xcr0 & (XSTATE_SSE | XSTATE_YMM)) != (XSTATE_SSE | XSTATE_YMM)) {
265		pr_info("AVX detected but unusable.\n");
266
267		return false;
268	}
269
270	return true;
271}
272#endif
273
274static int __init sha256_ssse3_mod_init(void)
275{
276	/* test for SSSE3 first */
277	if (cpu_has_ssse3)
278		sha256_transform_asm = sha256_transform_ssse3;
279
280#ifdef CONFIG_AS_AVX
281	/* allow AVX to override SSSE3, it's a little faster */
282	if (avx_usable()) {
283#ifdef CONFIG_AS_AVX2
284		if (boot_cpu_has(X86_FEATURE_AVX2) && boot_cpu_has(X86_FEATURE_BMI2))
285			sha256_transform_asm = sha256_transform_rorx;
286		else
287#endif
288			sha256_transform_asm = sha256_transform_avx;
 
 
289	}
290#endif
291
292	if (sha256_transform_asm) {
293#ifdef CONFIG_AS_AVX
294		if (sha256_transform_asm == sha256_transform_avx)
295			pr_info("Using AVX optimized SHA-256 implementation\n");
296#ifdef CONFIG_AS_AVX2
297		else if (sha256_transform_asm == sha256_transform_rorx)
298			pr_info("Using AVX2 optimized SHA-256 implementation\n");
299#endif
300		else
301#endif
302			pr_info("Using SSSE3 optimized SHA-256 implementation\n");
303		return crypto_register_shashes(algs, ARRAY_SIZE(algs));
304	}
305	pr_info("Neither AVX nor SSSE3 is available/usable.\n");
306
 
 
307	return -ENODEV;
308}
309
310static void __exit sha256_ssse3_mod_fini(void)
311{
312	crypto_unregister_shashes(algs, ARRAY_SIZE(algs));
 
 
 
313}
314
315module_init(sha256_ssse3_mod_init);
316module_exit(sha256_ssse3_mod_fini);
317
318MODULE_LICENSE("GPL");
319MODULE_DESCRIPTION("SHA256 Secure Hash Algorithm, Supplemental SSE3 accelerated");
320
321MODULE_ALIAS("sha256");
322MODULE_ALIAS("sha224");