Commit 8a1955f9 authored by Peter Lafreniere's avatar Peter Lafreniere Committed by Herbert Xu

crypto: x86 - exit fpu context earlier in ECB/CBC macros

Currently the ecb/cbc macros hold fpu context unnecessarily when using
scalar cipher routines (e.g. when handling odd sizes of blocks per walk).

Change the macros to drop fpu context as soon as the fpu is out of use.

No performance impact found (on Intel Haswell).
Signed-off-by: default avatarPeter Lafreniere <peter@n8pjl.ca>
Acked-by: default avatarArd Biesheuvel <ardb@kernel.org>
Signed-off-by: default avatarHerbert Xu <herbert@gondor.apana.org.au>
parent 42a9a08b
...@@ -13,13 +13,14 @@ ...@@ -13,13 +13,14 @@
#define ECB_WALK_START(req, bsize, fpu_blocks) do { \ #define ECB_WALK_START(req, bsize, fpu_blocks) do { \
void *ctx = crypto_skcipher_ctx(crypto_skcipher_reqtfm(req)); \ void *ctx = crypto_skcipher_ctx(crypto_skcipher_reqtfm(req)); \
const int __fpu_blocks = (fpu_blocks); \
const int __bsize = (bsize); \ const int __bsize = (bsize); \
struct skcipher_walk walk; \ struct skcipher_walk walk; \
int err = skcipher_walk_virt(&walk, (req), false); \ int err = skcipher_walk_virt(&walk, (req), false); \
while (walk.nbytes > 0) { \ while (walk.nbytes > 0) { \
unsigned int nbytes = walk.nbytes; \ unsigned int nbytes = walk.nbytes; \
bool do_fpu = (fpu_blocks) != -1 && \ bool do_fpu = __fpu_blocks != -1 && \
nbytes >= (fpu_blocks) * __bsize; \ nbytes >= __fpu_blocks * __bsize; \
const u8 *src = walk.src.virt.addr; \ const u8 *src = walk.src.virt.addr; \
u8 *dst = walk.dst.virt.addr; \ u8 *dst = walk.dst.virt.addr; \
u8 __maybe_unused buf[(bsize)]; \ u8 __maybe_unused buf[(bsize)]; \
...@@ -35,7 +36,12 @@ ...@@ -35,7 +36,12 @@
} while (0) } while (0)
#define ECB_BLOCK(blocks, func) do { \ #define ECB_BLOCK(blocks, func) do { \
while (nbytes >= (blocks) * __bsize) { \ const int __blocks = (blocks); \
if (do_fpu && __blocks < __fpu_blocks) { \
kernel_fpu_end(); \
do_fpu = false; \
} \
while (nbytes >= __blocks * __bsize) { \
(func)(ctx, dst, src); \ (func)(ctx, dst, src); \
ECB_WALK_ADVANCE(blocks); \ ECB_WALK_ADVANCE(blocks); \
} \ } \
...@@ -53,7 +59,12 @@ ...@@ -53,7 +59,12 @@
} while (0) } while (0)
#define CBC_DEC_BLOCK(blocks, func) do { \ #define CBC_DEC_BLOCK(blocks, func) do { \
while (nbytes >= (blocks) * __bsize) { \ const int __blocks = (blocks); \
if (do_fpu && __blocks < __fpu_blocks) { \
kernel_fpu_end(); \
do_fpu = false; \
} \
while (nbytes >= __blocks * __bsize) { \
const u8 *__iv = src + ((blocks) - 1) * __bsize; \ const u8 *__iv = src + ((blocks) - 1) * __bsize; \
if (dst == src) \ if (dst == src) \
__iv = memcpy(buf, __iv, __bsize); \ __iv = memcpy(buf, __iv, __bsize); \
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment