diff options
author | Eric Biggers <ebiggers@google.com> | 2018-09-11 23:05:10 -0400 |
---|---|---|
committer | Herbert Xu <herbert@gondor.apana.org.au> | 2018-09-21 01:24:50 -0400 |
commit | a5e9f557098e54af44ade5d501379be18435bfbf (patch) | |
tree | 4410647aaa269fd9a4e304851b06f83251b12853 /crypto/chacha20_generic.c | |
parent | 78105c7e769b8cfa4a4d59027807882b560a2634 (diff) |
crypto: chacha20 - Fix chacha20_block() keystream alignment (again)
In commit 9f480faec58c ("crypto: chacha20 - Fix keystream alignment for
chacha20_block()"), I had missed that chacha20_block() can be called
directly on the buffer passed to get_random_bytes(), which can have any
alignment. So, while my commit didn't break anything, it didn't fully
solve the alignment problems.
Revert my solution and just update chacha20_block() to use
put_unaligned_le32(), so the output buffer need not be aligned.
This is simpler, and on many CPUs it's the same speed.
But, I kept the 'tmp' buffers in extract_crng_user() and
_get_random_bytes() 4-byte aligned, since that alignment is actually
needed for _crng_backtrack_protect() too.
Reported-by: Stephan Müller <smueller@chronox.de>
Cc: Theodore Ts'o <tytso@mit.edu>
Signed-off-by: Eric Biggers <ebiggers@google.com>
Signed-off-by: Herbert Xu <herbert@gondor.apana.org.au>
Diffstat (limited to 'crypto/chacha20_generic.c')
-rw-r--r-- | crypto/chacha20_generic.c | 7 |
1 file changed, 4 insertions, 3 deletions
diff --git a/crypto/chacha20_generic.c b/crypto/chacha20_generic.c index e451c3cb6a56..3ae96587caf9 100644 --- a/crypto/chacha20_generic.c +++ b/crypto/chacha20_generic.c | |||
@@ -18,20 +18,21 @@ | |||
18 | static void chacha20_docrypt(u32 *state, u8 *dst, const u8 *src, | 18 | static void chacha20_docrypt(u32 *state, u8 *dst, const u8 *src, |
19 | unsigned int bytes) | 19 | unsigned int bytes) |
20 | { | 20 | { |
21 | u32 stream[CHACHA20_BLOCK_WORDS]; | 21 | /* aligned to potentially speed up crypto_xor() */ |
| | | 22 | u8 stream[CHACHA20_BLOCK_SIZE] __aligned(sizeof(long)); |
22 | 23 | ||
23 | if (dst != src) | 24 | if (dst != src) |
24 | memcpy(dst, src, bytes); | 25 | memcpy(dst, src, bytes); |
25 | 26 | ||
26 | while (bytes >= CHACHA20_BLOCK_SIZE) { | 27 | while (bytes >= CHACHA20_BLOCK_SIZE) { |
27 | chacha20_block(state, stream); | 28 | chacha20_block(state, stream); |
28 | crypto_xor(dst, (const u8 *)stream, CHACHA20_BLOCK_SIZE); | 29 | crypto_xor(dst, stream, CHACHA20_BLOCK_SIZE); |
29 | bytes -= CHACHA20_BLOCK_SIZE; | 30 | bytes -= CHACHA20_BLOCK_SIZE; |
30 | dst += CHACHA20_BLOCK_SIZE; | 31 | dst += CHACHA20_BLOCK_SIZE; |
31 | } | 32 | } |
32 | if (bytes) { | 33 | if (bytes) { |
33 | chacha20_block(state, stream); | 34 | chacha20_block(state, stream); |
34 | crypto_xor(dst, (const u8 *)stream, bytes); | 35 | crypto_xor(dst, stream, bytes); |
35 | } | 36 | } |
36 | } | 37 | } |
37 | 38 | ||