diff options
author | Mattias Andrée <maandree@kth.se> | 2022-01-19 20:28:55 +0100 |
---|---|---|
committer | Mattias Andrée <maandree@kth.se> | 2022-01-19 20:28:55 +0100 |
commit | 5d77a0178349ecac6536e0374cf689500efa22bc (patch) | |
tree | f6fcb38cd39e8f4240537233a08fdbb5c0284798 /libblake_internal_blake2xb_init0.c | |
parent | Improve portability (diff) | |
download | libblake-5d77a0178349ecac6536e0374cf689500efa22bc.tar.gz libblake-5d77a0178349ecac6536e0374cf689500efa22bc.tar.bz2 libblake-5d77a0178349ecac6536e0374cf689500efa22bc.tar.xz |
Optimisation for amd64
Increased major number as the ABI was broken
by insertion of padding into the BLAKE2
parameter structures (except for BLAKE2Xs)
Signed-off-by: Mattias Andrée <maandree@kth.se>
Diffstat (limited to 'libblake_internal_blake2xb_init0.c')
-rw-r--r-- | libblake_internal_blake2xb_init0.c | 112 |
1 files changed, 71 insertions, 41 deletions
diff --git a/libblake_internal_blake2xb_init0.c b/libblake_internal_blake2xb_init0.c index d6063dc..c045cec 100644 --- a/libblake_internal_blake2xb_init0.c +++ b/libblake_internal_blake2xb_init0.c @@ -1,6 +1,25 @@ /* See LICENSE file for copyright and license details. */ #include "common.h" +#if defined(LITTLE_ENDIAN) +# define le64(X) X +#else +static uint_least64_t +le64(uint_least64_t h) +{ + unsigned char r[8]; + r[0] = (unsigned char)((h >> 0) & 255); + r[1] = (unsigned char)((h >> 8) & 255); + r[2] = (unsigned char)((h >> 16) & 255); + r[3] = (unsigned char)((h >> 24) & 255); + r[4] = (unsigned char)((h >> 32) & 255); + r[5] = (unsigned char)((h >> 40) & 255); + r[6] = (unsigned char)((h >> 48) & 255); + r[7] = (unsigned char)((h >> 56) & 255); + return *(uint_least64_t *)r; +} +#endif + void libblake_internal_blake2xb_init0(struct libblake_blake2xb_state *state, const struct libblake_blake2xb_params *params) { @@ -18,45 +37,56 @@ libblake_internal_blake2xb_init0(struct libblake_blake2xb_state *state, const st state->b2b.f[0] = 0; state->b2b.f[1] = 0; - state->b2b.h[0] ^= ((uint_least64_t)params->digest_len & 255) << 0; - state->b2b.h[0] ^= ((uint_least64_t)params->key_len & 255) << 8; - state->b2b.h[0] ^= ((uint_least64_t)params->fanout & 255) << 16; - state->b2b.h[0] ^= ((uint_least64_t)params->depth & 255) << 24; - state->b2b.h[0] ^= (uint_least64_t)(params->leaf_len & UINT_LEAST32_C(0xFFFFffff)) << 32; - state->b2b.h[1] ^= (uint_least64_t)(params->node_offset & UINT_LEAST32_C(0xFFFFffff)) << 0; - state->b2b.h[1] ^= (uint_least64_t)(params->xof_len & UINT_LEAST32_C(0xFFFFffff)) << 32; - state->b2b.h[2] ^= ((uint_least64_t)params->node_depth & 255) << 0; - state->b2b.h[2] ^= ((uint_least64_t)params->inner_len & 255) << 8; - state->b2b.h[4] ^= ((uint_least64_t)params->salt[0] & 255) << 0; - state->b2b.h[4] ^= ((uint_least64_t)params->salt[1] & 255) << 8; - state->b2b.h[4] ^= ((uint_least64_t)params->salt[2] & 255) << 16; - state->b2b.h[4] ^= 
((uint_least64_t)params->salt[3] & 255) << 24; - state->b2b.h[4] ^= ((uint_least64_t)params->salt[4] & 255) << 32; - state->b2b.h[4] ^= ((uint_least64_t)params->salt[5] & 255) << 40; - state->b2b.h[4] ^= ((uint_least64_t)params->salt[6] & 255) << 48; - state->b2b.h[4] ^= ((uint_least64_t)params->salt[7] & 255) << 56; - state->b2b.h[5] ^= ((uint_least64_t)params->salt[8] & 255) << 0; - state->b2b.h[5] ^= ((uint_least64_t)params->salt[9] & 255) << 8; - state->b2b.h[5] ^= ((uint_least64_t)params->salt[A] & 255) << 16; - state->b2b.h[5] ^= ((uint_least64_t)params->salt[B] & 255) << 24; - state->b2b.h[5] ^= ((uint_least64_t)params->salt[C] & 255) << 32; - state->b2b.h[5] ^= ((uint_least64_t)params->salt[D] & 255) << 40; - state->b2b.h[5] ^= ((uint_least64_t)params->salt[E] & 255) << 48; - state->b2b.h[5] ^= ((uint_least64_t)params->salt[F] & 255) << 56; - state->b2b.h[6] ^= ((uint_least64_t)params->pepper[0] & 255) << 0; - state->b2b.h[6] ^= ((uint_least64_t)params->pepper[1] & 255) << 8; - state->b2b.h[6] ^= ((uint_least64_t)params->pepper[2] & 255) << 16; - state->b2b.h[6] ^= ((uint_least64_t)params->pepper[3] & 255) << 24; - state->b2b.h[6] ^= ((uint_least64_t)params->pepper[4] & 255) << 32; - state->b2b.h[6] ^= ((uint_least64_t)params->pepper[5] & 255) << 40; - state->b2b.h[6] ^= ((uint_least64_t)params->pepper[6] & 255) << 48; - state->b2b.h[6] ^= ((uint_least64_t)params->pepper[7] & 255) << 56; - state->b2b.h[7] ^= ((uint_least64_t)params->pepper[8] & 255) << 0; - state->b2b.h[7] ^= ((uint_least64_t)params->pepper[9] & 255) << 8; - state->b2b.h[7] ^= ((uint_least64_t)params->pepper[A] & 255) << 16; - state->b2b.h[7] ^= ((uint_least64_t)params->pepper[B] & 255) << 24; - state->b2b.h[7] ^= ((uint_least64_t)params->pepper[C] & 255) << 32; - state->b2b.h[7] ^= ((uint_least64_t)params->pepper[D] & 255) << 40; - state->b2b.h[7] ^= ((uint_least64_t)params->pepper[E] & 255) << 48; - state->b2b.h[7] ^= ((uint_least64_t)params->pepper[F] & 255) << 56; + if (offsetof(struct 
libblake_blake2xb_params, inner_len) == 17) { + state->b2b.h[0] ^= le64(((uint_least64_t *)params)[0]); + state->b2b.h[1] ^= le64(((uint_least64_t *)params)[1]); + state->b2b.h[2] ^= le64(((uint_least64_t)params->node_depth << 0) | + ((uint_least64_t)params->inner_len << 8)); + state->b2b.h[4] ^= le64(*(uint_least64_t *)&params->salt[0]); + state->b2b.h[5] ^= le64(*(uint_least64_t *)&params->salt[8]); + state->b2b.h[6] ^= le64(*(uint_least64_t *)&params->pepper[0]); + state->b2b.h[7] ^= le64(*(uint_least64_t *)&params->pepper[8]); + } else { + state->b2b.h[0] ^= ((uint_least64_t)params->digest_len & 255) << 0; + state->b2b.h[0] ^= ((uint_least64_t)params->key_len & 255) << 8; + state->b2b.h[0] ^= ((uint_least64_t)params->fanout & 255) << 16; + state->b2b.h[0] ^= ((uint_least64_t)params->depth & 255) << 24; + state->b2b.h[0] ^= (uint_least64_t)(params->leaf_len & UINT_LEAST32_C(0xFFFFffff)) << 32; + state->b2b.h[1] ^= (uint_least64_t)(params->node_offset & UINT_LEAST32_C(0xFFFFffff)) << 0; + state->b2b.h[1] ^= (uint_least64_t)(params->xof_len & UINT_LEAST32_C(0xFFFFffff)) << 32; + state->b2b.h[2] ^= ((uint_least64_t)params->node_depth & 255) << 0; + state->b2b.h[2] ^= ((uint_least64_t)params->inner_len & 255) << 8; + state->b2b.h[4] ^= ((uint_least64_t)params->salt[0] & 255) << 0; + state->b2b.h[4] ^= ((uint_least64_t)params->salt[1] & 255) << 8; + state->b2b.h[4] ^= ((uint_least64_t)params->salt[2] & 255) << 16; + state->b2b.h[4] ^= ((uint_least64_t)params->salt[3] & 255) << 24; + state->b2b.h[4] ^= ((uint_least64_t)params->salt[4] & 255) << 32; + state->b2b.h[4] ^= ((uint_least64_t)params->salt[5] & 255) << 40; + state->b2b.h[4] ^= ((uint_least64_t)params->salt[6] & 255) << 48; + state->b2b.h[4] ^= ((uint_least64_t)params->salt[7] & 255) << 56; + state->b2b.h[5] ^= ((uint_least64_t)params->salt[8] & 255) << 0; + state->b2b.h[5] ^= ((uint_least64_t)params->salt[9] & 255) << 8; + state->b2b.h[5] ^= ((uint_least64_t)params->salt[A] & 255) << 16; + state->b2b.h[5] ^= 
((uint_least64_t)params->salt[B] & 255) << 24; + state->b2b.h[5] ^= ((uint_least64_t)params->salt[C] & 255) << 32; + state->b2b.h[5] ^= ((uint_least64_t)params->salt[D] & 255) << 40; + state->b2b.h[5] ^= ((uint_least64_t)params->salt[E] & 255) << 48; + state->b2b.h[5] ^= ((uint_least64_t)params->salt[F] & 255) << 56; + state->b2b.h[6] ^= ((uint_least64_t)params->pepper[0] & 255) << 0; + state->b2b.h[6] ^= ((uint_least64_t)params->pepper[1] & 255) << 8; + state->b2b.h[6] ^= ((uint_least64_t)params->pepper[2] & 255) << 16; + state->b2b.h[6] ^= ((uint_least64_t)params->pepper[3] & 255) << 24; + state->b2b.h[6] ^= ((uint_least64_t)params->pepper[4] & 255) << 32; + state->b2b.h[6] ^= ((uint_least64_t)params->pepper[5] & 255) << 40; + state->b2b.h[6] ^= ((uint_least64_t)params->pepper[6] & 255) << 48; + state->b2b.h[6] ^= ((uint_least64_t)params->pepper[7] & 255) << 56; + state->b2b.h[7] ^= ((uint_least64_t)params->pepper[8] & 255) << 0; + state->b2b.h[7] ^= ((uint_least64_t)params->pepper[9] & 255) << 8; + state->b2b.h[7] ^= ((uint_least64_t)params->pepper[A] & 255) << 16; + state->b2b.h[7] ^= ((uint_least64_t)params->pepper[B] & 255) << 24; + state->b2b.h[7] ^= ((uint_least64_t)params->pepper[C] & 255) << 32; + state->b2b.h[7] ^= ((uint_least64_t)params->pepper[D] & 255) << 40; + state->b2b.h[7] ^= ((uint_least64_t)params->pepper[E] & 255) << 48; + state->b2b.h[7] ^= ((uint_least64_t)params->pepper[F] & 255) << 56; + } } |