aboutsummaryrefslogtreecommitdiffstats
path: root/libblake_blake2s_force_update.c
blob: 716f70f9c85da0003854740093399b8ac9020a9f (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
/* See LICENSE file for copyright and license details. */
#include "common.h"

/*
 * Feed every complete 64-byte chunk of the input to the BLAKE2s
 * compression function, updating the counter words in `state->t`
 * before each call.
 *
 * `state->t[0]` is advanced by 64 (kept within 32 bits) for each chunk,
 * and whenever that addition wraps around, `state->t[1]` is incremented
 * (also kept within 32 bits).
 *
 * @param   state  Hashing state whose `t` words are updated and which is
 *                 passed on to `libblake_internal_blake2s_compress`
 * @param   data_  Input bytes
 * @param   len    Number of bytes available at `data_`
 * @return         Number of bytes consumed: the largest multiple of 64
 *                 that is not greater than `len`; any trailing bytes
 *                 are left unprocessed
 */
size_t
libblake_blake2s_force_update(struct libblake_blake2s_state *state, const void *data_, size_t len)
{
	const unsigned char *bytes = data_;
	size_t consumed = 0;

	/* `consumed` never exceeds `len`, so the subtraction cannot wrap */
	while (len - consumed >= 64) {
		/* The following optimisations have been tested:
		 *
		 * 1)
		 *     `*(uint64_t *)state->t += 64;`
		 *     result: slower
		 *
		 * 2)
		 *     using `__builtin_add_overflow`
		 *     result: no difference
		 *
		 * These tests were performed on amd64 with a compile-time
		 * assumption that `UINT_LEAST32_C(0xFFFFffff) + 1 == 0`,
		 * which the compiler accepted, and those included the
		 * attempted optimisations.
		 *
		 * UNLIKELY does not seem to make any difference, but it
		 * does change the output, theoretically for the better.
		 */
		state->t[0] = (state->t[0] + 64) & UINT_LEAST32_C(0xFFFFffff);
		/* A result below 64 means the low word wrapped: carry into the high word */
		if (UNLIKELY(state->t[0] < 64))
			state->t[1] = (state->t[1] + 1) & UINT_LEAST32_C(0xFFFFffff);

		libblake_internal_blake2s_compress(state, bytes + consumed);
		consumed += 64;
	}

	return consumed;
}