-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathxxh3-64b-ref.c
642 lines (564 loc) · 26.4 KB
/
xxh3-64b-ref.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
/*
* xxHash - Extremely Fast Hash algorithm
* Copyright (C) 2019-2020 Yann Collet
* Copyright (C) 2019-2020 Devin Hussey (easyaspi314)
*
* BSD 2-Clause License (https://www.opensource.org/licenses/bsd-license.php)
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are
* met:
*
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above
* copyright notice, this list of conditions and the following disclaimer
* in the documentation and/or other materials provided with the
* distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
* You can contact the author at:
* - xxHash homepage: https://www.xxhash.com
* - xxHash source repository: https://github.com/Cyan4973/xxHash
*/
/* A compact, 100% standalone reference XXH3_64bits implementation that focuses on clarity.
* correctness, and portability, instead of dirty speed hacks.
*
* This file aims to be 100% compatible with C90 and C++ with the additional requirement of
* stdint.h and long long.
*
* There is no self test at the moment as the official test values have not been updated
* for the new algorithm. */
#include <stddef.h> /* size_t */
#include <stdint.h> /* uint8_t, uint32_t, uint64_t */
#include <string.h> /* memcpy */
typedef uint64_t XXH64_hash_t;
#ifdef __cplusplus
extern "C" {
#endif
#define XXH3_SECRET_SIZE_MIN 136
XXH64_hash_t XXH3_64bits(void const *const input, size_t const length);
XXH64_hash_t XXH3_64bits_withSeed(void const *const input, size_t const length, XXH64_hash_t const seed);
XXH64_hash_t XXH3_64bits_withSecret(void const *const input, size_t const length, void const *const secret, size_t secret_size);
#ifdef __cplusplus
}
#endif
static uint32_t const PRIME32_1 = 0x9E3779B1U; /* 0b10011110001101110111100110110001 */
static uint32_t const PRIME32_2 = 0x85EBCA77U; /* 0b10000101111010111100101001110111 */
static uint32_t const PRIME32_3 = 0xC2B2AE3DU; /* 0b11000010101100101010111000111101 */
static uint64_t const PRIME64_1 = 0x9E3779B185EBCA87ULL; /* 0b1001111000110111011110011011000110000101111010111100101010000111 */
static uint64_t const PRIME64_2 = 0xC2B2AE3D27D4EB4FULL; /* 0b1100001010110010101011100011110100100111110101001110101101001111 */
static uint64_t const PRIME64_3 = 0x165667B19E3779F9ULL; /* 0b0001011001010110011001111011000110011110001101110111100111111001 */
static uint64_t const PRIME64_4 = 0x85EBCA77C2B2AE63ULL; /* 0b1000010111101011110010100111011111000010101100101010111001100011 */
static uint64_t const PRIME64_5 = 0x27D4EB2F165667C5ULL; /* 0b0010011111010100111010110010111100010110010101100110011111000101 */
/* Portably reads a 32-bit little endian integer from p. */
static uint32_t XXH_read32(uint8_t const *const p)
{
#if defined(_WIN32) || (defined(__BYTE_ORDER__) && __BYTE_ORDER__==__ORDER_LITTLE_ENDIAN__)
uint32_t ret;
memcpy(&ret, p, sizeof(uint32_t));
return ret;
#else
return (uint32_t)p[0]
| ((uint32_t)p[1] << 8)
| ((uint32_t)p[2] << 16)
| ((uint32_t)p[3] << 24);
#endif
}
/* Portably reads a 64-bit little endian integer from p. */
static uint64_t XXH_read64(uint8_t const *const p)
{
#if defined(_WIN32) || (defined(__BYTE_ORDER__) && __BYTE_ORDER__==__ORDER_LITTLE_ENDIAN__)
uint64_t ret;
memcpy(&ret, p, sizeof(uint64_t));
return ret;
#else
return (uint64_t)p[0]
| ((uint64_t)p[1] << 8)
| ((uint64_t)p[2] << 16)
| ((uint64_t)p[3] << 24)
| ((uint64_t)p[4] << 32)
| ((uint64_t)p[5] << 40)
| ((uint64_t)p[6] << 48)
| ((uint64_t)p[7] << 56);
#endif
}
/* Portably writes a 64-bit little endian integer to p. */
static void XXH_write64(uint8_t *const p, uint64_t val)
{
#if defined(_WIN32) || (defined(__BYTE_ORDER__) && __BYTE_ORDER__==__ORDER_LITTLE_ENDIAN__)
memcpy(p, &val, sizeof(uint64_t));
#else
p[0] = (uint8_t)(val >> 0);
p[1] = (uint8_t)(val >> 8);
p[2] = (uint8_t)(val >> 16);
p[3] = (uint8_t)(val >> 24);
p[4] = (uint8_t)(val >> 32);
p[5] = (uint8_t)(val >> 40);
p[6] = (uint8_t)(val >> 48);
p[7] = (uint8_t)(val >> 56);
#endif
}
/* 32-bit byteswap */
static uint32_t XXH_swap32(uint32_t const x)
{
return ((x << 24) & 0xff000000)
| ((x << 8) & 0x00ff0000)
| ((x >> 8) & 0x0000ff00)
| ((x >> 24) & 0x000000ff);
}
/* 32-bit byteswap */
static uint64_t XXH_swap64(uint64_t const x)
{
return ((x << 56) & 0xff00000000000000ULL)
| ((x << 40) & 0x00ff000000000000ULL)
| ((x << 24) & 0x0000ff0000000000ULL)
| ((x << 8) & 0x000000ff00000000ULL)
| ((x >> 8) & 0x00000000ff000000ULL)
| ((x >> 24) & 0x0000000000ff0000ULL)
| ((x >> 40) & 0x000000000000ff00ULL)
| ((x >> 56) & 0x00000000000000ffULL);
}
/* 64-bit rotate left */
static uint64_t XXH_rotl64(uint64_t const val, unsigned const amt)
{
return (val << (amt % 64)) | (val >> (64 - amt % 64));
}
#define XXH_SECRET_DEFAULT_SIZE 192 /* minimum XXH3_SECRET_SIZE_MIN */
/* Pseudorandom data taken directly from FARSH */
static uint8_t const kSecret[XXH_SECRET_DEFAULT_SIZE] = {
0xb8, 0xfe, 0x6c, 0x39, 0x23, 0xa4, 0x4b, 0xbe, 0x7c, 0x01, 0x81, 0x2c, 0xf7, 0x21, 0xad, 0x1c,
0xde, 0xd4, 0x6d, 0xe9, 0x83, 0x90, 0x97, 0xdb, 0x72, 0x40, 0xa4, 0xa4, 0xb7, 0xb3, 0x67, 0x1f,
0xcb, 0x79, 0xe6, 0x4e, 0xcc, 0xc0, 0xe5, 0x78, 0x82, 0x5a, 0xd0, 0x7d, 0xcc, 0xff, 0x72, 0x21,
0xb8, 0x08, 0x46, 0x74, 0xf7, 0x43, 0x24, 0x8e, 0xe0, 0x35, 0x90, 0xe6, 0x81, 0x3a, 0x26, 0x4c,
0x3c, 0x28, 0x52, 0xbb, 0x91, 0xc3, 0x00, 0xcb, 0x88, 0xd0, 0x65, 0x8b, 0x1b, 0x53, 0x2e, 0xa3,
0x71, 0x64, 0x48, 0x97, 0xa2, 0x0d, 0xf9, 0x4e, 0x38, 0x19, 0xef, 0x46, 0xa9, 0xde, 0xac, 0xd8,
0xa8, 0xfa, 0x76, 0x3f, 0xe3, 0x9c, 0x34, 0x3f, 0xf9, 0xdc, 0xbb, 0xc7, 0xc7, 0x0b, 0x4f, 0x1d,
0x8a, 0x51, 0xe0, 0x4b, 0xcd, 0xb4, 0x59, 0x31, 0xc8, 0x9f, 0x7e, 0xc9, 0xd9, 0x78, 0x73, 0x64,
0xea, 0xc5, 0xac, 0x83, 0x34, 0xd3, 0xeb, 0xc3, 0xc5, 0x81, 0xa0, 0xff, 0xfa, 0x13, 0x63, 0xeb,
0x17, 0x0d, 0xdd, 0x51, 0xb7, 0xf0, 0xda, 0x49, 0xd3, 0x16, 0x55, 0x26, 0x29, 0xd4, 0x68, 0x9e,
0x2b, 0x16, 0xbe, 0x58, 0x7d, 0x47, 0xa1, 0xfc, 0x8f, 0xf8, 0xb8, 0xd1, 0x7a, 0xd0, 0x31, 0xce,
0x45, 0xcb, 0x3a, 0x8f, 0x95, 0x16, 0x04, 0x28, 0xaf, 0xd7, 0xfb, 0xca, 0xbb, 0x4b, 0x40, 0x7e,
};
/* Calculates a 64-bit to 128-bit unsigned multiply, then xor's the low bits of the product with
* the high bits for a 64-bit result. */
static uint64_t XXH3_mul128_fold64(uint64_t const lhs, uint64_t const rhs)
{
#if defined(__SIZEOF_INT128__) || (defined(_INTEGRAL_MAX_BITS) && _INTEGRAL_MAX_BITS >= 128)
__uint128_t product = (__uint128_t) lhs * (__uint128_t) rhs;
return (uint64_t) (product & 0xFFFFFFFFFFFFFFFFULL) ^ (uint64_t) (product >> 64);
/* There are other platform-specific versions in the official repo.
* They would all be left out in favor of the code above, but it is not
* portable, so we keep the generic version. */
#else /* Portable scalar version */
/* First calculate all of the cross products. */
uint64_t const lo_lo = (lhs & 0xFFFFFFFF) * (rhs & 0xFFFFFFFF);
uint64_t const hi_lo = (lhs >> 32) * (rhs & 0xFFFFFFFF);
uint64_t const lo_hi = (lhs & 0xFFFFFFFF) * (rhs >> 32);
uint64_t const hi_hi = (lhs >> 32) * (rhs >> 32);
/* Now add the products together. These will never overflow. */
uint64_t const cross = (lo_lo >> 32) + (hi_lo & 0xFFFFFFFF) + lo_hi;
uint64_t const upper = (hi_lo >> 32) + (cross >> 32) + hi_hi;
uint64_t const lower = (cross << 32) | (lo_lo & 0xFFFFFFFF);
return upper ^ lower;
#endif
}
#define STRIPE_LEN 64
#define XXH_SECRET_CONSUME_RATE 8 /* nb of secret bytes consumed at each accumulation */
#define ACC_NB (STRIPE_LEN / sizeof(uint64_t))
/* Mixes up the hash to finalize */
static XXH64_hash_t XXH3_avalanche(uint64_t hash)
{
hash ^= hash >> 37;
hash *= 0x165667919E3779F9ULL;
hash ^= hash >> 32;
return hash;
}
/* ==========================================
* Short keys
* ========================================== */
/* Hashes zero-length keys */
static XXH64_hash_t XXH3_len_0_64b(uint8_t const *const secret, XXH64_hash_t const seed)
{
uint64_t acc = seed;
acc += PRIME64_1;
acc ^= XXH_read64(secret + 56);
acc ^= XXH_read64(secret + 64);
return XXH3_avalanche(acc);
}
/* Hashes short keys from 1 to 3 bytes. */
static XXH64_hash_t XXH3_len_1to3_64b(uint8_t const *const input,
size_t const length,
uint8_t const *const secret,
XXH64_hash_t const seed)
{
uint8_t const byte1 = input[0];
uint8_t const byte2 = (length > 1) ? input[1] : input[0];
uint8_t const byte3 = input[length - 1];
uint32_t const combined = ((uint32_t)byte1 << 16)
| ((uint32_t)byte2 << 24)
| ((uint32_t)byte3 << 0)
| ((uint32_t)length << 8);
uint64_t acc = (uint64_t)(XXH_read32(secret) ^ XXH_read32(secret + 4));
acc += seed;
acc ^= (uint64_t)combined;
acc *= PRIME64_1;
return XXH3_avalanche(acc);
}
/* Hashes short keys from 4 to 8 bytes. */
static XXH64_hash_t XXH3_len_4to8_64b(uint8_t const *const input,
size_t const length,
uint8_t const *const secret,
XXH64_hash_t seed)
{
uint32_t const input_hi = XXH_read32(input);
uint32_t const input_lo = XXH_read32(input + length - 4);
uint64_t const input_64 = (uint64_t)input_lo | ((uint64_t)input_hi << 32);
uint64_t acc = XXH_read64(secret + 8) ^ XXH_read64(secret + 16);
seed ^= (uint64_t)XXH_swap32(seed & 0xFFFFFFFF) << 32;
acc -= seed;
acc ^= input_64;
/* rrmxmx mix, skips XXH3_avalanche */
acc ^= XXH_rotl64(acc, 49) ^ XXH_rotl64(acc, 24);
acc *= 0x9FB21C651E98DF25ULL;
acc ^= (acc >> 35) + (uint64_t)length;
acc *= 0x9FB21C651E98DF25ULL;
acc ^= (acc >> 28);
return acc;
}
/* Hashes short keys from 9 to 16 bytes. */
static XXH64_hash_t XXH3_len_9to16_64b(uint8_t const *const input,
size_t const length,
uint8_t const *const secret,
XXH64_hash_t const seed)
{
uint64_t input_lo = XXH_read64(secret+24) ^ XXH_read64(secret+32);
uint64_t input_hi = XXH_read64(secret+40) ^ XXH_read64(secret+48);
uint64_t acc = (uint64_t)length;
input_lo += seed;
input_hi -= seed;
input_lo ^= XXH_read64(input);
input_hi ^= XXH_read64(input + length - 8);
acc += XXH_swap64(input_lo);
acc += input_hi;
acc += XXH3_mul128_fold64(input_lo, input_hi);
return XXH3_avalanche(acc);
}
/* Hashes short keys that are less than or equal to 16 bytes. */
static XXH64_hash_t XXH3_len_0to16_64b(uint8_t const *const input,
size_t const length,
uint8_t const *const secret,
XXH64_hash_t const seed)
{
if (length > 8)
return XXH3_len_9to16_64b(input, length, secret, seed);
else if (length >= 4)
return XXH3_len_4to8_64b(input, length, secret, seed);
else if (length != 0)
return XXH3_len_1to3_64b(input, length, secret, seed);
return XXH3_len_0_64b(secret, seed);
}
/* The primary mixer for the midsize hashes */
static uint64_t XXH3_mix16B(uint8_t const *const input,
uint8_t const *const secret,
XXH64_hash_t seed)
{
uint64_t lhs = seed;
uint64_t rhs = 0U - seed;
lhs += XXH_read64(secret);
rhs += XXH_read64(secret + 8);
lhs ^= XXH_read64(input);
rhs ^= XXH_read64(input + 8);
return XXH3_mul128_fold64(lhs, rhs);
}
/* Hashes midsize keys from 17 to 128 bytes */
static XXH64_hash_t XXH3_len_17to128_64b(uint8_t const *const input,
size_t const length,
uint8_t const *const secret,
XXH64_hash_t const seed)
{
int i = (int)((length - 1) / 32);
uint64_t acc = length * PRIME64_1;
for (; i >= 0; i--) {
acc += XXH3_mix16B(input + (16 * i), secret + (32 * i), seed);
acc += XXH3_mix16B(input + length - (16 * (i + 1)), secret + (32 * i) + 16, seed);
}
return XXH3_avalanche(acc);
}
#define XXH3_MIDSIZE_MAX 240
/* Hashes midsize keys from 129 to 240 bytes */
static XXH64_hash_t XXH3_len_129to240_64b(uint8_t const *const input,
size_t const length,
uint8_t const *const secret,
XXH64_hash_t const seed)
{
#define XXH3_MIDSIZE_STARTOFFSET 3
#define XXH3_MIDSIZE_LASTOFFSET 17
uint64_t acc = (uint64_t)length * PRIME64_1;
int const nbRounds = (int)length / 16;
int i;
for (i = 0; i < 8; i++) {
acc += XXH3_mix16B(input + (16 * i), secret + (16 * i), seed);
}
acc = XXH3_avalanche(acc);
for (i = 8; i < nbRounds; i++) {
acc += XXH3_mix16B(input + (16 * i),
secret + (16 * (i - 8))
+ XXH3_MIDSIZE_STARTOFFSET,
seed);
}
/* last bytes */
acc += XXH3_mix16B(input + length - 16,
secret + XXH3_SECRET_SIZE_MIN
- XXH3_MIDSIZE_LASTOFFSET,
seed);
return XXH3_avalanche(acc);
}
/* Hashes a short input, < 240 bytes */
static XXH64_hash_t XXH3_hashShort_64b(uint8_t const *const input,
size_t const length,
uint8_t const *const secret,
XXH64_hash_t const seed)
{
if (length <= 16)
return XXH3_len_0to16_64b(input, length, secret, seed);
if (length <= 128)
return XXH3_len_17to128_64b(input, length, secret, seed);
return XXH3_len_129to240_64b(input, length, secret, seed);
}
/* This is the main loop. This is usually written in SIMD code. */
static void XXH3_accumulate_512_64b(uint64_t *const acc,
uint8_t const *const input,
uint8_t const *const secret)
{
size_t i;
for (i = 0; i < ACC_NB; i++) {
uint64_t input_val = XXH_read64(input + (8 * i));
acc[i] += input_val;
input_val ^= XXH_read64(secret + (8 * i));
acc[i] += (uint32_t)input_val * (input_val >> 32);
}
}
/* Scrambles input. This is usually written in SIMD code, as it is usually part of the main loop. */
static void XXH3_scrambleAcc(uint64_t *const acc, uint8_t const *const secret)
{
size_t i;
for (i = 0; i < ACC_NB; i++) {
acc[i] ^= acc[i] >> 47;
acc[i] ^= XXH_read64(secret + (8 * i));
acc[i] *= PRIME32_1;
}
}
/* Processes a full block. */
static void XXH3_accumulate_64b(uint64_t *const acc,
uint8_t const *const input,
uint8_t const *const secret,
size_t const nb_stripes)
{
size_t n;
for (n = 0; n < nb_stripes; n++) {
XXH3_accumulate_512_64b(acc, input + n * STRIPE_LEN, secret + (8 * n));
}
}
/* Combines two accumulators with two keys */
static uint64_t XXH3_mix2Accs(uint64_t const *const acc, uint8_t const *const secret)
{
return XXH3_mul128_fold64(
acc[0] ^ XXH_read64(secret),
acc[1] ^ XXH_read64(secret + 8));
}
/* Combines 8 accumulators with keys into 1 finalized 64-bit hash. */
static XXH64_hash_t XXH3_mergeAccs(uint64_t const *const acc, uint8_t const *const key,
uint64_t const start)
{
uint64_t result64 = start;
size_t i = 0;
for (i = 0; i < 4; i++)
result64 += XXH3_mix2Accs(acc + 2 * i, key + 16 * i);
return XXH3_avalanche(result64);
}
/* Controls the long hash function. This is used for both XXH3_64 and XXH3_128. */
static XXH64_hash_t XXH3_hashLong_64b(uint8_t const *const input,
size_t const length,
uint8_t const *const secret,
size_t const secret_size)
{
size_t const nb_rounds = (secret_size - STRIPE_LEN) / XXH_SECRET_CONSUME_RATE;
size_t const block_len = STRIPE_LEN * nb_rounds;
size_t const nb_blocks = length / block_len;
size_t const nb_stripes = (length - (block_len * nb_blocks)) / STRIPE_LEN;
size_t n;
uint64_t acc[ACC_NB];
acc[0] = PRIME32_3;
acc[1] = PRIME64_1;
acc[2] = PRIME64_2;
acc[3] = PRIME64_3;
acc[4] = PRIME64_4;
acc[5] = PRIME32_2;
acc[6] = PRIME64_5;
acc[7] = PRIME32_1;
for (n = 0; n < nb_blocks; n++) {
XXH3_accumulate_64b(acc, input + n * block_len, secret, nb_rounds);
XXH3_scrambleAcc(acc, secret + secret_size - STRIPE_LEN);
}
/* last partial block */
XXH3_accumulate_64b(acc, input + nb_blocks * block_len, secret, nb_stripes);
/* last stripe */
if (length % STRIPE_LEN != 0) {
uint8_t const *const p = input + length - STRIPE_LEN;
/* Do not align on 8, so that the secret is different from the scrambler */
#define XXH_SECRET_LASTACC_START 7
XXH3_accumulate_512_64b(acc, p, secret + secret_size - STRIPE_LEN - XXH_SECRET_LASTACC_START);
}
#define XXH_SECRET_MERGEACCS_START 11
/* converge into final hash */
return XXH3_mergeAccs(acc, secret + XXH_SECRET_MERGEACCS_START, (uint64_t) length * PRIME64_1);
}
/* Hashes a long input, > 240 bytes */
static XXH64_hash_t XXH3_hashLong_64b_withSeed(uint8_t const *const input,
size_t const length,
XXH64_hash_t const seed)
{
uint8_t secret[XXH_SECRET_DEFAULT_SIZE];
size_t i;
for (i = 0; i < XXH_SECRET_DEFAULT_SIZE / 16; i++) {
XXH_write64(secret + (16 * i), XXH_read64(kSecret + (16 * i)) + seed);
XXH_write64(secret + (16 * i) + 8, XXH_read64(kSecret + (16 * i) + 8) - seed);
}
return XXH3_hashLong_64b(input, length, secret, sizeof(secret));
}
/* The XXH3_64 seeded hash function.
* input: The data to hash.
* length: The length of input. It is undefined behavior to have length larger than the
* capacity of input.
* seed: A 64-bit value to seed the hash with.
* returns: The 64-bit calculated hash value. */
XXH64_hash_t XXH3_64bits_withSeed(void const *const input, size_t const length, XXH64_hash_t const seed)
{
if (length <= XXH3_MIDSIZE_MAX)
return XXH3_hashShort_64b((uint8_t const *)input, length, kSecret, seed);
return XXH3_hashLong_64b_withSeed((uint8_t const *)input, length, seed);
}
/* The XXH3_64 non-seeded hash function.
* input: The data to hash.
* length: The length of input. It is undefined behavior to have length larger than the
* capacity of input.
* returns: The 64-bit calculated hash value. */
XXH64_hash_t XXH3_64bits(void const *const input, size_t const length)
{
return XXH3_64bits_withSeed(input, length, 0);
}
/* The XXH3_64 hash function with custom secrets
* input: The data to hash.
* length: The length of input. It is undefined behavior to have length larger than the
* capacity of input.
* secret: The custom secret.
* secret_size: The size of the custom secret. Must be >= XXH_SECRET_SIZE_MIN.
* returns: The 64-bit calculated hash value. */
XXH64_hash_t XXH3_64bits_withSecret(void const *const input, size_t const length,
void const *const secret, size_t const secret_size)
{
if (length <= XXH3_MIDSIZE_MAX)
return XXH3_hashShort_64b((uint8_t const *)input, length, (uint8_t const *)secret, 0);
return XXH3_hashLong_64b((uint8_t const *)input, length, (uint8_t const *)secret, secret_size);
}
#ifdef XXH_SELFTEST
#include <stdio.h> /* fprintf, puts */
#include <stdlib.h> /* exit */
#define TEST_DATA_SIZE 2243
static int test_num = 0;
static void verify(char const *const test_name, uint64_t const expected, uint64_t const result)
{
if (result != expected) {
fprintf(stderr, "Error: Test %i: %s test failed!\n", ++test_num, test_name);
fprintf(stderr, "Expected value: 0x%08X%08X. Actual value: 0x%08X%08X.\n",
(uint32_t) (expected >> 32), (uint32_t) expected, (uint32_t) (result >> 32), (uint32_t) result);
exit(1);
}
}
/* Checks a hash value. */
static void test_sequence(uint8_t const *const test_data, size_t const length,
uint64_t const seed, uint64_t const expected)
{
uint64_t result = XXH3_64bits_withSeed(test_data, length, seed);
verify("XXH3_64bits_withSeed", expected, result);
if (seed == 0) {
result = XXH3_64bits(test_data, length);
verify("XXH3_64bits", expected, result);
}
}
/* Checks a hash value. */
static void test_sequence_secret(uint8_t const *const test_data, size_t const length,
uint8_t const *const secret, size_t const secret_size, uint64_t const expected)
{
uint64_t result = XXH3_64bits_withSecret(test_data, length, secret, secret_size);
verify("XXH3_64bits_withSecret", expected, result);
}
static const uint64_t PRIME64 = 0x9e3779b185ebca8d;
int main(void)
{
uint8_t test_data[TEST_DATA_SIZE];
uint64_t byte_gen = PRIME32_1;
size_t i = 0;
/* Fill in the test_data buffer with "random" data. */
for (; i < TEST_DATA_SIZE; ++i) {
test_data[i] = (uint8_t) (byte_gen >> 56);
byte_gen *= PRIME64;
}
/* xxhsum verification values */
test_sequence(NULL, 0, 0, 0x776EDDFB6BFD9195ULL); /* empty string */
test_sequence(NULL, 0, PRIME64, 0x6AFCE90814C488CBULL);
test_sequence(test_data, 1, 0, 0xB936EBAE24CB01C5ULL); /* 1 - 3 */
test_sequence(test_data, 1, PRIME64, 0xF541B1905037FC39ULL); /* 1 - 3 */
test_sequence(test_data, 6, 0, 0x27B56A84CD2D7325ULL); /* 4 - 8 */
test_sequence(test_data, 6, PRIME64, 0x84589C116AB59AB9ULL); /* 4 - 8 */
test_sequence(test_data, 12, 0, 0xA713DAF0DFBB77E7ULL); /* 9 - 16 */
test_sequence(test_data, 12, PRIME64, 0xE7303E1B2336DE0EULL); /* 9 - 16 */
test_sequence(test_data, 24, 0, 0xA3FE70BF9D3510EBULL); /* 17 - 32 */
test_sequence(test_data, 24, PRIME64, 0x850E80FC35BDD690ULL); /* 17 - 32 */
test_sequence(test_data, 48, 0, 0x397DA259ECBA1F11ULL); /* 33 - 64 */
test_sequence(test_data, 48, PRIME64, 0xADC2CBAA44ACC616ULL); /* 33 - 64 */
test_sequence(test_data, 80, 0, 0xBCDEFBBB2C47C90AULL); /* 65 - 96 */
test_sequence(test_data, 80, PRIME64, 0xC6DD0CB699532E73ULL); /* 65 - 96 */
test_sequence(test_data, 195, 0, 0xCD94217EE362EC3AULL); /* 129-240 */
test_sequence(test_data, 195, PRIME64, 0xBA68003D370CB3D9ULL); /* 129-240 */
test_sequence(test_data, 403, 0, 0x1B2AFF3B46C74648ULL); /* one block, last stripe is overlapping */
test_sequence(test_data, 403, PRIME64, 0xB654F6FFF42AD787ULL); /* one block, last stripe is overlapping */
test_sequence(test_data, 512, 0, 0x43E368661808A9E8ULL); /* one block, finishing at stripe boundary */
test_sequence(test_data, 512, PRIME64, 0x3A865148E584E5B9ULL); /* one block, finishing at stripe boundary */
test_sequence(test_data,2048, 0, 0xC7169244BBDA8BD4ULL); /* 2 blocks, finishing at block boundary */
test_sequence(test_data,2048, PRIME64, 0x74BF9A802BBDFBAEULL); /* 2 blocks, finishing at block boundary */
test_sequence(test_data,2240, 0, 0x30FEB637E114C0C7ULL); /* 3 blocks, finishing at stripe boundary */
test_sequence(test_data,2240, PRIME64, 0xEEF78A36185EB61FULL); /* 3 blocks, finishing at stripe boundary */
test_sequence(test_data,2243, 0, 0x62C631454648A193ULL); /* 3 blocks, last stripe is overlapping */
test_sequence(test_data,2243, PRIME64, 0x6CF80A4BADEA4428ULL); /* 3 blocks, last stripe is overlapping */
{ const uint8_t* const secret = test_data + 7;
const size_t secret_size = XXH3_SECRET_SIZE_MIN + 11;
test_sequence_secret(NULL, 0, secret, secret_size, 0x6775FD10343C92C3ULL); /* empty string */
test_sequence_secret(test_data, 1, secret, secret_size, 0xC3382C326E24E3CDULL); /* 1 - 3 */
test_sequence_secret(test_data, 6, secret, secret_size, 0x82C90AB0519369ADULL); /* 4 - 8 */
test_sequence_secret(test_data, 12, secret, secret_size, 0x14631E773B78EC57ULL); /* 9 - 16 */
test_sequence_secret(test_data, 24, secret, secret_size, 0xCDD5542E4A9D9FE8ULL); /* 17 - 32 */
test_sequence_secret(test_data, 48, secret, secret_size, 0x33ABD54D094B2534ULL); /* 33 - 64 */
test_sequence_secret(test_data, 80, secret, secret_size, 0xE687BA1684965297ULL); /* 65 - 96 */
test_sequence_secret(test_data, 195, secret, secret_size, 0xA057273F5EECFB20ULL); /* 129-240 */
test_sequence_secret(test_data, 403, secret, secret_size, 0xF9C0BA5BA3AF70B8ULL); /* one block, last stripe is overlapping */
test_sequence_secret(test_data, 512, secret, secret_size, 0x7896E65DCFA09071ULL); /* one block, finishing at stripe boundary */
test_sequence_secret(test_data,2048, secret, secret_size, 0xD6545DB87ECFD98CULL); /* >= 2 blocks, at least one scrambling */
test_sequence_secret(test_data,2243, secret, secret_size, 0x887810081C32460AULL); /* >= 2 blocks, at least one scrambling, last stripe unaligned */
}
puts("XXH3_64bits reference implementation: OK");
return 0;
}
#endif /* XXH_SELFTEST */