2016-11-17 18:35:06 +11:00
|
|
|
/*
 * This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/.
 *
 * Copyright 2016-2018 Danny Robson <danny@nerdcruft.net>
 */
|
|
|
|
|
2017-11-22 16:49:37 +11:00
|
|
|
#include "xxhash.hpp"
|
2016-11-17 18:35:06 +11:00
|
|
|
|
2017-11-22 16:49:37 +11:00
|
|
|
#include "../bitwise.hpp"
|
|
|
|
#include "../debug.hpp"
|
|
|
|
#include "../endian.hpp"
|
2016-11-17 18:35:06 +11:00
|
|
|
|
2018-01-09 16:28:25 +11:00
|
|
|
#include <cstring>
|
|
|
|
|
2018-08-05 14:42:02 +10:00
|
|
|
using cruft::hash::xxhash;
|
2016-11-17 18:35:06 +11:00
|
|
|
|
|
|
|
|
2016-12-21 21:08:26 +11:00
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Decode a little-endian unsigned integer of type T from raw bytes.
///
/// The value is assembled one byte at a time rather than by dereferencing a
/// `T*`. This means:
///   * the address does not need to be aligned for T (the hashing cursor is a
///     byte pointer and makes no alignment guarantee), and
///   * the result is independent of the host's byte order.
///
/// \tparam T    unsigned integer type to decode
/// \param  ptr  address of at least `sizeof (T)` readable bytes
/// \return the decoded value
template <typename T>
static
T
read_le (const void *ptr)
{
    const auto *bytes = static_cast<const unsigned char*> (ptr);

    T value = 0;
    for (std::size_t i = 0; i < sizeof (T); ++i) {
        // byte `i` holds bits [8i, 8i+8) of a little-endian value
        value |= static_cast<T> (static_cast<T> (bytes[i]) << (i * 8));
    }

    return value;
}
|
|
|
|
|
|
|
|
|
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
|
|
/// Per-word-size tuning values for the hash. Only declarations live here;
/// the values are supplied by explicit specialisations for each word type.
template <typename T>
struct constants {
    /// multiplicative constants used throughout mixing
    static const T prime[5];

    /// left-rotation applied inside each accumulator round
    static const T round_rotate;

    /// right-shift amounts for the three steps of the final mix
    static const T final_rotate[3];
};
|
|
|
|
|
|
|
|
|
2016-12-21 21:08:26 +11:00
|
|
|
//-----------------------------------------------------------------------------
|
2016-11-17 18:35:06 +11:00
|
|
|
template <>
|
|
|
|
const uint32_t
|
|
|
|
constants<uint32_t>::prime[5] = {
|
|
|
|
2654435761u,
|
|
|
|
2246822519u,
|
|
|
|
3266489917u,
|
|
|
|
668265263u,
|
|
|
|
374761393u,
|
|
|
|
};
|
|
|
|
|
2016-12-21 21:08:26 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
template <>
|
|
|
|
const uint32_t
|
|
|
|
constants<uint32_t>::final_rotate[3] = {
|
|
|
|
15, 13, 16
|
|
|
|
};
|
|
|
|
|
|
|
|
|
2016-12-21 21:08:26 +11:00
|
|
|
//-----------------------------------------------------------------------------
|
2016-11-17 18:35:06 +11:00
|
|
|
template <>
|
|
|
|
const uint32_t
|
2018-01-18 16:29:06 +11:00
|
|
|
constants<uint32_t>::round_rotate = 13;
|
2016-11-17 18:35:06 +11:00
|
|
|
|
|
|
|
|
2016-12-21 21:08:26 +11:00
|
|
|
//-----------------------------------------------------------------------------
|
2016-11-17 18:35:06 +11:00
|
|
|
template <>
|
|
|
|
const uint64_t constants<uint64_t>::prime[5] = {
|
2018-01-18 16:29:06 +11:00
|
|
|
11400714785074694791ull,
|
|
|
|
14029467366897019727ull,
|
|
|
|
1609587929392839161ull,
|
|
|
|
9650029242287828579ull,
|
|
|
|
2870177450012600261ull,
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
template <>
|
|
|
|
const uint64_t
|
|
|
|
constants<uint64_t>::final_rotate[3] = {
|
|
|
|
33, 29, 32
|
2016-11-17 18:35:06 +11:00
|
|
|
};
|
|
|
|
|
|
|
|
|
2016-12-21 21:08:26 +11:00
|
|
|
//-----------------------------------------------------------------------------
|
2016-11-17 18:35:06 +11:00
|
|
|
template <>
|
|
|
|
const uint64_t
|
2018-01-18 16:29:06 +11:00
|
|
|
constants<uint64_t>::round_rotate = 31;
|
2016-11-17 18:35:06 +11:00
|
|
|
|
|
|
|
|
2016-12-21 21:08:26 +11:00
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
2016-11-17 18:35:06 +11:00
|
|
|
template <typename T>
|
2018-01-13 13:48:58 +11:00
|
|
|
static
|
|
|
|
T
|
2018-01-18 16:29:06 +11:00
|
|
|
round (T state, T input)
|
2018-01-13 13:48:58 +11:00
|
|
|
{
|
2018-01-18 16:29:06 +11:00
|
|
|
state += input * constants<T>::prime[1];
|
2018-08-05 14:42:02 +10:00
|
|
|
state = cruft::rotatel (state, constants<T>::round_rotate);
|
2018-01-18 16:29:06 +11:00
|
|
|
state *= constants<T>::prime[0];
|
2018-01-13 13:48:58 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
return state;
|
2018-01-13 13:48:58 +11:00
|
|
|
}
|
2016-11-17 18:35:06 +11:00
|
|
|
|
|
|
|
|
2018-01-13 13:48:58 +11:00
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
2018-01-18 16:29:06 +11:00
|
|
|
template <typename WordT>
|
|
|
|
xxhash<WordT>::xxhash (WordT _seed):
|
2016-11-17 18:35:06 +11:00
|
|
|
m_seed (_seed)
|
2018-01-13 13:48:58 +11:00
|
|
|
{ ; }
|
2016-11-17 18:35:06 +11:00
|
|
|
|
|
|
|
|
2018-01-13 13:48:58 +11:00
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
2018-01-18 16:29:06 +11:00
|
|
|
template <typename WordT>
|
|
|
|
typename xxhash<WordT>::digest_t
|
2018-08-05 14:42:02 +10:00
|
|
|
xxhash<WordT>::operator() (const cruft::view<const uint8_t*> data)
|
2016-11-17 18:35:06 +11:00
|
|
|
{
|
2018-01-18 16:29:06 +11:00
|
|
|
word_t state[4] {
|
|
|
|
m_seed + constants<WordT>::prime[0] + constants<WordT>::prime[1],
|
|
|
|
m_seed + constants<WordT>::prime[1],
|
|
|
|
m_seed,
|
|
|
|
m_seed - constants<WordT>::prime[0],
|
|
|
|
};
|
|
|
|
|
|
|
|
// consume block sized chunks while they're available.
|
|
|
|
// process each state word independently per block.
|
|
|
|
auto cursor = std::cbegin (data);
|
|
|
|
const auto last = std::cend (data);
|
|
|
|
while (last - cursor > block_bytes) {
|
|
|
|
for (int i = 0; i < 4; ++i) {
|
|
|
|
state[i] = round<word_t> (state[i], read_le<word_t> (cursor));
|
|
|
|
cursor += sizeof (word_t);
|
2016-11-17 18:35:06 +11:00
|
|
|
}
|
2018-01-18 16:29:06 +11:00
|
|
|
}
|
2016-11-17 18:35:06 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
// leave the remainder. it's used midway through finalisation. note that we
|
|
|
|
// don't update the cursor as it's used to detect the remaining bytes
|
|
|
|
// during finalisation.
|
|
|
|
;
|
|
|
|
|
|
|
|
// compress the state and mix in the data size
|
|
|
|
word_t h;
|
|
|
|
if (data.size () < block_bytes) {
|
|
|
|
h = state[2] + constants<WordT>::prime[4];
|
|
|
|
} else {
|
|
|
|
h = rotatel (state[0], 1) +
|
|
|
|
rotatel (state[1], 7) +
|
|
|
|
rotatel (state[2], 12) +
|
|
|
|
rotatel (state[3], 18);
|
|
|
|
|
|
|
|
if constexpr (std::is_same_v<WordT,uint64_t>) {
|
|
|
|
h = (h ^ round<WordT> (0, state[0])) * constants<WordT>::prime[0] + constants<WordT>::prime[3];
|
|
|
|
h = (h ^ round<WordT> (0, state[1])) * constants<WordT>::prime[0] + constants<WordT>::prime[3];
|
|
|
|
h = (h ^ round<WordT> (0, state[2])) * constants<WordT>::prime[0] + constants<WordT>::prime[3];
|
|
|
|
h = (h ^ round<WordT> (0, state[3])) * constants<WordT>::prime[0] + constants<WordT>::prime[3];
|
2018-01-13 13:48:58 +11:00
|
|
|
}
|
2018-01-18 16:29:06 +11:00
|
|
|
}
|
2016-11-17 18:35:06 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
h += static_cast<WordT> (data.size ());
|
2016-11-17 18:35:06 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
// drain the remainder of the data, first by words...
|
|
|
|
while (cursor + sizeof (WordT) <= last) {
|
|
|
|
if constexpr (std::is_same_v<WordT,uint32_t>) {
|
|
|
|
h += read_le<WordT> (cursor) * constants<WordT>::prime[2];
|
|
|
|
h = rotatel (h, 17) * constants<WordT>::prime[3];
|
|
|
|
} else {
|
|
|
|
h = rotatel (
|
|
|
|
h ^ round<WordT> (0, read_le<WordT> (cursor)), 27
|
|
|
|
) * constants<WordT>::prime[0] + constants<WordT>::prime[3];
|
2018-01-13 13:48:58 +11:00
|
|
|
}
|
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
cursor += sizeof (WordT);
|
|
|
|
}
|
2018-01-13 13:48:58 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
// ...then maybe by half words...
|
|
|
|
if constexpr (std::is_same_v<WordT,uint64_t>) {
|
|
|
|
while (cursor + sizeof (uint32_t) <= last) {
|
|
|
|
h = rotatel (
|
|
|
|
h ^ read_le<uint32_t> (cursor) * constants<WordT>::prime[0], 23
|
|
|
|
) * constants<WordT>::prime[1] + constants<WordT>::prime[2];
|
2018-01-13 13:48:58 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
cursor += sizeof (uint32_t);
|
2018-01-13 13:48:58 +11:00
|
|
|
}
|
2018-01-18 16:29:06 +11:00
|
|
|
}
|
2016-11-17 18:35:06 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
// ...then by bytes
|
|
|
|
while (cursor != last) {
|
|
|
|
if constexpr (std::is_same_v<WordT,uint32_t>) {
|
|
|
|
h += *cursor * constants<WordT>::prime[4];
|
|
|
|
h = rotatel (h, 11) * constants<WordT>::prime[0];
|
|
|
|
} else {
|
|
|
|
h = rotatel (h ^ *cursor * constants<WordT>::prime[4], 11) * constants<WordT>::prime[0];
|
2018-01-13 13:48:58 +11:00
|
|
|
}
|
2016-11-17 18:35:06 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
++cursor;
|
|
|
|
}
|
2016-11-17 18:35:06 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
// everything should have been consumed by now
|
|
|
|
CHECK_EQ (cursor, std::cend (data));
|
2016-11-17 18:35:06 +11:00
|
|
|
|
2018-01-18 16:29:06 +11:00
|
|
|
// mix the result one last time before returning
|
|
|
|
h ^= h >> constants<WordT>::final_rotate[0]; h *= constants<WordT>::prime[1];
|
|
|
|
h ^= h >> constants<WordT>::final_rotate[1]; h *= constants<WordT>::prime[2];
|
|
|
|
h ^= h >> constants<WordT>::final_rotate[2];
|
|
|
|
|
|
|
|
return h;
|
|
|
|
};
|
2016-11-17 18:35:06 +11:00
|
|
|
|
|
|
|
|
2016-12-21 21:08:26 +11:00
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
2018-08-05 14:42:02 +10:00
|
|
|
// explicitly instantiate the two supported word sizes
template class cruft::hash::xxhash<uint32_t>;
template class cruft::hash::xxhash<uint64_t>;
|