Commit 3fe820cc authored by Davis King's avatar Davis King

Changed the murmur hash implementation to avoid any possibility of strict

aliasing violations in user code, even when things get inlined in unfavorable
ways.
parent 72cc9398
......@@ -6,6 +6,7 @@
#include "murmur_hash3_abstract.h"
#include "../uintn.h"
#include <utility>
#include <string.h>
namespace dlib
{
......@@ -14,7 +15,7 @@ namespace dlib
// in the public domain. The author hereby disclaims copyright to this source code.
// The code in this particular file was modified by Davis E. King. In
// particular, endian-swapping was added along with some other minor code
// changes.
// changes like avoiding strict aliasing violations.
//-----------------------------------------------------------------------------
......@@ -62,7 +63,12 @@ namespace dlib
DLIB_FORCE_INLINE uint32 murmur_getblock ( const uint32 * p, int i )
{
return p[i];
// The reason we do a memcpy() here instead of simply returning p[i] is because
// doing it this way avoids violations of the strict aliasing rule when all these
// functions are inlined into the user's code.
uint32 temp;
memcpy(&temp, p+i, 4);
return temp;
}
DLIB_FORCE_INLINE uint32 murmur_getblock_byte_swap ( const uint32 * p, int i )
......@@ -84,7 +90,12 @@ namespace dlib
DLIB_FORCE_INLINE uint64 murmur_getblock ( const uint64 * p, int i )
{
return p[i];
// The reason we do a memcpy() here instead of simply returning p[i] is because
// doing it this way avoids violations of the strict aliasing rule when all these
// functions are inlined into the user's code.
uint64 temp;
memcpy(&temp, p+i, 8);
return temp;
}
DLIB_FORCE_INLINE uint64 murmur_getblock_byte_swap ( const uint64 * p, int i )
......
......@@ -122,16 +122,11 @@ namespace
bo.host_to_little(buf);
// Copy buf into a char buf to avoid warnings about violation of strict
// aliasing when calling murmur_hash3_128bit().
char buf2[sizeof(buf)];
memcpy(buf2, buf, sizeof(buf));
std::pair<uint64,uint64> temp1, temp2;
// Make sure the 4 integer version of murmur hash does the same thing
// as the memory block version.
temp1 = murmur_hash3_128bit(buf2, sizeof(buf2), 0);
temp1 = murmur_hash3_128bit(buf, sizeof(buf), 0);
temp2 = murmur_hash3_128bit(buf[0], buf[1], buf[2], buf[3]);
DLIB_TEST( temp1.first == temp2.first);
DLIB_TEST( temp1.second == temp2.second);
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment