1 // Definition of _Hash_bytes. -*- C++ -*- 2 3 // Copyright (C) 2010-2014 Free Software Foundation, Inc. 4 // 5 // This file is part of the GNU ISO C++ Library. This library is free 6 // software; you can redistribute it and/or modify it under the 7 // terms of the GNU General Public License as published by the 8 // Free Software Foundation; either version 3, or (at your option) 9 // any later version. 10 11 // This library is distributed in the hope that it will be useful, 12 // but WITHOUT ANY WARRANTY; without even the implied warranty of 13 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 14 // GNU General Public License for more details. 15 16 // Under Section 7 of GPL version 3, you are granted additional 17 // permissions described in the GCC Runtime Library Exception, version 18 // 3.1, as published by the Free Software Foundation. 19 20 // You should have received a copy of the GNU General Public License and 21 // a copy of the GCC Runtime Library Exception along with this program; 22 // see the files COPYING3 and COPYING.RUNTIME respectively. If not, see 23 // <http://www.gnu.org/licenses/>. 24 25 // This file defines Hash_bytes, a primitive used for defining hash 26 // functions. Based on public domain MurmurHashUnaligned2, by Austin 27 // Appleby. http://murmurhash.googlepages.com/ 28 29 // This file also defines _Fnv_hash_bytes, another primitive with 30 // exactly the same interface but using a different hash algorithm, 31 // Fowler / Noll / Vo (FNV) Hash (type FNV-1a). The Murmur hash 32 // function apears to be better in both speed and hash quality, and 33 // FNV is provided primarily for backward compatibility. 34 35 #include <bits/hash_bytes.h> 36 37 namespace 38 { 39 inline std::size_t unaligned_load(const char * p)40 unaligned_load(const char* p) 41 { 42 std::size_t result; 43 __builtin_memcpy(&result, p, sizeof(result)); 44 return result; 45 } 46 47 #if __SIZEOF_SIZE_T__ == 8 48 // Loads n bytes, where 1 <= n < 8. 49 inline std::size_t load_bytes(const char * p,int n)50 load_bytes(const char* p, int n) 51 { 52 std::size_t result = 0; 53 --n; 54 do 55 result = (result << 8) + static_cast<unsigned char>(p[n]); 56 while (--n >= 0); 57 return result; 58 } 59 60 inline std::size_t shift_mix(std::size_t v)61 shift_mix(std::size_t v) 62 { return v ^ (v >> 47);} 63 #endif 64 } 65 66 namespace std 67 { 68 _GLIBCXX_BEGIN_NAMESPACE_VERSION 69 70 #if __SIZEOF_SIZE_T__ == 4 71 72 // Implementation of Murmur hash for 32-bit size_t. 73 size_t _Hash_bytes(const void * ptr,size_t len,size_t seed)74 _Hash_bytes(const void* ptr, size_t len, size_t seed) 75 { 76 const size_t m = 0x5bd1e995; 77 size_t hash = seed ^ len; 78 const char* buf = static_cast<const char*>(ptr); 79 80 // Mix 4 bytes at a time into the hash. 81 while(len >= 4) 82 { 83 size_t k = unaligned_load(buf); 84 k *= m; 85 k ^= k >> 24; 86 k *= m; 87 hash *= m; 88 hash ^= k; 89 buf += 4; 90 len -= 4; 91 } 92 93 // Handle the last few bytes of the input array. 94 switch(len) 95 { 96 case 3: 97 hash ^= static_cast<unsigned char>(buf[2]) << 16; 98 case 2: 99 hash ^= static_cast<unsigned char>(buf[1]) << 8; 100 case 1: 101 hash ^= static_cast<unsigned char>(buf[0]); 102 hash *= m; 103 }; 104 105 // Do a few final mixes of the hash. 106 hash ^= hash >> 13; 107 hash *= m; 108 hash ^= hash >> 15; 109 return hash; 110 } 111 112 // Implementation of FNV hash for 32-bit size_t. 113 size_t _Fnv_hash_bytes(const void * ptr,size_t len,size_t hash)114 _Fnv_hash_bytes(const void* ptr, size_t len, size_t hash) 115 { 116 const char* cptr = static_cast<const char*>(ptr); 117 for (; len; --len) 118 { 119 hash ^= static_cast<size_t>(*cptr++); 120 hash *= static_cast<size_t>(16777619UL); 121 } 122 return hash; 123 } 124 125 #elif __SIZEOF_SIZE_T__ == 8 126 127 // Implementation of Murmur hash for 64-bit size_t. 128 size_t 129 _Hash_bytes(const void* ptr, size_t len, size_t seed) 130 { 131 static const size_t mul = (((size_t) 0xc6a4a793UL) << 32UL) 132 + (size_t) 0x5bd1e995UL; 133 const char* const buf = static_cast<const char*>(ptr); 134 135 // Remove the bytes not divisible by the sizeof(size_t). This 136 // allows the main loop to process the data as 64-bit integers. 137 const int len_aligned = len & ~0x7; 138 const char* const end = buf + len_aligned; 139 size_t hash = seed ^ (len * mul); 140 for (const char* p = buf; p != end; p += 8) 141 { 142 const size_t data = shift_mix(unaligned_load(p) * mul) * mul; 143 hash ^= data; 144 hash *= mul; 145 } 146 if ((len & 0x7) != 0) 147 { 148 const size_t data = load_bytes(end, len & 0x7); 149 hash ^= data; 150 hash *= mul; 151 } 152 hash = shift_mix(hash) * mul; 153 hash = shift_mix(hash); 154 return hash; 155 } 156 157 // Implementation of FNV hash for 64-bit size_t. 158 size_t 159 _Fnv_hash_bytes(const void* ptr, size_t len, size_t hash) 160 { 161 const char* cptr = static_cast<const char*>(ptr); 162 for (; len; --len) 163 { 164 hash ^= static_cast<size_t>(*cptr++); 165 hash *= static_cast<size_t>(1099511628211ULL); 166 } 167 return hash; 168 } 169 170 #else 171 172 // Dummy hash implementation for unusual sizeof(size_t). 173 size_t 174 _Hash_bytes(const void* ptr, size_t len, size_t seed) 175 { 176 size_t hash = seed; 177 const char* cptr = reinterpret_cast<const char*>(ptr); 178 for (; len; --len) 179 hash = (hash * 131) + *cptr++; 180 return hash; 181 } 182 183 size_t 184 _Fnv_hash_bytes(const void* ptr, size_t len, size_t seed) 185 { return _Hash_bytes(ptr, len, seed); } 186 187 #endif /* __SIZEOF_SIZE_T__ */ 188 189 _GLIBCXX_END_NAMESPACE_VERSION 190 } // namespace 191