// Copyright (c) 2011 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
//

//
// Deal with the differences between Microsoft and GNU implementations
// of hash_map. Allows all platforms to use |base::hash_map| and
// |base::hash_set|.
//  eg:
//   base::hash_map<int, int> my_map;
//   base::hash_set<int> my_set;
//
// NOTE: It is an explicit non-goal of this class to provide a generic hash
// function for pointers.  If you want to hash pointers to a particular class,
// please define the template specialization elsewhere (for example, in its
// header file) and keep it specific to just pointers to that class.  This is
// because identity hashes are not desirable for all types that might show up
// in containers as pointers.

#ifndef BASE_CONTAINERS_HASH_TABLES_H_
#define BASE_CONTAINERS_HASH_TABLES_H_

#include <stddef.h>
#include <stdint.h>

#include <utility>

#include "base/strings/string16.h"
#include "build/build_config.h"

#if defined(COMPILER_MSVC)
#include <unordered_map>
#include <unordered_set>

#define BASE_HASH_NAMESPACE std

#elif defined(COMPILER_GCC)

#define BASE_HASH_NAMESPACE base_hash

// This is a hack to disable the gcc 4.4 warning about hash_map and hash_set
// being deprecated.  We can get rid of this when we upgrade to VS2008 and we
// can use <tr1/unordered_map> and <tr1/unordered_set>.
45 #ifdef __DEPRECATED 46 #define CHROME_OLD__DEPRECATED __DEPRECATED 47 #undef __DEPRECATED 48 #endif 49 50 #include <ext/hash_map> 51 #include <ext/hash_set> 52 #define BASE_HASH_IMPL_NAMESPACE __gnu_cxx 53 54 #include <string> 55 56 #ifdef CHROME_OLD__DEPRECATED 57 #define __DEPRECATED CHROME_OLD__DEPRECATED 58 #undef CHROME_OLD__DEPRECATED 59 #endif 60 61 namespace BASE_HASH_NAMESPACE { 62 63 // The pre-standard hash behaves like C++11's std::hash, except around pointers. 64 // const char* is specialized to hash the C string and hash functions for 65 // general T* are missing. Define a BASE_HASH_NAMESPACE::hash which aligns with 66 // the C++11 behavior. 67 68 template<typename T> 69 struct hash { 70 std::size_t operator()(const T& value) const { 71 return BASE_HASH_IMPL_NAMESPACE::hash<T>()(value); 72 } 73 }; 74 75 template<typename T> 76 struct hash<T*> { 77 std::size_t operator()(T* value) const { 78 return BASE_HASH_IMPL_NAMESPACE::hash<uintptr_t>()( 79 reinterpret_cast<uintptr_t>(value)); 80 } 81 }; 82 83 // The GNU C++ library provides identity hash functions for many integral types, 84 // but not for |long long|. This hash function will truncate if |size_t| is 85 // narrower than |long long|. This is probably good enough for what we will 86 // use it for. 87 88 #define DEFINE_TRIVIAL_HASH(integral_type) \ 89 template<> \ 90 struct hash<integral_type> { \ 91 std::size_t operator()(integral_type value) const { \ 92 return static_cast<std::size_t>(value); \ 93 } \ 94 } 95 96 DEFINE_TRIVIAL_HASH(long long); 97 DEFINE_TRIVIAL_HASH(unsigned long long); 98 99 #undef DEFINE_TRIVIAL_HASH 100 101 // Implement string hash functions so that strings of various flavors can 102 // be used as keys in STL maps and sets. The hash algorithm comes from the 103 // GNU C++ library, in <tr1/functional>. It is duplicated here because GCC 104 // versions prior to 4.3.2 are unable to compile <tr1/functional> when RTTI 105 // is disabled, as it is in our build. 
106 107 #define DEFINE_STRING_HASH(string_type) \ 108 template<> \ 109 struct hash<string_type> { \ 110 std::size_t operator()(const string_type& s) const { \ 111 std::size_t result = 0; \ 112 for (string_type::const_iterator i = s.begin(); i != s.end(); ++i) \ 113 result = (result * 131) + *i; \ 114 return result; \ 115 } \ 116 } 117 118 DEFINE_STRING_HASH(std::string); 119 DEFINE_STRING_HASH(base::string16); 120 121 #undef DEFINE_STRING_HASH 122 123 } // namespace BASE_HASH_NAMESPACE 124 125 #else // COMPILER 126 #error define BASE_HASH_NAMESPACE for your compiler 127 #endif // COMPILER 128 129 namespace base { 130 131 // On MSVC, use the C++11 containers. 132 #if defined(COMPILER_MSVC) 133 134 template<class Key, class T, 135 class Hash = std::hash<Key>, 136 class Pred = std::equal_to<Key>, 137 class Alloc = std::allocator<std::pair<const Key, T>>> 138 using hash_map = std::unordered_map<Key, T, Hash, Pred, Alloc>; 139 140 template<class Key, class T, 141 class Hash = std::hash<Key>, 142 class Pred = std::equal_to<Key>, 143 class Alloc = std::allocator<std::pair<const Key, T>>> 144 using hash_multimap = std::unordered_multimap<Key, T, Hash, Pred, Alloc>; 145 146 template<class Key, 147 class Hash = std::hash<Key>, 148 class Pred = std::equal_to<Key>, 149 class Alloc = std::allocator<Key>> 150 using hash_multiset = std::unordered_multiset<Key, Hash, Pred, Alloc>; 151 152 template<class Key, 153 class Hash = std::hash<Key>, 154 class Pred = std::equal_to<Key>, 155 class Alloc = std::allocator<Key>> 156 using hash_set = std::unordered_set<Key, Hash, Pred, Alloc>; 157 158 #else // !COMPILER_MSVC 159 160 // Otherwise, use the pre-standard ones, but override the default hash to match 161 // C++11. 
162 template<class Key, class T, 163 class Hash = BASE_HASH_NAMESPACE::hash<Key>, 164 class Pred = std::equal_to<Key>, 165 class Alloc = std::allocator<std::pair<const Key, T>>> 166 using hash_map = BASE_HASH_IMPL_NAMESPACE::hash_map<Key, T, Hash, Pred, Alloc>; 167 168 template<class Key, class T, 169 class Hash = BASE_HASH_NAMESPACE::hash<Key>, 170 class Pred = std::equal_to<Key>, 171 class Alloc = std::allocator<std::pair<const Key, T>>> 172 using hash_multimap = 173 BASE_HASH_IMPL_NAMESPACE::hash_multimap<Key, T, Hash, Pred, Alloc>; 174 175 template<class Key, 176 class Hash = BASE_HASH_NAMESPACE::hash<Key>, 177 class Pred = std::equal_to<Key>, 178 class Alloc = std::allocator<Key>> 179 using hash_multiset = 180 BASE_HASH_IMPL_NAMESPACE::hash_multiset<Key, Hash, Pred, Alloc>; 181 182 template<class Key, 183 class Hash = BASE_HASH_NAMESPACE::hash<Key>, 184 class Pred = std::equal_to<Key>, 185 class Alloc = std::allocator<Key>> 186 using hash_set = BASE_HASH_IMPL_NAMESPACE::hash_set<Key, Hash, Pred, Alloc>; 187 188 #undef BASE_HASH_IMPL_NAMESPACE 189 190 #endif // COMPILER_MSVC 191 192 // Implement hashing for pairs of at-most 32 bit integer values. 193 // When size_t is 32 bits, we turn the 64-bit hash code into 32 bits by using 194 // multiply-add hashing. This algorithm, as described in 195 // Theorem 4.3.3 of the thesis "ber die Komplexitt der Multiplikation in 196 // eingeschrnkten Branchingprogrammmodellen" by Woelfel, is: 197 // 198 // h32(x32, y32) = (h64(x32, y32) * rand_odd64 + rand16 * 2^16) % 2^64 / 2^32 199 // 200 // Contact danakj (at) chromium.org for any questions. 
201 inline std::size_t HashInts32(uint32_t value1, uint32_t value2) { 202 uint64_t value1_64 = value1; 203 uint64_t hash64 = (value1_64 << 32) | value2; 204 205 if (sizeof(std::size_t) >= sizeof(uint64_t)) 206 return static_cast<std::size_t>(hash64); 207 208 uint64_t odd_random = 481046412LL << 32 | 1025306955LL; 209 uint32_t shift_random = 10121U << 16; 210 211 hash64 = hash64 * odd_random + shift_random; 212 std::size_t high_bits = static_cast<std::size_t>( 213 hash64 >> (8 * (sizeof(uint64_t) - sizeof(std::size_t)))); 214 return high_bits; 215 } 216 217 // Implement hashing for pairs of up-to 64-bit integer values. 218 // We use the compound integer hash method to produce a 64-bit hash code, by 219 // breaking the two 64-bit inputs into 4 32-bit values: 220 // http://opendatastructures.org/versions/edition-0.1d/ods-java/node33.html#SECTION00832000000000000000 221 // Then we reduce our result to 32 bits if required, similar to above. 222 inline std::size_t HashInts64(uint64_t value1, uint64_t value2) { 223 uint32_t short_random1 = 842304669U; 224 uint32_t short_random2 = 619063811U; 225 uint32_t short_random3 = 937041849U; 226 uint32_t short_random4 = 3309708029U; 227 228 uint32_t value1a = static_cast<uint32_t>(value1 & 0xffffffff); 229 uint32_t value1b = static_cast<uint32_t>((value1 >> 32) & 0xffffffff); 230 uint32_t value2a = static_cast<uint32_t>(value2 & 0xffffffff); 231 uint32_t value2b = static_cast<uint32_t>((value2 >> 32) & 0xffffffff); 232 233 uint64_t product1 = static_cast<uint64_t>(value1a) * short_random1; 234 uint64_t product2 = static_cast<uint64_t>(value1b) * short_random2; 235 uint64_t product3 = static_cast<uint64_t>(value2a) * short_random3; 236 uint64_t product4 = static_cast<uint64_t>(value2b) * short_random4; 237 238 uint64_t hash64 = product1 + product2 + product3 + product4; 239 240 if (sizeof(std::size_t) >= sizeof(uint64_t)) 241 return static_cast<std::size_t>(hash64); 242 243 uint64_t odd_random = 1578233944LL << 32 | 194370989LL; 244 
uint32_t shift_random = 20591U << 16; 245 246 hash64 = hash64 * odd_random + shift_random; 247 std::size_t high_bits = static_cast<std::size_t>( 248 hash64 >> (8 * (sizeof(uint64_t) - sizeof(std::size_t)))); 249 return high_bits; 250 } 251 252 template<typename T1, typename T2> 253 inline std::size_t HashPair(T1 value1, T2 value2) { 254 // This condition is expected to be compile-time evaluated and optimised away 255 // in release builds. 256 if (sizeof(T1) > sizeof(uint32_t) || (sizeof(T2) > sizeof(uint32_t))) 257 return HashInts64(value1, value2); 258 259 return HashInts32(value1, value2); 260 } 261 262 } // namespace base 263 264 namespace BASE_HASH_NAMESPACE { 265 266 // Implement methods for hashing a pair of integers, so they can be used as 267 // keys in STL containers. 268 269 template<typename Type1, typename Type2> 270 struct hash<std::pair<Type1, Type2> > { 271 std::size_t operator()(std::pair<Type1, Type2> value) const { 272 return base::HashPair(value.first, value.second); 273 } 274 }; 275 276 } // namespace BASE_HASH_NAMESPACE 277 278 #undef DEFINE_PAIR_HASH_FUNCTION_START 279 #undef DEFINE_PAIR_HASH_FUNCTION_END 280 281 #endif // BASE_CONTAINERS_HASH_TABLES_H_ 282