blob: ac5481336bf14d96f5d8ec23ac70168305ee3728 [file] [log] [blame]
/*
* Copyright (C) 2015 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef ART_COMPILER_UTILS_DEDUPE_SET_INL_H_
#define ART_COMPILER_UTILS_DEDUPE_SET_INL_H_
#include "dedupe_set.h"
#include <algorithm>
#include <inttypes.h>
#include <unordered_map>
#include "base/mutex.h"
#include "base/hash_set.h"
#include "base/stl_util.h"
#include "base/stringprintf.h"
#include "base/time_utils.h"
namespace art {
template <typename InKey,
typename StoreKey,
typename Alloc,
typename HashType,
typename HashFunc,
HashType kShard>
struct DedupeSet<InKey, StoreKey, Alloc, HashType, HashFunc, kShard>::Stats {
size_t collision_sum = 0u;
size_t collision_max = 0u;
size_t total_probe_distance = 0u;
size_t total_size = 0u;
};
template <typename InKey,
typename StoreKey,
typename Alloc,
typename HashType,
typename HashFunc,
HashType kShard>
class DedupeSet<InKey, StoreKey, Alloc, HashType, HashFunc, kShard>::Shard {
public:
Shard(const Alloc& alloc, const std::string& lock_name)
: alloc_(alloc),
lock_name_(lock_name),
lock_(lock_name_.c_str()),
keys_() {
}
~Shard() {
for (const HashedKey<StoreKey>& key : keys_) {
DCHECK(key.Key() != nullptr);
alloc_.Destroy(key.Key());
}
}
const StoreKey* Add(Thread* self, size_t hash, const InKey& in_key) REQUIRES(!lock_) {
MutexLock lock(self, lock_);
HashedKey<InKey> hashed_in_key(hash, &in_key);
auto it = keys_.Find(hashed_in_key);
if (it != keys_.end()) {
DCHECK(it->Key() != nullptr);
return it->Key();
}
const StoreKey* store_key = alloc_.Copy(in_key);
keys_.Insert(HashedKey<StoreKey> { hash, store_key });
return store_key;
}
void UpdateStats(Thread* self, Stats* global_stats) REQUIRES(!lock_) {
// HashSet<> doesn't keep entries ordered by hash, so we actually allocate memory
// for bookkeeping while collecting the stats.
std::unordered_map<HashType, size_t> stats;
{
MutexLock lock(self, lock_);
// Note: The total_probe_distance will be updated with the current state.
// It may have been higher before a re-hash.
global_stats->total_probe_distance += keys_.TotalProbeDistance();
global_stats->total_size += keys_.Size();
for (const HashedKey<StoreKey>& key : keys_) {
auto it = stats.find(key.Hash());
if (it == stats.end()) {
stats.insert({key.Hash(), 1u});
} else {
++it->second;
}
}
}
for (const auto& entry : stats) {
size_t number_of_entries = entry.second;
if (number_of_entries > 1u) {
global_stats->collision_sum += number_of_entries - 1u;
global_stats->collision_max = std::max(global_stats->collision_max, number_of_entries);
}
}
}
private:
template <typename T>
class HashedKey {
public:
HashedKey() : hash_(0u), key_(nullptr) { }
HashedKey(size_t hash, const T* key) : hash_(hash), key_(key) { }
size_t Hash() const {
return hash_;
}
const T* Key() const {
return key_;
}
bool IsEmpty() const {
return Key() == nullptr;
}
void MakeEmpty() {
key_ = nullptr;
}
private:
size_t hash_;
const T* key_;
};
class ShardEmptyFn {
public:
bool IsEmpty(const HashedKey<StoreKey>& key) const {
return key.IsEmpty();
}
void MakeEmpty(HashedKey<StoreKey>& key) {
key.MakeEmpty();
}
};
struct ShardHashFn {
template <typename T>
size_t operator()(const HashedKey<T>& key) const {
return key.Hash();
}
};
struct ShardPred {
typename std::enable_if<!std::is_same<StoreKey, InKey>::value, bool>::type
operator()(const HashedKey<StoreKey>& lhs, const HashedKey<StoreKey>& rhs) const {
DCHECK(lhs.Key() != nullptr);
DCHECK(rhs.Key() != nullptr);
// Rehashing: stored keys are already deduplicated, so we can simply compare key pointers.
return lhs.Key() == rhs.Key();
}
template <typename LeftT, typename RightT>
bool operator()(const HashedKey<LeftT>& lhs, const HashedKey<RightT>& rhs) const {
DCHECK(lhs.Key() != nullptr);
DCHECK(rhs.Key() != nullptr);
return lhs.Hash() == rhs.Hash() &&
lhs.Key()->size() == rhs.Key()->size() &&
std::equal(lhs.Key()->begin(), lhs.Key()->end(), rhs.Key()->begin());
}
};
Alloc alloc_;
const std::string lock_name_;
Mutex lock_;
HashSet<HashedKey<StoreKey>, ShardEmptyFn, ShardHashFn, ShardPred> keys_ GUARDED_BY(lock_);
};
template <typename InKey,
typename StoreKey,
typename Alloc,
typename HashType,
typename HashFunc,
HashType kShard>
const StoreKey* DedupeSet<InKey, StoreKey, Alloc, HashType, HashFunc, kShard>::Add(
Thread* self, const InKey& key) {
uint64_t hash_start;
if (kIsDebugBuild) {
hash_start = NanoTime();
}
HashType raw_hash = HashFunc()(key);
if (kIsDebugBuild) {
uint64_t hash_end = NanoTime();
hash_time_ += hash_end - hash_start;
}
HashType shard_hash = raw_hash / kShard;
HashType shard_bin = raw_hash % kShard;
return shards_[shard_bin]->Add(self, shard_hash, key);
}
template <typename InKey,
typename StoreKey,
typename Alloc,
typename HashType,
typename HashFunc,
HashType kShard>
DedupeSet<InKey, StoreKey, Alloc, HashType, HashFunc, kShard>::DedupeSet(const char* set_name,
const Alloc& alloc)
: hash_time_(0) {
for (HashType i = 0; i < kShard; ++i) {
std::ostringstream oss;
oss << set_name << " lock " << i;
shards_[i].reset(new Shard(alloc, oss.str()));
}
}
template <typename InKey,
typename StoreKey,
typename Alloc,
typename HashType,
typename HashFunc,
HashType kShard>
DedupeSet<InKey, StoreKey, Alloc, HashType, HashFunc, kShard>::~DedupeSet() {
// Everything done by member destructors.
}
template <typename InKey,
typename StoreKey,
typename Alloc,
typename HashType,
typename HashFunc,
HashType kShard>
std::string DedupeSet<InKey, StoreKey, Alloc, HashType, HashFunc, kShard>::DumpStats(
Thread* self) const {
Stats stats;
for (HashType shard = 0; shard < kShard; ++shard) {
shards_[shard]->UpdateStats(self, &stats);
}
return StringPrintf("%zu collisions, %zu max hash collisions, "
"%zu/%zu probe distance, %" PRIu64 " ns hash time",
stats.collision_sum,
stats.collision_max,
stats.total_probe_distance,
stats.total_size,
hash_time_);
}
} // namespace art
#endif // ART_COMPILER_UTILS_DEDUPE_SET_INL_H_