blob: 3e17d7189eb3511f57dbb3dca0aa78938c12094f [file] [log] [blame]
// Copyright (c) 2006, Google Inc.
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
// * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
// * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
// ---
//
// Author: kenton@google.com (Kenton Varda)
//
// small_map is a drop-in replacement for map or hash_map. It uses a fixed
// array to store a certain number of elements, then reverts to using a
// map or hash_map when it runs out of space. For maps that are typically
// small, this can be considerably faster than using something like hash_map
// directly, as hash_map is optimized for large data sets. Of course, in
// order for this to be a significant win, you have to have a situation where
// you are using lots and lots of these small maps. One such situation is
// MessageSet: A set of search results may contain thousands of MessageSets,
// each containing only a couple items.
//
// TODO(kenton): This is very minimal, and was originally written for a
// very specific use (MessageSet). It only implements a few core methods
// of the STL associative container interface, though you are welcome to
// extend it.
#ifndef UTIL_GTL_SMALL_MAP_H_
#define UTIL_GTL_SMALL_MAP_H_
#include <config.h>
#include <assert.h>
#include <utility> // for make_pair()
#include "base/manual_constructor.h"
namespace ctemplate {
template <bool> struct CompileAssert { };
#define COMPILE_ASSERT(expr, msg) \
typedef CompileAssert<(bool(expr))> msg[bool(expr) ? 1 : -1]
// An STL-like associative container which starts out backed by a simple
// array but switches to some other container type if it grows beyond a
// fixed size.
//
// NormalMap: The map type to fall back to. This also defines the key
// and value types for the small_map.
// kArraySize: The size of the initial array of results. Once the map
// grows beyond this size, the map type will be used instead.
// EqualKey: A functor which tests two keys for equality. If the wrapped
// map type has a "key_equal" member (hash_map does), then that
// will be used by default. Otherwise you must specify this
// manually.
// MapInit: A functor that takes a ManualConstructor<NormalMap>* and uses it to
// initialize the map. This functor will be called at most once per
// small_map, when the map exceeds the threshold of kArraySize and we
// are about to copy values from the array to the map. The functor
// *must* call one of the Init() methods provided by
// ManualConstructor, since after it runs we assume that the NormalMap
// has been initialized.
//
// example:
// small_map<hash_map<string, int> > days;
// days["sunday" ] = 0;
// days["monday" ] = 1;
// days["tuesday" ] = 2;
// days["wednesday"] = 3;
// days["thursday" ] = 4;
// days["friday" ] = 5;
// days["saturday" ] = 6;
//
// You should assume that small_map might invalidate all the iterators
// on any call to erase(), insert() and operator[].
template <typename NormalMap>
class small_map_default_init {
public:
void operator ()(ManualConstructor<NormalMap>* map) const {
map->Init();
}
};
template <typename NormalMap,
int kArraySize = 4,
typename EqualKey = typename NormalMap::key_equal,
typename MapInit = small_map_default_init<NormalMap> >
class small_map {
// We cannot rely on the compiler to reject array of size 0. In
// particular, gcc 2.95.3 does it but later versions allow 0-length
// arrays. Therefore, we explicitly reject non-positive kArraySize
// here.
COMPILE_ASSERT(kArraySize > 0, default_initial_size_should_be_positive);
public:
typedef typename NormalMap::key_type key_type;
typedef typename NormalMap::mapped_type data_type;
typedef typename NormalMap::mapped_type mapped_type;
typedef typename NormalMap::value_type value_type;
typedef EqualKey key_equal;
small_map() : size_(0), functor_(MapInit()) {}
explicit small_map(const MapInit& functor) : size_(0), functor_(functor) {}
// Allow copy-constructor and assignment, since STL allows them too.
small_map(const small_map& src) {
// size_ and functor_ are initted in InitFrom()
InitFrom(src);
}
void operator=(const small_map& src) {
if (&src == this) return;
// This is not optimal. If src and dest are both using the small
// array, we could skip the teardown and reconstruct. One problem
// to be resolved is that the value_type itself is pair<const K,
// V>, and const K is not assignable.
Destroy();
InitFrom(src);
}
~small_map() {
Destroy();
}
class const_iterator;
class iterator {
public:
typedef typename NormalMap::iterator::iterator_category iterator_category;
typedef typename NormalMap::iterator::value_type value_type;
typedef typename NormalMap::iterator::difference_type difference_type;
typedef typename NormalMap::iterator::pointer pointer;
typedef typename NormalMap::iterator::reference reference;
inline iterator(): array_iter_(NULL) {}
inline iterator& operator++() {
if (array_iter_ != NULL) {
++array_iter_;
} else {
++hash_iter_;
}
return *this;
}
inline iterator operator++(int) {
iterator result(*this);
++(*this);
return result;
}
inline iterator& operator--() {
if (array_iter_ != NULL) {
--array_iter_;
} else {
--hash_iter_;
}
return *this;
}
inline iterator operator--(int) {
iterator result(*this);
--(*this);
return result;
}
inline value_type* operator->() const {
if (array_iter_ != NULL) {
return array_iter_->get();
} else {
return hash_iter_.operator->();
}
}
inline value_type& operator*() const {
if (array_iter_ != NULL) {
return *array_iter_->get();
} else {
return *hash_iter_;
}
}
inline bool operator==(const iterator& other) const {
if (array_iter_ != NULL) {
return array_iter_ == other.array_iter_;
} else {
return other.array_iter_ == NULL && hash_iter_ == other.hash_iter_;
}
}
inline bool operator!=(const iterator& other) const {
return !(*this == other);
}
bool operator==(const const_iterator& other) const;
bool operator!=(const const_iterator& other) const;
private:
friend class small_map;
friend class const_iterator;
inline explicit iterator(ManualConstructor<value_type>* init)
: array_iter_(init) {}
inline explicit iterator(const typename NormalMap::iterator& init)
: array_iter_(NULL), hash_iter_(init) {}
ManualConstructor<value_type>* array_iter_;
typename NormalMap::iterator hash_iter_;
};
class const_iterator {
public:
typedef typename NormalMap::const_iterator::iterator_category iterator_category;
typedef typename NormalMap::const_iterator::value_type value_type;
typedef typename NormalMap::const_iterator::difference_type difference_type;
typedef typename NormalMap::const_iterator::pointer pointer;
typedef typename NormalMap::const_iterator::reference reference;
inline const_iterator(): array_iter_(NULL) {}
inline const_iterator(const iterator& other)
: array_iter_(other.array_iter_), hash_iter_(other.hash_iter_) {}
inline const_iterator& operator++() {
if (array_iter_ != NULL) {
++array_iter_;
} else {
++hash_iter_;
}
return *this;
}
inline const_iterator operator++(int) {
const_iterator result(*this);
++(*this);
return result;
}
inline const_iterator& operator--() {
if (array_iter_ != NULL) {
--array_iter_;
} else {
--hash_iter_;
}
return *this;
}
inline const_iterator operator--(int) {
const_iterator result(*this);
--(*this);
return result;
}
inline const value_type* operator->() const {
if (array_iter_ != NULL) {
return array_iter_->get();
} else {
return hash_iter_.operator->();
}
}
inline const value_type& operator*() const {
if (array_iter_ != NULL) {
return *array_iter_->get();
} else {
return *hash_iter_;
}
}
inline bool operator==(const const_iterator& other) const {
if (array_iter_ != NULL) {
return array_iter_ == other.array_iter_;
} else {
return other.array_iter_ == NULL && hash_iter_ == other.hash_iter_;
}
}
inline bool operator!=(const const_iterator& other) const {
return !(*this == other);
}
private:
friend class small_map;
inline explicit const_iterator(
const ManualConstructor<value_type>* init)
: array_iter_(init) {}
inline explicit const_iterator(
const typename NormalMap::const_iterator& init)
: array_iter_(NULL), hash_iter_(init) {}
const ManualConstructor<value_type>* array_iter_;
typename NormalMap::const_iterator hash_iter_;
};
iterator find(const key_type& key) {
key_equal compare;
if (size_ >= 0) {
for (int i = 0; i < size_; i++) {
if (compare(array_[i]->first, key)) {
return iterator(array_ + i);
}
}
return iterator(array_ + size_);
} else {
return iterator(map()->find(key));
}
}
const_iterator find(const key_type& key) const {
key_equal compare;
if (size_ >= 0) {
for (int i = 0; i < size_; i++) {
if (compare(array_[i]->first, key)) {
return const_iterator(array_ + i);
}
}
return const_iterator(array_ + size_);
} else {
return const_iterator(map()->find(key));
}
}
// Invalidates iterators.
data_type& operator[](const key_type& key) {
key_equal compare;
if (size_ >= 0) {
// operator[] searches backwards, favoring recently-added
// elements.
for (int i = size_-1; i >= 0; --i) {
if (compare(array_[i]->first, key)) {
return array_[i]->second;
}
}
if (size_ == kArraySize) {
ConvertToRealMap();
return (*map_)[key];
} else {
array_[size_].Init(key, data_type());
return array_[size_++]->second;
}
} else {
return (*map_)[key];
}
}
// Invalidates iterators.
std::pair<iterator, bool> insert(const value_type& x) {
key_equal compare;
if (size_ >= 0) {
for (int i = 0; i < size_; i++) {
if (compare(array_[i]->first, x.first)) {
return std::make_pair(iterator(array_ + i), false);
}
}
if (size_ == kArraySize) {
ConvertToRealMap(); // Invalidates all iterators!
std::pair<typename NormalMap::iterator, bool> ret = map_->insert(x);
return std::make_pair(iterator(ret.first), ret.second);
} else {
array_[size_].Init(x);
return std::make_pair(iterator(array_ + size_++), true);
}
} else {
std::pair<typename NormalMap::iterator, bool> ret = map_->insert(x);
return std::make_pair(iterator(ret.first), ret.second);
}
}
// Invalidates iterators.
template <class InputIterator>
void insert(InputIterator f, InputIterator l) {
while (f != l) {
insert(*f);
++f;
}
}
iterator begin() {
if (size_ >= 0) {
return iterator(array_);
} else {
return iterator(map_->begin());
}
}
const_iterator begin() const {
if (size_ >= 0) {
return const_iterator(array_);
} else {
return const_iterator(map_->begin());
}
}
iterator end() {
if (size_ >= 0) {
return iterator(array_ + size_);
} else {
return iterator(map_->end());
}
}
const_iterator end() const {
if (size_ >= 0) {
return const_iterator(array_ + size_);
} else {
return const_iterator(map_->end());
}
}
void clear() {
if (size_ >= 0) {
for (int i = 0; i < size_; i++) {
array_[i].Destroy();
}
} else {
map_.Destroy();
}
size_ = 0;
}
// Invalidates iterators.
void erase(const iterator& position) {
if (size_ >= 0) {
int i = position.array_iter_ - array_;
array_[i].Destroy();
--size_;
if (i != size_) {
array_[i].Init(*array_[size_]);
array_[size_].Destroy();
}
} else {
map_->erase(position.hash_iter_);
}
}
int erase(const key_type& key) {
iterator iter = find(key);
if (iter == end()) return 0;
erase(iter);
return 1;
}
int count(const key_type& key) const {
return (find(key) == end()) ? 0 : 1;
}
int size() const {
if (size_ >= 0) {
return size_;
} else {
return map_->size();
}
}
bool empty() const {
if (size_ >= 0) {
return (size_ == 0);
} else {
return map_->empty();
}
}
// Returns true if we have fallen back to using the underlying map
// representation.
bool using_full_map() const {
return size_ < 0;
}
inline NormalMap* map() {
assert(using_full_map());
return map_.get();
}
inline const NormalMap* map() const {
assert(using_full_map());
return map_.get();
}
private:
int size_; // negative = using hash_map
MapInit functor_;
// We want to call constructors and destructors manually, but we don't
// want to allocate and deallocate the memory used for them separately.
// So, we use this crazy ManualConstructor class.
//
// Since array_ and map_ are mutually exclusive, we'll put them in a
// union, too. We add in a dummy_ value which quiets MSVC (both
// 7.1 and 8.0) from otherwise giving an erroneous "union member has
// copy constructor" error message (C2621). This dummy member has
// to come before array_ to quiet the compiler. Shrug.
union {
ManualConstructor<value_type> dummy_;
ManualConstructor<value_type> array_[kArraySize];
ManualConstructor<NormalMap> map_;
};
void ConvertToRealMap() {
// Move the current elements into a temporary array.
ManualConstructor<value_type> temp_array[kArraySize];
for (int i = 0; i < kArraySize; i++) {
temp_array[i].Init(*array_[i]);
array_[i].Destroy();
}
// Initialize the map.
size_ = -1;
functor_(&map_);
// Insert elements into it.
for (int i = 0; i < kArraySize; i++) {
map_->insert(*temp_array[i]);
temp_array[i].Destroy();
}
}
// Helpers for constructors and destructors.
void InitFrom(const small_map& src) {
functor_ = src.functor_;
size_ = src.size_;
if (src.size_ >= 0) {
for (int i = 0; i < size_; i++) {
array_[i].Init(*src.array_[i]);
}
} else {
functor_(&map_);
(*map_.get()) = (*src.map_.get());
}
}
void Destroy() {
if (size_ >= 0) {
for (int i = 0; i < size_; i++) {
array_[i].Destroy();
}
} else {
map_.Destroy();
}
}
};
template <typename NormalMap, int kArraySize, typename EqualKey,
typename Functor>
inline bool small_map<NormalMap, kArraySize, EqualKey,
Functor>::iterator::operator==(
const const_iterator& other) const {
return other == *this;
}
template <typename NormalMap, int kArraySize, typename EqualKey,
typename Functor>
inline bool small_map<NormalMap, kArraySize, EqualKey,
Functor>::iterator::operator!=(
const const_iterator& other) const {
return other != *this;
}
}
#endif // UTIL_GTL_SMALL_MAP_H_