JavaScriptCore/wtf/TCPackedCache.h
changeset 0 4f2f89ce4247
equal deleted inserted replaced
-1:000000000000 0:4f2f89ce4247
       
     1 // Copyright (c) 2007, Google Inc.
       
     2 // All rights reserved.
       
     3 //
       
     4 // Redistribution and use in source and binary forms, with or without
       
     5 // modification, are permitted provided that the following conditions are
       
     6 // met:
       
     7 //
       
     8 //     * Redistributions of source code must retain the above copyright
       
     9 // notice, this list of conditions and the following disclaimer.
       
    10 //     * Redistributions in binary form must reproduce the above
       
    11 // copyright notice, this list of conditions and the following disclaimer
       
    12 // in the documentation and/or other materials provided with the
       
    13 // distribution.
       
    14 //     * Neither the name of Google Inc. nor the names of its
       
    15 // contributors may be used to endorse or promote products derived from
       
    16 // this software without specific prior written permission.
       
    17 //
       
    18 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
       
    19 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
       
    20 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
       
    21 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
       
    22 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
       
    23 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
       
    24 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
       
    25 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
       
    26 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
       
    27 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
       
    28 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
       
    29 
       
    30 // ---
       
    31 // Author: Geoff Pike
       
    32 //
       
    33 // This file provides a minimal cache that can hold a <key, value> pair
       
    34 // with little if any wasted space.  The types of the key and value
       
    35 // must be unsigned integral types or at least have unsigned semantics
       
    36 // for >>, casting, and similar operations.
       
    37 //
       
    38 // Synchronization is not provided.  However, the cache is implemented
       
    39 // as an array of cache entries whose type is chosen at compile time.
       
    40 // If a[i] is atomic on your hardware for the chosen array type then
       
    41 // raciness will not necessarily lead to bugginess.  The cache entries
       
    42 // must be large enough to hold a partial key and a value packed
       
    43 // together.  The partial keys are bit strings of length
       
    44 // kKeybits - kHashbits, and the values are bit strings of length kValuebits.
       
    45 //
       
    46 // In an effort to use minimal space, every cache entry represents
       
    47 // some <key, value> pair; the class provides no way to mark a cache
       
    48 // entry as empty or uninitialized.  In practice, you may want to have
       
    49 // reserved keys or values to get around this limitation.  For example, in
       
    50 // tcmalloc's PageID-to-sizeclass cache, a value of 0 is used as
       
    51 // "unknown sizeclass."
       
    52 //
       
    53 // Usage Considerations
       
    54 // --------------------
       
    55 //
       
    56 // kHashbits controls the size of the cache.  The best value for
       
    57 // kHashbits will of course depend on the application.  Perhaps try
       
    58 // tuning the value of kHashbits by measuring different values on your
       
    59 // favorite benchmark.  Also remember not to be a pig; other
       
    60 // programs that need resources may suffer if you are.
       
    61 //
       
    62 // The main uses for this class will be when performance is
       
    63 // critical and there's a convenient type to hold the cache's
       
    64 // entries.  As described above, the number of bits required
       
    65 // for a cache entry is (kKeybits - kHashbits) + kValuebits.  Suppose
       
    66 // kKeybits + kValuebits is 43.  Then it probably makes sense to
       
    67 // chose kHashbits >= 11 so that cache entries fit in a uint32.
       
    68 //
       
    69 // On the other hand, suppose kKeybits = kValuebits = 64.  Then
       
    70 // using this class may be less worthwhile.  You'll probably
       
    71 // be using 128 bits for each entry anyway, so maybe just pick
       
    72 // a hash function, H, and use an array indexed by H(key):
       
    73 //    void Put(K key, V value) { a_[H(key)] = pair<K, V>(key, value); }
       
    74 //    V GetOrDefault(K key, V default) { const pair<K, V> &p = a_[H(key)]; ... }
       
    75 //    etc.
       
    76 //
       
    77 // Further Details
       
    78 // ---------------
       
    79 //
       
    80 // For caches used only by one thread, the following is true:
       
    81 // 1. For a cache c,
       
    82 //      (c.Put(key, value), c.GetOrDefault(key, 0)) == value
       
    83 //    and
       
    84 //      (c.Put(key, value), <...>, c.GetOrDefault(key, 0)) == value
       
    85 //    if the elided code contains no c.Put calls.
       
    86 //
       
    87 // 2. Has(key) will return false if no <key, value> pair with that key
       
    88 //    has ever been Put.  However, a newly initialized cache will have
       
    89 //    some <key, value> pairs already present.  When you create a new
       
    90 //    cache, you must specify an "initial value."  The initialization
       
    91 //    procedure is equivalent to Clear(initial_value), which is
       
    92 //    equivalent to Put(k, initial_value) for all keys k from 0 to
       
    93 //    2^kHashbits - 1.
       
    94 //
       
    95 // 3. If key and key' differ then the only way Put(key, value) may
       
    96 //    cause Has(key') to change is that Has(key') may change from true to
       
    97 //    false. Furthermore, a Put() call that doesn't change Has(key')
       
    98 //    doesn't change GetOrDefault(key', ...) either.
       
    99 //
       
   100 // Implementation details:
       
   101 //
       
   102 // This is a direct-mapped cache with 2^kHashbits entries;
       
   103 // the hash function simply takes the low bits of the key.
       
   104 // So, we don't have to store the low bits of the key in the entries.
       
   105 // Instead, an entry is the high bits of a key and a value, packed
       
   106 // together.  E.g., a 20 bit key and a 7 bit value only require
       
   107 // a uint16 for each entry if kHashbits >= 11.
       
   108 //
       
   109 // Alternatives to this scheme will be added as needed.
       
   110 
       
   111 #ifndef TCMALLOC_PACKED_CACHE_INL_H__
       
   112 #define TCMALLOC_PACKED_CACHE_INL_H__
       
   113 
       
   114 #ifndef WTF_CHANGES
       
   115 #include "base/basictypes.h"  // for COMPILE_ASSERT
       
   116 #include "base/logging.h"     // for DCHECK
       
   117 #endif
       
   118 
       
   119 #ifndef DCHECK_EQ
       
   120 #define DCHECK_EQ(val1, val2) ASSERT((val1) == (val2))
       
   121 #endif
       
   122 
       
   123 // A safe way of doing "(1 << n) - 1" -- without worrying about overflow
       
   124 // Note this will all be resolved to a constant expression at compile-time
       
   125 #define N_ONES_(IntType, N)                                     \
       
   126   ( (N) == 0 ? 0 : ((static_cast<IntType>(1) << ((N)-1))-1 +    \
       
   127                     (static_cast<IntType>(1) << ((N)-1))) )
       
   128 
       
   129 // The types K and V provide upper bounds on the number of valid keys
       
   130 // and values, but we explicitly require the keys to be less than
       
   131 // 2^kKeybits and the values to be less than 2^kValuebits.  The size of
       
   132 // the table is controlled by kHashbits, and the type of each entry in
       
   133 // the cache is T.  See also the big comment at the top of the file.
       
   134 template <int kKeybits, typename T>
       
   135 class PackedCache {
       
   136  public:
       
   137   typedef uintptr_t K;
       
   138   typedef size_t V;
       
   139   static const size_t kHashbits = 12;
       
   140   static const size_t kValuebits = 8;
       
   141 
       
   142   explicit PackedCache(V initial_value) {
       
   143     COMPILE_ASSERT(kKeybits <= sizeof(K) * 8, key_size);
       
   144     COMPILE_ASSERT(kValuebits <= sizeof(V) * 8, value_size);
       
   145     COMPILE_ASSERT(kHashbits <= kKeybits, hash_function);
       
   146     COMPILE_ASSERT(kKeybits - kHashbits + kValuebits <= kTbits,
       
   147                    entry_size_must_be_big_enough);
       
   148     Clear(initial_value);
       
   149   }
       
   150 
       
   151   void Put(K key, V value) {
       
   152     DCHECK_EQ(key, key & kKeyMask);
       
   153     DCHECK_EQ(value, value & kValueMask);
       
   154     array_[Hash(key)] = static_cast<T>(KeyToUpper(key) | value);
       
   155   }
       
   156 
       
   157   bool Has(K key) const {
       
   158     DCHECK_EQ(key, key & kKeyMask);
       
   159     return KeyMatch(array_[Hash(key)], key);
       
   160   }
       
   161 
       
   162   V GetOrDefault(K key, V default_value) const {
       
   163     // As with other code in this class, we touch array_ as few times
       
   164     // as we can.  Assuming entries are read atomically (e.g., their
       
   165     // type is uintptr_t on most hardware) then certain races are
       
   166     // harmless.
       
   167     DCHECK_EQ(key, key & kKeyMask);
       
   168     T entry = array_[Hash(key)];
       
   169     return KeyMatch(entry, key) ? EntryToValue(entry) : default_value;
       
   170   }
       
   171 
       
   172   void Clear(V value) {
       
   173     DCHECK_EQ(value, value & kValueMask);
       
   174     for (int i = 0; i < 1 << kHashbits; i++) {
       
   175       array_[i] = static_cast<T>(value);
       
   176     }
       
   177   }
       
   178 
       
   179  private:
       
   180   // We are going to pack a value and the upper part of a key into
       
   181   // an entry of type T.  The UPPER type is for the upper part of a key,
       
   182   // after the key has been masked and shifted for inclusion in an entry.
       
   183   typedef T UPPER;
       
   184 
       
   185   static V EntryToValue(T t) { return t & kValueMask; }
       
   186 
       
   187   static UPPER EntryToUpper(T t) { return t & kUpperMask; }
       
   188 
       
   189   // If v is a V and u is an UPPER then you can create an entry by
       
   190   // doing u | v.  kHashbits determines where in a K to find the upper
       
   191   // part of the key, and kValuebits determines where in the entry to put
       
   192   // it.
       
   193   static UPPER KeyToUpper(K k) {
       
   194     const int shift = kHashbits - kValuebits;
       
   195     // Assume kHashbits >= kValuebits. It would be easy to lift this assumption.
       
   196     return static_cast<T>(k >> shift) & kUpperMask;
       
   197   }
       
   198 
       
   199   // This is roughly the inverse of KeyToUpper().  Some of the key has been
       
   200   // thrown away, since KeyToUpper() masks off the low bits of the key.
       
   201   static K UpperToPartialKey(UPPER u) {
       
   202     DCHECK_EQ(u, u & kUpperMask);
       
   203     const int shift = kHashbits - kValuebits;
       
   204     // Assume kHashbits >= kValuebits. It would be easy to lift this assumption.
       
   205     return static_cast<K>(u) << shift;
       
   206   }
       
   207 
       
   208   static size_t Hash(K key) {
       
   209     return static_cast<size_t>(key) & N_ONES_(size_t, kHashbits);
       
   210   }
       
   211 
       
   212   // Does the entry's partial key match the relevant part of the given key?
       
   213   static bool KeyMatch(T entry, K key) {
       
   214     return ((KeyToUpper(key) ^ entry) & kUpperMask) == 0;
       
   215   }
       
   216 
       
   217   static const size_t kTbits = 8 * sizeof(T);
       
   218   static const int kUpperbits = kKeybits - kHashbits;
       
   219 
       
   220   // For masking a K.
       
   221   static const K kKeyMask = N_ONES_(K, kKeybits);
       
   222 
       
   223   // For masking a T.
       
   224   static const T kUpperMask = N_ONES_(T, kUpperbits) << kValuebits;
       
   225 
       
   226   // For masking a V or a T.
       
   227   static const V kValueMask = N_ONES_(V, kValuebits);
       
   228 
       
   229   T array_[1 << kHashbits];
       
   230 };
       
   231 
       
   232 #undef N_ONES_
       
   233 
       
   234 #endif  // TCMALLOC_PACKED_CACHE_INL_H__