~ubuntu-branches/ubuntu/jaunty/google-perftools/jaunty

Viewing changes to src/packed-cache-inl.h

Committer: Bazaar Package Importer
Author(s): Daigo Moriwaki
Date: 2008-06-15 23:41:36 UTC
mfrom: (3.1.1 sid)
Revision ID: james.westby@ubuntu.com-20080615234136-al5gawvdvt5vhdtz

Tags: 0.98-1

http://bugs.debian.org/425147

http://bugs.debian.org/454841

http://bugs.debian.org/450294

http://bugs.debian.org/404001

* New upstream release. (Closes: #425147)
* Compiled with GCC 4.3. (Closes: #454841)
* debian/watch: can now report upstream's version (Closes: #450294)
* Because of a file conflict between tau and libgoogle-perftools the
  binary pprof is renamed as google-pprof. (Closes: #404001)
  Great thanks to Michael Mende.
* debian/rules: autoconf files are now generated at the build time.
* Bumped up Standards-Version to 3.7.3, no changes are required.
* Split off a new package, libtcmalloc-minimal0. The upstream supports
  this module on a wider range of platforms, so I leave its architecture
  as `any'.
* libgoogle-perftools0's architecture is now i386. The upstream
  supports this module for x86 and x86_64. However, x86_64 requires
  libunwind's development head, which Debian does not have yet.
* Removed an unnecessary patch, debian/patches/02_profiler.cc_alpha.diff.

files added:
README.windows

debian/README.Debian

debian/libgoogle-perftools0.docs

debian/libtcmalloc-minimal0.dirs

debian/libtcmalloc-minimal0.install

doc/cpuprofile-fileformat.html

doc/cpuprofile.html

doc/designstyle.css

doc/heapprofile.html

doc/pprof_remote_servers.html

google-perftools.sln

m4/ac_have_attribute.m4

m4/acx_pthread.m4

m4/compiler_characteristics.m4

m4/install_prefix.m4

m4/namespaces.m4

m4/program_invocation_name.m4

m4/stl_hash.m4

m4/stl_namespace.m4

src/base/atomicops-internals-linuxppc.h

src/base/atomicops-internals-macosx.h

src/base/atomicops-internals-x86-msvc.h

src/base/atomicops-internals-x86.cc

src/base/atomicops-internals-x86.h

src/base/atomicops.h

src/base/cycleclock.h

src/base/dynamic_annotations.cc

src/base/dynamic_annotations.h

src/base/logging.cc

src/base/low_level_alloc.cc

src/base/low_level_alloc.h

src/base/simple_mutex.h

src/base/spinlock.cc

src/base/spinlock.h

src/base/stl_allocator.h

src/base/sysinfo.cc

src/base/sysinfo.h

src/config_for_unittests.h

src/getpc.h

src/heap-profile-table.cc

src/heap-profile-table.h

src/malloc_hook-inl.h

src/memfs_malloc.cc

src/memory_region_map.cc

src/memory_region_map.h

src/packed-cache-inl.h

src/profiledata.cc

src/profiledata.h

src/solaris

src/solaris/libstdc++.la

src/stacktrace_powerpc-inl.h

src/tcmalloc.h

src/tests/atomicops_unittest.cc

src/tests/frag_unittest.cc

src/tests/getpc_test.cc

src/tests/low_level_alloc_unittest.cc

src/tests/markidle_unittest.cc

src/tests/maybe_threads_unittest.sh

src/tests/memalign_unittest.cc

src/tests/packed-cache_test.cc

src/tests/profiledata_unittest.cc

src/tests/system-alloc_unittest.cc

src/tests/testutil.cc

src/tests/testutil.h

src/tests/thread_dealloc_unittest.cc

src/windows

src/windows/config.h

src/windows/ia32_modrm_map.cc

src/windows/ia32_opcode_map.cc

src/windows/mingw.h

src/windows/mini_disassembler.cc

src/windows/mini_disassembler.h

src/windows/mini_disassembler_types.h

src/windows/patch_functions.cc

src/windows/port.cc

src/windows/port.h

src/windows/preamble_patcher.cc

src/windows/preamble_patcher.h

src/windows/preamble_patcher_with_stub.cc

src/windows/vc7and8.def

vsprojects

vsprojects/addressmap_unittest

vsprojects/addressmap_unittest/addressmap_unittest.vcproj

vsprojects/frag_unittest

vsprojects/frag_unittest/frag_unittest.vcproj

vsprojects/libtcmalloc_minimal

vsprojects/libtcmalloc_minimal/libtcmalloc_minimal.vcproj

vsprojects/low_level_alloc_unittest

vsprojects/low_level_alloc_unittest/low_level_alloc_unittest.vcproj

vsprojects/markidle_unittest

vsprojects/markidle_unittest/markidle_unittest.vcproj

vsprojects/memalign_unittest

vsprojects/memalign_unittest/memalign_unittest.vcproj

vsprojects/packed-cache_test

vsprojects/packed-cache_test/packed-cache_test.vcproj

vsprojects/tcmalloc_minimal_large

vsprojects/tcmalloc_minimal_large/tcmalloc_minimal_large_unittest.vcproj

vsprojects/tcmalloc_minimal_unittest

vsprojects/tcmalloc_minimal_unittest-static

vsprojects/tcmalloc_minimal_unittest/tcmalloc_minimal_unittest.vcproj

vsprojects/thread_dealloc_unittest

vsprojects/thread_dealloc_unittest/thread_dealloc_unittest.vcproj

files removed:
debian/patches

debian/patches/01_linux_syscall_support_h.diff

debian/patches/02_profiler.cc_alpha.diff

debian/patches/03_FTBFS_gcc-4.3.diff

doc/cpu_profiler.html

doc/heap_profiler.html

src/config.h

src/google/perftools

src/google/perftools/hash_set.h

src/heap-profiler-inl.h

src/internal_spinlock.h

files modified:
ChangeLog

INSTALL

Makefile.am

Makefile.in

README

TODO

aclocal.m4

compile

config.guess

config.sub

configure

configure.ac

debian/changelog

debian/control

debian/docs

debian/libgoogle-perftools0.install

debian/libgoogle-perftools0.manpages

debian/rules

debian/watch

depcomp

doc/heap_checker.html

doc/index.html

doc/tcmalloc.html

install-sh

libtool

ltmain.sh

missing

mkinstalldirs

packages/deb/changelog

packages/deb/docs

packages/rpm/rpm.spec

src/addressmap-inl.h

src/base/basictypes.h

src/base/commandlineflags.h

src/base/elfcore.h

src/base/googleinit.h

src/base/linux_syscall_support.h

src/base/linuxthreads.c

src/base/linuxthreads.h

src/base/logging.h

src/base/thread_lister.c

src/base/thread_lister.h

src/config.h.in

src/google/heap-checker.h

src/google/heap-profiler.h

src/google/malloc_extension.h

src/google/malloc_hook.h

src/google/profiler.h

src/google/stacktrace.h

src/heap-checker-bcad.cc

src/heap-checker.cc

src/heap-profiler.cc

src/internal_logging.cc

src/internal_logging.h

src/malloc_extension.cc

src/malloc_hook.cc

src/maybe_threads.cc

src/maybe_threads.h

src/pagemap.h

src/pprof

src/profiler.cc

src/stacktrace.cc

src/stacktrace_generic-inl.h

src/stacktrace_libunwind-inl.h

src/stacktrace_x86-inl.h

src/stacktrace_x86_64-inl.h

src/system-alloc.cc

src/system-alloc.h

src/tcmalloc.cc

src/tests/addressmap_unittest.cc

src/tests/heap-checker-death_unittest.sh

src/tests/heap-checker_unittest.cc

src/tests/heap-checker_unittest.sh

src/tests/heap-profiler_unittest.cc

src/tests/heap-profiler_unittest.sh

src/tests/profiler_unittest.cc

src/tests/profiler_unittest.sh

src/tests/ptmalloc/malloc-machine.h

src/tests/stacktrace_unittest.cc

src/tests/tcmalloc_large_unittest.cc

src/tests/tcmalloc_unittest.cc

Show diffs side-by-side

added added

removed removed

src/packed-cache-inl.h

// Redistribution and use in source and binary forms, with or without

// modification, are permitted provided that the following conditions are

// met:

// * Redistributions of source code must retain the above copyright

// notice, this list of conditions and the following disclaimer.

// * Redistributions in binary form must reproduce the above

// copyright notice, this list of conditions and the following disclaimer

// in the documentation and/or other materials provided with the

// distribution.

// * Neither the name of Google Inc. nor the names of its

// contributors may be used to endorse or promote products derived from

// this software without specific prior written permission.

// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT

// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT

// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

// ---

// Author: Geoff Pike

// This file provides a minimal cache that can hold a <key, value> pair

// with little if any wasted space. The types of the key and value

// must be unsigned integral types or at least have unsigned semantics

// for >>, casting, and similar operations.

// Synchronization is not provided. However, the cache is implemented

// as an array of cache entries whose type is chosen at compile time.

// If a[i] is atomic on your hardware for the chosen array type then

// raciness will not necessarily lead to bugginess. The cache entries

// must be large enough to hold a partial key and a value packed

// together. The partial keys are bit strings of length

// kKeybits - kHashbits, and the values are bit strings of length kValuebits.

// In an effort to use minimal space, every cache entry represents

// some <key, value> pair; the class provides no way to mark a cache

// entry as empty or uninitialized. In practice, you may want to have

// reserved keys or values to get around this limitation. For example, in

// tcmalloc's PageID-to-sizeclass cache, a value of 0 is used as

// "unknown sizeclass."

// Usage Considerations

// --------------------

// kHashbits controls the size of the cache. The best value for

// kHashbits will of course depend on the application. Perhaps try

// tuning the value of kHashbits by measuring different values on your

// favorite benchmark. Also remember not to be a pig; other

// programs that need resources may suffer if you are.

// The main uses for this class will be when performance is

// critical and there's a convenient type to hold the cache's

// entries. As described above, the number of bits required

// for a cache entry is (kKeybits - kHashbits) + kValuebits. Suppose

// kKeybits + kValuebits is 43. Then it probably makes sense to

// choose kHashbits >= 11 so that cache entries fit in a uint32.

// On the other hand, suppose kKeybits = kValuebits = 64. Then

// using this class may be less worthwhile. You'll probably

// be using 128 bits for each entry anyway, so maybe just pick

// a hash function, H, and use an array indexed by H(key):

// void Put(K key, V value) { a_[H(key)] = pair<K, V>(key, value); }

// V GetOrDefault(K key, V default) { const pair<K, V> &p = a_[H(key)]; ... }

// etc.

// Further Details

// ---------------

// For caches used only by one thread, the following is true:

// 1. For a cache c,

// (c.Put(key, value), c.GetOrDefault(key, 0)) == value

// and

// (c.Put(key, value), <...>, c.GetOrDefault(key, 0)) == value

// if the elided code contains no c.Put calls.

// 2. Has(key) will return false if no <key, value> pair with that key

// has ever been Put. However, a newly initialized cache will have

// some <key, value> pairs already present. When you create a new

// cache, you must specify an "initial value." The initialization

// procedure is equivalent to Clear(initial_value), which is

// equivalent to Put(k, initial_value) for all keys k from 0 to

// 2^kHashbits - 1.

// 3. If key and key' differ then the only way Put(key, value) may

// cause Has(key') to change is that Has(key') may change from true to

// false. Furthermore, a Put() call that doesn't change Has(key')

// doesn't change GetOrDefault(key', ...) either.

100

// Implementation details:

101

102

// This is a direct-mapped cache with 2^kHashbits entries; the hash

103

// function simply takes the low bits of the key. We store whole keys

104

// if a whole key plus a whole value fits in an entry. Otherwise, an

105

// entry is the high bits of a key and a value, packed together.

106

// E.g., a 20 bit key and a 7 bit value only require a uint16 for each

107

// entry if kHashbits >= 11.

108

109

// Alternatives to this scheme will be added as needed.

110

111

#ifndef TCMALLOC_PACKED_CACHE_INL_H_

112

#define TCMALLOC_PACKED_CACHE_INL_H_

113

114

#include "base/basictypes.h" // for COMPILE_ASSERT

115

#include "base/logging.h" // for DCHECK

116

117

// A safe way of doing "(1 << n) - 1" -- without worrying about overflow

118

// Note this will all be resolved to a constant expression at compile-time

119

// N_ONES_(IntType, N) yields a value with the N low-order bits set, i.e.
// the value of "(1 << N) - 1".  It never shifts by N itself: the result is
// the sum of ((1 << (N-1)) - 1) and (1 << (N-1)), so for an unsigned
// IntType N may be as large as the bit width of IntType.  N == 0 yields 0.
#define N_ONES_(IntType, N)                                  \
  ((N) == 0                                                  \
       ? 0                                                   \
       : ((static_cast<IntType>(1) << ((N) - 1)) - 1 +       \
          (static_cast<IntType>(1) << ((N) - 1))))

122

123

// The types K and V provide upper bounds on the number of valid keys

124

// and values, but we explicitly require the keys to be less than

125

// 2^kKeybits and the values to be less than 2^kValuebits. The size of

126

// the table is controlled by kHashbits, and the type of each entry in

127

// the cache is T. See also the big comment at the top of the file.

128

template <int kKeybits, typename T>

129

class PackedCache {

130

public:

131

typedef uintptr_t K;

132

typedef size_t V;

133

static const int kHashbits = 12;

134

static const int kValuebits = 7;

135

static const bool kUseWholeKeys = kKeybits + kValuebits <= 8 * sizeof(T);

136

137

explicit PackedCache(V initial_value) {

138

COMPILE_ASSERT(kKeybits <= sizeof(K) * 8, key_size);

139

COMPILE_ASSERT(kValuebits <= sizeof(V) * 8, value_size);

140

COMPILE_ASSERT(kHashbits <= kKeybits, hash_function);

141

COMPILE_ASSERT(kKeybits - kHashbits + kValuebits <= kTbits,

142

entry_size_must_be_big_enough);

143

Clear(initial_value);

144

}

145

146

void Put(K key, V value) {

147

DCHECK_EQ(key, key & kKeyMask);

148

DCHECK_EQ(value, value & kValueMask);

149

array_[Hash(key)] = KeyToUpper(key) | value;

150

}

151

152

bool Has(K key) const {

153

DCHECK_EQ(key, key & kKeyMask);

154

return KeyMatch(array_[Hash(key)], key);

155

}

156

157

V GetOrDefault(K key, V default_value) const {

158

// As with other code in this class, we touch array_ as few times

159

// as we can. Assuming entries are read atomically (e.g., their

160

// type is uintptr_t on most hardware) then certain races are

161

// harmless.

162

DCHECK_EQ(key, key & kKeyMask);

163

T entry = array_[Hash(key)];

164

return KeyMatch(entry, key) ? EntryToValue(entry) : default_value;

165

}

166

167

void Clear(V value) {

168

DCHECK_EQ(value, value & kValueMask);

169

for (int i = 0; i < 1 << kHashbits; i++) {

170

RAW_DCHECK(kUseWholeKeys || KeyToUpper(i) == 0, "KeyToUpper failure");

171

array_[i] = kUseWholeKeys ? (value | KeyToUpper(i)) : value;

172

}

173

}

174

175

private:

176

// We are going to pack a value and the upper part of a key (or a

177

// whole key) into an entry of type T. The UPPER type is for the

178

// upper part of a key, after the key has been masked and shifted

179

// for inclusion in an entry.

180

typedef T UPPER;

181

182

static V EntryToValue(T t) { return t & kValueMask; }

183

184

// If we have space for a whole key, we just shift it left.

185

// Otherwise kHashbits determines where in a K to find the upper

186

// part of the key, and kValuebits determines where in the entry to

187

// put it.

188

static UPPER KeyToUpper(K k) {

189

if (kUseWholeKeys) {

190

return static_cast<T>(k) << kValuebits;

191

} else {

192

const int shift = kHashbits - kValuebits;

193

// Assume kHashbits >= kValuebits. It'd be easy to lift this assumption.

194

return static_cast<T>(k >> shift) & kUpperMask;

195

}

196

}

197

198

static size_t Hash(K key) {

199

return static_cast<size_t>(key) & N_ONES_(size_t, kHashbits);

200

}

201

202

// Does the entry match the relevant part of the given key?

203

static bool KeyMatch(T entry, K key) {

204

return kUseWholeKeys ?

205

(entry >> kValuebits == key) :

206

((KeyToUpper(key) ^ entry) & kUpperMask) == 0;

207

}

208

209

static const int kTbits = 8 * sizeof(T);

210

static const int kUpperbits = kUseWholeKeys ? kKeybits : kKeybits - kHashbits;

211

212

// For masking a K.

213

static const K kKeyMask = N_ONES_(K, kKeybits);

214

215

// For masking a T.

216

static const T kUpperMask = N_ONES_(T, kUpperbits) << kValuebits;

217

218

// For masking a V or a T.

219

static const V kValueMask = N_ONES_(V, kValuebits);

220

221

// array_ is the cache. Its elements are volatile because any

222

// thread can write any array element at any time.

223

volatile T array_[1 << kHashbits];

224

};

225

226

#undef N_ONES_

227

228

#endif // TCMALLOC_PACKED_CACHE_INL_H_

Older »