Austin Schuh | 745610d | 2015-09-06 18:19:50 -0700 | [diff] [blame^] | 1 | // -*- Mode: C++; c-basic-offset: 2; indent-tabs-mode: nil -*- |
| 2 | // Copyright (c) 2005, Google Inc. |
| 3 | // All rights reserved. |
| 4 | // |
| 5 | // Redistribution and use in source and binary forms, with or without |
| 6 | // modification, are permitted provided that the following conditions are |
| 7 | // met: |
| 8 | // |
| 9 | // * Redistributions of source code must retain the above copyright |
| 10 | // notice, this list of conditions and the following disclaimer. |
| 11 | // * Redistributions in binary form must reproduce the above |
| 12 | // copyright notice, this list of conditions and the following disclaimer |
| 13 | // in the documentation and/or other materials provided with the |
| 14 | // distribution. |
| 15 | // * Neither the name of Google Inc. nor the names of its |
| 16 | // contributors may be used to endorse or promote products derived from |
| 17 | // this software without specific prior written permission. |
| 18 | // |
| 19 | // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| 20 | // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| 21 | // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| 22 | // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| 23 | // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| 24 | // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| 25 | // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| 26 | // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| 27 | // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| 28 | // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| 29 | // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| 30 | |
| 31 | // --- |
| 32 | // Author: Sanjay Ghemawat <opensource@google.com> |
| 33 | // |
| 34 | // Extra extensions exported by some malloc implementations. These |
| 35 | // extensions are accessed through a virtual base class so an |
| 36 | // application can link against a malloc that does not implement these |
| 37 | // extensions, and it will get default versions that do nothing. |
| 38 | // |
| 39 | // NOTE FOR C USERS: If you wish to use this functionality from within |
| 40 | // a C program, see malloc_extension_c.h. |
| 41 | |
| 42 | #ifndef BASE_MALLOC_EXTENSION_H_ |
| 43 | #define BASE_MALLOC_EXTENSION_H_ |
| 44 | |
| 45 | #include <stddef.h> |
| 46 | // I can't #include config.h in this public API file, but I should |
| 47 | // really use configure (and make malloc_extension.h a .in file) to |
| 48 | // figure out if the system has stdint.h or not. But I'm lazy, so |
| 49 | // for now I'm assuming it's a problem only with MSVC. |
| 50 | #ifndef _MSC_VER |
| 51 | #include <stdint.h> |
| 52 | #endif |
| 53 | #include <string> |
| 54 | #include <vector> |
| 55 | |
| 56 | // Annoying stuff for windows -- makes sure clients can import these functions |
| 57 | #ifndef PERFTOOLS_DLL_DECL |
| 58 | # ifdef _WIN32 |
| 59 | # define PERFTOOLS_DLL_DECL __declspec(dllimport) |
| 60 | # else |
| 61 | # define PERFTOOLS_DLL_DECL |
| 62 | # endif |
| 63 | #endif |
| 64 | |
| 65 | static const int kMallocHistogramSize = 64; |
| 66 | |
| 67 | // One day, we could support other types of writers (perhaps for C?) |
| 68 | typedef std::string MallocExtensionWriter; |
| 69 | |
| 70 | namespace base { |
| 71 | struct MallocRange; |
| 72 | } |
| 73 | |
| 74 | // Interface to a pluggable system allocator. |
| 75 | class PERFTOOLS_DLL_DECL SysAllocator { |
| 76 | public: |
| 77 | SysAllocator() { |
| 78 | } |
| 79 | virtual ~SysAllocator(); |
| 80 | |
| 81 | // Allocates "size"-byte of memory from system aligned with "alignment". |
| 82 | // Returns NULL if failed. Otherwise, the returned pointer p up to and |
| 83 | // including (p + actual_size -1) have been allocated. |
| 84 | virtual void* Alloc(size_t size, size_t *actual_size, size_t alignment) = 0; |
| 85 | }; |
| 86 | |
| 87 | // The default implementations of the following routines do nothing. |
| 88 | // All implementations should be thread-safe; the current one |
| 89 | // (TCMallocImplementation) is. |
| 90 | class PERFTOOLS_DLL_DECL MallocExtension { |
| 91 | public: |
| 92 | virtual ~MallocExtension(); |
| 93 | |
| 94 | // Call this very early in the program execution -- say, in a global |
| 95 | // constructor -- to set up parameters and state needed by all |
| 96 | // instrumented malloc implemenatations. One example: this routine |
| 97 | // sets environemnt variables to tell STL to use libc's malloc() |
| 98 | // instead of doing its own memory management. This is safe to call |
| 99 | // multiple times, as long as each time is before threads start up. |
| 100 | static void Initialize(); |
| 101 | |
| 102 | // See "verify_memory.h" to see what these routines do |
| 103 | virtual bool VerifyAllMemory(); |
| 104 | virtual bool VerifyNewMemory(const void* p); |
| 105 | virtual bool VerifyArrayNewMemory(const void* p); |
| 106 | virtual bool VerifyMallocMemory(const void* p); |
| 107 | virtual bool MallocMemoryStats(int* blocks, size_t* total, |
| 108 | int histogram[kMallocHistogramSize]); |
| 109 | |
| 110 | // Get a human readable description of the current state of the malloc |
| 111 | // data structures. The state is stored as a null-terminated string |
| 112 | // in a prefix of "buffer[0,buffer_length-1]". |
| 113 | // REQUIRES: buffer_length > 0. |
| 114 | virtual void GetStats(char* buffer, int buffer_length); |
| 115 | |
| 116 | // Outputs to "writer" a sample of live objects and the stack traces |
| 117 | // that allocated these objects. The format of the returned output |
| 118 | // is equivalent to the output of the heap profiler and can |
| 119 | // therefore be passed to "pprof". This function is equivalent to |
| 120 | // ReadStackTraces. The main difference is that this function returns |
| 121 | // serialized data appropriately formatted for use by the pprof tool. |
| 122 | // NOTE: by default, tcmalloc does not do any heap sampling, and this |
| 123 | // function will always return an empty sample. To get useful |
| 124 | // data from GetHeapSample, you must also set the environment |
| 125 | // variable TCMALLOC_SAMPLE_PARAMETER to a value such as 524288. |
| 126 | virtual void GetHeapSample(MallocExtensionWriter* writer); |
| 127 | |
| 128 | // Outputs to "writer" the stack traces that caused growth in the |
| 129 | // address space size. The format of the returned output is |
| 130 | // equivalent to the output of the heap profiler and can therefore |
| 131 | // be passed to "pprof". This function is equivalent to |
| 132 | // ReadHeapGrowthStackTraces. The main difference is that this function |
| 133 | // returns serialized data appropriately formatted for use by the |
| 134 | // pprof tool. (This does not depend on, or require, |
| 135 | // TCMALLOC_SAMPLE_PARAMETER.) |
| 136 | virtual void GetHeapGrowthStacks(MallocExtensionWriter* writer); |
| 137 | |
| 138 | // Invokes func(arg, range) for every controlled memory |
| 139 | // range. *range is filled in with information about the range. |
| 140 | // |
| 141 | // This is a best-effort interface useful only for performance |
| 142 | // analysis. The implementation may not call func at all. |
| 143 | typedef void (RangeFunction)(void*, const base::MallocRange*); |
| 144 | virtual void Ranges(void* arg, RangeFunction func); |
| 145 | |
| 146 | // ------------------------------------------------------------------- |
| 147 | // Control operations for getting and setting malloc implementation |
| 148 | // specific parameters. Some currently useful properties: |
| 149 | // |
| 150 | // generic |
| 151 | // ------- |
| 152 | // "generic.current_allocated_bytes" |
| 153 | // Number of bytes currently allocated by application |
| 154 | // This property is not writable. |
| 155 | // |
| 156 | // "generic.heap_size" |
| 157 | // Number of bytes in the heap == |
| 158 | // current_allocated_bytes + |
| 159 | // fragmentation + |
| 160 | // freed memory regions |
| 161 | // This property is not writable. |
| 162 | // |
| 163 | // tcmalloc |
| 164 | // -------- |
| 165 | // "tcmalloc.max_total_thread_cache_bytes" |
| 166 | // Upper limit on total number of bytes stored across all |
| 167 | // per-thread caches. Default: 16MB. |
| 168 | // |
| 169 | // "tcmalloc.current_total_thread_cache_bytes" |
| 170 | // Number of bytes used across all thread caches. |
| 171 | // This property is not writable. |
| 172 | // |
| 173 | // "tcmalloc.central_cache_free_bytes" |
| 174 | // Number of free bytes in the central cache that have been |
| 175 | // assigned to size classes. They always count towards virtual |
| 176 | // memory usage, and unless the underlying memory is swapped out |
| 177 | // by the OS, they also count towards physical memory usage. |
| 178 | // This property is not writable. |
| 179 | // |
| 180 | // "tcmalloc.transfer_cache_free_bytes" |
| 181 | // Number of free bytes that are waiting to be transfered between |
| 182 | // the central cache and a thread cache. They always count |
| 183 | // towards virtual memory usage, and unless the underlying memory |
| 184 | // is swapped out by the OS, they also count towards physical |
| 185 | // memory usage. This property is not writable. |
| 186 | // |
| 187 | // "tcmalloc.thread_cache_free_bytes" |
| 188 | // Number of free bytes in thread caches. They always count |
| 189 | // towards virtual memory usage, and unless the underlying memory |
| 190 | // is swapped out by the OS, they also count towards physical |
| 191 | // memory usage. This property is not writable. |
| 192 | // |
| 193 | // "tcmalloc.pageheap_free_bytes" |
| 194 | // Number of bytes in free, mapped pages in page heap. These |
| 195 | // bytes can be used to fulfill allocation requests. They |
| 196 | // always count towards virtual memory usage, and unless the |
| 197 | // underlying memory is swapped out by the OS, they also count |
| 198 | // towards physical memory usage. This property is not writable. |
| 199 | // |
| 200 | // "tcmalloc.pageheap_unmapped_bytes" |
| 201 | // Number of bytes in free, unmapped pages in page heap. |
| 202 | // These are bytes that have been released back to the OS, |
| 203 | // possibly by one of the MallocExtension "Release" calls. |
| 204 | // They can be used to fulfill allocation requests, but |
| 205 | // typically incur a page fault. They always count towards |
| 206 | // virtual memory usage, and depending on the OS, typically |
| 207 | // do not count towards physical memory usage. This property |
| 208 | // is not writable. |
| 209 | // ------------------------------------------------------------------- |
| 210 | |
| 211 | // Get the named "property"'s value. Returns true if the property |
| 212 | // is known. Returns false if the property is not a valid property |
| 213 | // name for the current malloc implementation. |
| 214 | // REQUIRES: property != NULL; value != NULL |
| 215 | virtual bool GetNumericProperty(const char* property, size_t* value); |
| 216 | |
| 217 | // Set the named "property"'s value. Returns true if the property |
| 218 | // is known and writable. Returns false if the property is not a |
| 219 | // valid property name for the current malloc implementation, or |
| 220 | // is not writable. |
| 221 | // REQUIRES: property != NULL |
| 222 | virtual bool SetNumericProperty(const char* property, size_t value); |
| 223 | |
| 224 | // Mark the current thread as "idle". This routine may optionally |
| 225 | // be called by threads as a hint to the malloc implementation that |
| 226 | // any thread-specific resources should be released. Note: this may |
| 227 | // be an expensive routine, so it should not be called too often. |
| 228 | // |
| 229 | // Also, if the code that calls this routine will go to sleep for |
| 230 | // a while, it should take care to not allocate anything between |
| 231 | // the call to this routine and the beginning of the sleep. |
| 232 | // |
| 233 | // Most malloc implementations ignore this routine. |
| 234 | virtual void MarkThreadIdle(); |
| 235 | |
| 236 | // Mark the current thread as "busy". This routine should be |
| 237 | // called after MarkThreadIdle() if the thread will now do more |
| 238 | // work. If this method is not called, performance may suffer. |
| 239 | // |
| 240 | // Most malloc implementations ignore this routine. |
| 241 | virtual void MarkThreadBusy(); |
| 242 | |
| 243 | // Gets the system allocator used by the malloc extension instance. Returns |
| 244 | // NULL for malloc implementations that do not support pluggable system |
| 245 | // allocators. |
| 246 | virtual SysAllocator* GetSystemAllocator(); |
| 247 | |
| 248 | // Sets the system allocator to the specified. |
| 249 | // |
| 250 | // Users could register their own system allocators for malloc implementation |
| 251 | // that supports pluggable system allocators, such as TCMalloc, by doing: |
| 252 | // alloc = new MyOwnSysAllocator(); |
| 253 | // MallocExtension::instance()->SetSystemAllocator(alloc); |
| 254 | // It's up to users whether to fall back (recommended) to the default |
| 255 | // system allocator (use GetSystemAllocator() above) or not. The caller is |
| 256 | // responsible to any necessary locking. |
| 257 | // See tcmalloc/system-alloc.h for the interface and |
| 258 | // tcmalloc/memfs_malloc.cc for the examples. |
| 259 | // |
| 260 | // It's a no-op for malloc implementations that do not support pluggable |
| 261 | // system allocators. |
| 262 | virtual void SetSystemAllocator(SysAllocator *a); |
| 263 | |
| 264 | // Try to release num_bytes of free memory back to the operating |
| 265 | // system for reuse. Use this extension with caution -- to get this |
| 266 | // memory back may require faulting pages back in by the OS, and |
| 267 | // that may be slow. (Currently only implemented in tcmalloc.) |
| 268 | virtual void ReleaseToSystem(size_t num_bytes); |
| 269 | |
| 270 | // Same as ReleaseToSystem() but release as much memory as possible. |
| 271 | virtual void ReleaseFreeMemory(); |
| 272 | |
| 273 | // Sets the rate at which we release unused memory to the system. |
| 274 | // Zero means we never release memory back to the system. Increase |
| 275 | // this flag to return memory faster; decrease it to return memory |
| 276 | // slower. Reasonable rates are in the range [0,10]. (Currently |
| 277 | // only implemented in tcmalloc). |
| 278 | virtual void SetMemoryReleaseRate(double rate); |
| 279 | |
| 280 | // Gets the release rate. Returns a value < 0 if unknown. |
| 281 | virtual double GetMemoryReleaseRate(); |
| 282 | |
| 283 | // Returns the estimated number of bytes that will be allocated for |
| 284 | // a request of "size" bytes. This is an estimate: an allocation of |
| 285 | // SIZE bytes may reserve more bytes, but will never reserve less. |
| 286 | // (Currently only implemented in tcmalloc, other implementations |
| 287 | // always return SIZE.) |
| 288 | // This is equivalent to malloc_good_size() in OS X. |
| 289 | virtual size_t GetEstimatedAllocatedSize(size_t size); |
| 290 | |
| 291 | // Returns the actual number N of bytes reserved by tcmalloc for the |
| 292 | // pointer p. The client is allowed to use the range of bytes |
| 293 | // [p, p+N) in any way it wishes (i.e. N is the "usable size" of this |
| 294 | // allocation). This number may be equal to or greater than the number |
| 295 | // of bytes requested when p was allocated. |
| 296 | // p must have been allocated by this malloc implementation, |
| 297 | // must not be an interior pointer -- that is, must be exactly |
| 298 | // the pointer returned to by malloc() et al., not some offset |
| 299 | // from that -- and should not have been freed yet. p may be NULL. |
| 300 | // (Currently only implemented in tcmalloc; other implementations |
| 301 | // will return 0.) |
| 302 | // This is equivalent to malloc_size() in OS X, malloc_usable_size() |
| 303 | // in glibc, and _msize() for windows. |
| 304 | virtual size_t GetAllocatedSize(const void* p); |
| 305 | |
| 306 | // Returns kOwned if this malloc implementation allocated the memory |
| 307 | // pointed to by p, or kNotOwned if some other malloc implementation |
| 308 | // allocated it or p is NULL. May also return kUnknownOwnership if |
| 309 | // the malloc implementation does not keep track of ownership. |
| 310 | // REQUIRES: p must be a value returned from a previous call to |
| 311 | // malloc(), calloc(), realloc(), memalign(), posix_memalign(), |
| 312 | // valloc(), pvalloc(), new, or new[], and must refer to memory that |
| 313 | // is currently allocated (so, for instance, you should not pass in |
| 314 | // a pointer after having called free() on it). |
| 315 | enum Ownership { |
| 316 | // NOTE: Enum values MUST be kept in sync with the version in |
| 317 | // malloc_extension_c.h |
| 318 | kUnknownOwnership = 0, |
| 319 | kOwned, |
| 320 | kNotOwned |
| 321 | }; |
| 322 | virtual Ownership GetOwnership(const void* p); |
| 323 | |
| 324 | // The current malloc implementation. Always non-NULL. |
| 325 | static MallocExtension* instance(); |
| 326 | |
| 327 | // Change the malloc implementation. Typically called by the |
| 328 | // malloc implementation during initialization. |
| 329 | static void Register(MallocExtension* implementation); |
| 330 | |
| 331 | // Returns detailed information about malloc's freelists. For each list, |
| 332 | // return a FreeListInfo: |
| 333 | struct FreeListInfo { |
| 334 | size_t min_object_size; |
| 335 | size_t max_object_size; |
| 336 | size_t total_bytes_free; |
| 337 | const char* type; |
| 338 | }; |
| 339 | // Each item in the vector refers to a different freelist. The lists |
| 340 | // are identified by the range of allocations that objects in the |
| 341 | // list can satisfy ([min_object_size, max_object_size]) and the |
| 342 | // type of freelist (see below). The current size of the list is |
| 343 | // returned in total_bytes_free (which count against a processes |
| 344 | // resident and virtual size). |
| 345 | // |
| 346 | // Currently supported types are: |
| 347 | // |
| 348 | // "tcmalloc.page{_unmapped}" - tcmalloc's page heap. An entry for each size |
| 349 | // class in the page heap is returned. Bytes in "page_unmapped" |
| 350 | // are no longer backed by physical memory and do not count against |
| 351 | // the resident size of a process. |
| 352 | // |
| 353 | // "tcmalloc.large{_unmapped}" - tcmalloc's list of objects larger |
| 354 | // than the largest page heap size class. Only one "large" |
| 355 | // entry is returned. There is no upper-bound on the size |
| 356 | // of objects in the large free list; this call returns |
| 357 | // kint64max for max_object_size. Bytes in |
| 358 | // "large_unmapped" are no longer backed by physical memory |
| 359 | // and do not count against the resident size of a process. |
| 360 | // |
| 361 | // "tcmalloc.central" - tcmalloc's central free-list. One entry per |
| 362 | // size-class is returned. Never unmapped. |
| 363 | // |
| 364 | // "debug.free_queue" - free objects queued by the debug allocator |
| 365 | // and not returned to tcmalloc. |
| 366 | // |
| 367 | // "tcmalloc.thread" - tcmalloc's per-thread caches. Never unmapped. |
| 368 | virtual void GetFreeListSizes(std::vector<FreeListInfo>* v); |
| 369 | |
| 370 | // Get a list of stack traces of sampled allocation points. Returns |
| 371 | // a pointer to a "new[]-ed" result array, and stores the sample |
| 372 | // period in "sample_period". |
| 373 | // |
| 374 | // The state is stored as a sequence of adjacent entries |
| 375 | // in the returned array. Each entry has the following form: |
| 376 | // uintptr_t count; // Number of objects with following trace |
| 377 | // uintptr_t size; // Total size of objects with following trace |
| 378 | // uintptr_t depth; // Number of PC values in stack trace |
| 379 | // void* stack[depth]; // PC values that form the stack trace |
| 380 | // |
| 381 | // The list of entries is terminated by a "count" of 0. |
| 382 | // |
| 383 | // It is the responsibility of the caller to "delete[]" the returned array. |
| 384 | // |
| 385 | // May return NULL to indicate no results. |
| 386 | // |
| 387 | // This is an internal extension. Callers should use the more |
| 388 | // convenient "GetHeapSample(string*)" method defined above. |
| 389 | virtual void** ReadStackTraces(int* sample_period); |
| 390 | |
| 391 | // Like ReadStackTraces(), but returns stack traces that caused growth |
| 392 | // in the address space size. |
| 393 | virtual void** ReadHeapGrowthStackTraces(); |
| 394 | }; |
| 395 | |
| 396 | namespace base { |
| 397 | |
| 398 | // Information passed per range. More fields may be added later. |
| 399 | struct MallocRange { |
| 400 | enum Type { |
| 401 | INUSE, // Application is using this range |
| 402 | FREE, // Range is currently free |
| 403 | UNMAPPED, // Backing physical memory has been returned to the OS |
| 404 | UNKNOWN |
| 405 | // More enum values may be added in the future |
| 406 | }; |
| 407 | |
| 408 | uintptr_t address; // Address of range |
| 409 | size_t length; // Byte length of range |
| 410 | Type type; // Type of this range |
| 411 | double fraction; // Fraction of range that is being used (0 if !INUSE) |
| 412 | |
| 413 | // Perhaps add the following: |
| 414 | // - stack trace if this range was sampled |
| 415 | // - heap growth stack trace if applicable to this range |
| 416 | // - age when allocated (for inuse) or freed (if not in use) |
| 417 | }; |
| 418 | |
| 419 | } // namespace base |
| 420 | |
| 421 | #endif // BASE_MALLOC_EXTENSION_H_ |