// -*- Mode: C++; c-basic-offset: 2; indent-tabs-mode: nil -*-
// Copyright (c) 2008, Google Inc.
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following disclaimer
// in the documentation and/or other materials provided with the
// distribution.
//     * Neither the name of Google Inc. nor the names of its
// contributors may be used to endorse or promote products derived from
// this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

// ---
// Author: Sanjay Ghemawat <opensource@google.com>

#include <stdlib.h>        // for getenv and strtol
#include "config.h"
#include "common.h"
#include "system-alloc.h"
#include "base/spinlock.h"
#include "getenv_safe.h"   // TCMallocGetenvSafe

namespace tcmalloc {

// Defines the maximum number of objects per size class to transfer between
// the thread caches and the central caches.
static int32 FLAGS_tcmalloc_transfer_num_objects;

static const int32 kDefaultTransferNumObjecs = 32;

// This init function explicitly initializes the value from the environment
// variable, avoiding C++ global construction whose execution might be
// deferred until after a malloc/new call.
static inline void InitTCMallocTransferNumObjects()
{
  if (FLAGS_tcmalloc_transfer_num_objects == 0) {
    const char *envval = TCMallocGetenvSafe("TCMALLOC_TRANSFER_NUM_OBJ");
    FLAGS_tcmalloc_transfer_num_objects = !envval ? kDefaultTransferNumObjecs :
      strtol(envval, NULL, 10);
  }
}
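
// For example, running with TCMALLOC_TRANSFER_NUM_OBJ=40 in the environment
// makes NumMoveSize() below cap transfers at 40 objects per batch instead of
// the default 32 (kDefaultTransferNumObjecs).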

// Note: the following only works for "n"s that fit in 32-bits, but
// that is fine since we only use it for small sizes.
static inline int LgFloor(size_t n) {
  int log = 0;
  for (int i = 4; i >= 0; --i) {
    int shift = (1 << i);
    size_t x = n >> shift;
    if (x != 0) {
      n = x;
      log += shift;
    }
  }
  ASSERT(n == 1);
  return log;
}
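
// Worked example: LgFloor(1536) returns 10 (i.e. floor(log2(1536))).
//   i == 3 (shift 8): 1536 >> 8 == 6, so n becomes 6 and log becomes 8.
//   i == 1 (shift 2): 6 >> 2 == 1, so n becomes 1 and log becomes 10.
// The remaining iterations shift down to zero and leave n == 1.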

int AlignmentForSize(size_t size) {
  int alignment = kAlignment;
  if (size > kMaxSize) {
    // Cap alignment at kPageSize for large sizes.
    alignment = kPageSize;
  } else if (size >= 128) {
    // Space wasted due to alignment is at most 1/8, i.e., 12.5%.
    alignment = (1 << LgFloor(size)) / 8;
  } else if (size >= kMinAlign) {
    // We need an alignment of at least 16 bytes to satisfy
    // requirements for some SSE types.
    alignment = kMinAlign;
  }
  // Maximum alignment allowed is page size alignment.
  if (alignment > kPageSize) {
    alignment = kPageSize;
  }
  CHECK_CONDITION(size < kMinAlign || alignment >= kMinAlign);
  CHECK_CONDITION((alignment & (alignment - 1)) == 0);
  return alignment;
}
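
// For illustration, assuming the default constants from common.h
// (kAlignment == 8, kMinAlign == 16, kMaxSize == 256 * 1024):
//   AlignmentForSize(8)            -> 8          (below kMinAlign, keeps kAlignment)
//   AlignmentForSize(40)           -> 16         (>= kMinAlign but < 128)
//   AlignmentForSize(300)          -> 32         ((1 << LgFloor(300)) / 8 == 256 / 8)
//   AlignmentForSize(kMaxSize + 1) -> kPageSize  (large sizes use page alignment)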

int SizeMap::NumMoveSize(size_t size) {
  if (size == 0) return 0;
  // Use approx 64k transfers between thread and central caches.
  int num = static_cast<int>(64.0 * 1024.0 / size);
  if (num < 2) num = 2;

  // Avoid bringing too many objects into small object free lists.
  // If this value is too large:
  // - We waste memory with extra objects sitting in the thread caches.
  // - The central freelist holds its lock for too long while
  //   building a linked list of objects, slowing down the allocations
  //   of other threads.
  // If this value is too small:
  // - We go to the central freelist too often and we have to acquire
  //   its lock each time.
  // This value strikes a balance between the constraints above.
  if (num > FLAGS_tcmalloc_transfer_num_objects)
    num = FLAGS_tcmalloc_transfer_num_objects;

  return num;
}
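
// For illustration, with the default cap of 32
// (FLAGS_tcmalloc_transfer_num_objects == kDefaultTransferNumObjecs):
//   NumMoveSize(256)   -> 32  (64*1024/256 == 256, clamped to the cap)
//   NumMoveSize(4096)  -> 16  (64*1024/4096 == 16, within the cap)
//   NumMoveSize(65536) -> 2   (64*1024/65536 == 1, raised to the minimum of 2)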

// Initialize the mapping arrays
void SizeMap::Init() {
  InitTCMallocTransferNumObjects();

  // Do some sanity checking on add_amount[]/shift_amount[]/class_array[]
  if (ClassIndex(0) != 0) {
    Log(kCrash, __FILE__, __LINE__,
        "Invalid class index for size 0", ClassIndex(0));
  }
  if (ClassIndex(kMaxSize) >= sizeof(class_array_)) {
    Log(kCrash, __FILE__, __LINE__,
        "Invalid class index for kMaxSize", ClassIndex(kMaxSize));
  }

  // Compute the size classes we want to use
  int sc = 1;   // Next size class to assign
  int alignment = kAlignment;
  CHECK_CONDITION(kAlignment <= kMinAlign);
  for (size_t size = kAlignment; size <= kMaxSize; size += alignment) {
    alignment = AlignmentForSize(size);
    CHECK_CONDITION((size % alignment) == 0);

    int blocks_to_move = NumMoveSize(size) / 4;
    size_t psize = 0;
    do {
      psize += kPageSize;
      // Allocate enough pages so leftover is less than 1/8 of total.
      // This bounds wasted space to at most 12.5%.
      while ((psize % size) > (psize >> 3)) {
        psize += kPageSize;
      }
      // Continue to add pages until there are at least as many objects in
      // the span as are needed when moving objects from the central
      // freelists and spans to the thread caches.
    } while ((psize / size) < (blocks_to_move));
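
    // For illustration, assuming the default 8 KiB pages (kPageShift == 13):
    // for size == 4096, blocks_to_move == NumMoveSize(4096) / 4 == 4, so the
    // loop grows psize from 8192 (only 2 objects) to 16384, which holds
    // exactly 4 objects with no leftover; my_pages below becomes 2.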
    const size_t my_pages = psize >> kPageShift;

    if (sc > 1 && my_pages == class_to_pages_[sc-1]) {
      // See if we can merge this into the previous class without
      // increasing the fragmentation of the previous class.
      const size_t my_objects = (my_pages << kPageShift) / size;
      const size_t prev_objects = (class_to_pages_[sc-1] << kPageShift)
                                  / class_to_size_[sc-1];
      if (my_objects == prev_objects) {
        // Adjust last class to include this size
        class_to_size_[sc-1] = size;
        continue;
      }
    }

    // Add new class
    class_to_pages_[sc] = my_pages;
    class_to_size_[sc] = size;
    sc++;
  }
  num_size_classes = sc;
  if (sc > kClassSizesMax) {
    Log(kCrash, __FILE__, __LINE__,
        "too many size classes: (found vs. max)", sc, kClassSizesMax);
  }

  // Initialize the mapping arrays
  int next_size = 0;
  for (int c = 1; c < num_size_classes; c++) {
    const int max_size_in_class = class_to_size_[c];
    for (int s = next_size; s <= max_size_in_class; s += kAlignment) {
      class_array_[ClassIndex(s)] = c;
    }
    next_size = max_size_in_class + kAlignment;
  }
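
  // For illustration (with hypothetical class sizes): if class_to_size_[3] == 32
  // and class_to_size_[4] == 48, the loop above stores 4 into class_array_ at
  // ClassIndex(40) and ClassIndex(48), so SizeClass(s) returns the smallest
  // class whose size is >= s for every kAlignment-granular s up to kMaxSize.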

  // Double-check sizes just to be safe
  for (size_t size = 0; size <= kMaxSize;) {
    const int sc = SizeClass(size);
    if (sc <= 0 || sc >= num_size_classes) {
      Log(kCrash, __FILE__, __LINE__,
          "Bad size class (class, size)", sc, size);
    }
    if (sc > 1 && size <= class_to_size_[sc-1]) {
      Log(kCrash, __FILE__, __LINE__,
          "Allocating unnecessarily large class (class, size)", sc, size);
    }
    const size_t s = class_to_size_[sc];
    if (size > s || s == 0) {
      Log(kCrash, __FILE__, __LINE__,
          "Bad (class, size, requested)", sc, s, size);
    }
    if (size <= kMaxSmallSize) {
      size += 8;
    } else {
      size += 128;
    }
  }

  // Our fast-path aligned allocation functions rely on 'naturally
  // aligned' sizes to produce aligned addresses. Let's check that this
  // holds for the size classes we produced.
  //
  // I.e. we're checking that
  //
  //     align = (1 << shift), malloc(i * align) % align == 0,
  //
  // for all align values up to kPageSize.
  for (size_t align = kMinAlign; align <= kPageSize; align <<= 1) {
    for (size_t size = align; size < kPageSize; size += align) {
      CHECK_CONDITION(class_to_size_[SizeClass(size)] % align == 0);
    }
  }
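
  // For instance, with align == 64 the loop verifies that requests of
  // 64, 128, 192, ... bytes each land in a size class whose size is itself a
  // multiple of 64, which is what lets the fast-path aligned allocation
  // functions mentioned above return suitably aligned addresses.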

  // Initialize the num_objects_to_move array.
  for (size_t cl = 1; cl < num_size_classes; ++cl) {
    num_objects_to_move_[cl] = NumMoveSize(ByteSizeForClass(cl));
  }
}
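
// A minimal sketch of how the tables built by Init() are consumed elsewhere
// in TCMalloc (the call sites live in other files; only accessors already
// used above are shown):
//   const int cl = SizeClass(requested_size);        // size -> class index
//   const size_t alloc_size = ByteSizeForClass(cl);  // class -> rounded size
//   const int batch = num_objects_to_move_[cl];      // central-cache batch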

// Metadata allocator -- keeps stats about how many bytes are allocated.
static uint64_t metadata_system_bytes_ = 0;
static const size_t kMetadataAllocChunkSize = 8*1024*1024;
// As ThreadCache objects are allocated with MetaDataAlloc, and are also
// CACHELINE_ALIGNED, we must use the same alignment as TCMalloc_SystemAlloc.
static const size_t kMetadataAllignment = sizeof(MemoryAligner);

static char *metadata_chunk_alloc_;
static size_t metadata_chunk_avail_;

static SpinLock metadata_alloc_lock(SpinLock::LINKER_INITIALIZED);

void* MetaDataAlloc(size_t bytes) {
  if (bytes >= kMetadataAllocChunkSize) {
    void *rv = TCMalloc_SystemAlloc(bytes,
                                    NULL, kMetadataAllignment);
    if (rv != NULL) {
      metadata_system_bytes_ += bytes;
    }
    return rv;
  }

  SpinLockHolder h(&metadata_alloc_lock);

  // The following computes the padding needed to round metadata_chunk_alloc_
  // up to a multiple of kMetadataAllignment: negate the address and keep only
  // its low log2(kMetadataAllignment) bits, so that (address + alignment) == 0
  // modulo kMetadataAllignment. Note that we negate before masking the higher
  // bits off; otherwise we would have to mask them off again after negating.
  intptr_t alignment = -reinterpret_cast<intptr_t>(metadata_chunk_alloc_) & (kMetadataAllignment-1);
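
  // Worked example: if metadata_chunk_alloc_ ends in ...5 and
  // kMetadataAllignment is 8, then the negated address has low bits 011,
  // masking with (8 - 1) yields alignment == 3, and ...5 + 3 is a multiple
  // of 8.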

  if (metadata_chunk_avail_ < bytes + alignment) {
    size_t real_size;
    void *ptr = TCMalloc_SystemAlloc(kMetadataAllocChunkSize,
                                     &real_size, kMetadataAllignment);
    if (ptr == NULL) {
      return NULL;
    }

    metadata_chunk_alloc_ = static_cast<char *>(ptr);
    metadata_chunk_avail_ = real_size;

    alignment = 0;
  }

  void *rv = static_cast<void *>(metadata_chunk_alloc_ + alignment);
  bytes += alignment;
  metadata_chunk_alloc_ += bytes;
  metadata_chunk_avail_ -= bytes;
  metadata_system_bytes_ += bytes;
  return rv;
}

uint64_t metadata_system_bytes() { return metadata_system_bytes_; }

}  // namespace tcmalloc