third_party/tcmalloc/tcmalloc_linux.cc - Issue 399081: Enable TCMalloc on Linux by default.

Unified Diff: third_party/tcmalloc/tcmalloc_linux.cc

Issue 399081: Enable TCMalloc on Linux by default. (Closed)

Patch Set: Oops, remove unintended change. Created 11 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Index: third_party/tcmalloc/tcmalloc_linux.cc

diff --git a/third_party/tcmalloc/tcmalloc_linux.cc b/third_party/tcmalloc/tcmalloc_linux.cc

new file mode 100644

index 0000000000000000000000000000000000000000..104520eba01c986a5875937cc235beaac955d9d2

--- /dev/null

+++ b/third_party/tcmalloc/tcmalloc_linux.cc

@@ -0,0 +1,1415 @@

+//

+// Redistribution and use in source and binary forms, with or without

+// modification, are permitted provided that the following conditions are

+// met:

+//

+// * Redistributions of source code must retain the above copyright

+// notice, this list of conditions and the following disclaimer.

+// * Redistributions in binary form must reproduce the above

+// copyright notice, this list of conditions and the following disclaimer

+// in the documentation and/or other materials provided with the

+// distribution.

+// * Neither the name of Google Inc. nor the names of its

+// contributors may be used to endorse or promote products derived from

+// this software without specific prior written permission.

+//

+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

+// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

+// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

+// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT

+// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

+// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT

+// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

+// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

+// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

+// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

+// ---

+// Author: Sanjay Ghemawat <opensource@google.com>

+//

+// A malloc that uses a per-thread cache to satisfy small malloc requests.

+// (The time for malloc/free of a small object drops from 300 ns to 50 ns.)

+//

+// See doc/tcmalloc.html for a high-level

+// description of how this malloc works.

+//

+// SYNCHRONIZATION

+// 1. The thread-specific lists are accessed without acquiring any locks.

+// This is safe because each such list is only accessed by one thread.

+// 2. We have a lock per central free-list, and hold it while manipulating

+// the central free list for a particular size.

+// 3. The central page allocator is protected by "pageheap_lock".

+// 4. The pagemap (which maps from page-number to descriptor),

+// can be read without holding any locks, and written while holding

+// the "pageheap_lock".

+// 5. To improve performance, a subset of the information one can get

+// from the pagemap is cached in a data structure, pagemap_cache_,

+// that atomically reads and writes its entries. This cache can be

+// read and written without locking.

+//

+// This multi-threaded access to the pagemap is safe for fairly

+// subtle reasons. We basically assume that when an object X is

+// allocated by thread A and deallocated by thread B, there must

+// have been appropriate synchronization in the handoff of object

+// X from thread A to thread B. The same logic applies to pagemap_cache_.

+//

+// THE PAGEID-TO-SIZECLASS CACHE

+// Hot PageID-to-sizeclass mappings are held by pagemap_cache_. If this cache

+// returns 0 for a particular PageID then that means "no information," not that

+// the sizeclass is 0. The cache may have stale information for pages that do

+// not hold the beginning of any free()'able object. Staleness is eliminated

+// in Populate() for pages with sizeclass > 0 objects, and in do_malloc() and

+// do_memalign() for all other relevant pages.

+//

+// PAGEMAP

+// -------

+// Page map contains a mapping from page id to Span.

+//

+// If Span s occupies pages [p..q],

+// pagemap[p] == s

+// pagemap[q] == s

+// pagemap[p+1..q-1] are undefined

+// pagemap[p-1] and pagemap[q+1] are defined:

+// NULL if the corresponding page is not yet in the address space.

+// Otherwise it points to a Span. This span may be free

+// or allocated. If free, it is in one of pageheap's freelists.

+//

+// TODO: Bias reclamation to larger addresses

+// TODO: implement mallinfo/mallopt

+// TODO: Better testing

+//

+// 9/28/2003 (new page-level allocator replaces ptmalloc2):

+// * malloc/free of small objects goes from ~300 ns to ~50 ns.

+// * allocation of a reasonably complicated struct

+// goes from about 1100 ns to about 300 ns.

+#include <config.h>

+#include <new>

+#include <stdio.h>

+#include <stddef.h>

+#if defined HAVE_STDINT_H

+#include <stdint.h>

+#elif defined HAVE_INTTYPES_H

+#include <inttypes.h>

+#else

+#include <sys/types.h>

+#endif

+#if defined(HAVE_MALLOC_H) && defined(HAVE_STRUCT_MALLINFO)

+#include <malloc.h> // for struct mallinfo

+#endif

+#include <string.h>

+#ifdef HAVE_PTHREAD

+#include <pthread.h>

+#endif

+#ifdef HAVE_UNISTD_H

+#include <unistd.h>

+#endif

+#include <errno.h>

+#include <stdarg.h>

+#include <algorithm>

+#include <google/tcmalloc.h>

+#include "base/commandlineflags.h"

+#include "base/basictypes.h" // gets us PRIu64

+#include "base/sysinfo.h"

+#include "base/spinlock.h"

+#include "common.h"

+#include "malloc_hook-inl.h"

+#include <google/malloc_hook.h>

+#include <google/malloc_extension.h>

+#include "central_freelist.h"

+#include "internal_logging.h"

+#include "linked_list.h"

+#include "maybe_threads.h"

+#include "page_heap.h"

+#include "page_heap_allocator.h"

+#include "pagemap.h"

+#include "span.h"

+#include "static_vars.h"

+#include "system-alloc.h"

+#include "tcmalloc_guard.h"

+#include "thread_cache.h"

+#if (defined(_WIN32) && !defined(__CYGWIN__) && !defined(__CYGWIN32__)) && !defined(WIN32_OVERRIDE_ALLOCATORS)

+# define WIN32_DO_PATCHING 1

+#endif

+using tcmalloc::PageHeap;

+using tcmalloc::PageHeapAllocator;

+using tcmalloc::SizeMap;

+using tcmalloc::Span;

+using tcmalloc::StackTrace;

+using tcmalloc::Static;

+using tcmalloc::ThreadCache;

+// __THROW is defined in glibc systems. It means, counter-intuitively,

+// "This function will never throw an exception." It's an optional

+// optimization tool, but we may need to use it to match glibc prototypes.

+#ifndef __THROW // I guess we're not on a glibc system

+# define __THROW // __THROW is just an optimization, so ok to make it ""

+#endif

+DECLARE_int64(tcmalloc_sample_parameter);

+DECLARE_double(tcmalloc_release_rate);

+// For Windows, the printf we use to report large allocs is

+// potentially dangerous: it could cause a malloc that would cause an

+// infinite loop. So by default we set the threshold to a huge number

+// on Windows, so this bad situation will never trigger. You can

+// always set TCMALLOC_LARGE_ALLOC_REPORT_THRESHOLD manually if you

+// want this functionality.

+#ifdef _WIN32

+const int64 kDefaultLargeAllocReportThreshold = static_cast<int64>(1) << 62;

+#else

+const int64 kDefaultLargeAllocReportThreshold = static_cast<int64>(1) << 30;

+#endif

+DEFINE_int64(tcmalloc_large_alloc_report_threshold,

+ EnvToInt64("TCMALLOC_LARGE_ALLOC_REPORT_THRESHOLD",

+ kDefaultLargeAllocReportThreshold),

+ "Allocations larger than this value cause a stack "

+ "trace to be dumped to stderr. The threshold for "

+ "dumping stack traces is increased by a factor of 1.125 "

+ "every time we print a message so that the threshold "

+ "automatically goes up by a factor of ~1000 every 60 "

+ "messages. This bounds the amount of extra logging "

+ "generated by this flag. Default value of this flag "

+ "is very large and therefore you should see no extra "

+ "logging unless the flag is overridden. Set to 0 to "

+ "disable reporting entirely.");

+// We already declared these functions in tcmalloc.h, but we have to

+// declare them again to give them an ATTRIBUTE_SECTION: we want to

+// put all callers of MallocHook::Invoke* in this module into

+// ATTRIBUTE_SECTION(google_malloc) section, so that

+// MallocHook::GetCallerStackTrace can function accurately.

+#ifndef _WIN32 // windows doesn't have attribute_section, so don't bother

+extern "C" {

+ void* tc_malloc(size_t size) __THROW