1// Copyright (c) 2012, Google Inc.
2// All rights reserved.
3//
4// Redistribution and use in source and binary forms, with or without
5// modification, are permitted provided that the following conditions are
6// met:
7//
8//     * Redistributions of source code must retain the above copyright
9// notice, this list of conditions and the following disclaimer.
10//     * Redistributions in binary form must reproduce the above
11// copyright notice, this list of conditions and the following disclaimer
12// in the documentation and/or other materials provided with the
13// distribution.
14//     * Neither the name of Google Inc. nor the names of its
15// contributors may be used to endorse or promote products derived from
16// this software without specific prior written permission.
17//
18// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29
30// ---
31// Author: Sanjay Ghemawat <opensource@google.com>
32//
33// Extra extensions exported by some malloc implementations.  These
34// extensions are accessed through a virtual base class so an
35// application can link against a malloc that does not implement these
36// extensions, and it will get default versions that do nothing.
37//
38// NOTE FOR C USERS: If you wish to use this functionality from within
39// a C program, see malloc_extension_c.h.
40
41#ifndef BASE_MALLOC_EXTENSION_H_
42#define BASE_MALLOC_EXTENSION_H_
43
44#include <stddef.h>
45// I can't #include config.h in this public API file, but I should
46// really use configure (and make malloc_extension.h a .in file) to
47// figure out if the system has stdint.h or not.  But I'm lazy, so
48// for now I'm assuming it's a problem only with MSVC.
49#ifndef _MSC_VER
50#include <stdint.h>
51#endif
52#include <string>
53#include <vector>
54
55// Annoying stuff for windows -- makes sure clients can import these functions
56#ifndef PERFTOOLS_DLL_DECL
57# ifdef _WIN32
58#   define PERFTOOLS_DLL_DECL  __declspec(dllimport)
59# else
60#   define PERFTOOLS_DLL_DECL
61# endif
62#endif
63
64static const int kMallocHistogramSize = 64;
65
66// One day, we could support other types of writers (perhaps for C?)
67typedef std::string MallocExtensionWriter;
68
69namespace base {
70struct MallocRange;
71}
72
73// Interface to a pluggable system allocator.
74class SysAllocator {
75 public:
76  SysAllocator() {
77  }
78  virtual ~SysAllocator();
79
80  // Allocates "size"-byte of memory from system aligned with "alignment".
81  // Returns NULL if failed. Otherwise, the returned pointer p up to and
82  // including (p + actual_size -1) have been allocated.
83  virtual void* Alloc(size_t size, size_t *actual_size, size_t alignment) = 0;
84};
85
86// The default implementations of the following routines do nothing.
87// All implementations should be thread-safe; the current one
88// (TCMallocImplementation) is.
89class PERFTOOLS_DLL_DECL MallocExtension {
90 public:
91  virtual ~MallocExtension();
92
93  // Call this very early in the program execution -- say, in a global
94  // constructor -- to set up parameters and state needed by all
95  // instrumented malloc implemenatations.  One example: this routine
96  // sets environemnt variables to tell STL to use libc's malloc()
97  // instead of doing its own memory management.  This is safe to call
98  // multiple times, as long as each time is before threads start up.
99  static void Initialize();
100
101  // See "verify_memory.h" to see what these routines do
102  virtual bool VerifyAllMemory();
103  virtual bool VerifyNewMemory(const void* p);
104  virtual bool VerifyArrayNewMemory(const void* p);
105  virtual bool VerifyMallocMemory(const void* p);
106  virtual bool MallocMemoryStats(int* blocks, size_t* total,
107                                 int histogram[kMallocHistogramSize]);
108
109  // Get a human readable description of the current state of the malloc
110  // data structures.  The state is stored as a null-terminated string
111  // in a prefix of "buffer[0,buffer_length-1]".
112  // REQUIRES: buffer_length > 0.
113  virtual void GetStats(char* buffer, int buffer_length);
114
115  // Outputs to "writer" a sample of live objects and the stack traces
116  // that allocated these objects.  The format of the returned output
117  // is equivalent to the output of the heap profiler and can
118  // therefore be passed to "pprof". This function is equivalent to
119  // ReadStackTraces. The main difference is that this function returns
120  // serialized data appropriately formatted for use by the pprof tool.
121  // NOTE: by default, tcmalloc does not do any heap sampling, and this
122  //       function will always return an empty sample.  To get useful
123  //       data from GetHeapSample, you must also set the environment
124  //       variable TCMALLOC_SAMPLE_PARAMETER to a value such as 524288.
125  virtual void GetHeapSample(MallocExtensionWriter* writer);
126
127  // Outputs to "writer" the stack traces that caused growth in the
128  // address space size.  The format of the returned output is
129  // equivalent to the output of the heap profiler and can therefore
130  // be passed to "pprof". This function is equivalent to
131  // ReadHeapGrowthStackTraces. The main difference is that this function
132  // returns serialized data appropriately formatted for use by the
133  // pprof tool.  (This does not depend on, or require,
134  // TCMALLOC_SAMPLE_PARAMETER.)
135  virtual void GetHeapGrowthStacks(MallocExtensionWriter* writer);
136
137  // Invokes func(arg, range) for every controlled memory
138  // range.  *range is filled in with information about the range.
139  //
140  // This is a best-effort interface useful only for performance
141  // analysis.  The implementation may not call func at all.
142  typedef void (RangeFunction)(void*, const base::MallocRange*);
143  virtual void Ranges(void* arg, RangeFunction func);
144
145  // -------------------------------------------------------------------
146  // Control operations for getting and setting malloc implementation
147  // specific parameters.  Some currently useful properties:
148  //
149  // generic
150  // -------
151  // "generic.current_allocated_bytes"
152  //      Number of bytes currently allocated by application
153  //      This property is not writable.
154  //
155  // "generic.heap_size"
156  //      Number of bytes in the heap ==
157  //            current_allocated_bytes +
158  //            fragmentation +
159  //            freed memory regions
160  //      This property is not writable.
161  //
162  // tcmalloc
163  // --------
164  // "tcmalloc.max_total_thread_cache_bytes"
165  //      Upper limit on total number of bytes stored across all
166  //      per-thread caches.  Default: 16MB.
167  //
168  // "tcmalloc.current_total_thread_cache_bytes"
169  //      Number of bytes used across all thread caches.
170  //      This property is not writable.
171  //
172  // "tcmalloc.pageheap_free_bytes"
173  //      Number of bytes in free, mapped pages in page heap.  These
174  //      bytes can be used to fulfill allocation requests.  They
175  //      always count towards virtual memory usage, and unless the
176  //      underlying memory is swapped out by the OS, they also count
177  //      towards physical memory usage.  This property is not writable.
178  //
179  // "tcmalloc.pageheap_unmapped_bytes"
180  //        Number of bytes in free, unmapped pages in page heap.
181  //        These are bytes that have been released back to the OS,
182  //        possibly by one of the MallocExtension "Release" calls.
183  //        They can be used to fulfill allocation requests, but
184  //        typically incur a page fault.  They always count towards
185  //        virtual memory usage, and depending on the OS, typically
186  //        do not count towards physical memory usage.  This property
187  //        is not writable.
188  // -------------------------------------------------------------------
189
190  // Get the named "property"'s value.  Returns true if the property
191  // is known.  Returns false if the property is not a valid property
192  // name for the current malloc implementation.
193  // REQUIRES: property != NULL; value != NULL
194  virtual bool GetNumericProperty(const char* property, size_t* value);
195
196  // Set the named "property"'s value.  Returns true if the property
197  // is known and writable.  Returns false if the property is not a
198  // valid property name for the current malloc implementation, or
199  // is not writable.
200  // REQUIRES: property != NULL
201  virtual bool SetNumericProperty(const char* property, size_t value);
202
203  // Mark the current thread as "idle".  This routine may optionally
204  // be called by threads as a hint to the malloc implementation that
205  // any thread-specific resources should be released.  Note: this may
206  // be an expensive routine, so it should not be called too often.
207  //
208  // Also, if the code that calls this routine will go to sleep for
209  // a while, it should take care to not allocate anything between
210  // the call to this routine and the beginning of the sleep.
211  //
212  // Most malloc implementations ignore this routine.
213  virtual void MarkThreadIdle();
214
215  // Mark the current thread as "busy".  This routine should be
216  // called after MarkThreadIdle() if the thread will now do more
217  // work.  If this method is not called, performance may suffer.
218  //
219  // Most malloc implementations ignore this routine.
220  virtual void MarkThreadBusy();
221
222  // Gets the system allocator used by the malloc extension instance. Returns
223  // NULL for malloc implementations that do not support pluggable system
224  // allocators.
225  virtual SysAllocator* GetSystemAllocator();
226
227  // Sets the system allocator to the specified.
228  //
229  // Users could register their own system allocators for malloc implementation
230  // that supports pluggable system allocators, such as TCMalloc, by doing:
231  //   alloc = new MyOwnSysAllocator();
232  //   MallocExtension::instance()->SetSystemAllocator(alloc);
233  // It's up to users whether to fall back (recommended) to the default
234  // system allocator (use GetSystemAllocator() above) or not. The caller is
235  // responsible to any necessary locking.
236  // See tcmalloc/system-alloc.h for the interface and
237  //     tcmalloc/memfs_malloc.cc for the examples.
238  //
239  // It's a no-op for malloc implementations that do not support pluggable
240  // system allocators.
241  virtual void SetSystemAllocator(SysAllocator *a);
242
243  // Try to release num_bytes of free memory back to the operating
244  // system for reuse.  Use this extension with caution -- to get this
245  // memory back may require faulting pages back in by the OS, and
246  // that may be slow.  (Currently only implemented in tcmalloc.)
247  virtual void ReleaseToSystem(size_t num_bytes);
248
249  // Same as ReleaseToSystem() but release as much memory as possible.
250  virtual void ReleaseFreeMemory();
251
252  // Sets the rate at which we release unused memory to the system.
253  // Zero means we never release memory back to the system.  Increase
254  // this flag to return memory faster; decrease it to return memory
255  // slower.  Reasonable rates are in the range [0,10].  (Currently
256  // only implemented in tcmalloc).
257  virtual void SetMemoryReleaseRate(double rate);
258
259  // Gets the release rate.  Returns a value < 0 if unknown.
260  virtual double GetMemoryReleaseRate();
261
262  // Returns the estimated number of bytes that will be allocated for
263  // a request of "size" bytes.  This is an estimate: an allocation of
264  // SIZE bytes may reserve more bytes, but will never reserve less.
265  // (Currently only implemented in tcmalloc, other implementations
266  // always return SIZE.)
267  // This is equivalent to malloc_good_size() in OS X.
268  virtual size_t GetEstimatedAllocatedSize(size_t size);
269
270  // Returns the actual number N of bytes reserved by tcmalloc for the
271  // pointer p.  The client is allowed to use the range of bytes
272  // [p, p+N) in any way it wishes (i.e. N is the "usable size" of this
273  // allocation).  This number may be equal to or greater than the number
274  // of bytes requested when p was allocated.
275  // p must have been allocated by this malloc implementation,
276  // must not be an interior pointer -- that is, must be exactly
277  // the pointer returned to by malloc() et al., not some offset
278  // from that -- and should not have been freed yet.  p may be NULL.
279  // (Currently only implemented in tcmalloc; other implementations
280  // will return 0.)
281  // This is equivalent to malloc_size() in OS X, malloc_usable_size()
282  // in glibc, and _msize() for windows.
283  virtual size_t GetAllocatedSize(const void* p);
284
285  // Returns kOwned if this malloc implementation allocated the memory
286  // pointed to by p, or kNotOwned if some other malloc implementation
287  // allocated it or p is NULL.  May also return kUnknownOwnership if
288  // the malloc implementation does not keep track of ownership.
289  // REQUIRES: p must be a value returned from a previous call to
290  // malloc(), calloc(), realloc(), memalign(), posix_memalign(),
291  // valloc(), pvalloc(), new, or new[], and must refer to memory that
292  // is currently allocated (so, for instance, you should not pass in
293  // a pointer after having called free() on it).
294  enum Ownership {
295    // NOTE: Enum values MUST be kept in sync with the version in
296    // malloc_extension_c.h
297    kUnknownOwnership = 0,
298    kOwned,
299    kNotOwned
300  };
301  virtual Ownership GetOwnership(const void* p);
302
303  // The current malloc implementation.  Always non-NULL.
304  static MallocExtension* instance();
305
306  // Change the malloc implementation.  Typically called by the
307  // malloc implementation during initialization.
308  static void Register(MallocExtension* implementation);
309
310  // On the current thread, return the total number of bytes allocated.
311  // This function is added in Chromium for profiling.
312  // Currently only implemented in tcmalloc. Returns 0 if tcmalloc is not used.
313  // Note that malloc_extension can be used without tcmalloc if gperftools'
314  // heap-profiler is enabled without the tcmalloc memory allocator.
315  static unsigned int GetBytesAllocatedOnCurrentThread();
316
317  // Returns detailed information about malloc's freelists. For each list,
318  // return a FreeListInfo:
319  struct FreeListInfo {
320    size_t min_object_size;
321    size_t max_object_size;
322    size_t total_bytes_free;
323    const char* type;
324  };
325  // Each item in the vector refers to a different freelist. The lists
326  // are identified by the range of allocations that objects in the
327  // list can satisfy ([min_object_size, max_object_size]) and the
328  // type of freelist (see below). The current size of the list is
329  // returned in total_bytes_free (which count against a processes
330  // resident and virtual size).
331  //
332  // Currently supported types are:
333  //
334  // "tcmalloc.page{_unmapped}" - tcmalloc's page heap. An entry for each size
335  //          class in the page heap is returned. Bytes in "page_unmapped"
336  //          are no longer backed by physical memory and do not count against
337  //          the resident size of a process.
338  //
339  // "tcmalloc.large{_unmapped}" - tcmalloc's list of objects larger
340  //          than the largest page heap size class. Only one "large"
341  //          entry is returned. There is no upper-bound on the size
342  //          of objects in the large free list; this call returns
343  //          kint64max for max_object_size.  Bytes in
344  //          "large_unmapped" are no longer backed by physical memory
345  //          and do not count against the resident size of a process.
346  //
347  // "tcmalloc.central" - tcmalloc's central free-list. One entry per
348  //          size-class is returned. Never unmapped.
349  //
350  // "debug.free_queue" - free objects queued by the debug allocator
351  //                      and not returned to tcmalloc.
352  //
353  // "tcmalloc.thread" - tcmalloc's per-thread caches. Never unmapped.
354  virtual void GetFreeListSizes(std::vector<FreeListInfo>* v);
355
356  // Get a list of stack traces of sampled allocation points.  Returns
357  // a pointer to a "new[]-ed" result array, and stores the sample
358  // period in "sample_period".
359  //
360  // The state is stored as a sequence of adjacent entries
361  // in the returned array.  Each entry has the following form:
362  //    uintptr_t count;        // Number of objects with following trace
363  //    uintptr_t size;         // Total size of objects with following trace
364  //    uintptr_t depth;        // Number of PC values in stack trace
365  //    void*     stack[depth]; // PC values that form the stack trace
366  //
367  // The list of entries is terminated by a "count" of 0.
368  //
369  // It is the responsibility of the caller to "delete[]" the returned array.
370  //
371  // May return NULL to indicate no results.
372  //
373  // This is an internal extension.  Callers should use the more
374  // convenient "GetHeapSample(string*)" method defined above.
375  virtual void** ReadStackTraces(int* sample_period);
376
377  // Like ReadStackTraces(), but returns stack traces that caused growth
378  // in the address space size.
379  virtual void** ReadHeapGrowthStackTraces();
380};
381
382namespace base {
383
384// Information passed per range.  More fields may be added later.
385struct MallocRange {
386  enum Type {
387    INUSE,                // Application is using this range
388    FREE,                 // Range is currently free
389    UNMAPPED,             // Backing physical memory has been returned to the OS
390    UNKNOWN,
391    // More enum values may be added in the future
392  };
393
394  uintptr_t address;    // Address of range
395  size_t length;        // Byte length of range
396  Type type;            // Type of this range
397  double fraction;      // Fraction of range that is being used (0 if !INUSE)
398
399  // Perhaps add the following:
400  // - stack trace if this range was sampled
401  // - heap growth stack trace if applicable to this range
402  // - age when allocated (for inuse) or freed (if not in use)
403};
404
405} // namespace base
406
407#endif  // BASE_MALLOC_EXTENSION_H_
408