
/*--------------------------------------------------------------------*/
/*--- The leak checker.                             mc_leakcheck.c ---*/
/*--------------------------------------------------------------------*/

/*
   This file is part of MemCheck, a heavyweight Valgrind tool for
   detecting memory errors.

   Copyright (C) 2000-2011 Julian Seward
      jseward@acm.org

   This program is free software; you can redistribute it and/or
   modify it under the terms of the GNU General Public License as
   published by the Free Software Foundation; either version 2 of the
   License, or (at your option) any later version.

   This program is distributed in the hope that it will be useful, but
   WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software
   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
   02111-1307, USA.

   The GNU General Public License is contained in the file COPYING.
*/

#include "pub_tool_basics.h"
#include "pub_tool_vki.h"
#include "pub_tool_aspacehl.h"
#include "pub_tool_aspacemgr.h"
#include "pub_tool_execontext.h"
#include "pub_tool_hashtable.h"
#include "pub_tool_libcbase.h"
#include "pub_tool_libcassert.h"
#include "pub_tool_libcprint.h"
#include "pub_tool_libcsignal.h"
#include "pub_tool_machine.h"
#include "pub_tool_mallocfree.h"
#include "pub_tool_options.h"
#include "pub_tool_oset.h"
#include "pub_tool_signals.h"
#include "pub_tool_libcsetjmp.h"    // setjmp facilities
#include "pub_tool_tooliface.h"     // Needed for mc_include.h

#include "mc_include.h"

/*------------------------------------------------------------*/
/*--- An overview of leak checking.                        ---*/
/*------------------------------------------------------------*/

// Leak-checking is a directed-graph traversal problem.  The graph has
// two kinds of nodes:
// - root-set nodes:
//   - GP registers of all threads;
//   - valid, aligned, pointer-sized data words in valid client memory,
//     including stacks, but excluding words within client heap-allocated
//     blocks (they are excluded so that later on we can differentiate
//     between heap blocks that are indirectly leaked vs. directly leaked).
// - heap-allocated blocks.  A block is a mempool chunk or a malloc chunk
//   that doesn't contain a mempool chunk.  Nb: the terms "blocks" and
//   "chunks" are used interchangeably below.
//
// There are two kinds of edges:
// - start-pointers, i.e. pointers to the start of a block;
// - interior-pointers, i.e. pointers to the interior of a block.
//
// We use "pointers" rather than "edges" below.
//
// Root set nodes only point to blocks.  Blocks only point to blocks;
// a block can point to itself.
//
// The aim is to traverse the graph and determine the status of each block.
//
// There are 9 distinct cases.  See memcheck/docs/mc-manual.xml for details.
// Presenting all nine categories to the user is probably too much.
// Currently we do this:
// - definitely lost:  case 3
// - indirectly lost:  case 4, 9
// - possibly lost:    cases 5..8
// - still reachable:  cases 1, 2
//
// It's far from clear that this is the best possible categorisation;  it's
// accreted over time without any central guiding principle.

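// For a concrete feel for the two "lost" categories above, here is a
// minimal (hypothetical) client program that produces one "definitely
// lost" and one "indirectly lost" block: BBB is directly lost because no
// root-set word points to it any more, and AAA is reachable only via BBB,
// so it is dragged down with it.
//
//    #include <stdlib.h>
//
//    typedef struct Node { struct Node* next; } Node;
//
//    int main(void)
//    {
//       Node* bbb = malloc(sizeof(Node));    // BBB
//       bbb->next = malloc(sizeof(Node));    // AAA: only pointer is in BBB
//       bbb = NULL;   // last pointer to BBB gone: BBB is definitely lost,
//                     // AAA is indirectly lost
//       return 0;
//    }
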
/*------------------------------------------------------------*/
/*--- XXX: Thoughts for improvement.                       ---*/
/*------------------------------------------------------------*/

// From the user's point of view:
// - If they aren't using interior-pointers, they just have to fix the
//   directly lost blocks, and the indirectly lost ones will be fixed as
//   part of that.  Any possibly lost blocks will just be due to random
//   pointer garbage and can be ignored.
//
// - If they are using interior-pointers, the fact that they currently are not
//   being told which ones might be directly lost vs. indirectly lost makes
//   it hard to know where to begin.
//
// All this makes me wonder if a new option is warranted:
// --follow-interior-pointers.  By default it would be off; the leak checker
// wouldn't follow interior-pointers, and there would be only 3 categories:
// R, DL, IL.
//
// If turned on, then it would show 7 categories (R, DL, IL, DR/DL, IR/IL,
// IR/IL/DL, IL/DL).  That output is harder to understand but it's your own
// damn fault for using interior-pointers...
//
// ----
//
// Also, why are two blank lines printed between each loss record?
// [bug 197930]
//
// ----
//
// Also, --show-reachable is a bad name because it also turns on the showing
// of indirectly leaked blocks(!)  It would be better named --show-all or
// --show-all-heap-blocks, because that's the end result.
//
// ----
//
// Also, the VALGRIND_LEAK_CHECK and VALGRIND_QUICK_LEAK_CHECK aren't great
// names.  VALGRIND_FULL_LEAK_CHECK and VALGRIND_SUMMARY_LEAK_CHECK would be
// better.
//
// ----
//
// Also, VALGRIND_COUNT_LEAKS and VALGRIND_COUNT_LEAK_BLOCKS aren't great as
// they combine direct leaks and indirect leaks into one.  New, more precise
// ones (they'll need new names) would be good.  If more categories are
// used, as per the --follow-interior-pointers option, they should be
// updated accordingly.  And they should use a struct to return the values.
//
// ----
//
// Also, for this case:
//
//  (4)  p4      BBB ---> AAA
//
// BBB is definitely directly lost.  AAA is definitely indirectly lost.
// Here are the relevant loss records printed for a full check (each block is
// 16 bytes):
//
// ==20397== 16 bytes in 1 blocks are indirectly lost in loss record 9 of 15
// ==20397==    at 0x4C2694E: malloc (vg_replace_malloc.c:177)
// ==20397==    by 0x400521: mk (leak-cases.c:49)
// ==20397==    by 0x400578: main (leak-cases.c:72)
//
// ==20397== 32 (16 direct, 16 indirect) bytes in 1 blocks are definitely
// lost in loss record 14 of 15
// ==20397==    at 0x4C2694E: malloc (vg_replace_malloc.c:177)
// ==20397==    by 0x400521: mk (leak-cases.c:49)
// ==20397==    by 0x400580: main (leak-cases.c:72)
//
// The first one is fine -- it describes AAA.
//
// The second one is for BBB.  It's correct in that 16 bytes in 1 block are
// directly lost. It's also correct that 16 are indirectly lost as a result,
// but it means that AAA is being counted twice in the loss records.  (It's
// not, thankfully, counted twice in the summary counts).  Argh.
//
// This would be less confusing for the second one:
//
// ==20397== 16 bytes in 1 blocks are definitely lost in loss record 14
// of 15 (and 16 bytes in 1 block are indirectly lost as a result;  they
// are mentioned elsewhere (if --show-reachable=yes is given!))
// ==20397==    at 0x4C2694E: malloc (vg_replace_malloc.c:177)
// ==20397==    by 0x400521: mk (leak-cases.c:49)
// ==20397==    by 0x400580: main (leak-cases.c:72)
//
// But ideally we'd present the loss record for the directly lost block and
// then the resultant indirectly lost blocks and make the dependence clear.
// Double argh.

/*------------------------------------------------------------*/
/*--- The actual algorithm.                                ---*/
/*------------------------------------------------------------*/

// - Find all the blocks (a.k.a. chunks) to check.  Mempool chunks require
//   some special treatment because they can be within malloc'd blocks.
// - Scan every word in the root set (GP registers and valid
//   non-heap memory words).
//   - First, we skip it if it doesn't point to valid memory.
//   - Then, we see if it points to the start or interior of a block.  If
//     so, we push the block onto the mark stack and mark it as having been
//     reached.
// - Then, we process the mark stack, repeating the scanning for each block;
//   this can push more blocks onto the mark stack.  We repeat until the
//   mark stack is empty.  Each block is marked as definitely or possibly
//   reachable, depending on whether interior-pointers were required to
//   reach it.
// - At this point we know for every block if it's reachable or not.
// - We then push each unreached block onto the mark stack, using the block
//   number as the "clique" number.
// - We process the mark stack again, this time grouping blocks into cliques
//   in order to facilitate the directly/indirectly lost categorisation.
// - We group blocks by their ExeContexts and categorisation, and print them
//   if --leak-check=full.  We also print summary numbers.
//   (An outline sketch of these phases appears just after this comment.)
//
// A note on "cliques":
// - A directly lost block is one with no pointers to it.  An indirectly
//   lost block is one that is pointed to by a directly or indirectly lost
//   block.
// - Each directly lost block has zero or more indirectly lost blocks
//   hanging off it.  All these blocks together form a "clique".  The
//   directly lost block is called the "clique leader".  The clique number
//   is the number (in lc_chunks[]) of the clique leader.
// - Actually, a directly lost block may be pointed to if it's part of a
//   cycle.  In that case, there may be more than one choice for the clique
//   leader, and the choice is arbitrary.  Eg. if you have A-->B and B-->A,
//   either A or B could be the clique leader.
// - Cliques cannot overlap, and will be truncated to avoid this.  Eg. if we
//   have A-->C and B-->C, the two cliques will be {A,C} and {B}, or {A} and
//   {B,C} (again the choice is arbitrary).  This is because we don't want
//   to count a block as indirectly lost more than once.
//
// A note on 'is_prior_definite':
// - This is a boolean used in various places that indicates if the chain
//   up to the prior node (prior to the one being considered) is definite.
// - In the clique == -1 case:
//   - if True it means that the prior node is a root-set node, or that the
//     prior node is a block which is reachable from the root-set via
//     start-pointers.
//   - if False it means that the prior node is a block that is only
//     reachable from the root-set via a path including at least one
//     interior-pointer.
// - In the clique != -1 case, currently it's always True because we treat
//   start-pointers and interior-pointers the same for direct/indirect leak
//   checking.  If we added a PossibleIndirectLeak state then this would
//   change.

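// In outline, then, the phases described above look roughly like this (a
// sketch only -- the real control flow is in MC_(detect_memory_leaks) and
// its helpers below):
//
//    lc_chunks = find_active_chunks(&lc_n_chunks);    // sorted by address
//    for (each root-set word w)                       // registers + memory
//       lc_push_if_a_chunk_ptr(w, /*clique*/-1, /*is_prior_definite*/True);
//    lc_process_markstack(/*clique*/-1);        // marks Reachable/Possible
//    for (i = 0; i < lc_n_chunks; i++)
//       if (lc_extras[i].state == Unreached) {  // gather clique i
//          lc_push(i, lc_chunks[i]);
//          lc_process_markstack(/*clique*/i);
//       }
//    print_results(tid, lcp);
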

// Define to debug the memory-leak-detector.
#define VG_DEBUG_LEAKCHECK 0
#define VG_DEBUG_CLIQUE    0


/*------------------------------------------------------------*/
/*--- Getting the initial chunks, and searching them.      ---*/
/*------------------------------------------------------------*/

// Compare the MC_Chunks by 'data' (i.e. the address of the block).
static Int compare_MC_Chunks(void* n1, void* n2)
{
   MC_Chunk* mc1 = *(MC_Chunk**)n1;
   MC_Chunk* mc2 = *(MC_Chunk**)n2;
   if (mc1->data < mc2->data) return -1;
   if (mc1->data > mc2->data) return  1;
   return 0;
}

#if VG_DEBUG_LEAKCHECK
// Used to sanity-check the fast binary-search mechanism.
static
Int find_chunk_for_OLD ( Addr       ptr,
                         MC_Chunk** chunks,
                         Int        n_chunks )
{
   Int  i;
   Addr a_lo, a_hi;
   PROF_EVENT(70, "find_chunk_for_OLD");
   for (i = 0; i < n_chunks; i++) {
      PROF_EVENT(71, "find_chunk_for_OLD(loop)");
      a_lo = chunks[i]->data;
      a_hi = ((Addr)chunks[i]->data) + chunks[i]->szB;
      if (a_lo <= ptr && ptr < a_hi)
         return i;
   }
   return -1;
}
#endif

// Find the i such that ptr points at or inside the block described by
// chunks[i].  Return -1 if none found.  This assumes that chunks[]
// has been sorted on the 'data' field.
static
Int find_chunk_for ( Addr       ptr,
                     MC_Chunk** chunks,
                     Int        n_chunks )
{
   Addr a_mid_lo, a_mid_hi;
   Int lo, mid, hi, retVal;
   // VG_(printf)("find chunk for %p = ", ptr);
   retVal = -1;
   lo = 0;
   hi = n_chunks-1;
   while (True) {
      // Invariant: current unsearched space is from lo to hi, inclusive.
      if (lo > hi) break; // not found

      mid      = (lo + hi) / 2;
      a_mid_lo = chunks[mid]->data;
      a_mid_hi = chunks[mid]->data + chunks[mid]->szB;
      // Extent of block 'mid' is [a_mid_lo .. a_mid_hi).
      // Special-case zero-sized blocks - treat them as if they had
      // size 1.  Not doing so causes them to not cover any address
      // range at all, and so they would never be identified as the target
      // of any pointer, causing them to be incorrectly reported as
      // definitely leaked.
      if (chunks[mid]->szB == 0)
         a_mid_hi++;

      if (ptr < a_mid_lo) {
         hi = mid-1;
         continue;
      }
      if (ptr >= a_mid_hi) {
         lo = mid+1;
         continue;
      }
      tl_assert(ptr >= a_mid_lo && ptr < a_mid_hi);
      retVal = mid;
      break;
   }

#  if VG_DEBUG_LEAKCHECK
   tl_assert(retVal == find_chunk_for_OLD ( ptr, chunks, n_chunks ));
#  endif
   // VG_(printf)("%d\n", retVal);
   return retVal;
}

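// For example (with hypothetical addresses): given two sorted chunks
// covering [0x1000, 0x1010) and [0x2000, 0x2020),
//
//    find_chunk_for(0x1008, chunks, 2) == 0    // interior-pointer to chunk 0
//    find_chunk_for(0x2000, chunks, 2) == 1    // start-pointer to chunk 1
//    find_chunk_for(0x2020, chunks, 2) == -1   // one past the end: no chunk
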

static MC_Chunk**
find_active_chunks(UInt* pn_chunks)
{
   // Our goal is to construct a set of chunks that includes every
   // mempool chunk, and every malloc region that *doesn't* contain a
   // mempool chunk.
   MC_Mempool *mp;
   MC_Chunk **mallocs, **chunks, *mc;
   UInt n_mallocs, n_chunks, m, s;
   Bool *malloc_chunk_holds_a_pool_chunk;

   // First we collect all the malloc chunks into an array and sort it.
   // We do this because we want to query the chunks by interior
   // pointers, requiring binary search.
   mallocs = (MC_Chunk**) VG_(HT_to_array)( MC_(malloc_list), &n_mallocs );
   if (n_mallocs == 0) {
      tl_assert(mallocs == NULL);
      *pn_chunks = 0;
      return NULL;
   }
   VG_(ssort)(mallocs, n_mallocs, sizeof(VgHashNode*), compare_MC_Chunks);

   // Then we build an array containing a Bool for each malloc chunk,
   // indicating whether it contains any mempool chunks.
   malloc_chunk_holds_a_pool_chunk = VG_(calloc)( "mc.fas.1",
                                                  n_mallocs, sizeof(Bool) );
   n_chunks = n_mallocs;

   // Then we loop over the mempool tables. For each chunk in each
   // pool, we set the entry in the Bool array corresponding to the
   // malloc chunk containing the mempool chunk.
   VG_(HT_ResetIter)(MC_(mempool_list));
   while ( (mp = VG_(HT_Next)(MC_(mempool_list))) ) {
      VG_(HT_ResetIter)(mp->chunks);
      while ( (mc = VG_(HT_Next)(mp->chunks)) ) {

         // We'll need to record this chunk.
         n_chunks++;

         // Possibly invalidate the malloc holding the beginning of this chunk.
         m = find_chunk_for(mc->data, mallocs, n_mallocs);
         if (m != -1 && malloc_chunk_holds_a_pool_chunk[m] == False) {
            tl_assert(n_chunks > 0);
            n_chunks--;
            malloc_chunk_holds_a_pool_chunk[m] = True;
         }

         // Possibly invalidate the malloc holding the end of this chunk.
         if (mc->szB > 1) {
            m = find_chunk_for(mc->data + (mc->szB - 1), mallocs, n_mallocs);
            if (m != -1 && malloc_chunk_holds_a_pool_chunk[m] == False) {
               tl_assert(n_chunks > 0);
               n_chunks--;
               malloc_chunk_holds_a_pool_chunk[m] = True;
            }
         }
      }
   }
   tl_assert(n_chunks > 0);

   // Create final chunk array.
   chunks = VG_(malloc)("mc.fas.2", sizeof(VgHashNode*) * (n_chunks));
   s = 0;

   // Copy the mempool chunks and the non-marked malloc chunks into a
   // combined array of chunks.
   VG_(HT_ResetIter)(MC_(mempool_list));
   while ( (mp = VG_(HT_Next)(MC_(mempool_list))) ) {
      VG_(HT_ResetIter)(mp->chunks);
      while ( (mc = VG_(HT_Next)(mp->chunks)) ) {
         tl_assert(s < n_chunks);
         chunks[s++] = mc;
      }
   }
   for (m = 0; m < n_mallocs; ++m) {
      if (!malloc_chunk_holds_a_pool_chunk[m]) {
         tl_assert(s < n_chunks);
         chunks[s++] = mallocs[m];
      }
   }
   tl_assert(s == n_chunks);

   // Free temporaries.
   VG_(free)(mallocs);
   VG_(free)(malloc_chunk_holds_a_pool_chunk);

   *pn_chunks = n_chunks;

   return chunks;
}

/*------------------------------------------------------------*/
/*--- The leak detector proper.                            ---*/
/*------------------------------------------------------------*/

// Holds extra info about each block during leak checking.
typedef
   struct {
      UInt  state:2;    // Reachedness.
      UInt  pending:1;  // Scan pending.
      SizeT indirect_szB : (sizeof(SizeT)*8)-3; // If Unreached, how many bytes
                                                //   are unreachable from here.
   }
   LC_Extra;

// An array holding pointers to every chunk we're checking.  Sorted by address.
static MC_Chunk** lc_chunks;
// How many chunks we're dealing with.
static Int        lc_n_chunks;
// Chunks are converted and merged into loss records, maintained in lr_table.
// lr_table elements are kept from one leak search to another to implement
// the "print new/changed leaks" client request.
static OSet*        lr_table;

// The DeltaMode used the last time we called detect_memory_leaks.
// The recorded leak errors must be output using logic based on this
// delta_mode.  Keeping it here avoids replicating the delta_mode in each
// LossRecord.
LeakCheckDeltaMode MC_(detect_memory_leaks_last_delta_mode);


// This has the same number of entries as lc_chunks, and each entry
// in lc_chunks corresponds with the entry here (ie. lc_chunks[i] and
// lc_extras[i] describe the same block).
static LC_Extra* lc_extras;

// Records chunks that are currently being processed.  Each element in the
// stack is an index into lc_chunks and lc_extras.  Its size is
// 'lc_n_chunks' because in the worst case that's how many chunks could be
// pushed onto it (actually I think the maximum is lc_n_chunks-1 but let's
// be conservative).
static Int* lc_markstack;
// The index of the top element of the stack; -1 if the stack is empty, 0 if
// the stack has one element, 1 if it has two, etc.
static Int  lc_markstack_top;

// Keeps track of how many bytes of memory we've scanned, for printing.
// (Nb: We don't keep track of how many register bytes we've scanned.)
static SizeT lc_scanned_szB;


SizeT MC_(bytes_leaked)     = 0;
SizeT MC_(bytes_indirect)   = 0;
SizeT MC_(bytes_dubious)    = 0;
SizeT MC_(bytes_reachable)  = 0;
SizeT MC_(bytes_suppressed) = 0;

SizeT MC_(blocks_leaked)     = 0;
SizeT MC_(blocks_indirect)   = 0;
SizeT MC_(blocks_dubious)    = 0;
SizeT MC_(blocks_reachable)  = 0;
SizeT MC_(blocks_suppressed) = 0;


// Determines if a pointer is to a chunk.  Returns the chunk number et al
// via call-by-reference.
static Bool
lc_is_a_chunk_ptr(Addr ptr, Int* pch_no, MC_Chunk** pch, LC_Extra** pex)
{
   Int ch_no;
   MC_Chunk* ch;
   LC_Extra* ex;

   // Quick filter.
   if (!VG_(am_is_valid_for_client)(ptr, 1, VKI_PROT_READ)) {
      return False;
   } else {
      ch_no = find_chunk_for(ptr, lc_chunks, lc_n_chunks);
      tl_assert(ch_no >= -1 && ch_no < lc_n_chunks);

      if (ch_no == -1) {
         return False;
      } else {
         // Ok, we've found a pointer to a chunk.  Get the MC_Chunk and its
         // LC_Extra.
         ch = lc_chunks[ch_no];
         ex = &(lc_extras[ch_no]);

         tl_assert(ptr >= ch->data);
         tl_assert(ptr < ch->data + ch->szB + (ch->szB==0  ? 1  : 0));

         if (VG_DEBUG_LEAKCHECK)
            VG_(printf)("ptr=%#lx -> block %d\n", ptr, ch_no);

         *pch_no = ch_no;
         *pch    = ch;
         *pex    = ex;

         return True;
      }
   }
}

// Push a chunk (well, just its index) onto the mark stack.
static void lc_push(Int ch_no, MC_Chunk* ch)
{
   if (!lc_extras[ch_no].pending) {
      if (0) {
         VG_(printf)("pushing %#lx-%#lx\n", ch->data, ch->data + ch->szB);
      }
      lc_markstack_top++;
      tl_assert(lc_markstack_top < lc_n_chunks);
      lc_markstack[lc_markstack_top] = ch_no;
      tl_assert(!lc_extras[ch_no].pending);
      lc_extras[ch_no].pending = True;
   }
}

// Pop a chunk's index from the mark stack into *ret.  Returns True if
// there was one, False if the stack is empty.
static Bool lc_pop(Int* ret)
{
   if (-1 == lc_markstack_top) {
      return False;
   } else {
      tl_assert(0 <= lc_markstack_top && lc_markstack_top < lc_n_chunks);
      *ret = lc_markstack[lc_markstack_top];
      lc_markstack_top--;
      tl_assert(lc_extras[*ret].pending);
      lc_extras[*ret].pending = False;
      return True;
   }
}

// Partial fix for https://bugs.kde.org/show_bug.cgi?id=280271
// Only used in valgrind-variant now.
static Bool vv_lc_is_start_pointer(Addr ptr, MC_Chunk* chunk)
{
   // Pointers to the start of the chunk are indeed start-pointers.
   if (ptr == chunk->data)
      return True;

   // Below are a few heuristics to reduce the number of false positive
   // "possibly lost" reports on C++ types by treating some interior-pointers
   // as start-pointers (inspired by the Dr. Memory article at CGO2011).

   // Shortcut: heuristics assume 'ptr' is word-aligned.
   if (ptr != VG_ROUNDUP(ptr, sizeof(Addr)))
      return False;

   if (ptr == chunk->data + sizeof(Addr)) {
      // Pointer to a new[]-allocated buffer?
      SizeT sz_from_header = *(SizeT*)chunk->data,
            expected_sz = chunk->szB - sizeof(Addr);
      if (sz_from_header > 0 && sz_from_header <= expected_sz &&
          expected_sz % sz_from_header == 0)
         return True;
   }

   if (ptr == chunk->data + 3*sizeof(Addr)) {
      // Pointer to std::string internals?
      SizeT assumed_len = *(SizeT*)chunk->data,
            assumed_capacity = *((SizeT*)chunk->data + 1);
      if (assumed_len <= assumed_capacity) {
         // std::string
         if (chunk->szB - 3*sizeof(SizeT) == assumed_capacity + 1)
            return True;

         // std::basic_string<unsigned short> a.k.a. string16
         if (chunk->szB - 3*sizeof(SizeT) == 2*(assumed_capacity + 1))
            return True;

         // std::basic_string<wchar_t> on Linux
         if (chunk->szB - 3*sizeof(SizeT) == 4*(assumed_capacity + 1))
            return True;
      }
   }

   if (ptr == chunk->data + 2*sizeof(Addr)) {
      // Pointer to a nss_ZAlloc-allocated buffer?
      // It adds a header like this: 'struct { void *ptr; uint32 size };'
      SizeT sz_from_header = *(UInt*)(chunk->data + sizeof(Addr)),
            expected_sz = chunk->szB - 2*sizeof(Addr);
      tl_assert(sizeof(UInt) == 4);
      if (sz_from_header == expected_sz)
         return True;
   }

   return False;
}

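// The (assumed) memory layouts behind the heuristics above, sketched for a
// 64-bit target where sizeof(Addr) == sizeof(SizeT) == 8.  These match
// common GNU toolchain / NSS implementations but are not guaranteed by any
// standard -- hence "heuristics":
//
//    new[] cookie:         [ n_elements | elem 0 | elem 1 | ... ]
//                                        ^-- ptr
//    COW std::string rep:  [ length | capacity | refcount | chars... ]
//                                                          ^-- ptr
//    nss_ZAlloc header:    [ void* ptr | uint32 size (+pad) | data... ]
//                                                            ^-- ptr
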
// If 'ptr' is pointing to a heap-allocated block which hasn't been seen
// before, push it onto the mark stack.
static void
lc_push_without_clique_if_a_chunk_ptr(Addr ptr, Bool is_prior_definite)
{
   Int ch_no;
   MC_Chunk* ch;
   LC_Extra* ex;

   if ( ! lc_is_a_chunk_ptr(ptr, &ch_no, &ch, &ex) )
      return;

   // Possibly upgrade the state, ie. one of:
   // - Unreached --> Possible
   // - Unreached --> Reachable
   // - Possible  --> Reachable
   if (vv_lc_is_start_pointer(ptr, ch) &&
       is_prior_definite && ex->state != Reachable) {
      // 'ptr' points to the start of the block, and the prior node is
      // definite, which means that this block is definitely reachable.
      ex->state = Reachable;

      // State has changed to Reachable so (re)scan the block to make
      // sure any blocks it points to are correctly marked.
      lc_push(ch_no, ch);

   } else if (ex->state == Unreached) {
      // Either 'ptr' is an interior-pointer, or the prior node isn't definite,
      // which means that we can only mark this block as possibly reachable.
      ex->state = Possible;

      // State has changed to Possible so (re)scan the block to make
      // sure any blocks it points to are correctly marked.
      lc_push(ch_no, ch);
   }
}

static void
lc_push_if_a_chunk_ptr_register(Addr ptr)
{
   lc_push_without_clique_if_a_chunk_ptr(ptr, /*is_prior_definite*/True);
}

// If ptr is pointing to a heap-allocated block which hasn't been seen
// before, push it onto the mark stack.  Clique is the index of the
// clique leader.
static void
lc_push_with_clique_if_a_chunk_ptr(Addr ptr, Int clique)
{
   Int ch_no;
   MC_Chunk* ch;
   LC_Extra* ex;

   tl_assert(0 <= clique && clique < lc_n_chunks);

   if ( ! lc_is_a_chunk_ptr(ptr, &ch_no, &ch, &ex) )
      return;

   // If it's not Unreached, it's already been handled so ignore it.
   // If ch_no==clique, it's the clique leader, which means this is a cyclic
   // structure;  again ignore it because it's already been handled.
   if (ex->state == Unreached && ch_no != clique) {
      // Note that, unlike reachable blocks, we currently don't distinguish
      // between start-pointers and interior-pointers here.  We probably
      // should, though.
      ex->state = IndirectLeak;
      lc_push(ch_no, ch);

      // Add the block to the clique, and add its size to the
      // clique-leader's indirect size.  Also, if the new block was
      // itself a clique leader, it isn't any more, so add its
      // indirect_szB to the new clique leader.
      if (VG_DEBUG_CLIQUE) {
         if (ex->indirect_szB > 0)
            VG_(printf)("  clique %d joining clique %d adding %lu+%lu\n",
                        ch_no, clique, (unsigned long)ch->szB,
                        (unsigned long)ex->indirect_szB);
         else
            VG_(printf)("  block %d joining clique %d adding %lu\n",
                        ch_no, clique, (unsigned long)ch->szB);
      }

      lc_extras[clique].indirect_szB += ch->szB;
      lc_extras[clique].indirect_szB += ex->indirect_szB;
      ex->indirect_szB = 0;    // Shouldn't matter.
   }
}

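// For example: suppose block B (szB == 16) was itself a clique leader with
// indirect_szB == 32, and the scan for clique A then finds a pointer into B.
// B's state becomes IndirectLeak, A's indirect_szB grows by 16 + 32 == 48,
// and B's indirect_szB is reset to 0: the two cliques have been merged,
// with A as the surviving leader.
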
static void
lc_push_if_a_chunk_ptr(Addr ptr, Int clique, Bool is_prior_definite)
{
   if (-1 == clique)
      lc_push_without_clique_if_a_chunk_ptr(ptr, is_prior_definite);
   else
      lc_push_with_clique_if_a_chunk_ptr(ptr, clique);
}


static VG_MINIMAL_JMP_BUF(memscan_jmpbuf);

static
void scan_all_valid_memory_catcher ( Int sigNo, Addr addr )
{
   if (0)
      VG_(printf)("OUCH! sig=%d addr=%#lx\n", sigNo, addr);
   if (sigNo == VKI_SIGSEGV || sigNo == VKI_SIGBUS)
      VG_MINIMAL_LONGJMP(memscan_jmpbuf);
}

// Scan a block of memory between [start, start+len).  This range may
// be bogus, inaccessible, or otherwise strange; we deal with it.  For each
// valid aligned word, we check whether it points to a chunk and, if so,
// push the chunk onto the mark stack.
static void
lc_scan_memory(Addr start, SizeT len, Bool is_prior_definite, Int clique)
{
   Addr ptr = VG_ROUNDUP(start,     sizeof(Addr));
   Addr end = VG_ROUNDDN(start+len, sizeof(Addr));
   vki_sigset_t sigmask;

   if (VG_DEBUG_LEAKCHECK)
      VG_(printf)("scan %#lx-%#lx (%lu)\n", start, end, len);

   VG_(sigprocmask)(VKI_SIG_SETMASK, NULL, &sigmask);
   VG_(set_fault_catcher)(scan_all_valid_memory_catcher);

   // We might be in the middle of a page.  Do a cheap check to see if
   // it's valid;  if not, skip onto the next page.
   if (!VG_(am_is_valid_for_client)(ptr, sizeof(Addr), VKI_PROT_READ))
      ptr = VG_PGROUNDUP(ptr+1);        // First page is bad - skip it.

   while (ptr < end) {
      Addr addr;

      // Skip invalid chunks.
      if ( ! MC_(is_within_valid_secondary)(ptr) ) {
         ptr = VG_ROUNDUP(ptr+1, SM_SIZE);
         continue;
      }

      // Look to see if this page seems reasonable.
      if ((ptr % VKI_PAGE_SIZE) == 0) {
         if (!VG_(am_is_valid_for_client)(ptr, sizeof(Addr), VKI_PROT_READ)) {
            ptr += VKI_PAGE_SIZE;      // Bad page - skip it.
            continue;
         }
      }

      if (VG_MINIMAL_SETJMP(memscan_jmpbuf) == 0) {
         if ( MC_(is_valid_aligned_word)(ptr) ) {
            lc_scanned_szB += sizeof(Addr);
            addr = *(Addr *)ptr;
            // If we get here, the scanned word is in valid memory.  Now
            // let's see if its contents point to a chunk.
            lc_push_if_a_chunk_ptr(addr, clique, is_prior_definite);
         } else if (0 && VG_DEBUG_LEAKCHECK) {
            VG_(printf)("%#lx not valid\n", ptr);
         }
         ptr += sizeof(Addr);
      } else {
         // We need to restore the signal mask, because we were
         // longjmped out of a signal handler.
         VG_(sigprocmask)(VKI_SIG_SETMASK, &sigmask, NULL);

         ptr = VG_PGROUNDUP(ptr+1);     // Bad page - skip it.
      }
   }

   VG_(sigprocmask)(VKI_SIG_SETMASK, &sigmask, NULL);
   VG_(set_fault_catcher)(NULL);
}

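// The same probe-and-recover pattern as lc_scan_memory, sketched as a
// standalone (hypothetical) POSIX program using sigsetjmp/siglongjmp in
// place of Valgrind's VG_MINIMAL_SETJMP and fault-catcher machinery.
// Passing savesigs==1 to sigsetjmp makes siglongjmp restore the signal
// mask, which is what the explicit VG_(sigprocmask) call above does:
//
//    #include <setjmp.h>
//    #include <signal.h>
//    #include <string.h>
//
//    static sigjmp_buf probe_jmpbuf;
//
//    static void probe_handler(int sig) { siglongjmp(probe_jmpbuf, 1); }
//
//    // Returns 1 and fills *word if 'ptr' was readable; 0 otherwise.
//    static int try_read_word(const unsigned long* ptr, unsigned long* word)
//    {
//       struct sigaction sa, old_segv, old_bus;
//       int ok = 0;
//       memset(&sa, 0, sizeof(sa));
//       sa.sa_handler = probe_handler;
//       sigaction(SIGSEGV, &sa, &old_segv);
//       sigaction(SIGBUS,  &sa, &old_bus);
//       if (sigsetjmp(probe_jmpbuf, /*savesigs*/1) == 0) {
//          *word = *ptr;   // may fault; if so, control re-enters below
//          ok = 1;
//       }
//       sigaction(SIGSEGV, &old_segv, NULL);
//       sigaction(SIGBUS,  &old_bus,  NULL);
//       return ok;
//    }
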

// Process the mark stack until empty.
static void lc_process_markstack(Int clique)
{
   Int  top = -1;    // shut gcc up
   Bool is_prior_definite;

   while (lc_pop(&top)) {
      tl_assert(top >= 0 && top < lc_n_chunks);

      // See comment about 'is_prior_definite' at the top to understand this.
      is_prior_definite = ( Possible != lc_extras[top].state );

      lc_scan_memory(lc_chunks[top]->data, lc_chunks[top]->szB,
                     is_prior_definite, clique);
   }
}

static Word cmp_LossRecordKey_LossRecord(const void* key, const void* elem)
{
   LossRecordKey* a = (LossRecordKey*)key;
   LossRecordKey* b = &(((LossRecord*)elem)->key);

   // Compare on states first because that's fast.
   if (a->state < b->state) return -1;
   if (a->state > b->state) return  1;
   // Ok, the states are equal.  Now compare the locations, which is slower.
   if (VG_(eq_ExeContext)(
            MC_(clo_leak_resolution), a->allocated_at, b->allocated_at))
      return 0;
   // Different locations.  Ordering is arbitrary, just use the ec pointer.
   if (a->allocated_at < b->allocated_at) return -1;
   if (a->allocated_at > b->allocated_at) return  1;
   VG_(tool_panic)("bad LossRecord comparison");
}

static Int cmp_LossRecords(void* va, void* vb)
{
   LossRecord* lr_a = *(LossRecord**)va;
   LossRecord* lr_b = *(LossRecord**)vb;
   SizeT total_szB_a = lr_a->szB + lr_a->indirect_szB;
   SizeT total_szB_b = lr_b->szB + lr_b->indirect_szB;

   // First compare by sizes.
   if (total_szB_a < total_szB_b) return -1;
   if (total_szB_a > total_szB_b) return  1;
   // If sizes are equal, compare by states.
   if (lr_a->key.state < lr_b->key.state) return -1;
   if (lr_a->key.state > lr_b->key.state) return  1;
   // If they're still equal here, it doesn't matter that much, but we keep
   // comparing other things so that regtests are as deterministic as
   // possible.  So:  compare num_blocks.
   if (lr_a->num_blocks < lr_b->num_blocks) return -1;
   if (lr_a->num_blocks > lr_b->num_blocks) return  1;
   // Finally, compare ExeContext addresses... older ones are likely to have
   // lower addresses.
   if (lr_a->key.allocated_at < lr_b->key.allocated_at) return -1;
   if (lr_a->key.allocated_at > lr_b->key.allocated_at) return  1;
   return 0;
}

static void print_results(ThreadId tid, LeakCheckParams lcp)
{
   Int          i, n_lossrecords;
   LossRecord** lr_array;
   LossRecord*  lr;
   Bool         is_suppressed;
   SizeT        old_bytes_leaked      = MC_(bytes_leaked); /* to report delta in summary */
   SizeT        old_bytes_indirect    = MC_(bytes_indirect);
   SizeT        old_bytes_dubious     = MC_(bytes_dubious);
   SizeT        old_bytes_reachable   = MC_(bytes_reachable);
   SizeT        old_bytes_suppressed  = MC_(bytes_suppressed);
   SizeT        old_blocks_leaked     = MC_(blocks_leaked);
   SizeT        old_blocks_indirect   = MC_(blocks_indirect);
   SizeT        old_blocks_dubious    = MC_(blocks_dubious);
   SizeT        old_blocks_reachable  = MC_(blocks_reachable);
   SizeT        old_blocks_suppressed = MC_(blocks_suppressed);

   // Create the lr_table, which holds the loss records, if it doesn't
   // already exist.  If it does exist, it contains loss_records from the
   // previous leak search; the old_* values in those records are used to
   // implement the leak check delta mode.
   if (lr_table == NULL)
      lr_table =
         VG_(OSetGen_Create)(offsetof(LossRecord, key),
                             cmp_LossRecordKey_LossRecord,
                             VG_(malloc), "mc.pr.1",
                             VG_(free));


   // Convert the chunks into loss records, merging them where appropriate.
   for (i = 0; i < lc_n_chunks; i++) {
      MC_Chunk*     ch = lc_chunks[i];
      LC_Extra*     ex = &(lc_extras)[i];
      LossRecord*   old_lr;
      LossRecordKey lrkey;
      lrkey.state        = ex->state;
      lrkey.allocated_at = ch->where;

      old_lr = VG_(OSetGen_Lookup)(lr_table, &lrkey);
      if (old_lr) {
         // We found an existing loss record matching this chunk.  Update the
         // loss record's details in-situ.  This is safe because we don't
         // change the elements used as the OSet key.
         old_lr->szB          += ch->szB;
         old_lr->indirect_szB += ex->indirect_szB;
         old_lr->num_blocks++;
      } else {
         // No existing loss record matches this chunk.  Create a new loss
         // record, initialise it from the chunk, and insert it into lr_table.
         lr = VG_(OSetGen_AllocNode)(lr_table, sizeof(LossRecord));
         lr->key              = lrkey;
         lr->szB              = ch->szB;
         lr->indirect_szB     = ex->indirect_szB;
         lr->num_blocks       = 1;
         lr->old_szB          = 0;
         lr->old_indirect_szB = 0;
         lr->old_num_blocks   = 0;
         VG_(OSetGen_Insert)(lr_table, lr);
      }
   }
   n_lossrecords = VG_(OSetGen_Size)(lr_table);

   // Create an array of pointers to the loss records.
   lr_array = VG_(malloc)("mc.pr.2", n_lossrecords * sizeof(LossRecord*));
   i = 0;
   VG_(OSetGen_ResetIter)(lr_table);
   while ( (lr = VG_(OSetGen_Next)(lr_table)) ) {
      lr_array[i++] = lr;
   }
   tl_assert(i == n_lossrecords);

   // Sort the array by loss record sizes.
   VG_(ssort)(lr_array, n_lossrecords, sizeof(LossRecord*),
              cmp_LossRecords);

   // Zero totals.
   MC_(blocks_leaked)     = MC_(bytes_leaked)     = 0;
   MC_(blocks_indirect)   = MC_(bytes_indirect)   = 0;
   MC_(blocks_dubious)    = MC_(bytes_dubious)    = 0;
   MC_(blocks_reachable)  = MC_(bytes_reachable)  = 0;
   MC_(blocks_suppressed) = MC_(bytes_suppressed) = 0;

   // Print the loss records (in size order) and collect summary stats.
   for (i = 0; i < n_lossrecords; i++) {
      Bool count_as_error, print_record, delta_considered;
      // Rules for printing:
      // - We don't show suppressed loss records ever (and that's controlled
      //   within the error manager).
      // - We show non-suppressed loss records that are not "reachable" if
      //   --leak-check=yes.
      // - We show all non-suppressed loss records if --leak-check=yes and
      //   --show-reachable=yes.
      //
      // Nb: here "reachable" means Reachable *or* IndirectLeak;  note that
      // this is different to "still reachable" used elsewhere because it
      // includes indirectly lost blocks!
      //
      lr = lr_array[i];
      switch (lcp.deltamode) {
         case LCD_Any:
            delta_considered = lr->num_blocks > 0;
            break;
         case LCD_Increased:
            delta_considered
               = lr->szB > lr->old_szB
                 || lr->indirect_szB > lr->old_indirect_szB
                 || lr->num_blocks > lr->old_num_blocks;
            break;
         case LCD_Changed:
            delta_considered = lr->szB != lr->old_szB
               || lr->indirect_szB != lr->old_indirect_szB
               || lr->num_blocks != lr->old_num_blocks;
            break;
         default:
            tl_assert(0);
      }

      print_record = lcp.mode == LC_Full && delta_considered &&
                     ( lcp.show_reachable ||
                       Unreached == lr->key.state ||
                       ( lcp.show_possibly_lost &&
                         Possible  == lr->key.state ) );
      // We don't count leaks as errors with lcp.mode==LC_Summary.
      // Otherwise you can get high error counts with few or no error
      // messages, which can be confusing.  Also, you could argue that
      // indirect leaks should be counted as errors, but it seems better to
      // make the counting criteria similar to the printing criteria.  So we
      // don't count them.
      count_as_error = lcp.mode == LC_Full && delta_considered &&
                       ( Unreached == lr->key.state ||
                         Possible  == lr->key.state );
      if ((Reachable == lr->key.state && !MC_(clo_show_reachable)) ||
          (Possible  == lr->key.state && !MC_(clo_show_possibly_lost)))
         is_suppressed = False;
      else
         is_suppressed = MC_(record_leak_error)(tid, i+1, n_lossrecords, lr,
                                                print_record, count_as_error);

      if (is_suppressed) {
         MC_(blocks_suppressed) += lr->num_blocks;
         MC_(bytes_suppressed)  += lr->szB;

      } else if (Unreached == lr->key.state) {
         MC_(blocks_leaked)     += lr->num_blocks;
         MC_(bytes_leaked)      += lr->szB;

      } else if (IndirectLeak == lr->key.state) {
         MC_(blocks_indirect)   += lr->num_blocks;
         MC_(bytes_indirect)    += lr->szB;

      } else if (Possible == lr->key.state) {
         MC_(blocks_dubious)    += lr->num_blocks;
         MC_(bytes_dubious)     += lr->szB;

      } else if (Reachable == lr->key.state) {
         MC_(blocks_reachable)  += lr->num_blocks;
         MC_(bytes_reachable)   += lr->szB;

      } else {
         VG_(tool_panic)("unknown loss mode");
      }
   }

   for (i = 0; i < n_lossrecords; i++) {
      if (lr_array[i]->num_blocks == 0) {
         // Remove from lr_table the old loss_records with 0 blocks found.
         VG_(OSetGen_Remove) (lr_table, &lr_array[i]->key);
      } else {
         // Move the leak sizes to old_* and zero the current sizes
         // for the next leak search.
         lr_array[i]->old_szB          = lr_array[i]->szB;
         lr_array[i]->old_indirect_szB = lr_array[i]->indirect_szB;
         lr_array[i]->old_num_blocks   = lr_array[i]->num_blocks;
         lr_array[i]->szB              = 0;
         lr_array[i]->indirect_szB     = 0;
         lr_array[i]->num_blocks       = 0;
      }
   }
   VG_(free)(lr_array);

   if (VG_(clo_verbosity) > 0 && !VG_(clo_xml)) {
      char d_bytes[20];
      char d_blocks[20];

      VG_(umsg)("LEAK SUMMARY:\n");
      VG_(umsg)("   definitely lost: %'lu%s bytes in %'lu%s blocks\n",
                MC_(bytes_leaked),
                MC_(snprintf_delta) (d_bytes, 20, MC_(bytes_leaked), old_bytes_leaked, lcp.deltamode),
                MC_(blocks_leaked),
                MC_(snprintf_delta) (d_blocks, 20, MC_(blocks_leaked), old_blocks_leaked, lcp.deltamode));
      VG_(umsg)("   indirectly lost: %'lu%s bytes in %'lu%s blocks\n",
                MC_(bytes_indirect),
                MC_(snprintf_delta) (d_bytes, 20, MC_(bytes_indirect), old_bytes_indirect, lcp.deltamode),
                MC_(blocks_indirect),
                MC_(snprintf_delta) (d_blocks, 20, MC_(blocks_indirect), old_blocks_indirect, lcp.deltamode) );
      VG_(umsg)("     possibly lost: %'lu%s bytes in %'lu%s blocks\n",
                MC_(bytes_dubious),
                MC_(snprintf_delta) (d_bytes, 20, MC_(bytes_dubious), old_bytes_dubious, lcp.deltamode),
                MC_(blocks_dubious),
                MC_(snprintf_delta) (d_blocks, 20, MC_(blocks_dubious), old_blocks_dubious, lcp.deltamode) );
      VG_(umsg)("   still reachable: %'lu%s bytes in %'lu%s blocks\n",
                MC_(bytes_reachable),
                MC_(snprintf_delta) (d_bytes, 20, MC_(bytes_reachable), old_bytes_reachable, lcp.deltamode),
                MC_(blocks_reachable),
                MC_(snprintf_delta) (d_blocks, 20, MC_(blocks_reachable), old_blocks_reachable, lcp.deltamode) );
      VG_(umsg)("        suppressed: %'lu%s bytes in %'lu%s blocks\n",
                MC_(bytes_suppressed),
                MC_(snprintf_delta) (d_bytes, 20, MC_(bytes_suppressed), old_bytes_suppressed, lcp.deltamode),
                MC_(blocks_suppressed),
                MC_(snprintf_delta) (d_blocks, 20, MC_(blocks_suppressed), old_blocks_suppressed, lcp.deltamode) );
      if (lcp.mode != LC_Full &&
          (MC_(blocks_leaked) + MC_(blocks_indirect) +
           MC_(blocks_dubious) + MC_(blocks_reachable)) > 0) {
         if (lcp.requested_by_monitor_command)
            VG_(umsg)("To see details of leaked memory, give 'full' arg to leak_check\n");
         else
            VG_(umsg)("Rerun with --leak-check=full to see details "
                      "of leaked memory\n");
      }
      if (lcp.mode == LC_Full &&
          MC_(blocks_reachable) > 0 && !lcp.show_reachable)
      {
         VG_(umsg)("Reachable blocks (those to which a pointer "
                   "was found) are not shown.\n");
         if (lcp.requested_by_monitor_command)
            VG_(umsg)("To see them, add 'reachable any' args to leak_check\n");
         else
            VG_(umsg)("To see them, rerun with: --leak-check=full "
                      "--show-reachable=yes\n");
      }
      VG_(umsg)("\n");
   }
}

/*------------------------------------------------------------*/
/*--- Top-level entry point.                               ---*/
/*------------------------------------------------------------*/

void MC_(detect_memory_leaks) ( ThreadId tid, LeakCheckParams lcp)
{
   Int i, j;

   tl_assert(lcp.mode != LC_Off);

   MC_(detect_memory_leaks_last_delta_mode) = lcp.deltamode;

   // Get the chunks, stop if there were none.
   lc_chunks = find_active_chunks(&lc_n_chunks);
   if (lc_n_chunks == 0) {
      tl_assert(lc_chunks == NULL);
      if (lr_table != NULL) {
         // Forget the previously recorded LossRecords, as the next leak
         // search will in any case just create new ones.
         // Maybe it would be better to call print_results instead
         // (at least when leak decreases are requested), as that would
         // then output all LossRecords with a size decreasing to 0.
         VG_(OSetGen_Destroy) (lr_table);
         lr_table = NULL;  // Don't leave a dangling pointer behind.
      }
      if (VG_(clo_verbosity) >= 1 && !VG_(clo_xml)) {
         VG_(umsg)("All heap blocks were freed -- no leaks are possible\n");
         VG_(umsg)("\n");
      }
      return;
   }

   // Sort the array so blocks are in ascending order in memory.
   VG_(ssort)(lc_chunks, lc_n_chunks, sizeof(VgHashNode*), compare_MC_Chunks);

   // Sanity check -- make sure they're in order.
   for (i = 0; i < lc_n_chunks-1; i++) {
      tl_assert( lc_chunks[i]->data <= lc_chunks[i+1]->data);
   }

   // Sanity check -- make sure they don't overlap.  The one exception is that
   // we allow a MALLOCLIKE block to sit entirely within a malloc() block.
   // This is for bug 100628.  If this occurs, we ignore the malloc() block
   // for leak-checking purposes.  This is a hack and probably should be done
   // better, but at least it's consistent with mempools (which are treated
   // like this in find_active_chunks).  Mempools have a separate VgHashTable
   // for mempool chunks, but if custom-allocated blocks are put in a separate
   // table from normal heap blocks it makes free-mismatch checking more
   // difficult.
   //
   // If this check fails, it probably means that the application
   // has done something stupid with VALGRIND_MALLOCLIKE_BLOCK client
   // requests, eg. has made overlapping requests (which are
   // nonsensical), or used VALGRIND_MALLOCLIKE_BLOCK for stack locations;
   // again nonsensical.
   //
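   // For example, a (hypothetical) pool allocator doing the permitted thing:
   // the client mallocs one big region and then marks sub-blocks with
   // VALGRIND_MALLOCLIKE_BLOCK, so each custom block sits entirely within
   // the malloc'd block, and the enclosing malloc block is then ignored for
   // leak-checking purposes:
   //
   //    char* pool = malloc(4096);                  // the pool itself
   //    void* p    = pool + 64;                     // carve out a sub-block
   //    VALGRIND_MALLOCLIKE_BLOCK(p, 128, /*rzB*/0, /*is_zeroed*/0);
   //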
   for (i = 0; i < lc_n_chunks-1; i++) {
      MC_Chunk* ch1 = lc_chunks[i];
      MC_Chunk* ch2 = lc_chunks[i+1];

      Addr start1    = ch1->data;
      Addr start2    = ch2->data;
      Addr end1      = ch1->data + ch1->szB - 1;
      Addr end2      = ch2->data + ch2->szB - 1;
      Bool isCustom1 = ch1->allockind == MC_AllocCustom;
      Bool isCustom2 = ch2->allockind == MC_AllocCustom;

      if (end1 < start2) {
         // Normal case - no overlap.

      // We used to allow exact duplicates, I'm not sure why.  --njn
      //} else if (start1 == start2 && end1 == end2) {
         // Degenerate case: exact duplicates.

      } else if (start1 >= start2 && end1 <= end2 && isCustom1 && !isCustom2) {
         // Block i is MALLOCLIKE and entirely within block i+1.
         // Remove block i+1.
         for (j = i+1; j < lc_n_chunks-1; j++) {
            lc_chunks[j] = lc_chunks[j+1];
         }
         lc_n_chunks--;

      } else if (start2 >= start1 && end2 <= end1 && isCustom2 && !isCustom1) {
         // Block i+1 is MALLOCLIKE and entirely within block i.
         // Remove block i.
         for (j = i; j < lc_n_chunks-1; j++) {
            lc_chunks[j] = lc_chunks[j+1];
         }
         lc_n_chunks--;

      } else {
         VG_(umsg)("Block 0x%lx..0x%lx overlaps with block 0x%lx..0x%lx\n",
                   start1, end1, start2, end2);
         VG_(umsg)("This is usually caused by using VALGRIND_MALLOCLIKE_BLOCK\n");
         VG_(umsg)("in an inappropriate way.\n");
         tl_assert (0);
      }
   }

   // Initialise lc_extras.
   lc_extras = VG_(malloc)( "mc.dml.2", lc_n_chunks * sizeof(LC_Extra) );
   for (i = 0; i < lc_n_chunks; i++) {
      lc_extras[i].state        = Unreached;
      lc_extras[i].pending      = False;
      lc_extras[i].indirect_szB = 0;
   }

   // Initialise lc_markstack.
   lc_markstack = VG_(malloc)( "mc.dml.2", lc_n_chunks * sizeof(Int) );
   for (i = 0; i < lc_n_chunks; i++) {
      lc_markstack[i] = -1;
   }
   lc_markstack_top = -1;

   // Verbosity.
   if (VG_(clo_verbosity) > 1 && !VG_(clo_xml)) {
      VG_(umsg)( "Searching for pointers to %'d not-freed blocks\n",
                 lc_n_chunks );
   }

   // Scan the memory root-set, pushing onto the mark stack any blocks
   // pointed to.
   {
      Int   n_seg_starts;
      Addr* seg_starts = VG_(get_segment_starts)( &n_seg_starts );

      tl_assert(seg_starts && n_seg_starts > 0);

      lc_scanned_szB = 0;

      // VG_(am_show_nsegments)( 0, "leakcheck");
      for (i = 0; i < n_seg_starts; i++) {
         SizeT seg_size;
         NSegment const* seg = VG_(am_find_nsegment)( seg_starts[i] );
         tl_assert(seg);

         if (seg->kind != SkFileC && seg->kind != SkAnonC) continue;
         if (!(seg->hasR && seg->hasW))                    continue;
         if (seg->isCH)                                    continue;

         // Don't poke around in device segments as this may cause
         // hangs.  Exclude /dev/zero just in case someone allocated
         // memory by explicitly mapping /dev/zero.
         if (seg->kind == SkFileC
             && (VKI_S_ISCHR(seg->mode) || VKI_S_ISBLK(seg->mode))) {
            HChar* dev_name = VG_(am_get_filename)( (NSegment*)seg );
            if (dev_name && 0 == VG_(strcmp)(dev_name, "/dev/zero")) {
               // Don't skip /dev/zero.
            } else {
               // Skip this device mapping.
               continue;
            }
         }

         if (0)
            VG_(printf)("ACCEPT %2d  %#lx %#lx\n", i, seg->start, seg->end);

         // Scan the segment.  We use -1 for the clique number, because this
         // is a root-set.
         seg_size = seg->end - seg->start + 1;
         if (VG_(clo_verbosity) > 2) {
            VG_(message)(Vg_DebugMsg,
                         "  Scanning root segment: %#lx..%#lx (%lu)\n",
                         seg->start, seg->end, seg_size);
         }
         lc_scan_memory(seg->start, seg_size, /*is_prior_definite*/True, -1);
      }
   }

   // Scan GP registers for chunk pointers.
   VG_(apply_to_GP_regs)(lc_push_if_a_chunk_ptr_register);

   // Process the pushed blocks.  After this, every block that is reachable
   // from the root-set has been traced.
   lc_process_markstack(/*clique*/-1);

   if (VG_(clo_verbosity) > 1 && !VG_(clo_xml)) {
      VG_(umsg)("Checked %'lu bytes\n", lc_scanned_szB);
      VG_(umsg)( "\n" );
   }

   // Trace all the leaked blocks to determine which are directly leaked and
   // which are indirectly leaked.  For each Unreached block, push it onto
   // the mark stack, and find all the as-yet-Unreached blocks reachable
   // from it.  These form a clique and are marked IndirectLeak, and their
   // size is added to the clique leader's indirect size.  If one of the
   // found blocks was itself a clique leader (from a previous clique), then
   // the cliques are merged.
   for (i = 0; i < lc_n_chunks; i++) {
      MC_Chunk* ch = lc_chunks[i];
      LC_Extra* ex = &(lc_extras[i]);

      if (VG_DEBUG_CLIQUE)
         VG_(printf)("cliques: %d at %#lx -> Loss state %d\n",
                     i, ch->data, ex->state);

      tl_assert(lc_markstack_top == -1);

      if (ex->state == Unreached) {
         if (VG_DEBUG_CLIQUE)
            VG_(printf)("%d: gathering clique %#lx\n", i, ch->data);

         // Push this Unreached block onto the stack and process it.
         lc_push(i, ch);
         lc_process_markstack(i);

         tl_assert(lc_markstack_top == -1);
         tl_assert(ex->state == Unreached);
      }
   }

   print_results( tid, lcp);

   VG_(free) ( lc_chunks );
   VG_(free) ( lc_extras );
   VG_(free) ( lc_markstack );
}

/*--------------------------------------------------------------------*/
/*--- end                                                          ---*/
/*--------------------------------------------------------------------*/
