• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 
2 /*--------------------------------------------------------------------*/
3 /*--- Store and compare stack backtraces            m_execontext.c ---*/
4 /*--------------------------------------------------------------------*/
5 
6 /*
7    This file is part of Valgrind, a dynamic binary instrumentation
8    framework.
9 
10    Copyright (C) 2000-2010 Julian Seward
11       jseward@acm.org
12 
13    This program is free software; you can redistribute it and/or
14    modify it under the terms of the GNU General Public License as
15    published by the Free Software Foundation; either version 2 of the
16    License, or (at your option) any later version.
17 
18    This program is distributed in the hope that it will be useful, but
19    WITHOUT ANY WARRANTY; without even the implied warranty of
20    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
21    General Public License for more details.
22 
23    You should have received a copy of the GNU General Public License
24    along with this program; if not, write to the Free Software
25    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
26    02111-1307, USA.
27 
28    The GNU General Public License is contained in the file COPYING.
29 */
30 
31 #include "pub_core_basics.h"
32 #include "pub_core_debuglog.h"
33 #include "pub_core_libcassert.h"
34 #include "pub_core_libcprint.h"     // For VG_(message)()
35 #include "pub_core_mallocfree.h"
36 #include "pub_core_options.h"
37 #include "pub_core_stacktrace.h"
38 #include "pub_core_machine.h"       // VG_(get_IP)
39 #include "pub_core_vki.h"           // To keep pub_core_threadstate.h happy
40 #include "pub_core_threadstate.h"   // VG_(is_valid_tid)
41 #include "pub_core_execontext.h"    // self
42 
43 /*------------------------------------------------------------*/
44 /*--- Low-level ExeContext storage.                        ---*/
45 /*------------------------------------------------------------*/
46 
47 /* The first 4 IP values are used in comparisons to remove duplicate
48    errors, and for comparing against suppression specifications.  The
49    rest are purely informational (but often important).
50 
51    The contexts are stored in a traditional chained hash table, so as
52    to allow quick determination of whether a new context already
53    exists.  The hash table starts small and expands dynamically, so as
54    to keep the load factor below 1.0.
55 
56    The idea is only to ever store any one context once, so as to save
57    space and make exact comparisons faster. */
58 
59 
60 /* Primes for the hash table */
61 
62 #define N_EC_PRIMES 18
63 
64 static SizeT ec_primes[N_EC_PRIMES] = {
65          769UL,         1543UL,         3079UL,          6151UL,
66        12289UL,        24593UL,        49157UL,         98317UL,
67       196613UL,       393241UL,       786433UL,       1572869UL,
68      3145739UL,      6291469UL,     12582917UL,      25165843UL,
69     50331653UL,    100663319UL
70 };
71 
72 
73 /* Each element is present in a hash chain, and also contains a
74    variable length array of guest code addresses (the useful part). */
75 
76 struct _ExeContext {
77    struct _ExeContext* chain;
78    /* A 32-bit unsigned integer that uniquely identifies this
79       ExeContext.  Memcheck uses these for origin tracking.  Values
80       must be nonzero (else Memcheck's origin tracking is hosed), must
81       be a multiple of four, and must be unique.  Hence they start at
82       4. */
83    UInt ecu;
84    /* Variable-length array.  The size is 'n_ips'; at
85       least 1, at most VG_DEEPEST_BACKTRACE.  [0] is the current IP,
86       [1] is its caller, [2] is the caller of [1], etc. */
87    UInt n_ips;
88    Addr ips[0];
89 };
90 
91 
92 /* This is the dynamically expanding hash table. */
93 static ExeContext** ec_htab; /* array [ec_htab_size] of ExeContext* */
94 static SizeT        ec_htab_size;     /* one of the values in ec_primes */
95 static SizeT        ec_htab_size_idx; /* 0 .. N_EC_PRIMES-1 */
96 
97 /* ECU serial number */
98 static UInt ec_next_ecu = 4; /* We must never issue zero */
99 
100 
101 /* Stats only: the number of times the system was searched to locate a
102    context. */
103 static ULong ec_searchreqs;
104 
105 /* Stats only: the number of full context comparisons done. */
106 static ULong ec_searchcmps;
107 
108 /* Stats only: total number of stored contexts. */
109 static ULong ec_totstored;
110 
111 /* Number of 2, 4 and (fast) full cmps done. */
112 static ULong ec_cmp2s;
113 static ULong ec_cmp4s;
114 static ULong ec_cmpAlls;
115 
116 
117 /*------------------------------------------------------------*/
118 /*--- Exported functions.                                  ---*/
119 /*------------------------------------------------------------*/
120 
121 
122 /* Initialise this subsystem. */
init_ExeContext_storage(void)123 static void init_ExeContext_storage ( void )
124 {
125    Int i;
126    static Bool init_done = False;
127    if (LIKELY(init_done))
128       return;
129    ec_searchreqs = 0;
130    ec_searchcmps = 0;
131    ec_totstored = 0;
132    ec_cmp2s = 0;
133    ec_cmp4s = 0;
134    ec_cmpAlls = 0;
135 
136    ec_htab_size_idx = 0;
137    ec_htab_size = ec_primes[ec_htab_size_idx];
138    ec_htab = VG_(arena_malloc)(VG_AR_EXECTXT, "execontext.iEs1",
139                                sizeof(ExeContext*) * ec_htab_size);
140    for (i = 0; i < ec_htab_size; i++)
141       ec_htab[i] = NULL;
142 
143    init_done = True;
144 }
145 
146 
147 /* Print stats. */
VG_(print_ExeContext_stats)148 void VG_(print_ExeContext_stats) ( void )
149 {
150    init_ExeContext_storage();
151    VG_(message)(Vg_DebugMsg,
152       "   exectx: %'lu lists, %'llu contexts (avg %'llu per list)\n",
153       ec_htab_size, ec_totstored, ec_totstored / (ULong)ec_htab_size
154    );
155    VG_(message)(Vg_DebugMsg,
156       "   exectx: %'llu searches, %'llu full compares (%'llu per 1000)\n",
157       ec_searchreqs, ec_searchcmps,
158       ec_searchreqs == 0
159          ? 0ULL
160          : ( (ec_searchcmps * 1000ULL) / ec_searchreqs )
161    );
162    VG_(message)(Vg_DebugMsg,
163       "   exectx: %'llu cmp2, %'llu cmp4, %'llu cmpAll\n",
164       ec_cmp2s, ec_cmp4s, ec_cmpAlls
165    );
166 }
167 
168 
169 /* Print an ExeContext. */
VG_(pp_ExeContext)170 void VG_(pp_ExeContext) ( ExeContext* ec )
171 {
172    VG_(pp_StackTrace)( ec->ips, ec->n_ips );
173 }
174 
175 
176 /* Compare two ExeContexts.  Number of callers considered depends on res. */
VG_(eq_ExeContext)177 Bool VG_(eq_ExeContext) ( VgRes res, ExeContext* e1, ExeContext* e2 )
178 {
179    Int i;
180 
181    if (e1 == NULL || e2 == NULL)
182       return False;
183 
184    // Must be at least one address in each trace.
185    tl_assert(e1->n_ips >= 1 && e2->n_ips >= 1);
186 
187    switch (res) {
188    case Vg_LowRes:
189       /* Just compare the top two callers. */
190       ec_cmp2s++;
191       for (i = 0; i < 2; i++) {
192          if ( (e1->n_ips <= i) &&  (e2->n_ips <= i)) return True;
193          if ( (e1->n_ips <= i) && !(e2->n_ips <= i)) return False;
194          if (!(e1->n_ips <= i) &&  (e2->n_ips <= i)) return False;
195          if (e1->ips[i] != e2->ips[i])               return False;
196       }
197       return True;
198 
199    case Vg_MedRes:
200       /* Just compare the top four callers. */
201       ec_cmp4s++;
202       for (i = 0; i < 4; i++) {
203          if ( (e1->n_ips <= i) &&  (e2->n_ips <= i)) return True;
204          if ( (e1->n_ips <= i) && !(e2->n_ips <= i)) return False;
205          if (!(e1->n_ips <= i) &&  (e2->n_ips <= i)) return False;
206          if (e1->ips[i] != e2->ips[i])               return False;
207       }
208       return True;
209 
210    case Vg_HighRes:
211       ec_cmpAlls++;
212       /* Compare them all -- just do pointer comparison. */
213       if (e1 != e2) return False;
214       return True;
215 
216    default:
217       VG_(core_panic)("VG_(eq_ExeContext): unrecognised VgRes");
218    }
219 }
220 
221 /* VG_(record_ExeContext) is the head honcho here.  Take a snapshot of
222    the client's stack.  Search our collection of ExeContexts to see if
223    we already have it, and if not, allocate a new one.  Either way,
224    return a pointer to the context.  If there is a matching context we
225    guarantee to not allocate a new one.  Thus we never store
226    duplicates, and so exact equality can be quickly done as equality
227    on the returned ExeContext* values themselves.  Inspired by Hugs's
228    Text type.
229 
230    Also checks whether the hash table needs expanding, and expands it
231    if so. */
232 
ROLW(UWord w,Int n)233 static inline UWord ROLW ( UWord w, Int n )
234 {
235    Int bpw = 8 * sizeof(UWord);
236    w = (w << n) | (w >> (bpw-n));
237    return w;
238 }
239 
calc_hash(Addr * ips,UInt n_ips,UWord htab_sz)240 static UWord calc_hash ( Addr* ips, UInt n_ips, UWord htab_sz )
241 {
242    UInt  i;
243    UWord hash = 0;
244    vg_assert(htab_sz > 0);
245    for (i = 0; i < n_ips; i++) {
246       hash ^= ips[i];
247       hash = ROLW(hash, 19);
248    }
249    return hash % htab_sz;
250 }
251 
resize_ec_htab(void)252 static void resize_ec_htab ( void )
253 {
254    SizeT        i;
255    SizeT        new_size;
256    ExeContext** new_ec_htab;
257 
258    vg_assert(ec_htab_size_idx >= 0 && ec_htab_size_idx < N_EC_PRIMES);
259    if (ec_htab_size_idx == N_EC_PRIMES-1)
260       return; /* out of primes - can't resize further */
261 
262    new_size = ec_primes[ec_htab_size_idx + 1];
263    new_ec_htab = VG_(arena_malloc)(VG_AR_EXECTXT, "execontext.reh1",
264                                    sizeof(ExeContext*) * new_size);
265 
266    VG_(debugLog)(
267       1, "execontext",
268          "resizing htab from size %lu to %lu (idx %lu)  Total#ECs=%llu\n",
269          ec_htab_size, new_size, ec_htab_size_idx + 1, ec_totstored);
270 
271    for (i = 0; i < new_size; i++)
272       new_ec_htab[i] = NULL;
273 
274    for (i = 0; i < ec_htab_size; i++) {
275       ExeContext* cur = ec_htab[i];
276       while (cur) {
277          ExeContext* next = cur->chain;
278          UWord hash = calc_hash(cur->ips, cur->n_ips, new_size);
279          vg_assert(hash < new_size);
280          cur->chain = new_ec_htab[hash];
281          new_ec_htab[hash] = cur;
282          cur = next;
283       }
284    }
285 
286    VG_(arena_free)(VG_AR_EXECTXT, ec_htab);
287    ec_htab      = new_ec_htab;
288    ec_htab_size = new_size;
289    ec_htab_size_idx++;
290 }
291 
292 /* Do the first part of getting a stack trace: actually unwind the
293    stack, and hand the results off to the duplicate-trace-finder
294    (_wrk2). */
295 static ExeContext* record_ExeContext_wrk2 ( Addr* ips, UInt n_ips ); /*fwds*/
record_ExeContext_wrk(ThreadId tid,Word first_ip_delta,Bool first_ip_only)296 static ExeContext* record_ExeContext_wrk ( ThreadId tid, Word first_ip_delta,
297                                            Bool first_ip_only )
298 {
299    Addr ips[VG_DEEPEST_BACKTRACE];
300    UInt n_ips;
301 
302    init_ExeContext_storage();
303 
304    vg_assert(sizeof(void*) == sizeof(UWord));
305    vg_assert(sizeof(void*) == sizeof(Addr));
306 
307    vg_assert(VG_(is_valid_tid)(tid));
308 
309    vg_assert(VG_(clo_backtrace_size) >= 1 &&
310              VG_(clo_backtrace_size) <= VG_DEEPEST_BACKTRACE);
311 
312    if (first_ip_only) {
313       n_ips = 1;
314       ips[0] = VG_(get_IP)(tid);
315    } else {
316       n_ips = VG_(get_StackTrace)( tid, ips, VG_(clo_backtrace_size),
317                                    NULL/*array to dump SP values in*/,
318                                    NULL/*array to dump FP values in*/,
319                                    first_ip_delta );
320    }
321 
322    return record_ExeContext_wrk2 ( ips, n_ips );
323 }
324 
325 /* Do the second part of getting a stack trace: ips[0 .. n_ips-1]
326    holds a proposed trace.  Find or allocate a suitable ExeContext.
327    Note that callers must have done init_ExeContext_storage() before
328    getting to this point. */
record_ExeContext_wrk2(Addr * ips,UInt n_ips)329 static ExeContext* record_ExeContext_wrk2 ( Addr* ips, UInt n_ips )
330 {
331    Int         i;
332    Bool        same;
333    UWord       hash;
334    ExeContext* new_ec;
335    ExeContext* list;
336    ExeContext  *prev2, *prev;
337 
338    static UInt ctr = 0;
339 
340    tl_assert(n_ips >= 1 && n_ips <= VG_(clo_backtrace_size));
341 
342    /* Now figure out if we've seen this one before.  First hash it so
343       as to determine the list number. */
344    hash = calc_hash( ips, n_ips, ec_htab_size );
345 
346    /* And (the expensive bit) look a for matching entry in the list. */
347 
348    ec_searchreqs++;
349 
350    prev2 = NULL;
351    prev  = NULL;
352    list  = ec_htab[hash];
353 
354    while (True) {
355       if (list == NULL) break;
356       ec_searchcmps++;
357       same = True;
358       for (i = 0; i < n_ips; i++) {
359          if (list->ips[i] != ips[i]) {
360             same = False;
361             break;
362          }
363       }
364       if (same) break;
365       prev2 = prev;
366       prev  = list;
367       list  = list->chain;
368    }
369 
370    if (list != NULL) {
371       /* Yay!  We found it.  Once every 8 searches, move it one step
372          closer to the start of the list to make future searches
373          cheaper. */
374       if (0 == ((ctr++) & 7)) {
375          if (prev2 != NULL && prev != NULL) {
376             /* Found at 3rd or later position in the chain. */
377             vg_assert(prev2->chain == prev);
378             vg_assert(prev->chain  == list);
379             prev2->chain = list;
380             prev->chain  = list->chain;
381             list->chain  = prev;
382          }
383          else if (prev2 == NULL && prev != NULL) {
384             /* Found at 2nd position in the chain. */
385             vg_assert(ec_htab[hash] == prev);
386             vg_assert(prev->chain == list);
387             prev->chain = list->chain;
388             list->chain = prev;
389             ec_htab[hash] = list;
390          }
391       }
392       return list;
393    }
394 
395    /* Bummer.  We have to allocate a new context record. */
396    ec_totstored++;
397 
398    new_ec = VG_(arena_malloc)( VG_AR_EXECTXT, "execontext.rEw2.2",
399                                sizeof(struct _ExeContext)
400                                + n_ips * sizeof(Addr) );
401 
402    for (i = 0; i < n_ips; i++)
403       new_ec->ips[i] = ips[i];
404 
405    vg_assert(VG_(is_plausible_ECU)(ec_next_ecu));
406    new_ec->ecu = ec_next_ecu;
407    ec_next_ecu += 4;
408    if (ec_next_ecu == 0) {
409       /* Urr.  Now we're hosed; we emitted 2^30 ExeContexts already
410          and have run out of numbers.  Not sure what to do. */
411       VG_(core_panic)("m_execontext: more than 2^30 ExeContexts created");
412    }
413 
414    new_ec->n_ips = n_ips;
415    new_ec->chain = ec_htab[hash];
416    ec_htab[hash] = new_ec;
417 
418    /* Resize the hash table, maybe? */
419    if ( ((ULong)ec_totstored) > ((ULong)ec_htab_size) ) {
420       vg_assert(ec_htab_size_idx >= 0 && ec_htab_size_idx < N_EC_PRIMES);
421       if (ec_htab_size_idx < N_EC_PRIMES-1)
422          resize_ec_htab();
423    }
424 
425    return new_ec;
426 }
427 
VG_(record_ExeContext)428 ExeContext* VG_(record_ExeContext)( ThreadId tid, Word first_ip_delta ) {
429    return record_ExeContext_wrk( tid, first_ip_delta,
430                                       False/*!first_ip_only*/ );
431 }
432 
VG_(record_depth_1_ExeContext)433 ExeContext* VG_(record_depth_1_ExeContext)( ThreadId tid ) {
434    return record_ExeContext_wrk( tid, 0/*first_ip_delta*/,
435                                       True/*first_ip_only*/ );
436 }
437 
VG_(make_depth_1_ExeContext_from_Addr)438 ExeContext* VG_(make_depth_1_ExeContext_from_Addr)( Addr a ) {
439    init_ExeContext_storage();
440    return record_ExeContext_wrk2( &a, 1 );
441 }
442 
VG_(get_ExeContext_StackTrace)443 StackTrace VG_(get_ExeContext_StackTrace) ( ExeContext* e ) {
444    return e->ips;
445 }
446 
VG_(get_ECU_from_ExeContext)447 UInt VG_(get_ECU_from_ExeContext)( ExeContext* e ) {
448    vg_assert(VG_(is_plausible_ECU)(e->ecu));
449    return e->ecu;
450 }
451 
VG_(get_ExeContext_n_ips)452 Int VG_(get_ExeContext_n_ips)( ExeContext* e ) {
453    vg_assert(e->n_ips >= 1);
454    return e->n_ips;
455 }
456 
VG_(get_ExeContext_from_ECU)457 ExeContext* VG_(get_ExeContext_from_ECU)( UInt ecu )
458 {
459    UWord i;
460    ExeContext* ec;
461    vg_assert(VG_(is_plausible_ECU)(ecu));
462    vg_assert(ec_htab_size > 0);
463    for (i = 0; i < ec_htab_size; i++) {
464       for (ec = ec_htab[i]; ec; ec = ec->chain) {
465          if (ec->ecu == ecu)
466             return ec;
467       }
468    }
469    return NULL;
470 }
471 
VG_(make_ExeContext_from_StackTrace)472 ExeContext* VG_(make_ExeContext_from_StackTrace)( Addr* ips, UInt n_ips )
473 {
474    return record_ExeContext_wrk2(ips, n_ips);
475 }
476 
477 /*--------------------------------------------------------------------*/
478 /*--- end                                           m_execontext.c ---*/
479 /*--------------------------------------------------------------------*/
480