Home | History | Annotate | Download | only in callgrind
      1 /*--------------------------------------------------------------------*/
      2 /*--- Callgrind                                                    ---*/
      3 /*---                                                 ct_threads.c ---*/
      4 /*--------------------------------------------------------------------*/
      5 
      6 /*
      7    This file is part of Callgrind, a Valgrind tool for call tracing.
      8 
      9    Copyright (C) 2002-2015, Josef Weidendorfer (Josef.Weidendorfer (at) gmx.de)
     10 
     11    This program is free software; you can redistribute it and/or
     12    modify it under the terms of the GNU General Public License as
     13    published by the Free Software Foundation; either version 2 of the
     14    License, or (at your option) any later version.
     15 
     16    This program is distributed in the hope that it will be useful, but
     17    WITHOUT ANY WARRANTY; without even the implied warranty of
     18    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
     19    General Public License for more details.
     20 
     21    You should have received a copy of the GNU General Public License
     22    along with this program; if not, write to the Free Software
     23    Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
     24    02111-1307, USA.
     25 
     26    The GNU General Public License is contained in the file COPYING.
     27 */
     28 
     29 #include "global.h"
     30 
     31 #include "pub_tool_threadstate.h"
     32 
     33 /* forward decls */
     34 static exec_state* exec_state_save(void);
     35 static exec_state* exec_state_restore(void);
     36 static exec_state* push_exec_state(int);
     37 static exec_state* top_exec_state(void);
     38 
     39 static exec_stack current_states;
     40 
     41 
     42 /*------------------------------------------------------------*/
     43 /*--- Support for multi-threading                          ---*/
     44 /*------------------------------------------------------------*/
     45 
     46 
     47 /*
     48  * For Valgrind, MT is cooperative (no preemting in our code),
     49  * so we don't need locks...
     50  *
     51  * Per-thread data:
     52  *  - BBCCs
     53  *  - call stack
     54  *  - call hash
     55  *  - event counters: last, current
     56  *
     57  * Even when ignoring MT, we need this functions to set up some
     58  * datastructures for the process (= Thread 1).
     59  */
     60 
     61 /* current running thread */
     62 ThreadId CLG_(current_tid);
     63 
     64 static thread_info** thread;
     65 
     66 thread_info** CLG_(get_threads)()
     67 {
     68   return thread;
     69 }
     70 
     71 thread_info* CLG_(get_current_thread)()
     72 {
     73   return thread[CLG_(current_tid)];
     74 }
     75 
     76 void CLG_(init_threads)()
     77 {
     78     UInt i;
     79 
     80     thread = CLG_MALLOC("cl.threads.it.1", VG_N_THREADS * sizeof thread[0]);
     81 
     82     for(i=0;i<VG_N_THREADS;i++)
     83 	thread[i] = 0;
     84     CLG_(current_tid) = VG_INVALID_THREADID;
     85 }
     86 
     87 /* switches through all threads and calls func */
     88 void CLG_(forall_threads)(void (*func)(thread_info*))
     89 {
     90   Int t, orig_tid = CLG_(current_tid);
     91 
     92   for(t=1;t<VG_N_THREADS;t++) {
     93     if (!thread[t]) continue;
     94     CLG_(switch_thread)(t);
     95     (*func)(thread[t]);
     96   }
     97   CLG_(switch_thread)(orig_tid);
     98 }
     99 
    100 
    101 static
    102 thread_info* new_thread(void)
    103 {
    104     thread_info* t;
    105 
    106     t = (thread_info*) CLG_MALLOC("cl.threads.nt.1",
    107                                   sizeof(thread_info));
    108 
    109     /* init state */
    110     CLG_(init_exec_stack)( &(t->states) );
    111     CLG_(init_call_stack)( &(t->calls) );
    112     CLG_(init_fn_stack)  ( &(t->fns) );
    113     /* t->states.entry[0]->cxt = CLG_(get_cxt)(t->fns.bottom); */
    114 
    115     /* event counters */
    116     t->lastdump_cost   = CLG_(get_eventset_cost)( CLG_(sets).full );
    117     t->sighandler_cost = CLG_(get_eventset_cost)( CLG_(sets).full );
    118     CLG_(init_cost)( CLG_(sets).full, t->lastdump_cost );
    119     CLG_(init_cost)( CLG_(sets).full, t->sighandler_cost );
    120 
    121     /* init data containers */
    122     CLG_(init_fn_array)( &(t->fn_active) );
    123     CLG_(init_bbcc_hash)( &(t->bbccs) );
    124     CLG_(init_jcc_hash)( &(t->jccs) );
    125 
    126     return t;
    127 }
    128 
    129 
    130 void CLG_(switch_thread)(ThreadId tid)
    131 {
    132   if (tid == CLG_(current_tid)) return;
    133 
    134   CLG_DEBUG(0, ">> thread %u (was %u)\n", tid, CLG_(current_tid));
    135 
    136   if (CLG_(current_tid) != VG_INVALID_THREADID) {
    137     /* save thread state */
    138     thread_info* t = thread[CLG_(current_tid)];
    139 
    140     CLG_ASSERT(t != 0);
    141 
    142     /* current context (including signal handler contexts) */
    143     exec_state_save();
    144     CLG_(copy_current_exec_stack)( &(t->states) );
    145     CLG_(copy_current_call_stack)( &(t->calls) );
    146     CLG_(copy_current_fn_stack)  ( &(t->fns) );
    147 
    148     CLG_(copy_current_fn_array) ( &(t->fn_active) );
    149     /* If we cumulate costs of threads, use TID 1 for all jccs/bccs */
    150     if (!CLG_(clo).separate_threads) t = thread[1];
    151     CLG_(copy_current_bbcc_hash)( &(t->bbccs) );
    152     CLG_(copy_current_jcc_hash) ( &(t->jccs) );
    153   }
    154 
    155   CLG_(current_tid) = tid;
    156   CLG_ASSERT(tid < VG_N_THREADS);
    157 
    158   if (tid != VG_INVALID_THREADID) {
    159     thread_info* t;
    160 
    161     /* load thread state */
    162 
    163     if (thread[tid] == 0) thread[tid] = new_thread();
    164     t = thread[tid];
    165 
    166     /* current context (including signal handler contexts) */
    167     CLG_(set_current_exec_stack)( &(t->states) );
    168     exec_state_restore();
    169     CLG_(set_current_call_stack)( &(t->calls) );
    170     CLG_(set_current_fn_stack)  ( &(t->fns) );
    171 
    172     CLG_(set_current_fn_array)  ( &(t->fn_active) );
    173     /* If we cumulate costs of threads, use TID 1 for all jccs/bccs */
    174     if (!CLG_(clo).separate_threads) t = thread[1];
    175     CLG_(set_current_bbcc_hash) ( &(t->bbccs) );
    176     CLG_(set_current_jcc_hash)  ( &(t->jccs) );
    177   }
    178 }
    179 
    180 
    181 void CLG_(run_thread)(ThreadId tid)
    182 {
    183     /* check for dumps needed */
    184     static ULong bbs_done = 0;
    185     HChar buf[50];   // large enough
    186 
    187     if (CLG_(clo).dump_every_bb >0) {
    188        if (CLG_(stat).bb_executions - bbs_done > CLG_(clo).dump_every_bb) {
    189            VG_(sprintf)(buf, "--dump-every-bb=%llu", CLG_(clo).dump_every_bb);
    190 	   CLG_(dump_profile)(buf, False);
    191            bbs_done = CLG_(stat).bb_executions;
    192        }
    193     }
    194 
    195     /* now check for thread switch */
    196     CLG_(switch_thread)(tid);
    197 }
    198 
    199 void CLG_(pre_signal)(ThreadId tid, Int sigNum, Bool alt_stack)
    200 {
    201     exec_state *es;
    202 
    203     CLG_DEBUG(0, ">> pre_signal(TID %u, sig %d, alt_st %s)\n",
    204 	     tid, sigNum, alt_stack ? "yes":"no");
    205 
    206     /* switch to the thread the handler runs in */
    207     CLG_(switch_thread)(tid);
    208 
    209     /* save current execution state */
    210     exec_state_save();
    211 
    212     /* setup new cxtinfo struct for this signal handler */
    213     es = push_exec_state(sigNum);
    214     CLG_(zero_cost)( CLG_(sets).full, es->cost );
    215     CLG_(current_state).cost = es->cost;
    216     es->call_stack_bottom = CLG_(current_call_stack).sp;
    217 
    218     /* setup current state for a spontaneous call */
    219     CLG_(init_exec_state)( &CLG_(current_state) );
    220     CLG_(current_state).sig = sigNum;
    221     CLG_(push_cxt)(0);
    222 }
    223 
    224 /* Run post-signal if the stackpointer for call stack is at
    225  * the bottom in current exec state (e.g. a signal handler)
    226  *
    227  * Called from CLG_(pop_call_stack)
    228  */
    229 void CLG_(run_post_signal_on_call_stack_bottom)()
    230 {
    231     exec_state* es = top_exec_state();
    232     CLG_ASSERT(es != 0);
    233     CLG_ASSERT(CLG_(current_state).sig >0);
    234 
    235     if (CLG_(current_call_stack).sp == es->call_stack_bottom)
    236 	CLG_(post_signal)( CLG_(current_tid), CLG_(current_state).sig );
    237 }
    238 
    239 void CLG_(post_signal)(ThreadId tid, Int sigNum)
    240 {
    241     exec_state* es;
    242     UInt fn_number, *pactive;
    243 
    244     CLG_DEBUG(0, ">> post_signal(TID %u, sig %d)\n",
    245 	     tid, sigNum);
    246 
    247     /* thread switching potentially needed, eg. with instrumentation off */
    248     CLG_(switch_thread)(tid);
    249     CLG_ASSERT(sigNum == CLG_(current_state).sig);
    250 
    251     /* Unwind call stack of this signal handler.
    252      * This should only be needed at finalisation time
    253      */
    254     es = top_exec_state();
    255     CLG_ASSERT(es != 0);
    256     while(CLG_(current_call_stack).sp > es->call_stack_bottom)
    257       CLG_(pop_call_stack)();
    258 
    259     if (CLG_(current_state).cxt) {
    260       /* correct active counts */
    261       fn_number = CLG_(current_state).cxt->fn[0]->number;
    262       pactive = CLG_(get_fn_entry)(fn_number);
    263       (*pactive)--;
    264       CLG_DEBUG(0, "  set active count of %s back to %u\n",
    265 	       CLG_(current_state).cxt->fn[0]->name, *pactive);
    266     }
    267 
    268     if (CLG_(current_fn_stack).top > CLG_(current_fn_stack).bottom) {
    269 	/* set fn_stack_top back.
    270 	 * top can point to 0 if nothing was executed in the signal handler;
    271 	 * this is possible at end on unwinding handlers.
    272 	 */
    273 	if (*(CLG_(current_fn_stack).top) != 0) {
    274 	    CLG_(current_fn_stack).top--;
    275 	    CLG_ASSERT(*(CLG_(current_fn_stack).top) == 0);
    276 	}
    277       if (CLG_(current_fn_stack).top > CLG_(current_fn_stack).bottom)
    278 	CLG_(current_fn_stack).top--;
    279     }
    280 
    281     /* sum up costs */
    282     CLG_ASSERT(CLG_(current_state).cost == es->cost);
    283     CLG_(add_and_zero_cost)( CLG_(sets).full,
    284 			    thread[CLG_(current_tid)]->sighandler_cost,
    285 			    CLG_(current_state).cost );
    286 
    287     /* restore previous context */
    288     es->sig = -1;
    289     current_states.sp--;
    290     es = top_exec_state();
    291     CLG_(current_state).sig = es->sig;
    292     exec_state_restore();
    293 
    294     /* There is no way to reliable get the thread ID we are switching to
    295      * after this handler returns. So we sync with actual TID at start of
    296      * CLG_(setup_bb)(), which should be the next for callgrind.
    297      */
    298 }
    299 
    300 
    301 
    302 /*------------------------------------------------------------*/
    303 /*--- Execution states in a thread & signal handlers       ---*/
    304 /*------------------------------------------------------------*/
    305 
    306 /* Each thread can be interrupted by a signal handler, and they
    307  * themselves again. But as there's no scheduling among handlers
    308  * of the same thread, we don't need additional stacks.
    309  * So storing execution contexts and
    310  * adding separators in the callstack(needed to not intermix normal/handler
    311  * functions in contexts) should be enough.
    312  */
    313 
    314 /* not initialized: call_stack_bottom, sig */
    315 void CLG_(init_exec_state)(exec_state* es)
    316 {
    317   es->collect = CLG_(clo).collect_atstart;
    318   es->cxt  = 0;
    319   es->jmps_passed = 0;
    320   es->bbcc = 0;
    321   es->nonskipped = 0;
    322 }
    323 
    324 
    325 static exec_state* new_exec_state(Int sigNum)
    326 {
    327     exec_state* es;
    328     es = (exec_state*) CLG_MALLOC("cl.threads.nes.1",
    329                                   sizeof(exec_state));
    330 
    331     /* allocate real cost space: needed as incremented by
    332      * simulation functions */
    333     es->cost       = CLG_(get_eventset_cost)(CLG_(sets).full);
    334     CLG_(zero_cost)( CLG_(sets).full, es->cost );
    335     CLG_(init_exec_state)(es);
    336     es->sig        = sigNum;
    337     es->call_stack_bottom  = 0;
    338 
    339     return es;
    340 }
    341 
    342 void CLG_(init_exec_stack)(exec_stack* es)
    343 {
    344   Int i;
    345 
    346   /* The first element is for the main thread */
    347   es->entry[0] = new_exec_state(0);
    348   for(i=1;i<MAX_SIGHANDLERS;i++)
    349     es->entry[i] = 0;
    350   es->sp = 0;
    351 }
    352 
    353 void CLG_(copy_current_exec_stack)(exec_stack* dst)
    354 {
    355   Int i;
    356 
    357   dst->sp = current_states.sp;
    358   for(i=0;i<MAX_SIGHANDLERS;i++)
    359     dst->entry[i] = current_states.entry[i];
    360 }
    361 
    362 void CLG_(set_current_exec_stack)(exec_stack* dst)
    363 {
    364   Int i;
    365 
    366   current_states.sp = dst->sp;
    367   for(i=0;i<MAX_SIGHANDLERS;i++)
    368     current_states.entry[i] = dst->entry[i];
    369 }
    370 
    371 
    372 /* Get top context info struct of current thread */
    373 static
    374 exec_state* top_exec_state(void)
    375 {
    376   Int sp = current_states.sp;
    377   exec_state* es;
    378 
    379   CLG_ASSERT((sp >= 0) && (sp < MAX_SIGHANDLERS));
    380   es = current_states.entry[sp];
    381   CLG_ASSERT(es != 0);
    382   return es;
    383 }
    384 
    385 /* Allocates a free context info structure for a new entered
    386  * signal handler, putting it on the context stack.
    387  * Returns a pointer to the structure.
    388  */
    389 static exec_state* push_exec_state(int sigNum)
    390 {
    391   Int sp;
    392   exec_state* es;
    393 
    394   current_states.sp++;
    395   sp = current_states.sp;
    396 
    397   CLG_ASSERT((sigNum > 0) && (sigNum <= _VKI_NSIG));
    398   CLG_ASSERT((sp > 0) && (sp < MAX_SIGHANDLERS));
    399   es = current_states.entry[sp];
    400   if (!es) {
    401     es = new_exec_state(sigNum);
    402     current_states.entry[sp] = es;
    403   }
    404   else
    405     es->sig = sigNum;
    406 
    407   return es;
    408 }
    409 
    410 /* Save current context to top cxtinfo struct */
    411 static
    412 exec_state* exec_state_save(void)
    413 {
    414   exec_state* es = top_exec_state();
    415 
    416   es->cxt         = CLG_(current_state).cxt;
    417   es->collect     = CLG_(current_state).collect;
    418   es->jmps_passed = CLG_(current_state).jmps_passed;
    419   es->bbcc        = CLG_(current_state).bbcc;
    420   es->nonskipped  = CLG_(current_state).nonskipped;
    421   CLG_ASSERT(es->cost == CLG_(current_state).cost);
    422 
    423   CLG_DEBUGIF(1) {
    424     CLG_DEBUG(1, "  cxtinfo_save(sig %d): collect %s, jmps_passed %d\n",
    425 	     es->sig, es->collect ? "Yes": "No", es->jmps_passed);
    426     CLG_(print_bbcc)(-9, es->bbcc);
    427     CLG_(print_cost)(-9, CLG_(sets).full, es->cost);
    428   }
    429 
    430   /* signal number does not need to be saved */
    431   CLG_ASSERT(CLG_(current_state).sig == es->sig);
    432 
    433   return es;
    434 }
    435 
    436 static
    437 exec_state* exec_state_restore(void)
    438 {
    439   exec_state* es = top_exec_state();
    440 
    441   CLG_(current_state).cxt     = es->cxt;
    442   CLG_(current_state).collect = es->collect;
    443   CLG_(current_state).jmps_passed = es->jmps_passed;
    444   CLG_(current_state).bbcc    = es->bbcc;
    445   CLG_(current_state).nonskipped = es->nonskipped;
    446   CLG_(current_state).cost    = es->cost;
    447   CLG_(current_state).sig     = es->sig;
    448 
    449   CLG_DEBUGIF(1) {
    450 	CLG_DEBUG(1, "  exec_state_restore(sig %d): collect %s, jmps_passed %d\n",
    451 		  es->sig, es->collect ? "Yes": "No", es->jmps_passed);
    452 	CLG_(print_bbcc)(-9, es->bbcc);
    453 	CLG_(print_cxt)(-9, es->cxt, 0);
    454 	CLG_(print_cost)(-9, CLG_(sets).full, es->cost);
    455   }
    456 
    457   return es;
    458 }
    459