blob: 17414cae18df8223c3e26afe9c1ea078e67af042 [file] [log] [blame]
weidendoa17f2a32006-03-20 10:27:30 +00001/*--------------------------------------------------------------------*/
2/*--- Callgrind ---*/
3/*--- dump.c ---*/
4/*--------------------------------------------------------------------*/
5
6/*
7 This file is part of Callgrind, a Valgrind tool for call tracing.
8
njn9f207462009-03-10 22:02:09 +00009 Copyright (C) 2002-2009, Josef Weidendorfer (Josef.Weidendorfer@gmx.de)
weidendoa17f2a32006-03-20 10:27:30 +000010
11 This program is free software; you can redistribute it and/or
12 modify it under the terms of the GNU General Public License as
13 published by the Free Software Foundation; either version 2 of the
14 License, or (at your option) any later version.
15
16 This program is distributed in the hope that it will be useful, but
17 WITHOUT ANY WARRANTY; without even the implied warranty of
18 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
19 General Public License for more details.
20
21 You should have received a copy of the GNU General Public License
22 along with this program; if not, write to the Free Software
23 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
24 02111-1307, USA.
25
26 The GNU General Public License is contained in the file COPYING.
27*/
28
29#include "config.h"
30#include "global.h"
31
32#include <pub_tool_threadstate.h>
33#include <pub_tool_libcfile.h>
34
weidendoa17f2a32006-03-20 10:27:30 +000035
36/* Dump Part Counter; read through CLG_(get_dump_counter)() */
37static Int out_counter = 0;
38
/* Output file name and directory. They are handed out by
 * CLG_(get_out_file)() and CLG_(get_out_directory)(), each of which
 * calls CLG_(init_dumps)() before returning the pointer.
 */
weidendocbf4e192007-11-27 01:27:12 +000039static Char* out_file = 0;
40static Char* out_directory = 0;
/* Not referenced in the visible part of this file; presumably set once
 * CLG_(init_dumps)() has done its work -- TODO confirm.
 */
weidendo4ce5e792006-09-20 21:29:39 +000041static Bool dumps_initialized = False;
weidendoa17f2a32006-03-20 10:27:30 +000042
43/* Command */
44static Char cmdbuf[BUF_LEN];
45
46/* Total reads/writes/misses sum over all dumps and threads.
 * Updated during CC traversal at dump time.
 * dump_total_cost receives the cost of every line written by
 * fprint_fcost() (via CLG_(add_and_zero_cost)).
 */
49FullCost CLG_(total_cost) = 0;
50static FullCost dump_total_cost = 0;
51
/* Event mapping passed to fprint_cost() for every cost line written. */
52EventMapping* CLG_(dumpmap) = 0;
53
54/* Temporary output buffer for
 * print_fn_pos, fprint_apos, fprint_fcost, fprint_jcc,
 * fprint_fcc_ln, dump_run_info, dump_state_info.
 * It is filled with VG_(sprintf), which takes no length limit, so the
 * size below is the only protection against overlong names.
 */
58static Char outbuf[FILENAME_LEN + FN_NAME_LEN + OBJ_NAME_LEN];
59
60Int CLG_(get_dump_counter)(void)
61{
62 return out_counter;
63}
64
weidendocbf4e192007-11-27 01:27:12 +000065Char* CLG_(get_out_file)()
weidendoa17f2a32006-03-20 10:27:30 +000066{
weidendod74d9f72008-10-24 18:50:00 +000067 CLG_(init_dumps)();
weidendocbf4e192007-11-27 01:27:12 +000068 return out_file;
weidendo4ce5e792006-09-20 21:29:39 +000069}
70
weidendocbf4e192007-11-27 01:27:12 +000071Char* CLG_(get_out_directory)()
weidendo4ce5e792006-09-20 21:29:39 +000072{
weidendod74d9f72008-10-24 18:50:00 +000073 CLG_(init_dumps)();
weidendocbf4e192007-11-27 01:27:12 +000074 return out_directory;
weidendoa17f2a32006-03-20 10:27:30 +000075}
76
77/*------------------------------------------------------------*/
78/*--- Output file related stuff ---*/
79/*------------------------------------------------------------*/
80
81/* Boolean dumping array.
 * dump_array is one allocation of dump_array_size flags made by
 * init_dump_array(); the four *_dumped pointers below are set there to
 * consecutive regions of it (objects, files, functions, contexts).
 * The print_* helpers index these regions by the entity's number and set
 * a flag once the entity's name has been written in compressed form.
 */
82static Bool* dump_array = 0;
83static Int dump_array_size = 0;
84static Bool* obj_dumped = 0;
85static Bool* file_dumped = 0;
86static Bool* fn_dumped = 0;
87static Bool* cxt_dumped = 0;
88
89static
90void reset_dump_array(void)
91{
92 int i;
93
94 CLG_ASSERT(dump_array != 0);
95
96 for(i=0;i<dump_array_size;i++)
97 dump_array[i] = False;
98}
99
100static
101void init_dump_array(void)
102{
103 dump_array_size = CLG_(stat).distinct_objs +
104 CLG_(stat).distinct_files +
105 CLG_(stat).distinct_fns +
106 CLG_(stat).context_counter;
107 CLG_ASSERT(dump_array == 0);
sewardj9c606bd2008-09-18 18:12:50 +0000108 dump_array = (Bool*) CLG_MALLOC("cl.dump.ida.1",
109 dump_array_size * sizeof(Bool));
weidendoa17f2a32006-03-20 10:27:30 +0000110 obj_dumped = dump_array;
111 file_dumped = obj_dumped + CLG_(stat).distinct_objs;
112 fn_dumped = file_dumped + CLG_(stat).distinct_files;
113 cxt_dumped = fn_dumped + CLG_(stat).distinct_fns;
114
115 reset_dump_array();
116
117 CLG_DEBUG(1, " init_dump_array: size %d\n", dump_array_size);
118}
119
120static __inline__
121void free_dump_array(void)
122{
123 CLG_ASSERT(dump_array != 0);
124 VG_(free)(dump_array);
125
126 dump_array = 0;
127 obj_dumped = 0;
128 file_dumped = 0;
129 fn_dumped = 0;
130 cxt_dumped = 0;
131}
132
133
134/* Initialize to an invalid position */
135static __inline__
136void init_fpos(FnPos* p)
137 {
138 p->file = 0;
139 p->fn = 0;
140 p->obj = 0;
141 p->cxt = 0;
142 p->rec_index = 0;
143}
144
145
146#if 0
147static __inline__
148static void my_fwrite(Int fd, Char* buf, Int len)
149{
150 VG_(write)(fd, (void*)buf, len);
151}
152#else
153
/* Write buffering used by my_fwrite()/fwrite_flush():
 *  FWRITE_BUFSIZE  capacity of the staging buffer,
 *  FWRITE_THROUGH  requests longer than this bypass the buffer and are
 *                  written directly.
 */
154#define FWRITE_BUFSIZE 32000
155#define FWRITE_THROUGH 10000
/* staging buffer, number of bytes currently staged, and the descriptor
 * the staged bytes belong to (-1: none yet) */
156static Char fwrite_buf[FWRITE_BUFSIZE];
157static Int fwrite_pos;
158static Int fwrite_fd = -1;
159
160static __inline__
161void fwrite_flush(void)
162{
163 if ((fwrite_fd>=0) && (fwrite_pos>0))
164 VG_(write)(fwrite_fd, (void*)fwrite_buf, fwrite_pos);
165 fwrite_pos = 0;
166}
167
168static void my_fwrite(Int fd, Char* buf, Int len)
169{
170 if (fwrite_fd != fd) {
171 fwrite_flush();
172 fwrite_fd = fd;
173 }
174 if (len > FWRITE_THROUGH) {
175 fwrite_flush();
176 VG_(write)(fd, (void*)buf, len);
177 return;
178 }
179 if (FWRITE_BUFSIZE - fwrite_pos <= len) fwrite_flush();
180 VG_(strncpy)(fwrite_buf + fwrite_pos, buf, len);
181 fwrite_pos += len;
182}
183#endif
184
185
186static void print_obj(Char* buf, obj_node* obj)
187{
njn4c245e52009-03-15 23:25:38 +0000188 //int n;
weidendoa17f2a32006-03-20 10:27:30 +0000189
190 if (CLG_(clo).compress_strings) {
191 CLG_ASSERT(obj_dumped != 0);
192 if (obj_dumped[obj->number])
njn4c245e52009-03-15 23:25:38 +0000193 /*n =*/ VG_(sprintf)(buf, "(%d)\n", obj->number);
weidendoa17f2a32006-03-20 10:27:30 +0000194 else {
njn4c245e52009-03-15 23:25:38 +0000195 /*n =*/ VG_(sprintf)(buf, "(%d) %s\n",
weidendoa17f2a32006-03-20 10:27:30 +0000196 obj->number, obj->name);
197 }
198 }
199 else
njn4c245e52009-03-15 23:25:38 +0000200 /*n =*/ VG_(sprintf)(buf, "%s\n", obj->name);
weidendoa17f2a32006-03-20 10:27:30 +0000201
202#if 0
203 /* add mapping parameters the first time a object is dumped
204 * format: mp=0xSTART SIZE 0xOFFSET */
205 if (!obj_dumped[obj->number]) {
206 obj_dumped[obj->number];
207 VG_(sprintf)(buf+n, "mp=%p %p %p\n",
208 pos->obj->start, pos->obj->size, pos->obj->offset);
209 }
210#else
211 obj_dumped[obj->number] = True;
212#endif
213}
214
215static void print_file(Char* buf, file_node* file)
216{
217 if (CLG_(clo).compress_strings) {
218 CLG_ASSERT(file_dumped != 0);
219 if (file_dumped[file->number])
220 VG_(sprintf)(buf, "(%d)\n", file->number);
221 else {
222 VG_(sprintf)(buf, "(%d) %s\n",
223 file->number, file->name);
224 file_dumped[file->number] = True;
225 }
226 }
227 else
228 VG_(sprintf)(buf, "%s\n", file->name);
229}
230
231/*
232 * tag can be "fn", "cfn", "jfn"
233 */
234static void print_fn(Int fd, Char* buf, Char* tag, fn_node* fn)
235{
236 int p;
237 p = VG_(sprintf)(buf, "%s=",tag);
238 if (CLG_(clo).compress_strings) {
239 CLG_ASSERT(fn_dumped != 0);
240 if (fn_dumped[fn->number])
241 p += VG_(sprintf)(buf+p, "(%d)\n", fn->number);
242 else {
243 p += VG_(sprintf)(buf+p, "(%d) %s\n",
244 fn->number, fn->name);
245 fn_dumped[fn->number] = True;
246 }
247 }
248 else
249 p += VG_(sprintf)(buf+p, "%s\n", fn->name);
250
251 my_fwrite(fd, buf, p);
252}
253
/* Write a "<tag>=<mangled context name>" line to fd, using buf as
 * scratch space.
 *
 * The mangled name is built from the functions of cxt, joined by ',
 * with the recursion level (rec_index+1) appended to the first function
 * when rec_index > 0. Contexts are identified in cxt_dumped by
 * cxt->base_number + rec_index.
 *
 * Three output modes, depending on the options:
 *  - compress_strings && compress_mangled: every function of the context
 *    is first written in compressed form if not done yet, then the
 *    context itself is written as a list of "(number)" references;
 *  - compress_strings only: "(number) full'name" the first time,
 *    "(number)" afterwards;
 *  - no compression: the full name.
 */
254static void print_mangled_fn(Int fd, Char* buf, Char* tag,
255 Context* cxt, int rec_index)
256{
257 int p, i;
258
259 if (CLG_(clo).compress_strings && CLG_(clo).compress_mangled) {
260
261 int n;
262 Context* last;
263
264 CLG_ASSERT(cxt_dumped != 0);
 /* already written once: a bare reference is enough */
265 if (cxt_dumped[cxt->base_number+rec_index]) {
266 p = VG_(sprintf)(buf, "%s=(%d)\n",
267 tag, cxt->base_number + rec_index);
268 my_fwrite(fd, buf, p);
269 return;
270 }
271
272 last = 0;
273 /* make sure that for all context parts compressed data is written */
274 for(i=cxt->size;i>0;i--) {
275 CLG_ASSERT(cxt->fn[i-1]->pure_cxt != 0);
276 n = cxt->fn[i-1]->pure_cxt->base_number;
277 if (cxt_dumped[n]) continue;
278 p = VG_(sprintf)(buf, "%s=(%d) %s\n",
279 tag, n, cxt->fn[i-1]->name);
280 my_fwrite(fd, buf, p);
281
282 cxt_dumped[n] = True;
 /* remember the pure context written most recently */
283 last = cxt->fn[i-1]->pure_cxt;
284 }
285 /* If the last context was the context to print, we are finished */
286 if ((last == cxt) && (rec_index == 0)) return;
287
 /* compose "(own number) (fn0)'level'(fn1)'(fn2)..." */
288 p = VG_(sprintf)(buf, "%s=(%d) (%d)", tag,
289 cxt->base_number + rec_index,
290 cxt->fn[0]->pure_cxt->base_number);
291 if (rec_index >0)
292 p += VG_(sprintf)(buf+p, "'%d", rec_index +1);
293 for(i=1;i<cxt->size;i++)
294 p += VG_(sprintf)(buf+p, "'(%d)",
295 cxt->fn[i]->pure_cxt->base_number);
296 p += VG_(sprintf)(buf+p, "\n");
297 my_fwrite(fd, buf, p);
298
299 cxt_dumped[cxt->base_number+rec_index] = True;
300 return;
301 }
302
303
 /* from here on: names are written in full, optionally with a number */
304 p = VG_(sprintf)(buf, "%s=", tag);
305 if (CLG_(clo).compress_strings) {
306 CLG_ASSERT(cxt_dumped != 0);
307 if (cxt_dumped[cxt->base_number+rec_index]) {
308 p += VG_(sprintf)(buf+p, "(%d)\n", cxt->base_number + rec_index);
309 my_fwrite(fd, buf, p);
310 return;
311 }
312 else {
313 p += VG_(sprintf)(buf+p, "(%d) ", cxt->base_number + rec_index);
314 cxt_dumped[cxt->base_number+rec_index] = True;
315 }
316 }
317
318 p += VG_(sprintf)(buf+p, "%s", cxt->fn[0]->name);
319 if (rec_index >0)
320 p += VG_(sprintf)(buf+p, "'%d", rec_index +1);
321 for(i=1;i<cxt->size;i++)
322 p += VG_(sprintf)(buf+p, "'%s", cxt->fn[i]->name);
323
324 p += VG_(sprintf)(buf+p, "\n");
325 my_fwrite(fd, buf, p);
326}
327
328
329
330/**
 * Print the function position of the BBCC (recursion level, calling
 * function, object, file, function), but only those parts that differ
 * from the <last> position; <last> is updated to the BBCC's position.
 *
 * Without name mangling, recursion level and caller are written as
 * separate "rec=" and "frfn=" lines and the function as "fn=".
 * With name mangling, a single mangled "fn=" line is written whenever
 * the context or the recursion index changed.
 *
 * Returns True if something changed (i.e. at least one line was written).
 */
335static Bool print_fn_pos(int fd, FnPos* last, BBCC* bbcc)
336{
337 Bool res = False;
338
339 CLG_DEBUGIF(3) {
340 CLG_DEBUG(2, "+ print_fn_pos: ");
341 CLG_(print_cxt)(16, bbcc->cxt, bbcc->rec_index);
342 }
343
344 if (!CLG_(clo).mangle_names) {
345 if (last->rec_index != bbcc->rec_index) {
346 VG_(sprintf)(outbuf, "rec=%d\n\n", bbcc->rec_index);
347 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
348 last->rec_index = bbcc->rec_index;
349 last->cxt = 0; /* reprint context */
350 res = True;
351 }
352
353 if (last->cxt != bbcc->cxt) {
 /* the caller is the second function of a context, if there is one */
354 fn_node* last_from = (last->cxt && last->cxt->size>1) ?
355 last->cxt->fn[1] : 0;
356 fn_node* curr_from = (bbcc->cxt && bbcc->cxt->size>1) ?
357 bbcc->cxt->fn[1] : 0;
358 if (curr_from == 0) {
359 if (last_from != 0) {
360 /* switch back to no context */
361 VG_(sprintf)(outbuf, "frfn=(spontaneous)\n");
362 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
363 res = True;
364 }
365 }
366 else if (last_from != curr_from) {
367 print_fn(fd,outbuf,"frfn", curr_from);
368 res = True;
369 }
370 last->cxt = bbcc->cxt;
371 }
372 }
373
 /* NOTE(review): bbcc->cxt is tested for NULL above but dereferenced
  * unconditionally from here on. */
374 if (last->obj != bbcc->cxt->fn[0]->file->obj) {
375 VG_(sprintf)(outbuf, "ob=");
376 print_obj(outbuf+3, bbcc->cxt->fn[0]->file->obj);
377 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
378 last->obj = bbcc->cxt->fn[0]->file->obj;
379 res = True;
380 }
381
382 if (last->file != bbcc->cxt->fn[0]->file) {
383 VG_(sprintf)(outbuf, "fl=");
384 print_file(outbuf+3, bbcc->cxt->fn[0]->file);
385 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
386 last->file = bbcc->cxt->fn[0]->file;
387 res = True;
388 }
389
390 if (!CLG_(clo).mangle_names) {
391 if (last->fn != bbcc->cxt->fn[0]) {
392 print_fn(fd,outbuf, "fn", bbcc->cxt->fn[0]);
393 last->fn = bbcc->cxt->fn[0];
394 res = True;
395 }
396 }
397 else {
398 /* Print mangled name if context or rec_index changes */
399 if ((last->rec_index != bbcc->rec_index) ||
400 (last->cxt != bbcc->cxt)) {
401
402 print_mangled_fn(fd, outbuf, "fn", bbcc->cxt, bbcc->rec_index);
403 last->fn = bbcc->cxt->fn[0];
404 last->rec_index = bbcc->rec_index;
405 res = True;
406 }
407 }
408
 /* in the mangled case this is the only place last->cxt is updated */
409 last->cxt = bbcc->cxt;
410
411 CLG_DEBUG(2, "- print_fn_pos: %s\n", res ? "changed" : "");
412
413 return res;
414}
415
416/* The debug lookup cache is useful if BBCCs for the same BB are
 * dumped directly in a row. This is a direct mapped cache: the slot of
 * an address is (address % DEBUG_CACHE_SIZE), see get_debug_pos().
 * Per slot the cache stores the address, the resolved file node and
 * line, and whether file/line information was found for the address.
 */
419#define DEBUG_CACHE_SIZE 1777
420
421static Addr debug_cache_addr[DEBUG_CACHE_SIZE];
422static file_node* debug_cache_file[DEBUG_CACHE_SIZE];
423static int debug_cache_line[DEBUG_CACHE_SIZE];
424static Bool debug_cache_info[DEBUG_CACHE_SIZE];
425
426static __inline__
427void init_debug_cache(void)
428{
429 int i;
430 for(i=0;i<DEBUG_CACHE_SIZE;i++) {
431 debug_cache_addr[i] = 0;
432 debug_cache_file[i] = 0;
433 debug_cache_line[i] = 0;
434 debug_cache_info[i] = 0;
435 }
436}
437
sewardj8cd42de2007-11-16 12:31:27 +0000438static /* __inline__ */
weidendoa17f2a32006-03-20 10:27:30 +0000439Bool get_debug_pos(BBCC* bbcc, Addr addr, AddrPos* p)
440{
441 Char file[FILENAME_LEN];
weidendo3db43222007-09-17 12:52:10 +0000442 Char dir[FILENAME_LEN];
443 Bool found_file_line, found_dirname;
weidendoa17f2a32006-03-20 10:27:30 +0000444
445 int cachepos = addr % DEBUG_CACHE_SIZE;
446
447 if (debug_cache_addr[cachepos] == addr) {
448 p->line = debug_cache_line[cachepos];
449 p->file = debug_cache_file[cachepos];
weidendo3db43222007-09-17 12:52:10 +0000450 found_file_line = debug_cache_info[cachepos];
weidendoa17f2a32006-03-20 10:27:30 +0000451 }
452 else {
weidendo3db43222007-09-17 12:52:10 +0000453 found_file_line = VG_(get_filename_linenum)(addr,
454 file, FILENAME_LEN,
455 dir, FILENAME_LEN,
456 &found_dirname,
457 &(p->line));
458 if (!found_file_line) {
weidendoa17f2a32006-03-20 10:27:30 +0000459 VG_(strcpy)(file, "???");
460 p->line = 0;
461 }
weidendo3db43222007-09-17 12:52:10 +0000462 if (found_dirname) {
463 // +1 for the '/'.
464 CLG_ASSERT(VG_(strlen)(dir) + VG_(strlen)(file) + 1 < FILENAME_LEN);
465 VG_(strcat)(dir, "/"); // Append '/'
466 VG_(strcat)(dir, file); // Append file to dir
467 VG_(strcpy)(file, dir); // Move dir+file to file
468 }
weidendoa17f2a32006-03-20 10:27:30 +0000469 p->file = CLG_(get_file_node)(bbcc->bb->obj, file);
470
weidendo3db43222007-09-17 12:52:10 +0000471 debug_cache_info[cachepos] = found_file_line;
weidendoa17f2a32006-03-20 10:27:30 +0000472 debug_cache_addr[cachepos] = addr;
473 debug_cache_line[cachepos] = p->line;
474 debug_cache_file[cachepos] = p->file;
475 }
476
477 /* Address offset from bbcc start address */
478 p->addr = addr - bbcc->bb->obj->offset;
479 p->bb_addr = bbcc->bb->offset;
480
barta0b6b2c2008-07-07 06:49:24 +0000481 CLG_DEBUG(3, " get_debug_pos(%#lx): BB %#lx, fn '%s', file '%s', line %u\n",
weidendoa17f2a32006-03-20 10:27:30 +0000482 addr, bb_addr(bbcc->bb), bbcc->cxt->fn[0]->name,
483 p->file->name, p->line);
484
weidendo3db43222007-09-17 12:52:10 +0000485 return found_file_line;
weidendoa17f2a32006-03-20 10:27:30 +0000486}
487
488
489/* copy file position and init cost */
490static void init_apos(AddrPos* p, Addr addr, Addr bbaddr, file_node* file)
491{
492 p->addr = addr;
493 p->bb_addr = bbaddr;
494 p->file = file;
495 p->line = 0;
496}
497
498static void copy_apos(AddrPos* dst, AddrPos* src)
499{
500 dst->addr = src->addr;
501 dst->bb_addr = src->bb_addr;
502 dst->file = src->file;
503 dst->line = src->line;
504}
505
506/* copy file position and init cost */
507static void init_fcost(AddrCost* c, Addr addr, Addr bbaddr, file_node* file)
508{
509 init_apos( &(c->p), addr, bbaddr, file);
510 /* FIXME: This is a memory leak as a AddrCost is inited multiple times */
511 c->cost = CLG_(get_eventset_cost)( CLG_(sets).full );
512 CLG_(init_cost)( CLG_(sets).full, c->cost );
513}
514
515
516/**
517 * print position change inside of a BB (last -> curr)
518 * this doesn't update last to curr!
519 */
520static void fprint_apos(Int fd, AddrPos* curr, AddrPos* last, file_node* func_file)
521{
522 CLG_ASSERT(curr->file != 0);
barta0b6b2c2008-07-07 06:49:24 +0000523 CLG_DEBUG(2, " print_apos(file '%s', line %d, bb %#lx, addr %#lx) fnFile '%s'\n",
weidendoa17f2a32006-03-20 10:27:30 +0000524 curr->file->name, curr->line, curr->bb_addr, curr->addr,
525 func_file->name);
526
527 if (curr->file != last->file) {
528
529 /* if we switch back to orig file, use fe=... */
530 if (curr->file == func_file)
531 VG_(sprintf)(outbuf, "fe=");
532 else
533 VG_(sprintf)(outbuf, "fi=");
534 print_file(outbuf+3, curr->file);
535 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
536 }
537
538 if (CLG_(clo).dump_bbs) {
539 if (curr->line != last->line) {
540 VG_(sprintf)(outbuf, "ln=%d\n", curr->line);
541 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
542 }
543 }
544}
545
546
547
548/**
549 * Print a position.
550 * This prints out differences if allowed
551 *
552 * This doesn't set last to curr afterwards!
553 */
554static
555void fprint_pos(Int fd, AddrPos* curr, AddrPos* last)
556{
557 if (0) //CLG_(clo).dump_bbs)
njn8a7b41b2007-09-23 00:51:24 +0000558 VG_(sprintf)(outbuf, "%lu ", curr->addr - curr->bb_addr);
weidendoa17f2a32006-03-20 10:27:30 +0000559 else {
560 int p = 0;
561 if (CLG_(clo).dump_instr) {
562 int diff = curr->addr - last->addr;
563 if ( CLG_(clo).compress_pos && (last->addr >0) &&
564 (diff > -100) && (diff < 100)) {
565 if (diff >0)
566 p = VG_(sprintf)(outbuf, "+%d ", diff);
567 else if (diff==0)
568 p = VG_(sprintf)(outbuf, "* ");
569 else
570 p = VG_(sprintf)(outbuf, "%d ", diff);
571 }
572 else
barta0b6b2c2008-07-07 06:49:24 +0000573 p = VG_(sprintf)(outbuf, "%#lx ", curr->addr);
weidendoa17f2a32006-03-20 10:27:30 +0000574 }
575
576 if (CLG_(clo).dump_bb) {
577 int diff = curr->bb_addr - last->bb_addr;
578 if ( CLG_(clo).compress_pos && (last->bb_addr >0) &&
579 (diff > -100) && (diff < 100)) {
580 if (diff >0)
581 p += VG_(sprintf)(outbuf+p, "+%d ", diff);
582 else if (diff==0)
583 p += VG_(sprintf)(outbuf+p, "* ");
584 else
585 p += VG_(sprintf)(outbuf+p, "%d ", diff);
586 }
587 else
barta0b6b2c2008-07-07 06:49:24 +0000588 p += VG_(sprintf)(outbuf+p, "%#lx ", curr->bb_addr);
weidendoa17f2a32006-03-20 10:27:30 +0000589 }
590
591 if (CLG_(clo).dump_line) {
592 int diff = curr->line - last->line;
593 if ( CLG_(clo).compress_pos && (last->line >0) &&
594 (diff > -100) && (diff < 100)) {
595
596 if (diff >0)
597 VG_(sprintf)(outbuf+p, "+%d ", diff);
598 else if (diff==0)
599 VG_(sprintf)(outbuf+p, "* ");
600 else
601 VG_(sprintf)(outbuf+p, "%d ", diff);
602 }
603 else
604 VG_(sprintf)(outbuf+p, "%u ", curr->line);
605 }
606 }
607 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
608}
609
610
611/**
612 * Print events.
613 */
614
615static
616void fprint_cost(int fd, EventMapping* es, ULong* cost)
617{
618 int p = CLG_(sprint_mappingcost)(outbuf, es, cost);
619 VG_(sprintf)(outbuf+p, "\n");
620 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
621 return;
622}
623
624
625
626/* Write the cost of a source line; only that parts of the source
627 * position are written that changed relative to last written position.
628 * funcPos is the source position of the first line of actual function.
629 * Something is written only if cost != 0; returns True in this case.
630 */
631static void fprint_fcost(Int fd, AddrCost* c, AddrPos* last)
632{
633 CLG_DEBUGIF(3) {
barta0b6b2c2008-07-07 06:49:24 +0000634 CLG_DEBUG(2, " print_fcost(file '%s', line %d, bb %#lx, addr %#lx):\n",
weidendoa17f2a32006-03-20 10:27:30 +0000635 c->p.file->name, c->p.line, c->p.bb_addr, c->p.addr);
636 CLG_(print_cost)(-5, CLG_(sets).full, c->cost);
637 }
638
639 fprint_pos(fd, &(c->p), last);
640 copy_apos( last, &(c->p) ); /* update last to current position */
641
642 fprint_cost(fd, CLG_(dumpmap), c->cost);
643
644 /* add cost to total */
645 CLG_(add_and_zero_cost)( CLG_(sets).full, dump_total_cost, c->cost );
646}
647
648
649/* Write out the calls from jcc (at pos)
650 */
651static void fprint_jcc(Int fd, jCC* jcc, AddrPos* curr, AddrPos* last, ULong ecounter)
652{
653 static AddrPos target;
654 file_node* file;
655 obj_node* obj;
656
657 CLG_DEBUGIF(2) {
658 CLG_DEBUG(2, " fprint_jcc (jkind %d)\n", jcc->jmpkind);
659 CLG_(print_jcc)(-10, jcc);
660 }
661
662 if (!get_debug_pos(jcc->to, bb_addr(jcc->to->bb), &target)) {
663 /* if we don't have debug info, don't switch to file "???" */
664 target.file = last->file;
665 }
666
667 if (jcc->from &&
668 (jcc->jmpkind == JmpCond || jcc->jmpkind == Ijk_Boring)) {
669
670 /* this is a JCC for a followed conditional or boring jump. */
671 CLG_ASSERT(CLG_(is_zero_cost)( CLG_(sets).full, jcc->cost));
672
673 /* objects among jumps should be the same.
674 * Otherwise this jump would have been changed to a call
675 * (see setup_bbcc)
676 */
677 CLG_ASSERT(jcc->from->bb->obj == jcc->to->bb->obj);
678
679 /* only print if target position info is usefull */
680 if (!CLG_(clo).dump_instr && !CLG_(clo).dump_bb && target.line==0) {
681 jcc->call_counter = 0;
682 return;
683 }
684
685 /* Different files/functions are possible e.g. with longjmp's
686 * which change the stack, and thus context
687 */
688 if (last->file != target.file) {
689 VG_(sprintf)(outbuf, "jfi=");
690 print_file(outbuf+4, target.file);
691 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
692 }
693
694 if (jcc->from->cxt != jcc->to->cxt) {
695 if (CLG_(clo).mangle_names)
696 print_mangled_fn(fd, outbuf, "jfn",
697 jcc->to->cxt, jcc->to->rec_index);
698 else
699 print_fn(fd, outbuf, "jfn", jcc->to->cxt->fn[0]);
700 }
701
702 if (jcc->jmpkind == JmpCond) {
703 /* format: jcnd=<followed>/<executions> <target> */
704 VG_(sprintf)(outbuf, "jcnd=%llu/%llu ",
705 jcc->call_counter, ecounter);
706 }
707 else {
708 /* format: jump=<jump count> <target> */
709 VG_(sprintf)(outbuf, "jump=%llu ",
710 jcc->call_counter);
711 }
712 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
713
714 fprint_pos(fd, &target, last);
715 my_fwrite(fd, "\n", 1);
716 fprint_pos(fd, curr, last);
717 my_fwrite(fd, "\n", 1);
718
719 jcc->call_counter = 0;
720 return;
721 }
722
723 CLG_ASSERT(jcc->to !=0);
724
725 file = jcc->to->cxt->fn[0]->file;
726 obj = jcc->to->bb->obj;
727
728 /* object of called position different to object of this function?*/
729 if (jcc->from->cxt->fn[0]->file->obj != obj) {
730 VG_(sprintf)(outbuf, "cob=");
731 print_obj(outbuf+4, obj);
732 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
733 }
734
735 /* file of called position different to current file? */
736 if (last->file != file) {
737 VG_(sprintf)(outbuf, "cfi=");
738 print_file(outbuf+4, file);
739 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
740 }
741
742 if (CLG_(clo).mangle_names)
743 print_mangled_fn(fd, outbuf, "cfn", jcc->to->cxt, jcc->to->rec_index);
744 else
745 print_fn(fd, outbuf, "cfn", jcc->to->cxt->fn[0]);
746
747 if (!CLG_(is_zero_cost)( CLG_(sets).full, jcc->cost)) {
748 VG_(sprintf)(outbuf, "calls=%llu ",
749 jcc->call_counter);
750 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
751
752 fprint_pos(fd, &target, last);
753 my_fwrite(fd, "\n", 1);
754 fprint_pos(fd, curr, last);
755 fprint_cost(fd, CLG_(dumpmap), jcc->cost);
756
757 CLG_(init_cost)( CLG_(sets).full, jcc->cost );
758
759 jcc->call_counter = 0;
760 }
761}
762
763
764
765/* Cost summation of functions. ccSum[0] and ccSum[1] are used
 * alternately: ccSum[currSum] accumulates the cost of recently read
 * lines with the same line number, while ccSum[1-currSum] receives the
 * position of the next instruction (see fprint_bbcc).
 */
768static AddrCost ccSum[2];
769static int currSum;
770
771/*
 * Print all costs of a BBCC:
 * - FCCs of instructions: the cost of each instruction is added to the
 *   current cost sum; the sum is written whenever the source position
 *   changes (or always, with the dump_bbs/dump_instr options)
 * - JCCs of jumps inside the BB and of the jump at the end of the BB,
 *   plus skipped cost
 * <last> is the position written last and is updated by the helpers
 * that write cost lines. The execution counters of the BBCC are reset
 * to 0 at the end.
 * Returns True if something was written.
 */
777static Bool fprint_bbcc(Int fd, BBCC* bbcc, AddrPos* last)
778{
779 InstrInfo* instr_info;
780 ULong ecounter;
781 Bool something_written = False;
782 jCC* jcc;
783 AddrCost *currCost, *newCost;
784 Int jcc_count = 0, instr, i, jmp;
785 BB* bb = bbcc->bb;
786
787 CLG_ASSERT(bbcc->cxt != 0);
788 CLG_DEBUGIF(1) {
789 VG_(printf)("+ fprint_bbcc (Instr %d): ", bb->instr_count);
weidendo09ee78e2009-02-24 12:26:53 +0000790 CLG_(print_bbcc)(15, bbcc);
weidendoa17f2a32006-03-20 10:27:30 +0000791 }
792
793 CLG_ASSERT(currSum == 0 || currSum == 1);
794 currCost = &(ccSum[currSum]);
795 newCost = &(ccSum[1-currSum]);
796
 /* ecounter: executions of the instruction currently looked at; it
  * starts with the executions of the whole BB and is reduced at every
  * side exit passed (see "update execution counter" below) */
797 ecounter = bbcc->ecounter_sum;
798 jmp = 0;
799 instr_info = &(bb->instr[0]);
800 for(instr=0; instr<bb->instr_count; instr++, instr_info++) {
801
802 /* get debug info of current instruction address and dump cost
803 * if CLG_(clo).dump_bbs or file/line has changed
804 */
805 if (!get_debug_pos(bbcc, bb_addr(bb) + instr_info->instr_offset,
806 &(newCost->p))) {
807 /* if we don't have debug info, don't switch to file "???" */
808 newCost->p.file = bbcc->cxt->fn[0]->file;
809 }
810
811 if (CLG_(clo).dump_bbs || CLG_(clo).dump_instr ||
812 (newCost->p.line != currCost->p.line) ||
813 (newCost->p.file != currCost->p.file)) {
814
815 if (!CLG_(is_zero_cost)( CLG_(sets).full, currCost->cost )) {
816 something_written = True;
817
818 fprint_apos(fd, &(currCost->p), last, bbcc->cxt->fn[0]->file);
819 fprint_fcost(fd, currCost, last);
820 }
821
822 /* switch buffers */
823 currSum = 1 - currSum;
824 currCost = &(ccSum[currSum]);
825 newCost = &(ccSum[1-currSum]);
826 }
827
828 /* add line cost to current cost sum */
829 (*CLG_(cachesim).add_icost)(currCost->cost, bbcc, instr_info, ecounter);
830
831 /* print jcc's if there are: only jumps */
832 if (bb->jmp[jmp].instr == instr) {
 /* count the non-call arcs of this exit that were taken */
833 jcc_count=0;
834 for(jcc=bbcc->jmp[jmp].jcc_list; jcc; jcc=jcc->next_from)
835 if ((jcc->jmpkind != Ijk_Call) && (jcc->call_counter >0))
836 jcc_count++;
837
838 if (jcc_count>0) {
839 if (!CLG_(is_zero_cost)( CLG_(sets).full, currCost->cost )) {
840 /* no need to switch buffers, as position is the same */
841 fprint_apos(fd, &(currCost->p), last, bbcc->cxt->fn[0]->file);
842 fprint_fcost(fd, currCost, last);
843 }
844 get_debug_pos(bbcc, bb_addr(bb)+instr_info->instr_offset, &(currCost->p));
845 fprint_apos(fd, &(currCost->p), last, bbcc->cxt->fn[0]->file);
846 something_written = True;
847 for(jcc=bbcc->jmp[jmp].jcc_list; jcc; jcc=jcc->next_from) {
848 if ((jcc->jmpkind != Ijk_Call) && (jcc->call_counter >0))
849 fprint_jcc(fd, jcc, &(currCost->p), last, ecounter);
850 }
851 }
852 }
853
854 /* update execution counter */
855 if (jmp < bb->cjmp_count)
856 if (bb->jmp[jmp].instr == instr) {
857 ecounter -= bbcc->jmp[jmp].ecounter;
858 jmp++;
859 }
860 }
861
862 /* jCCs at end? If yes, dump cumulated line info first */
863 jcc_count = 0;
864 for(jcc=bbcc->jmp[jmp].jcc_list; jcc; jcc=jcc->next_from) {
865 /* yes, if JCC only counts jmp arcs or cost >0 */
866 if ( ((jcc->jmpkind != Ijk_Call) && (jcc->call_counter >0)) ||
867 (!CLG_(is_zero_cost)( CLG_(sets).full, jcc->cost )))
868 jcc_count++;
869 }
870
871 if ( (bbcc->skipped &&
872 !CLG_(is_zero_cost)(CLG_(sets).full, bbcc->skipped)) ||
873 (jcc_count>0) ) {
874
875 if (!CLG_(is_zero_cost)( CLG_(sets).full, currCost->cost )) {
876 /* no need to switch buffers, as position is the same */
877 fprint_apos(fd, &(currCost->p), last, bbcc->cxt->fn[0]->file);
878 fprint_fcost(fd, currCost, last);
879 }
880
 /* from here on, the position is that of the jump ending the BB */
881 get_debug_pos(bbcc, bb_jmpaddr(bb), &(currCost->p));
882 fprint_apos(fd, &(currCost->p), last, bbcc->cxt->fn[0]->file);
883 something_written = True;
884
885 /* first, print skipped costs for calls */
886 if (bbcc->skipped && !CLG_(is_zero_cost)( CLG_(sets).full,
887 bbcc->skipped )) {
888 CLG_(add_and_zero_cost)( CLG_(sets).full,
889 currCost->cost, bbcc->skipped );
890#if 0
891 VG_(sprintf)(outbuf, "# Skipped\n");
892 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
893#endif
894 fprint_fcost(fd, currCost, last);
895 }
896
897 if (jcc_count > 0)
898 for(jcc=bbcc->jmp[jmp].jcc_list; jcc; jcc=jcc->next_from) {
899 CLG_ASSERT(jcc->jmp == jmp);
900 if ( ((jcc->jmpkind != Ijk_Call) && (jcc->call_counter >0)) ||
901 (!CLG_(is_zero_cost)( CLG_(sets).full, jcc->cost )))
902
903 fprint_jcc(fd, jcc, &(currCost->p), last, ecounter);
904 }
905 }
906
907 if (CLG_(clo).dump_bbs || CLG_(clo).dump_bb) {
908 if (!CLG_(is_zero_cost)( CLG_(sets).full, currCost->cost )) {
909 something_written = True;
910
911 fprint_apos(fd, &(currCost->p), last, bbcc->cxt->fn[0]->file);
912 fprint_fcost(fd, currCost, last);
913 }
914 if (CLG_(clo).dump_bbs) my_fwrite(fd, (void*)"\n", 1);
915
916 /* when every cost was immediately written, we must have done so,
917 * as this function is only called when there's cost in a BBCC
918 */
919 CLG_ASSERT(something_written);
920 }
921
 /* reset the counters of this BBCC (cjmp_count+1 jump entries) */
922 bbcc->ecounter_sum = 0;
923 for(i=0; i<=bbcc->bb->cjmp_count; i++)
924 bbcc->jmp[i].ecounter = 0;
925 bbcc->ret_counter = 0;
926
927 CLG_DEBUG(1, "- fprint_bbcc: JCCs %d\n", jcc_count);
928
929 return something_written;
930}
931
932/* order by
933 * recursion,
934 * from->bb->obj, from->bb->fn
935 * obj, fn[0]->file, fn
936 * address
937 */
938static int my_cmp(BBCC** pbbcc1, BBCC** pbbcc2)
939{
940#if 0
941 return (*pbbcc1)->bb->offset - (*pbbcc2)->bb->offset;
942#else
943 BBCC *bbcc1 = *pbbcc1;
944 BBCC *bbcc2 = *pbbcc2;
945 Context* cxt1 = bbcc1->cxt;
946 Context* cxt2 = bbcc2->cxt;
947 int off = 1;
948
949 if (cxt1->fn[0]->file->obj != cxt2->fn[0]->file->obj)
950 return cxt1->fn[0]->file->obj - cxt2->fn[0]->file->obj;
951
952 if (cxt1->fn[0]->file != cxt2->fn[0]->file)
953 return cxt1->fn[0]->file - cxt2->fn[0]->file;
954
955 if (cxt1->fn[0] != cxt2->fn[0])
956 return cxt1->fn[0] - cxt2->fn[0];
957
958 if (bbcc1->rec_index != bbcc2->rec_index)
959 return bbcc1->rec_index - bbcc2->rec_index;
960
961 while((off < cxt1->size) && (off < cxt2->size)) {
962 fn_node* ffn1 = cxt1->fn[off];
963 fn_node* ffn2 = cxt2->fn[off];
964 if (ffn1->file->obj != ffn2->file->obj)
965 return ffn1->file->obj - ffn2->file->obj;
966 if (ffn1 != ffn2)
967 return ffn1 - ffn2;
968 off++;
969 }
970 if (cxt1->size > cxt2->size) return 1;
971 else if (cxt1->size < cxt2->size) return -1;
972
973 return bbcc1->bb->offset - bbcc2->bb->offset;
974#endif
975}
976
977
978
979
980
981/* modified version of:
982 *
983 * qsort -- qsort interface implemented by faster quicksort.
984 * J. L. Bentley and M. D. McIlroy, SPE 23 (1993) 1249-1265.
985 * Copyright 1993, John Wiley.
986*/
987
988static __inline__
989void swapfunc(BBCC** a, BBCC** b, int n)
990{
991 while(n>0) {
992 BBCC* t = *a; *a = *b; *b = t;
993 a++, b++;
994 n--;
995 }
996}
997
998static __inline__
999void swap(BBCC** a, BBCC** b)
1000{
1001 BBCC* t;
1002 t = *a; *a = *b; *b = t;
1003}
1004
/* Smaller of x and y (x when equal). Function-like macro: the selected
 * argument is evaluated twice, so do not pass expressions with side
 * effects. Not used in the visible part of this file. */
1005#define min(x, y) ((x)<=(y) ? (x) : (y))
1006
1007static
1008BBCC** med3(BBCC **a, BBCC **b, BBCC **c, int (*cmp)(BBCC**,BBCC**))
1009{ return cmp(a, b) < 0 ?
1010 (cmp(b, c) < 0 ? b : cmp(a, c) < 0 ? c : a)
1011 : (cmp(b, c) > 0 ? b : cmp(a, c) > 0 ? c : a);
1012}
1013
/* Base used by the debug output of qsort() to print array indices
 * instead of pointers. It is not assigned in the visible part of this
 * file; presumably the caller sets it to the array start before sorting
 * -- TODO confirm. */
1014static BBCC** qsort_start = 0;
1015
/* Sort the n BBCC pointers starting at a in place, ascending by cmp.
 *
 * Arrays with fewer than 7 elements are sorted by insertion sort.
 * Otherwise a pivot is chosen (middle element; median of three for
 * n > 7; median of three medians for n > 40) and the array is
 * partitioned, with elements equal to the pivot first collected at both
 * ends and then swapped into the middle; the parts below and above the
 * pivot are sorted recursively.
 *
 * NOTE(review): this file-local function has the same name as the C
 * library's qsort -- confirm no libc header declaring it is included.
 */
1016static void qsort(BBCC **a, int n, int (*cmp)(BBCC**,BBCC**))
1017{
1018 BBCC **pa, **pb, **pc, **pd, **pl, **pm, **pn, **pv;
1019 int s, r;
1020 BBCC* v;
1021
barta0b6b2c2008-07-07 06:49:24 +00001022 CLG_DEBUG(8, " qsort(%ld,%ld)\n", a-qsort_start + 0L, n + 0L);
weidendoa17f2a32006-03-20 10:27:30 +00001023
1024 if (n < 7) { /* Insertion sort on smallest arrays */
1025 for (pm = a+1; pm < a+n; pm++)
1026 for (pl = pm; pl > a && cmp(pl-1, pl) > 0; pl --)
1027 swap(pl, pl-1);
1028
1029 CLG_DEBUGIF(8) {
1030 for (pm = a; pm < a+n; pm++) {
barta0b6b2c2008-07-07 06:49:24 +00001031 VG_(printf)(" %3ld BB %#lx, ",
1032 pm - qsort_start + 0L,
weidendoa17f2a32006-03-20 10:27:30 +00001033 bb_addr((*pm)->bb));
1034 CLG_(print_cxt)(9, (*pm)->cxt, (*pm)->rec_index);
1035 }
1036 }
1037 return;
1038 }
1039 pm = a + n/2; /* Small arrays, middle element */
1040 if (n > 7) {
1041 pl = a;
1042 pn = a + (n-1);
1043 if (n > 40) { /* Big arrays, pseudomedian of 9 */
1044 s = n/8;
1045 pl = med3(pl, pl+s, pl+2*s, cmp);
1046 pm = med3(pm-s, pm, pm+s, cmp);
1047 pn = med3(pn-2*s, pn-s, pn, cmp);
1048 }
1049 pm = med3(pl, pm, pn, cmp); /* Mid-size, med of 3 */
1050 }
1051
1052
 /* the pivot is copied out, so swaps in the array do not change it */
1053 v = *pm;
1054 pv = &v;
 /* pa/pd: boundaries of the pivot-equal runs at start/end,
  * pb/pc: scan positions moving towards each other */
1055 pa = pb = a;
1056 pc = pd = a + (n-1);
1057 for (;;) {
1058 while ((pb <= pc) && ((r=cmp(pb, pv)) <= 0)) {
1059 if (r==0) {
1060 /* same as pivot, to start */
1061 swap(pa,pb); pa++;
1062 }
1063 pb ++;
1064 }
1065 while ((pb <= pc) && ((r=cmp(pc, pv)) >= 0)) {
1066 if (r==0) {
1067 /* same as pivot, to end */
1068 swap(pc,pd); pd--;
1069 }
1070 pc --;
1071 }
1072 if (pb > pc) { break; }
 /* *pb is above and *pc below the pivot: exchange them */
1073 swap(pb, pc);
1074 pb ++;
1075 pc --;
1076 }
1077 pb--;
1078 pc++;
1079
1080 /* put pivot from start into middle */
1081 if ((s = pa-a)>0) { for(r=0;r<s;r++) swap(a+r, pb+1-s+r); }
1082 /* put pivot from end into middle */
1083 if ((s = a+n-1-pd)>0) { for(r=0;r<s;r++) swap(pc+r, a+n-s+r); }
1084
1085 CLG_DEBUGIF(8) {
barta0b6b2c2008-07-07 06:49:24 +00001086 VG_(printf)(" PV BB %#lx, ", bb_addr((*pv)->bb));
weidendoa17f2a32006-03-20 10:27:30 +00001087 CLG_(print_cxt)(9, (*pv)->cxt, (*pv)->rec_index);
1088
1089 s = pb-pa+1;
barta0b6b2c2008-07-07 06:49:24 +00001090 VG_(printf)(" Lower %ld - %ld:\n",
1091 a-qsort_start + 0L,
1092 a+s-1-qsort_start + 0L);
weidendoa17f2a32006-03-20 10:27:30 +00001093 for (r=0;r<s;r++) {
1094 pm = a+r;
barta0b6b2c2008-07-07 06:49:24 +00001095 VG_(printf)(" %3ld BB %#lx, ",
1096 pm-qsort_start + 0L,
1097 bb_addr((*pm)->bb));
weidendoa17f2a32006-03-20 10:27:30 +00001098 CLG_(print_cxt)(9, (*pm)->cxt, (*pm)->rec_index);
1099 }
1100
1101 s = pd-pc+1;
barta0b6b2c2008-07-07 06:49:24 +00001102 VG_(printf)(" Upper %ld - %ld:\n",
1103 a+n-s-qsort_start + 0L,
1104 a+n-1-qsort_start + 0L);
weidendoa17f2a32006-03-20 10:27:30 +00001105 for (r=0;r<s;r++) {
1106 pm = a+n-s+r;
barta0b6b2c2008-07-07 06:49:24 +00001107 VG_(printf)(" %3ld BB %#lx, ",
1108 pm-qsort_start + 0L,
1109 bb_addr((*pm)->bb));
weidendoa17f2a32006-03-20 10:27:30 +00001110 CLG_(print_cxt)(9, (*pm)->cxt, (*pm)->rec_index);
1111 }
1112 }
1113
 /* sort the lower part and the upper part, if they have more than one
  * element */
1114 if ((s = pb+1-pa) > 1) qsort(a, s, cmp);
1115 if ((s = pd+1-pc) > 1) qsort(a+n-s, s, cmp);
1116}
1117
1118
1119/* Helpers for prepare_dump */
1120
1121static Int prepare_count;
1122static BBCC** prepare_ptr;
1123
1124
1125static void hash_addCount(BBCC* bbcc)
1126{
1127 if ((bbcc->ecounter_sum > 0) || (bbcc->ret_counter>0))
1128 prepare_count++;
1129}
1130
1131static void hash_addPtr(BBCC* bbcc)
1132{
1133 if ((bbcc->ecounter_sum == 0) &&
1134 (bbcc->ret_counter == 0)) return;
1135
1136 *prepare_ptr = bbcc;
1137 prepare_ptr++;
1138}
1139
1140
1141static void cs_addCount(thread_info* ti)
1142{
1143 Int i;
1144 BBCC* bbcc;
1145
1146 /* add BBCCs with active call in call stack of current thread.
1147 * update cost sums for active calls
1148 */
1149
1150 for(i = 0; i < CLG_(current_call_stack).sp; i++) {
1151 call_entry* e = &(CLG_(current_call_stack).entry[i]);
1152 if (e->jcc == 0) continue;
1153
1154 CLG_(add_diff_cost_lz)( CLG_(sets).full, &(e->jcc->cost),
1155 e->enter_cost, CLG_(current_state).cost);
1156 bbcc = e->jcc->from;
1157
1158 CLG_DEBUG(1, " [%2d] (tid %d), added active: %s\n",
1159 i,CLG_(current_tid),bbcc->cxt->fn[0]->name);
1160
1161 if (bbcc->ecounter_sum>0 || bbcc->ret_counter>0) {
1162 /* already counted */
1163 continue;
1164 }
1165 prepare_count++;
1166 }
1167}
1168
1169static void cs_addPtr(thread_info* ti)
1170{
1171 Int i;
1172 BBCC* bbcc;
1173
1174 /* add BBCCs with active call in call stack of current thread.
1175 * update cost sums for active calls
1176 */
1177
1178 for(i = 0; i < CLG_(current_call_stack).sp; i++) {
1179 call_entry* e = &(CLG_(current_call_stack).entry[i]);
1180 if (e->jcc == 0) continue;
1181
1182 bbcc = e->jcc->from;
1183
1184 if (bbcc->ecounter_sum>0 || bbcc->ret_counter>0) {
1185 /* already counted */
1186 continue;
1187 }
1188
1189 *prepare_ptr = bbcc;
1190 prepare_ptr++;
1191 }
1192}
1193
1194
1195/**
1196 * Put all BBCCs with costs into a sorted array.
1197 * The returned arrays ends with a null pointer.
1198 * Must be freed after dumping.
1199 */
1200static
1201BBCC** prepare_dump(void)
1202{
1203 BBCC **array;
1204
1205 prepare_count = 0;
1206
1207 /* if we do not separate among threads, this gives all */
1208 /* count number of BBCCs with >0 executions */
1209 CLG_(forall_bbccs)(hash_addCount);
1210
1211 /* even if we do not separate among threads,
1212 * call stacks are separated */
1213 if (CLG_(clo).separate_threads)
1214 cs_addCount(0);
1215 else
1216 CLG_(forall_threads)(cs_addCount);
1217
1218 CLG_DEBUG(0, "prepare_dump: %d BBCCs\n", prepare_count);
1219
1220 /* allocate bbcc array, insert BBCCs and sort */
1221 prepare_ptr = array =
sewardj9c606bd2008-09-18 18:12:50 +00001222 (BBCC**) CLG_MALLOC("cl.dump.pd.1",
1223 (prepare_count+1) * sizeof(BBCC*));
weidendoa17f2a32006-03-20 10:27:30 +00001224
1225 CLG_(forall_bbccs)(hash_addPtr);
1226
1227 if (CLG_(clo).separate_threads)
1228 cs_addPtr(0);
1229 else
1230 CLG_(forall_threads)(cs_addPtr);
1231
1232 CLG_ASSERT(array + prepare_count == prepare_ptr);
1233
1234 /* end mark */
1235 *prepare_ptr = 0;
1236
1237 CLG_DEBUG(0," BBCCs inserted\n");
1238
1239 qsort_start = array;
1240 qsort(array, prepare_count, my_cmp);
1241
1242 CLG_DEBUG(0," BBCCs sorted\n");
1243
1244 return array;
1245}
1246
1247
1248
1249
1250static void fprint_cost_ln(int fd, Char* prefix,
1251 EventMapping* em, ULong* cost)
1252{
1253 int p;
1254
1255 p = VG_(sprintf)(outbuf, "%s", prefix);
1256 p += CLG_(sprint_mappingcost)(outbuf + p, em, cost);
1257 VG_(sprintf)(outbuf + p, "\n");
1258 my_fwrite(fd, (void*)outbuf, VG_(strlen)(outbuf));
1259}
1260
1261static ULong bbs_done = 0;
1262static Char* filename = 0;
1263
1264static
1265void file_err(void)
1266{
1267 VG_(message)(Vg_UserMsg,
1268 "Error: can not open cache simulation output file `%s'",
1269 filename );
1270 VG_(exit)(1);
1271}
1272
1273/**
1274 * Create a new dump file and write header.
1275 *
1276 * Naming: <CLG_(clo).filename_base>.<pid>[.<part>][-<tid>]
1277 * <part> is skipped for final dump (trigger==0)
1278 * <tid> is skipped for thread 1 with CLG_(clo).separate_threads=no
1279 *
1280 * Returns the file descriptor, and -1 on error (no write permission)
1281 */
1282static int new_dumpfile(Char buf[BUF_LEN], int tid, Char* trigger)
1283{
1284 Bool appending = False;
1285 int i, fd;
1286 FullCost sum = 0;
1287 SysRes res;
1288
weidendo4ce5e792006-09-20 21:29:39 +00001289 CLG_ASSERT(dumps_initialized);
weidendoa17f2a32006-03-20 10:27:30 +00001290 CLG_ASSERT(filename != 0);
1291
1292 if (!CLG_(clo).combine_dumps) {
weidendocbf4e192007-11-27 01:27:12 +00001293 i = VG_(sprintf)(filename, "%s", out_file);
weidendoa17f2a32006-03-20 10:27:30 +00001294
1295 if (trigger)
1296 i += VG_(sprintf)(filename+i, ".%d", out_counter);
1297
1298 if (CLG_(clo).separate_threads)
njn4c245e52009-03-15 23:25:38 +00001299 VG_(sprintf)(filename+i, "-%02d", tid);
weidendoa17f2a32006-03-20 10:27:30 +00001300
1301 res = VG_(open)(filename, VKI_O_WRONLY|VKI_O_TRUNC, 0);
1302 }
1303 else {
weidendocbf4e192007-11-27 01:27:12 +00001304 VG_(sprintf)(filename, "%s", out_file);
weidendoa17f2a32006-03-20 10:27:30 +00001305 res = VG_(open)(filename, VKI_O_WRONLY|VKI_O_APPEND, 0);
1306 if (!res.isError && out_counter>1)
1307 appending = True;
1308 }
1309
1310 if (res.isError) {
1311 res = VG_(open)(filename, VKI_O_CREAT|VKI_O_WRONLY,
1312 VKI_S_IRUSR|VKI_S_IWUSR);
1313 if (res.isError) {
1314 /* If the file can not be opened for whatever reason (conflict
1315 between multiple supervised processes?), give up now. */
1316 file_err();
1317 }
1318 }
sewardje8089302006-10-17 02:15:17 +00001319 fd = (Int) res.res;
weidendoa17f2a32006-03-20 10:27:30 +00001320
1321 CLG_DEBUG(2, " new_dumpfile '%s'\n", filename);
1322
1323 if (!appending)
1324 reset_dump_array();
1325
1326
1327 if (!appending) {
1328 /* version */
1329 VG_(sprintf)(buf, "version: 1\n");
1330 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1331
1332 /* creator */
1333 VG_(sprintf)(buf, "creator: callgrind-" VERSION "\n");
1334 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1335
1336 /* "pid:" line */
1337 VG_(sprintf)(buf, "pid: %d\n", VG_(getpid)());
1338 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1339
1340 /* "cmd:" line */
1341 VG_(strcpy)(buf, "cmd: ");
1342 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1343 my_fwrite(fd, (void*)cmdbuf, VG_(strlen)(cmdbuf));
1344 }
1345
1346 VG_(sprintf)(buf, "\npart: %d\n", out_counter);
1347 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1348 if (CLG_(clo).separate_threads) {
1349 VG_(sprintf)(buf, "thread: %d\n", tid);
1350 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1351 }
1352
1353 /* "desc:" lines */
1354 if (!appending) {
1355 my_fwrite(fd, "\n", 1);
1356
1357#if 0
1358 /* Global options changing the tracing behaviour */
1359 VG_(sprintf)(buf, "\ndesc: Option: --skip-plt=%s\n",
1360 CLG_(clo).skip_plt ? "yes" : "no");
1361 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1362 VG_(sprintf)(buf, "desc: Option: --collect-jumps=%s\n",
1363 CLG_(clo).collect_jumps ? "yes" : "no");
1364 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1365 VG_(sprintf)(buf, "desc: Option: --separate-recs=%d\n",
1366 CLG_(clo).separate_recursions);
1367 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1368 VG_(sprintf)(buf, "desc: Option: --separate-callers=%d\n",
1369 CLG_(clo).separate_callers);
1370 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1371
1372 VG_(sprintf)(buf, "desc: Option: --dump-bbs=%s\n",
1373 CLG_(clo).dump_bbs ? "yes" : "no");
1374 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1375 VG_(sprintf)(buf, "desc: Option: --separate-threads=%s\n",
1376 CLG_(clo).separate_threads ? "yes" : "no");
1377 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1378#endif
1379
1380 (*CLG_(cachesim).getdesc)(buf);
1381 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1382 }
1383
1384 VG_(sprintf)(buf, "\ndesc: Timerange: Basic block %llu - %llu\n",
1385 bbs_done, CLG_(stat).bb_executions);
1386
1387 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1388 VG_(sprintf)(buf, "desc: Trigger: %s\n",
1389 trigger ? trigger : (Char*)"Program termination");
1390 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1391
1392#if 0
1393 /* Output function specific config
1394 * FIXME */
1395 for (i = 0; i < N_FNCONFIG_ENTRIES; i++) {
1396 fnc = fnc_table[i];
1397 while (fnc) {
1398 if (fnc->skip) {
1399 VG_(sprintf)(buf, "desc: Option: --fn-skip=%s\n", fnc->name);
1400 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1401 }
1402 if (fnc->dump_at_enter) {
1403 VG_(sprintf)(buf, "desc: Option: --fn-dump-at-enter=%s\n",
1404 fnc->name);
1405 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1406 }
1407 if (fnc->dump_at_leave) {
1408 VG_(sprintf)(buf, "desc: Option: --fn-dump-at-leave=%s\n",
1409 fnc->name);
1410 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1411 }
1412 if (fnc->separate_callers != CLG_(clo).separate_callers) {
1413 VG_(sprintf)(buf, "desc: Option: --separate-callers%d=%s\n",
1414 fnc->separate_callers, fnc->name);
1415 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1416 }
1417 if (fnc->separate_recursions != CLG_(clo).separate_recursions) {
1418 VG_(sprintf)(buf, "desc: Option: --separate-recs%d=%s\n",
1419 fnc->separate_recursions, fnc->name);
1420 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1421 }
1422 fnc = fnc->next;
1423 }
1424 }
1425#endif
1426
1427 /* "positions:" line */
1428 VG_(sprintf)(buf, "\npositions:%s%s%s\n",
1429 CLG_(clo).dump_instr ? " instr" : "",
1430 CLG_(clo).dump_bb ? " bb" : "",
1431 CLG_(clo).dump_line ? " line" : "");
1432 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1433
1434 /* "events:" line */
1435 i = VG_(sprintf)(buf, "events: ");
1436 CLG_(sprint_eventmapping)(buf+i, CLG_(dumpmap));
1437 my_fwrite(fd, (void*)buf, VG_(strlen)(buf));
1438 my_fwrite(fd, "\n", 1);
1439
1440 /* summary lines */
1441 sum = CLG_(get_eventset_cost)( CLG_(sets).full );
1442 CLG_(zero_cost)(CLG_(sets).full, sum);
1443 if (CLG_(clo).separate_threads) {
1444 thread_info* ti = CLG_(get_current_thread)();
1445 CLG_(add_diff_cost)(CLG_(sets).full, sum, ti->lastdump_cost,
1446 ti->states.entry[0]->cost);
1447 }
1448 else {
1449 /* This function is called once for thread 1, where
1450 * all costs are summed up when not dumping separate per thread.
1451 * But this is not true for summary: we need to add all threads.
1452 */
1453 int t;
1454 thread_info** thr = CLG_(get_threads)();
1455 for(t=1;t<VG_N_THREADS;t++) {
1456 if (!thr[t]) continue;
1457 CLG_(add_diff_cost)(CLG_(sets).full, sum,
1458 thr[t]->lastdump_cost,
1459 thr[t]->states.entry[0]->cost);
1460 }
1461 }
1462 fprint_cost_ln(fd, "summary: ", CLG_(dumpmap), sum);
1463
1464 /* all dumped cost will be added to total_fcc */
1465 CLG_(init_cost_lz)( CLG_(sets).full, &dump_total_cost );
1466
1467 my_fwrite(fd, "\n\n",2);
1468
1469 if (VG_(clo_verbosity) > 1)
1470 VG_(message)(Vg_DebugMsg, "Dump to %s", filename);
1471
1472 return fd;
1473}
1474
1475
weidendo09ee78e2009-02-24 12:26:53 +00001476static void close_dumpfile(int fd)
weidendoa17f2a32006-03-20 10:27:30 +00001477{
1478 if (fd <0) return;
1479
1480 fprint_cost_ln(fd, "totals: ", CLG_(dumpmap),
1481 dump_total_cost);
1482 //fprint_fcc_ln(fd, "summary: ", &dump_total_fcc);
1483 CLG_(add_cost_lz)(CLG_(sets).full,
1484 &CLG_(total_cost), dump_total_cost);
1485
1486 fwrite_flush();
1487 VG_(close)(fd);
1488
1489 if (filename[0] == '.') {
1490 if (-1 == VG_(rename) (filename, filename+1)) {
1491 /* Can not rename to correct file name: give out warning */
1492 VG_(message)(Vg_DebugMsg, "Warning: Can not rename .%s to %s",
1493 filename, filename);
1494 }
1495 }
1496}
1497
1498
1499/* Helper for print_bbccs */
1500
1501static Int print_fd;
1502static Char* print_trigger;
1503static Char print_buf[BUF_LEN];
1504
1505static void print_bbccs_of_thread(thread_info* ti)
1506{
1507 BBCC **p, **array;
1508 FnPos lastFnPos;
1509 AddrPos lastAPos;
1510
1511 CLG_DEBUG(1, "+ print_bbccs(tid %d)\n", CLG_(current_tid));
1512
1513 print_fd = new_dumpfile(print_buf, CLG_(current_tid), print_trigger);
1514 if (print_fd <0) {
1515 CLG_DEBUG(1, "- print_bbccs(tid %d): No output...\n", CLG_(current_tid));
1516 return;
1517 }
1518
1519 p = array = prepare_dump();
1520 init_fpos(&lastFnPos);
1521 init_apos(&lastAPos, 0, 0, 0);
1522
1523 if (p) while(1) {
1524
1525 /* on context/function change, print old cost buffer before */
1526 if (lastFnPos.cxt && ((*p==0) ||
1527 (lastFnPos.cxt != (*p)->cxt) ||
1528 (lastFnPos.rec_index != (*p)->rec_index))) {
1529 if (!CLG_(is_zero_cost)( CLG_(sets).full, ccSum[currSum].cost )) {
1530 /* no need to switch buffers, as position is the same */
1531 fprint_apos(print_fd, &(ccSum[currSum].p), &lastAPos,
1532 lastFnPos.cxt->fn[0]->file);
1533 fprint_fcost(print_fd, &ccSum[currSum], &lastAPos);
1534 }
1535
1536 if (ccSum[currSum].p.file != lastFnPos.cxt->fn[0]->file) {
1537 /* switch back to file of function */
1538 VG_(sprintf)(print_buf, "fe=");
1539 print_file(print_buf+3, lastFnPos.cxt->fn[0]->file);
1540 my_fwrite(print_fd, (void*)print_buf, VG_(strlen)(print_buf));
1541 }
1542 my_fwrite(print_fd, "\n", 1);
1543 }
1544
1545 if (*p == 0) break;
1546
1547 if (print_fn_pos(print_fd, &lastFnPos, *p)) {
1548
1549 /* new function */
1550 init_apos(&lastAPos, 0, 0, (*p)->cxt->fn[0]->file);
1551 init_fcost(&ccSum[0], 0, 0, 0);
1552 init_fcost(&ccSum[1], 0, 0, 0);
1553 currSum = 0;
1554 }
1555
1556 if (CLG_(clo).dump_bbs) {
1557 /* FIXME: Specify Object of BB if different to object of fn */
1558 int i, pos = 0;
1559 ULong ecounter = (*p)->ecounter_sum;
barta0b6b2c2008-07-07 06:49:24 +00001560 pos = VG_(sprintf)(print_buf, "bb=%#lx ", (*p)->bb->offset);
weidendoa17f2a32006-03-20 10:27:30 +00001561 for(i = 0; i<(*p)->bb->cjmp_count;i++) {
1562 pos += VG_(sprintf)(print_buf+pos, "%d %llu ",
1563 (*p)->bb->jmp[i].instr,
1564 ecounter);
1565 ecounter -= (*p)->jmp[i].ecounter;
1566 }
1567 VG_(sprintf)(print_buf+pos, "%d %llu\n",
1568 (*p)->bb->instr_count,
1569 ecounter);
1570 my_fwrite(print_fd, (void*)print_buf, VG_(strlen)(print_buf));
1571 }
1572
1573 fprint_bbcc(print_fd, *p, &lastAPos);
1574
1575 p++;
1576 }
sewardje8089302006-10-17 02:15:17 +00001577
weidendo09ee78e2009-02-24 12:26:53 +00001578 close_dumpfile(print_fd);
weidendoa17f2a32006-03-20 10:27:30 +00001579 if (array) VG_(free)(array);
1580
1581 /* set counters of last dump */
1582 CLG_(copy_cost)( CLG_(sets).full, ti->lastdump_cost,
1583 CLG_(current_state).cost );
1584
1585 CLG_DEBUG(1, "- print_bbccs(tid %d)\n", CLG_(current_tid));
1586}
1587
1588
1589static void print_bbccs(Char* trigger, Bool only_current_thread)
1590{
1591 init_dump_array();
1592 init_debug_cache();
1593
1594 print_fd = -1;
1595 print_trigger = trigger;
1596
1597 if (!CLG_(clo).separate_threads) {
1598 /* All BBCC/JCC costs is stored for thread 1 */
1599 Int orig_tid = CLG_(current_tid);
1600
1601 CLG_(switch_thread)(1);
1602 print_bbccs_of_thread( CLG_(get_current_thread)() );
1603 CLG_(switch_thread)(orig_tid);
1604 }
1605 else if (only_current_thread)
1606 print_bbccs_of_thread( CLG_(get_current_thread)() );
1607 else
1608 CLG_(forall_threads)(print_bbccs_of_thread);
1609
1610 free_dump_array();
1611}
1612
1613
1614void CLG_(dump_profile)(Char* trigger, Bool only_current_thread)
1615{
1616 CLG_DEBUG(2, "+ dump_profile(Trigger '%s')\n",
1617 trigger ? trigger : (Char*)"Prg.Term.");
1618
weidendod74d9f72008-10-24 18:50:00 +00001619 CLG_(init_dumps)();
1620
weidendoa17f2a32006-03-20 10:27:30 +00001621 if (VG_(clo_verbosity) > 1)
1622 VG_(message)(Vg_DebugMsg, "Start dumping at BB %llu (%s)...",
1623 CLG_(stat).bb_executions,
1624 trigger ? trigger : (Char*)"Prg.Term.");
1625
1626 out_counter++;
1627
1628 print_bbccs(trigger, only_current_thread);
1629
weidendoa17f2a32006-03-20 10:27:30 +00001630 bbs_done = CLG_(stat).bb_executions++;
1631
1632 if (VG_(clo_verbosity) > 1)
1633 VG_(message)(Vg_DebugMsg, "Dumping done.");
1634}
1635
1636/* copy command to cmd buffer (could change) */
1637static
1638void init_cmdbuf(void)
1639{
1640 Int i,j,size = 0;
1641 HChar* argv;
1642
weidendoa17f2a32006-03-20 10:27:30 +00001643 if (VG_(args_the_exename))
1644 size = VG_(sprintf)(cmdbuf, " %s", VG_(args_the_exename));
1645
sewardj14c7cc52007-02-25 15:08:24 +00001646 for(i = 0; i < VG_(sizeXA)( VG_(args_for_client) ); i++) {
1647 argv = * (HChar**) VG_(indexXA)( VG_(args_for_client), i );
weidendoa17f2a32006-03-20 10:27:30 +00001648 if (!argv) continue;
1649 if ((size>0) && (size < BUF_LEN)) cmdbuf[size++] = ' ';
1650 for(j=0;argv[j]!=0;j++)
1651 if (size < BUF_LEN) cmdbuf[size++] = argv[j];
1652 }
weidendoa17f2a32006-03-20 10:27:30 +00001653
1654 if (size == BUF_LEN) size--;
1655 cmdbuf[size] = 0;
1656}
1657
weidendo4ce5e792006-09-20 21:29:39 +00001658/*
weidendocbf4e192007-11-27 01:27:12 +00001659 * Set up file names for dump output: <out_directory>, <out_file>.
1660 * <out_file> is derived from the output format string, which defaults
1661 * to "callgrind.out.%p", where %p is replaced with the PID.
1662 * For the final file name, on intermediate dumps a counter is appended,
1663 * and further, if separate dumps per thread are requested, the thread ID.
weidendo4ce5e792006-09-20 21:29:39 +00001664 *
weidendocbf4e192007-11-27 01:27:12 +00001665 * <out_file> always starts with a full absolute path.
1666 * If the output format string represents a relative path, the current
1667 * working directory at program start is used.
weidendod74d9f72008-10-24 18:50:00 +00001668 *
1669 * This function has to be called every time a profile dump is generated
1670 * to be able to react on PID changes.
weidendo4ce5e792006-09-20 21:29:39 +00001671 */
1672void CLG_(init_dumps)()
weidendoa17f2a32006-03-20 10:27:30 +00001673{
weidendocbf4e192007-11-27 01:27:12 +00001674 Int lastSlash, i;
weidendo4ce5e792006-09-20 21:29:39 +00001675 SysRes res;
weidendoa17f2a32006-03-20 10:27:30 +00001676
weidendod74d9f72008-10-24 18:50:00 +00001677 static int thisPID = 0;
1678 int currentPID = VG_(getpid)();
1679 if (currentPID == thisPID) {
1680 /* already initialized, and no PID change */
1681 CLG_ASSERT(out_file != 0);
1682 return;
1683 }
1684 thisPID = currentPID;
1685
weidendocbf4e192007-11-27 01:27:12 +00001686 if (!CLG_(clo).out_format)
1687 CLG_(clo).out_format = DEFAULT_OUTFORMAT;
1688
weidendod74d9f72008-10-24 18:50:00 +00001689 /* If a file name was already set, clean up before */
1690 if (out_file) {
1691 VG_(free)(out_file);
1692 VG_(free)(out_directory);
1693 VG_(free)(filename);
1694 out_counter = 0;
1695 }
1696
weidendocbf4e192007-11-27 01:27:12 +00001697 // Setup output filename.
1698 out_file =
1699 VG_(expand_file_name)("--callgrind-out-file", CLG_(clo).out_format);
weidendoa17f2a32006-03-20 10:27:30 +00001700
1701 /* get base directory for dump/command/result files */
weidendocbf4e192007-11-27 01:27:12 +00001702 CLG_ASSERT(out_file[0] == '/');
1703 lastSlash = 0;
1704 i = 1;
1705 while(out_file[i]) {
1706 if (out_file[i] == '/') lastSlash = i;
1707 i++;
weidendoa17f2a32006-03-20 10:27:30 +00001708 }
weidendocbf4e192007-11-27 01:27:12 +00001709 i = lastSlash;
sewardj9c606bd2008-09-18 18:12:50 +00001710 out_directory = (Char*) CLG_MALLOC("cl.dump.init_dumps.1", i+1);
weidendocbf4e192007-11-27 01:27:12 +00001711 VG_(strncpy)(out_directory, out_file, i);
1712 out_directory[i] = 0;
weidendoa17f2a32006-03-20 10:27:30 +00001713
1714 /* allocate space big enough for final filenames */
sewardj9c606bd2008-09-18 18:12:50 +00001715 filename = (Char*) CLG_MALLOC("cl.dump.init_dumps.2",
1716 VG_(strlen)(out_file)+32);
weidendoa17f2a32006-03-20 10:27:30 +00001717 CLG_ASSERT(filename != 0);
1718
1719 /* Make sure the output base file can be written.
1720 * This is used for the dump at program termination.
1721 * We stop with an error here if we can not create the
1722 * file: This is probably because of missing rights,
1723 * and trace parts wouldn't be allowed to be written, too.
1724 */
weidendocbf4e192007-11-27 01:27:12 +00001725 VG_(strcpy)(filename, out_file);
weidendoa17f2a32006-03-20 10:27:30 +00001726 res = VG_(open)(filename, VKI_O_WRONLY|VKI_O_TRUNC, 0);
1727 if (res.isError) {
1728 res = VG_(open)(filename, VKI_O_CREAT|VKI_O_WRONLY,
1729 VKI_S_IRUSR|VKI_S_IWUSR);
1730 if (res.isError) {
1731 file_err();
1732 }
1733 }
sewardje8089302006-10-17 02:15:17 +00001734 if (!res.isError) VG_(close)( (Int)res.res );
weidendoa17f2a32006-03-20 10:27:30 +00001735
weidendod74d9f72008-10-24 18:50:00 +00001736 if (!dumps_initialized)
1737 init_cmdbuf();
weidendo4ce5e792006-09-20 21:29:39 +00001738
1739 dumps_initialized = True;
weidendoa17f2a32006-03-20 10:27:30 +00001740}