blob: 6250e1bf1eacd4806ec94597095b2e711d0659fc [file] [log] [blame]
njnea27e462005-05-31 02:38:09 +00001
2/*--------------------------------------------------------------------*/
3/*--- DebugInfo. pub_tool_debuginfo.h ---*/
4/*--------------------------------------------------------------------*/
5
6/*
7 This file is part of Valgrind, a dynamic binary instrumentation
8 framework.
9
Elliott Hughesed398002017-06-21 14:41:24 -070010 Copyright (C) 2000-2017 Julian Seward
njnea27e462005-05-31 02:38:09 +000011 jseward@acm.org
12
13 This program is free software; you can redistribute it and/or
14 modify it under the terms of the GNU General Public License as
15 published by the Free Software Foundation; either version 2 of the
16 License, or (at your option) any later version.
17
18 This program is distributed in the hope that it will be useful, but
19 WITHOUT ANY WARRANTY; without even the implied warranty of
20 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21 General Public License for more details.
22
23 You should have received a copy of the GNU General Public License
24 along with this program; if not, write to the Free Software
25 Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
26 02111-1307, USA.
27
28 The GNU General Public License is contained in the file COPYING.
29*/
30
31#ifndef __PUB_TOOL_DEBUGINFO_H
32#define __PUB_TOOL_DEBUGINFO_H
33
florian535fb1b2013-09-15 13:54:34 +000034#include "pub_tool_basics.h" // VG_ macro
florian09a8b142015-08-09 16:27:44 +000035#include "pub_tool_xarray.h" // XArray
florian535fb1b2013-09-15 13:54:34 +000036
njnea27e462005-05-31 02:38:09 +000037/*====================================================================*/
38/*=== Obtaining debug information ===*/
39/*====================================================================*/
40
Elliott Hughesed398002017-06-21 14:41:24 -070041/* IMPORTANT COMMENT about memory persistence and ownership.
42
43 Many functions below are returning a string in a HChar** argument.
44 This memory must not be freed by the caller : it belongs to the debuginfo
45 module. The returned string is *not* guaranteed to be persistent.
46 The exact persistence depends on the kind of information returned,
47 and of the internal implementation of the debuginfo module.
48 In other words: use the memory directly after the call, and if in doubt,
49 save it away.
50
51 In general, all returned strings will be invalidated when the
52 DebugInfo they correspond to is discarded. This is the case for
53 the filename, dirname, fnname and objname.
54 An objname might also be invalidated by changes to the address
55 space manager segments, e.g. if a segment is merged with another
56 segment.
57
58 Retrieving a fnname might imply a call to the c++ demangler.
59 A returned fnname is invalidated if any other call to the demangler
60 is done. In particular, this means that the memory returned by one of
61 the VG_(get_fnname...) functions is invalidated by :
62 * another call to any of the functions VG_(get_fnname...).
63 * any other call that will directly or indirectly invoke the
64 c++ demangler. Such an indirect call to the demangler can a.o. be
65 done by calls to pub_tool_errormgr.h functions.
66 So, among others, the following is WRONG:
67 VG_(get_fnname)(a1, &fnname1);
68 VG_(get_fnname)(a2, &fnname2);
69 ... it is WRONG to use fnname1 here ....
70*/
71
njnea27e462005-05-31 02:38:09 +000072/* Get the file/function/line number of the instruction at address
73 'a'. For these four, if debug info for the address is found, it
74 copies the info into the buffer/UInt and returns True. If not, it
florian46cc0452014-10-25 19:20:38 +000075 returns False. VG_(get_fnname) always
njnea27e462005-05-31 02:38:09 +000076 demangles C++ function names. VG_(get_fnname_w_offset) is the
Elliott Hughesed398002017-06-21 14:41:24 -070077 same, except it appends "+N" to symbol names to indicate offsets.
78 NOTE: See IMPORTANT COMMENT above about persistence and ownership. */
florian10ef7252014-10-27 12:06:35 +000079extern Bool VG_(get_filename) ( Addr a, const HChar** filename );
florian46cc0452014-10-25 19:20:38 +000080extern Bool VG_(get_fnname) ( Addr a, const HChar** fnname );
njnea27e462005-05-31 02:38:09 +000081extern Bool VG_(get_linenum) ( Addr a, UInt* linenum );
82extern Bool VG_(get_fnname_w_offset)
florian46cc0452014-10-25 19:20:38 +000083 ( Addr a, const HChar** fnname );
njnea27e462005-05-31 02:38:09 +000084
sewardj7cee6f92005-06-13 17:39:06 +000085/* This one is the most general. It gives filename, line number and
86 optionally directory name. filename and linenum may not be NULL.
87 dirname may be NULL, meaning that the caller does not want
florianf4384f42014-12-16 20:55:58 +000088 directory name info.
89 If dirname is non-null, directory info is written to *dirname, if
sewardj7cee6f92005-06-13 17:39:06 +000090 it is available; if not available, '\0' is written to the first
florianf4384f42014-12-16 20:55:58 +000091 byte.
sewardj7cee6f92005-06-13 17:39:06 +000092
Elliott Hughesed398002017-06-21 14:41:24 -070093 NOTE: See IMPORTANT COMMENT above about persistence and ownership.
florian10ef7252014-10-27 12:06:35 +000094
sewardj7cee6f92005-06-13 17:39:06 +000095 Returned value indicates whether any filename/line info could be
96 found. */
njnea27e462005-05-31 02:38:09 +000097extern Bool VG_(get_filename_linenum)
sewardj7cee6f92005-06-13 17:39:06 +000098 ( Addr a,
florian10ef7252014-10-27 12:06:35 +000099 /*OUT*/const HChar** filename,
100 /*OUT*/const HChar** dirname,
sewardj7cee6f92005-06-13 17:39:06 +0000101 /*OUT*/UInt* linenum );
njnea27e462005-05-31 02:38:09 +0000102
103/* Succeeds only if we find from debug info that 'a' is the address of the
104 first instruction in a function -- as opposed to VG_(get_fnname) which
105 succeeds if we find from debug info that 'a' is the address of any
106 instruction in a function. Use this to instrument the start of
107 a particular function. Nb: if an executable/shared object is stripped
108 of its symbols, this function will not be able to recognise function
Elliott Hughesed398002017-06-21 14:41:24 -0700109 entry points within it.
110 NOTE: See IMPORTANT COMMENT above about persistence and ownership. */
florian46cc0452014-10-25 19:20:38 +0000111extern Bool VG_(get_fnname_if_entry) ( Addr a, const HChar** fnname );
njnea27e462005-05-31 02:38:09 +0000112
njn68824432009-02-10 06:48:00 +0000113typedef
114 enum {
115 Vg_FnNameNormal, // A normal function.
116 Vg_FnNameMain, // "main"
117 Vg_FnNameBelowMain // Something below "main", eg. __libc_start_main.
118 } Vg_FnNameKind; // Such names are often filtered.
119
120/* Indicates what kind of fnname it is. */
florian46cc0452014-10-25 19:20:38 +0000121extern Vg_FnNameKind VG_(get_fnname_kind) ( const HChar* name );
njn68824432009-02-10 06:48:00 +0000122
123/* Like VG_(get_fnname_kind), but takes a code address. */
124extern Vg_FnNameKind VG_(get_fnname_kind_from_IP) ( Addr ip );
125
sewardjb8b79ad2008-03-03 01:35:41 +0000126/* Looks up data_addr in the collection of data symbols, and if found
127 puts its name (or as much as will fit) into dname[0 .. n_dname-1],
128 which is guaranteed to be zero terminated. Also data_addr's offset
129 from the symbol start is put into *offset. */
130extern Bool VG_(get_datasym_and_offset)( Addr data_addr,
florian46cc0452014-10-25 19:20:38 +0000131 /*OUT*/const HChar** dname,
njnc4431bf2009-01-15 21:29:24 +0000132 /*OUT*/PtrdiffT* offset );
sewardjb8b79ad2008-03-03 01:35:41 +0000133
sewardj5d9dc752009-07-15 14:52:18 +0000134/* Try to form some description of DATA_ADDR by looking at the DWARF3
philippe25963372013-01-16 22:07:02 +0000135 debug info we have. This considers all global variables, and 8
sewardj5d9dc752009-07-15 14:52:18 +0000136 frames in the stacks of all threads. Result is written at the ends
137 of DNAME{1,2}V, which are XArray*s of HChar, that have been
138 initialised by the caller, and True is returned. If no description
139 is created, False is returned. Regardless of the return value,
140 DNAME{1,2}V are guaranteed to be zero terminated after the call.
141
142 Note that after the call, DNAME{1,2} may have more than one
143 trailing zero, so callers should establish the useful text length
144 using VG_(strlen) on the contents, rather than VG_(sizeXA) on the
145 XArray itself.
146*/
147Bool VG_(get_data_description)(
florian09a8b142015-08-09 16:27:44 +0000148 /*MOD*/ XArray* /* of HChar */ dname1v,
149 /*MOD*/ XArray* /* of HChar */ dname2v,
sewardj5d9dc752009-07-15 14:52:18 +0000150 Addr data_addr
151 );
sewardjb8b79ad2008-03-03 01:35:41 +0000152
njnea27e462005-05-31 02:38:09 +0000153/* Succeeds if the address is within a shared object or the main executable.
Elliott Hughesed398002017-06-21 14:41:24 -0700154 It first searches if Addr a belongs to the text segment of debug info.
155 If not found, it asks the address space manager whether it
156 knows the name of the file associated with this mapping. */
florian46cc0452014-10-25 19:20:38 +0000157extern Bool VG_(get_objname) ( Addr a, const HChar** objname );
njnea27e462005-05-31 02:38:09 +0000158
philippea0a73932014-06-15 15:42:20 +0000159
160/* Cursor allowing to describe inlined function calls at an IP,
161 by doing successive calls to VG_(describe_IP). */
162typedef struct _InlIPCursor InlIPCursor;
163
florian770a8d22014-11-03 22:43:42 +0000164/* Returns info about the code address %eip: the address, function
njnea27e462005-05-31 02:38:09 +0000165 name (if known) and filename/line number (if known), like this:
166
167 0x4001BF05: realloc (vg_replace_malloc.c:339)
168
philippea0a73932014-06-15 15:42:20 +0000169 eip can possibly corresponds to inlined function call(s).
170 To describe eip and the inlined function calls, the following must
171 be done:
172 InlIPCursor *iipc = VG_(new_IIPC)(eip);
173 do {
florian770a8d22014-11-03 22:43:42 +0000174 buf = VG_(describe_IP)(eip, iipc);
philippea0a73932014-06-15 15:42:20 +0000175 ... use buf ...
176 } while (VG_(next_IIPC)(iipc));
177 VG_(delete_IIPC)(iipc);
178
179 To only describe eip, without the inlined calls at eip, give a NULL iipc:
florian770a8d22014-11-03 22:43:42 +0000180 buf = VG_(describe_IP)(eip, NULL);
181
182 Note, that the returned string is allocated in a static buffer local to
183 VG_(describe_IP). That buffer will be overwritten with every invocation.
184 Therefore, callers need to possibly stash away the string.
njnea27e462005-05-31 02:38:09 +0000185*/
florian770a8d22014-11-03 22:43:42 +0000186extern const HChar* VG_(describe_IP)(Addr eip, const InlIPCursor* iipc);
philippea0a73932014-06-15 15:42:20 +0000187
188/* Builds a IIPC (Inlined IP Cursor) to describe eip and all the inlined calls
189 at eip. Such a cursor must be deleted after use using VG_(delete_IIPC). */
190extern InlIPCursor* VG_(new_IIPC)(Addr eip);
191/* Move the cursor to the next call to describe.
192 Returns True if there are still calls to describe.
193 False if nothing to describe anymore. */
194extern Bool VG_(next_IIPC)(InlIPCursor *iipc);
195/* Free all memory associated with iipc. */
196extern void VG_(delete_IIPC)(InlIPCursor *iipc);
197
njnea27e462005-05-31 02:38:09 +0000198
sewardj9c606bd2008-09-18 18:12:50 +0000199
200/* Get an XArray of StackBlock which describe the stack (auto) blocks
201 for this ip. The caller is expected to free the XArray at some
202 point. If 'arrays_only' is True, only array-typed blocks are
203 returned; otherwise blocks of all types are returned. */
204
205typedef
206 struct {
njnc4431bf2009-01-15 21:29:24 +0000207 PtrdiffT base; /* offset from sp or fp */
208 SizeT szB; /* size in bytes */
209 Bool spRel; /* True => sp-rel, False => fp-rel */
210 Bool isVec; /* does block have an array type, or not? */
211 HChar name[16]; /* first 15 chars of name (asciiz) */
sewardj9c606bd2008-09-18 18:12:50 +0000212 }
213 StackBlock;
214
florian09a8b142015-08-09 16:27:44 +0000215extern XArray* /* of StackBlock */
216VG_(di_get_stack_blocks_at_ip)( Addr ip, Bool arrays_only );
sewardj9c606bd2008-09-18 18:12:50 +0000217
218
219/* Get an array of GlobalBlock which describe the global blocks owned
220 by the shared object characterised by the given di_handle. Asserts
221 if the handle is invalid. The caller is responsible for freeing
222 the array at some point. If 'arrays_only' is True, only
223 array-typed blocks are returned; otherwise blocks of all types are
224 returned. */
225
226typedef
227 struct {
228 Addr addr;
229 SizeT szB;
230 Bool isVec; /* does block have an array type, or not? */
231 HChar name[16]; /* first 15 chars of name (asciiz) */
232 HChar soname[16]; /* first 15 chars of name (asciiz) */
233 }
234 GlobalBlock;
235
florian09a8b142015-08-09 16:27:44 +0000236extern XArray* /* of GlobalBlock */
sewardj9c606bd2008-09-18 18:12:50 +0000237VG_(di_get_global_blocks_from_dihandle) ( ULong di_handle,
238 Bool arrays_only );
239
240
njnea27e462005-05-31 02:38:09 +0000241/*====================================================================*/
sewardje3f1e592009-07-31 09:41:29 +0000242/*=== Obtaining debug information ===*/
njnea27e462005-05-31 02:38:09 +0000243/*====================================================================*/
244
sewardje3f1e592009-07-31 09:41:29 +0000245/* A way to make limited debuginfo queries on a per-mapped-object
246 basis. */
247typedef struct _DebugInfo DebugInfo;
njnea27e462005-05-31 02:38:09 +0000248
sewardjb8b79ad2008-03-03 01:35:41 +0000249/* Returns NULL if the DebugInfo isn't found. It doesn't matter if
250 debug info is present or not. */
sewardje3f1e592009-07-31 09:41:29 +0000251DebugInfo* VG_(find_DebugInfo) ( Addr a );
njnea27e462005-05-31 02:38:09 +0000252
sewardjb8b79ad2008-03-03 01:35:41 +0000253/* Fish bits out of DebugInfos. */
sewardje3f1e592009-07-31 09:41:29 +0000254Addr VG_(DebugInfo_get_text_avma) ( const DebugInfo *di );
255SizeT VG_(DebugInfo_get_text_size) ( const DebugInfo *di );
bart38980222013-08-24 17:52:26 +0000256Addr VG_(DebugInfo_get_bss_avma) ( const DebugInfo *di );
257SizeT VG_(DebugInfo_get_bss_size) ( const DebugInfo *di );
sewardje3f1e592009-07-31 09:41:29 +0000258Addr VG_(DebugInfo_get_plt_avma) ( const DebugInfo *di );
259SizeT VG_(DebugInfo_get_plt_size) ( const DebugInfo *di );
260Addr VG_(DebugInfo_get_gotplt_avma) ( const DebugInfo *di );
261SizeT VG_(DebugInfo_get_gotplt_size) ( const DebugInfo *di );
bart68347832012-09-06 14:08:26 +0000262Addr VG_(DebugInfo_get_got_avma) ( const DebugInfo *di );
263SizeT VG_(DebugInfo_get_got_size) ( const DebugInfo *di );
florian1636d332012-11-15 04:27:04 +0000264const HChar* VG_(DebugInfo_get_soname) ( const DebugInfo *di );
265const HChar* VG_(DebugInfo_get_filename) ( const DebugInfo *di );
sewardje3f1e592009-07-31 09:41:29 +0000266PtrdiffT VG_(DebugInfo_get_text_bias) ( const DebugInfo *di );
njnea27e462005-05-31 02:38:09 +0000267
sewardje3f1e592009-07-31 09:41:29 +0000268/* Function for traversing the DebugInfo list. When called with NULL
269 it returns the first element; otherwise it returns the given
270 element's successor. Note that the order of elements in the list
271 changes in response to most of the queries listed in this header,
272 that explicitly or implicitly have to search the list for a
273 particular code address. So it isn't safe to assume that the order
274 of the list stays constant. */
275const DebugInfo* VG_(next_DebugInfo) ( const DebugInfo *di );
sewardj0ec07f32006-01-12 12:32:32 +0000276
sewardjb8b79ad2008-03-03 01:35:41 +0000277/* A simple enumeration to describe the 'kind' of various kinds of
278 segments that arise from the mapping of object files. */
njnea27e462005-05-31 02:38:09 +0000279typedef
280 enum {
281 Vg_SectUnknown,
282 Vg_SectText,
283 Vg_SectData,
284 Vg_SectBSS,
285 Vg_SectGOT,
sewardjb8b79ad2008-03-03 01:35:41 +0000286 Vg_SectPLT,
bart092b6262008-05-25 16:37:22 +0000287 Vg_SectGOTPLT,
sewardjb8b79ad2008-03-03 01:35:41 +0000288 Vg_SectOPD
njnea27e462005-05-31 02:38:09 +0000289 }
290 VgSectKind;
291
sewardjb8b79ad2008-03-03 01:35:41 +0000292/* Convert a VgSectKind to a string, which must be copied if you want
293 to change it. */
sewardjb8b79ad2008-03-03 01:35:41 +0000294const HChar* VG_(pp_SectKind)( VgSectKind kind );
njnea27e462005-05-31 02:38:09 +0000295
sewardjb8b79ad2008-03-03 01:35:41 +0000296/* Given an address 'a', make a guess of which section of which object
Elliott Hughesed398002017-06-21 14:41:24 -0700297 it comes from. If objname is non-NULL, then the object's name is put
298 into *objname. This only looks in debug info, it does not examine
299 the address space manager mapped files. */
300VgSectKind VG_(DebugInfo_sect_kind)( /*OUT*/const HChar** objname, Addr a);
sewardjbbec7722007-11-25 14:08:53 +0000301
302
njnea27e462005-05-31 02:38:09 +0000303#endif // __PUB_TOOL_DEBUGINFO_H
304
305/*--------------------------------------------------------------------*/
306/*--- end ---*/
307/*--------------------------------------------------------------------*/