blob: 9a19973b12e1f6501b55f1302c18e011a1a2c7e1 [file] [log] [blame]
Chris Lattner24943d22010-06-08 16:52:24 +00001//===-- Symtab.cpp ----------------------------------------------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10#include <map>
11
12#include "lldb/Core/Module.h"
13#include "lldb/Core/RegularExpression.h"
14#include "lldb/Core/Timer.h"
15#include "lldb/Symbol/ObjectFile.h"
16#include "lldb/Symbol/Symtab.h"
17
18using namespace lldb;
19using namespace lldb_private;
20
21
22
23Symtab::Symtab(ObjectFile *objfile) :
24 m_objfile(objfile),
25 m_symbols(),
26 m_addr_indexes(),
27 m_name_to_index()
28{
29}
30
31Symtab::~Symtab()
32{
33}
34
35void
36Symtab::Reserve(uint32_t count)
37{
38 m_symbols.reserve (count);
39}
40
41Symbol *
42Symtab::Resize(uint32_t count)
43{
44 m_symbols.resize (count);
45 return &m_symbols[0];
46}
47
48uint32_t
49Symtab::AddSymbol(const Symbol& symbol)
50{
51 uint32_t symbol_idx = m_symbols.size();
52 m_name_to_index.Clear();
53 m_addr_indexes.clear();
54 m_symbols.push_back(symbol);
55 return symbol_idx;
56}
57
58size_t
59Symtab::GetNumSymbols() const
60{
61 return m_symbols.size();
62}
63
64void
65Symtab::Dump(Stream *s, Process *process) const
66{
67 const_iterator pos;
68 s->Printf("%.*p: ", (int)sizeof(void*) * 2, this);
69 s->Indent();
70 const FileSpec &file_spec = m_objfile->GetFileSpec();
71 const char * object_name = NULL;
72 if (m_objfile->GetModule())
73 object_name = m_objfile->GetModule()->GetObjectName().GetCString();
74
75 if (file_spec)
76 s->Printf("Symtab, file = %s/%s%s%s%s, num_symbols = %u:\n",
77 file_spec.GetDirectory().AsCString(),
78 file_spec.GetFilename().AsCString(),
79 object_name ? "(" : "",
80 object_name ? object_name : "",
81 object_name ? ")" : "",
82 m_symbols.size());
83 else
84 s->Printf("Symtab, num_symbols = %u:\n", m_symbols.size());
85 s->IndentMore();
86
87 if (!m_symbols.empty())
88 {
89 const_iterator begin = m_symbols.begin();
90 const_iterator end = m_symbols.end();
91 DumpSymbolHeader (s);
92 for (pos = m_symbols.begin(); pos != end; ++pos)
93 {
94 s->Indent();
95 pos->Dump(s, process, std::distance(begin, pos));
96 }
97 }
98 s->IndentLess ();
99}
100
101void
102Symtab::Dump(Stream *s, Process *process, std::vector<uint32_t>& indexes) const
103{
104 const size_t num_symbols = GetNumSymbols();
105 s->Printf("%.*p: ", (int)sizeof(void*) * 2, this);
106 s->Indent();
107 s->Printf("Symtab %u symbol indexes (%u symbols total):\n", indexes.size(), m_symbols.size());
108 s->IndentMore();
109
110 if (!indexes.empty())
111 {
112 std::vector<uint32_t>::const_iterator pos;
113 std::vector<uint32_t>::const_iterator end = indexes.end();
114 DumpSymbolHeader (s);
115 for (pos = indexes.begin(); pos != end; ++pos)
116 {
117 uint32_t idx = *pos;
118 if (idx < num_symbols)
119 {
120 s->Indent();
121 m_symbols[idx].Dump(s, process, idx);
122 }
123 }
124 }
125 s->IndentLess ();
126}
127
128void
129Symtab::DumpSymbolHeader (Stream *s)
130{
131 s->Indent(" Debug symbol\n");
132 s->Indent(" |Synthetic symbol\n");
133 s->Indent(" ||Externally Visible\n");
134 s->Indent(" |||\n");
135 s->Indent("Index UserID DSX Type File Address/Value Load Address Size Flags Name\n");
136 s->Indent("------- ------ --- ------------ ------------------ ------------------ ------------------ ---------- ----------------------------------\n");
137}
138
139Symbol *
140Symtab::SymbolAtIndex(uint32_t idx)
141{
142 if (idx < m_symbols.size())
143 return &m_symbols[idx];
144 return NULL;
145}
146
147
148const Symbol *
149Symtab::SymbolAtIndex(uint32_t idx) const
150{
151 if (idx < m_symbols.size())
152 return &m_symbols[idx];
153 return NULL;
154}
155
156//----------------------------------------------------------------------
157// InitNameIndexes
158//----------------------------------------------------------------------
159void
160Symtab::InitNameIndexes()
161{
162 Timer scoped_timer (__PRETTY_FUNCTION__, "%s", __PRETTY_FUNCTION__);
163 // Create the name index vector to be able to quickly search by name
164 const size_t count = m_symbols.size();
165 assert(m_objfile != NULL);
166 assert(m_objfile->GetModule() != NULL);
167 m_name_to_index.Reserve (count);
168
169 UniqueCStringMap<uint32_t>::Entry entry;
170
171 for (entry.value = 0; entry.value < count; ++entry.value)
172 {
173 const Symbol *symbol = &m_symbols[entry.value];
174
175 // Don't let trampolines get into the lookup by name map
176 // If we ever need the trampoline symbols to be searchable by name
177 // we can remove this and then possibly add a new bool to any of the
178 // Symtab functions that lookup symbols by name to indicate if they
179 // want trampolines.
180 if (symbol->IsTrampoline())
181 continue;
182
183 const Mangled &mangled = symbol->GetMangled();
184 entry.cstring = mangled.GetMangledName().GetCString();
185 if (entry.cstring && entry.cstring[0])
186 m_name_to_index.Append (entry);
187
188 entry.cstring = mangled.GetDemangledName().GetCString();
189 if (entry.cstring && entry.cstring[0])
190 m_name_to_index.Append (entry);
191 }
192 m_name_to_index.Sort();
193}
194
195uint32_t
196Symtab::AppendSymbolIndexesWithType(SymbolType symbol_type, std::vector<uint32_t>& indexes, uint32_t start_idx, uint32_t end_index) const
197{
198 uint32_t prev_size = indexes.size();
199
200 const uint32_t count = std::min<uint32_t> (m_symbols.size(), end_index);
201
202 for (uint32_t i = start_idx; i < count; ++i)
203 {
204 if (symbol_type == eSymbolTypeAny || m_symbols[i].GetType() == symbol_type)
205 indexes.push_back(i);
206 }
207
208 return indexes.size() - prev_size;
209}
210
// Plain aggregate pairing a "sort by load address" flag with a pointer
// to an array of symbols.
// NOTE(review): nothing in the visible part of this file references this
// type (the sort callback below receives the raw symbol array as its
// thunk instead) -- confirm whether it is still needed.
struct SymbolSortInfo
{
    const bool sort_by_load_addr;   // presumably selects load vs. file address ordering; unused here
    const Symbol *symbols;          // symbol array the sorted indexes would refer to
};
216
217int
218Symtab::CompareSymbolValueByIndex (void *thunk, const void *a, const void *b)
219{
220 const Symbol *symbols = (const Symbol *)thunk;
221 uint32_t index_a = *((uint32_t *) a);
222 uint32_t index_b = *((uint32_t *) b);
223
224 addr_t value_a;
225 addr_t value_b;
226 if (symbols[index_a].GetValue().GetSection() == symbols[index_b].GetValue().GetSection())
227 {
228 value_a = symbols[index_a].GetValue ().GetOffset();
229 value_b = symbols[index_b].GetValue ().GetOffset();
230 }
231 else
232 {
233 value_a = symbols[index_a].GetValue ().GetFileAddress();
234 value_b = symbols[index_b].GetValue ().GetFileAddress();
235 }
236
237 if (value_a == value_b)
238 {
239 // The if the values are equal, use the original symbol user ID
240 lldb::user_id_t uid_a = symbols[index_a].GetID();
241 lldb::user_id_t uid_b = symbols[index_b].GetID();
242 if (uid_a < uid_b)
243 return -1;
244 if (uid_a > uid_b)
245 return 1;
246 return 0;
247 }
248 else if (value_a < value_b)
249 return -1;
250
251 return 1;
252}
253
Eli Friedman020f3532010-06-10 23:36:31 +0000254int Symtab::CompareSymbolValueByIndexLinux(const void* a, const void* b, void* thunk) {
255 CompareSymbolValueByIndex(thunk, a, b);
256}
257
Chris Lattner24943d22010-06-08 16:52:24 +0000258void
259Symtab::SortSymbolIndexesByValue (std::vector<uint32_t>& indexes, bool remove_duplicates) const
260{
261 // No need to sort if we have zero or one items...
262 if (indexes.size() <= 1)
263 return;
264
265 // Sort the indexes in place using qsort
Eli Friedman020f3532010-06-10 23:36:31 +0000266 // FIXME: (WRONGDEFINE) Need a better define for this!
267#ifdef __APPLE__
Chris Lattner24943d22010-06-08 16:52:24 +0000268 ::qsort_r (&indexes[0], indexes.size(), sizeof(uint32_t), (void *)&m_symbols[0], Symtab::CompareSymbolValueByIndex);
Eli Friedman020f3532010-06-10 23:36:31 +0000269#else
270 ::qsort_r (&indexes[0], indexes.size(), sizeof(uint32_t), CompareSymbolValueByIndexLinux, (void *)&m_symbols[0]);
271#endif
Chris Lattner24943d22010-06-08 16:52:24 +0000272
273 // Remove any duplicates if requested
274 if (remove_duplicates)
275 std::unique(indexes.begin(), indexes.end());
276}
277
278uint32_t
279Symtab::AppendSymbolIndexesWithName(const ConstString& symbol_name, std::vector<uint32_t>& indexes)
280{
281 Timer scoped_timer (__PRETTY_FUNCTION__, "%s", __PRETTY_FUNCTION__);
282 if (symbol_name)
283 {
284 const size_t old_size = indexes.size();
285 if (m_name_to_index.IsEmpty())
286 InitNameIndexes();
287
288 const char *symbol_cstr = symbol_name.GetCString();
289 const UniqueCStringMap<uint32_t>::Entry *entry_ptr;
290 for (entry_ptr = m_name_to_index.FindFirstValueForName (symbol_cstr);
291 entry_ptr!= NULL;
292 entry_ptr = m_name_to_index.FindNextValueForName (symbol_cstr, entry_ptr))
293 {
294 indexes.push_back (entry_ptr->value);
295 }
296 return indexes.size() - old_size;
297 }
298 return 0;
299}
300
301uint32_t
302Symtab::AppendSymbolIndexesWithNameAndType(const ConstString& symbol_name, SymbolType symbol_type, std::vector<uint32_t>& indexes)
303{
304 if (AppendSymbolIndexesWithName(symbol_name, indexes) > 0)
305 {
306 std::vector<uint32_t>::iterator pos = indexes.begin();
307 while (pos != indexes.end())
308 {
309 if (symbol_type == eSymbolTypeAny || m_symbols[*pos].GetType() == symbol_type)
310 ++pos;
311 else
312 indexes.erase(pos);
313 }
314 }
315 return indexes.size();
316}
317
318uint32_t
319Symtab::AppendSymbolIndexesMatchingRegExAndType (const RegularExpression &regexp, SymbolType symbol_type, std::vector<uint32_t>& indexes)
320{
321 uint32_t prev_size = indexes.size();
322 uint32_t sym_end = m_symbols.size();
323
324 for (int i = 0; i < sym_end; i++)
325 {
326 if (symbol_type == eSymbolTypeAny || m_symbols[i].GetType() == symbol_type)
327 {
328 const char *name = m_symbols[i].GetMangled().GetName().AsCString();
329 if (name)
330 {
331 if (regexp.Execute (name))
332 indexes.push_back(i);
333 }
334 }
335 }
336 return indexes.size() - prev_size;
337
338}
339
340Symbol *
341Symtab::FindSymbolWithType(SymbolType symbol_type, uint32_t& start_idx)
342{
343 const size_t count = m_symbols.size();
344 for (uint32_t idx = start_idx; idx < count; ++idx)
345 {
346 if (symbol_type == eSymbolTypeAny || m_symbols[idx].GetType() == symbol_type)
347 {
348 start_idx = idx;
349 return &m_symbols[idx];
350 }
351 }
352 return NULL;
353}
354
355const Symbol *
356Symtab::FindSymbolWithType(SymbolType symbol_type, uint32_t& start_idx) const
357{
358 const size_t count = m_symbols.size();
359 for (uint32_t idx = start_idx; idx < count; ++idx)
360 {
361 if (symbol_type == eSymbolTypeAny || m_symbols[idx].GetType() == symbol_type)
362 {
363 start_idx = idx;
364 return &m_symbols[idx];
365 }
366 }
367 return NULL;
368}
369
370size_t
371Symtab::FindAllSymbolsWithNameAndType (const ConstString &name, SymbolType symbol_type, std::vector<uint32_t>& symbol_indexes)
372{
373 Timer scoped_timer (__PRETTY_FUNCTION__, "%s", __PRETTY_FUNCTION__);
374 // Initialize all of the lookup by name indexes before converting NAME
375 // to a uniqued string NAME_STR below.
376 if (m_name_to_index.IsEmpty())
377 InitNameIndexes();
378
379 if (name)
380 {
381 // The string table did have a string that matched, but we need
382 // to check the symbols and match the symbol_type if any was given.
383 AppendSymbolIndexesWithNameAndType(name, symbol_type, symbol_indexes);
384 }
385 return symbol_indexes.size();
386}
387
388size_t
389Symtab::FindAllSymbolsMatchingRexExAndType (const RegularExpression &regex, SymbolType symbol_type, std::vector<uint32_t>& symbol_indexes)
390{
391 AppendSymbolIndexesMatchingRegExAndType(regex, symbol_type, symbol_indexes);
392 return symbol_indexes.size();
393}
394
395Symbol *
396Symtab::FindFirstSymbolWithNameAndType (const ConstString &name, SymbolType symbol_type)
397{
398 Timer scoped_timer (__PRETTY_FUNCTION__, "%s", __PRETTY_FUNCTION__);
399 if (m_name_to_index.IsEmpty())
400 InitNameIndexes();
401
402 if (name)
403 {
404 std::vector<uint32_t> matching_indexes;
405 // The string table did have a string that matched, but we need
406 // to check the symbols and match the symbol_type if any was given.
407 if (AppendSymbolIndexesWithNameAndType(name, symbol_type, matching_indexes))
408 {
409 std::vector<uint32_t>::const_iterator pos, end = matching_indexes.end();
410 for (pos = matching_indexes.begin(); pos != end; ++pos)
411 {
412 Symbol *symbol = SymbolAtIndex(*pos);
413
414 if (symbol->Compare(name, symbol_type))
415 return symbol;
416 }
417 }
418 }
419 return NULL;
420}
421
422typedef struct
423{
424 const Symtab *symtab;
425 const addr_t file_addr;
426 Symbol *match_symbol;
427 const uint32_t *match_index_ptr;
428 addr_t match_offset;
429} SymbolSearchInfo;
430
431static int
432SymbolWithFileAddress (SymbolSearchInfo *info, const uint32_t *index_ptr)
433{
434 const Symbol *curr_symbol = info->symtab->SymbolAtIndex (index_ptr[0]);
435 if (curr_symbol == NULL)
436 return -1;
437
438 const addr_t info_file_addr = info->file_addr;
439
440 // lldb::Symbol::GetAddressRangePtr() will only return a non NULL address
441 // range if the symbol has a section!
442 const AddressRange *curr_range = curr_symbol->GetAddressRangePtr();
443 if (curr_range)
444 {
445 const addr_t curr_file_addr = curr_range->GetBaseAddress().GetFileAddress();
446 if (info_file_addr < curr_file_addr)
447 return -1;
448 if (info_file_addr > curr_file_addr)
449 return +1;
450 info->match_symbol = const_cast<Symbol *>(curr_symbol);
451 info->match_index_ptr = index_ptr;
452 return 0;
453 }
454
455 return -1;
456}
457
458static int
459SymbolWithClosestFileAddress (SymbolSearchInfo *info, const uint32_t *index_ptr)
460{
461 const Symbol *symbol = info->symtab->SymbolAtIndex (index_ptr[0]);
462 if (symbol == NULL)
463 return -1;
464
465 const addr_t info_file_addr = info->file_addr;
466 const AddressRange *curr_range = symbol->GetAddressRangePtr();
467 if (curr_range)
468 {
469 const addr_t curr_file_addr = curr_range->GetBaseAddress().GetFileAddress();
470 if (info_file_addr < curr_file_addr)
471 return -1;
472
473 // Since we are finding the closest symbol that is greater than or equal
474 // to 'info->file_addr' we set the symbol here. This will get set
475 // multiple times, but after the search is done it will contain the best
476 // symbol match
477 info->match_symbol = const_cast<Symbol *>(symbol);
478 info->match_index_ptr = index_ptr;
479 info->match_offset = info_file_addr - curr_file_addr;
480
481 if (info_file_addr > curr_file_addr)
482 return +1;
483 return 0;
484 }
485 return -1;
486}
487
488static SymbolSearchInfo
489FindIndexPtrForSymbolContainingAddress(Symtab* symtab, addr_t file_addr, const uint32_t* indexes, uint32_t num_indexes)
490{
491 SymbolSearchInfo info = { symtab, file_addr, NULL, NULL, 0 };
492 bsearch(&info, indexes, num_indexes, sizeof(uint32_t), (comparison_function)SymbolWithClosestFileAddress);
493 return info;
494}
495
496
497void
498Symtab::InitAddressIndexes()
499{
500 if (m_addr_indexes.empty())
501 {
502 AppendSymbolIndexesWithType (eSymbolTypeFunction, m_addr_indexes);
503 AppendSymbolIndexesWithType (eSymbolTypeGlobal, m_addr_indexes);
504 AppendSymbolIndexesWithType (eSymbolTypeStatic, m_addr_indexes);
505 AppendSymbolIndexesWithType (eSymbolTypeCode, m_addr_indexes);
506 AppendSymbolIndexesWithType (eSymbolTypeTrampoline, m_addr_indexes);
507 AppendSymbolIndexesWithType (eSymbolTypeData, m_addr_indexes);
508 SortSymbolIndexesByValue(m_addr_indexes, true);
509 m_addr_indexes.push_back(UINT32_MAX); // Terminator for bsearch since we might need to look at the next symbol
510 }
511}
512
513size_t
514Symtab::CalculateSymbolSize (Symbol *symbol)
515{
516 // Make sure this symbol is from this symbol table...
517 if (symbol < m_symbols.data() && symbol >= m_symbols.data() + m_symbols.size())
518 return 0;
519
520 // See if this symbol already has a byte size?
521 size_t byte_size = symbol->GetByteSize();
522
523 if (byte_size)
524 {
525 // It does, just return it
526 return byte_size;
527 }
528
529 // Else if this is an address based symbol, figure out the delta between
530 // it and the next address based symbol
531 if (symbol->GetAddressRangePtr())
532 {
533 if (m_addr_indexes.empty())
534 InitAddressIndexes();
535 const size_t num_addr_indexes = m_addr_indexes.size();
536 SymbolSearchInfo info = FindIndexPtrForSymbolContainingAddress(this, symbol->GetAddressRangePtr()->GetBaseAddress().GetFileAddress(), m_addr_indexes.data(), num_addr_indexes);
537 if (info.match_index_ptr != NULL)
538 {
539 const lldb::addr_t curr_file_addr = symbol->GetAddressRangePtr()->GetBaseAddress().GetFileAddress();
540 // We can figure out the address range of all symbols except the
541 // last one by taking the delta between the current symbol and
542 // the next symbol
543
544 for (uint32_t addr_index = info.match_index_ptr - m_addr_indexes.data() + 1;
545 addr_index < num_addr_indexes;
546 ++addr_index)
547 {
548 Symbol *next_symbol = SymbolAtIndex(m_addr_indexes[addr_index]);
549 if (next_symbol == NULL)
550 break;
551
552 assert (next_symbol->GetAddressRangePtr());
553 const lldb::addr_t next_file_addr = next_symbol->GetAddressRangePtr()->GetBaseAddress().GetFileAddress();
554 if (next_file_addr > curr_file_addr)
555 {
556 byte_size = next_file_addr - curr_file_addr;
557 symbol->GetAddressRangePtr()->SetByteSize(byte_size);
558 symbol->SetSizeIsSynthesized(true);
559 break;
560 }
561 }
562 }
563 }
564 return byte_size;
565}
566
567Symbol *
568Symtab::FindSymbolWithFileAddress (addr_t file_addr)
569{
570 if (m_addr_indexes.empty())
571 InitAddressIndexes();
572
573 SymbolSearchInfo info = { this, file_addr, NULL, NULL, 0 };
574
575 uint32_t* match = (uint32_t*)bsearch(&info, &m_addr_indexes[0], m_addr_indexes.size(), sizeof(uint32_t), (comparison_function)SymbolWithFileAddress);
576 if (match)
577 return SymbolAtIndex (*match);
578 return NULL;
579}
580
581
582Symbol *
583Symtab::FindSymbolContainingFileAddress (addr_t file_addr, const uint32_t* indexes, uint32_t num_indexes)
584{
585 SymbolSearchInfo info = { this, file_addr, NULL, NULL, 0 };
586
587 bsearch(&info, indexes, num_indexes, sizeof(uint32_t), (comparison_function)SymbolWithClosestFileAddress);
588
589 if (info.match_symbol)
590 {
591 if (info.match_offset < CalculateSymbolSize(info.match_symbol))
592 return info.match_symbol;
593 }
594 return NULL;
595}
596
597Symbol *
598Symtab::FindSymbolContainingFileAddress (addr_t file_addr)
599{
600 if (m_addr_indexes.empty())
601 InitAddressIndexes();
602
603 return FindSymbolContainingFileAddress (file_addr, &m_addr_indexes[0], m_addr_indexes.size());
604}
605