//===-- llvm-bcanalyzer.cpp - Bitcode Analyzer --------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
//  This tool may be invoked in the following manner:
//   llvm-bcanalyzer [options]      - Read LLVM bitcode from stdin
//   llvm-bcanalyzer [options] x.bc - Read LLVM bitcode from the x.bc file
//
//  Options:
//      --help      - Output information about command line switches
//      --dump      - Dump low-level bitcode structure in readable format
//
// This tool provides analytical information about a bitcode file. It is
// intended as an aid to developers of bitcode reading and writing software. It
// produces on stdout a summary of the bitcode file that shows various
// statistics about the contents of the file. By default this information is
// detailed and contains information about individual bitcode blocks and the
// functions in the module.
// The tool is also able to print a bitcode file in a straightforward text
// format that shows the containment and relationships of the information in
// the bitcode file (-dump option).
//
//===----------------------------------------------------------------------===//

Mehdi Aminid7ad2212016-04-01 05:33:11 +000030#include "llvm/ADT/StringExtras.h"
Mehdi Aminib550cb12016-04-18 09:17:29 +000031#include "llvm/Bitcode/BitstreamReader.h"
Chris Lattner1684cee2007-04-29 20:00:02 +000032#include "llvm/Bitcode/LLVMBitCodes.h"
Chris Lattnerb9e07fd2009-04-06 20:54:32 +000033#include "llvm/Bitcode/ReaderWriter.h"
Chandler Carruth5ad5f152014-01-13 09:26:24 +000034#include "llvm/IR/Verifier.h"
Reid Spencer7c16caa2004-09-01 22:55:40 +000035#include "llvm/Support/CommandLine.h"
Daniel Dunbare813b222009-09-25 16:04:21 +000036#include "llvm/Support/Format.h"
Chris Lattner76d46322006-12-06 01:18:01 +000037#include "llvm/Support/ManagedStatic.h"
Chris Lattner03997582007-04-29 08:12:22 +000038#include "llvm/Support/MemoryBuffer.h"
Chris Lattnere3fc2d12009-03-06 05:34:10 +000039#include "llvm/Support/PrettyStackTrace.h"
Mehdi Aminid7ad2212016-04-01 05:33:11 +000040#include "llvm/Support/SHA1.h"
Mehdi Aminib550cb12016-04-18 09:17:29 +000041#include "llvm/Support/Signals.h"
Chandler Carruth4d88a1c2012-12-04 10:44:52 +000042#include "llvm/Support/raw_ostream.h"
Chris Lattner4a7ac9f2007-05-05 01:46:49 +000043#include <algorithm>
Will Dietz981af002013-10-12 00:55:57 +000044#include <cctype>
Chandler Carruth4d88a1c2012-12-04 10:44:52 +000045#include <map>
Rafael Espindolaa6e9c3e2014-06-12 17:38:55 +000046#include <system_error>
Reid Spencerdb5c86d2004-06-07 17:53:43 +000047using namespace llvm;
48
49static cl::opt<std::string>
Gabor Greif0e535c3c2007-07-04 21:55:50 +000050 InputFilename(cl::Positional, cl::desc("<input bitcode>"), cl::init("-"));
Reid Spencerdb5c86d2004-06-07 17:53:43 +000051
Gabor Greif0e535c3c2007-07-04 21:55:50 +000052static cl::opt<bool> Dump("dump", cl::desc("Dump low level bitcode trace"));
Chris Lattnerca0ea542007-04-29 08:31:14 +000053
54//===----------------------------------------------------------------------===//
55// Bitcode specific analysis.
56//===----------------------------------------------------------------------===//
57
Chris Lattner4a7ac9f2007-05-05 01:46:49 +000058static cl::opt<bool> NoHistogram("disable-histogram",
59 cl::desc("Do not print per-code histogram"));
Chris Lattner03997582007-04-29 08:12:22 +000060
Chris Lattner3543caa2007-04-29 21:48:19 +000061static cl::opt<bool>
62NonSymbolic("non-symbolic",
Michael J. Spencer39a0ffc2010-12-16 03:29:14 +000063 cl::desc("Emit numeric info in dump even if"
Chris Lattner3543caa2007-04-29 21:48:19 +000064 " symbolic info is available"));
65
Jordan Rose88eb5342014-08-30 17:07:55 +000066static cl::opt<std::string>
67 BlockInfoFilename("block-info",
68 cl::desc("Use the BLOCK_INFO from the given file"));
69
Jordan Rose0fa38b82015-05-13 18:51:49 +000070static cl::opt<bool>
71 ShowBinaryBlobs("show-binary-blobs",
72 cl::desc("Print binary blobs using hex escapes"));
73
namespace {

/// CurStreamTypeType - A type for CurStreamType.  It selects whether the
/// built-in LLVM IR block/record name tables may be consulted.
enum CurStreamTypeType {
  /// The stream kind is not known; only generic names are available.
  UnknownBitstream,
  /// The stream is LLVM IR bitcode; LLVM IR block/record names apply.
  LLVMIRBitstream
};

}
83
Chris Lattner1684cee2007-04-29 20:00:02 +000084/// GetBlockName - Return a symbolic block name if known, otherwise return
Chris Lattner3543caa2007-04-29 21:48:19 +000085/// null.
Chris Lattnera6fdf5a2009-04-26 22:21:57 +000086static const char *GetBlockName(unsigned BlockID,
Jordan Rose88eb5342014-08-30 17:07:55 +000087 const BitstreamReader &StreamFile,
88 CurStreamTypeType CurStreamType) {
Chris Lattner9181ddf2007-05-05 00:17:42 +000089 // Standard blocks for all bitcode files.
90 if (BlockID < bitc::FIRST_APPLICATION_BLOCKID) {
91 if (BlockID == bitc::BLOCKINFO_BLOCK_ID)
92 return "BLOCKINFO_BLOCK";
Craig Toppere6cb63e2014-04-25 04:24:47 +000093 return nullptr;
Chris Lattner9181ddf2007-05-05 00:17:42 +000094 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +000095
Chris Lattnera6fdf5a2009-04-26 22:21:57 +000096 // Check to see if we have a blockinfo record for this block, with a name.
97 if (const BitstreamReader::BlockInfo *Info =
98 StreamFile.getBlockInfo(BlockID)) {
99 if (!Info->Name.empty())
100 return Info->Name.c_str();
101 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000102
103
Craig Toppere6cb63e2014-04-25 04:24:47 +0000104 if (CurStreamType != LLVMIRBitstream) return nullptr;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000105
Chris Lattner1684cee2007-04-29 20:00:02 +0000106 switch (BlockID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000107 default: return nullptr;
Bill Wendlingd7e05d62013-02-10 23:17:10 +0000108 case bitc::MODULE_BLOCK_ID: return "MODULE_BLOCK";
109 case bitc::PARAMATTR_BLOCK_ID: return "PARAMATTR_BLOCK";
110 case bitc::PARAMATTR_GROUP_BLOCK_ID: return "PARAMATTR_GROUP_BLOCK_ID";
111 case bitc::TYPE_BLOCK_ID_NEW: return "TYPE_BLOCK_ID";
112 case bitc::CONSTANTS_BLOCK_ID: return "CONSTANTS_BLOCK";
113 case bitc::FUNCTION_BLOCK_ID: return "FUNCTION_BLOCK";
Mehdi Amini5d303282015-10-26 18:37:00 +0000114 case bitc::IDENTIFICATION_BLOCK_ID:
115 return "IDENTIFICATION_BLOCK_ID";
Bill Wendlingd7e05d62013-02-10 23:17:10 +0000116 case bitc::VALUE_SYMTAB_BLOCK_ID: return "VALUE_SYMTAB";
117 case bitc::METADATA_BLOCK_ID: return "METADATA_BLOCK";
Teresa Johnson12545072015-11-15 02:00:09 +0000118 case bitc::METADATA_KIND_BLOCK_ID: return "METADATA_KIND_BLOCK";
Bill Wendlingd7e05d62013-02-10 23:17:10 +0000119 case bitc::METADATA_ATTACHMENT_ID: return "METADATA_ATTACHMENT_BLOCK";
120 case bitc::USELIST_BLOCK_ID: return "USELIST_BLOCK_ID";
Teresa Johnson76a1c1d2016-03-11 18:52:24 +0000121 case bitc::GLOBALVAL_SUMMARY_BLOCK_ID:
122 return "GLOBALVAL_SUMMARY_BLOCK";
Teresa Johnson403a7872015-10-04 14:33:43 +0000123 case bitc::MODULE_STRTAB_BLOCK_ID: return "MODULE_STRTAB_BLOCK";
Chris Lattner1684cee2007-04-29 20:00:02 +0000124 }
125}
126
Chris Lattner3543caa2007-04-29 21:48:19 +0000127/// GetCodeName - Return a symbolic code name if known, otherwise return
128/// null.
Chris Lattnera6fdf5a2009-04-26 22:21:57 +0000129static const char *GetCodeName(unsigned CodeID, unsigned BlockID,
Jordan Rose88eb5342014-08-30 17:07:55 +0000130 const BitstreamReader &StreamFile,
131 CurStreamTypeType CurStreamType) {
Chris Lattner9181ddf2007-05-05 00:17:42 +0000132 // Standard blocks for all bitcode files.
133 if (BlockID < bitc::FIRST_APPLICATION_BLOCKID) {
134 if (BlockID == bitc::BLOCKINFO_BLOCK_ID) {
135 switch (CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000136 default: return nullptr;
Chris Lattnera6fdf5a2009-04-26 22:21:57 +0000137 case bitc::BLOCKINFO_CODE_SETBID: return "SETBID";
138 case bitc::BLOCKINFO_CODE_BLOCKNAME: return "BLOCKNAME";
139 case bitc::BLOCKINFO_CODE_SETRECORDNAME: return "SETRECORDNAME";
Chris Lattner9181ddf2007-05-05 00:17:42 +0000140 }
141 }
Craig Toppere6cb63e2014-04-25 04:24:47 +0000142 return nullptr;
Chris Lattner9181ddf2007-05-05 00:17:42 +0000143 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000144
Chris Lattnera6fdf5a2009-04-26 22:21:57 +0000145 // Check to see if we have a blockinfo record for this record, with a name.
146 if (const BitstreamReader::BlockInfo *Info =
147 StreamFile.getBlockInfo(BlockID)) {
148 for (unsigned i = 0, e = Info->RecordNames.size(); i != e; ++i)
149 if (Info->RecordNames[i].first == CodeID)
150 return Info->RecordNames[i].second.c_str();
151 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000152
153
Craig Toppere6cb63e2014-04-25 04:24:47 +0000154 if (CurStreamType != LLVMIRBitstream) return nullptr;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000155
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000156#define STRINGIFY_CODE(PREFIX, CODE) \
157 case bitc::PREFIX##_##CODE: \
158 return #CODE;
Chris Lattner3543caa2007-04-29 21:48:19 +0000159 switch (BlockID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000160 default: return nullptr;
Chris Lattner3543caa2007-04-29 21:48:19 +0000161 case bitc::MODULE_BLOCK_ID:
162 switch (CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000163 default: return nullptr;
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000164 STRINGIFY_CODE(MODULE_CODE, VERSION)
165 STRINGIFY_CODE(MODULE_CODE, TRIPLE)
166 STRINGIFY_CODE(MODULE_CODE, DATALAYOUT)
167 STRINGIFY_CODE(MODULE_CODE, ASM)
168 STRINGIFY_CODE(MODULE_CODE, SECTIONNAME)
169 STRINGIFY_CODE(MODULE_CODE, DEPLIB) // FIXME: Remove in 4.0
170 STRINGIFY_CODE(MODULE_CODE, GLOBALVAR)
171 STRINGIFY_CODE(MODULE_CODE, FUNCTION)
172 STRINGIFY_CODE(MODULE_CODE, ALIAS)
173 STRINGIFY_CODE(MODULE_CODE, PURGEVALS)
174 STRINGIFY_CODE(MODULE_CODE, GCNAME)
Teresa Johnsonff642b92015-09-17 20:12:00 +0000175 STRINGIFY_CODE(MODULE_CODE, VSTOFFSET)
Duncan P. N. Exon Smith68f56242016-03-25 01:29:50 +0000176 STRINGIFY_CODE(MODULE_CODE, METADATA_VALUES_UNUSED)
Teresa Johnsone1164de2016-02-10 21:55:02 +0000177 STRINGIFY_CODE(MODULE_CODE, SOURCE_FILENAME)
Mehdi Aminid7ad2212016-04-01 05:33:11 +0000178 STRINGIFY_CODE(MODULE_CODE, HASH)
Chris Lattner3543caa2007-04-29 21:48:19 +0000179 }
Mehdi Amini5d303282015-10-26 18:37:00 +0000180 case bitc::IDENTIFICATION_BLOCK_ID:
181 switch (CodeID) {
182 default:
183 return nullptr;
184 STRINGIFY_CODE(IDENTIFICATION_CODE, STRING)
185 STRINGIFY_CODE(IDENTIFICATION_CODE, EPOCH)
186 }
Chris Lattner0b7c5122007-05-04 03:01:41 +0000187 case bitc::PARAMATTR_BLOCK_ID:
188 switch (CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000189 default: return nullptr;
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000190 // FIXME: Should these be different?
Bill Wendlingd7e05d62013-02-10 23:17:10 +0000191 case bitc::PARAMATTR_CODE_ENTRY_OLD: return "ENTRY";
192 case bitc::PARAMATTR_CODE_ENTRY: return "ENTRY";
Justin Bogner68b28d02016-03-15 22:37:25 +0000193 }
194 case bitc::PARAMATTR_GROUP_BLOCK_ID:
195 switch (CodeID) {
196 default: return nullptr;
Bill Wendlingd7e05d62013-02-10 23:17:10 +0000197 case bitc::PARAMATTR_GRP_CODE_ENTRY: return "ENTRY";
Chris Lattner0b7c5122007-05-04 03:01:41 +0000198 }
Chris Lattnerb1ed91f2011-07-09 17:41:24 +0000199 case bitc::TYPE_BLOCK_ID_NEW:
Chris Lattner3543caa2007-04-29 21:48:19 +0000200 switch (CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000201 default: return nullptr;
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000202 STRINGIFY_CODE(TYPE_CODE, NUMENTRY)
203 STRINGIFY_CODE(TYPE_CODE, VOID)
204 STRINGIFY_CODE(TYPE_CODE, FLOAT)
205 STRINGIFY_CODE(TYPE_CODE, DOUBLE)
206 STRINGIFY_CODE(TYPE_CODE, LABEL)
207 STRINGIFY_CODE(TYPE_CODE, OPAQUE)
208 STRINGIFY_CODE(TYPE_CODE, INTEGER)
209 STRINGIFY_CODE(TYPE_CODE, POINTER)
210 STRINGIFY_CODE(TYPE_CODE, ARRAY)
211 STRINGIFY_CODE(TYPE_CODE, VECTOR)
212 STRINGIFY_CODE(TYPE_CODE, X86_FP80)
213 STRINGIFY_CODE(TYPE_CODE, FP128)
214 STRINGIFY_CODE(TYPE_CODE, PPC_FP128)
215 STRINGIFY_CODE(TYPE_CODE, METADATA)
216 STRINGIFY_CODE(TYPE_CODE, STRUCT_ANON)
217 STRINGIFY_CODE(TYPE_CODE, STRUCT_NAME)
218 STRINGIFY_CODE(TYPE_CODE, STRUCT_NAMED)
219 STRINGIFY_CODE(TYPE_CODE, FUNCTION)
Chris Lattner3543caa2007-04-29 21:48:19 +0000220 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000221
Chris Lattner3543caa2007-04-29 21:48:19 +0000222 case bitc::CONSTANTS_BLOCK_ID:
223 switch (CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000224 default: return nullptr;
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000225 STRINGIFY_CODE(CST_CODE, SETTYPE)
226 STRINGIFY_CODE(CST_CODE, NULL)
227 STRINGIFY_CODE(CST_CODE, UNDEF)
228 STRINGIFY_CODE(CST_CODE, INTEGER)
229 STRINGIFY_CODE(CST_CODE, WIDE_INTEGER)
230 STRINGIFY_CODE(CST_CODE, FLOAT)
231 STRINGIFY_CODE(CST_CODE, AGGREGATE)
232 STRINGIFY_CODE(CST_CODE, STRING)
233 STRINGIFY_CODE(CST_CODE, CSTRING)
234 STRINGIFY_CODE(CST_CODE, CE_BINOP)
235 STRINGIFY_CODE(CST_CODE, CE_CAST)
236 STRINGIFY_CODE(CST_CODE, CE_GEP)
237 STRINGIFY_CODE(CST_CODE, CE_INBOUNDS_GEP)
238 STRINGIFY_CODE(CST_CODE, CE_SELECT)
239 STRINGIFY_CODE(CST_CODE, CE_EXTRACTELT)
240 STRINGIFY_CODE(CST_CODE, CE_INSERTELT)
241 STRINGIFY_CODE(CST_CODE, CE_SHUFFLEVEC)
242 STRINGIFY_CODE(CST_CODE, CE_CMP)
243 STRINGIFY_CODE(CST_CODE, INLINEASM)
244 STRINGIFY_CODE(CST_CODE, CE_SHUFVEC_EX)
Chris Lattner372dd1e2012-01-30 00:51:16 +0000245 case bitc::CST_CODE_BLOCKADDRESS: return "CST_CODE_BLOCKADDRESS";
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000246 STRINGIFY_CODE(CST_CODE, DATA)
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000247 }
Chris Lattner3543caa2007-04-29 21:48:19 +0000248 case bitc::FUNCTION_BLOCK_ID:
249 switch (CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000250 default: return nullptr;
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000251 STRINGIFY_CODE(FUNC_CODE, DECLAREBLOCKS)
252 STRINGIFY_CODE(FUNC_CODE, INST_BINOP)
253 STRINGIFY_CODE(FUNC_CODE, INST_CAST)
254 STRINGIFY_CODE(FUNC_CODE, INST_GEP_OLD)
255 STRINGIFY_CODE(FUNC_CODE, INST_INBOUNDS_GEP_OLD)
256 STRINGIFY_CODE(FUNC_CODE, INST_SELECT)
257 STRINGIFY_CODE(FUNC_CODE, INST_EXTRACTELT)
258 STRINGIFY_CODE(FUNC_CODE, INST_INSERTELT)
259 STRINGIFY_CODE(FUNC_CODE, INST_SHUFFLEVEC)
260 STRINGIFY_CODE(FUNC_CODE, INST_CMP)
261 STRINGIFY_CODE(FUNC_CODE, INST_RET)
262 STRINGIFY_CODE(FUNC_CODE, INST_BR)
263 STRINGIFY_CODE(FUNC_CODE, INST_SWITCH)
264 STRINGIFY_CODE(FUNC_CODE, INST_INVOKE)
265 STRINGIFY_CODE(FUNC_CODE, INST_UNREACHABLE)
David Majnemer654e1302015-07-31 17:58:14 +0000266 STRINGIFY_CODE(FUNC_CODE, INST_CLEANUPRET)
267 STRINGIFY_CODE(FUNC_CODE, INST_CATCHRET)
268 STRINGIFY_CODE(FUNC_CODE, INST_CATCHPAD)
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000269 STRINGIFY_CODE(FUNC_CODE, INST_PHI)
270 STRINGIFY_CODE(FUNC_CODE, INST_ALLOCA)
271 STRINGIFY_CODE(FUNC_CODE, INST_LOAD)
272 STRINGIFY_CODE(FUNC_CODE, INST_VAARG)
273 STRINGIFY_CODE(FUNC_CODE, INST_STORE)
274 STRINGIFY_CODE(FUNC_CODE, INST_EXTRACTVAL)
275 STRINGIFY_CODE(FUNC_CODE, INST_INSERTVAL)
276 STRINGIFY_CODE(FUNC_CODE, INST_CMP2)
277 STRINGIFY_CODE(FUNC_CODE, INST_VSELECT)
278 STRINGIFY_CODE(FUNC_CODE, DEBUG_LOC_AGAIN)
279 STRINGIFY_CODE(FUNC_CODE, INST_CALL)
280 STRINGIFY_CODE(FUNC_CODE, DEBUG_LOC)
281 STRINGIFY_CODE(FUNC_CODE, INST_GEP)
Chris Lattner3543caa2007-04-29 21:48:19 +0000282 }
Chris Lattner3543caa2007-04-29 21:48:19 +0000283 case bitc::VALUE_SYMTAB_BLOCK_ID:
284 switch (CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000285 default: return nullptr;
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000286 STRINGIFY_CODE(VST_CODE, ENTRY)
287 STRINGIFY_CODE(VST_CODE, BBENTRY)
Teresa Johnsonff642b92015-09-17 20:12:00 +0000288 STRINGIFY_CODE(VST_CODE, FNENTRY)
Teresa Johnson76a1c1d2016-03-11 18:52:24 +0000289 STRINGIFY_CODE(VST_CODE, COMBINED_GVDEFENTRY)
290 STRINGIFY_CODE(VST_CODE, COMBINED_ENTRY)
Teresa Johnson403a7872015-10-04 14:33:43 +0000291 }
292 case bitc::MODULE_STRTAB_BLOCK_ID:
293 switch (CodeID) {
Teresa Johnsonf72278f2015-11-02 18:02:11 +0000294 default:
295 return nullptr;
296 STRINGIFY_CODE(MST_CODE, ENTRY)
Mehdi Aminid7ad2212016-04-01 05:33:11 +0000297 STRINGIFY_CODE(MST_CODE, HASH)
Teresa Johnson403a7872015-10-04 14:33:43 +0000298 }
Teresa Johnson76a1c1d2016-03-11 18:52:24 +0000299 case bitc::GLOBALVAL_SUMMARY_BLOCK_ID:
Teresa Johnson403a7872015-10-04 14:33:43 +0000300 switch (CodeID) {
Teresa Johnsonf72278f2015-11-02 18:02:11 +0000301 default:
302 return nullptr;
Teresa Johnson76a1c1d2016-03-11 18:52:24 +0000303 STRINGIFY_CODE(FS, PERMODULE)
304 STRINGIFY_CODE(FS, PERMODULE_PROFILE)
305 STRINGIFY_CODE(FS, PERMODULE_GLOBALVAR_INIT_REFS)
306 STRINGIFY_CODE(FS, COMBINED)
307 STRINGIFY_CODE(FS, COMBINED_PROFILE)
308 STRINGIFY_CODE(FS, COMBINED_GLOBALVAR_INIT_REFS)
Mehdi Amini2d28f7a2016-04-16 06:56:44 +0000309 STRINGIFY_CODE(FS, ALIAS)
310 STRINGIFY_CODE(FS, COMBINED_ALIAS)
Mehdi Aminiae64eaf2016-04-23 23:38:17 +0000311 STRINGIFY_CODE(FS, COMBINED_ORIGINAL_NAME)
Chris Lattner3543caa2007-04-29 21:48:19 +0000312 }
Devang Patelaf206b82009-09-18 19:26:43 +0000313 case bitc::METADATA_ATTACHMENT_ID:
314 switch(CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000315 default:return nullptr;
Duncan P. N. Exon Smith706b80d2015-06-29 22:50:35 +0000316 STRINGIFY_CODE(METADATA, ATTACHMENT)
Devang Patelaf206b82009-09-18 19:26:43 +0000317 }
Devang Patel7428d8a2009-07-22 17:43:22 +0000318 case bitc::METADATA_BLOCK_ID:
319 switch(CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000320 default:return nullptr;
Duncan P. N. Exon Smith6565a0d2016-03-27 23:17:54 +0000321 STRINGIFY_CODE(METADATA, STRING_OLD)
322 STRINGIFY_CODE(METADATA, STRINGS)
Duncan P. N. Exon Smith706b80d2015-06-29 22:50:35 +0000323 STRINGIFY_CODE(METADATA, NAME)
Teresa Johnson12545072015-11-15 02:00:09 +0000324 STRINGIFY_CODE(METADATA, KIND) // Older bitcode has it in a MODULE_BLOCK
Duncan P. N. Exon Smith706b80d2015-06-29 22:50:35 +0000325 STRINGIFY_CODE(METADATA, NODE)
326 STRINGIFY_CODE(METADATA, VALUE)
327 STRINGIFY_CODE(METADATA, OLD_NODE)
328 STRINGIFY_CODE(METADATA, OLD_FN_NODE)
329 STRINGIFY_CODE(METADATA, NAMED_NODE)
330 STRINGIFY_CODE(METADATA, DISTINCT_NODE)
331 STRINGIFY_CODE(METADATA, LOCATION)
332 STRINGIFY_CODE(METADATA, GENERIC_DEBUG)
333 STRINGIFY_CODE(METADATA, SUBRANGE)
334 STRINGIFY_CODE(METADATA, ENUMERATOR)
335 STRINGIFY_CODE(METADATA, BASIC_TYPE)
336 STRINGIFY_CODE(METADATA, FILE)
337 STRINGIFY_CODE(METADATA, DERIVED_TYPE)
338 STRINGIFY_CODE(METADATA, COMPOSITE_TYPE)
339 STRINGIFY_CODE(METADATA, SUBROUTINE_TYPE)
340 STRINGIFY_CODE(METADATA, COMPILE_UNIT)
341 STRINGIFY_CODE(METADATA, SUBPROGRAM)
342 STRINGIFY_CODE(METADATA, LEXICAL_BLOCK)
343 STRINGIFY_CODE(METADATA, LEXICAL_BLOCK_FILE)
344 STRINGIFY_CODE(METADATA, NAMESPACE)
345 STRINGIFY_CODE(METADATA, TEMPLATE_TYPE)
346 STRINGIFY_CODE(METADATA, TEMPLATE_VALUE)
347 STRINGIFY_CODE(METADATA, GLOBAL_VAR)
348 STRINGIFY_CODE(METADATA, LOCAL_VAR)
349 STRINGIFY_CODE(METADATA, EXPRESSION)
350 STRINGIFY_CODE(METADATA, OBJC_PROPERTY)
351 STRINGIFY_CODE(METADATA, IMPORTED_ENTITY)
Adrian Prantla7ad09d2015-06-30 00:25:41 +0000352 STRINGIFY_CODE(METADATA, MODULE)
Devang Patel7428d8a2009-07-22 17:43:22 +0000353 }
Teresa Johnson12545072015-11-15 02:00:09 +0000354 case bitc::METADATA_KIND_BLOCK_ID:
355 switch (CodeID) {
356 default:
357 return nullptr;
358 STRINGIFY_CODE(METADATA, KIND)
359 }
Chad Rosierdd4ffae2011-12-07 21:45:13 +0000360 case bitc::USELIST_BLOCK_ID:
361 switch(CodeID) {
Craig Toppere6cb63e2014-04-25 04:24:47 +0000362 default:return nullptr;
Duncan P. N. Exon Smith1f66c852014-07-28 21:19:41 +0000363 case bitc::USELIST_CODE_DEFAULT: return "USELIST_CODE_DEFAULT";
364 case bitc::USELIST_CODE_BB: return "USELIST_CODE_BB";
Chad Rosierdd4ffae2011-12-07 21:45:13 +0000365 }
Chris Lattner3543caa2007-04-29 21:48:19 +0000366 }
Duncan P. N. Exon Smithcb8ee002015-06-29 22:50:32 +0000367#undef STRINGIFY_CODE
Chris Lattner3543caa2007-04-29 21:48:19 +0000368}
369
/// PerRecordStats - Counters kept for one record code within a block ID.
struct PerRecordStats {
  /// NumInstances - Number of records seen with this code.
  unsigned NumInstances;

  /// NumAbbrev - Number of those records that were emitted using an
  /// abbreviation (i.e. not as UNABBREV_RECORD).
  unsigned NumAbbrev;

  /// TotalBits - Total size in bits of all records with this code.
  uint64_t TotalBits;

  PerRecordStats() : NumInstances(0), NumAbbrev(0), TotalBits(0) {}
};
Chris Lattner1684cee2007-04-29 20:00:02 +0000377
378struct PerBlockIDStats {
379 /// NumInstances - This the number of times this block ID has been seen.
380 unsigned NumInstances;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000381
Chris Lattner1684cee2007-04-29 20:00:02 +0000382 /// NumBits - The total size in bits of all of these blocks.
383 uint64_t NumBits;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000384
Chris Lattner1684cee2007-04-29 20:00:02 +0000385 /// NumSubBlocks - The total number of blocks these blocks contain.
386 unsigned NumSubBlocks;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000387
Chris Lattner1684cee2007-04-29 20:00:02 +0000388 /// NumAbbrevs - The total number of abbreviations.
389 unsigned NumAbbrevs;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000390
391 /// NumRecords - The total number of records these blocks contain, and the
Chris Lattner1684cee2007-04-29 20:00:02 +0000392 /// number that are abbreviated.
393 unsigned NumRecords, NumAbbreviatedRecords;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000394
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000395 /// CodeFreq - Keep track of the number of times we see each code.
Chris Lattnerbf419a92009-04-27 17:59:34 +0000396 std::vector<PerRecordStats> CodeFreq;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000397
Chris Lattner1684cee2007-04-29 20:00:02 +0000398 PerBlockIDStats()
399 : NumInstances(0), NumBits(0),
400 NumSubBlocks(0), NumAbbrevs(0), NumRecords(0), NumAbbreviatedRecords(0) {}
401};
402
403static std::map<unsigned, PerBlockIDStats> BlockIDStats;
404
405
406
Chris Lattnerca0ea542007-04-29 08:31:14 +0000407/// Error - All bitcode analysis errors go through this function, making this a
408/// good place to breakpoint if debugging.
Jordan Rose88eb5342014-08-30 17:07:55 +0000409static bool Error(const Twine &Err) {
Dan Gohmand8db3762009-07-15 16:35:29 +0000410 errs() << Err << "\n";
Chris Lattnerca0ea542007-04-29 08:31:14 +0000411 return true;
412}
413
Duncan P. N. Exon Smith6565a0d2016-03-27 23:17:54 +0000414static bool decodeMetadataStringsBlob(BitstreamReader &Reader, StringRef Indent,
415 ArrayRef<uint64_t> Record,
416 StringRef Blob) {
417 if (Blob.empty())
418 return true;
419
420 if (Record.size() != 2)
421 return true;
422
423 unsigned NumStrings = Record[0];
424 unsigned StringsOffset = Record[1];
425 outs() << " num-strings = " << NumStrings << " {\n";
426
427 StringRef Lengths = Blob.slice(0, StringsOffset);
428 SimpleBitstreamCursor R(Reader);
429 R.jumpToPointer(Lengths.begin());
430
431 // Ensure that Blob doesn't get invalidated, even if this is reading from a
432 // StreamingMemoryObject with corrupt data.
433 R.setArtificialByteLimit(R.getCurrentByteNo() + StringsOffset);
434
435 StringRef Strings = Blob.drop_front(StringsOffset);
436 do {
437 if (R.AtEndOfStream())
438 return Error("bad length");
439
440 unsigned Size = R.ReadVBR(6);
441 if (Strings.size() < Size)
442 return Error("truncated chars");
443
444 outs() << Indent << " '";
445 outs().write_escaped(Strings.slice(0, Size), /*hex=*/true);
446 outs() << "'\n";
447 Strings = Strings.drop_front(Size);
448 } while (--NumStrings);
449
450 outs() << Indent << " }";
451 return false;
452}
453
454static bool decodeBlob(unsigned Code, unsigned BlockID, BitstreamReader &Reader,
455 StringRef Indent, ArrayRef<uint64_t> Record,
456 StringRef Blob) {
457 if (BlockID != bitc::METADATA_BLOCK_ID)
458 return true;
459 if (Code != bitc::METADATA_STRINGS)
460 return true;
461
462 return decodeMetadataStringsBlob(Reader, Indent, Record, Blob);
463}
464
Chris Lattnerca0ea542007-04-29 08:31:14 +0000465/// ParseBlock - Read a block, updating statistics, etc.
Chris Lattner0271af82013-01-20 02:50:32 +0000466static bool ParseBlock(BitstreamCursor &Stream, unsigned BlockID,
Jordan Rose88eb5342014-08-30 17:07:55 +0000467 unsigned IndentLevel, CurStreamTypeType CurStreamType) {
Chris Lattner9181ddf2007-05-05 00:17:42 +0000468 std::string Indent(IndentLevel*2, ' ');
Chris Lattner1684cee2007-04-29 20:00:02 +0000469 uint64_t BlockBitStart = Stream.GetCurrentBitNo();
Chris Lattner3543caa2007-04-29 21:48:19 +0000470
Chris Lattner1684cee2007-04-29 20:00:02 +0000471 // Get the statistics for this BlockID.
472 PerBlockIDStats &BlockStats = BlockIDStats[BlockID];
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000473
Chris Lattner1684cee2007-04-29 20:00:02 +0000474 BlockStats.NumInstances++;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000475
Chris Lattner9181ddf2007-05-05 00:17:42 +0000476 // BLOCKINFO is a special part of the stream.
Richard Smithdc1414b2016-02-06 00:46:09 +0000477 bool DumpRecords = Dump;
Chris Lattner9181ddf2007-05-05 00:17:42 +0000478 if (BlockID == bitc::BLOCKINFO_BLOCK_ID) {
Chris Lattner633ab162012-03-19 23:40:48 +0000479 if (Dump) outs() << Indent << "<BLOCKINFO_BLOCK/>\n";
Richard Smithdc1414b2016-02-06 00:46:09 +0000480 if (BitstreamCursor(Stream).ReadBlockInfoBlock())
Chris Lattner9181ddf2007-05-05 00:17:42 +0000481 return Error("Malformed BlockInfoBlock");
Richard Smithdc1414b2016-02-06 00:46:09 +0000482 // It's not really interesting to dump the contents of the blockinfo block.
483 DumpRecords = false;
Chris Lattner9181ddf2007-05-05 00:17:42 +0000484 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000485
Chris Lattner3543caa2007-04-29 21:48:19 +0000486 unsigned NumWords = 0;
Chris Lattner9181ddf2007-05-05 00:17:42 +0000487 if (Stream.EnterSubBlock(BlockID, &NumWords))
Chris Lattnerca0ea542007-04-29 08:31:14 +0000488 return Error("Malformed block record");
489
Mehdi Aminid7ad2212016-04-01 05:33:11 +0000490 // Keep it for later, when we see a MODULE_HASH record
491 uint64_t BlockEntryPos = Stream.getCurrentByteNo();
492
Craig Toppere6cb63e2014-04-25 04:24:47 +0000493 const char *BlockName = nullptr;
Richard Smithdc1414b2016-02-06 00:46:09 +0000494 if (DumpRecords) {
Chris Lattner633ab162012-03-19 23:40:48 +0000495 outs() << Indent << "<";
Jordan Rose88eb5342014-08-30 17:07:55 +0000496 if ((BlockName = GetBlockName(BlockID, *Stream.getBitStreamReader(),
497 CurStreamType)))
Chris Lattner633ab162012-03-19 23:40:48 +0000498 outs() << BlockName;
Chris Lattner3543caa2007-04-29 21:48:19 +0000499 else
Chris Lattner633ab162012-03-19 23:40:48 +0000500 outs() << "UnknownBlock" << BlockID;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000501
Chris Lattner3543caa2007-04-29 21:48:19 +0000502 if (NonSymbolic && BlockName)
Chris Lattner633ab162012-03-19 23:40:48 +0000503 outs() << " BlockID=" << BlockID;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000504
Chris Lattner633ab162012-03-19 23:40:48 +0000505 outs() << " NumWords=" << NumWords
Chris Lattner3fa323d2013-01-19 21:37:14 +0000506 << " BlockCodeSize=" << Stream.getAbbrevIDWidth() << ">\n";
Chris Lattner3543caa2007-04-29 21:48:19 +0000507 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000508
Chris Lattnerca0ea542007-04-29 08:31:14 +0000509 SmallVector<uint64_t, 64> Record;
510
511 // Read all the records for this block.
512 while (1) {
513 if (Stream.AtEndOfStream())
514 return Error("Premature end of bitstream");
515
Chris Lattner1cf80692009-04-27 18:15:27 +0000516 uint64_t RecordStartBit = Stream.GetCurrentBitNo();
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000517
Chris Lattner0271af82013-01-20 02:50:32 +0000518 BitstreamEntry Entry =
519 Stream.advance(BitstreamCursor::AF_DontAutoprocessAbbrevs);
520
521 switch (Entry.Kind) {
522 case BitstreamEntry::Error:
523 return Error("malformed bitcode file");
524 case BitstreamEntry::EndBlock: {
Chris Lattner1684cee2007-04-29 20:00:02 +0000525 uint64_t BlockBitEnd = Stream.GetCurrentBitNo();
526 BlockStats.NumBits += BlockBitEnd-BlockBitStart;
Richard Smithdc1414b2016-02-06 00:46:09 +0000527 if (DumpRecords) {
Chris Lattner633ab162012-03-19 23:40:48 +0000528 outs() << Indent << "</";
Chris Lattner3543caa2007-04-29 21:48:19 +0000529 if (BlockName)
Chris Lattner633ab162012-03-19 23:40:48 +0000530 outs() << BlockName << ">\n";
Chris Lattner3543caa2007-04-29 21:48:19 +0000531 else
Chris Lattner633ab162012-03-19 23:40:48 +0000532 outs() << "UnknownBlock" << BlockID << ">\n";
Chris Lattner3543caa2007-04-29 21:48:19 +0000533 }
Chris Lattnerca0ea542007-04-29 08:31:14 +0000534 return false;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000535 }
Chris Lattner0271af82013-01-20 02:50:32 +0000536
537 case BitstreamEntry::SubBlock: {
Chris Lattner9e808cd2007-05-05 01:29:31 +0000538 uint64_t SubBlockBitStart = Stream.GetCurrentBitNo();
Jordan Rose88eb5342014-08-30 17:07:55 +0000539 if (ParseBlock(Stream, Entry.ID, IndentLevel+1, CurStreamType))
Chris Lattnerca0ea542007-04-29 08:31:14 +0000540 return true;
Chris Lattner1684cee2007-04-29 20:00:02 +0000541 ++BlockStats.NumSubBlocks;
Chris Lattner9e808cd2007-05-05 01:29:31 +0000542 uint64_t SubBlockBitEnd = Stream.GetCurrentBitNo();
Chris Lattner0271af82013-01-20 02:50:32 +0000543
Chris Lattner9e808cd2007-05-05 01:29:31 +0000544 // Don't include subblock sizes in the size of this block.
545 BlockBitStart += SubBlockBitEnd-SubBlockBitStart;
Chris Lattner0271af82013-01-20 02:50:32 +0000546 continue;
547 }
548 case BitstreamEntry::Record:
549 // The interesting case.
Chris Lattnerca0ea542007-04-29 08:31:14 +0000550 break;
Chris Lattner9e808cd2007-05-05 01:29:31 +0000551 }
Chris Lattner0271af82013-01-20 02:50:32 +0000552
553 if (Entry.ID == bitc::DEFINE_ABBREV) {
Chris Lattnerca0ea542007-04-29 08:31:14 +0000554 Stream.ReadAbbrevRecord();
Chris Lattner1684cee2007-04-29 20:00:02 +0000555 ++BlockStats.NumAbbrevs;
Chris Lattner0271af82013-01-20 02:50:32 +0000556 continue;
557 }
558
559 Record.clear();
Chris Lattner2ed6a202009-04-06 22:44:40 +0000560
Chris Lattner0271af82013-01-20 02:50:32 +0000561 ++BlockStats.NumRecords;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000562
Chris Lattner0271af82013-01-20 02:50:32 +0000563 StringRef Blob;
Mehdi Aminid7ad2212016-04-01 05:33:11 +0000564 unsigned CurrentRecordPos = Stream.getCurrentByteNo();
Chris Lattner0271af82013-01-20 02:50:32 +0000565 unsigned Code = Stream.readRecord(Entry.ID, Record, &Blob);
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000566
Chris Lattner0271af82013-01-20 02:50:32 +0000567 // Increment the # occurrences of this code.
568 if (BlockStats.CodeFreq.size() <= Code)
569 BlockStats.CodeFreq.resize(Code+1);
570 BlockStats.CodeFreq[Code].NumInstances++;
571 BlockStats.CodeFreq[Code].TotalBits +=
572 Stream.GetCurrentBitNo()-RecordStartBit;
573 if (Entry.ID != bitc::UNABBREV_RECORD) {
574 BlockStats.CodeFreq[Code].NumAbbrev++;
575 ++BlockStats.NumAbbreviatedRecords;
576 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000577
Richard Smithdc1414b2016-02-06 00:46:09 +0000578 if (DumpRecords) {
Chris Lattner0271af82013-01-20 02:50:32 +0000579 outs() << Indent << " <";
580 if (const char *CodeName =
Jordan Rose88eb5342014-08-30 17:07:55 +0000581 GetCodeName(Code, BlockID, *Stream.getBitStreamReader(),
582 CurStreamType))
Chris Lattner0271af82013-01-20 02:50:32 +0000583 outs() << CodeName;
584 else
585 outs() << "UnknownCode" << Code;
586 if (NonSymbolic &&
Jordan Rose88eb5342014-08-30 17:07:55 +0000587 GetCodeName(Code, BlockID, *Stream.getBitStreamReader(),
588 CurStreamType))
Chris Lattner0271af82013-01-20 02:50:32 +0000589 outs() << " codeid=" << Code;
Teresa Johnsonb1cfcd42015-10-08 15:56:24 +0000590 const BitCodeAbbrev *Abbv = nullptr;
591 if (Entry.ID != bitc::UNABBREV_RECORD) {
592 Abbv = Stream.getAbbrev(Entry.ID);
Chris Lattner0271af82013-01-20 02:50:32 +0000593 outs() << " abbrevid=" << Entry.ID;
Teresa Johnsonb1cfcd42015-10-08 15:56:24 +0000594 }
Chris Lattner3543caa2007-04-29 21:48:19 +0000595
Chris Lattner0271af82013-01-20 02:50:32 +0000596 for (unsigned i = 0, e = Record.size(); i != e; ++i)
597 outs() << " op" << i << "=" << (int64_t)Record[i];
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000598
Mehdi Aminid7ad2212016-04-01 05:33:11 +0000599 // If we found a module hash, let's verify that it matches!
600 if (BlockID == bitc::MODULE_BLOCK_ID && Code == bitc::MODULE_CODE_HASH) {
601 if (Record.size() != 5)
602 outs() << " (invalid)";
603 else {
604 // Recompute the hash and compare it to the one in the bitcode
605 SHA1 Hasher;
606 StringRef Hash;
607 {
608 int BlockSize = CurrentRecordPos - BlockEntryPos;
609 auto Ptr = Stream.getPointerToByte(BlockEntryPos, BlockSize);
610 Hasher.update(ArrayRef<uint8_t>(Ptr, BlockSize));
611 Hash = Hasher.result();
612 }
613 SmallString<20> RecordedHash;
614 RecordedHash.resize(20);
615 int Pos = 0;
616 for (auto &Val : Record) {
617 assert(!(Val >> 32) && "Unexpected high bits set");
618 RecordedHash[Pos++] = (Val >> 24) & 0xFF;
619 RecordedHash[Pos++] = (Val >> 16) & 0xFF;
620 RecordedHash[Pos++] = (Val >> 8) & 0xFF;
621 RecordedHash[Pos++] = (Val >> 0) & 0xFF;
622 }
623 if (Hash == RecordedHash)
624 outs() << " (match)";
625 else
626 outs() << " (!mismatch!)";
627 }
628 }
629
Chris Lattner0271af82013-01-20 02:50:32 +0000630 outs() << "/>";
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000631
Teresa Johnsonb1cfcd42015-10-08 15:56:24 +0000632 if (Abbv) {
633 for (unsigned i = 1, e = Abbv->getNumOperandInfos(); i != e; ++i) {
634 const BitCodeAbbrevOp &Op = Abbv->getOperandInfo(i);
635 if (!Op.isEncoding() || Op.getEncoding() != BitCodeAbbrevOp::Array)
636 continue;
637 assert(i + 2 == e && "Array op not second to last");
638 std::string Str;
639 bool ArrayIsPrintable = true;
640 for (unsigned j = i - 1, je = Record.size(); j != je; ++j) {
641 if (!isprint(static_cast<unsigned char>(Record[j]))) {
642 ArrayIsPrintable = false;
643 break;
644 }
645 Str += (char)Record[j];
646 }
Teresa Johnsonf72278f2015-11-02 18:02:11 +0000647 if (ArrayIsPrintable)
648 outs() << " record string = '" << Str << "'";
Teresa Johnsonb1cfcd42015-10-08 15:56:24 +0000649 break;
650 }
651 }
652
Duncan P. N. Exon Smith6565a0d2016-03-27 23:17:54 +0000653 if (Blob.data() && decodeBlob(Code, BlockID, *Stream.getBitStreamReader(),
654 Indent, Record, Blob)) {
Chris Lattner0271af82013-01-20 02:50:32 +0000655 outs() << " blob data = ";
Jordan Rose0fa38b82015-05-13 18:51:49 +0000656 if (ShowBinaryBlobs) {
657 outs() << "'";
658 outs().write_escaped(Blob, /*hex=*/true) << "'";
659 } else {
660 bool BlobIsPrintable = true;
661 for (unsigned i = 0, e = Blob.size(); i != e; ++i)
662 if (!isprint(static_cast<unsigned char>(Blob[i]))) {
663 BlobIsPrintable = false;
664 break;
665 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000666
Jordan Rose0fa38b82015-05-13 18:51:49 +0000667 if (BlobIsPrintable)
668 outs() << "'" << Blob << "'";
669 else
670 outs() << "unprintable, " << Blob.size() << " bytes.";
671 }
Chris Lattner3543caa2007-04-29 21:48:19 +0000672 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000673
Chris Lattner0271af82013-01-20 02:50:32 +0000674 outs() << "\n";
Chris Lattnerca0ea542007-04-29 08:31:14 +0000675 }
676 }
677}
678
Chris Lattner1684cee2007-04-29 20:00:02 +0000679static void PrintSize(double Bits) {
Jan Wen Voung52ad2082012-09-05 20:55:54 +0000680 outs() << format("%.2f/%.2fB/%luW", Bits, Bits/8,(unsigned long)(Bits/32));
Chris Lattnerbf419a92009-04-27 17:59:34 +0000681}
682static void PrintSize(uint64_t Bits) {
Jan Wen Voung52ad2082012-09-05 20:55:54 +0000683 outs() << format("%lub/%.2fB/%luW", (unsigned long)Bits,
684 (double)Bits/8, (unsigned long)(Bits/32));
Chris Lattner1684cee2007-04-29 20:00:02 +0000685}
686
Jordan Rose88eb5342014-08-30 17:07:55 +0000687static bool openBitcodeFile(StringRef Path,
688 std::unique_ptr<MemoryBuffer> &MemBuf,
689 BitstreamReader &StreamFile,
690 BitstreamCursor &Stream,
691 CurStreamTypeType &CurStreamType) {
Chris Lattner03997582007-04-29 08:12:22 +0000692 // Read the input file.
Rafael Espindolaadf21f22014-07-06 17:43:13 +0000693 ErrorOr<std::unique_ptr<MemoryBuffer>> MemBufOrErr =
Jordan Rose88eb5342014-08-30 17:07:55 +0000694 MemoryBuffer::getFileOrSTDIN(Path);
Rafael Espindolaadf21f22014-07-06 17:43:13 +0000695 if (std::error_code EC = MemBufOrErr.getError())
Jordan Rose88eb5342014-08-30 17:07:55 +0000696 return Error(Twine("Error reading '") + Path + "': " + EC.message());
697 MemBuf = std::move(MemBufOrErr.get());
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000698
Jordan Rose88eb5342014-08-30 17:07:55 +0000699 if (MemBuf->getBufferSize() & 3)
Chris Lattnerca0ea542007-04-29 08:31:14 +0000700 return Error("Bitcode stream should be a multiple of 4 bytes in length");
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000701
Jordan Rose88eb5342014-08-30 17:07:55 +0000702 const unsigned char *BufPtr = (const unsigned char *)MemBuf->getBufferStart();
703 const unsigned char *EndBufPtr = BufPtr + MemBuf->getBufferSize();
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000704
Chris Lattnerb9e07fd2009-04-06 20:54:32 +0000705 // If we have a wrapper header, parse it and ignore the non-bc file contents.
706 // The magic number is 0x0B17C0DE stored in little endian.
Akira Hatanaka4f472a882016-01-29 05:55:09 +0000707 if (isBitcodeWrapper(BufPtr, EndBufPtr)) {
Mehdi Aminieed26932016-04-01 05:19:14 +0000708 if (MemBuf->getBufferSize() < BWH_HeaderSize)
Akira Hatanaka4f472a882016-01-29 05:55:09 +0000709 return Error("Invalid bitcode wrapper header");
710
711 if (Dump) {
712 unsigned Magic = support::endian::read32le(&BufPtr[BWH_MagicField]);
713 unsigned Version = support::endian::read32le(&BufPtr[BWH_VersionField]);
714 unsigned Offset = support::endian::read32le(&BufPtr[BWH_OffsetField]);
715 unsigned Size = support::endian::read32le(&BufPtr[BWH_SizeField]);
716 unsigned CPUType = support::endian::read32le(&BufPtr[BWH_CPUTypeField]);
717
718 outs() << "<BITCODE_WRAPPER_HEADER"
719 << " Magic=" << format_hex(Magic, 10)
720 << " Version=" << format_hex(Version, 10)
721 << " Offset=" << format_hex(Offset, 10)
722 << " Size=" << format_hex(Size, 10)
723 << " CPUType=" << format_hex(CPUType, 10) << "/>\n";
724 }
725
Derek Schuff8b2dcad2012-02-06 22:30:29 +0000726 if (SkipBitcodeWrapperHeader(BufPtr, EndBufPtr, true))
Chris Lattnerb9e07fd2009-04-06 20:54:32 +0000727 return Error("Invalid bitcode wrapper header");
Akira Hatanaka4f472a882016-01-29 05:55:09 +0000728 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000729
Jordan Rose88eb5342014-08-30 17:07:55 +0000730 StreamFile = BitstreamReader(BufPtr, EndBufPtr);
731 Stream = BitstreamCursor(StreamFile);
Chris Lattner0e3f50d2009-04-27 20:04:08 +0000732 StreamFile.CollectBlockInfoNames();
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000733
Chris Lattner03997582007-04-29 08:12:22 +0000734 // Read the stream signature.
735 char Signature[6];
736 Signature[0] = Stream.Read(8);
737 Signature[1] = Stream.Read(8);
738 Signature[2] = Stream.Read(4);
739 Signature[3] = Stream.Read(4);
740 Signature[4] = Stream.Read(4);
741 Signature[5] = Stream.Read(4);
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000742
Chris Lattnerca0ea542007-04-29 08:31:14 +0000743 // Autodetect the file contents, if it is one we know.
Chris Lattner03997582007-04-29 08:12:22 +0000744 CurStreamType = UnknownBitstream;
745 if (Signature[0] == 'B' && Signature[1] == 'C' &&
746 Signature[2] == 0x0 && Signature[3] == 0xC &&
747 Signature[4] == 0xE && Signature[5] == 0xD)
748 CurStreamType = LLVMIRBitstream;
749
Jordan Rose88eb5342014-08-30 17:07:55 +0000750 return false;
751}
752
753/// AnalyzeBitcode - Analyze the bitcode file specified by InputFilename.
754static int AnalyzeBitcode() {
755 std::unique_ptr<MemoryBuffer> StreamBuffer;
756 BitstreamReader StreamFile;
757 BitstreamCursor Stream;
758 CurStreamTypeType CurStreamType;
759 if (openBitcodeFile(InputFilename, StreamBuffer, StreamFile, Stream,
760 CurStreamType))
761 return true;
762
763 // Read block info from BlockInfoFilename, if specified.
764 // The block info must be a top-level block.
765 if (!BlockInfoFilename.empty()) {
766 std::unique_ptr<MemoryBuffer> BlockInfoBuffer;
767 BitstreamReader BlockInfoFile;
768 BitstreamCursor BlockInfoCursor;
769 CurStreamTypeType BlockInfoStreamType;
770 if (openBitcodeFile(BlockInfoFilename, BlockInfoBuffer, BlockInfoFile,
771 BlockInfoCursor, BlockInfoStreamType))
772 return true;
773
774 while (!BlockInfoCursor.AtEndOfStream()) {
775 unsigned Code = BlockInfoCursor.ReadCode();
776 if (Code != bitc::ENTER_SUBBLOCK)
777 return Error("Invalid record at top-level in block info file");
778
779 unsigned BlockID = BlockInfoCursor.ReadSubBlockID();
780 if (BlockID == bitc::BLOCKINFO_BLOCK_ID) {
781 if (BlockInfoCursor.ReadBlockInfoBlock())
782 return Error("Malformed BlockInfoBlock in block info file");
783 break;
784 }
785
786 BlockInfoCursor.SkipBlock();
787 }
788
789 StreamFile.takeBlockInfo(std::move(BlockInfoFile));
790 }
791
Chris Lattner1684cee2007-04-29 20:00:02 +0000792 unsigned NumTopBlocks = 0;
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000793
Chris Lattnerca0ea542007-04-29 08:31:14 +0000794 // Parse the top-level structure. We only allow blocks at the top-level.
795 while (!Stream.AtEndOfStream()) {
796 unsigned Code = Stream.ReadCode();
797 if (Code != bitc::ENTER_SUBBLOCK)
798 return Error("Invalid record at top-level");
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000799
Chris Lattner0271af82013-01-20 02:50:32 +0000800 unsigned BlockID = Stream.ReadSubBlockID();
801
Jordan Rose88eb5342014-08-30 17:07:55 +0000802 if (ParseBlock(Stream, BlockID, 0, CurStreamType))
Chris Lattnerca0ea542007-04-29 08:31:14 +0000803 return true;
Chris Lattner1684cee2007-04-29 20:00:02 +0000804 ++NumTopBlocks;
Chris Lattnerca0ea542007-04-29 08:31:14 +0000805 }
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000806
Chris Lattner633ab162012-03-19 23:40:48 +0000807 if (Dump) outs() << "\n\n";
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000808
Jordan Rose88eb5342014-08-30 17:07:55 +0000809 uint64_t BufferSizeBits = StreamFile.getBitcodeBytes().getExtent() * CHAR_BIT;
Chris Lattnerca0ea542007-04-29 08:31:14 +0000810 // Print a summary of the read file.
Chris Lattner633ab162012-03-19 23:40:48 +0000811 outs() << "Summary of " << InputFilename << ":\n";
812 outs() << " Total size: ";
Chris Lattner5fab65d2007-05-01 02:43:46 +0000813 PrintSize(BufferSizeBits);
Chris Lattner633ab162012-03-19 23:40:48 +0000814 outs() << "\n";
815 outs() << " Stream type: ";
Chris Lattner03997582007-04-29 08:12:22 +0000816 switch (CurStreamType) {
Chris Lattner633ab162012-03-19 23:40:48 +0000817 case UnknownBitstream: outs() << "unknown\n"; break;
818 case LLVMIRBitstream: outs() << "LLVM IR\n"; break;
Chris Lattner03997582007-04-29 08:12:22 +0000819 }
Chris Lattner633ab162012-03-19 23:40:48 +0000820 outs() << " # Toplevel Blocks: " << NumTopBlocks << "\n";
821 outs() << "\n";
Chris Lattner1684cee2007-04-29 20:00:02 +0000822
823 // Emit per-block stats.
Chris Lattner633ab162012-03-19 23:40:48 +0000824 outs() << "Per-block Summary:\n";
Chris Lattner1684cee2007-04-29 20:00:02 +0000825 for (std::map<unsigned, PerBlockIDStats>::iterator I = BlockIDStats.begin(),
826 E = BlockIDStats.end(); I != E; ++I) {
Chris Lattner633ab162012-03-19 23:40:48 +0000827 outs() << " Block ID #" << I->first;
Jordan Rose88eb5342014-08-30 17:07:55 +0000828 if (const char *BlockName = GetBlockName(I->first, StreamFile,
829 CurStreamType))
Chris Lattner633ab162012-03-19 23:40:48 +0000830 outs() << " (" << BlockName << ")";
831 outs() << ":\n";
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000832
Chris Lattner1684cee2007-04-29 20:00:02 +0000833 const PerBlockIDStats &Stats = I->second;
Chris Lattner633ab162012-03-19 23:40:48 +0000834 outs() << " Num Instances: " << Stats.NumInstances << "\n";
835 outs() << " Total Size: ";
Chris Lattner1684cee2007-04-29 20:00:02 +0000836 PrintSize(Stats.NumBits);
Chris Lattner633ab162012-03-19 23:40:48 +0000837 outs() << "\n";
Daniel Dunbare813b222009-09-25 16:04:21 +0000838 double pct = (Stats.NumBits * 100.0) / BufferSizeBits;
Jan Wen Voung52ad2082012-09-05 20:55:54 +0000839 outs() << " Percent of file: " << format("%2.4f%%", pct) << "\n";
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000840 if (Stats.NumInstances > 1) {
Chris Lattner633ab162012-03-19 23:40:48 +0000841 outs() << " Average Size: ";
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000842 PrintSize(Stats.NumBits/(double)Stats.NumInstances);
Chris Lattner633ab162012-03-19 23:40:48 +0000843 outs() << "\n";
844 outs() << " Tot/Avg SubBlocks: " << Stats.NumSubBlocks << "/"
Dan Gohmand8db3762009-07-15 16:35:29 +0000845 << Stats.NumSubBlocks/(double)Stats.NumInstances << "\n";
Chris Lattner633ab162012-03-19 23:40:48 +0000846 outs() << " Tot/Avg Abbrevs: " << Stats.NumAbbrevs << "/"
Dan Gohmand8db3762009-07-15 16:35:29 +0000847 << Stats.NumAbbrevs/(double)Stats.NumInstances << "\n";
Chris Lattner633ab162012-03-19 23:40:48 +0000848 outs() << " Tot/Avg Records: " << Stats.NumRecords << "/"
Dan Gohmand8db3762009-07-15 16:35:29 +0000849 << Stats.NumRecords/(double)Stats.NumInstances << "\n";
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000850 } else {
Chris Lattner633ab162012-03-19 23:40:48 +0000851 outs() << " Num SubBlocks: " << Stats.NumSubBlocks << "\n";
852 outs() << " Num Abbrevs: " << Stats.NumAbbrevs << "\n";
853 outs() << " Num Records: " << Stats.NumRecords << "\n";
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000854 }
Daniel Dunbare813b222009-09-25 16:04:21 +0000855 if (Stats.NumRecords) {
856 double pct = (Stats.NumAbbreviatedRecords * 100.0) / Stats.NumRecords;
Chris Lattner633ab162012-03-19 23:40:48 +0000857 outs() << " Percent Abbrevs: " << format("%2.4f%%", pct) << "\n";
Daniel Dunbare813b222009-09-25 16:04:21 +0000858 }
Chris Lattner633ab162012-03-19 23:40:48 +0000859 outs() << "\n";
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000860
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000861 // Print a histogram of the codes we see.
862 if (!NoHistogram && !Stats.CodeFreq.empty()) {
Mehdi Aminid2638562015-10-21 06:10:55 +0000863 std::vector<std::pair<unsigned, unsigned> > FreqPairs; // <freq,code>
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000864 for (unsigned i = 0, e = Stats.CodeFreq.size(); i != e; ++i)
Mehdi Aminid2638562015-10-21 06:10:55 +0000865 if (unsigned Freq = Stats.CodeFreq[i].NumInstances)
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000866 FreqPairs.push_back(std::make_pair(Freq, i));
867 std::stable_sort(FreqPairs.begin(), FreqPairs.end());
868 std::reverse(FreqPairs.begin(), FreqPairs.end());
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000869
Chris Lattner633ab162012-03-19 23:40:48 +0000870 outs() << "\tRecord Histogram:\n";
Richard Smithdc1414b2016-02-06 00:46:09 +0000871 outs() << "\t\t Count # Bits b/Rec % Abv Record Kind\n";
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000872 for (unsigned i = 0, e = FreqPairs.size(); i != e; ++i) {
Chris Lattner1cf80692009-04-27 18:15:27 +0000873 const PerRecordStats &RecStats = Stats.CodeFreq[FreqPairs[i].second];
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000874
Mehdi Aminid2638562015-10-21 06:10:55 +0000875 outs() << format("\t\t%7d %9lu",
Jan Wen Voung05ff5702012-09-05 20:55:57 +0000876 RecStats.NumInstances,
877 (unsigned long)RecStats.TotalBits);
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000878
Richard Smithdc1414b2016-02-06 00:46:09 +0000879 if (RecStats.NumInstances > 1)
880 outs() << format(" %9.1f",
881 (double)RecStats.TotalBits/RecStats.NumInstances);
882 else
883 outs() << " ";
884
Chris Lattner1cf80692009-04-27 18:15:27 +0000885 if (RecStats.NumAbbrev)
Jan Wen Voung52ad2082012-09-05 20:55:54 +0000886 outs() <<
Richard Smithdc1414b2016-02-06 00:46:09 +0000887 format(" %7.2f",
Jan Wen Voung52ad2082012-09-05 20:55:54 +0000888 (double)RecStats.NumAbbrev/RecStats.NumInstances*100);
Chris Lattner1cf80692009-04-27 18:15:27 +0000889 else
Richard Smithdc1414b2016-02-06 00:46:09 +0000890 outs() << " ";
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000891
Richard Smithdc1414b2016-02-06 00:46:09 +0000892 outs() << " ";
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000893 if (const char *CodeName =
Jordan Rose88eb5342014-08-30 17:07:55 +0000894 GetCodeName(FreqPairs[i].second, I->first, StreamFile,
895 CurStreamType))
Jan Wen Voung52ad2082012-09-05 20:55:54 +0000896 outs() << CodeName << "\n";
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000897 else
Jan Wen Voung52ad2082012-09-05 20:55:54 +0000898 outs() << "UnknownCode" << FreqPairs[i].second << "\n";
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000899 }
Chris Lattner633ab162012-03-19 23:40:48 +0000900 outs() << "\n";
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000901
Chris Lattner4a7ac9f2007-05-05 01:46:49 +0000902 }
Chris Lattner1684cee2007-04-29 20:00:02 +0000903 }
Chris Lattner03997582007-04-29 08:12:22 +0000904 return 0;
905}
Reid Spencerdb5c86d2004-06-07 17:53:43 +0000906
Chris Lattnerca0ea542007-04-29 08:31:14 +0000907
Chris Lattner76d46322006-12-06 01:18:01 +0000908int main(int argc, char **argv) {
Chris Lattnere3fc2d12009-03-06 05:34:10 +0000909 // Print a stack trace if we signal out.
Chris Lattner03997582007-04-29 08:12:22 +0000910 sys::PrintStackTraceOnErrorSignal();
Chris Lattnere3fc2d12009-03-06 05:34:10 +0000911 PrettyStackTraceProgram X(argc, argv);
912 llvm_shutdown_obj Y; // Call llvm_shutdown() on exit.
913 cl::ParseCommandLineOptions(argc, argv, "llvm-bcanalyzer file analyzer\n");
Daniel Dunbar75359a7c2009-09-25 16:03:57 +0000914
Chris Lattner6d80e212007-05-06 09:29:57 +0000915 return AnalyzeBitcode();
Reid Spencerdb5c86d2004-06-07 17:53:43 +0000916}