blob: e9d81870e6dc5fee05f64fe5443fd4ccff732d75 [file] [log] [blame]
Nick Lewycky3e62b2d2009-02-03 07:13:24 +00001//===-- gold-plugin.cpp - Plugin to gold for Link Time Optimization ------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This is a gold plugin for LLVM. It provides an LLVM implementation of the
11// interface described in http://gcc.gnu.org/wiki/whopr/driver .
12//
13//===----------------------------------------------------------------------===//
14
15#include "plugin-api.h"
16
17#include "llvm-c/lto.h"
18
19#include "llvm/Support/raw_ostream.h"
20#include "llvm/System/Path.h"
21
Torok Edwin6cbbdfd2009-02-04 21:00:02 +000022#include <cerrno>
Nick Lewycky3e62b2d2009-02-03 07:13:24 +000023#include <cstdlib>
24#include <cstring>
25#include <list>
26#include <vector>
27
28using namespace llvm;
29
30namespace {
31 ld_plugin_status discard_message(int level, const char *format, ...) {
32 // Die loudly. Recent versions of Gold pass ld_plugin_message as the first
33 // callback in the transfer vector. This should never be called.
34 abort();
35 }
36
37 ld_plugin_add_symbols add_symbols = NULL;
38 ld_plugin_get_symbols get_symbols = NULL;
39 ld_plugin_add_input_file add_input_file = NULL;
40 ld_plugin_message message = discard_message;
41
42 int api_version = 0;
43 int gold_version = 0;
44
45 struct claimed_file {
46 lto_module_t M;
47 void *handle;
48 std::vector<ld_plugin_symbol> syms;
49 };
50
51 lto_codegen_model output_type = LTO_CODEGEN_PIC_MODEL_STATIC;
52 std::list<claimed_file> Modules;
53 std::vector<sys::Path> Cleanup;
54}
55
56ld_plugin_status claim_file_hook(const ld_plugin_input_file *file,
57 int *claimed);
58ld_plugin_status all_symbols_read_hook(void);
59ld_plugin_status cleanup_hook(void);
60
61extern "C" ld_plugin_status onload(ld_plugin_tv *tv);
62ld_plugin_status onload(ld_plugin_tv *tv) {
63 // We're given a pointer to the first transfer vector. We read through them
64 // until we find one where tv_tag == LDPT_NULL. The REGISTER_* tagged values
65 // contain pointers to functions that we need to call to register our own
66 // hooks. The others are addresses of functions we can use to call into gold
67 // for services.
68
69 bool registeredClaimFile = false;
70 bool registeredAllSymbolsRead = false;
71 bool registeredCleanup = false;
72
73 for (; tv->tv_tag != LDPT_NULL; ++tv) {
74 switch (tv->tv_tag) {
75 case LDPT_API_VERSION:
76 api_version = tv->tv_u.tv_val;
77 break;
78 case LDPT_GOLD_VERSION: // major * 100 + minor
79 gold_version = tv->tv_u.tv_val;
80 break;
81 case LDPT_LINKER_OUTPUT:
82 switch (tv->tv_u.tv_val) {
83 case LDPO_REL: // .o
84 case LDPO_DYN: // .so
85 output_type = LTO_CODEGEN_PIC_MODEL_DYNAMIC;
86 break;
87 case LDPO_EXEC: // .exe
88 output_type = LTO_CODEGEN_PIC_MODEL_STATIC;
89 break;
90 default:
91 (*message)(LDPL_ERROR, "Unknown output file type %d",
92 tv->tv_u.tv_val);
93 return LDPS_ERR;
94 }
95 // TODO: add an option to disable PIC.
96 //output_type = LTO_CODEGEN_PIC_MODEL_DYNAMIC_NO_PIC;
97 break;
98 case LDPT_OPTION:
99 (*message)(LDPL_WARNING, "Ignoring flag %s", tv->tv_u.tv_string);
100 break;
101 case LDPT_REGISTER_CLAIM_FILE_HOOK: {
102 ld_plugin_register_claim_file callback;
103 callback = tv->tv_u.tv_register_claim_file;
104
105 if ((*callback)(claim_file_hook) != LDPS_OK)
106 return LDPS_ERR;
107
108 registeredClaimFile = true;
109 } break;
110 case LDPT_REGISTER_ALL_SYMBOLS_READ_HOOK: {
111 ld_plugin_register_all_symbols_read callback;
112 callback = tv->tv_u.tv_register_all_symbols_read;
113
114 if ((*callback)(all_symbols_read_hook) != LDPS_OK)
115 return LDPS_ERR;
116
117 registeredAllSymbolsRead = true;
118 } break;
119 case LDPT_REGISTER_CLEANUP_HOOK: {
120 ld_plugin_register_cleanup callback;
121 callback = tv->tv_u.tv_register_cleanup;
122
123 if ((*callback)(cleanup_hook) != LDPS_OK)
124 return LDPS_ERR;
125
126 registeredCleanup = true;
127 } break;
128 case LDPT_ADD_SYMBOLS:
129 add_symbols = tv->tv_u.tv_add_symbols;
130 break;
131 case LDPT_GET_SYMBOLS:
132 get_symbols = tv->tv_u.tv_get_symbols;
133 break;
134 case LDPT_ADD_INPUT_FILE:
135 add_input_file = tv->tv_u.tv_add_input_file;
136 break;
137 case LDPT_MESSAGE:
138 message = tv->tv_u.tv_message;
139 break;
140 default:
141 break;
142 }
143 }
144
Rafael Espindola98c507e2009-02-18 08:30:15 +0000145 if (!registeredClaimFile) {
Rafael Espindolaf163a952009-02-17 21:08:21 +0000146 (*message)(LDPL_ERROR, "register_claim_file not passed to LLVMgold.");
147 return LDPS_ERR;
148 }
Rafael Espindola98c507e2009-02-18 08:30:15 +0000149 if (!add_symbols) {
Rafael Espindolaf163a952009-02-17 21:08:21 +0000150 (*message)(LDPL_ERROR, "add_symbols not passed to LLVMgold.");
151 return LDPS_ERR;
152 }
Nick Lewycky3e62b2d2009-02-03 07:13:24 +0000153
154 return LDPS_OK;
155}
156
157/// claim_file_hook - called by gold to see whether this file is one that
158/// our plugin can handle. We'll try to open it and register all the symbols
159/// with add_symbol if possible.
160ld_plugin_status claim_file_hook(const ld_plugin_input_file *file,
161 int *claimed) {
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000162 void *buf = NULL;
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000163 if (file->offset) {
Nick Lewyckyc1da8862009-02-05 04:14:23 +0000164 // Gold has found what might be IR part-way inside of a file, such as
165 // an .a archive.
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000166 if (lseek(file->fd, file->offset, SEEK_SET) == -1) {
Nick Lewycky0df91b22009-02-07 03:15:01 +0000167 (*message)(LDPL_ERROR,
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000168 "Failed to seek to archive member of %s at offset %d: %s\n",
169 file->name,
170 file->offset, strerror(errno));
171 return LDPS_ERR;
172 }
173 buf = malloc(file->filesize);
174 if (!buf) {
Nick Lewycky0df91b22009-02-07 03:15:01 +0000175 (*message)(LDPL_ERROR,
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000176 "Failed to allocate buffer for archive member of size: %d\n",
177 file->filesize);
178 return LDPS_ERR;
179 }
180 if (read(file->fd, buf, file->filesize) != file->filesize) {
Nick Lewycky0df91b22009-02-07 03:15:01 +0000181 (*message)(LDPL_ERROR,
182 "Failed to read archive member of %s at offset %d: %s\n",
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000183 file->name,
Nick Lewycky0df91b22009-02-07 03:15:01 +0000184 file->offset,
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000185 strerror(errno));
Nick Lewycky0df91b22009-02-07 03:15:01 +0000186 free(buf);
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000187 return LDPS_ERR;
188 }
Nick Lewycky0df91b22009-02-07 03:15:01 +0000189 if (!lto_module_is_object_file_in_memory(buf, file->filesize)) {
190 free(buf);
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000191 return LDPS_OK;
Nick Lewycky0df91b22009-02-07 03:15:01 +0000192 }
Torok Edwin3e5a0d82009-02-04 17:39:30 +0000193 } else if (!lto_module_is_object_file(file->name))
Nick Lewycky3e62b2d2009-02-03 07:13:24 +0000194 return LDPS_OK;
195
196 *claimed = 1;
197 Modules.resize(Modules.size() + 1);
198 claimed_file &cf = Modules.back();
199
Nick Lewyckyc1da8862009-02-05 04:14:23 +0000200 cf.M = buf ? lto_module_create_from_memory(buf, file->filesize) :
201 lto_module_create(file->name);
Nick Lewyckyea97aa62009-02-06 01:58:34 +0000202 free(buf);
Nick Lewycky3e62b2d2009-02-03 07:13:24 +0000203 if (!cf.M) {
204 (*message)(LDPL_ERROR, "Failed to create LLVM module: %s",
205 lto_get_error_message());
206 return LDPS_ERR;
207 }
208 cf.handle = file->handle;
209 unsigned sym_count = lto_module_get_num_symbols(cf.M);
210 cf.syms.reserve(sym_count);
211
212 for (unsigned i = 0; i != sym_count; ++i) {
213 lto_symbol_attributes attrs = lto_module_get_symbol_attribute(cf.M, i);
214 if ((attrs & LTO_SYMBOL_SCOPE_MASK) == LTO_SYMBOL_SCOPE_INTERNAL)
215 continue;
216
217 cf.syms.push_back(ld_plugin_symbol());
218 ld_plugin_symbol &sym = cf.syms.back();
219 sym.name = const_cast<char *>(lto_module_get_symbol_name(cf.M, i));
220 sym.version = NULL;
221
222 int scope = attrs & LTO_SYMBOL_SCOPE_MASK;
223 switch (scope) {
224 case LTO_SYMBOL_SCOPE_HIDDEN:
225 sym.visibility = LDPV_HIDDEN;
226 break;
227 case LTO_SYMBOL_SCOPE_PROTECTED:
228 sym.visibility = LDPV_PROTECTED;
229 break;
230 case 0: // extern
231 case LTO_SYMBOL_SCOPE_DEFAULT:
232 sym.visibility = LDPV_DEFAULT;
233 break;
234 default:
235 (*message)(LDPL_ERROR, "Unknown scope attribute: %d", scope);
236 return LDPS_ERR;
237 }
238
239 int definition = attrs & LTO_SYMBOL_DEFINITION_MASK;
240 switch (definition) {
241 case LTO_SYMBOL_DEFINITION_REGULAR:
242 sym.def = LDPK_DEF;
243 break;
244 case LTO_SYMBOL_DEFINITION_UNDEFINED:
245 sym.def = LDPK_UNDEF;
246 break;
247 case LTO_SYMBOL_DEFINITION_TENTATIVE:
248 sym.def = LDPK_COMMON;
249 break;
250 case LTO_SYMBOL_DEFINITION_WEAK:
251 sym.def = LDPK_WEAKDEF;
252 break;
253 default:
254 (*message)(LDPL_ERROR, "Unknown definition attribute: %d", definition);
255 return LDPS_ERR;
256 }
257
258 // LLVM never emits COMDAT.
259 sym.size = 0;
260 sym.comdat_key = NULL;
261
262 sym.resolution = LDPR_UNKNOWN;
263 }
264
265 cf.syms.reserve(cf.syms.size());
266
267 if (!cf.syms.empty()) {
268 if ((*add_symbols)(cf.handle, cf.syms.size(), &cf.syms[0]) != LDPS_OK) {
269 (*message)(LDPL_ERROR, "Unable to add symbols!");
270 return LDPS_ERR;
271 }
272 }
273
274 return LDPS_OK;
275}
276
277/// all_symbols_read_hook - gold informs us that all symbols have been read.
278/// At this point, we use get_symbols to see if any of our definitions have
279/// been overridden by a native object file. Then, perform optimization and
280/// codegen.
281ld_plugin_status all_symbols_read_hook(void) {
282 lto_code_gen_t cg = lto_codegen_create();
283
284 for (std::list<claimed_file>::iterator I = Modules.begin(),
285 E = Modules.end(); I != E; ++I)
286 lto_codegen_add_module(cg, I->M);
287
288 // If we don't preserve any symbols, libLTO will assume that all symbols are
289 // needed. Keep all symbols unless we're producing a final executable.
290 if (output_type == LTO_CODEGEN_PIC_MODEL_STATIC) {
291 bool anySymbolsPreserved = false;
292 for (std::list<claimed_file>::iterator I = Modules.begin(),
293 E = Modules.end(); I != E; ++I) {
294 (*get_symbols)(I->handle, I->syms.size(), &I->syms[0]);
295 for (unsigned i = 0, e = I->syms.size(); i != e; i++) {
Nick Lewyckye0afaa32009-02-15 22:49:17 +0000296 if (I->syms[i].resolution == LDPR_PREVAILING_DEF ||
297 (I->syms[i].def == LDPK_COMMON &&
298 I->syms[i].resolution == LDPR_RESOLVED_IR)) {
Nick Lewycky3e62b2d2009-02-03 07:13:24 +0000299 lto_codegen_add_must_preserve_symbol(cg, I->syms[i].name);
300 anySymbolsPreserved = true;
301 }
302 }
303 }
304
305 if (!anySymbolsPreserved) {
306 // This entire file is unnecessary!
307 lto_codegen_dispose(cg);
308 return LDPS_OK;
309 }
310 }
311
312 lto_codegen_set_pic_model(cg, output_type);
313 lto_codegen_set_debug_model(cg, LTO_DEBUG_MODEL_DWARF);
314
315 size_t bufsize = 0;
316 const char *buffer = static_cast<const char *>(lto_codegen_compile(cg,
317 &bufsize));
318
319 std::string ErrMsg;
320
321 sys::Path uniqueObjPath("/tmp/llvmgold.o");
322 if (uniqueObjPath.createTemporaryFileOnDisk(true, &ErrMsg)) {
323 (*message)(LDPL_ERROR, "%s", ErrMsg.c_str());
324 return LDPS_ERR;
325 }
326 raw_fd_ostream *objFile = new raw_fd_ostream(uniqueObjPath.c_str(), true,
327 ErrMsg);
328 if (!ErrMsg.empty()) {
329 delete objFile;
330 (*message)(LDPL_ERROR, "%s", ErrMsg.c_str());
331 return LDPS_ERR;
332 }
333
334 objFile->write(buffer, bufsize);
335 objFile->close();
336
337 lto_codegen_dispose(cg);
Nick Lewycky3e62b2d2009-02-03 07:13:24 +0000338
339 if ((*add_input_file)(const_cast<char*>(uniqueObjPath.c_str())) != LDPS_OK) {
340 (*message)(LDPL_ERROR, "Unable to add .o file to the link.");
341 (*message)(LDPL_ERROR, "File left behind in: %s", uniqueObjPath.c_str());
342 return LDPS_ERR;
343 }
344
345 Cleanup.push_back(uniqueObjPath);
346
347 return LDPS_OK;
348}
349
350ld_plugin_status cleanup_hook(void) {
351 std::string ErrMsg;
352
353 for (int i = 0, e = Cleanup.size(); i != e; ++i)
354 if (Cleanup[i].eraseFromDisk(false, &ErrMsg))
355 (*message)(LDPL_ERROR, "Failed to delete '%s': %s", Cleanup[i].c_str(),
356 ErrMsg.c_str());
357
358 return LDPS_OK;
359}