blob: dd42e954058979d38ac7d532025382a2e76cc46e [file] [log] [blame]
Ulrich Drepperb08d5a82005-07-26 05:00:05 +00001/* Reconstruct an ELF file by reading the segments out of remote memory.
Mark Wielaard9202fe12015-05-19 13:39:39 +02002 Copyright (C) 2005-2011, 2014, 2015 Red Hat, Inc.
Mark Wielaardde2ed972012-06-05 17:15:16 +02003 This file is part of elfutils.
Ulrich Drepperb08d5a82005-07-26 05:00:05 +00004
Mark Wielaardde2ed972012-06-05 17:15:16 +02005 This file is free software; you can redistribute it and/or modify
6 it under the terms of either
Ulrich Drepperb08d5a82005-07-26 05:00:05 +00007
Mark Wielaardde2ed972012-06-05 17:15:16 +02008 * the GNU Lesser General Public License as published by the Free
9 Software Foundation; either version 3 of the License, or (at
10 your option) any later version
11
12 or
13
14 * the GNU General Public License as published by the Free
15 Software Foundation; either version 2 of the License, or (at
16 your option) any later version
17
18 or both in parallel, as here.
19
20 elfutils is distributed in the hope that it will be useful, but
Ulrich Drepper361df7d2006-04-04 21:38:57 +000021 WITHOUT ANY WARRANTY; without even the implied warranty of
22 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
23 General Public License for more details.
24
Mark Wielaardde2ed972012-06-05 17:15:16 +020025 You should have received copies of the GNU General Public License and
26 the GNU Lesser General Public License along with this program. If
27 not, see <http://www.gnu.org/licenses/>. */
Ulrich Drepperb08d5a82005-07-26 05:00:05 +000028
29#include <config.h>
30#include "../libelf/libelfP.h"
31#undef _
32
33#include "libdwflP.h"
34
35#include <gelf.h>
36#include <sys/types.h>
37#include <stdbool.h>
38#include <stdlib.h>
39#include <string.h>
40
41/* Reconstruct an ELF file by reading the segments out of remote memory
42 based on the ELF file header at EHDR_VMA and the ELF program headers it
43 points to. If not null, *LOADBASEP is filled in with the difference
44 between the addresses from which the segments were read, and the
45 addresses the file headers put them at.
46
47 The function READ_MEMORY is called to copy at least MINREAD and at most
48 MAXREAD bytes from the remote memory at target address ADDRESS into the
49 local buffer at DATA; it should return -1 for errors (with code in
50 `errno'), 0 if it failed to read at least MINREAD bytes due to EOF, or
Mark Wielaardf15bcda2014-03-03 11:43:43 +010051 the number of bytes read if >= MINREAD. ARG is passed through.
52
53 PAGESIZE is the minimum page size and alignment used for the PT_LOAD
54 segments. */
Ulrich Drepperb08d5a82005-07-26 05:00:05 +000055
56Elf *
57elf_from_remote_memory (GElf_Addr ehdr_vma,
Mark Wielaardf15bcda2014-03-03 11:43:43 +010058 GElf_Xword pagesize,
Ulrich Drepperb08d5a82005-07-26 05:00:05 +000059 GElf_Addr *loadbasep,
60 ssize_t (*read_memory) (void *arg, void *data,
61 GElf_Addr address,
62 size_t minread,
63 size_t maxread),
64 void *arg)
65{
Mark Wielaard9202fe12015-05-19 13:39:39 +020066 /* We might have to reserve some memory for the phdrs. Set to NULL
67 here so we can always safely free it. */
68 void *phdrsp = NULL;
69
Ulrich Drepperb08d5a82005-07-26 05:00:05 +000070 /* First read in the file header and check its sanity. */
71
72 const size_t initial_bufsize = 256;
73 unsigned char *buffer = malloc (initial_bufsize);
Mark Wielaard9202fe12015-05-19 13:39:39 +020074 if (unlikely (buffer == NULL))
Ulrich Drepperb08d5a82005-07-26 05:00:05 +000075 {
76 no_memory:
77 __libdwfl_seterrno (DWFL_E_NOMEM);
78 return NULL;
79 }
80
81 ssize_t nread = (*read_memory) (arg, buffer, ehdr_vma,
82 sizeof (Elf32_Ehdr), initial_bufsize);
83 if (nread <= 0)
84 {
85 read_error:
86 free (buffer);
Mark Wielaard9202fe12015-05-19 13:39:39 +020087 free (phdrsp);
Ulrich Drepperb08d5a82005-07-26 05:00:05 +000088 __libdwfl_seterrno (nread < 0 ? DWFL_E_ERRNO : DWFL_E_TRUNCATED);
89 return NULL;
90 }
91
92 if (memcmp (buffer, ELFMAG, SELFMAG) != 0)
93 {
94 bad_elf:
Mark Wielaardf15bcda2014-03-03 11:43:43 +010095 free (buffer);
Mark Wielaard9202fe12015-05-19 13:39:39 +020096 free (phdrsp);
Ulrich Drepperb08d5a82005-07-26 05:00:05 +000097 __libdwfl_seterrno (DWFL_E_BADELF);
98 return NULL;
99 }
100
101 /* Extract the information we need from the file header. */
102
103 union
104 {
105 Elf32_Ehdr e32;
106 Elf64_Ehdr e64;
107 } ehdr;
108 Elf_Data xlatefrom =
109 {
110 .d_type = ELF_T_EHDR,
111 .d_buf = buffer,
112 .d_version = EV_CURRENT,
113 };
114 Elf_Data xlateto =
115 {
116 .d_type = ELF_T_EHDR,
117 .d_buf = &ehdr,
118 .d_size = sizeof ehdr,
119 .d_version = EV_CURRENT,
120 };
121
122 GElf_Off phoff;
123 uint_fast16_t phnum;
124 uint_fast16_t phentsize;
125 GElf_Off shdrs_end;
126
127 switch (buffer[EI_CLASS])
128 {
129 case ELFCLASS32:
130 xlatefrom.d_size = sizeof (Elf32_Ehdr);
131 if (elf32_xlatetom (&xlateto, &xlatefrom, buffer[EI_DATA]) == NULL)
132 {
133 libelf_error:
134 __libdwfl_seterrno (DWFL_E_LIBELF);
135 return NULL;
136 }
137 phoff = ehdr.e32.e_phoff;
138 phnum = ehdr.e32.e_phnum;
139 phentsize = ehdr.e32.e_phentsize;
140 if (phentsize != sizeof (Elf32_Phdr) || phnum == 0)
141 goto bad_elf;
142 shdrs_end = ehdr.e32.e_shoff + ehdr.e32.e_shnum * ehdr.e32.e_shentsize;
143 break;
144
145 case ELFCLASS64:
146 xlatefrom.d_size = sizeof (Elf64_Ehdr);
Ulrich Drepper6258e742007-03-13 06:22:40 +0000147 if (elf64_xlatetom (&xlateto, &xlatefrom, buffer[EI_DATA]) == NULL)
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000148 goto libelf_error;
149 phoff = ehdr.e64.e_phoff;
150 phnum = ehdr.e64.e_phnum;
151 phentsize = ehdr.e64.e_phentsize;
152 if (phentsize != sizeof (Elf64_Phdr) || phnum == 0)
153 goto bad_elf;
154 shdrs_end = ehdr.e64.e_shoff + ehdr.e64.e_shnum * ehdr.e64.e_shentsize;
155 break;
156
157 default:
158 goto bad_elf;
159 }
160
161
162 /* The file header tells where to find the program headers.
163 These are what we use to actually choose what to read. */
164
165 xlatefrom.d_type = xlateto.d_type = ELF_T_PHDR;
166 xlatefrom.d_size = phnum * phentsize;
167
168 if ((size_t) nread >= phoff + phnum * phentsize)
169 /* We already have all the phdrs from the initial read. */
170 xlatefrom.d_buf = buffer + phoff;
171 else
172 {
173 /* Read in the program headers. */
174
175 if (initial_bufsize < phnum * phentsize)
176 {
177 unsigned char *newbuf = realloc (buffer, phnum * phentsize);
178 if (newbuf == NULL)
179 {
180 free (buffer);
Mark Wielaard9202fe12015-05-19 13:39:39 +0200181 free (phdrsp);
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000182 goto no_memory;
183 }
184 buffer = newbuf;
185 }
186 nread = (*read_memory) (arg, buffer, ehdr_vma + phoff,
187 phnum * phentsize, phnum * phentsize);
188 if (nread <= 0)
189 goto read_error;
190
191 xlatefrom.d_buf = buffer;
192 }
193
Mark Wielaard86ed7f72015-10-08 00:16:03 +0200194 bool class32 = ehdr.e32.e_ident[EI_CLASS] == ELFCLASS32;
195 size_t phdr_size = class32 ? sizeof (Elf32_Phdr) : sizeof (Elf64_Phdr);
196 if (unlikely (phnum > SIZE_MAX / phdr_size))
Chih-Hung Hsieh7eff36d2015-10-06 15:53:15 -0700197 {
198 free (buffer);
199 goto no_memory;
200 }
Mark Wielaard86ed7f72015-10-08 00:16:03 +0200201 const size_t phdrsp_bytes = phnum * phdr_size;
Chih-Hung Hsieh7eff36d2015-10-06 15:53:15 -0700202 phdrsp = malloc (phdrsp_bytes);
Mark Wielaard9202fe12015-05-19 13:39:39 +0200203 if (unlikely (phdrsp == NULL))
204 {
205 free (buffer);
206 goto no_memory;
207 }
Mark Wielaard9202fe12015-05-19 13:39:39 +0200208
Chih-Hung Hsieh7eff36d2015-10-06 15:53:15 -0700209 xlateto.d_buf = phdrsp;
210 xlateto.d_size = phdrsp_bytes;
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000211
212 /* Scan for PT_LOAD segments to find the total size of the file image. */
213 size_t contents_size = 0;
214 GElf_Off segments_end = 0;
Mark Wielaarddd64d4a2014-03-03 15:07:31 +0100215 GElf_Off segments_end_mem = 0;
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000216 GElf_Addr loadbase = ehdr_vma;
Roland McGrath099dd522007-08-13 22:58:36 +0000217 bool found_base = false;
Mark Wielaard86ed7f72015-10-08 00:16:03 +0200218 Elf32_Phdr (*p32)[phnum] = phdrsp;
219 Elf64_Phdr (*p64)[phnum] = phdrsp;
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000220 switch (ehdr.e32.e_ident[EI_CLASS])
221 {
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100222 /* Sanity checks segments and calculates segment_end,
223 segments_end, segments_end_mem and loadbase (if not
224 found_base yet). Returns true if sanity checking failed,
225 false otherwise. */
226 inline bool handle_segment (GElf_Addr vaddr, GElf_Off offset,
Mark Wielaard32b6c6a2014-12-19 15:40:16 +0100227 GElf_Xword filesz, GElf_Xword memsz)
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000228 {
Mark Wielaard32b6c6a2014-12-19 15:40:16 +0100229 /* Sanity check the segment load aligns with the pagesize. */
230 if (((vaddr - offset) & (pagesize - 1)) != 0)
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100231 return true;
232
233 GElf_Off segment_end = ((offset + filesz + pagesize - 1)
234 & -pagesize);
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000235
236 if (segment_end > (GElf_Off) contents_size)
237 contents_size = segment_end;
238
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100239 if (!found_base && (offset & -pagesize) == 0)
Roland McGrath099dd522007-08-13 22:58:36 +0000240 {
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100241 loadbase = ehdr_vma - (vaddr & -pagesize);
Roland McGrath099dd522007-08-13 22:58:36 +0000242 found_base = true;
243 }
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000244
245 segments_end = offset + filesz;
Mark Wielaarddd64d4a2014-03-03 15:07:31 +0100246 segments_end_mem = offset + memsz;
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100247 return false;
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000248 }
249
250 case ELFCLASS32:
251 if (elf32_xlatetom (&xlateto, &xlatefrom,
252 ehdr.e32.e_ident[EI_DATA]) == NULL)
253 goto libelf_error;
254 for (uint_fast16_t i = 0; i < phnum; ++i)
Chih-Hung Hsieh7eff36d2015-10-06 15:53:15 -0700255 if ((*p32)[i].p_type == PT_LOAD)
256 if (handle_segment ((*p32)[i].p_vaddr, (*p32)[i].p_offset,
257 (*p32)[i].p_filesz, (*p32)[i].p_memsz))
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100258 goto bad_elf;
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000259 break;
260
261 case ELFCLASS64:
Roland McGrath01fef9d2011-12-02 09:45:53 -0800262 if (elf64_xlatetom (&xlateto, &xlatefrom,
263 ehdr.e64.e_ident[EI_DATA]) == NULL)
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000264 goto libelf_error;
265 for (uint_fast16_t i = 0; i < phnum; ++i)
Chih-Hung Hsieh7eff36d2015-10-06 15:53:15 -0700266 if ((*p64)[i].p_type == PT_LOAD)
267 if (handle_segment ((*p64)[i].p_vaddr, (*p64)[i].p_offset,
268 (*p64)[i].p_filesz, (*p64)[i].p_memsz))
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100269 goto bad_elf;
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000270 break;
271
272 default:
273 abort ();
274 break;
275 }
276
277 /* Trim the last segment so we don't bother with zeros in the last page
278 that are off the end of the file. However, if the extra bit in that
Mark Wielaarddd64d4a2014-03-03 15:07:31 +0100279 page includes the section headers and the memory isn't extended (which
280 might indicate it will have been reused otherwise), keep them. */
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000281 if ((GElf_Off) contents_size > segments_end
Mark Wielaarddd64d4a2014-03-03 15:07:31 +0100282 && (GElf_Off) contents_size >= shdrs_end
283 && segments_end == segments_end_mem)
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000284 {
285 contents_size = segments_end;
286 if ((GElf_Off) contents_size < shdrs_end)
287 contents_size = shdrs_end;
288 }
289 else
290 contents_size = segments_end;
291
292 free (buffer);
293
294 /* Now we know the size of the whole image we want read in. */
295 buffer = calloc (1, contents_size);
296 if (buffer == NULL)
Mark Wielaard9202fe12015-05-19 13:39:39 +0200297 {
298 free (phdrsp);
299 goto no_memory;
300 }
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000301
302 switch (ehdr.e32.e_ident[EI_CLASS])
303 {
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100304 /* Reads the given segment. Returns true if reading fails,
305 false otherwise. */
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000306 inline bool handle_segment (GElf_Addr vaddr, GElf_Off offset,
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100307 GElf_Xword filesz)
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000308 {
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100309 GElf_Off start = offset & -pagesize;
310 GElf_Off end = (offset + filesz + pagesize - 1) & -pagesize;
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000311 if (end > (GElf_Off) contents_size)
312 end = contents_size;
313 nread = (*read_memory) (arg, buffer + start,
Mark Wielaardf15bcda2014-03-03 11:43:43 +0100314 (loadbase + vaddr) & -pagesize,
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000315 end - start, end - start);
316 return nread <= 0;
317 }
318
319 case ELFCLASS32:
320 for (uint_fast16_t i = 0; i < phnum; ++i)
Chih-Hung Hsieh7eff36d2015-10-06 15:53:15 -0700321 if ((*p32)[i].p_type == PT_LOAD)
322 if (handle_segment ((*p32)[i].p_vaddr, (*p32)[i].p_offset,
323 (*p32)[i].p_filesz))
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000324 goto read_error;
325
326 /* If the segments visible in memory didn't include the section
327 headers, then clear them from the file header. */
328 if (contents_size < shdrs_end)
329 {
330 ehdr.e32.e_shoff = 0;
331 ehdr.e32.e_shnum = 0;
332 ehdr.e32.e_shstrndx = 0;
333 }
334
335 /* This will normally have been in the first PT_LOAD segment. But it
336 conceivably could be missing, and we might have just changed it. */
337 xlatefrom.d_type = xlateto.d_type = ELF_T_EHDR;
338 xlatefrom.d_size = xlateto.d_size = sizeof ehdr.e32;
339 xlatefrom.d_buf = &ehdr.e32;
340 xlateto.d_buf = buffer;
341 if (elf32_xlatetof (&xlateto, &xlatefrom,
342 ehdr.e32.e_ident[EI_DATA]) == NULL)
343 goto libelf_error;
344 break;
345
346 case ELFCLASS64:
347 for (uint_fast16_t i = 0; i < phnum; ++i)
Chih-Hung Hsieh7eff36d2015-10-06 15:53:15 -0700348 if ((*p64)[i].p_type == PT_LOAD)
349 if (handle_segment ((*p64)[i].p_vaddr, (*p64)[i].p_offset,
350 (*p64)[i].p_filesz))
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000351 goto read_error;
352
353 /* If the segments visible in memory didn't include the section
354 headers, then clear them from the file header. */
355 if (contents_size < shdrs_end)
356 {
357 ehdr.e64.e_shoff = 0;
358 ehdr.e64.e_shnum = 0;
359 ehdr.e64.e_shstrndx = 0;
360 }
361
362 /* This will normally have been in the first PT_LOAD segment. But it
363 conceivably could be missing, and we might have just changed it. */
364 xlatefrom.d_type = xlateto.d_type = ELF_T_EHDR;
365 xlatefrom.d_size = xlateto.d_size = sizeof ehdr.e64;
366 xlatefrom.d_buf = &ehdr.e64;
367 xlateto.d_buf = buffer;
Ulrich Drepperd5a75192006-06-15 03:07:46 +0000368 if (elf64_xlatetof (&xlateto, &xlatefrom,
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000369 ehdr.e64.e_ident[EI_DATA]) == NULL)
370 goto libelf_error;
371 break;
372
373 default:
374 abort ();
375 break;
376 }
377
Mark Wielaard9202fe12015-05-19 13:39:39 +0200378 free (phdrsp);
Chih-Hung Hsieh7eff36d2015-10-06 15:53:15 -0700379 phdrsp = NULL;
Mark Wielaard9202fe12015-05-19 13:39:39 +0200380
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000381 /* Now we have the image. Open libelf on it. */
382
383 Elf *elf = elf_memory ((char *) buffer, contents_size);
384 if (elf == NULL)
385 {
386 free (buffer);
Ulrich Drepperd5a75192006-06-15 03:07:46 +0000387 goto libelf_error;
Ulrich Drepperb08d5a82005-07-26 05:00:05 +0000388 }
389
390 elf->flags |= ELF_F_MALLOCED;
391 if (loadbasep != NULL)
392 *loadbasep = loadbase;
393 return elf;
394}