blob: 0d69e809673ab20b0fb631bb541109441eb2e64b [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * misc.c
Ian Campbell818a08f2008-01-30 13:33:38 +01003 *
Kees Cookc0402882016-04-18 09:42:13 -07004 * This is a collection of several routines used to extract the kernel
5 * which includes KASLR relocation, decompression, ELF parsing, and
6 * relocation processing. Additionally included are the screen and serial
7 * output functions and related debugging support functions.
Linus Torvalds1da177e2005-04-16 15:20:36 -07008 *
9 * malloc by Hannu Savolainen 1993 and Matthias Urlichs 1994
10 * puts by Nick Holloway 1993, better puts by Martin Mares 1995
11 * High loaded stuff by Hans Lermen & Werner Almesberger, Feb. 1996
12 */
13
Yinghai Lu8fee13a42010-08-02 16:21:22 -070014#include "misc.h"
Vivek Goyal820e8fe2014-03-18 15:26:38 -040015#include "../string.h"
Eric W. Biederman968de4f2006-12-07 02:14:04 +010016
17/* WARNING!!
18 * This code is compiled with -fPIC and it is relocated dynamically
19 * at run time, but no relocation processing is performed.
20 * This means that it is not safe to place pointers in static structures.
21 */
22
23/*
24 * Getting to provably safe in-place decompression is hard.
Simon Arlott27b46d72007-10-20 01:13:56 +020025 * Worst case behaviours need to be analyzed.
Eric W. Biederman968de4f2006-12-07 02:14:04 +010026 * Background information:
27 *
28 * The file layout is:
29 * magic[2]
30 * method[1]
31 * flags[1]
32 * timestamp[4]
33 * extraflags[1]
34 * os[1]
35 * compressed data blocks[N]
36 * crc[4] orig_len[4]
37 *
38 * resulting in 18 bytes of non compressed data overhead.
39 *
40 * Files divided into blocks
41 * 1 bit (last block flag)
42 * 2 bits (block type)
43 *
Ingo Molnar1180e012008-02-21 05:03:48 +010044 * 1 block occurs every 32K -1 bytes or when 50% compression
45 * has been achieved. The smallest block type encoding is always used.
Eric W. Biederman968de4f2006-12-07 02:14:04 +010046 *
47 * stored:
48 * 32 bits length in bytes.
49 *
50 * fixed:
51 * magic fixed tree.
52 * symbols.
53 *
54 * dynamic:
55 * dynamic tree encoding.
56 * symbols.
57 *
58 *
59 * The buffer for decompression in place is the length of the
60 * uncompressed data, plus a small amount extra to keep the algorithm safe.
61 * The compressed data is placed at the end of the buffer. The output
62 * pointer is placed at the start of the buffer and the input pointer
63 * is placed where the compressed data starts. Problems will occur
64 * when the output pointer overruns the input pointer.
65 *
66 * The output pointer can only overrun the input pointer if the input
67 * pointer is moving faster than the output pointer. A condition only
68 * triggered by data whose compressed form is larger than the uncompressed
69 * form.
70 *
71 * The worst case at the block level is a growth of the compressed data
72 * of 5 bytes per 32767 bytes.
73 *
74 * The worst case internal to a compressed block is very hard to figure.
75 * The worst case can at least be bounded by having one bit that represents
76 * 32764 bytes and then all of the rest of the bytes representing the very
77 * very last byte.
78 *
79 * All of which is enough to compute an amount of extra data that is required
80 * to be safe. To avoid problems at the block level allocating 5 extra bytes
Ingo Molnar1180e012008-02-21 05:03:48 +010081 * per 32767 bytes of data is sufficient. To avoid problems internal to a
82 * block adding an extra 32767 bytes (the worst case uncompressed block size)
83 * is sufficient, to ensure that in the worst case the decompressed data for
Eric W. Biederman968de4f2006-12-07 02:14:04 +010084 * a block will stop the byte before the compressed data for a block begins.
85 * To avoid problems with the compressed data's meta information an extra 18
86 * bytes are needed. Leading to the formula:
87 *
88 * extra_bytes = (uncompressed_size >> 12) + 32768 + 18 + decompressor_size.
89 *
90 * Adding 8 bytes per 32K is a bit excessive but much easier to calculate.
91 * Adding 32768 instead of 32767 just makes for round numbers.
92 * Adding the decompressor_size is necessary as it must live after all
93 * of the data as well. Last I measured the decompressor is about 14K.
Simon Arlott27b46d72007-10-20 01:13:56 +020094 * 10K of actual data and 4K of bss.
Eric W. Biederman968de4f2006-12-07 02:14:04 +010095 *
96 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070097
98/*
99 * gzip declarations
100 */
Ingo Molnar1180e012008-02-21 05:03:48 +0100101#define STATIC static
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103#undef memcpy
Vivek Goyal04999552014-03-18 15:26:40 -0400104
105/*
106 * Use a normal definition of memset() from string.c. There are already
107 * included header files which expect a definition of memset() and by
108 * the time we define memset macro, it is too late.
109 */
110#undef memset
Ingo Molnar1180e012008-02-21 05:03:48 +0100111#define memzero(s, n) memset((s), 0, (n))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112
Linus Torvalds1da177e2005-04-16 15:20:36 -0700113
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114static void error(char *m);
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100115
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116/*
117 * This is set up by the setup-routine at boot-time
118 */
Kees Cook6655e0a2016-04-18 09:42:12 -0700119struct boot_params *boot_params;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120
Kees Cook82fa9632013-10-10 17:18:16 -0700121memptr free_mem_ptr;
122memptr free_mem_end_ptr;
Ian Campbell778cb922008-01-30 13:33:38 +0100123
Alexander van Heukelum03056c82008-04-06 14:47:00 +0200124static char *vidmem;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700125static int vidport;
126static int lines, cols;
127
Alain Knaffae03c492009-01-04 22:46:17 +0100128#ifdef CONFIG_KERNEL_GZIP
129#include "../../../../lib/decompress_inflate.c"
130#endif
131
132#ifdef CONFIG_KERNEL_BZIP2
133#include "../../../../lib/decompress_bunzip2.c"
134#endif
135
136#ifdef CONFIG_KERNEL_LZMA
137#include "../../../../lib/decompress_unlzma.c"
138#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700139
Lasse Collin30314802011-01-12 17:01:24 -0800140#ifdef CONFIG_KERNEL_XZ
141#include "../../../../lib/decompress_unxz.c"
142#endif
143
Albin Tonnerre13510992010-01-08 14:42:45 -0800144#ifdef CONFIG_KERNEL_LZO
145#include "../../../../lib/decompress_unlzo.c"
146#endif
147
Kyungsik Leef9b493a2013-07-08 16:01:48 -0700148#ifdef CONFIG_KERNEL_LZ4
149#include "../../../../lib/decompress_unlz4.c"
150#endif
151
Linus Torvalds1da177e2005-04-16 15:20:36 -0700152static void scroll(void)
153{
154 int i;
155
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100156 memcpy(vidmem, vidmem + cols * 2, (lines - 1) * cols * 2);
157 for (i = (lines - 1) * cols * 2; i < lines * cols * 2; i += 2)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700158 vidmem[i] = ' ';
159}
160
Yinghai Lu8fee13a42010-08-02 16:21:22 -0700161#define XMTRDY 0x20
162
163#define TXR 0 /* Transmit register (WRITE) */
164#define LSR 5 /* Line Status */
165static void serial_putchar(int ch)
166{
167 unsigned timeout = 0xffff;
168
169 while ((inb(early_serial_base + LSR) & XMTRDY) == 0 && --timeout)
170 cpu_relax();
171
172 outb(ch, early_serial_base + TXR);
173}
174
Joe Millenbach7aac3012012-07-19 18:04:39 -0700175void __putstr(const char *s)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700176{
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100177 int x, y, pos;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700178 char c;
179
Yinghai Lu8fee13a42010-08-02 16:21:22 -0700180 if (early_serial_base) {
181 const char *str = s;
182 while (*str) {
183 if (*str == '\n')
184 serial_putchar('\r');
185 serial_putchar(*str++);
186 }
187 }
Ben Collins6bcb13b2008-06-18 14:04:35 -0400188
Kees Cook6655e0a2016-04-18 09:42:12 -0700189 if (boot_params->screen_info.orig_video_mode == 0 &&
Kristian Høgsberg23968f72008-05-29 18:31:14 -0400190 lines == 0 && cols == 0)
Rusty Russella24e7852007-10-21 16:41:35 -0700191 return;
192
Kees Cook6655e0a2016-04-18 09:42:12 -0700193 x = boot_params->screen_info.orig_x;
194 y = boot_params->screen_info.orig_y;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100196 while ((c = *s++) != '\0') {
197 if (c == '\n') {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700198 x = 0;
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100199 if (++y >= lines) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700200 scroll();
201 y--;
202 }
203 } else {
Paolo Ciarrocchi020878a2008-08-02 21:23:36 +0200204 vidmem[(x + cols * y) * 2] = c;
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100205 if (++x >= cols) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700206 x = 0;
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100207 if (++y >= lines) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208 scroll();
209 y--;
210 }
211 }
212 }
213 }
214
Kees Cook6655e0a2016-04-18 09:42:12 -0700215 boot_params->screen_info.orig_x = x;
216 boot_params->screen_info.orig_y = y;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217
218 pos = (x + cols * y) * 2; /* Update cursor position */
Rene Hermanb02aae92008-01-30 13:30:05 +0100219 outb(14, vidport);
220 outb(0xff & (pos >> 9), vidport+1);
221 outb(15, vidport);
222 outb(0xff & (pos >> 1), vidport+1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223}
224
/*
 * Print 'value' as fixed-width lowercase hexadecimal, most significant
 * nibble first, with no prefix.  Every nibble of the unsigned long is
 * printed, so leading zeros are included.  Each digit is emitted through
 * __putstr() as a one-character string.
 */
void __puthex(unsigned long value)
{
	char digit_str[2] = { '0', '\0' };
	int shift = sizeof(value) * 8;

	while (shift > 0) {
		unsigned long nibble;

		shift -= 4;
		nibble = (value >> shift) & 0xf;

		digit_str[0] = (nibble < 0xA) ? '0' + nibble
					      : 'a' + (nibble - 0xA);

		__putstr(digit_str);
	}
}
241
/*
 * Report a fatal error and stop.
 *
 * Prints the message 'x' framed by blank lines, followed by the
 * " -- System halted" banner, then executes 'hlt' in an endless loop.
 * This function does not return.
 */
static void error(char *x)
{
	error_putstr("\n\n");
	error_putstr(x);
	error_putstr("\n\n -- System halted");

	for (;;)
		asm("hlt");
}
251
#ifdef CONFIG_X86_NEED_RELOCS
/*
 * Apply the relocation tables appended to the decompressed kernel.
 *
 * @output:     address the kernel image was placed at
 * @output_len: length of the decompressed image, including the
 *              relocation tables stored at its end
 *
 * Does nothing (beyond a debug message) when the image sits at
 * LOAD_PHYSICAL_ADDR.  Calls error(), which halts, if a relocation
 * target falls outside [output, output + output_len].
 */
static void handle_relocations(void *output, unsigned long output_len)
{
	int *reloc;
	unsigned long delta, map, ptr;
	unsigned long min_addr = (unsigned long)output;
	unsigned long max_addr = min_addr + output_len;

	/*
	 * Calculate the delta between where vmlinux was linked to load
	 * and where it was actually loaded.
	 */
	delta = min_addr - LOAD_PHYSICAL_ADDR;
	if (!delta) {
		debug_putstr("No relocation needed... ");
		return;
	}
	debug_putstr("Performing relocations... ");

	/*
	 * The kernel contains a table of relocation addresses. Those
	 * addresses have the final load address of the kernel in virtual
	 * memory. We are currently working in the self map. So we need to
	 * create an adjustment for kernel memory addresses to the self map.
	 * This will involve subtracting out the base address of the kernel.
	 */
	map = delta - __START_KERNEL_map;

	/*
	 * Process relocations: 32 bit relocations first then 64 bit after.
	 * Three sets of binary relocations are added to the end of the kernel
	 * before compression. Each relocation table entry is the kernel
	 * address of the location which needs to be updated stored as a
	 * 32-bit value which is sign extended to 64 bits.
	 *
	 * Format is:
	 *
	 * kernel bits...
	 * 0 - zero terminator for 64 bit relocations
	 * 64 bit relocation repeated
	 * 0 - zero terminator for inverse 32 bit relocations
	 * 32 bit inverse relocation repeated
	 * 0 - zero terminator for 32 bit relocations
	 * 32 bit relocation repeated
	 *
	 * So we work backwards from the end of the decompressed image.
	 */
	for (reloc = output + output_len - sizeof(*reloc); *reloc; reloc--) {
		/*
		 * Use 'long', as the loops below do: adding 'map' in an
		 * 'int' would truncate the result on 64-bit and yield a
		 * wrong target once the image is placed above 2G.
		 */
		long extended = *reloc;
		extended += map;

		ptr = (unsigned long)extended;
		if (ptr < min_addr || ptr > max_addr)
			error("32-bit relocation outside of kernel!\n");

		*(uint32_t *)ptr += delta;
	}
#ifdef CONFIG_X86_64
	/* 'reloc' rests on the previous terminator; step past it each time. */
	while (*--reloc) {
		long extended = *reloc;
		extended += map;

		ptr = (unsigned long)extended;
		if (ptr < min_addr || ptr > max_addr)
			error("inverse 32-bit relocation outside of kernel!\n");

		*(int32_t *)ptr -= delta;
	}
	for (reloc--; *reloc; reloc--) {
		long extended = *reloc;
		extended += map;

		ptr = (unsigned long)extended;
		if (ptr < min_addr || ptr > max_addr)
			error("64-bit relocation outside of kernel!\n");

		*(uint64_t *)ptr += delta;
	}
#endif
}
#else
/* Relocation support is not configured: nothing to do. */
static inline void handle_relocations(void *output, unsigned long output_len)
{ }
#endif
336
Ian Campbell099e1372008-02-13 20:54:58 +0000337static void parse_elf(void *output)
338{
339#ifdef CONFIG_X86_64
340 Elf64_Ehdr ehdr;
341 Elf64_Phdr *phdrs, *phdr;
342#else
343 Elf32_Ehdr ehdr;
344 Elf32_Phdr *phdrs, *phdr;
345#endif
346 void *dest;
347 int i;
348
349 memcpy(&ehdr, output, sizeof(ehdr));
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100350 if (ehdr.e_ident[EI_MAG0] != ELFMAG0 ||
Ian Campbell099e1372008-02-13 20:54:58 +0000351 ehdr.e_ident[EI_MAG1] != ELFMAG1 ||
352 ehdr.e_ident[EI_MAG2] != ELFMAG2 ||
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100353 ehdr.e_ident[EI_MAG3] != ELFMAG3) {
Ian Campbell099e1372008-02-13 20:54:58 +0000354 error("Kernel is not a valid ELF file");
355 return;
356 }
357
Joe Millenbache605a422012-07-19 18:04:37 -0700358 debug_putstr("Parsing ELF... ");
Ian Campbell099e1372008-02-13 20:54:58 +0000359
360 phdrs = malloc(sizeof(*phdrs) * ehdr.e_phnum);
361 if (!phdrs)
362 error("Failed to allocate space for phdrs");
363
364 memcpy(phdrs, output + ehdr.e_phoff, sizeof(*phdrs) * ehdr.e_phnum);
365
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100366 for (i = 0; i < ehdr.e_phnum; i++) {
Ian Campbell099e1372008-02-13 20:54:58 +0000367 phdr = &phdrs[i];
368
369 switch (phdr->p_type) {
370 case PT_LOAD:
371#ifdef CONFIG_RELOCATABLE
372 dest = output;
373 dest += (phdr->p_paddr - LOAD_PHYSICAL_ADDR);
374#else
Paolo Ciarrocchifd77c7c2008-02-21 00:19:10 +0100375 dest = (void *)(phdr->p_paddr);
Ian Campbell099e1372008-02-13 20:54:58 +0000376#endif
377 memcpy(dest,
378 output + phdr->p_offset,
379 phdr->p_filesz);
380 break;
381 default: /* Ignore other PT_* */ break;
382 }
383 }
Jesper Juhl5067cf52012-01-23 23:34:59 +0100384
385 free(phdrs);
Ian Campbell099e1372008-02-13 20:54:58 +0000386}
387
Kees Cookc0402882016-04-18 09:42:13 -0700388asmlinkage __visible void *extract_kernel(void *rmode, memptr heap,
Ingo Molnar1180e012008-02-21 05:03:48 +0100389 unsigned char *input_data,
390 unsigned long input_len,
Kees Cooka0215062013-07-08 09:15:17 -0700391 unsigned char *output,
Junjie Maoe6023362014-10-31 21:40:38 +0800392 unsigned long output_len,
393 unsigned long run_size)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700394{
Kees Cookf285f4a2015-01-15 16:51:46 -0800395 unsigned char *output_orig = output;
396
Kees Cook6655e0a2016-04-18 09:42:12 -0700397 /* Retain x86 boot parameters pointer passed from startup_32/64. */
398 boot_params = rmode;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700399
Kees Cook6655e0a2016-04-18 09:42:12 -0700400 /* Clear flags intended for solely in-kernel use. */
401 boot_params->hdr.loadflags &= ~KASLR_FLAG;
Borislav Petkov78cac482015-04-01 12:49:52 +0200402
Kees Cook6655e0a2016-04-18 09:42:12 -0700403 sanitize_boot_params(boot_params);
H. Peter Anvin5dcd14e2013-01-29 01:05:24 -0800404
Kees Cook6655e0a2016-04-18 09:42:12 -0700405 if (boot_params->screen_info.orig_video_mode == 7) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700406 vidmem = (char *) 0xb0000;
407 vidport = 0x3b4;
408 } else {
409 vidmem = (char *) 0xb8000;
410 vidport = 0x3d4;
411 }
412
Kees Cook6655e0a2016-04-18 09:42:12 -0700413 lines = boot_params->screen_info.orig_video_lines;
414 cols = boot_params->screen_info.orig_video_cols;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700415
Yinghai Lu8fee13a42010-08-02 16:21:22 -0700416 console_init();
Kees Cookc0402882016-04-18 09:42:13 -0700417 debug_putstr("early console in extract_kernel\n");
Yinghai Lu8fee13a42010-08-02 16:21:22 -0700418
Ian Campbell4c83d652008-01-30 13:33:38 +0100419 free_mem_ptr = heap; /* Heap */
Alexander van Heukelum7c539762008-04-08 12:54:30 +0200420 free_mem_end_ptr = heap + BOOT_HEAP_SIZE;
Eric W. Biederman968de4f2006-12-07 02:14:04 +0100421
Kees Cook79063a72015-07-06 16:06:20 -0700422 /* Report initial kernel position details. */
423 debug_putaddr(input_data);
424 debug_putaddr(input_len);
425 debug_putaddr(output);
426 debug_putaddr(output_len);
427 debug_putaddr(run_size);
428
Junjie Maoe6023362014-10-31 21:40:38 +0800429 /*
430 * The memory hole needed for the kernel is the larger of either
431 * the entire decompressed kernel plus relocation table, or the
432 * entire decompressed kernel plus .bss and .brk sections.
433 */
Yinghai Lu206f25a2016-04-18 09:42:11 -0700434 output = choose_kernel_location(input_data, input_len, output,
Junjie Maoe6023362014-10-31 21:40:38 +0800435 output_len > run_size ? output_len
436 : run_size);
Kees Cook8ab38202013-10-10 17:18:14 -0700437
438 /* Validate memory location choices. */
H. Peter Anvin7ed42a22009-05-12 11:33:08 -0700439 if ((unsigned long)output & (MIN_KERNEL_ALIGN - 1))
440 error("Destination address inappropriately aligned");
Ian Campbell778cb922008-01-30 13:33:38 +0100441#ifdef CONFIG_X86_64
H. Peter Anvin7ed42a22009-05-12 11:33:08 -0700442 if (heap > 0x3fffffffffffUL)
Ian Campbell778cb922008-01-30 13:33:38 +0100443 error("Destination address too large");
444#else
H. Peter Anvin147dd562010-12-16 19:11:09 -0800445 if (heap > ((-__PAGE_OFFSET-(128<<20)-1) & 0x7fffffff))
Eric W. Biederman968de4f2006-12-07 02:14:04 +0100446 error("Destination address too large");
Eric W. Biederman968de4f2006-12-07 02:14:04 +0100447#endif
H. Peter Anvin7ed42a22009-05-12 11:33:08 -0700448#ifndef CONFIG_RELOCATABLE
449 if ((unsigned long)output != LOAD_PHYSICAL_ADDR)
450 error("Wrong destination address");
Ian Campbell778cb922008-01-30 13:33:38 +0100451#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700452
Joe Millenbache605a422012-07-19 18:04:37 -0700453 debug_putstr("\nDecompressing Linux... ");
Yinghai Lu2d3862d2015-09-09 15:39:12 -0700454 __decompress(input_data, input_len, NULL, NULL, output, output_len,
455 NULL, error);
Ian Campbell099e1372008-02-13 20:54:58 +0000456 parse_elf(output);
Kees Cookf285f4a2015-01-15 16:51:46 -0800457 /*
458 * 32-bit always performs relocations. 64-bit relocations are only
459 * needed if kASLR has chosen a different load address.
460 */
461 if (!IS_ENABLED(CONFIG_X86_64) || output != output_orig)
462 handle_relocations(output, output_len);
Joe Millenbache605a422012-07-19 18:04:37 -0700463 debug_putstr("done.\nBooting the kernel.\n");
Kees Cook8ab38202013-10-10 17:18:14 -0700464 return output;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700465}