Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 1 | /* |
| 2 | * Set up the VMAs to tell the VM about the vDSO. |
| 3 | * Copyright 2007 Andi Kleen, SUSE Labs. |
| 4 | * Subject to the GPL, v.2 |
| 5 | */ |
| 6 | #include <linux/mm.h> |
Alexey Dobriyan | 4e950f6 | 2007-07-30 02:36:13 +0400 | [diff] [blame] | 7 | #include <linux/err.h> |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 8 | #include <linux/sched.h> |
Tejun Heo | 5a0e3ad | 2010-03-24 17:04:11 +0900 | [diff] [blame] | 9 | #include <linux/slab.h> |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 10 | #include <linux/init.h> |
| 11 | #include <linux/random.h> |
Jaswinder Singh Rajput | 3fa89ca | 2009-04-12 20:37:25 +0530 | [diff] [blame] | 12 | #include <linux/elf.h> |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 13 | #include <asm/vsyscall.h> |
| 14 | #include <asm/vgtod.h> |
| 15 | #include <asm/proto.h> |
Roland McGrath | 7f3646a | 2008-01-30 13:30:41 +0100 | [diff] [blame] | 16 | #include <asm/vdso.h> |
Andy Lutomirski | aafade2 | 2011-07-21 15:47:10 -0400 | [diff] [blame] | 17 | #include <asm/page.h> |
Roland McGrath | 7f3646a | 2008-01-30 13:30:41 +0100 | [diff] [blame] | 18 | |
OGAWA Hirofumi | e6b0ede | 2008-05-12 15:43:38 +0200 | [diff] [blame] | 19 | unsigned int __read_mostly vdso_enabled = 1; |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 20 | |
Roland McGrath | 7f3646a | 2008-01-30 13:30:41 +0100 | [diff] [blame] | 21 | extern char vdso_start[], vdso_end[]; |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 22 | extern unsigned short vdso_sync_cpuid; |
| 23 | |
Andy Lutomirski | aafade2 | 2011-07-21 15:47:10 -0400 | [diff] [blame] | 24 | extern struct page *vdso_pages[]; |
Jan Beulich | 369c992 | 2008-07-18 13:37:53 +0100 | [diff] [blame] | 25 | static unsigned vdso_size; |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 26 | |
#ifdef CONFIG_X86_X32_ABI
/* First byte and one-past-last byte of the x32 vDSO image. */
extern char vdsox32_start[], vdsox32_end[];
/* One struct page pointer per page of the x32 vDSO image. */
extern struct page *vdsox32_pages[];
/* Size of the x32 vDSO image in bytes, rounded up to whole pages. */
static unsigned vdsox32_size;

/*
 * Apply instruction alternatives to the x32 vDSO image.
 *
 * @vdso: start of the image, interpreted as a 32-bit ELF file
 * @len:  size of the image in bytes
 *
 * The image must be at least as large as an ELF header and must start
 * with the ELF magic; either violation triggers BUG_ON().  The section
 * header table is then searched by name for ".altinstructions" and the
 * contents of that section are handed to apply_alternatives().  If no
 * such section exists a warning is logged and nothing is patched.
 */
static void __init patch_vdsox32(void *vdso, size_t len)
{
	Elf32_Ehdr *ehdr = vdso;
	Elf32_Shdr *shdr_table;
	Elf32_Shdr *alt_shdr = NULL;
	char *shstrtab;
	void *alt_begin;
	int idx;

	BUG_ON(len < sizeof(Elf32_Ehdr));
	BUG_ON(memcmp(ehdr->e_ident, ELFMAG, SELFMAG) != 0);

	/* Locate the section header table and the section name strings. */
	shdr_table = (void *)ehdr + ehdr->e_shoff;
	shstrtab = (void *)ehdr + shdr_table[ehdr->e_shstrndx].sh_offset;

	/* The scan starts at index 1; entry 0 is never examined. */
	for (idx = 1; idx < ehdr->e_shnum; idx++) {
		const char *sec_name = shstrtab + shdr_table[idx].sh_name;

		if (strcmp(sec_name, ".altinstructions") == 0) {
			alt_shdr = &shdr_table[idx];
			break;
		}
	}

	if (!alt_shdr) {
		/* If we get here, it's probably a bug. */
		pr_warning("patch_vdsox32: .altinstructions not found\n");
		return;  /* nothing to patch */
	}

	alt_begin = (void *)ehdr + alt_shdr->sh_offset;
	apply_alternatives(alt_begin, alt_begin + alt_shdr->sh_size);
}
#endif
| 63 | |
| 64 | static void __init patch_vdso64(void *vdso, size_t len) |
Andy Lutomirski | 1b3f2a7 | 2011-07-13 09:24:11 -0400 | [diff] [blame] | 65 | { |
| 66 | Elf64_Ehdr *hdr = vdso; |
| 67 | Elf64_Shdr *sechdrs, *alt_sec = 0; |
| 68 | char *secstrings; |
| 69 | void *alt_data; |
| 70 | int i; |
| 71 | |
| 72 | BUG_ON(len < sizeof(Elf64_Ehdr)); |
| 73 | BUG_ON(memcmp(hdr->e_ident, ELFMAG, SELFMAG) != 0); |
| 74 | |
| 75 | sechdrs = (void *)hdr + hdr->e_shoff; |
| 76 | secstrings = (void *)hdr + sechdrs[hdr->e_shstrndx].sh_offset; |
| 77 | |
| 78 | for (i = 1; i < hdr->e_shnum; i++) { |
| 79 | Elf64_Shdr *shdr = &sechdrs[i]; |
| 80 | if (!strcmp(secstrings + shdr->sh_name, ".altinstructions")) { |
| 81 | alt_sec = shdr; |
| 82 | goto found; |
| 83 | } |
| 84 | } |
| 85 | |
| 86 | /* If we get here, it's probably a bug. */ |
H. J. Lu | 1a21d4e | 2012-02-19 11:38:06 -0800 | [diff] [blame] | 87 | pr_warning("patch_vdso64: .altinstructions not found\n"); |
Andy Lutomirski | 1b3f2a7 | 2011-07-13 09:24:11 -0400 | [diff] [blame] | 88 | return; /* nothing to patch */ |
| 89 | |
| 90 | found: |
| 91 | alt_data = (void *)hdr + alt_sec->sh_offset; |
| 92 | apply_alternatives(alt_data, alt_data + alt_sec->sh_size); |
| 93 | } |
| 94 | |
Andy Lutomirski | aafade2 | 2011-07-21 15:47:10 -0400 | [diff] [blame] | 95 | static int __init init_vdso(void) |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 96 | { |
| 97 | int npages = (vdso_end - vdso_start + PAGE_SIZE - 1) / PAGE_SIZE; |
| 98 | int i; |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 99 | |
H. J. Lu | 1a21d4e | 2012-02-19 11:38:06 -0800 | [diff] [blame] | 100 | patch_vdso64(vdso_start, vdso_end - vdso_start); |
Andy Lutomirski | 1b3f2a7 | 2011-07-13 09:24:11 -0400 | [diff] [blame] | 101 | |
Jan Beulich | 369c992 | 2008-07-18 13:37:53 +0100 | [diff] [blame] | 102 | vdso_size = npages << PAGE_SHIFT; |
Andy Lutomirski | aafade2 | 2011-07-21 15:47:10 -0400 | [diff] [blame] | 103 | for (i = 0; i < npages; i++) |
| 104 | vdso_pages[i] = virt_to_page(vdso_start + i*PAGE_SIZE); |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 105 | |
H. J. Lu | 1a21d4e | 2012-02-19 11:38:06 -0800 | [diff] [blame] | 106 | #ifdef CONFIG_X86_X32_ABI |
| 107 | patch_vdsox32(vdsox32_start, vdsox32_end - vdsox32_start); |
| 108 | npages = (vdsox32_end - vdsox32_start + PAGE_SIZE - 1) / PAGE_SIZE; |
| 109 | vdsox32_size = npages << PAGE_SHIFT; |
| 110 | for (i = 0; i < npages; i++) |
| 111 | vdsox32_pages[i] = virt_to_page(vdsox32_start + i*PAGE_SIZE); |
| 112 | #endif |
| 113 | |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 114 | return 0; |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 115 | } |
Andy Lutomirski | aafade2 | 2011-07-21 15:47:10 -0400 | [diff] [blame] | 116 | subsys_initcall(init_vdso); |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 117 | |
| 118 | struct linux_binprm; |
| 119 | |
| 120 | /* Put the vdso above the (randomized) stack with another randomized offset. |
| 121 | This way there is no hole in the middle of address space. |
| 122 | To save memory make sure it is still in the same PTE as the stack top. |
| 123 | This doesn't give that many random bits */ |
| 124 | static unsigned long vdso_addr(unsigned long start, unsigned len) |
| 125 | { |
| 126 | unsigned long addr, end; |
| 127 | unsigned offset; |
| 128 | end = (start + PMD_SIZE - 1) & PMD_MASK; |
Ingo Molnar | d951734 | 2009-02-20 23:32:28 +0100 | [diff] [blame] | 129 | if (end >= TASK_SIZE_MAX) |
| 130 | end = TASK_SIZE_MAX; |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 131 | end -= len; |
| 132 | /* This loses some more bits than a modulo, but is cheaper */ |
| 133 | offset = get_random_int() & (PTRS_PER_PTE - 1); |
| 134 | addr = start + (offset << PAGE_SHIFT); |
| 135 | if (addr >= end) |
| 136 | addr = end; |
Borislav Petkov | dfb09f9 | 2011-08-05 15:15:08 +0200 | [diff] [blame] | 137 | |
| 138 | /* |
| 139 | * page-align it here so that get_unmapped_area doesn't |
| 140 | * align it wrongfully again to the next page. addr can come in 4K |
| 141 | * unaligned here as a result of stack start randomization. |
| 142 | */ |
| 143 | addr = PAGE_ALIGN(addr); |
Michel Lespinasse | f9902472 | 2012-12-11 16:01:52 -0800 | [diff] [blame] | 144 | addr = align_vdso_addr(addr); |
Borislav Petkov | dfb09f9 | 2011-08-05 15:15:08 +0200 | [diff] [blame] | 145 | |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 146 | return addr; |
| 147 | } |
| 148 | |
| 149 | /* Setup a VMA at program startup for the vsyscall page. |
| 150 | Not called for compat tasks */ |
H. J. Lu | 1a21d4e | 2012-02-19 11:38:06 -0800 | [diff] [blame] | 151 | static int setup_additional_pages(struct linux_binprm *bprm, |
| 152 | int uses_interp, |
| 153 | struct page **pages, |
| 154 | unsigned size) |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 155 | { |
| 156 | struct mm_struct *mm = current->mm; |
| 157 | unsigned long addr; |
| 158 | int ret; |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 159 | |
| 160 | if (!vdso_enabled) |
| 161 | return 0; |
| 162 | |
| 163 | down_write(&mm->mmap_sem); |
H. J. Lu | 1a21d4e | 2012-02-19 11:38:06 -0800 | [diff] [blame] | 164 | addr = vdso_addr(mm->start_stack, size); |
| 165 | addr = get_unmapped_area(NULL, addr, size, 0, 0); |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 166 | if (IS_ERR_VALUE(addr)) { |
| 167 | ret = addr; |
| 168 | goto up_fail; |
| 169 | } |
| 170 | |
Peter Zijlstra | f7b6eb3 | 2009-06-05 14:04:51 +0200 | [diff] [blame] | 171 | current->mm->context.vdso = (void *)addr; |
| 172 | |
H. J. Lu | 1a21d4e | 2012-02-19 11:38:06 -0800 | [diff] [blame] | 173 | ret = install_special_mapping(mm, addr, size, |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 174 | VM_READ|VM_EXEC| |
Jason Baron | 909af76 | 2012-03-23 15:02:51 -0700 | [diff] [blame] | 175 | VM_MAYREAD|VM_MAYWRITE|VM_MAYEXEC, |
H. J. Lu | 1a21d4e | 2012-02-19 11:38:06 -0800 | [diff] [blame] | 176 | pages); |
Peter Zijlstra | f7b6eb3 | 2009-06-05 14:04:51 +0200 | [diff] [blame] | 177 | if (ret) { |
| 178 | current->mm->context.vdso = NULL; |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 179 | goto up_fail; |
Peter Zijlstra | f7b6eb3 | 2009-06-05 14:04:51 +0200 | [diff] [blame] | 180 | } |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 181 | |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 182 | up_fail: |
| 183 | up_write(&mm->mmap_sem); |
| 184 | return ret; |
| 185 | } |
| 186 | |
H. J. Lu | 1a21d4e | 2012-02-19 11:38:06 -0800 | [diff] [blame] | 187 | int arch_setup_additional_pages(struct linux_binprm *bprm, int uses_interp) |
| 188 | { |
H. Peter Anvin | 22e842d | 2012-02-21 14:32:19 -0800 | [diff] [blame] | 189 | return setup_additional_pages(bprm, uses_interp, vdso_pages, |
| 190 | vdso_size); |
H. J. Lu | 1a21d4e | 2012-02-19 11:38:06 -0800 | [diff] [blame] | 191 | } |
| 192 | |
#ifdef CONFIG_X86_X32_ABI
/*
 * Map the x32 vDSO image into the current process.
 *
 * Forwards to setup_additional_pages() with the x32 page array and size,
 * and returns its result unchanged.
 */
int x32_setup_additional_pages(struct linux_binprm *bprm, int uses_interp)
{
	int err;

	err = setup_additional_pages(bprm, uses_interp, vdsox32_pages,
				     vdsox32_size);
	return err;
}
#endif
| 200 | |
Andi Kleen | 2aae950 | 2007-07-21 17:10:01 +0200 | [diff] [blame] | 201 | static __init int vdso_setup(char *s) |
| 202 | { |
| 203 | vdso_enabled = simple_strtoul(s, NULL, 0); |
| 204 | return 0; |
| 205 | } |
| 206 | __setup("vdso=", vdso_setup); |