Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* |
Anton Ivanov | 2eb5f31 | 2015-11-02 16:16:37 +0000 | [diff] [blame] | 2 | * Copyright (C) 2015 Thomas Meyer (thomas@m3y3r.de) |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 3 | * Copyright (C) 2000 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 4 | * Licensed under the GPL |
| 5 | */ |
| 6 | |
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
#include <errno.h>
#include <limits.h>
#include <signal.h>
#include <string.h>
#include <sys/resource.h>
#include <as-layout.h>
#include <init.h>
#include <kern_util.h>
#include <os.h>
#include <um_malloc.h>
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 19 | |
/* NOTE(review): PGD_BOUND is not referenced in the visible part of this file */
#define PGD_BOUND (4 * 1024 * 1024)
/* Ceiling applied to the soft RLIMIT_STACK value by set_stklim() */
#define STACKSIZE (8 * 1024 * 1024)
/* NOTE(review): THREAD_NAME_LEN is not referenced in the visible part of this file */
#define THREAD_NAME_LEN (256)

/*
 * Defined here but neither read nor written in the visible part of this
 * file - presumably filled in by the ELF auxiliary vector scan; confirm
 * against scan_elf_aux().
 */
long elf_aux_hwcap;
| 25 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 26 | static void set_stklim(void) |
| 27 | { |
| 28 | struct rlimit lim; |
| 29 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 30 | if (getrlimit(RLIMIT_STACK, &lim) < 0) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 31 | perror("getrlimit"); |
| 32 | exit(1); |
| 33 | } |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 34 | if ((lim.rlim_cur == RLIM_INFINITY) || (lim.rlim_cur > STACKSIZE)) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 35 | lim.rlim_cur = STACKSIZE; |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 36 | if (setrlimit(RLIMIT_STACK, &lim) < 0) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 37 | perror("setrlimit"); |
| 38 | exit(1); |
| 39 | } |
| 40 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 41 | } |
| 42 | |
| 43 | static __init void do_uml_initcalls(void) |
| 44 | { |
| 45 | initcall_t *call; |
| 46 | |
| 47 | call = &__uml_initcall_start; |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 48 | while (call < &__uml_initcall_end) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 49 | (*call)(); |
| 50 | call++; |
| 51 | } |
| 52 | } |
| 53 | |
/*
 * Signal handler installed by install_fatal_handler(): runs uml_cleanup()
 * and then terminates the process with exit status 1.  The signal number
 * is accepted only to match the handler prototype and is not used.
 */
static void last_ditch_exit(int sig)
{
	uml_cleanup();
	exit(1);
}
| 59 | |
Jeff Dike | 4b84c69 | 2006-09-25 23:33:04 -0700 | [diff] [blame] | 60 | static void install_fatal_handler(int sig) |
| 61 | { |
| 62 | struct sigaction action; |
| 63 | |
| 64 | /* All signals are enabled in this handler ... */ |
| 65 | sigemptyset(&action.sa_mask); |
| 66 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 67 | /* |
| 68 | * ... including the signal being handled, plus we want the |
Jeff Dike | 4b84c69 | 2006-09-25 23:33:04 -0700 | [diff] [blame] | 69 | * handler reset to the default behavior, so that if an exit |
| 70 | * handler is hanging for some reason, the UML will just die |
| 71 | * after this signal is sent a second time. |
| 72 | */ |
| 73 | action.sa_flags = SA_RESETHAND | SA_NODEFER; |
| 74 | action.sa_restorer = NULL; |
| 75 | action.sa_handler = last_ditch_exit; |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 76 | if (sigaction(sig, &action, NULL) < 0) { |
Jeff Dike | 4b84c69 | 2006-09-25 23:33:04 -0700 | [diff] [blame] | 77 | printf("failed to install handler for signal %d - errno = %d\n", |
WANG Cong | c9a3072 | 2008-02-04 22:30:35 -0800 | [diff] [blame] | 78 | sig, errno); |
Jeff Dike | 4b84c69 | 2006-09-25 23:33:04 -0700 | [diff] [blame] | 79 | exit(1); |
| 80 | } |
| 81 | } |
| 82 | |
Richard Weinberger | 0ce451a | 2011-05-24 17:13:00 -0700 | [diff] [blame] | 83 | #define UML_LIB_PATH ":" OS_LIB_PATH "/uml" |
Mattia Dongili | cb98cdc | 2006-05-01 12:16:01 -0700 | [diff] [blame] | 84 | |
| 85 | static void setup_env_path(void) |
| 86 | { |
| 87 | char *new_path = NULL; |
| 88 | char *old_path = NULL; |
| 89 | int path_len = 0; |
| 90 | |
| 91 | old_path = getenv("PATH"); |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 92 | /* |
| 93 | * if no PATH variable is set or it has an empty value |
Mattia Dongili | cb98cdc | 2006-05-01 12:16:01 -0700 | [diff] [blame] | 94 | * just use the default + /usr/lib/uml |
| 95 | */ |
| 96 | if (!old_path || (path_len = strlen(old_path)) == 0) { |
WANG Cong | c9a3072 | 2008-02-04 22:30:35 -0800 | [diff] [blame] | 97 | if (putenv("PATH=:/bin:/usr/bin/" UML_LIB_PATH)) |
| 98 | perror("couldn't putenv"); |
Mattia Dongili | cb98cdc | 2006-05-01 12:16:01 -0700 | [diff] [blame] | 99 | return; |
| 100 | } |
| 101 | |
| 102 | /* append /usr/lib/uml to the existing path */ |
| 103 | path_len += strlen("PATH=" UML_LIB_PATH) + 1; |
| 104 | new_path = malloc(path_len); |
| 105 | if (!new_path) { |
WANG Cong | c9a3072 | 2008-02-04 22:30:35 -0800 | [diff] [blame] | 106 | perror("couldn't malloc to set a new PATH"); |
Mattia Dongili | cb98cdc | 2006-05-01 12:16:01 -0700 | [diff] [blame] | 107 | return; |
| 108 | } |
| 109 | snprintf(new_path, path_len, "PATH=%s" UML_LIB_PATH, old_path); |
WANG Cong | c9a3072 | 2008-02-04 22:30:35 -0800 | [diff] [blame] | 110 | if (putenv(new_path)) { |
| 111 | perror("couldn't putenv to set a new PATH"); |
| 112 | free(new_path); |
| 113 | } |
Mattia Dongili | cb98cdc | 2006-05-01 12:16:01 -0700 | [diff] [blame] | 114 | } |
| 115 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 116 | extern void scan_elf_aux( char **envp); |
| 117 | |
Jeff Dike | 36e4546 | 2007-05-06 14:51:11 -0700 | [diff] [blame] | 118 | int __init main(int argc, char **argv, char **envp) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 119 | { |
| 120 | char **new_argv; |
Jeff Dike | 92515da | 2005-05-28 15:51:56 -0700 | [diff] [blame] | 121 | int ret, i, err; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 122 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 123 | set_stklim(); |
| 124 | |
Mattia Dongili | cb98cdc | 2006-05-01 12:16:01 -0700 | [diff] [blame] | 125 | setup_env_path(); |
| 126 | |
Richard Weinberger | 2501272 | 2013-08-18 13:30:09 +0200 | [diff] [blame] | 127 | setsid(); |
| 128 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 129 | new_argv = malloc((argc + 1) * sizeof(char *)); |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 130 | if (new_argv == NULL) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 131 | perror("Mallocing argv"); |
| 132 | exit(1); |
| 133 | } |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 134 | for (i = 0; i < argc; i++) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 135 | new_argv[i] = strdup(argv[i]); |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 136 | if (new_argv[i] == NULL) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 137 | perror("Mallocing an arg"); |
| 138 | exit(1); |
| 139 | } |
| 140 | } |
| 141 | new_argv[argc] = NULL; |
| 142 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 143 | /* |
| 144 | * Allow these signals to bring down a UML if all other |
Jeff Dike | 4b84c69 | 2006-09-25 23:33:04 -0700 | [diff] [blame] | 145 | * methods of control fail. |
| 146 | */ |
| 147 | install_fatal_handler(SIGINT); |
| 148 | install_fatal_handler(SIGTERM); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 149 | |
Richard Weinberger | b743ac5 | 2011-07-25 17:12:52 -0700 | [diff] [blame] | 150 | #ifdef CONFIG_ARCH_REUSE_HOST_VSYSCALL_AREA |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 151 | scan_elf_aux(envp); |
Richard Weinberger | b743ac5 | 2011-07-25 17:12:52 -0700 | [diff] [blame] | 152 | #endif |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 153 | |
| 154 | do_uml_initcalls(); |
Anton Ivanov | 9fcb663 | 2014-03-07 18:37:46 +0000 | [diff] [blame] | 155 | change_sig(SIGPIPE, 0); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 156 | ret = linux_main(argc, argv); |
| 157 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 158 | /* |
| 159 | * Disable SIGPROF - I have no idea why libc doesn't do this or turn |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 160 | * off the profiling time, but UML dies with a SIGPROF just before |
| 161 | * exiting when profiling is active. |
| 162 | */ |
| 163 | change_sig(SIGPROF, 0); |
| 164 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 165 | /* |
| 166 | * This signal stuff used to be in the reboot case. However, |
Anton Ivanov | 2eb5f31 | 2015-11-02 16:16:37 +0000 | [diff] [blame] | 167 | * sometimes a timer signal can come in when we're halting (reproducably |
Jeff Dike | 52c653b | 2005-11-07 00:58:50 -0800 | [diff] [blame] | 168 | * when writing out gcov information, presumably because that takes |
| 169 | * some time) and cause a segfault. |
| 170 | */ |
Jeff Dike | 92515da | 2005-05-28 15:51:56 -0700 | [diff] [blame] | 171 | |
Anton Ivanov | 2eb5f31 | 2015-11-02 16:16:37 +0000 | [diff] [blame] | 172 | /* stop timers and set timer signal to be ignored */ |
| 173 | os_timer_disable(); |
Jeff Dike | 92515da | 2005-05-28 15:51:56 -0700 | [diff] [blame] | 174 | |
Jeff Dike | 52c653b | 2005-11-07 00:58:50 -0800 | [diff] [blame] | 175 | /* disable SIGIO for the fds and set SIGIO to be ignored */ |
| 176 | err = deactivate_all_fds(); |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 177 | if (err) |
Jeff Dike | 52c653b | 2005-11-07 00:58:50 -0800 | [diff] [blame] | 178 | printf("deactivate_all_fds failed, errno = %d\n", -err); |
Jeff Dike | 92515da | 2005-05-28 15:51:56 -0700 | [diff] [blame] | 179 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 180 | /* |
| 181 | * Let any pending signals fire now. This ensures |
Jeff Dike | 52c653b | 2005-11-07 00:58:50 -0800 | [diff] [blame] | 182 | * that they won't be delivered after the exec, when |
| 183 | * they are definitely not expected. |
| 184 | */ |
| 185 | unblock_signals(); |
Jeff Dike | 92515da | 2005-05-28 15:51:56 -0700 | [diff] [blame] | 186 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 187 | /* Reboot */ |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 188 | if (ret) { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 189 | printf("\n"); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 190 | execvp(new_argv[0], new_argv); |
| 191 | perror("Failed to exec kernel"); |
| 192 | ret = 1; |
| 193 | } |
| 194 | printf("\n"); |
Jeff Dike | a5ed1ff | 2007-05-06 14:50:58 -0700 | [diff] [blame] | 195 | return uml_exitcode; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 196 | } |
| 197 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 198 | extern void *__real_malloc(int); |
| 199 | |
| 200 | void *__wrap_malloc(int size) |
| 201 | { |
| 202 | void *ret; |
| 203 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 204 | if (!kmalloc_ok) |
Jeff Dike | a5ed1ff | 2007-05-06 14:50:58 -0700 | [diff] [blame] | 205 | return __real_malloc(size); |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 206 | else if (size <= UM_KERN_PAGE_SIZE) |
Jeff Dike | c539ab7 | 2007-06-16 10:16:09 -0700 | [diff] [blame] | 207 | /* finding contiguous pages can be hard*/ |
Jeff Dike | 43f5b30 | 2008-05-12 14:01:52 -0700 | [diff] [blame] | 208 | ret = uml_kmalloc(size, UM_GFP_KERNEL); |
Jeff Dike | e4c4bf9 | 2007-07-15 23:38:56 -0700 | [diff] [blame] | 209 | else ret = vmalloc(size); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 210 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 211 | /* |
| 212 | * glibc people insist that if malloc fails, errno should be |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 213 | * set by malloc as well. So we do. |
| 214 | */ |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 215 | if (ret == NULL) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 216 | errno = ENOMEM; |
| 217 | |
Jeff Dike | a5ed1ff | 2007-05-06 14:50:58 -0700 | [diff] [blame] | 218 | return ret; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 219 | } |
| 220 | |
/*
 * calloc() replacement built on top of __wrap_malloc().
 *
 * @n:    number of elements
 * @size: size of one element in bytes
 *
 * Returns a zero-filled buffer of n * size bytes, or NULL on failure.
 * A negative argument, or a product that does not fit in an int, is
 * rejected with errno set to ENOMEM instead of being multiplied: the
 * signed multiplication would otherwise overflow (undefined behaviour)
 * and could produce a buffer smaller than the caller asked for.
 */
void *__wrap_calloc(int n, int size)
{
	void *ptr;
	int total;

	if (n < 0 || size < 0 || (size != 0 && n > INT_MAX / size)) {
		errno = ENOMEM;
		return NULL;
	}
	total = n * size;

	ptr = __wrap_malloc(total);
	if (ptr == NULL)
		return NULL;

	memset(ptr, 0, total);
	return ptr;
}
| 230 | |
| 231 | extern void __real_free(void *); |
| 232 | |
| 233 | extern unsigned long high_physmem; |
| 234 | |
| 235 | void __wrap_free(void *ptr) |
| 236 | { |
| 237 | unsigned long addr = (unsigned long) ptr; |
| 238 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 239 | /* |
| 240 | * We need to know how the allocation happened, so it can be correctly |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 241 | * freed. This is done by seeing what region of memory the pointer is |
| 242 | * in - |
| 243 | * physical memory - kmalloc/kfree |
| 244 | * kernel virtual memory - vmalloc/vfree |
| 245 | * anywhere else - malloc/free |
| 246 | * If kmalloc is not yet possible, then either high_physmem and/or |
| 247 | * end_vm are still 0 (as at startup), in which case we call free, or |
| 248 | * we have set them, but anyway addr has not been allocated from those |
| 249 | * areas. So, in both cases __real_free is called. |
| 250 | * |
| 251 | * CAN_KMALLOC is checked because it would be bad to free a buffer |
| 252 | * with kmalloc/vmalloc after they have been turned off during |
| 253 | * shutdown. |
| 254 | * XXX: However, we sometimes shutdown CAN_KMALLOC temporarily, so |
| 255 | * there is a possibility for memory leaks. |
| 256 | */ |
| 257 | |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 258 | if ((addr >= uml_physmem) && (addr < high_physmem)) { |
| 259 | if (kmalloc_ok) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 260 | kfree(ptr); |
| 261 | } |
Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 262 | else if ((addr >= start_vm) && (addr < end_vm)) { |
| 263 | if (kmalloc_ok) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 264 | vfree(ptr); |
| 265 | } |
| 266 | else __real_free(ptr); |
| 267 | } |