blob: e299ee5a753d7b1adddad393e926a4609509cfdb [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Copyright (C) 2001, 2002 Jeff Dike (jdike@karaya.com)
3 * Licensed under the GPL
4 */
5
Bodo Stroesser858259c2005-11-07 00:58:55 -08006#include "linux/stddef.h"
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -07007#include "linux/sched.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -07008#include "linux/slab.h"
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -07009#include "linux/types.h"
Bodo Stroesser858259c2005-11-07 00:58:55 -080010#include "linux/errno.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070011#include "asm/uaccess.h"
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070012#include "asm/smp.h"
13#include "asm/ldt.h"
Bodo Stroesser858259c2005-11-07 00:58:55 -080014#include "asm/unistd.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070015#include "choose-mode.h"
16#include "kern.h"
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070017#include "mode_kern.h"
Bodo Stroesser12919aa2006-01-18 17:42:39 -080018#include "os.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070019
Linus Torvalds1da177e2005-04-16 15:20:36 -070020extern int modify_ldt(int func, void *ptr, unsigned long bytecount);
21
Bodo Stroesser858259c2005-11-07 00:58:55 -080022#ifdef CONFIG_MODE_TT
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070023
Bodo Stroesser858259c2005-11-07 00:58:55 -080024static long do_modify_ldt_tt(int func, void __user *ptr,
25 unsigned long bytecount)
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070026{
27 struct user_desc info;
28 int res = 0;
29 void *buf = NULL;
30 void *p = NULL; /* What we pass to host. */
Linus Torvalds1da177e2005-04-16 15:20:36 -070031
32 switch(func){
33 case 1:
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070034 case 0x11: /* write_ldt */
35 /* Do this check now to avoid overflows. */
36 if (bytecount != sizeof(struct user_desc)) {
37 res = -EINVAL;
38 goto out;
39 }
Linus Torvalds1da177e2005-04-16 15:20:36 -070040
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070041 if(copy_from_user(&info, ptr, sizeof(info))) {
42 res = -EFAULT;
43 goto out;
44 }
45
46 p = &info;
47 break;
48 case 0:
49 case 2: /* read_ldt */
50
51 /* The use of info avoids kmalloc on the write case, not on the
52 * read one. */
53 buf = kmalloc(bytecount, GFP_KERNEL);
54 if (!buf) {
55 res = -ENOMEM;
56 goto out;
57 }
58 p = buf;
Paolo 'Blaisorblade' Giarrusso36decba2005-09-21 18:38:57 +020059 break;
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070060 default:
61 res = -ENOSYS;
Linus Torvalds1da177e2005-04-16 15:20:36 -070062 goto out;
63 }
64
Bodo Stroesser858259c2005-11-07 00:58:55 -080065 res = modify_ldt(func, p, bytecount);
Linus Torvalds1da177e2005-04-16 15:20:36 -070066 if(res < 0)
67 goto out;
68
69 switch(func){
70 case 0:
71 case 2:
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070072 /* Modify_ldt was for reading and returned the number of read
73 * bytes.*/
74 if(copy_to_user(ptr, p, res))
Linus Torvalds1da177e2005-04-16 15:20:36 -070075 res = -EFAULT;
Linus Torvalds1da177e2005-04-16 15:20:36 -070076 break;
77 }
78
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070079out:
Linus Torvalds1da177e2005-04-16 15:20:36 -070080 kfree(buf);
Paolo 'Blaisorblade' Giarrusso2e5e5592005-07-14 00:33:37 -070081 return res;
Linus Torvalds1da177e2005-04-16 15:20:36 -070082}
Bodo Stroesser858259c2005-11-07 00:58:55 -080083
84#endif
85
86#ifdef CONFIG_MODE_SKAS
87
88#include "skas.h"
89#include "skas_ptrace.h"
90#include "asm/mmu_context.h"
Pekka Enberge8730ea2006-02-01 03:05:06 -080091#include "proc_mm.h"
Bodo Stroesser858259c2005-11-07 00:58:55 -080092
93long write_ldt_entry(struct mm_id * mm_idp, int func, struct user_desc * desc,
94 void **addr, int done)
95{
96 long res;
97
98 if(proc_mm){
99 /* This is a special handling for the case, that the mm to
100 * modify isn't current->active_mm.
101 * If this is called directly by modify_ldt,
102 * (current->active_mm->context.skas.u == mm_idp)
103 * will be true. So no call to switch_mm_skas(mm_idp) is done.
104 * If this is called in case of init_new_ldt or PTRACE_LDT,
105 * mm_idp won't belong to current->active_mm, but child->mm.
106 * So we need to switch child's mm into our userspace, then
107 * later switch back.
108 *
Paolo 'Blaisorblade' Giarrusso07f4e2c2006-02-24 13:03:55 -0800109 * Note: I'm unsure: should interrupts be disabled here?
Bodo Stroesser858259c2005-11-07 00:58:55 -0800110 */
111 if(!current->active_mm || current->active_mm == &init_mm ||
112 mm_idp != &current->active_mm->context.skas.id)
113 switch_mm_skas(mm_idp);
114 }
115
116 if(ptrace_ldt) {
117 struct ptrace_ldt ldt_op = (struct ptrace_ldt) {
118 .func = func,
119 .ptr = desc,
120 .bytecount = sizeof(*desc)};
121 u32 cpu;
122 int pid;
123
124 if(!proc_mm)
125 pid = mm_idp->u.pid;
126 else {
127 cpu = get_cpu();
128 pid = userspace_pid[cpu];
129 }
130
Paolo 'Blaisorblade' Giarrusso07f4e2c2006-02-24 13:03:55 -0800131 res = os_ptrace_ldt(pid, 0, (unsigned long) &ldt_op);
Bodo Stroesser858259c2005-11-07 00:58:55 -0800132
133 if(proc_mm)
134 put_cpu();
135 }
136 else {
137 void *stub_addr;
138 res = syscall_stub_data(mm_idp, (unsigned long *)desc,
139 (sizeof(*desc) + sizeof(long) - 1) &
140 ~(sizeof(long) - 1),
141 addr, &stub_addr);
142 if(!res){
143 unsigned long args[] = { func,
144 (unsigned long)stub_addr,
145 sizeof(*desc),
146 0, 0, 0 };
147 res = run_syscall_stub(mm_idp, __NR_modify_ldt, args,
148 0, addr, done);
149 }
150 }
151
152 if(proc_mm){
153 /* This is the second part of special handling, that makes
154 * PTRACE_LDT possible to implement.
155 */
156 if(current->active_mm && current->active_mm != &init_mm &&
157 mm_idp != &current->active_mm->context.skas.id)
158 switch_mm_skas(&current->active_mm->context.skas.id);
159 }
160
161 return res;
162}
163
164static long read_ldt_from_host(void __user * ptr, unsigned long bytecount)
165{
166 int res, n;
167 struct ptrace_ldt ptrace_ldt = (struct ptrace_ldt) {
168 .func = 0,
169 .bytecount = bytecount,
170 .ptr = (void *)kmalloc(bytecount, GFP_KERNEL)};
171 u32 cpu;
172
173 if(ptrace_ldt.ptr == NULL)
174 return -ENOMEM;
175
176 /* This is called from sys_modify_ldt only, so userspace_pid gives
177 * us the right number
178 */
179
180 cpu = get_cpu();
Paolo 'Blaisorblade' Giarrusso07f4e2c2006-02-24 13:03:55 -0800181 res = os_ptrace_ldt(userspace_pid[cpu], 0, (unsigned long) &ptrace_ldt);
Bodo Stroesser858259c2005-11-07 00:58:55 -0800182 put_cpu();
183 if(res < 0)
184 goto out;
185
186 n = copy_to_user(ptr, ptrace_ldt.ptr, res);
187 if(n != 0)
188 res = -EFAULT;
189
190 out:
191 kfree(ptrace_ldt.ptr);
192
193 return res;
194}
195
/*
 * In skas mode, we hold our own ldt data in UML.
 * Thus, the code implementing do_modify_ldt_skas
 * is very similar to (and mostly stolen from) sys_modify_ldt
 * in arch/i386/kernel/ldt.c
 * The routines copied and modified in part are:
 * - read_ldt
 * - read_default_ldt
 * - write_ldt
 * - do_modify_ldt_skas (derived from sys_modify_ldt)
 */
207
208static int read_ldt(void __user * ptr, unsigned long bytecount)
209{
210 int i, err = 0;
211 unsigned long size;
212 uml_ldt_t * ldt = &current->mm->context.skas.ldt;
213
214 if(!ldt->entry_count)
215 goto out;
216 if(bytecount > LDT_ENTRY_SIZE*LDT_ENTRIES)
217 bytecount = LDT_ENTRY_SIZE*LDT_ENTRIES;
218 err = bytecount;
219
220 if(ptrace_ldt){
221 return read_ldt_from_host(ptr, bytecount);
222 }
223
224 down(&ldt->semaphore);
225 if(ldt->entry_count <= LDT_DIRECT_ENTRIES){
226 size = LDT_ENTRY_SIZE*LDT_DIRECT_ENTRIES;
227 if(size > bytecount)
228 size = bytecount;
Jeff Dikee23181d2005-11-21 21:32:08 -0800229 if(copy_to_user(ptr, ldt->u.entries, size))
Bodo Stroesser858259c2005-11-07 00:58:55 -0800230 err = -EFAULT;
231 bytecount -= size;
232 ptr += size;
233 }
234 else {
235 for(i=0; i<ldt->entry_count/LDT_ENTRIES_PER_PAGE && bytecount;
236 i++){
237 size = PAGE_SIZE;
238 if(size > bytecount)
239 size = bytecount;
Jeff Dikee23181d2005-11-21 21:32:08 -0800240 if(copy_to_user(ptr, ldt->u.pages[i], size)){
Bodo Stroesser858259c2005-11-07 00:58:55 -0800241 err = -EFAULT;
242 break;
243 }
244 bytecount -= size;
245 ptr += size;
246 }
247 }
248 up(&ldt->semaphore);
249
250 if(bytecount == 0 || err == -EFAULT)
251 goto out;
252
253 if(clear_user(ptr, bytecount))
254 err = -EFAULT;
255
256out:
257 return err;
258}
259
260static int read_default_ldt(void __user * ptr, unsigned long bytecount)
261{
262 int err;
263
264 if(bytecount > 5*LDT_ENTRY_SIZE)
265 bytecount = 5*LDT_ENTRY_SIZE;
266
267 err = bytecount;
268 /* UML doesn't support lcall7 and lcall27.
269 * So, we don't really have a default ldt, but emulate
270 * an empty ldt of common host default ldt size.
271 */
272 if(clear_user(ptr, bytecount))
273 err = -EFAULT;
274
275 return err;
276}
277
278static int write_ldt(void __user * ptr, unsigned long bytecount, int func)
279{
280 uml_ldt_t * ldt = &current->mm->context.skas.ldt;
281 struct mm_id * mm_idp = &current->mm->context.skas.id;
282 int i, err;
283 struct user_desc ldt_info;
284 struct ldt_entry entry0, *ldt_p;
285 void *addr = NULL;
286
287 err = -EINVAL;
288 if(bytecount != sizeof(ldt_info))
289 goto out;
290 err = -EFAULT;
291 if(copy_from_user(&ldt_info, ptr, sizeof(ldt_info)))
292 goto out;
293
294 err = -EINVAL;
295 if(ldt_info.entry_number >= LDT_ENTRIES)
296 goto out;
297 if(ldt_info.contents == 3){
298 if (func == 1)
299 goto out;
300 if (ldt_info.seg_not_present == 0)
301 goto out;
302 }
303
304 if(!ptrace_ldt)
305 down(&ldt->semaphore);
306
307 err = write_ldt_entry(mm_idp, func, &ldt_info, &addr, 1);
308 if(err)
309 goto out_unlock;
310 else if(ptrace_ldt) {
311 /* With PTRACE_LDT available, this is used as a flag only */
312 ldt->entry_count = 1;
313 goto out;
314 }
315
316 if(ldt_info.entry_number >= ldt->entry_count &&
317 ldt_info.entry_number >= LDT_DIRECT_ENTRIES){
318 for(i=ldt->entry_count/LDT_ENTRIES_PER_PAGE;
319 i*LDT_ENTRIES_PER_PAGE <= ldt_info.entry_number;
320 i++){
321 if(i == 0)
Jeff Dikee23181d2005-11-21 21:32:08 -0800322 memcpy(&entry0, ldt->u.entries,
323 sizeof(entry0));
324 ldt->u.pages[i] = (struct ldt_entry *)
325 __get_free_page(GFP_KERNEL|__GFP_ZERO);
326 if(!ldt->u.pages[i]){
Bodo Stroesser858259c2005-11-07 00:58:55 -0800327 err = -ENOMEM;
328 /* Undo the change in host */
329 memset(&ldt_info, 0, sizeof(ldt_info));
330 write_ldt_entry(mm_idp, 1, &ldt_info, &addr, 1);
331 goto out_unlock;
332 }
333 if(i == 0) {
Jeff Dikee23181d2005-11-21 21:32:08 -0800334 memcpy(ldt->u.pages[0], &entry0,
335 sizeof(entry0));
336 memcpy(ldt->u.pages[0]+1, ldt->u.entries+1,
Bodo Stroesser858259c2005-11-07 00:58:55 -0800337 sizeof(entry0)*(LDT_DIRECT_ENTRIES-1));
338 }
339 ldt->entry_count = (i + 1) * LDT_ENTRIES_PER_PAGE;
340 }
341 }
342 if(ldt->entry_count <= ldt_info.entry_number)
343 ldt->entry_count = ldt_info.entry_number + 1;
344
345 if(ldt->entry_count <= LDT_DIRECT_ENTRIES)
Jeff Dikee23181d2005-11-21 21:32:08 -0800346 ldt_p = ldt->u.entries + ldt_info.entry_number;
Bodo Stroesser858259c2005-11-07 00:58:55 -0800347 else
Jeff Dikee23181d2005-11-21 21:32:08 -0800348 ldt_p = ldt->u.pages[ldt_info.entry_number/LDT_ENTRIES_PER_PAGE] +
Bodo Stroesser858259c2005-11-07 00:58:55 -0800349 ldt_info.entry_number%LDT_ENTRIES_PER_PAGE;
350
351 if(ldt_info.base_addr == 0 && ldt_info.limit == 0 &&
352 (func == 1 || LDT_empty(&ldt_info))){
353 ldt_p->a = 0;
354 ldt_p->b = 0;
355 }
356 else{
357 if (func == 1)
358 ldt_info.useable = 0;
359 ldt_p->a = LDT_entry_a(&ldt_info);
360 ldt_p->b = LDT_entry_b(&ldt_info);
361 }
362 err = 0;
363
364out_unlock:
365 up(&ldt->semaphore);
366out:
367 return err;
368}
369
370static long do_modify_ldt_skas(int func, void __user *ptr,
371 unsigned long bytecount)
372{
373 int ret = -ENOSYS;
374
375 switch (func) {
376 case 0:
377 ret = read_ldt(ptr, bytecount);
378 break;
379 case 1:
380 case 0x11:
381 ret = write_ldt(ptr, bytecount, func);
382 break;
383 case 2:
384 ret = read_default_ldt(ptr, bytecount);
385 break;
386 }
387 return ret;
388}
389
390short dummy_list[9] = {0, -1};
391short * host_ldt_entries = NULL;
392
393void ldt_get_host_info(void)
394{
395 long ret;
396 struct ldt_entry * ldt;
397 int i, size, k, order;
398
399 host_ldt_entries = dummy_list+1;
400
401 for(i = LDT_PAGES_MAX-1, order=0; i; i>>=1, order++);
402
403 ldt = (struct ldt_entry *)
404 __get_free_pages(GFP_KERNEL|__GFP_ZERO, order);
405 if(ldt == NULL) {
406 printk("ldt_get_host_info: couldn't allocate buffer for host ldt\n");
407 return;
408 }
409
410 ret = modify_ldt(0, ldt, (1<<order)*PAGE_SIZE);
411 if(ret < 0) {
412 printk("ldt_get_host_info: couldn't read host ldt\n");
413 goto out_free;
414 }
415 if(ret == 0) {
416 /* default_ldt is active, simply write an empty entry 0 */
417 host_ldt_entries = dummy_list;
418 goto out_free;
419 }
420
421 for(i=0, size=0; i<ret/LDT_ENTRY_SIZE; i++){
422 if(ldt[i].a != 0 || ldt[i].b != 0)
423 size++;
424 }
425
Jeff Dike91b165c2006-09-25 23:33:00 -0700426 if(size < ARRAY_SIZE(dummy_list))
Bodo Stroesser858259c2005-11-07 00:58:55 -0800427 host_ldt_entries = dummy_list;
Bodo Stroesser858259c2005-11-07 00:58:55 -0800428 else {
429 size = (size + 1) * sizeof(dummy_list[0]);
430 host_ldt_entries = (short *)kmalloc(size, GFP_KERNEL);
431 if(host_ldt_entries == NULL) {
432 printk("ldt_get_host_info: couldn't allocate host ldt list\n");
433 goto out_free;
434 }
435 }
436
437 for(i=0, k=0; i<ret/LDT_ENTRY_SIZE; i++){
438 if(ldt[i].a != 0 || ldt[i].b != 0) {
439 host_ldt_entries[k++] = i;
440 }
441 }
442 host_ldt_entries[k] = -1;
443
444out_free:
445 free_pages((unsigned long)ldt, order);
446}
447
448long init_new_ldt(struct mmu_context_skas * new_mm,
449 struct mmu_context_skas * from_mm)
450{
451 struct user_desc desc;
452 short * num_p;
453 int i;
454 long page, err=0;
455 void *addr = NULL;
Bodo Stroesser12919aa2006-01-18 17:42:39 -0800456 struct proc_mm_op copy;
Bodo Stroesser858259c2005-11-07 00:58:55 -0800457
Bodo Stroesser858259c2005-11-07 00:58:55 -0800458
459 if(!ptrace_ldt)
460 init_MUTEX(&new_mm->ldt.semaphore);
461
462 if(!from_mm){
Bodo Stroesser12919aa2006-01-18 17:42:39 -0800463 memset(&desc, 0, sizeof(desc));
Bodo Stroesser858259c2005-11-07 00:58:55 -0800464 /*
465 * We have to initialize a clean ldt.
466 */
467 if(proc_mm) {
468 /*
469 * If the new mm was created using proc_mm, host's
470 * default-ldt currently is assigned, which normally
471 * contains the call-gates for lcall7 and lcall27.
472 * To remove these gates, we simply write an empty
473 * entry as number 0 to the host.
474 */
475 err = write_ldt_entry(&new_mm->id, 1, &desc,
476 &addr, 1);
477 }
478 else{
479 /*
480 * Now we try to retrieve info about the ldt, we
481 * inherited from the host. All ldt-entries found
482 * will be reset in the following loop
483 */
484 if(host_ldt_entries == NULL)
485 ldt_get_host_info();
486 for(num_p=host_ldt_entries; *num_p != -1; num_p++){
487 desc.entry_number = *num_p;
488 err = write_ldt_entry(&new_mm->id, 1, &desc,
489 &addr, *(num_p + 1) == -1);
490 if(err)
491 break;
492 }
493 }
494 new_mm->ldt.entry_count = 0;
Bodo Stroesser12919aa2006-01-18 17:42:39 -0800495
496 goto out;
Bodo Stroesser858259c2005-11-07 00:58:55 -0800497 }
Bodo Stroesser12919aa2006-01-18 17:42:39 -0800498
499 if(proc_mm){
500 /* We have a valid from_mm, so we now have to copy the LDT of
501 * from_mm to new_mm, because using proc_mm an new mm with
502 * an empty/default LDT was created in new_mm()
503 */
504 copy = ((struct proc_mm_op) { .op = MM_COPY_SEGMENTS,
505 .u =
506 { .copy_segments =
507 from_mm->id.u.mm_fd } } );
508 i = os_write_file(new_mm->id.u.mm_fd, &copy, sizeof(copy));
509 if(i != sizeof(copy))
510 printk("new_mm : /proc/mm copy_segments failed, "
511 "err = %d\n", -i);
512 }
513
514 if(!ptrace_ldt) {
Bodo Stroesser858259c2005-11-07 00:58:55 -0800515 /* Our local LDT is used to supply the data for
516 * modify_ldt(READLDT), if PTRACE_LDT isn't available,
517 * i.e., we have to use the stub for modify_ldt, which
518 * can't handle the big read buffer of up to 64kB.
519 */
520 down(&from_mm->ldt.semaphore);
521 if(from_mm->ldt.entry_count <= LDT_DIRECT_ENTRIES){
Jeff Dikee23181d2005-11-21 21:32:08 -0800522 memcpy(new_mm->ldt.u.entries, from_mm->ldt.u.entries,
523 sizeof(new_mm->ldt.u.entries));
Bodo Stroesser858259c2005-11-07 00:58:55 -0800524 }
525 else{
526 i = from_mm->ldt.entry_count / LDT_ENTRIES_PER_PAGE;
527 while(i-->0){
528 page = __get_free_page(GFP_KERNEL|__GFP_ZERO);
529 if (!page){
530 err = -ENOMEM;
531 break;
532 }
Jeff Dikee23181d2005-11-21 21:32:08 -0800533 new_mm->ldt.u.pages[i] =
534 (struct ldt_entry *) page;
535 memcpy(new_mm->ldt.u.pages[i],
536 from_mm->ldt.u.pages[i], PAGE_SIZE);
Bodo Stroesser858259c2005-11-07 00:58:55 -0800537 }
538 }
539 new_mm->ldt.entry_count = from_mm->ldt.entry_count;
540 up(&from_mm->ldt.semaphore);
541 }
542
Bodo Stroesser12919aa2006-01-18 17:42:39 -0800543 out:
Bodo Stroesser858259c2005-11-07 00:58:55 -0800544 return err;
545}
546
547
548void free_ldt(struct mmu_context_skas * mm)
549{
550 int i;
551
552 if(!ptrace_ldt && mm->ldt.entry_count > LDT_DIRECT_ENTRIES){
553 i = mm->ldt.entry_count / LDT_ENTRIES_PER_PAGE;
554 while(i-- > 0){
Jeff Dikee23181d2005-11-21 21:32:08 -0800555 free_page((long )mm->ldt.u.pages[i]);
Bodo Stroesser858259c2005-11-07 00:58:55 -0800556 }
557 }
558 mm->ldt.entry_count = 0;
559}
560#endif
561
562int sys_modify_ldt(int func, void __user *ptr, unsigned long bytecount)
563{
564 return(CHOOSE_MODE_PROC(do_modify_ldt_tt, do_modify_ldt_skas, func,
565 ptr, bytecount));
566}