blob: 0a615f87142eaeb61581aeb31ddb1f486d2445bd [file] [log] [blame]
/*
 * fs/ioprio.c
 *
 * Copyright (C) 2004 Jens Axboe <axboe@kernel.dk>
 *
 * Helper functions for setting/querying io priorities of processes. The
 * system calls closely mimic getpriority/setpriority, see the man page for
 * those. The prio argument is a composite of prio class and prio data, where
 * the data argument has meaning within that class. The standard scheduling
 * classes have 8 distinct prio levels, with 0 being the highest prio and 7
 * being the lowest.
 *
 * IOW, setting BE scheduling class with prio 2 is done ala:
 *
 * unsigned int prio = (IOPRIO_CLASS_BE << IOPRIO_CLASS_SHIFT) | 2;
 *
 * ioprio_set(IOPRIO_WHO_PROCESS, pid, prio);
 *
 * See also Documentation/block/ioprio.txt
 *
 */
22#include <linux/kernel.h>
23#include <linux/ioprio.h>
24#include <linux/blkdev.h>
Randy Dunlap16f7e0f2006-01-11 12:17:46 -080025#include <linux/capability.h>
Adrian Bunk9abdc4c2005-11-08 16:57:02 +010026#include <linux/syscalls.h>
James Morris03e68062006-06-23 02:03:58 -070027#include <linux/security.h>
Pavel Emelyanovb4888932007-10-18 23:40:14 -070028#include <linux/pid_namespace.h>
Jens Axboe22e2c502005-06-27 10:55:12 +020029
30static int set_task_ioprio(struct task_struct *task, int ioprio)
31{
James Morris03e68062006-06-23 02:03:58 -070032 int err;
Jens Axboe22e2c502005-06-27 10:55:12 +020033 struct io_context *ioc;
34
35 if (task->uid != current->euid &&
36 task->uid != current->uid && !capable(CAP_SYS_NICE))
37 return -EPERM;
38
James Morris03e68062006-06-23 02:03:58 -070039 err = security_task_setioprio(task, ioprio);
40 if (err)
41 return err;
42
Jens Axboe22e2c502005-06-27 10:55:12 +020043 task_lock(task);
44
45 task->ioprio = ioprio;
46
47 ioc = task->io_context;
Oleg Nesterov9f83e452006-08-21 08:34:15 +020048 /* see wmb() in current_io_context() */
49 smp_read_barrier_depends();
50
Jens Axboefc463792006-08-29 09:05:44 +020051 if (ioc)
52 ioc->ioprio_changed = 1;
Jens Axboe22e2c502005-06-27 10:55:12 +020053
54 task_unlock(task);
55 return 0;
56}
57
Anton Blanchardcf366802005-07-07 17:56:13 -070058asmlinkage long sys_ioprio_set(int which, int who, int ioprio)
Jens Axboe22e2c502005-06-27 10:55:12 +020059{
60 int class = IOPRIO_PRIO_CLASS(ioprio);
61 int data = IOPRIO_PRIO_DATA(ioprio);
62 struct task_struct *p, *g;
63 struct user_struct *user;
Eric W. Biederman41487c62007-02-12 00:53:01 -080064 struct pid *pgrp;
Jens Axboe22e2c502005-06-27 10:55:12 +020065 int ret;
66
67 switch (class) {
68 case IOPRIO_CLASS_RT:
69 if (!capable(CAP_SYS_ADMIN))
70 return -EPERM;
71 /* fall through, rt has prio field too */
72 case IOPRIO_CLASS_BE:
73 if (data >= IOPRIO_BE_NR || data < 0)
74 return -EINVAL;
75
76 break;
77 case IOPRIO_CLASS_IDLE:
Linus Torvaldsf6fdd7d2005-08-20 18:51:29 -070078 if (!capable(CAP_SYS_ADMIN))
79 return -EPERM;
Jens Axboe22e2c502005-06-27 10:55:12 +020080 break;
81 default:
82 return -EINVAL;
83 }
84
85 ret = -ESRCH;
Oleg Nesterovcf342e52006-08-29 09:17:41 +020086 /*
87 * We want IOPRIO_WHO_PGRP/IOPRIO_WHO_USER to be "atomic",
88 * so we can't use rcu_read_lock(). See re-copy of ->ioprio
89 * in copy_process().
90 */
91 read_lock(&tasklist_lock);
Jens Axboe22e2c502005-06-27 10:55:12 +020092 switch (which) {
93 case IOPRIO_WHO_PROCESS:
94 if (!who)
95 p = current;
96 else
Pavel Emelyanovb4888932007-10-18 23:40:14 -070097 p = find_task_by_pid_ns(who,
98 current->nsproxy->pid_ns);
Jens Axboe22e2c502005-06-27 10:55:12 +020099 if (p)
100 ret = set_task_ioprio(p, ioprio);
101 break;
102 case IOPRIO_WHO_PGRP:
103 if (!who)
Eric W. Biederman41487c62007-02-12 00:53:01 -0800104 pgrp = task_pgrp(current);
105 else
Pavel Emelyanovb4888932007-10-18 23:40:14 -0700106 pgrp = find_vpid(who);
Eric W. Biederman41487c62007-02-12 00:53:01 -0800107 do_each_pid_task(pgrp, PIDTYPE_PGID, p) {
Jens Axboe22e2c502005-06-27 10:55:12 +0200108 ret = set_task_ioprio(p, ioprio);
109 if (ret)
110 break;
Eric W. Biederman41487c62007-02-12 00:53:01 -0800111 } while_each_pid_task(pgrp, PIDTYPE_PGID, p);
Jens Axboe22e2c502005-06-27 10:55:12 +0200112 break;
113 case IOPRIO_WHO_USER:
114 if (!who)
115 user = current->user;
116 else
117 user = find_user(who);
118
119 if (!user)
120 break;
121
122 do_each_thread(g, p) {
123 if (p->uid != who)
124 continue;
125 ret = set_task_ioprio(p, ioprio);
126 if (ret)
Oleg Nesterov78bd4d42006-08-21 08:33:23 +0200127 goto free_uid;
Jens Axboe22e2c502005-06-27 10:55:12 +0200128 } while_each_thread(g, p);
Oleg Nesterov78bd4d42006-08-21 08:33:23 +0200129free_uid:
Jens Axboe22e2c502005-06-27 10:55:12 +0200130 if (who)
131 free_uid(user);
132 break;
133 default:
134 ret = -EINVAL;
135 }
136
Oleg Nesterovcf342e52006-08-29 09:17:41 +0200137 read_unlock(&tasklist_lock);
Jens Axboe22e2c502005-06-27 10:55:12 +0200138 return ret;
139}
140
David Quigleya1836a42006-06-30 01:55:49 -0700141static int get_task_ioprio(struct task_struct *p)
142{
143 int ret;
144
145 ret = security_task_getioprio(p);
146 if (ret)
147 goto out;
148 ret = p->ioprio;
149out:
150 return ret;
151}
152
Oleg Nesterove014ff82006-08-21 10:02:50 +0200153int ioprio_best(unsigned short aprio, unsigned short bprio)
154{
155 unsigned short aclass = IOPRIO_PRIO_CLASS(aprio);
156 unsigned short bclass = IOPRIO_PRIO_CLASS(bprio);
157
Oleg Nesterove014ff82006-08-21 10:02:50 +0200158 if (aclass == IOPRIO_CLASS_NONE)
159 aclass = IOPRIO_CLASS_BE;
160 if (bclass == IOPRIO_CLASS_NONE)
161 bclass = IOPRIO_CLASS_BE;
162
163 if (aclass == bclass)
164 return min(aprio, bprio);
165 if (aclass > bclass)
166 return bprio;
167 else
168 return aprio;
169}
170
Anton Blanchardcf366802005-07-07 17:56:13 -0700171asmlinkage long sys_ioprio_get(int which, int who)
Jens Axboe22e2c502005-06-27 10:55:12 +0200172{
173 struct task_struct *g, *p;
174 struct user_struct *user;
Eric W. Biederman41487c62007-02-12 00:53:01 -0800175 struct pid *pgrp;
Jens Axboe22e2c502005-06-27 10:55:12 +0200176 int ret = -ESRCH;
David Quigleya1836a42006-06-30 01:55:49 -0700177 int tmpio;
Jens Axboe22e2c502005-06-27 10:55:12 +0200178
Oleg Nesterovcf342e52006-08-29 09:17:41 +0200179 read_lock(&tasklist_lock);
Jens Axboe22e2c502005-06-27 10:55:12 +0200180 switch (which) {
181 case IOPRIO_WHO_PROCESS:
182 if (!who)
183 p = current;
184 else
Pavel Emelyanovb4888932007-10-18 23:40:14 -0700185 p = find_task_by_pid_ns(who,
186 current->nsproxy->pid_ns);
Jens Axboe22e2c502005-06-27 10:55:12 +0200187 if (p)
David Quigleya1836a42006-06-30 01:55:49 -0700188 ret = get_task_ioprio(p);
Jens Axboe22e2c502005-06-27 10:55:12 +0200189 break;
190 case IOPRIO_WHO_PGRP:
191 if (!who)
Eric W. Biederman41487c62007-02-12 00:53:01 -0800192 pgrp = task_pgrp(current);
193 else
Pavel Emelyanovb4888932007-10-18 23:40:14 -0700194 pgrp = find_vpid(who);
Eric W. Biederman41487c62007-02-12 00:53:01 -0800195 do_each_pid_task(pgrp, PIDTYPE_PGID, p) {
David Quigleya1836a42006-06-30 01:55:49 -0700196 tmpio = get_task_ioprio(p);
197 if (tmpio < 0)
198 continue;
Jens Axboe22e2c502005-06-27 10:55:12 +0200199 if (ret == -ESRCH)
David Quigleya1836a42006-06-30 01:55:49 -0700200 ret = tmpio;
Jens Axboe22e2c502005-06-27 10:55:12 +0200201 else
David Quigleya1836a42006-06-30 01:55:49 -0700202 ret = ioprio_best(ret, tmpio);
Eric W. Biederman41487c62007-02-12 00:53:01 -0800203 } while_each_pid_task(pgrp, PIDTYPE_PGID, p);
Jens Axboe22e2c502005-06-27 10:55:12 +0200204 break;
205 case IOPRIO_WHO_USER:
206 if (!who)
207 user = current->user;
208 else
209 user = find_user(who);
210
211 if (!user)
212 break;
213
214 do_each_thread(g, p) {
215 if (p->uid != user->uid)
216 continue;
David Quigleya1836a42006-06-30 01:55:49 -0700217 tmpio = get_task_ioprio(p);
218 if (tmpio < 0)
219 continue;
Jens Axboe22e2c502005-06-27 10:55:12 +0200220 if (ret == -ESRCH)
David Quigleya1836a42006-06-30 01:55:49 -0700221 ret = tmpio;
Jens Axboe22e2c502005-06-27 10:55:12 +0200222 else
David Quigleya1836a42006-06-30 01:55:49 -0700223 ret = ioprio_best(ret, tmpio);
Jens Axboe22e2c502005-06-27 10:55:12 +0200224 } while_each_thread(g, p);
225
226 if (who)
227 free_uid(user);
228 break;
229 default:
230 ret = -EINVAL;
231 }
232
Oleg Nesterovcf342e52006-08-29 09:17:41 +0200233 read_unlock(&tasklist_lock);
Jens Axboe22e2c502005-06-27 10:55:12 +0200234 return ret;
235}
236