blob: 1b738827b2f69b68041fd3d85150483e7ac6e63c [file] [log] [blame]
Vivek Goyal31e4c282009-12-03 12:59:42 -05001#ifndef _BLK_CGROUP_H
2#define _BLK_CGROUP_H
/*
 * Common Block IO controller cgroup interface
 *
 * Based on ideas and code from CFQ, CFS and BFQ:
 * Copyright (C) 2003 Jens Axboe <axboe@kernel.dk>
 *
 * Copyright (C) 2008 Fabio Checconi <fabio@gandalf.sssup.it>
 *		      Paolo Valente <paolo.valente@unimore.it>
 *
 * Copyright (C) 2009 Vivek Goyal <vgoyal@redhat.com>
 *		      Nauman Rafique <nauman@google.com>
 */
15
16#include <linux/cgroup.h>
17
/*
 * Identifies a blkio policy.  Stored in blkio_group, blkio_policy_node and
 * blkio_policy_type to record which policy the object belongs to.
 */
enum blkio_policy_id {
	BLKIO_POLICY_PROP = 0,		/* Proportional Bandwidth division */
	BLKIO_POLICY_THROTL,		/* Throttling */
};
22
Ben Blum67523c42010-03-10 15:22:11 -080023#if defined(CONFIG_BLK_CGROUP) || defined(CONFIG_BLK_CGROUP_MODULE)
24
#ifndef CONFIG_BLK_CGROUP
/*
 * When blk-cgroup is a module, its subsys_id isn't a compile-time constant,
 * so blkio_subsys_id is read from the subsystem object instead.
 */
extern struct cgroup_subsys blkio_subsys;
#define blkio_subsys_id blkio_subsys.subsys_id
#endif
Jens Axboe2f5ea472009-12-03 21:06:43 +010030
/*
 * Kinds of statistics tracked per blkio group.  The entries up to and
 * including BLKIO_STAT_QUEUED size the first dimension of
 * blkio_group_stats.stat_arr; the remaining entries are single valued.
 */
enum stat_type {
	/* Total time spent (in ns) between request dispatch to the driver and
	 * request completion for IOs done by this cgroup. This may not be
	 * accurate when NCQ is turned on. */
	BLKIO_STAT_SERVICE_TIME = 0,
	/* Total bytes transferred */
	BLKIO_STAT_SERVICE_BYTES,
	/* Total IOs serviced, post merge */
	BLKIO_STAT_SERVICED,
	/* Total time spent waiting in scheduler queue in ns */
	BLKIO_STAT_WAIT_TIME,
	/* Number of IOs merged */
	BLKIO_STAT_MERGED,
	/* Number of IOs queued up */
	BLKIO_STAT_QUEUED,
	/* All the single valued stats go below this */
	BLKIO_STAT_TIME,
	BLKIO_STAT_SECTORS,
#ifdef CONFIG_DEBUG_BLK_CGROUP
	/* Only available when CONFIG_DEBUG_BLK_CGROUP is set */
	BLKIO_STAT_AVG_QUEUE_SIZE,
	BLKIO_STAT_IDLE_TIME,
	BLKIO_STAT_EMPTY_TIME,
	BLKIO_STAT_GROUP_WAIT_TIME,
	BLKIO_STAT_DEQUEUE
#endif
};
57
/*
 * Per-direction / per-sync breakdown of a statistic.  BLKIO_STAT_TOTAL
 * comes last and is used as the size of the second dimension of
 * blkio_group_stats.stat_arr.
 */
enum stat_sub_type {
	BLKIO_STAT_READ = 0,
	BLKIO_STAT_WRITE,
	BLKIO_STAT_SYNC,
	BLKIO_STAT_ASYNC,
	BLKIO_STAT_TOTAL
};
65
/*
 * blkg state flags.  Each value is a bit position: the BLKG_FLAG_FNS()
 * helpers in this header shift 1 by it to test/set/clear the bit in
 * blkio_group_stats.flags.
 */
enum blkg_state_flags {
	BLKG_waiting = 0,
	BLKG_idling,
	BLKG_empty,
};
72
/*
 * cgroup files owned by proportional weight policy.
 * Numbering starts at 1.
 */
enum blkcg_file_name_prop {
	BLKIO_PROP_weight = 1,
	BLKIO_PROP_weight_device,
	BLKIO_PROP_io_service_bytes,
	BLKIO_PROP_io_serviced,
	BLKIO_PROP_time,
	BLKIO_PROP_sectors,
	BLKIO_PROP_io_service_time,
	BLKIO_PROP_io_wait_time,
	BLKIO_PROP_io_merged,
	BLKIO_PROP_io_queued,
	BLKIO_PROP_avg_queue_size,
	BLKIO_PROP_group_wait_time,
	BLKIO_PROP_idle_time,
	BLKIO_PROP_empty_time,
	BLKIO_PROP_dequeue,
};
91
/*
 * cgroup files owned by throttle policy.
 * No explicit initializer, so numbering starts at 0.
 */
enum blkcg_file_name_throtl {
	BLKIO_THROTL_read_bps_device,
	BLKIO_THROTL_write_bps_device,
	BLKIO_THROTL_io_service_bytes,
	BLKIO_THROTL_io_serviced,
};
99
Vivek Goyal31e4c282009-12-03 12:59:42 -0500100struct blkio_cgroup {
101 struct cgroup_subsys_state css;
102 unsigned int weight;
103 spinlock_t lock;
104 struct hlist_head blkg_list;
Gui Jianfeng34d0f172010-04-13 16:05:49 +0800105 struct list_head policy_list; /* list of blkio_policy_node */
Vivek Goyal31e4c282009-12-03 12:59:42 -0500106};
107
Divyesh Shah303a3ac2010-04-01 15:01:24 -0700108struct blkio_group_stats {
109 /* total disk time and nr sectors dispatched by this group */
110 uint64_t time;
111 uint64_t sectors;
Divyesh Shahcdc11842010-04-08 21:15:10 -0700112 uint64_t stat_arr[BLKIO_STAT_QUEUED + 1][BLKIO_STAT_TOTAL];
Divyesh Shah303a3ac2010-04-01 15:01:24 -0700113#ifdef CONFIG_DEBUG_BLK_CGROUP
Divyesh Shahcdc11842010-04-08 21:15:10 -0700114 /* Sum of number of IOs queued across all samples */
115 uint64_t avg_queue_size_sum;
116 /* Count of samples taken for average */
117 uint64_t avg_queue_size_samples;
Divyesh Shah303a3ac2010-04-01 15:01:24 -0700118 /* How many times this group has been removed from service tree */
119 unsigned long dequeue;
Divyesh Shah812df482010-04-08 21:15:35 -0700120
121 /* Total time spent waiting for it to be assigned a timeslice. */
122 uint64_t group_wait_time;
123 uint64_t start_group_wait_time;
124
125 /* Time spent idling for this blkio_group */
126 uint64_t idle_time;
127 uint64_t start_idle_time;
128 /*
129 * Total time when we have requests queued and do not contain the
130 * current active queue.
131 */
132 uint64_t empty_time;
133 uint64_t start_empty_time;
134 uint16_t flags;
Divyesh Shah303a3ac2010-04-01 15:01:24 -0700135#endif
136};
137
Vivek Goyal31e4c282009-12-03 12:59:42 -0500138struct blkio_group {
139 /* An rcu protected unique identifier for the group */
140 void *key;
141 struct hlist_node blkcg_node;
Vivek Goyalb1c35762009-12-03 12:59:47 -0500142 unsigned short blkcg_id;
Vivek Goyal2868ef72009-12-03 12:59:48 -0500143 /* Store cgroup path */
144 char path[128];
Vivek Goyal22084192009-12-03 12:59:49 -0500145 /* The device MKDEV(major, minor), this group has been created for */
Divyesh Shah84c124d2010-04-09 08:31:19 +0200146 dev_t dev;
Vivek Goyal062a6442010-09-15 17:06:33 -0400147 /* policy which owns this blk group */
148 enum blkio_policy_id plid;
Vivek Goyal22084192009-12-03 12:59:49 -0500149
Divyesh Shah303a3ac2010-04-01 15:01:24 -0700150 /* Need to serialize the stats in the case of reset/update */
151 spinlock_t stats_lock;
152 struct blkio_group_stats stats;
Vivek Goyal31e4c282009-12-03 12:59:42 -0500153};
154
Gui Jianfeng34d0f172010-04-13 16:05:49 +0800155struct blkio_policy_node {
156 struct list_head node;
157 dev_t dev;
Vivek Goyal062a6442010-09-15 17:06:33 -0400158 /* This node belongs to max bw policy or porportional weight policy */
159 enum blkio_policy_id plid;
160 /* cgroup file to which this rule belongs to */
161 int fileid;
Vivek Goyal4c9eefa2010-09-15 17:06:34 -0400162
163 union {
164 unsigned int weight;
165 /*
166 * Rate read/write in terms of byptes per second
167 * Whether this rate represents read or write is determined
168 * by file type "fileid".
169 */
170 u64 bps;
171 } val;
Gui Jianfeng34d0f172010-04-13 16:05:49 +0800172};
173
/*
 * Per-device value accessors, defined outside this header.
 * NOTE(review): presumably these return the weight / read bps / write bps
 * that applies to @dev within @blkcg -- confirm against the definitions.
 */
extern unsigned int blkcg_get_weight(struct blkio_cgroup *blkcg,
				     dev_t dev);
extern uint64_t blkcg_get_read_bps(struct blkio_cgroup *blkcg,
				   dev_t dev);
extern uint64_t blkcg_get_write_bps(struct blkio_cgroup *blkcg,
				    dev_t dev);
Gui Jianfeng34d0f172010-04-13 16:05:49 +0800180
Vivek Goyal3e252062009-12-04 10:36:42 -0500181typedef void (blkio_unlink_group_fn) (void *key, struct blkio_group *blkg);
182typedef void (blkio_update_group_weight_fn) (struct blkio_group *blkg,
183 unsigned int weight);
Vivek Goyal4c9eefa2010-09-15 17:06:34 -0400184typedef void (blkio_update_group_read_bps_fn) (struct blkio_group *blkg,
185 u64 read_bps);
186typedef void (blkio_update_group_write_bps_fn) (struct blkio_group *blkg,
187 u64 write_bps);
Vivek Goyal3e252062009-12-04 10:36:42 -0500188
189struct blkio_policy_ops {
190 blkio_unlink_group_fn *blkio_unlink_group_fn;
191 blkio_update_group_weight_fn *blkio_update_group_weight_fn;
Vivek Goyal4c9eefa2010-09-15 17:06:34 -0400192 blkio_update_group_read_bps_fn *blkio_update_group_read_bps_fn;
193 blkio_update_group_write_bps_fn *blkio_update_group_write_bps_fn;
Vivek Goyal3e252062009-12-04 10:36:42 -0500194};
195
196struct blkio_policy_type {
197 struct list_head list;
198 struct blkio_policy_ops ops;
Vivek Goyal062a6442010-09-15 17:06:33 -0400199 enum blkio_policy_id plid;
Vivek Goyal3e252062009-12-04 10:36:42 -0500200};
201
/* Blkio controller policy registration */
extern void blkio_policy_register(struct blkio_policy_type *);
extern void blkio_policy_unregister(struct blkio_policy_type *);
205
Vivek Goyalafc24d42010-04-26 19:27:56 +0200206static inline char *blkg_path(struct blkio_group *blkg)
207{
208 return blkg->path;
209}
210
Jens Axboe2f5ea472009-12-03 21:06:43 +0100211#else
212
/*
 * Stubs for builds with neither CONFIG_BLK_CGROUP nor
 * CONFIG_BLK_CGROUP_MODULE: the types are empty, registration does
 * nothing and no path is available.
 */
struct blkio_group {
};

struct blkio_policy_type {
};

static inline void blkio_policy_register(struct blkio_policy_type *blkiop) { }
static inline void blkio_policy_unregister(struct blkio_policy_type *blkiop) { }

/* Always NULL in this configuration. */
static inline char *blkg_path(struct blkio_group *blkg) { return NULL; }
223
Jens Axboe2f5ea472009-12-03 21:06:43 +0100224#endif
225
/* Minimum, maximum and default weight values */
#define BLKIO_WEIGHT_MIN	100
#define BLKIO_WEIGHT_MAX	1000
#define BLKIO_WEIGHT_DEFAULT	500
229
Vivek Goyal2868ef72009-12-03 12:59:48 -0500230#ifdef CONFIG_DEBUG_BLK_CGROUP
/*
 * Debug-only statistics hooks, declared when CONFIG_DEBUG_BLK_CGROUP is
 * set; empty inline versions are provided otherwise.
 */
void blkiocg_update_avg_queue_size_stats(struct blkio_group *blkg);
void blkiocg_update_dequeue_stats(struct blkio_group *blkg,
				unsigned long dequeue);
void blkiocg_update_set_idle_time_stats(struct blkio_group *blkg);
void blkiocg_update_idle_time_stats(struct blkio_group *blkg);
void blkiocg_set_start_empty_time(struct blkio_group *blkg);
Divyesh Shah812df482010-04-08 21:15:35 -0700237
238#define BLKG_FLAG_FNS(name) \
239static inline void blkio_mark_blkg_##name( \
240 struct blkio_group_stats *stats) \
241{ \
242 stats->flags |= (1 << BLKG_##name); \
243} \
244static inline void blkio_clear_blkg_##name( \
245 struct blkio_group_stats *stats) \
246{ \
247 stats->flags &= ~(1 << BLKG_##name); \
248} \
249static inline int blkio_blkg_##name(struct blkio_group_stats *stats) \
250{ \
251 return (stats->flags & (1 << BLKG_##name)) != 0; \
252} \
253
254BLKG_FLAG_FNS(waiting)
255BLKG_FLAG_FNS(idling)
256BLKG_FLAG_FNS(empty)
257#undef BLKG_FLAG_FNS
Vivek Goyal2868ef72009-12-03 12:59:48 -0500258#else
/*
 * Empty versions of the debug statistics hooks, used when
 * CONFIG_DEBUG_BLK_CGROUP is not set.
 */
static inline void blkiocg_update_avg_queue_size_stats(
						struct blkio_group *blkg) {}
static inline void blkiocg_update_dequeue_stats(struct blkio_group *blkg,
						unsigned long dequeue) {}
static inline void blkiocg_update_set_idle_time_stats(struct blkio_group *blkg)
{}
static inline void blkiocg_update_idle_time_stats(struct blkio_group *blkg) {}
static inline void blkiocg_set_start_empty_time(struct blkio_group *blkg) {}
Vivek Goyal2868ef72009-12-03 12:59:48 -0500267#endif
268
Ben Blum67523c42010-03-10 15:22:11 -0800269#if defined(CONFIG_BLK_CGROUP) || defined(CONFIG_BLK_CGROUP_MODULE)
/*
 * Interface available when CONFIG_BLK_CGROUP or CONFIG_BLK_CGROUP_MODULE
 * is set; all of these are defined outside this header.
 */
extern struct blkio_cgroup blkio_root_cgroup;
extern struct blkio_cgroup *cgroup_to_blkio_cgroup(struct cgroup *cgroup);
extern void blkiocg_add_blkio_group(struct blkio_cgroup *blkcg,
	struct blkio_group *blkg, void *key, dev_t dev,
	enum blkio_policy_id plid);
extern int blkiocg_del_blkio_group(struct blkio_group *blkg);
extern struct blkio_group *blkiocg_lookup_group(struct blkio_cgroup *blkcg,
						void *key);

/* Statistics update hooks */
void blkiocg_update_timeslice_used(struct blkio_group *blkg,
					unsigned long time);
void blkiocg_update_dispatch_stats(struct blkio_group *blkg, uint64_t bytes,
						bool direction, bool sync);
void blkiocg_update_completion_stats(struct blkio_group *blkg,
	uint64_t start_time, uint64_t io_start_time, bool direction, bool sync);
void blkiocg_update_io_merged_stats(struct blkio_group *blkg, bool direction,
					bool sync);
void blkiocg_update_io_add_stats(struct blkio_group *blkg,
		struct blkio_group *curr_blkg, bool direction, bool sync);
void blkiocg_update_io_remove_stats(struct blkio_group *blkg,
					bool direction, bool sync);
Vivek Goyal31e4c282009-12-03 12:59:42 -0500290#else
struct cgroup;
/* Stub for the disabled configuration: there is no blkio_cgroup to return. */
static inline struct blkio_cgroup *
cgroup_to_blkio_cgroup(struct cgroup *cgroup) { return NULL; }
294
295static inline void blkiocg_add_blkio_group(struct blkio_cgroup *blkcg,
Vivek Goyal062a6442010-09-15 17:06:33 -0400296 struct blkio_group *blkg, void *key, dev_t dev,
297 enum blkio_policy_id plid) {}
Vivek Goyal31e4c282009-12-03 12:59:42 -0500298
/* Stub for the disabled configuration: always returns 0. */
static inline int
blkiocg_del_blkio_group(struct blkio_group *blkg) { return 0; }

/* Stub for the disabled configuration: never finds a group. */
static inline struct blkio_group *
blkiocg_lookup_group(struct blkio_cgroup *blkcg, void *key) { return NULL; }
/*
 * Empty versions of the statistics update hooks for the disabled
 * configuration.
 */
static inline void blkiocg_update_timeslice_used(struct blkio_group *blkg,
						unsigned long time) {}
static inline void blkiocg_update_dispatch_stats(struct blkio_group *blkg,
				uint64_t bytes, bool direction, bool sync) {}
static inline void blkiocg_update_completion_stats(struct blkio_group *blkg,
		uint64_t start_time, uint64_t io_start_time, bool direction,
		bool sync) {}
static inline void blkiocg_update_io_merged_stats(struct blkio_group *blkg,
						bool direction, bool sync) {}
static inline void blkiocg_update_io_add_stats(struct blkio_group *blkg,
		struct blkio_group *curr_blkg, bool direction, bool sync) {}
static inline void blkiocg_update_io_remove_stats(struct blkio_group *blkg,
						bool direction, bool sync) {}
Vivek Goyal31e4c282009-12-03 12:59:42 -0500317#endif
318#endif /* _BLK_CGROUP_H */