blob: b791022beef3158ba02a739c061838bf57500bf5 [file] [log] [blame]
Jens Axboe86db1e22008-01-29 14:53:40 +01001/*
2 * Functions related to io context handling
3 */
4#include <linux/kernel.h>
5#include <linux/module.h>
6#include <linux/init.h>
7#include <linux/bio.h>
8#include <linux/blkdev.h>
9#include <linux/bootmem.h> /* for max_pfn/max_low_pfn */
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090010#include <linux/slab.h>
Jens Axboe86db1e22008-01-29 14:53:40 +010011
12#include "blk.h"
13
/*
 * Slab cache from which struct io_context objects are allocated and freed
 */
17static struct kmem_cache *iocontext_cachep;
18
19static void cfq_dtor(struct io_context *ioc)
20{
Jens Axboeffc4e752008-02-19 10:02:29 +010021 if (!hlist_empty(&ioc->cic_list)) {
22 struct cfq_io_context *cic;
Jens Axboe86db1e22008-01-29 14:53:40 +010023
Jens Axboeffc4e752008-02-19 10:02:29 +010024 cic = list_entry(ioc->cic_list.first, struct cfq_io_context,
25 cic_list);
26 cic->dtor(ioc);
27 }
Jens Axboe86db1e22008-01-29 14:53:40 +010028}
29
30/*
31 * IO Context helper functions. put_io_context() returns 1 if there are no
32 * more users of this io context, 0 otherwise.
33 */
34int put_io_context(struct io_context *ioc)
35{
36 if (ioc == NULL)
37 return 1;
38
Nikanth Karthikesand9c7d392009-06-10 12:57:06 -070039 BUG_ON(atomic_long_read(&ioc->refcount) == 0);
Jens Axboe86db1e22008-01-29 14:53:40 +010040
Nikanth Karthikesand9c7d392009-06-10 12:57:06 -070041 if (atomic_long_dec_and_test(&ioc->refcount)) {
Jens Axboe86db1e22008-01-29 14:53:40 +010042 rcu_read_lock();
Jens Axboe86db1e22008-01-29 14:53:40 +010043 cfq_dtor(ioc);
Jens Axboe07416d22008-05-07 09:17:12 +020044 rcu_read_unlock();
Jens Axboe86db1e22008-01-29 14:53:40 +010045
46 kmem_cache_free(iocontext_cachep, ioc);
47 return 1;
48 }
49 return 0;
50}
51EXPORT_SYMBOL(put_io_context);
52
53static void cfq_exit(struct io_context *ioc)
54{
Jens Axboe86db1e22008-01-29 14:53:40 +010055 rcu_read_lock();
Jens Axboe86db1e22008-01-29 14:53:40 +010056
Jens Axboeffc4e752008-02-19 10:02:29 +010057 if (!hlist_empty(&ioc->cic_list)) {
58 struct cfq_io_context *cic;
59
60 cic = list_entry(ioc->cic_list.first, struct cfq_io_context,
61 cic_list);
62 cic->exit(ioc);
63 }
64 rcu_read_unlock();
Jens Axboe86db1e22008-01-29 14:53:40 +010065}
66
Bart Van Assche27667c92010-12-21 15:07:45 +010067/* Called by the exiting task */
Louis Rillingb69f2292009-12-04 14:52:42 +010068void exit_io_context(struct task_struct *task)
Jens Axboe86db1e22008-01-29 14:53:40 +010069{
70 struct io_context *ioc;
71
Louis Rillingb69f2292009-12-04 14:52:42 +010072 task_lock(task);
73 ioc = task->io_context;
74 task->io_context = NULL;
75 task_unlock(task);
Jens Axboe86db1e22008-01-29 14:53:40 +010076
Bart Van Assche27667c92010-12-21 15:07:45 +010077 if (atomic_dec_and_test(&ioc->nr_tasks))
Jens Axboe86db1e22008-01-29 14:53:40 +010078 cfq_exit(ioc);
79
Louis Rilling61cc74f2009-12-04 14:52:41 +010080 put_io_context(ioc);
Jens Axboe86db1e22008-01-29 14:53:40 +010081}
82
83struct io_context *alloc_io_context(gfp_t gfp_flags, int node)
84{
85 struct io_context *ret;
86
87 ret = kmem_cache_alloc_node(iocontext_cachep, gfp_flags, node);
88 if (ret) {
Nikanth Karthikesand9c7d392009-06-10 12:57:06 -070089 atomic_long_set(&ret->refcount, 1);
Jens Axboe86db1e22008-01-29 14:53:40 +010090 atomic_set(&ret->nr_tasks, 1);
91 spin_lock_init(&ret->lock);
92 ret->ioprio_changed = 0;
93 ret->ioprio = 0;
Richard Kennedy4671a132010-03-01 10:57:22 +010094 ret->last_waited = 0; /* doesn't matter... */
Jens Axboe86db1e22008-01-29 14:53:40 +010095 ret->nr_batch_requests = 0; /* because this is 0 */
Jens Axboe86db1e22008-01-29 14:53:40 +010096 INIT_RADIX_TREE(&ret->radix_root, GFP_ATOMIC | __GFP_HIGH);
Jens Axboeffc4e752008-02-19 10:02:29 +010097 INIT_HLIST_HEAD(&ret->cic_list);
Jens Axboe86db1e22008-01-29 14:53:40 +010098 ret->ioc_data = NULL;
99 }
100
101 return ret;
102}
103
104/*
105 * If the current task has no IO context then create one and initialise it.
106 * Otherwise, return its existing IO context.
107 *
108 * This returned IO context doesn't have a specifically elevated refcount,
109 * but since the current task itself holds a reference, the context can be
110 * used in general code, so long as it stays within `current` context.
111 */
112struct io_context *current_io_context(gfp_t gfp_flags, int node)
113{
114 struct task_struct *tsk = current;
115 struct io_context *ret;
116
117 ret = tsk->io_context;
118 if (likely(ret))
119 return ret;
120
121 ret = alloc_io_context(gfp_flags, node);
122 if (ret) {
123 /* make sure set_task_ioprio() sees the settings above */
124 smp_wmb();
125 tsk->io_context = ret;
126 }
127
128 return ret;
129}
130
131/*
132 * If the current task has no IO context then create one and initialise it.
133 * If it does have a context, take a ref on it.
134 *
135 * This is always called in the context of the task which submitted the I/O.
136 */
137struct io_context *get_io_context(gfp_t gfp_flags, int node)
138{
139 struct io_context *ret = NULL;
140
141 /*
142 * Check for unlikely race with exiting task. ioc ref count is
143 * zero when ioc is being detached.
144 */
145 do {
146 ret = current_io_context(gfp_flags, node);
147 if (unlikely(!ret))
148 break;
Nikanth Karthikesand9c7d392009-06-10 12:57:06 -0700149 } while (!atomic_long_inc_not_zero(&ret->refcount));
Jens Axboe86db1e22008-01-29 14:53:40 +0100150
151 return ret;
152}
153EXPORT_SYMBOL(get_io_context);
154
Adrian Bunk13341592008-02-18 13:45:53 +0100155static int __init blk_ioc_init(void)
Jens Axboe86db1e22008-01-29 14:53:40 +0100156{
157 iocontext_cachep = kmem_cache_create("blkdev_ioc",
158 sizeof(struct io_context), 0, SLAB_PANIC, NULL);
159 return 0;
160}
161subsys_initcall(blk_ioc_init);