blob: 6ef05d5b884db3748b2662098864fe41f711670e [file] [log] [blame]
Chris Wilson5cc9ed42014-05-16 14:22:37 +01001/*
2 * Copyright © 2012-2014 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 */
24
Maarten Lankhorstb588c922015-05-13 09:56:00 +020025#include <drm/drmP.h>
26#include <drm/i915_drm.h>
Chris Wilson5cc9ed42014-05-16 14:22:37 +010027#include "i915_drv.h"
28#include "i915_trace.h"
29#include "intel_drv.h"
30#include <linux/mmu_context.h>
31#include <linux/mmu_notifier.h>
32#include <linux/mempolicy.h>
33#include <linux/swap.h>
Ingo Molnar6e84f312017-02-08 18:51:29 +010034#include <linux/sched/mm.h>
Chris Wilson5cc9ed42014-05-16 14:22:37 +010035
Chris Wilsonad46cb52014-08-07 14:20:40 +010036struct i915_mm_struct {
37 struct mm_struct *mm;
Chris Wilsonf470b192016-04-05 15:00:01 +010038 struct drm_i915_private *i915;
Chris Wilsonad46cb52014-08-07 14:20:40 +010039 struct i915_mmu_notifier *mn;
40 struct hlist_node node;
41 struct kref kref;
42 struct work_struct work;
43};
44
Chris Wilson5cc9ed42014-05-16 14:22:37 +010045#if defined(CONFIG_MMU_NOTIFIER)
46#include <linux/interval_tree.h>
47
48struct i915_mmu_notifier {
49 spinlock_t lock;
50 struct hlist_node node;
51 struct mmu_notifier mn;
52 struct rb_root objects;
Chris Wilson393afc22016-04-05 14:59:59 +010053 struct workqueue_struct *wq;
Chris Wilson5cc9ed42014-05-16 14:22:37 +010054};
55
56struct i915_mmu_object {
Chris Wilsonad46cb52014-08-07 14:20:40 +010057 struct i915_mmu_notifier *mn;
Chris Wilson768e1592016-01-21 17:32:43 +000058 struct drm_i915_gem_object *obj;
Chris Wilson5cc9ed42014-05-16 14:22:37 +010059 struct interval_tree_node it;
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010060 struct list_head link;
Chris Wilson380996a2015-10-01 12:34:47 +010061 struct work_struct work;
Chris Wilson768e1592016-01-21 17:32:43 +000062 bool attached;
Chris Wilson5cc9ed42014-05-16 14:22:37 +010063};
64
Chris Wilson768e1592016-01-21 17:32:43 +000065static void cancel_userptr(struct work_struct *work)
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010066{
Chris Wilson380996a2015-10-01 12:34:47 +010067 struct i915_mmu_object *mo = container_of(work, typeof(*mo), work);
68 struct drm_i915_gem_object *obj = mo->obj;
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010069 struct drm_device *dev = obj->base.dev;
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010070
Chris Wilsone95433c2016-10-28 13:58:27 +010071 i915_gem_object_wait(obj, I915_WAIT_ALL, MAX_SCHEDULE_TIMEOUT, NULL);
Chris Wilson8a3b3d52016-08-05 10:14:08 +010072
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010073 mutex_lock(&dev->struct_mutex);
74 /* Cancel any active worker and force us to re-evaluate gup */
75 obj->userptr.work = NULL;
76
Chris Wilson03ac84f2016-10-28 13:58:36 +010077 /* We are inside a kthread context and can't be interrupted */
78 if (i915_gem_object_unbind(obj) == 0)
Chris Wilson548625e2016-11-01 12:11:34 +000079 __i915_gem_object_put_pages(obj, I915_MM_NORMAL);
Chris Wilson03ac84f2016-10-28 13:58:36 +010080 WARN_ONCE(obj->mm.pages,
81 "Failed to release pages: bind_count=%d, pages_pin_count=%d, pin_display=%d\n",
82 obj->bind_count,
Chris Wilson1233e2d2016-10-28 13:58:37 +010083 atomic_read(&obj->mm.pages_pin_count),
Chris Wilson03ac84f2016-10-28 13:58:36 +010084 obj->pin_display);
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010085
Chris Wilsonf8c417c2016-07-20 13:31:53 +010086 i915_gem_object_put(obj);
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010087 mutex_unlock(&dev->struct_mutex);
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010088}
89
Chris Wilson768e1592016-01-21 17:32:43 +000090static void add_object(struct i915_mmu_object *mo)
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010091{
Chris Wilson768e1592016-01-21 17:32:43 +000092 if (mo->attached)
93 return;
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010094
Chris Wilson768e1592016-01-21 17:32:43 +000095 interval_tree_insert(&mo->it, &mo->mn->objects);
96 mo->attached = true;
97}
Chris Wilsonec8b0dd2014-07-21 13:21:23 +010098
Chris Wilson768e1592016-01-21 17:32:43 +000099static void del_object(struct i915_mmu_object *mo)
100{
101 if (!mo->attached)
102 return;
103
104 interval_tree_remove(&mo->it, &mo->mn->objects);
105 mo->attached = false;
Chris Wilsonec8b0dd2014-07-21 13:21:23 +0100106}
107
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100108static void i915_gem_userptr_mn_invalidate_range_start(struct mmu_notifier *_mn,
109 struct mm_struct *mm,
110 unsigned long start,
111 unsigned long end)
112{
Chris Wilson380996a2015-10-01 12:34:47 +0100113 struct i915_mmu_notifier *mn =
114 container_of(_mn, struct i915_mmu_notifier, mn);
115 struct i915_mmu_object *mo;
Chris Wilson768e1592016-01-21 17:32:43 +0000116 struct interval_tree_node *it;
117 LIST_HEAD(cancelled);
118
119 if (RB_EMPTY_ROOT(&mn->objects))
120 return;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100121
Chris Wilson380996a2015-10-01 12:34:47 +0100122 /* interval ranges are inclusive, but invalidate range is exclusive */
123 end--;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100124
Chris Wilson380996a2015-10-01 12:34:47 +0100125 spin_lock(&mn->lock);
Chris Wilson768e1592016-01-21 17:32:43 +0000126 it = interval_tree_iter_first(&mn->objects, start, end);
127 while (it) {
128 /* The mmu_object is released late when destroying the
129 * GEM object so it is entirely possible to gain a
130 * reference on an object in the process of being freed
131 * since our serialisation is via the spinlock and not
132 * the struct_mutex - and consequently use it after it
133 * is freed and then double free it. To prevent that
134 * use-after-free we only acquire a reference on the
135 * object if it is not in the process of being destroyed.
136 */
137 mo = container_of(it, struct i915_mmu_object, it);
138 if (kref_get_unless_zero(&mo->obj->base.refcount))
Chris Wilson393afc22016-04-05 14:59:59 +0100139 queue_work(mn->wq, &mo->work);
Michał Winiarski460822b2015-02-03 15:48:17 +0100140
Chris Wilson768e1592016-01-21 17:32:43 +0000141 list_add(&mo->link, &cancelled);
142 it = interval_tree_iter_next(it, start, end);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100143 }
Chris Wilson768e1592016-01-21 17:32:43 +0000144 list_for_each_entry(mo, &cancelled, link)
145 del_object(mo);
Chris Wilson380996a2015-10-01 12:34:47 +0100146 spin_unlock(&mn->lock);
Chris Wilson393afc22016-04-05 14:59:59 +0100147
148 flush_workqueue(mn->wq);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100149}
150
151static const struct mmu_notifier_ops i915_gem_userptr_notifier = {
152 .invalidate_range_start = i915_gem_userptr_mn_invalidate_range_start,
153};
154
155static struct i915_mmu_notifier *
Chris Wilsonad46cb52014-08-07 14:20:40 +0100156i915_mmu_notifier_create(struct mm_struct *mm)
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100157{
Chris Wilsonad46cb52014-08-07 14:20:40 +0100158 struct i915_mmu_notifier *mn;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100159 int ret;
160
Chris Wilsonad46cb52014-08-07 14:20:40 +0100161 mn = kmalloc(sizeof(*mn), GFP_KERNEL);
162 if (mn == NULL)
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100163 return ERR_PTR(-ENOMEM);
164
Chris Wilsonad46cb52014-08-07 14:20:40 +0100165 spin_lock_init(&mn->lock);
166 mn->mn.ops = &i915_gem_userptr_notifier;
167 mn->objects = RB_ROOT;
Chris Wilson393afc22016-04-05 14:59:59 +0100168 mn->wq = alloc_workqueue("i915-userptr-release", WQ_UNBOUND, 0);
169 if (mn->wq == NULL) {
170 kfree(mn);
171 return ERR_PTR(-ENOMEM);
172 }
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100173
Chris Wilsonad46cb52014-08-07 14:20:40 +0100174 /* Protected by mmap_sem (write-lock) */
175 ret = __mmu_notifier_register(&mn->mn, mm);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100176 if (ret) {
Chris Wilson393afc22016-04-05 14:59:59 +0100177 destroy_workqueue(mn->wq);
Chris Wilsonad46cb52014-08-07 14:20:40 +0100178 kfree(mn);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100179 return ERR_PTR(ret);
180 }
181
Chris Wilsonad46cb52014-08-07 14:20:40 +0100182 return mn;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100183}
184
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100185static void
186i915_gem_userptr_release__mmu_notifier(struct drm_i915_gem_object *obj)
187{
Chris Wilsonad46cb52014-08-07 14:20:40 +0100188 struct i915_mmu_object *mo;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100189
Chris Wilsonad46cb52014-08-07 14:20:40 +0100190 mo = obj->userptr.mmu_object;
191 if (mo == NULL)
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100192 return;
193
Chris Wilson768e1592016-01-21 17:32:43 +0000194 spin_lock(&mo->mn->lock);
195 del_object(mo);
196 spin_unlock(&mo->mn->lock);
Chris Wilsonad46cb52014-08-07 14:20:40 +0100197 kfree(mo);
198
199 obj->userptr.mmu_object = NULL;
200}
201
202static struct i915_mmu_notifier *
203i915_mmu_notifier_find(struct i915_mm_struct *mm)
204{
Chris Wilsone9681362014-09-26 10:31:02 +0100205 struct i915_mmu_notifier *mn = mm->mn;
206
207 mn = mm->mn;
208 if (mn)
209 return mn;
210
211 down_write(&mm->mm->mmap_sem);
Chris Wilsonf470b192016-04-05 15:00:01 +0100212 mutex_lock(&mm->i915->mm_lock);
Chris Wilsone9681362014-09-26 10:31:02 +0100213 if ((mn = mm->mn) == NULL) {
214 mn = i915_mmu_notifier_create(mm->mm);
215 if (!IS_ERR(mn))
216 mm->mn = mn;
Chris Wilsonad46cb52014-08-07 14:20:40 +0100217 }
Chris Wilsonf470b192016-04-05 15:00:01 +0100218 mutex_unlock(&mm->i915->mm_lock);
Chris Wilsone9681362014-09-26 10:31:02 +0100219 up_write(&mm->mm->mmap_sem);
220
221 return mn;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100222}
223
224static int
225i915_gem_userptr_init__mmu_notifier(struct drm_i915_gem_object *obj,
226 unsigned flags)
227{
Chris Wilsonad46cb52014-08-07 14:20:40 +0100228 struct i915_mmu_notifier *mn;
229 struct i915_mmu_object *mo;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100230
231 if (flags & I915_USERPTR_UNSYNCHRONIZED)
232 return capable(CAP_SYS_ADMIN) ? 0 : -EPERM;
233
Chris Wilsonad46cb52014-08-07 14:20:40 +0100234 if (WARN_ON(obj->userptr.mm == NULL))
235 return -EINVAL;
236
237 mn = i915_mmu_notifier_find(obj->userptr.mm);
238 if (IS_ERR(mn))
239 return PTR_ERR(mn);
240
241 mo = kzalloc(sizeof(*mo), GFP_KERNEL);
242 if (mo == NULL)
243 return -ENOMEM;
244
245 mo->mn = mn;
Chris Wilsonad46cb52014-08-07 14:20:40 +0100246 mo->obj = obj;
Chris Wilson768e1592016-01-21 17:32:43 +0000247 mo->it.start = obj->userptr.ptr;
248 mo->it.last = obj->userptr.ptr + obj->base.size - 1;
249 INIT_WORK(&mo->work, cancel_userptr);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100250
Chris Wilsonad46cb52014-08-07 14:20:40 +0100251 obj->userptr.mmu_object = mo;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100252 return 0;
Chris Wilsonad46cb52014-08-07 14:20:40 +0100253}
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100254
Chris Wilsonad46cb52014-08-07 14:20:40 +0100255static void
256i915_mmu_notifier_free(struct i915_mmu_notifier *mn,
257 struct mm_struct *mm)
258{
259 if (mn == NULL)
260 return;
261
262 mmu_notifier_unregister(&mn->mn, mm);
Chris Wilson393afc22016-04-05 14:59:59 +0100263 destroy_workqueue(mn->wq);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100264 kfree(mn);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100265}
266
267#else
268
/* Without CONFIG_MMU_NOTIFIER there is no tracking state to release. */
static void
i915_gem_userptr_release__mmu_notifier(struct drm_i915_gem_object *obj)
{
}
273
274static int
275i915_gem_userptr_init__mmu_notifier(struct drm_i915_gem_object *obj,
276 unsigned flags)
277{
278 if ((flags & I915_USERPTR_UNSYNCHRONIZED) == 0)
279 return -ENODEV;
280
281 if (!capable(CAP_SYS_ADMIN))
282 return -EPERM;
283
284 return 0;
285}
Chris Wilsonad46cb52014-08-07 14:20:40 +0100286
/* Without CONFIG_MMU_NOTIFIER no notifier is ever created; nothing to free. */
static void
i915_mmu_notifier_free(struct i915_mmu_notifier *mn,
		       struct mm_struct *mm)
{
}
292
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100293#endif
294
Chris Wilsonad46cb52014-08-07 14:20:40 +0100295static struct i915_mm_struct *
296__i915_mm_struct_find(struct drm_i915_private *dev_priv, struct mm_struct *real)
297{
298 struct i915_mm_struct *mm;
299
300 /* Protected by dev_priv->mm_lock */
301 hash_for_each_possible(dev_priv->mm_structs, mm, node, (unsigned long)real)
302 if (mm->mm == real)
303 return mm;
304
305 return NULL;
306}
307
308static int
309i915_gem_userptr_init__mm_struct(struct drm_i915_gem_object *obj)
310{
311 struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
312 struct i915_mm_struct *mm;
313 int ret = 0;
314
315 /* During release of the GEM object we hold the struct_mutex. This
316 * precludes us from calling mmput() at that time as that may be
317 * the last reference and so call exit_mmap(). exit_mmap() will
318 * attempt to reap the vma, and if we were holding a GTT mmap
319 * would then call drm_gem_vm_close() and attempt to reacquire
320 * the struct mutex. So in order to avoid that recursion, we have
321 * to defer releasing the mm reference until after we drop the
322 * struct_mutex, i.e. we need to schedule a worker to do the clean
323 * up.
324 */
325 mutex_lock(&dev_priv->mm_lock);
326 mm = __i915_mm_struct_find(dev_priv, current->mm);
327 if (mm == NULL) {
328 mm = kmalloc(sizeof(*mm), GFP_KERNEL);
329 if (mm == NULL) {
330 ret = -ENOMEM;
331 goto out;
332 }
333
334 kref_init(&mm->kref);
Chris Wilsonf470b192016-04-05 15:00:01 +0100335 mm->i915 = to_i915(obj->base.dev);
Chris Wilsonad46cb52014-08-07 14:20:40 +0100336
337 mm->mm = current->mm;
Vegard Nossumf1f10072017-02-27 14:30:07 -0800338 mmgrab(current->mm);
Chris Wilsonad46cb52014-08-07 14:20:40 +0100339
340 mm->mn = NULL;
341
342 /* Protected by dev_priv->mm_lock */
343 hash_add(dev_priv->mm_structs,
344 &mm->node, (unsigned long)mm->mm);
345 } else
346 kref_get(&mm->kref);
347
348 obj->userptr.mm = mm;
349out:
350 mutex_unlock(&dev_priv->mm_lock);
351 return ret;
352}
353
354static void
355__i915_mm_struct_free__worker(struct work_struct *work)
356{
357 struct i915_mm_struct *mm = container_of(work, typeof(*mm), work);
358 i915_mmu_notifier_free(mm->mn, mm->mm);
359 mmdrop(mm->mm);
360 kfree(mm);
361}
362
363static void
364__i915_mm_struct_free(struct kref *kref)
365{
366 struct i915_mm_struct *mm = container_of(kref, typeof(*mm), kref);
367
368 /* Protected by dev_priv->mm_lock */
369 hash_del(&mm->node);
Chris Wilsonf470b192016-04-05 15:00:01 +0100370 mutex_unlock(&mm->i915->mm_lock);
Chris Wilsonad46cb52014-08-07 14:20:40 +0100371
372 INIT_WORK(&mm->work, __i915_mm_struct_free__worker);
373 schedule_work(&mm->work);
374}
375
376static void
377i915_gem_userptr_release__mm_struct(struct drm_i915_gem_object *obj)
378{
379 if (obj->userptr.mm == NULL)
380 return;
381
382 kref_put_mutex(&obj->userptr.mm->kref,
383 __i915_mm_struct_free,
384 &to_i915(obj->base.dev)->mm_lock);
385 obj->userptr.mm = NULL;
386}
387
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100388struct get_pages_work {
389 struct work_struct work;
390 struct drm_i915_gem_object *obj;
391 struct task_struct *task;
392};
393
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100394#if IS_ENABLED(CONFIG_SWIOTLB)
395#define swiotlb_active() swiotlb_nr_tbl()
396#else
397#define swiotlb_active() 0
398#endif
399
400static int
401st_set_pages(struct sg_table **st, struct page **pvec, int num_pages)
402{
403 struct scatterlist *sg;
404 int ret, n;
405
406 *st = kmalloc(sizeof(**st), GFP_KERNEL);
407 if (*st == NULL)
408 return -ENOMEM;
409
410 if (swiotlb_active()) {
411 ret = sg_alloc_table(*st, num_pages, GFP_KERNEL);
412 if (ret)
413 goto err;
414
415 for_each_sg((*st)->sgl, sg, num_pages, n)
416 sg_set_page(sg, pvec[n], PAGE_SIZE, 0);
417 } else {
418 ret = sg_alloc_table_from_pages(*st, pvec, num_pages,
419 0, num_pages << PAGE_SHIFT,
420 GFP_KERNEL);
421 if (ret)
422 goto err;
423 }
424
425 return 0;
426
427err:
428 kfree(*st);
429 *st = NULL;
430 return ret;
431}
432
/*
 * Build a scatter-gather table for the pinned pages in @pvec and prepare it
 * for GTT use via i915_gem_gtt_prepare_pages().
 *
 * Returns the table, or an ERR_PTR if either step fails; on failure the
 * table is freed again. The page references in @pvec are not touched here.
 */
static struct sg_table *
__i915_gem_userptr_set_pages(struct drm_i915_gem_object *obj,
			     struct page **pvec, int num_pages)
{
	struct sg_table *table;
	int err;

	err = st_set_pages(&table, pvec, num_pages);
	if (err)
		return ERR_PTR(err);

	err = i915_gem_gtt_prepare_pages(obj, table);
	if (!err)
		return table;

	sg_free_table(table);
	kfree(table);
	return ERR_PTR(err);
}
453
Chris Wilson380996a2015-10-01 12:34:47 +0100454static int
Chris Wilsone4b946b2015-10-01 12:34:46 +0100455__i915_gem_userptr_set_active(struct drm_i915_gem_object *obj,
456 bool value)
457{
Chris Wilson380996a2015-10-01 12:34:47 +0100458 int ret = 0;
459
Chris Wilsone4b946b2015-10-01 12:34:46 +0100460 /* During mm_invalidate_range we need to cancel any userptr that
461 * overlaps the range being invalidated. Doing so requires the
462 * struct_mutex, and that risks recursion. In order to cause
463 * recursion, the user must alias the userptr address space with
464 * a GTT mmapping (possible with a MAP_FIXED) - then when we have
465 * to invalidate that mmaping, mm_invalidate_range is called with
466 * the userptr address *and* the struct_mutex held. To prevent that
467 * we set a flag under the i915_mmu_notifier spinlock to indicate
468 * whether this object is valid.
469 */
470#if defined(CONFIG_MMU_NOTIFIER)
471 if (obj->userptr.mmu_object == NULL)
Chris Wilson380996a2015-10-01 12:34:47 +0100472 return 0;
Chris Wilsone4b946b2015-10-01 12:34:46 +0100473
474 spin_lock(&obj->userptr.mmu_object->mn->lock);
Chris Wilson380996a2015-10-01 12:34:47 +0100475 /* In order to serialise get_pages with an outstanding
476 * cancel_userptr, we must drop the struct_mutex and try again.
477 */
Chris Wilson768e1592016-01-21 17:32:43 +0000478 if (!value)
479 del_object(obj->userptr.mmu_object);
480 else if (!work_pending(&obj->userptr.mmu_object->work))
481 add_object(obj->userptr.mmu_object);
Chris Wilson380996a2015-10-01 12:34:47 +0100482 else
483 ret = -EAGAIN;
Chris Wilsone4b946b2015-10-01 12:34:46 +0100484 spin_unlock(&obj->userptr.mmu_object->mn->lock);
485#endif
Chris Wilson380996a2015-10-01 12:34:47 +0100486
487 return ret;
Chris Wilsone4b946b2015-10-01 12:34:46 +0100488}
489
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100490static void
491__i915_gem_userptr_get_pages_worker(struct work_struct *_work)
492{
493 struct get_pages_work *work = container_of(_work, typeof(*work), work);
494 struct drm_i915_gem_object *obj = work->obj;
Chris Wilson68d6c842015-10-01 12:34:45 +0100495 const int npages = obj->base.size >> PAGE_SHIFT;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100496 struct page **pvec;
497 int pinned, ret;
498
499 ret = -ENOMEM;
500 pinned = 0;
501
Chris Wilsonf2a85e12016-04-08 12:11:13 +0100502 pvec = drm_malloc_gfp(npages, sizeof(struct page *), GFP_TEMPORARY);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100503 if (pvec != NULL) {
Chris Wilsonad46cb52014-08-07 14:20:40 +0100504 struct mm_struct *mm = obj->userptr.mm->mm;
Lorenzo Stoakes9beae1e2016-10-13 01:20:17 +0100505 unsigned int flags = 0;
506
507 if (!obj->userptr.read_only)
508 flags |= FOLL_WRITE;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100509
Chris Wilson40313f02016-04-05 15:00:00 +0100510 ret = -EFAULT;
Vegard Nossum388f7932017-02-27 14:30:13 -0800511 if (mmget_not_zero(mm)) {
Chris Wilson40313f02016-04-05 15:00:00 +0100512 down_read(&mm->mmap_sem);
513 while (pinned < npages) {
514 ret = get_user_pages_remote
515 (work->task, mm,
516 obj->userptr.ptr + pinned * PAGE_SIZE,
517 npages - pinned,
Lorenzo Stoakes9beae1e2016-10-13 01:20:17 +0100518 flags,
Lorenzo Stoakes5b56d492016-12-14 15:06:52 -0800519 pvec + pinned, NULL, NULL);
Chris Wilson40313f02016-04-05 15:00:00 +0100520 if (ret < 0)
521 break;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100522
Chris Wilson40313f02016-04-05 15:00:00 +0100523 pinned += ret;
524 }
525 up_read(&mm->mmap_sem);
526 mmput(mm);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100527 }
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100528 }
529
Chris Wilson1233e2d2016-10-28 13:58:37 +0100530 mutex_lock(&obj->mm.lock);
Chris Wilson68d6c842015-10-01 12:34:45 +0100531 if (obj->userptr.work == &work->work) {
Chris Wilson03ac84f2016-10-28 13:58:36 +0100532 struct sg_table *pages = ERR_PTR(ret);
533
Chris Wilson68d6c842015-10-01 12:34:45 +0100534 if (pinned == npages) {
Chris Wilson03ac84f2016-10-28 13:58:36 +0100535 pages = __i915_gem_userptr_set_pages(obj, pvec, npages);
536 if (!IS_ERR(pages)) {
537 __i915_gem_object_set_pages(obj, pages);
Chris Wilson68d6c842015-10-01 12:34:45 +0100538 pinned = 0;
Chris Wilson03ac84f2016-10-28 13:58:36 +0100539 pages = NULL;
Chris Wilson68d6c842015-10-01 12:34:45 +0100540 }
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100541 }
Chris Wilson03ac84f2016-10-28 13:58:36 +0100542
543 obj->userptr.work = ERR_CAST(pages);
Chris Wilson42953b32017-03-07 20:58:49 +0000544 if (IS_ERR(pages))
545 __i915_gem_userptr_set_active(obj, false);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100546 }
Chris Wilson1233e2d2016-10-28 13:58:37 +0100547 mutex_unlock(&obj->mm.lock);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100548
549 release_pages(pvec, pinned, 0);
550 drm_free_large(pvec);
551
Chris Wilsonf0cd5182016-10-28 13:58:43 +0100552 i915_gem_object_put(obj);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100553 put_task_struct(work->task);
554 kfree(work);
555}
556
Chris Wilson03ac84f2016-10-28 13:58:36 +0100557static struct sg_table *
Chris Wilsone4b946b2015-10-01 12:34:46 +0100558__i915_gem_userptr_get_pages_schedule(struct drm_i915_gem_object *obj,
559 bool *active)
560{
561 struct get_pages_work *work;
562
563 /* Spawn a worker so that we can acquire the
564 * user pages without holding our mutex. Access
565 * to the user pages requires mmap_sem, and we have
566 * a strict lock ordering of mmap_sem, struct_mutex -
567 * we already hold struct_mutex here and so cannot
568 * call gup without encountering a lock inversion.
569 *
570 * Userspace will keep on repeating the operation
571 * (thanks to EAGAIN) until either we hit the fast
572 * path or the worker completes. If the worker is
573 * cancelled or superseded, the task is still run
574 * but the results ignored. (This leads to
575 * complications that we may have a stray object
576 * refcount that we need to be wary of when
577 * checking for existing objects during creation.)
578 * If the worker encounters an error, it reports
579 * that error back to this function through
580 * obj->userptr.work = ERR_PTR.
581 */
Chris Wilsone4b946b2015-10-01 12:34:46 +0100582 work = kmalloc(sizeof(*work), GFP_KERNEL);
583 if (work == NULL)
Chris Wilson03ac84f2016-10-28 13:58:36 +0100584 return ERR_PTR(-ENOMEM);
Chris Wilsone4b946b2015-10-01 12:34:46 +0100585
586 obj->userptr.work = &work->work;
Chris Wilsone4b946b2015-10-01 12:34:46 +0100587
Chris Wilson25dc5562016-07-20 13:31:52 +0100588 work->obj = i915_gem_object_get(obj);
Chris Wilsone4b946b2015-10-01 12:34:46 +0100589
590 work->task = current;
591 get_task_struct(work->task);
592
593 INIT_WORK(&work->work, __i915_gem_userptr_get_pages_worker);
594 schedule_work(&work->work);
595
596 *active = true;
Chris Wilson03ac84f2016-10-28 13:58:36 +0100597 return ERR_PTR(-EAGAIN);
Chris Wilsone4b946b2015-10-01 12:34:46 +0100598}
599
Chris Wilson03ac84f2016-10-28 13:58:36 +0100600static struct sg_table *
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100601i915_gem_userptr_get_pages(struct drm_i915_gem_object *obj)
602{
603 const int num_pages = obj->base.size >> PAGE_SHIFT;
604 struct page **pvec;
Chris Wilson03ac84f2016-10-28 13:58:36 +0100605 struct sg_table *pages;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100606 int pinned, ret;
Chris Wilsone4b946b2015-10-01 12:34:46 +0100607 bool active;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100608
609 /* If userspace should engineer that these pages are replaced in
610 * the vma between us binding this page into the GTT and completion
611 * of rendering... Their loss. If they change the mapping of their
612 * pages they need to create a new bo to point to the new vma.
613 *
614 * However, that still leaves open the possibility of the vma
615 * being copied upon fork. Which falls under the same userspace
616 * synchronisation issue as a regular bo, except that this time
617 * the process may not be expecting that a particular piece of
618 * memory is tied to the GPU.
619 *
620 * Fortunately, we can hook into the mmu_notifier in order to
621 * discard the page references prior to anything nasty happening
622 * to the vma (discard or cloning) which should prevent the more
623 * egregious cases from causing harm.
624 */
Chris Wilson364c8172016-08-18 17:16:58 +0100625
626 if (obj->userptr.work) {
Chris Wilsone4b946b2015-10-01 12:34:46 +0100627 /* active flag should still be held for the pending work */
Chris Wilson364c8172016-08-18 17:16:58 +0100628 if (IS_ERR(obj->userptr.work))
Chris Wilson03ac84f2016-10-28 13:58:36 +0100629 return ERR_CAST(obj->userptr.work);
Chris Wilson364c8172016-08-18 17:16:58 +0100630 else
Chris Wilson03ac84f2016-10-28 13:58:36 +0100631 return ERR_PTR(-EAGAIN);
Chris Wilson364c8172016-08-18 17:16:58 +0100632 }
Chris Wilsone4b946b2015-10-01 12:34:46 +0100633
634 /* Let the mmu-notifier know that we have begun and need cancellation */
Chris Wilson380996a2015-10-01 12:34:47 +0100635 ret = __i915_gem_userptr_set_active(obj, true);
636 if (ret)
Chris Wilson03ac84f2016-10-28 13:58:36 +0100637 return ERR_PTR(ret);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100638
639 pvec = NULL;
640 pinned = 0;
Chris Wilsonad46cb52014-08-07 14:20:40 +0100641 if (obj->userptr.mm->mm == current->mm) {
Chris Wilsonf2a85e12016-04-08 12:11:13 +0100642 pvec = drm_malloc_gfp(num_pages, sizeof(struct page *),
643 GFP_TEMPORARY);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100644 if (pvec == NULL) {
Chris Wilsonf2a85e12016-04-08 12:11:13 +0100645 __i915_gem_userptr_set_active(obj, false);
Chris Wilson03ac84f2016-10-28 13:58:36 +0100646 return ERR_PTR(-ENOMEM);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100647 }
648
649 pinned = __get_user_pages_fast(obj->userptr.ptr, num_pages,
650 !obj->userptr.read_only, pvec);
651 }
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100652
Chris Wilsone4b946b2015-10-01 12:34:46 +0100653 active = false;
654 if (pinned < 0)
Chris Wilson03ac84f2016-10-28 13:58:36 +0100655 pages = ERR_PTR(pinned), pinned = 0;
Chris Wilsone4b946b2015-10-01 12:34:46 +0100656 else if (pinned < num_pages)
Chris Wilson03ac84f2016-10-28 13:58:36 +0100657 pages = __i915_gem_userptr_get_pages_schedule(obj, &active);
Chris Wilsone4b946b2015-10-01 12:34:46 +0100658 else
Chris Wilson03ac84f2016-10-28 13:58:36 +0100659 pages = __i915_gem_userptr_set_pages(obj, pvec, num_pages);
660 if (IS_ERR(pages)) {
Chris Wilsone4b946b2015-10-01 12:34:46 +0100661 __i915_gem_userptr_set_active(obj, active);
662 release_pages(pvec, pinned, 0);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100663 }
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100664 drm_free_large(pvec);
Chris Wilson03ac84f2016-10-28 13:58:36 +0100665 return pages;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100666}
667
668static void
Chris Wilson03ac84f2016-10-28 13:58:36 +0100669i915_gem_userptr_put_pages(struct drm_i915_gem_object *obj,
670 struct sg_table *pages)
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100671{
Dave Gordon85d12252016-05-20 11:54:06 +0100672 struct sgt_iter sgt_iter;
673 struct page *page;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100674
675 BUG_ON(obj->userptr.work != NULL);
Chris Wilsone4b946b2015-10-01 12:34:46 +0100676 __i915_gem_userptr_set_active(obj, false);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100677
Chris Wilsona4f5ea62016-10-28 13:58:35 +0100678 if (obj->mm.madv != I915_MADV_WILLNEED)
679 obj->mm.dirty = false;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100680
Chris Wilson03ac84f2016-10-28 13:58:36 +0100681 i915_gem_gtt_finish_pages(obj, pages);
Imre Deake2273302015-07-09 12:59:05 +0300682
Chris Wilson03ac84f2016-10-28 13:58:36 +0100683 for_each_sgt_page(page, sgt_iter, pages) {
Chris Wilsona4f5ea62016-10-28 13:58:35 +0100684 if (obj->mm.dirty)
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100685 set_page_dirty(page);
686
687 mark_page_accessed(page);
Kirill A. Shutemov09cbfea2016-04-01 15:29:47 +0300688 put_page(page);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100689 }
Chris Wilsona4f5ea62016-10-28 13:58:35 +0100690 obj->mm.dirty = false;
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100691
Chris Wilson03ac84f2016-10-28 13:58:36 +0100692 sg_free_table(pages);
693 kfree(pages);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100694}
695
/*
 * release hook: tear down the mmu-notifier tracking first, then drop the
 * object's reference on its address-space tracking structure.
 */
static void
i915_gem_userptr_release(struct drm_i915_gem_object *obj)
{
	i915_gem_userptr_release__mmu_notifier(obj);
	i915_gem_userptr_release__mm_struct(obj);
}
702
703static int
704i915_gem_userptr_dmabuf_export(struct drm_i915_gem_object *obj)
705{
Chris Wilsonad46cb52014-08-07 14:20:40 +0100706 if (obj->userptr.mmu_object)
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100707 return 0;
708
709 return i915_gem_userptr_init__mmu_notifier(obj, 0);
710}
711
712static const struct drm_i915_gem_object_ops i915_gem_userptr_ops = {
Tvrtko Ursulin3599a912016-11-01 14:44:10 +0000713 .flags = I915_GEM_OBJECT_HAS_STRUCT_PAGE |
714 I915_GEM_OBJECT_IS_SHRINKABLE,
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100715 .get_pages = i915_gem_userptr_get_pages,
716 .put_pages = i915_gem_userptr_put_pages,
Chris Wilsonde472662016-01-22 18:32:31 +0000717 .dmabuf_export = i915_gem_userptr_dmabuf_export,
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100718 .release = i915_gem_userptr_release,
719};
720
/**
 * Creates a new mm object that wraps some normal memory from the process
 * context - user memory.
 *
 * We impose several restrictions upon the memory being mapped
 * into the GPU.
 * 1. It must be page aligned (both start/end addresses, i.e. ptr and size).
 * 2. It must be normal system memory, not a pointer into another map of IO
 *    space (e.g. it must not be a GTT mmapping of another object).
 * 3. We only allow a bo as large as we could in theory map into the GTT,
 *    that is we limit the size to the total size of the GTT.
 * 4. The bo is marked as being snoopable. The backing pages are left
 *    accessible directly by the CPU, but reads and writes by the GPU may
 *    incur the cost of a snoop (unless you have an LLC architecture).
 *
 * Synchronisation between multiple users and the GPU is left to userspace
 * through the normal set-domain-ioctl. The kernel will enforce that the
 * GPU relinquishes the VMA before it is returned back to the system
 * i.e. upon free(), munmap() or process termination. However, the userspace
 * malloc() library may not immediately relinquish the VMA after free() and
 * instead reuse it whilst the GPU is still reading and writing to the VMA.
 * Caveat emptor.
 *
 * Also note that the object created here is not currently a "first class"
 * object, in that several ioctls are banned. These are the CPU access
 * ioctls: mmap(), pwrite and pread. In practice, you are expected to use
 * direct access via your pointer rather than use those ioctls. Another
 * restriction is that we do not allow userptr surfaces to be pinned to the
 * hardware and so we reject any attempt to create a framebuffer out of a
 * userptr.
 *
 * If you think this is a good interface to use to pass GPU memory between
 * drivers, please use dma-buf instead. In fact, wherever possible use
 * dma-buf instead.
 */
756int
757i915_gem_userptr_ioctl(struct drm_device *dev, void *data, struct drm_file *file)
758{
Tvrtko Ursulin0031fb92016-11-04 14:42:44 +0000759 struct drm_i915_private *dev_priv = to_i915(dev);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100760 struct drm_i915_gem_userptr *args = data;
761 struct drm_i915_gem_object *obj;
762 int ret;
763 u32 handle;
764
Tvrtko Ursulin0031fb92016-11-04 14:42:44 +0000765 if (!HAS_LLC(dev_priv) && !HAS_SNOOP(dev_priv)) {
Tvrtko Ursulinca377802016-03-02 12:10:31 +0000766 /* We cannot support coherent userptr objects on hw without
767 * LLC and broken snooping.
768 */
769 return -ENODEV;
770 }
771
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100772 if (args->flags & ~(I915_USERPTR_READ_ONLY |
773 I915_USERPTR_UNSYNCHRONIZED))
774 return -EINVAL;
775
776 if (offset_in_page(args->user_ptr | args->user_size))
777 return -EINVAL;
778
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100779 if (!access_ok(args->flags & I915_USERPTR_READ_ONLY ? VERIFY_READ : VERIFY_WRITE,
780 (char __user *)(unsigned long)args->user_ptr, args->user_size))
781 return -EFAULT;
782
783 if (args->flags & I915_USERPTR_READ_ONLY) {
784 /* On almost all of the current hw, we cannot tell the GPU that a
785 * page is readonly, so this is just a placeholder in the uAPI.
786 */
787 return -ENODEV;
788 }
789
Tvrtko Ursulin187685c2016-12-01 14:16:36 +0000790 obj = i915_gem_object_alloc(dev_priv);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100791 if (obj == NULL)
792 return -ENOMEM;
793
794 drm_gem_private_object_init(dev, &obj->base, args->user_size);
795 i915_gem_object_init(obj, &i915_gem_userptr_ops);
796 obj->cache_level = I915_CACHE_LLC;
797 obj->base.write_domain = I915_GEM_DOMAIN_CPU;
798 obj->base.read_domains = I915_GEM_DOMAIN_CPU;
799
800 obj->userptr.ptr = args->user_ptr;
801 obj->userptr.read_only = !!(args->flags & I915_USERPTR_READ_ONLY);
802
803 /* And keep a pointer to the current->mm for resolving the user pages
804 * at binding. This means that we need to hook into the mmu_notifier
805 * in order to detect if the mmu is destroyed.
806 */
Chris Wilsonad46cb52014-08-07 14:20:40 +0100807 ret = i915_gem_userptr_init__mm_struct(obj);
808 if (ret == 0)
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100809 ret = i915_gem_userptr_init__mmu_notifier(obj, args->flags);
810 if (ret == 0)
811 ret = drm_gem_handle_create(file, &obj->base, &handle);
812
813 /* drop reference from allocate - handle holds it now */
Chris Wilsonf0cd5182016-10-28 13:58:43 +0100814 i915_gem_object_put(obj);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100815 if (ret)
816 return ret;
817
818 args->handle = handle;
819 return 0;
820}
821
Chris Wilson72778cb2016-05-19 16:17:16 +0100822void i915_gem_init_userptr(struct drm_i915_private *dev_priv)
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100823{
Chris Wilsonad46cb52014-08-07 14:20:40 +0100824 mutex_init(&dev_priv->mm_lock);
825 hash_init(dev_priv->mm_structs);
Chris Wilson5cc9ed42014-05-16 14:22:37 +0100826}