/*
 * Copyright © 2008,2010 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 *
 * Authors:
 *    Eric Anholt <eric@anholt.net>
 *    Chris Wilson <chris@chris-wilson.co.uk>
 *
 */

#include <drm/drmP.h>
#include <drm/i915_drm.h>
#include "i915_drv.h"
#include "i915_trace.h"
#include "intel_drv.h"
#include <linux/dma_remapping.h>

#define __EXEC_OBJECT_HAS_PIN (1<<31)
#define __EXEC_OBJECT_HAS_FENCE (1<<30)

struct eb_vmas {
        struct list_head vmas;
        int and;
        union {
                struct i915_vma *lut[0];
                struct hlist_head buckets[0];
        };
};

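/*
 * eb_create() allocates the handle->vma lookup structure for this
 * execbuffer. With I915_EXEC_HANDLE_LUT userspace promises that the
 * handles are dense indices, so a flat lut[] sized by buffer_count is
 * enough; otherwise (or if that allocation fails) we fall back to a
 * power-of-two hash table of hlist buckets, with the mask kept in
 * eb->and.
 */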
static struct eb_vmas *
eb_create(struct drm_i915_gem_execbuffer2 *args)
{
        struct eb_vmas *eb = NULL;

        if (args->flags & I915_EXEC_HANDLE_LUT) {
                unsigned size = args->buffer_count;
                size *= sizeof(struct i915_vma *);
                size += sizeof(struct eb_vmas);
                eb = kmalloc(size, GFP_TEMPORARY | __GFP_NOWARN | __GFP_NORETRY);
        }

        if (eb == NULL) {
                unsigned size = args->buffer_count;
                unsigned count = PAGE_SIZE / sizeof(struct hlist_head) / 2;
                BUILD_BUG_ON_NOT_POWER_OF_2(PAGE_SIZE / sizeof(struct hlist_head));
                while (count > 2*size)
                        count >>= 1;
                eb = kzalloc(count*sizeof(struct hlist_head) +
                             sizeof(struct eb_vmas),
                             GFP_TEMPORARY);
                if (eb == NULL)
                        return eb;

                eb->and = count - 1;
        } else
                eb->and = -args->buffer_count;

        INIT_LIST_HEAD(&eb->vmas);
        return eb;
}

static void
eb_reset(struct eb_vmas *eb)
{
        if (eb->and >= 0)
                memset(eb->buckets, 0, (eb->and+1)*sizeof(struct hlist_head));
}

static int
eb_lookup_vmas(struct eb_vmas *eb,
               struct drm_i915_gem_exec_object2 *exec,
               const struct drm_i915_gem_execbuffer2 *args,
               struct i915_address_space *vm,
               struct drm_file *file)
{
        struct drm_i915_private *dev_priv = vm->dev->dev_private;
        struct drm_i915_gem_object *obj;
        struct list_head objects;
        int i, ret;

        INIT_LIST_HEAD(&objects);
        spin_lock(&file->table_lock);
        /* Grab a reference to the object and release the lock so we can lookup
         * or create the VMA without using GFP_ATOMIC */
        for (i = 0; i < args->buffer_count; i++) {
                obj = to_intel_bo(idr_find(&file->object_idr, exec[i].handle));
                if (obj == NULL) {
                        spin_unlock(&file->table_lock);
                        DRM_DEBUG("Invalid object handle %d at index %d\n",
                                  exec[i].handle, i);
                        ret = -ENOENT;
                        goto err;
                }

                if (!list_empty(&obj->obj_exec_link)) {
                        spin_unlock(&file->table_lock);
                        DRM_DEBUG("Object %p [handle %d, index %d] appears more than once in object list\n",
                                  obj, exec[i].handle, i);
                        ret = -EINVAL;
                        goto err;
                }

                drm_gem_object_reference(&obj->base);
                list_add_tail(&obj->obj_exec_link, &objects);
        }
        spin_unlock(&file->table_lock);

        i = 0;
        while (!list_empty(&objects)) {
                struct i915_vma *vma;
                struct i915_address_space *bind_vm = vm;

                if (exec[i].flags & EXEC_OBJECT_NEEDS_GTT &&
                    USES_FULL_PPGTT(vm->dev)) {
                        ret = -EINVAL;
                        goto err;
                }

                /* If we have secure dispatch, or the userspace assures us that
                 * they know what they're doing, use the GGTT VM.
                 */
                if (((args->flags & I915_EXEC_SECURE) &&
                    (i == (args->buffer_count - 1))))
                        bind_vm = &dev_priv->gtt.base;

                obj = list_first_entry(&objects,
                                       struct drm_i915_gem_object,
                                       obj_exec_link);

                /*
                 * NOTE: We can leak any vmas created here when something fails
                 * later on. But that's no issue since vma_unbind can deal with
                 * vmas which are not actually bound. And since only
                 * lookup_or_create exists as an interface to get at the vma
                 * from the (obj, vm) we don't run the risk of creating
                 * duplicated vmas for the same vm.
                 */
                vma = i915_gem_obj_lookup_or_create_vma(obj, bind_vm);
                if (IS_ERR(vma)) {
                        DRM_DEBUG("Failed to lookup VMA\n");
                        ret = PTR_ERR(vma);
                        goto err;
                }

                /* Transfer ownership from the objects list to the vmas list. */
                list_add_tail(&vma->exec_list, &eb->vmas);
                list_del_init(&obj->obj_exec_link);

                vma->exec_entry = &exec[i];
                if (eb->and < 0) {
                        eb->lut[i] = vma;
                } else {
                        uint32_t handle = args->flags & I915_EXEC_HANDLE_LUT ? i : exec[i].handle;
                        vma->exec_handle = handle;
                        hlist_add_head(&vma->exec_node,
                                       &eb->buckets[handle & eb->and]);
                }
                ++i;
        }

        return 0;


err:
        while (!list_empty(&objects)) {
                obj = list_first_entry(&objects,
                                       struct drm_i915_gem_object,
                                       obj_exec_link);
                list_del_init(&obj->obj_exec_link);
                drm_gem_object_unreference(&obj->base);
        }
        /*
         * Objects already transferred to the vmas list will be unreferenced by
         * eb_destroy.
         */

        return ret;
}

static struct i915_vma *eb_get_vma(struct eb_vmas *eb, unsigned long handle)
{
        if (eb->and < 0) {
                if (handle >= -eb->and)
                        return NULL;
                return eb->lut[handle];
        } else {
                struct hlist_head *head;
                struct hlist_node *node;

                head = &eb->buckets[handle & eb->and];
                hlist_for_each(node, head) {
                        struct i915_vma *vma;

                        vma = hlist_entry(node, struct i915_vma, exec_node);
                        if (vma->exec_handle == handle)
                                return vma;
                }
                return NULL;
        }
}

static void
i915_gem_execbuffer_unreserve_vma(struct i915_vma *vma)
{
        struct drm_i915_gem_exec_object2 *entry;
        struct drm_i915_gem_object *obj = vma->obj;

        if (!drm_mm_node_allocated(&vma->node))
                return;

        entry = vma->exec_entry;

        if (entry->flags & __EXEC_OBJECT_HAS_FENCE)
                i915_gem_object_unpin_fence(obj);

        if (entry->flags & __EXEC_OBJECT_HAS_PIN)
                vma->pin_count--;

        entry->flags &= ~(__EXEC_OBJECT_HAS_FENCE | __EXEC_OBJECT_HAS_PIN);
}

static void eb_destroy(struct eb_vmas *eb)
{
        while (!list_empty(&eb->vmas)) {
                struct i915_vma *vma;

                vma = list_first_entry(&eb->vmas,
                                       struct i915_vma,
                                       exec_list);
                list_del_init(&vma->exec_list);
                i915_gem_execbuffer_unreserve_vma(vma);
                drm_gem_object_unreference(&vma->obj->base);
        }
        kfree(eb);
}

static inline int use_cpu_reloc(struct drm_i915_gem_object *obj)
{
        return (HAS_LLC(obj->base.dev) ||
                obj->base.write_domain == I915_GEM_DOMAIN_CPU ||
                !obj->map_and_fenceable ||
                obj->cache_level != I915_CACHE_NONE);
}

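/*
 * relocate_entry_cpu()/relocate_entry_gtt() write the relocated address
 * (reloc->delta + target_offset) into the batch, either through a kmap
 * of the object's pages or through an atomic WC mapping of the GGTT
 * aperture. On gen8+ the relocation is 64 bits wide, so the upper dword
 * is written as well, remapping first if it crosses a page boundary.
 */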
static int
relocate_entry_cpu(struct drm_i915_gem_object *obj,
                   struct drm_i915_gem_relocation_entry *reloc,
                   uint64_t target_offset)
{
        struct drm_device *dev = obj->base.dev;
        uint32_t page_offset = offset_in_page(reloc->offset);
        uint64_t delta = reloc->delta + target_offset;
        char *vaddr;
        int ret;

        ret = i915_gem_object_set_to_cpu_domain(obj, true);
        if (ret)
                return ret;

        vaddr = kmap_atomic(i915_gem_object_get_page(obj,
                                reloc->offset >> PAGE_SHIFT));
        *(uint32_t *)(vaddr + page_offset) = lower_32_bits(delta);

        if (INTEL_INFO(dev)->gen >= 8) {
                page_offset = offset_in_page(page_offset + sizeof(uint32_t));

                if (page_offset == 0) {
                        kunmap_atomic(vaddr);
                        vaddr = kmap_atomic(i915_gem_object_get_page(obj,
                            (reloc->offset + sizeof(uint32_t)) >> PAGE_SHIFT));
                }

                *(uint32_t *)(vaddr + page_offset) = upper_32_bits(delta);
        }

        kunmap_atomic(vaddr);

        return 0;
}

static int
relocate_entry_gtt(struct drm_i915_gem_object *obj,
                   struct drm_i915_gem_relocation_entry *reloc,
                   uint64_t target_offset)
{
        struct drm_device *dev = obj->base.dev;
        struct drm_i915_private *dev_priv = dev->dev_private;
        uint64_t delta = reloc->delta + target_offset;
        uint32_t __iomem *reloc_entry;
        void __iomem *reloc_page;
        int ret;

        ret = i915_gem_object_set_to_gtt_domain(obj, true);
        if (ret)
                return ret;

        ret = i915_gem_object_put_fence(obj);
        if (ret)
                return ret;

        /* Map the page containing the relocation we're going to perform. */
        reloc->offset += i915_gem_obj_ggtt_offset(obj);
        reloc_page = io_mapping_map_atomic_wc(dev_priv->gtt.mappable,
                                              reloc->offset & PAGE_MASK);
        reloc_entry = (uint32_t __iomem *)
                (reloc_page + offset_in_page(reloc->offset));
        iowrite32(lower_32_bits(delta), reloc_entry);

        if (INTEL_INFO(dev)->gen >= 8) {
                reloc_entry += 1;

                if (offset_in_page(reloc->offset + sizeof(uint32_t)) == 0) {
                        io_mapping_unmap_atomic(reloc_page);
                        reloc_page = io_mapping_map_atomic_wc(
                                        dev_priv->gtt.mappable,
                                        reloc->offset + sizeof(uint32_t));
                        reloc_entry = reloc_page;
                }

                iowrite32(upper_32_bits(delta), reloc_entry);
        }

        io_mapping_unmap_atomic(reloc_page);

        return 0;
}

static int
i915_gem_execbuffer_relocate_entry(struct drm_i915_gem_object *obj,
                                   struct eb_vmas *eb,
                                   struct drm_i915_gem_relocation_entry *reloc)
{
        struct drm_device *dev = obj->base.dev;
        struct drm_gem_object *target_obj;
        struct drm_i915_gem_object *target_i915_obj;
        struct i915_vma *target_vma;
        uint64_t target_offset;
        int ret;

        /* we already hold a reference to all valid objects */
        target_vma = eb_get_vma(eb, reloc->target_handle);
        if (unlikely(target_vma == NULL))
                return -ENOENT;
        target_i915_obj = target_vma->obj;
        target_obj = &target_vma->obj->base;

        target_offset = target_vma->node.start;

        /* Sandybridge PPGTT errata: We need a global gtt mapping for MI and
         * pipe_control writes because the gpu doesn't properly redirect them
         * through the ppgtt for non_secure batchbuffers. */
        if (unlikely(IS_GEN6(dev) &&
            reloc->write_domain == I915_GEM_DOMAIN_INSTRUCTION &&
            !target_i915_obj->has_global_gtt_mapping)) {
                struct i915_vma *vma =
                        list_first_entry(&target_i915_obj->vma_list,
                                         typeof(*vma), vma_link);
                vma->bind_vma(vma, target_i915_obj->cache_level, GLOBAL_BIND);
        }

        /* Validate that the target is in a valid r/w GPU domain */
        if (unlikely(reloc->write_domain & (reloc->write_domain - 1))) {
                DRM_DEBUG("reloc with multiple write domains: "
                          "obj %p target %d offset %d "
                          "read %08x write %08x",
                          obj, reloc->target_handle,
                          (int) reloc->offset,
                          reloc->read_domains,
                          reloc->write_domain);
                return -EINVAL;
        }
        if (unlikely((reloc->write_domain | reloc->read_domains)
                     & ~I915_GEM_GPU_DOMAINS)) {
                DRM_DEBUG("reloc with read/write non-GPU domains: "
                          "obj %p target %d offset %d "
                          "read %08x write %08x",
                          obj, reloc->target_handle,
                          (int) reloc->offset,
                          reloc->read_domains,
                          reloc->write_domain);
                return -EINVAL;
        }

        target_obj->pending_read_domains |= reloc->read_domains;
        target_obj->pending_write_domain |= reloc->write_domain;

        /* If the relocation already has the right value in it, no
         * more work needs to be done.
         */
        if (target_offset == reloc->presumed_offset)
                return 0;

        /* Check that the relocation address is valid... */
        if (unlikely(reloc->offset >
                obj->base.size - (INTEL_INFO(dev)->gen >= 8 ? 8 : 4))) {
                DRM_DEBUG("Relocation beyond object bounds: "
                          "obj %p target %d offset %d size %d.\n",
                          obj, reloc->target_handle,
                          (int) reloc->offset,
                          (int) obj->base.size);
                return -EINVAL;
        }
        if (unlikely(reloc->offset & 3)) {
                DRM_DEBUG("Relocation not 4-byte aligned: "
                          "obj %p target %d offset %d.\n",
                          obj, reloc->target_handle,
                          (int) reloc->offset);
                return -EINVAL;
        }

        /* We can't wait for rendering with pagefaults disabled */
        if (obj->active && in_atomic())
                return -EFAULT;

        if (use_cpu_reloc(obj))
                ret = relocate_entry_cpu(obj, reloc, target_offset);
        else
                ret = relocate_entry_gtt(obj, reloc, target_offset);

        if (ret)
                return ret;

        /* and update the user's relocation entry */
        reloc->presumed_offset = target_offset;

        return 0;
}

static int
i915_gem_execbuffer_relocate_vma(struct i915_vma *vma,
                                 struct eb_vmas *eb)
{
#define N_RELOC(x) ((x) / sizeof(struct drm_i915_gem_relocation_entry))
        struct drm_i915_gem_relocation_entry stack_reloc[N_RELOC(512)];
        struct drm_i915_gem_relocation_entry __user *user_relocs;
        struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
        int remain, ret;

        user_relocs = to_user_ptr(entry->relocs_ptr);

        remain = entry->relocation_count;
        while (remain) {
                struct drm_i915_gem_relocation_entry *r = stack_reloc;
                int count = remain;
                if (count > ARRAY_SIZE(stack_reloc))
                        count = ARRAY_SIZE(stack_reloc);
                remain -= count;

                if (__copy_from_user_inatomic(r, user_relocs, count*sizeof(r[0])))
                        return -EFAULT;

                do {
                        u64 offset = r->presumed_offset;

                        ret = i915_gem_execbuffer_relocate_entry(vma->obj, eb, r);
                        if (ret)
                                return ret;

                        if (r->presumed_offset != offset &&
                            __copy_to_user_inatomic(&user_relocs->presumed_offset,
                                                    &r->presumed_offset,
                                                    sizeof(r->presumed_offset))) {
                                return -EFAULT;
                        }

                        user_relocs++;
                        r++;
                } while (--count);
        }

        return 0;
#undef N_RELOC
}

static int
i915_gem_execbuffer_relocate_vma_slow(struct i915_vma *vma,
                                      struct eb_vmas *eb,
                                      struct drm_i915_gem_relocation_entry *relocs)
{
        const struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
        int i, ret;

        for (i = 0; i < entry->relocation_count; i++) {
                ret = i915_gem_execbuffer_relocate_entry(vma->obj, eb, &relocs[i]);
                if (ret)
                        return ret;
        }

        return 0;
}

static int
i915_gem_execbuffer_relocate(struct eb_vmas *eb)
{
        struct i915_vma *vma;
        int ret = 0;

        /* This is the fast path and we cannot handle a pagefault whilst
         * holding the struct mutex lest the user pass in the relocations
         * contained within a mmaped bo. In such a case the page fault
         * handler would call i915_gem_fault() and we would try to acquire
         * the struct mutex again. Obviously this is bad and so lockdep
         * complains vehemently.
         */
        pagefault_disable();
        list_for_each_entry(vma, &eb->vmas, exec_list) {
                ret = i915_gem_execbuffer_relocate_vma(vma, eb);
                if (ret)
                        break;
        }
        pagefault_enable();

        return ret;
}

static int
need_reloc_mappable(struct i915_vma *vma)
{
        struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
        return entry->relocation_count && !use_cpu_reloc(vma->obj) &&
                i915_is_ggtt(vma->vm);
}

static int
i915_gem_execbuffer_reserve_vma(struct i915_vma *vma,
                                struct intel_ring_buffer *ring,
                                bool *need_reloc)
{
        struct drm_i915_gem_object *obj = vma->obj;
        struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
        bool has_fenced_gpu_access = INTEL_INFO(ring->dev)->gen < 4;
        bool need_fence;
        unsigned flags;
        int ret;

        flags = 0;

        need_fence =
                has_fenced_gpu_access &&
                entry->flags & EXEC_OBJECT_NEEDS_FENCE &&
                obj->tiling_mode != I915_TILING_NONE;
        if (need_fence || need_reloc_mappable(vma))
                flags |= PIN_MAPPABLE;

        if (entry->flags & EXEC_OBJECT_NEEDS_GTT)
                flags |= PIN_GLOBAL;

        ret = i915_gem_object_pin(obj, vma->vm, entry->alignment, flags);
        if (ret)
                return ret;

        entry->flags |= __EXEC_OBJECT_HAS_PIN;

        if (has_fenced_gpu_access) {
                if (entry->flags & EXEC_OBJECT_NEEDS_FENCE) {
                        ret = i915_gem_object_get_fence(obj);
                        if (ret)
                                return ret;

                        if (i915_gem_object_pin_fence(obj))
                                entry->flags |= __EXEC_OBJECT_HAS_FENCE;

                        obj->pending_fenced_gpu_access = true;
                }
        }

        if (entry->offset != vma->node.start) {
                entry->offset = vma->node.start;
                *need_reloc = true;
        }

        if (entry->flags & EXEC_OBJECT_WRITE) {
                obj->base.pending_read_domains = I915_GEM_DOMAIN_RENDER;
                obj->base.pending_write_domain = I915_GEM_DOMAIN_RENDER;
        }

        return 0;
}

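/*
 * i915_gem_execbuffer_reserve() pins every vma for the execbuffer.
 * Objects that need a fence or a mappable GTT relocation are moved to
 * the front of the list so they get first pick of the aperture; if the
 * first pass runs out of space, everything is unpinned, the VM is
 * evicted once and binding is retried.
 */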
static int
i915_gem_execbuffer_reserve(struct intel_ring_buffer *ring,
                            struct list_head *vmas,
                            bool *need_relocs)
{
        struct drm_i915_gem_object *obj;
        struct i915_vma *vma;
        struct i915_address_space *vm;
        struct list_head ordered_vmas;
        bool has_fenced_gpu_access = INTEL_INFO(ring->dev)->gen < 4;
        int retry;

        if (list_empty(vmas))
                return 0;

        vm = list_first_entry(vmas, struct i915_vma, exec_list)->vm;

        INIT_LIST_HEAD(&ordered_vmas);
        while (!list_empty(vmas)) {
                struct drm_i915_gem_exec_object2 *entry;
                bool need_fence, need_mappable;

                vma = list_first_entry(vmas, struct i915_vma, exec_list);
                obj = vma->obj;
                entry = vma->exec_entry;

                need_fence =
                        has_fenced_gpu_access &&
                        entry->flags & EXEC_OBJECT_NEEDS_FENCE &&
                        obj->tiling_mode != I915_TILING_NONE;
                need_mappable = need_fence || need_reloc_mappable(vma);

                if (need_mappable)
                        list_move(&vma->exec_list, &ordered_vmas);
                else
                        list_move_tail(&vma->exec_list, &ordered_vmas);

                obj->base.pending_read_domains = I915_GEM_GPU_DOMAINS & ~I915_GEM_DOMAIN_COMMAND;
                obj->base.pending_write_domain = 0;
                obj->pending_fenced_gpu_access = false;
        }
        list_splice(&ordered_vmas, vmas);

        /* Attempt to pin all of the buffers into the GTT.
         * This is done in 3 phases:
         *
         * 1a. Unbind all objects that do not match the GTT constraints for
         *     the execbuffer (fenceable, mappable, alignment etc).
         * 1b. Increment pin count for already bound objects.
         * 2.  Bind new objects.
         * 3.  Decrement pin count.
         *
         * This avoids unnecessary unbinding of later objects in order to make
         * room for the earlier objects *unless* we need to defragment.
         */
        retry = 0;
        do {
                int ret = 0;

                /* Unbind any ill-fitting objects or pin. */
                list_for_each_entry(vma, vmas, exec_list) {
                        struct drm_i915_gem_exec_object2 *entry = vma->exec_entry;
                        bool need_fence, need_mappable;

                        obj = vma->obj;

                        if (!drm_mm_node_allocated(&vma->node))
                                continue;

                        need_fence =
                                has_fenced_gpu_access &&
                                entry->flags & EXEC_OBJECT_NEEDS_FENCE &&
                                obj->tiling_mode != I915_TILING_NONE;
                        need_mappable = need_fence || need_reloc_mappable(vma);

                        WARN_ON((need_mappable || need_fence) &&
                                !i915_is_ggtt(vma->vm));

                        if ((entry->alignment &&
                             vma->node.start & (entry->alignment - 1)) ||
                            (need_mappable && !obj->map_and_fenceable))
                                ret = i915_vma_unbind(vma);
                        else
                                ret = i915_gem_execbuffer_reserve_vma(vma, ring, need_relocs);
                        if (ret)
                                goto err;
                }

                /* Bind fresh objects */
                list_for_each_entry(vma, vmas, exec_list) {
                        if (drm_mm_node_allocated(&vma->node))
                                continue;

                        ret = i915_gem_execbuffer_reserve_vma(vma, ring, need_relocs);
                        if (ret)
                                goto err;
                }

err:
                if (ret != -ENOSPC || retry++)
                        return ret;

                /* Decrement pin count for bound objects */
                list_for_each_entry(vma, vmas, exec_list)
                        i915_gem_execbuffer_unreserve_vma(vma);

                ret = i915_gem_evict_vm(vm, true);
                if (ret)
                        return ret;
        } while (1);
}

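/*
 * Slow path: the relocation lists could not be processed atomically
 * under the mutex, so drop the lock, copy every relocation entry into
 * a kernel buffer, retake the lock, re-acquire the objects and apply
 * the relocations from that copy.
 */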
static int
i915_gem_execbuffer_relocate_slow(struct drm_device *dev,
                                  struct drm_i915_gem_execbuffer2 *args,
                                  struct drm_file *file,
                                  struct intel_ring_buffer *ring,
                                  struct eb_vmas *eb,
                                  struct drm_i915_gem_exec_object2 *exec)
{
        struct drm_i915_gem_relocation_entry *reloc;
        struct i915_address_space *vm;
        struct i915_vma *vma;
        bool need_relocs;
        int *reloc_offset;
        int i, total, ret;
        unsigned count = args->buffer_count;

        if (WARN_ON(list_empty(&eb->vmas)))
                return 0;

        vm = list_first_entry(&eb->vmas, struct i915_vma, exec_list)->vm;

        /* We may process another execbuffer during the unlock... */
        while (!list_empty(&eb->vmas)) {
                vma = list_first_entry(&eb->vmas, struct i915_vma, exec_list);
                list_del_init(&vma->exec_list);
                i915_gem_execbuffer_unreserve_vma(vma);
                drm_gem_object_unreference(&vma->obj->base);
        }

        mutex_unlock(&dev->struct_mutex);

        total = 0;
        for (i = 0; i < count; i++)
                total += exec[i].relocation_count;

        reloc_offset = drm_malloc_ab(count, sizeof(*reloc_offset));
        reloc = drm_malloc_ab(total, sizeof(*reloc));
        if (reloc == NULL || reloc_offset == NULL) {
                drm_free_large(reloc);
                drm_free_large(reloc_offset);
                mutex_lock(&dev->struct_mutex);
                return -ENOMEM;
        }

        total = 0;
        for (i = 0; i < count; i++) {
                struct drm_i915_gem_relocation_entry __user *user_relocs;
                u64 invalid_offset = (u64)-1;
                int j;

                user_relocs = to_user_ptr(exec[i].relocs_ptr);

                if (copy_from_user(reloc+total, user_relocs,
                                   exec[i].relocation_count * sizeof(*reloc))) {
                        ret = -EFAULT;
                        mutex_lock(&dev->struct_mutex);
                        goto err;
                }

                /* As we do not update the known relocation offsets after
                 * relocating (due to the complexities in lock handling),
                 * we need to mark them as invalid now so that we force the
                 * relocation processing next time. Just in case the target
                 * object is evicted and then rebound into its old
                 * presumed_offset before the next execbuffer - if that
                 * happened we would make the mistake of assuming that the
                 * relocations were valid.
                 */
                for (j = 0; j < exec[i].relocation_count; j++) {
                        if (copy_to_user(&user_relocs[j].presumed_offset,
                                         &invalid_offset,
                                         sizeof(invalid_offset))) {
                                ret = -EFAULT;
                                mutex_lock(&dev->struct_mutex);
                                goto err;
                        }
                }

                reloc_offset[i] = total;
                total += exec[i].relocation_count;
        }

        ret = i915_mutex_lock_interruptible(dev);
        if (ret) {
                mutex_lock(&dev->struct_mutex);
                goto err;
        }

        /* reacquire the objects */
        eb_reset(eb);
        ret = eb_lookup_vmas(eb, exec, args, vm, file);
        if (ret)
                goto err;

        need_relocs = (args->flags & I915_EXEC_NO_RELOC) == 0;
        ret = i915_gem_execbuffer_reserve(ring, &eb->vmas, &need_relocs);
        if (ret)
                goto err;

        list_for_each_entry(vma, &eb->vmas, exec_list) {
                int offset = vma->exec_entry - exec;
                ret = i915_gem_execbuffer_relocate_vma_slow(vma, eb,
                                                            reloc + reloc_offset[offset]);
                if (ret)
                        goto err;
        }

        /* Leave the user relocations as are, this is the painfully slow path,
         * and we want to avoid the complication of dropping the lock whilst
         * having buffers reserved in the aperture and so causing spurious
         * ENOSPC for random operations.
         */

err:
        drm_free_large(reloc);
        drm_free_large(reloc_offset);
        return ret;
}

static int
i915_gem_execbuffer_move_to_gpu(struct intel_ring_buffer *ring,
                                struct list_head *vmas)
{
        struct i915_vma *vma;
        uint32_t flush_domains = 0;
        bool flush_chipset = false;
        int ret;

        list_for_each_entry(vma, vmas, exec_list) {
                struct drm_i915_gem_object *obj = vma->obj;
                ret = i915_gem_object_sync(obj, ring);
                if (ret)
                        return ret;

                if (obj->base.write_domain & I915_GEM_DOMAIN_CPU)
                        flush_chipset |= i915_gem_clflush_object(obj, false);

                flush_domains |= obj->base.write_domain;
        }

        if (flush_chipset)
                i915_gem_chipset_flush(ring->dev);

        if (flush_domains & I915_GEM_DOMAIN_GTT)
                wmb();

        /* Unconditionally invalidate gpu caches and ensure that we do flush
         * any residual writes from the previous batch.
         */
        return intel_ring_invalidate_all_caches(ring);
}

static bool
i915_gem_check_execbuffer(struct drm_i915_gem_execbuffer2 *exec)
{
        if (exec->flags & __I915_EXEC_UNKNOWN_FLAGS)
                return false;

        return ((exec->batch_start_offset | exec->batch_len) & 0x7) == 0;
}

static int
validate_exec_list(struct drm_i915_gem_exec_object2 *exec,
                   int count)
{
        int i;
        unsigned relocs_total = 0;
        unsigned relocs_max = UINT_MAX / sizeof(struct drm_i915_gem_relocation_entry);

        for (i = 0; i < count; i++) {
                char __user *ptr = to_user_ptr(exec[i].relocs_ptr);
                int length; /* limited by fault_in_pages_readable() */

                if (exec[i].flags & __EXEC_OBJECT_UNKNOWN_FLAGS)
                        return -EINVAL;

                /* First check for malicious input causing overflow in
                 * the worst case where we need to allocate the entire
                 * relocation tree as a single array.
                 */
                if (exec[i].relocation_count > relocs_max - relocs_total)
                        return -EINVAL;
                relocs_total += exec[i].relocation_count;

                length = exec[i].relocation_count *
                        sizeof(struct drm_i915_gem_relocation_entry);
                /*
                 * We must check that the entire relocation array is safe
                 * to read, but since we may need to update the presumed
                 * offsets during execution, check for full write access.
                 */
                if (!access_ok(VERIFY_WRITE, ptr, length))
                        return -EFAULT;

                if (likely(!i915.prefault_disable)) {
                        if (fault_in_multipages_readable(ptr, length))
                                return -EFAULT;
                }
        }

        return 0;
}

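/*
 * Look up the context for this execbuffer and refuse submission from a
 * banned context; contexts other than the default one are only honoured
 * on the render ring.
 */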
static struct i915_hw_context *
i915_gem_validate_context(struct drm_device *dev, struct drm_file *file,
                          struct intel_ring_buffer *ring, const u32 ctx_id)
{
        struct i915_hw_context *ctx = NULL;
        struct i915_ctx_hang_stats *hs;

        if (ring->id != RCS && ctx_id != DEFAULT_CONTEXT_ID)
                return ERR_PTR(-EINVAL);

        ctx = i915_gem_context_get(file->driver_priv, ctx_id);
        if (IS_ERR(ctx))
                return ctx;

        hs = &ctx->hang_stats;
        if (hs->banned) {
                DRM_DEBUG("Context %u tried to submit while banned\n", ctx_id);
                return ERR_PTR(-EIO);
        }

        return ctx;
}

static void
i915_gem_execbuffer_move_to_active(struct list_head *vmas,
                                   struct intel_ring_buffer *ring)
{
        struct i915_vma *vma;

        list_for_each_entry(vma, vmas, exec_list) {
                struct drm_i915_gem_object *obj = vma->obj;
                u32 old_read = obj->base.read_domains;
                u32 old_write = obj->base.write_domain;

                obj->base.write_domain = obj->base.pending_write_domain;
                if (obj->base.write_domain == 0)
                        obj->base.pending_read_domains |= obj->base.read_domains;
                obj->base.read_domains = obj->base.pending_read_domains;
                obj->fenced_gpu_access = obj->pending_fenced_gpu_access;

                i915_vma_move_to_active(vma, ring);
                if (obj->base.write_domain) {
                        obj->dirty = 1;
                        obj->last_write_seqno = intel_ring_get_seqno(ring);
                        /* check for potential scanout */
                        if (i915_gem_obj_ggtt_bound(obj) &&
                            i915_gem_obj_to_ggtt(obj)->pin_count)
                                intel_mark_fb_busy(obj, ring);

                        /* update for the implicit flush after a batch */
                        obj->base.write_domain &= ~I915_GEM_GPU_DOMAINS;
                }

                trace_i915_gem_object_change_domain(obj, old_read, old_write);
        }
}

static void
i915_gem_execbuffer_retire_commands(struct drm_device *dev,
                                    struct drm_file *file,
                                    struct intel_ring_buffer *ring,
                                    struct drm_i915_gem_object *obj)
{
        /* Unconditionally force add_request to emit a full flush. */
        ring->gpu_caches_dirty = true;

        /* Add a breadcrumb for the completion of the batch buffer */
        (void)__i915_add_request(ring, file, obj, NULL);
}

static int
i915_reset_gen7_sol_offsets(struct drm_device *dev,
                            struct intel_ring_buffer *ring)
{
        struct drm_i915_private *dev_priv = dev->dev_private;
        int ret, i;

        if (!IS_GEN7(dev) || ring != &dev_priv->ring[RCS]) {
                DRM_DEBUG("sol reset is gen7/rcs only\n");
                return -EINVAL;
        }

        ret = intel_ring_begin(ring, 4 * 3);
        if (ret)
                return ret;

        for (i = 0; i < 4; i++) {
                intel_ring_emit(ring, MI_LOAD_REGISTER_IMM(1));
                intel_ring_emit(ring, GEN7_SO_WRITE_OFFSET(i));
                intel_ring_emit(ring, 0);
        }

        intel_ring_advance(ring);

        return 0;
}

/**
 * Find one BSD ring to dispatch the corresponding BSD command.
 * The ring ID is returned.
 */
static int gen8_dispatch_bsd_ring(struct drm_device *dev,
                                  struct drm_file *file)
{
        struct drm_i915_private *dev_priv = dev->dev_private;
        struct drm_i915_file_private *file_priv = file->driver_priv;

        /* Check whether the file_priv is already using one ring */
        if (file_priv->bsd_ring)
                return file_priv->bsd_ring->id;
        else {
                /* If not, use the ping-pong mechanism to select one ring */
                int ring_id;

                mutex_lock(&dev->struct_mutex);
                if (dev_priv->ring_index == 0) {
                        ring_id = VCS;
                        dev_priv->ring_index = 1;
                } else {
                        ring_id = VCS2;
                        dev_priv->ring_index = 0;
                }
                file_priv->bsd_ring = &dev_priv->ring[ring_id];
                mutex_unlock(&dev->struct_mutex);
                return ring_id;
        }
}

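/*
 * i915_gem_do_execbuffer() is the common backend of the execbuffer
 * ioctls: it validates the arguments, picks the target ring and
 * context, looks up and reserves every buffer and applies the
 * relocations before the batch is dispatched.
 */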
Eric Anholtae662d32012-01-03 09:23:29 -08001041static int
Chris Wilson54cf91d2010-11-25 18:00:26 +00001042i915_gem_do_execbuffer(struct drm_device *dev, void *data,
1043 struct drm_file *file,
1044 struct drm_i915_gem_execbuffer2 *args,
Ben Widawsky41bde552013-12-06 14:11:21 -08001045 struct drm_i915_gem_exec_object2 *exec)
Chris Wilson54cf91d2010-11-25 18:00:26 +00001046{
Jani Nikula50227e12014-03-31 14:27:21 +03001047 struct drm_i915_private *dev_priv = dev->dev_private;
Ben Widawsky27173f12013-08-14 11:38:36 +02001048 struct eb_vmas *eb;
Chris Wilson54cf91d2010-11-25 18:00:26 +00001049 struct drm_i915_gem_object *batch_obj;
1050 struct drm_clip_rect *cliprects = NULL;
Chris Wilson54cf91d2010-11-25 18:00:26 +00001051 struct intel_ring_buffer *ring;
Ben Widawsky41bde552013-12-06 14:11:21 -08001052 struct i915_hw_context *ctx;
1053 struct i915_address_space *vm;
Mika Kuoppalad299cce2013-11-26 16:14:33 +02001054 const u32 ctx_id = i915_execbuffer2_get_context_id(*args);
Ben Widawsky9bcb1442014-04-28 19:29:25 -07001055 u64 exec_start = args->batch_start_offset, exec_len;
Daniel Vettered5982e2013-01-17 22:23:36 +01001056 u32 mask, flags;
Chris Wilson72bfa192010-12-19 11:42:05 +00001057 int ret, mode, i;
Daniel Vettered5982e2013-01-17 22:23:36 +01001058 bool need_relocs;
Chris Wilson54cf91d2010-11-25 18:00:26 +00001059
Daniel Vettered5982e2013-01-17 22:23:36 +01001060 if (!i915_gem_check_execbuffer(args))
Chris Wilson432e58e2010-11-25 19:32:06 +00001061 return -EINVAL;
Chris Wilson432e58e2010-11-25 19:32:06 +00001062
1063 ret = validate_exec_list(exec, args->buffer_count);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001064 if (ret)
1065 return ret;
1066
Chris Wilsond7d4eed2012-10-17 12:09:54 +01001067 flags = 0;
1068 if (args->flags & I915_EXEC_SECURE) {
1069 if (!file->is_master || !capable(CAP_SYS_ADMIN))
1070 return -EPERM;
1071
1072 flags |= I915_DISPATCH_SECURE;
1073 }
Daniel Vetterb45305f2012-12-17 16:21:27 +01001074 if (args->flags & I915_EXEC_IS_PINNED)
1075 flags |= I915_DISPATCH_PINNED;
Chris Wilsond7d4eed2012-10-17 12:09:54 +01001076
Zhao Yakuib1a93302014-04-17 10:37:36 +08001077 if ((args->flags & I915_EXEC_RING_MASK) > LAST_USER_RING) {
Daniel Vetterff240192012-01-31 21:08:14 +01001078 DRM_DEBUG("execbuf with unknown ring: %d\n",
Chris Wilson54cf91d2010-11-25 18:00:26 +00001079 (int)(args->flags & I915_EXEC_RING_MASK));
1080 return -EINVAL;
1081 }
Ben Widawskyca01b122013-12-06 14:11:00 -08001082
1083 if ((args->flags & I915_EXEC_RING_MASK) == I915_EXEC_DEFAULT)
1084 ring = &dev_priv->ring[RCS];
Zhao Yakuia8ebba72014-04-17 10:37:40 +08001085 else if ((args->flags & I915_EXEC_RING_MASK) == I915_EXEC_BSD) {
1086 if (HAS_BSD2(dev)) {
1087 int ring_id;
1088 ring_id = gen8_dispatch_bsd_ring(dev, file);
1089 ring = &dev_priv->ring[ring_id];
1090 } else
1091 ring = &dev_priv->ring[VCS];
1092 } else
Ben Widawskyca01b122013-12-06 14:11:00 -08001093 ring = &dev_priv->ring[(args->flags & I915_EXEC_RING_MASK) - 1];
1094
Chris Wilsona15817c2012-05-11 14:29:31 +01001095 if (!intel_ring_initialized(ring)) {
1096 DRM_DEBUG("execbuf with invalid ring: %d\n",
1097 (int)(args->flags & I915_EXEC_RING_MASK));
1098 return -EINVAL;
1099 }
Chris Wilson54cf91d2010-11-25 18:00:26 +00001100
Chris Wilson72bfa192010-12-19 11:42:05 +00001101 mode = args->flags & I915_EXEC_CONSTANTS_MASK;
Ben Widawsky84f9f932011-12-12 19:21:58 -08001102 mask = I915_EXEC_CONSTANTS_MASK;
Chris Wilson72bfa192010-12-19 11:42:05 +00001103 switch (mode) {
1104 case I915_EXEC_CONSTANTS_REL_GENERAL:
1105 case I915_EXEC_CONSTANTS_ABSOLUTE:
1106 case I915_EXEC_CONSTANTS_REL_SURFACE:
Daniel Vetterc0f5b822014-04-24 08:09:10 +02001107 if (mode != 0 && ring != &dev_priv->ring[RCS]) {
1108 DRM_DEBUG("non-0 rel constants mode on non-RCS\n");
1109 return -EINVAL;
1110 }
1111
1112 if (mode != dev_priv->relative_constants_mode) {
1113 if (INTEL_INFO(dev)->gen < 4) {
1114 DRM_DEBUG("no rel constants on pre-gen4\n");
Chris Wilson72bfa192010-12-19 11:42:05 +00001115 return -EINVAL;
Daniel Vetterc0f5b822014-04-24 08:09:10 +02001116 }
Chris Wilson72bfa192010-12-19 11:42:05 +00001117
1118 if (INTEL_INFO(dev)->gen > 5 &&
Daniel Vetterc0f5b822014-04-24 08:09:10 +02001119 mode == I915_EXEC_CONSTANTS_REL_SURFACE) {
1120 DRM_DEBUG("rel surface constants mode invalid on gen5+\n");
Chris Wilson72bfa192010-12-19 11:42:05 +00001121 return -EINVAL;
Daniel Vetterc0f5b822014-04-24 08:09:10 +02001122 }
Ben Widawsky84f9f932011-12-12 19:21:58 -08001123
1124 /* The HW changed the meaning on this bit on gen6 */
1125 if (INTEL_INFO(dev)->gen >= 6)
1126 mask &= ~I915_EXEC_CONSTANTS_REL_SURFACE;
Chris Wilson72bfa192010-12-19 11:42:05 +00001127 }
1128 break;
1129 default:
Daniel Vetterff240192012-01-31 21:08:14 +01001130 DRM_DEBUG("execbuf with unknown constants: %d\n", mode);
Chris Wilson72bfa192010-12-19 11:42:05 +00001131 return -EINVAL;
1132 }
1133
Chris Wilson54cf91d2010-11-25 18:00:26 +00001134 if (args->buffer_count < 1) {
Daniel Vetterff240192012-01-31 21:08:14 +01001135 DRM_DEBUG("execbuf with %d buffers\n", args->buffer_count);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001136 return -EINVAL;
1137 }
Chris Wilson54cf91d2010-11-25 18:00:26 +00001138
1139 if (args->num_cliprects != 0) {
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001140 if (ring != &dev_priv->ring[RCS]) {
Daniel Vetterff240192012-01-31 21:08:14 +01001141 DRM_DEBUG("clip rectangles are only valid with the render ring\n");
Chris Wilsonc4e7a412010-11-30 14:10:25 +00001142 return -EINVAL;
1143 }
1144
Daniel Vetter6ebebc92012-04-26 23:28:11 +02001145 if (INTEL_INFO(dev)->gen >= 5) {
1146 DRM_DEBUG("clip rectangles are only valid on pre-gen5\n");
1147 return -EINVAL;
1148 }
1149
Xi Wang44afb3a2012-04-23 04:06:42 -04001150 if (args->num_cliprects > UINT_MAX / sizeof(*cliprects)) {
1151 DRM_DEBUG("execbuf with %u cliprects\n",
1152 args->num_cliprects);
1153 return -EINVAL;
1154 }
Daniel Vetter5e13a0c2012-05-08 13:39:59 +02001155
Daniel Vettera1e22652013-09-21 00:35:38 +02001156 cliprects = kcalloc(args->num_cliprects,
1157 sizeof(*cliprects),
Chris Wilson54cf91d2010-11-25 18:00:26 +00001158 GFP_KERNEL);
1159 if (cliprects == NULL) {
1160 ret = -ENOMEM;
1161 goto pre_mutex_err;
1162 }
1163
Chris Wilson432e58e2010-11-25 19:32:06 +00001164 if (copy_from_user(cliprects,
Ville Syrjälä2bb46292013-02-22 16:12:51 +02001165 to_user_ptr(args->cliprects_ptr),
1166 sizeof(*cliprects)*args->num_cliprects)) {
Chris Wilson54cf91d2010-11-25 18:00:26 +00001167 ret = -EFAULT;
1168 goto pre_mutex_err;
1169 }
Daniel Vetter9cb34662014-04-24 08:09:11 +02001170 } else {
1171 if (args->DR1 || args->DR4 || args->cliprects_ptr) {
1172 DRM_DEBUG("0 cliprects but dirt in cliprects fields\n");
1173 return -EINVAL;
1174 }
Chris Wilson54cf91d2010-11-25 18:00:26 +00001175 }
1176
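	/*
	 * Keep the device awake for the duration of the submission; the
	 * reference is dropped in the common exit path at the bottom of this
	 * function.
	 */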
Paulo Zanonif65c9162013-11-27 18:20:34 -02001177 intel_runtime_pm_get(dev_priv);
1178
Chris Wilson54cf91d2010-11-25 18:00:26 +00001179 ret = i915_mutex_lock_interruptible(dev);
1180 if (ret)
1181 goto pre_mutex_err;
1182
Daniel Vetterdb1b76c2013-07-09 16:51:37 +02001183 if (dev_priv->ums.mm_suspended) {
Chris Wilson54cf91d2010-11-25 18:00:26 +00001184 mutex_unlock(&dev->struct_mutex);
1185 ret = -EBUSY;
1186 goto pre_mutex_err;
1187 }
1188
Daniel Vetter7c9c4b82013-12-18 16:37:49 +01001189 ctx = i915_gem_validate_context(dev, file, ring, ctx_id);
Ben Widawsky72ad5c42014-01-02 19:50:27 -10001190 if (IS_ERR(ctx)) {
Mika Kuoppalad299cce2013-11-26 16:14:33 +02001191 mutex_unlock(&dev->struct_mutex);
Ben Widawsky41bde552013-12-06 14:11:21 -08001192 ret = PTR_ERR(ctx);
Mika Kuoppalad299cce2013-11-26 16:14:33 +02001193 goto pre_mutex_err;
Ben Widawsky935f38d2014-04-04 22:41:07 -07001194 }
Ben Widawsky41bde552013-12-06 14:11:21 -08001195
1196 i915_gem_context_reference(ctx);
1197
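	/*
	 * Choose the address space to execute in: the context's own VM when
	 * full PPGTT is enabled, otherwise the global GTT.
	 */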
Ben Widawsky7e0d96b2013-12-06 14:11:26 -08001198 vm = ctx->vm;
1199 if (!USES_FULL_PPGTT(dev))
1200 vm = &dev_priv->gtt.base;
Mika Kuoppalad299cce2013-11-26 16:14:33 +02001201
Ben Widawsky17601cbc2013-11-25 09:54:38 -08001202 eb = eb_create(args);
Chris Wilson67731b82010-12-08 10:38:14 +00001203 if (eb == NULL) {
Ben Widawsky935f38d2014-04-04 22:41:07 -07001204 i915_gem_context_unreference(ctx);
Chris Wilson67731b82010-12-08 10:38:14 +00001205 mutex_unlock(&dev->struct_mutex);
1206 ret = -ENOMEM;
1207 goto pre_mutex_err;
1208 }
1209
Chris Wilson54cf91d2010-11-25 18:00:26 +00001210 /* Look up object handles */
Ben Widawsky27173f12013-08-14 11:38:36 +02001211 ret = eb_lookup_vmas(eb, exec, args, vm, file);
Chris Wilson3b96eff2013-01-08 10:53:14 +00001212 if (ret)
1213 goto err;
Chris Wilson54cf91d2010-11-25 18:00:26 +00001214
Chris Wilson6fe4f142011-01-10 17:35:37 +00001215	/* take note of the batch buffer (the last entry in the exec list) before we might reorder the lists */
Ben Widawsky27173f12013-08-14 11:38:36 +02001216 batch_obj = list_entry(eb->vmas.prev, struct i915_vma, exec_list)->obj;
Chris Wilson6fe4f142011-01-10 17:35:37 +00001217
Chris Wilson54cf91d2010-11-25 18:00:26 +00001218 /* Move the objects en-masse into the GTT, evicting if necessary. */
Daniel Vettered5982e2013-01-17 22:23:36 +01001219 need_relocs = (args->flags & I915_EXEC_NO_RELOC) == 0;
Ben Widawsky27173f12013-08-14 11:38:36 +02001220 ret = i915_gem_execbuffer_reserve(ring, &eb->vmas, &need_relocs);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001221 if (ret)
1222 goto err;
1223
1224 /* The objects are in their final locations, apply the relocations. */
Daniel Vettered5982e2013-01-17 22:23:36 +01001225 if (need_relocs)
Ben Widawsky17601cbc2013-11-25 09:54:38 -08001226 ret = i915_gem_execbuffer_relocate(eb);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001227 if (ret) {
1228 if (ret == -EFAULT) {
Daniel Vettered5982e2013-01-17 22:23:36 +01001229 ret = i915_gem_execbuffer_relocate_slow(dev, args, file, ring,
Ben Widawsky27173f12013-08-14 11:38:36 +02001230 eb, exec);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001231 BUG_ON(!mutex_is_locked(&dev->struct_mutex));
1232 }
1233 if (ret)
1234 goto err;
1235 }
1236
1237 /* Set the pending read domains for the batch buffer to COMMAND */
Chris Wilson54cf91d2010-11-25 18:00:26 +00001238 if (batch_obj->base.pending_write_domain) {
Daniel Vetterff240192012-01-31 21:08:14 +01001239 DRM_DEBUG("Attempting to use self-modifying batch buffer\n");
Chris Wilson54cf91d2010-11-25 18:00:26 +00001240 ret = -EINVAL;
1241 goto err;
1242 }
1243 batch_obj->base.pending_read_domains |= I915_GEM_DOMAIN_COMMAND;
1244
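	/*
	 * Where the command parser is required for this ring, scan the batch
	 * for disallowed commands before it gets anywhere near the hardware.
	 */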
Brad Volkin351e3db2014-02-18 10:15:46 -08001245 if (i915_needs_cmd_parser(ring)) {
1246 ret = i915_parse_cmds(ring,
1247 batch_obj,
1248 args->batch_start_offset,
1249 file->is_master);
1250 if (ret)
1251 goto err;
1252
1253 /*
1254 * XXX: Actually do this when enabling batch copy...
1255 *
1256 * Set the DISPATCH_SECURE bit to remove the NON_SECURE bit
1257 * from MI_BATCH_BUFFER_START commands issued in the
1258 * dispatch_execbuffer implementations. We specifically don't
1259 * want that set when the command parser is enabled.
1260 */
1261 }
1262
Chris Wilsond7d4eed2012-10-17 12:09:54 +01001263 /* snb/ivb/vlv conflate the "batch in ppgtt" bit with the "non-secure
1264 * batch" bit. Hence we need to pin secure batches into the global gtt.
Ben Widawsky28cf5412013-11-02 21:07:26 -07001265 * hsw should have this fixed, but bdw mucks it up again. */
Ben Widawsky6f65e292013-12-06 14:10:56 -08001266 if (flags & I915_DISPATCH_SECURE &&
1267 !batch_obj->has_global_gtt_mapping) {
1268 /* When we have multiple VMs, we'll need to make sure that we
1269 * allocate space first */
1270 struct i915_vma *vma = i915_gem_obj_to_ggtt(batch_obj);
1271 BUG_ON(!vma);
1272 vma->bind_vma(vma, batch_obj->cache_level, GLOBAL_BIND);
1273 }
Chris Wilsond7d4eed2012-10-17 12:09:54 +01001274
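	/*
	 * Compute the batch start address in whichever address space we will
	 * actually execute from: the global GTT for secure dispatch, the
	 * selected VM otherwise.
	 */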
Ben Widawsky7e0d96b2013-12-06 14:11:26 -08001275 if (flags & I915_DISPATCH_SECURE)
1276 exec_start += i915_gem_obj_ggtt_offset(batch_obj);
1277 else
1278 exec_start += i915_gem_obj_offset(batch_obj, vm);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001279
Ben Widawsky27173f12013-08-14 11:38:36 +02001280 ret = i915_gem_execbuffer_move_to_gpu(ring, &eb->vmas);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001281 if (ret)
1282 goto err;
1283
Chris Wilson691e6412014-04-09 09:07:36 +01001284 ret = i915_switch_context(ring, ctx);
Eric Anholt0da5cec2012-07-23 12:33:55 -07001285 if (ret)
1286 goto err;
1287
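	/*
	 * The constants mode is programmed through INSTPM, a masked register,
	 * hence the valid-bit mask in the upper half of the LRI payload; only
	 * emit it when the mode actually changes.
	 */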
Ben Widawskye2971bd2011-12-12 19:21:57 -08001288 if (ring == &dev_priv->ring[RCS] &&
1289 mode != dev_priv->relative_constants_mode) {
1290 ret = intel_ring_begin(ring, 4);
1291 if (ret)
1292 goto err;
1293
1294 intel_ring_emit(ring, MI_NOOP);
1295 intel_ring_emit(ring, MI_LOAD_REGISTER_IMM(1));
1296 intel_ring_emit(ring, INSTPM);
Ben Widawsky84f9f932011-12-12 19:21:58 -08001297 intel_ring_emit(ring, mask << 16 | mode);
Ben Widawskye2971bd2011-12-12 19:21:57 -08001298 intel_ring_advance(ring);
1299
1300 dev_priv->relative_constants_mode = mode;
1301 }
1302
Eric Anholtae662d32012-01-03 09:23:29 -08001303 if (args->flags & I915_EXEC_GEN7_SOL_RESET) {
1304 ret = i915_reset_gen7_sol_offsets(dev, ring);
1305 if (ret)
1306 goto err;
1307 }
1308
Chris Wilsonc4e7a412010-11-30 14:10:25 +00001310 exec_len = args->batch_len;
1311 if (cliprects) {
1312 for (i = 0; i < args->num_cliprects; i++) {
1313 ret = i915_emit_box(dev, &cliprects[i],
1314 args->DR1, args->DR4);
1315 if (ret)
1316 goto err;
1317
1318 ret = ring->dispatch_execbuffer(ring,
Chris Wilsond7d4eed2012-10-17 12:09:54 +01001319 exec_start, exec_len,
1320 flags);
Chris Wilsonc4e7a412010-11-30 14:10:25 +00001321 if (ret)
1322 goto err;
1323 }
1324 } else {
Chris Wilsond7d4eed2012-10-17 12:09:54 +01001325 ret = ring->dispatch_execbuffer(ring,
1326 exec_start, exec_len,
1327 flags);
Chris Wilsonc4e7a412010-11-30 14:10:25 +00001328 if (ret)
1329 goto err;
1330 }
Chris Wilson54cf91d2010-11-25 18:00:26 +00001331
Chris Wilson9d7730912012-11-27 16:22:52 +00001332 trace_i915_gem_ring_dispatch(ring, intel_ring_get_seqno(ring), flags);
1333
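	/*
	 * Mark every object on the exec list as active on this ring and add
	 * the request; from this point the request owns the context reference
	 * dropped below.
	 */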
Ben Widawsky27173f12013-08-14 11:38:36 +02001334 i915_gem_execbuffer_move_to_active(&eb->vmas, ring);
Mika Kuoppala7d736f42013-06-12 15:01:39 +03001335 i915_gem_execbuffer_retire_commands(dev, file, ring, batch_obj);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001336
1337err:
Ben Widawsky41bde552013-12-06 14:11:21 -08001338 /* the request owns the ref now */
1339 i915_gem_context_unreference(ctx);
Chris Wilson67731b82010-12-08 10:38:14 +00001340 eb_destroy(eb);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001341
1342 mutex_unlock(&dev->struct_mutex);
1343
1344pre_mutex_err:
Chris Wilson54cf91d2010-11-25 18:00:26 +00001345 kfree(cliprects);
Paulo Zanonif65c9162013-11-27 18:20:34 -02001346
 1347 	/* intel_gpu_busy should also get a ref, so that it is only released
 1348 	 * when the device is really idle. */
1349 intel_runtime_pm_put(dev_priv);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001350 return ret;
1351}
1352
1353/*
1354 * Legacy execbuffer just creates an exec2 list from the original exec object
1355 * list array and passes it to the real function.
1356 */
1357int
1358i915_gem_execbuffer(struct drm_device *dev, void *data,
1359 struct drm_file *file)
1360{
1361 struct drm_i915_gem_execbuffer *args = data;
1362 struct drm_i915_gem_execbuffer2 exec2;
1363 struct drm_i915_gem_exec_object *exec_list = NULL;
1364 struct drm_i915_gem_exec_object2 *exec2_list = NULL;
1365 int ret, i;
1366
Chris Wilson54cf91d2010-11-25 18:00:26 +00001367 if (args->buffer_count < 1) {
Daniel Vetterff240192012-01-31 21:08:14 +01001368 DRM_DEBUG("execbuf with %d buffers\n", args->buffer_count);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001369 return -EINVAL;
1370 }
1371
1372 /* Copy in the exec list from userland */
1373 exec_list = drm_malloc_ab(sizeof(*exec_list), args->buffer_count);
1374 exec2_list = drm_malloc_ab(sizeof(*exec2_list), args->buffer_count);
1375 if (exec_list == NULL || exec2_list == NULL) {
Daniel Vetterff240192012-01-31 21:08:14 +01001376 DRM_DEBUG("Failed to allocate exec list for %d buffers\n",
Chris Wilson54cf91d2010-11-25 18:00:26 +00001377 args->buffer_count);
1378 drm_free_large(exec_list);
1379 drm_free_large(exec2_list);
1380 return -ENOMEM;
1381 }
1382 ret = copy_from_user(exec_list,
Ville Syrjälä2bb46292013-02-22 16:12:51 +02001383 to_user_ptr(args->buffers_ptr),
Chris Wilson54cf91d2010-11-25 18:00:26 +00001384 sizeof(*exec_list) * args->buffer_count);
1385 if (ret != 0) {
Daniel Vetterff240192012-01-31 21:08:14 +01001386 DRM_DEBUG("copy %d exec entries failed %d\n",
Chris Wilson54cf91d2010-11-25 18:00:26 +00001387 args->buffer_count, ret);
1388 drm_free_large(exec_list);
1389 drm_free_large(exec2_list);
1390 return -EFAULT;
1391 }
1392
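	/*
	 * Convert each legacy exec_object entry into its exec_object2
	 * equivalent; the newer struct adds a flags word, used here to request
	 * a fence register for every object on pre-gen4 hardware.
	 */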
1393 for (i = 0; i < args->buffer_count; i++) {
1394 exec2_list[i].handle = exec_list[i].handle;
1395 exec2_list[i].relocation_count = exec_list[i].relocation_count;
1396 exec2_list[i].relocs_ptr = exec_list[i].relocs_ptr;
1397 exec2_list[i].alignment = exec_list[i].alignment;
1398 exec2_list[i].offset = exec_list[i].offset;
1399 if (INTEL_INFO(dev)->gen < 4)
1400 exec2_list[i].flags = EXEC_OBJECT_NEEDS_FENCE;
1401 else
1402 exec2_list[i].flags = 0;
1403 }
1404
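	/*
	 * Build an equivalent execbuffer2 request targeting the render ring
	 * with the default context (id 0).
	 */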
1405 exec2.buffers_ptr = args->buffers_ptr;
1406 exec2.buffer_count = args->buffer_count;
1407 exec2.batch_start_offset = args->batch_start_offset;
1408 exec2.batch_len = args->batch_len;
1409 exec2.DR1 = args->DR1;
1410 exec2.DR4 = args->DR4;
1411 exec2.num_cliprects = args->num_cliprects;
1412 exec2.cliprects_ptr = args->cliprects_ptr;
1413 exec2.flags = I915_EXEC_RENDER;
Ben Widawsky6e0a69d2012-06-04 14:42:55 -07001414 i915_execbuffer2_set_context_id(exec2, 0);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001415
Ben Widawsky41bde552013-12-06 14:11:21 -08001416 ret = i915_gem_do_execbuffer(dev, data, file, &exec2, exec2_list);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001417 if (!ret) {
1418 /* Copy the new buffer offsets back to the user's exec list. */
1419 for (i = 0; i < args->buffer_count; i++)
1420 exec_list[i].offset = exec2_list[i].offset;
1421 /* ... and back out to userspace */
Ville Syrjälä2bb46292013-02-22 16:12:51 +02001422 ret = copy_to_user(to_user_ptr(args->buffers_ptr),
Chris Wilson54cf91d2010-11-25 18:00:26 +00001423 exec_list,
1424 sizeof(*exec_list) * args->buffer_count);
1425 if (ret) {
1426 ret = -EFAULT;
Daniel Vetterff240192012-01-31 21:08:14 +01001427 DRM_DEBUG("failed to copy %d exec entries "
Chris Wilson54cf91d2010-11-25 18:00:26 +00001428 "back to user (%d)\n",
1429 args->buffer_count, ret);
1430 }
1431 }
1432
1433 drm_free_large(exec_list);
1434 drm_free_large(exec2_list);
1435 return ret;
1436}
1437
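/*
 * A minimal userspace sketch of calling this ioctl, for illustration only
 * (not the canonical API usage; error handling omitted, fd is an open DRM
 * file descriptor, the handles are existing GEM objects, and the batch
 * buffer must be the last entry in the object list):
 *
 *	struct drm_i915_gem_exec_object2 objs[2] = {
 *		{ .handle = scratch_handle },
 *		{ .handle = batch_handle },
 *	};
 *	struct drm_i915_gem_execbuffer2 execbuf = {
 *		.buffers_ptr = (uintptr_t)objs,
 *		.buffer_count = 2,
 *		.batch_len = batch_len,
 *		.flags = I915_EXEC_RENDER,
 *	};
 *	drmIoctl(fd, DRM_IOCTL_I915_GEM_EXECBUFFER2, &execbuf);
 */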
1438int
1439i915_gem_execbuffer2(struct drm_device *dev, void *data,
1440 struct drm_file *file)
1441{
1442 struct drm_i915_gem_execbuffer2 *args = data;
1443 struct drm_i915_gem_exec_object2 *exec2_list = NULL;
1444 int ret;
1445
Xi Wanged8cd3b2012-04-23 04:06:41 -04001446 if (args->buffer_count < 1 ||
1447 args->buffer_count > UINT_MAX / sizeof(*exec2_list)) {
Daniel Vetterff240192012-01-31 21:08:14 +01001448 DRM_DEBUG("execbuf2 with %d buffers\n", args->buffer_count);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001449 return -EINVAL;
1450 }
1451
Daniel Vetter9cb34662014-04-24 08:09:11 +02001452 if (args->rsvd2 != 0) {
 1453 		DRM_DEBUG("dirty rsvd2 field\n");
1454 return -EINVAL;
1455 }
1456
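	/*
	 * Try a cheap kmalloc first (without retries or warnings); for very
	 * large buffer lists fall back to drm_malloc_ab(), which may use
	 * vmalloc.
	 */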
Chris Wilson8408c282011-02-21 12:54:48 +00001457 exec2_list = kmalloc(sizeof(*exec2_list)*args->buffer_count,
Chris Wilson419fa722013-01-08 10:53:13 +00001458 GFP_TEMPORARY | __GFP_NOWARN | __GFP_NORETRY);
Chris Wilson8408c282011-02-21 12:54:48 +00001459 if (exec2_list == NULL)
1460 exec2_list = drm_malloc_ab(sizeof(*exec2_list),
1461 args->buffer_count);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001462 if (exec2_list == NULL) {
Daniel Vetterff240192012-01-31 21:08:14 +01001463 DRM_DEBUG("Failed to allocate exec list for %d buffers\n",
Chris Wilson54cf91d2010-11-25 18:00:26 +00001464 args->buffer_count);
1465 return -ENOMEM;
1466 }
1467 ret = copy_from_user(exec2_list,
Ville Syrjälä2bb46292013-02-22 16:12:51 +02001468 to_user_ptr(args->buffers_ptr),
Chris Wilson54cf91d2010-11-25 18:00:26 +00001469 sizeof(*exec2_list) * args->buffer_count);
1470 if (ret != 0) {
Daniel Vetterff240192012-01-31 21:08:14 +01001471 DRM_DEBUG("copy %d exec entries failed %d\n",
Chris Wilson54cf91d2010-11-25 18:00:26 +00001472 args->buffer_count, ret);
1473 drm_free_large(exec2_list);
1474 return -EFAULT;
1475 }
1476
Ben Widawsky41bde552013-12-06 14:11:21 -08001477 ret = i915_gem_do_execbuffer(dev, data, file, args, exec2_list);
Chris Wilson54cf91d2010-11-25 18:00:26 +00001478 if (!ret) {
1479 /* Copy the new buffer offsets back to the user's exec list. */
Ville Syrjälä2bb46292013-02-22 16:12:51 +02001480 ret = copy_to_user(to_user_ptr(args->buffers_ptr),
Chris Wilson54cf91d2010-11-25 18:00:26 +00001481 exec2_list,
1482 sizeof(*exec2_list) * args->buffer_count);
1483 if (ret) {
1484 ret = -EFAULT;
Daniel Vetterff240192012-01-31 21:08:14 +01001485 DRM_DEBUG("failed to copy %d exec entries "
Chris Wilson54cf91d2010-11-25 18:00:26 +00001486 "back to user (%d)\n",
1487 args->buffer_count, ret);
1488 }
1489 }
1490
1491 drm_free_large(exec2_list);
1492 return ret;
1493}