/*
 * Copyright © 2008 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 *
 * Authors:
 *    Eric Anholt <eric@anholt.net>
 *
 */

#include "drmP.h"
#include "drm.h"
#include "i915_drm.h"
#include "i915_drv.h"
#include "i915_trace.h"
#include "intel_drv.h"
#include <linux/shmem_fs.h>
#include <linux/slab.h>
#include <linux/swap.h>
#include <linux/pci.h>

static __must_check int i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *obj);
static void i915_gem_object_flush_gtt_write_domain(struct drm_i915_gem_object *obj);
static void i915_gem_object_flush_cpu_write_domain(struct drm_i915_gem_object *obj);
static __must_check int i915_gem_object_bind_to_gtt(struct drm_i915_gem_object *obj,
						    unsigned alignment,
						    bool map_and_fenceable);
static void i915_gem_clear_fence_reg(struct drm_device *dev,
				     struct drm_i915_fence_reg *reg);
static int i915_gem_phys_pwrite(struct drm_device *dev,
				struct drm_i915_gem_object *obj,
				struct drm_i915_gem_pwrite *args,
				struct drm_file *file);
static void i915_gem_free_object_tail(struct drm_i915_gem_object *obj);

static int i915_gem_inactive_shrink(struct shrinker *shrinker,
				    struct shrink_control *sc);
static void i915_gem_object_truncate(struct drm_i915_gem_object *obj);

/* some bookkeeping */
static void i915_gem_info_add_obj(struct drm_i915_private *dev_priv,
				  size_t size)
{
	dev_priv->mm.object_count++;
	dev_priv->mm.object_memory += size;
}

static void i915_gem_info_remove_obj(struct drm_i915_private *dev_priv,
				     size_t size)
{
	dev_priv->mm.object_count--;
	dev_priv->mm.object_memory -= size;
}

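/* Block until any in-progress GPU error handling has completed.  If the GPU
 * is still wedged afterwards, re-arm the error completion so that later
 * waiters do not stall on a count that will never be signalled again.
 */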
static int
i915_gem_wait_for_error(struct drm_device *dev)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct completion *x = &dev_priv->error_completion;
	unsigned long flags;
	int ret;

	if (!atomic_read(&dev_priv->mm.wedged))
		return 0;

	ret = wait_for_completion_interruptible(x);
	if (ret)
		return ret;

	if (atomic_read(&dev_priv->mm.wedged)) {
		/* GPU is hung, bump the completion count to account for
		 * the token we just consumed so that we never hit zero and
		 * end up waiting upon a subsequent completion event that
		 * will never happen.
		 */
		spin_lock_irqsave(&x->wait.lock, flags);
		x->done++;
		spin_unlock_irqrestore(&x->wait.lock, flags);
	}
	return 0;
}

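/* Take struct_mutex for a GEM ioctl, first letting any pending GPU error
 * handling finish so that callers observe a consistent device state.
 */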
int i915_mutex_lock_interruptible(struct drm_device *dev)
{
	int ret;

	ret = i915_gem_wait_for_error(dev);
	if (ret)
		return ret;

	ret = mutex_lock_interruptible(&dev->struct_mutex);
	if (ret)
		return ret;

	WARN_ON(i915_verify_lists(dev));
	return 0;
}

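/* An object is inactive when it is bound into the GTT but is neither in use
 * by the GPU nor pinned.
 */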
static inline bool
i915_gem_object_is_inactive(struct drm_i915_gem_object *obj)
{
	return obj->gtt_space && !obj->active && obj->pin_count == 0;
}

int
i915_gem_init_ioctl(struct drm_device *dev, void *data,
		    struct drm_file *file)
{
	struct drm_i915_gem_init *args = data;

	if (args->gtt_start >= args->gtt_end ||
	    (args->gtt_end | args->gtt_start) & (PAGE_SIZE - 1))
		return -EINVAL;

	mutex_lock(&dev->struct_mutex);
	i915_gem_init_global_gtt(dev, args->gtt_start,
				 args->gtt_end, args->gtt_end);
	mutex_unlock(&dev->struct_mutex);

	return 0;
}

int
i915_gem_get_aperture_ioctl(struct drm_device *dev, void *data,
			    struct drm_file *file)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_gem_get_aperture *args = data;
	struct drm_i915_gem_object *obj;
	size_t pinned;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	pinned = 0;
	mutex_lock(&dev->struct_mutex);
	list_for_each_entry(obj, &dev_priv->mm.pinned_list, mm_list)
		pinned += obj->gtt_space->size;
	mutex_unlock(&dev->struct_mutex);

	args->aper_size = dev_priv->mm.gtt_total;
	args->aper_available_size = args->aper_size - pinned;

	return 0;
}

static int
i915_gem_create(struct drm_file *file,
		struct drm_device *dev,
		uint64_t size,
		uint32_t *handle_p)
{
	struct drm_i915_gem_object *obj;
	int ret;
	u32 handle;

	size = roundup(size, PAGE_SIZE);
	if (size == 0)
		return -EINVAL;

	/* Allocate the new object */
	obj = i915_gem_alloc_object(dev, size);
	if (obj == NULL)
		return -ENOMEM;

	ret = drm_gem_handle_create(file, &obj->base, &handle);
	if (ret) {
		drm_gem_object_release(&obj->base);
		i915_gem_info_remove_obj(dev->dev_private, obj->base.size);
		kfree(obj);
		return ret;
	}

	/* drop reference from allocate - handle holds it now */
	drm_gem_object_unreference(&obj->base);
	trace_i915_gem_object_create(obj);

	*handle_p = handle;
	return 0;
}

int
i915_gem_dumb_create(struct drm_file *file,
		     struct drm_device *dev,
		     struct drm_mode_create_dumb *args)
{
	/* have to work out size/pitch and return them */
	args->pitch = ALIGN(args->width * ((args->bpp + 7) / 8), 64);
	args->size = args->pitch * args->height;
	return i915_gem_create(file, dev,
			       args->size, &args->handle);
}

int i915_gem_dumb_destroy(struct drm_file *file,
			  struct drm_device *dev,
			  uint32_t handle)
{
	return drm_gem_handle_delete(file, handle);
}

/**
 * Creates a new mm object and returns a handle to it.
 */
int
i915_gem_create_ioctl(struct drm_device *dev, void *data,
		      struct drm_file *file)
{
	struct drm_i915_gem_create *args = data;
	return i915_gem_create(file, dev,
			       args->size, &args->handle);
}

static int i915_gem_object_needs_bit17_swizzle(struct drm_i915_gem_object *obj)
{
	drm_i915_private_t *dev_priv = obj->base.dev->dev_private;

	return dev_priv->mm.bit_6_swizzle_x == I915_BIT_6_SWIZZLE_9_10_17 &&
		obj->tiling_mode != I915_TILING_NONE;
}

static inline int
__copy_to_user_swizzled(char __user *cpu_vaddr,
			const char *gpu_vaddr, int gpu_offset,
			int length)
{
	int ret, cpu_offset = 0;

	while (length > 0) {
		int cacheline_end = ALIGN(gpu_offset + 1, 64);
		int this_length = min(cacheline_end - gpu_offset, length);
		int swizzled_gpu_offset = gpu_offset ^ 64;

		ret = __copy_to_user(cpu_vaddr + cpu_offset,
				     gpu_vaddr + swizzled_gpu_offset,
				     this_length);
		if (ret)
			return ret + length;

		cpu_offset += this_length;
		gpu_offset += this_length;
		length -= this_length;
	}

	return 0;
}

static inline int
__copy_from_user_swizzled(char __user *gpu_vaddr, int gpu_offset,
			  const char *cpu_vaddr,
			  int length)
{
	int ret, cpu_offset = 0;

	while (length > 0) {
		int cacheline_end = ALIGN(gpu_offset + 1, 64);
		int this_length = min(cacheline_end - gpu_offset, length);
		int swizzled_gpu_offset = gpu_offset ^ 64;

		ret = __copy_from_user(gpu_vaddr + swizzled_gpu_offset,
				       cpu_vaddr + cpu_offset,
				       this_length);
		if (ret)
			return ret + length;

		cpu_offset += this_length;
		gpu_offset += this_length;
		length -= this_length;
	}

	return 0;
}

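/* Per-page pread from a shmem-backed object.  Each page is first attempted
 * with a non-faulting atomic kmap copy while struct_mutex is held; if that
 * fails, or the page is bit-17 swizzled, the lock is dropped and a sleeping
 * copy is used instead, clflushing the range first when the object is not
 * coherent with the CPU cache.
 */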
static int
i915_gem_shmem_pread(struct drm_device *dev,
		     struct drm_i915_gem_object *obj,
		     struct drm_i915_gem_pread *args,
		     struct drm_file *file)
{
	struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
	char __user *user_data;
	ssize_t remain;
	loff_t offset;
	int shmem_page_offset, page_length, ret = 0;
	int obj_do_bit17_swizzling, page_do_bit17_swizzling;
	int hit_slowpath = 0;
	int needs_clflush = 0;

	user_data = (char __user *) (uintptr_t) args->data_ptr;
	remain = args->size;

	obj_do_bit17_swizzling = i915_gem_object_needs_bit17_swizzle(obj);

	if (!(obj->base.read_domains & I915_GEM_DOMAIN_CPU)) {
		/* If we're not in the cpu read domain, set ourself into the gtt
		 * read domain and manually flush cachelines (if required). This
		 * optimizes for the case when the gpu will dirty the data
		 * anyway again before the next pread happens. */
		if (obj->cache_level == I915_CACHE_NONE)
			needs_clflush = 1;
		ret = i915_gem_object_set_to_gtt_domain(obj, false);
		if (ret)
			return ret;
	}

	offset = args->offset;

	while (remain > 0) {
		struct page *page;
		char *vaddr;

		/* Operation in this page
		 *
		 * shmem_page_offset = offset within page in shmem file
		 * page_length = bytes to copy for this page
		 */
		shmem_page_offset = offset_in_page(offset);
		page_length = remain;
		if ((shmem_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - shmem_page_offset;

		page = shmem_read_mapping_page(mapping, offset >> PAGE_SHIFT);
		if (IS_ERR(page)) {
			ret = PTR_ERR(page);
			goto out;
		}

		page_do_bit17_swizzling = obj_do_bit17_swizzling &&
			(page_to_phys(page) & (1 << 17)) != 0;

		if (!page_do_bit17_swizzling) {
			vaddr = kmap_atomic(page);
			if (needs_clflush)
				drm_clflush_virt_range(vaddr + shmem_page_offset,
						       page_length);
			ret = __copy_to_user_inatomic(user_data,
						      vaddr + shmem_page_offset,
						      page_length);
			kunmap_atomic(vaddr);
			if (ret == 0)
				goto next_page;
		}

		hit_slowpath = 1;

		mutex_unlock(&dev->struct_mutex);

		vaddr = kmap(page);
		if (needs_clflush)
			drm_clflush_virt_range(vaddr + shmem_page_offset,
					       page_length);

		if (page_do_bit17_swizzling)
			ret = __copy_to_user_swizzled(user_data,
						      vaddr, shmem_page_offset,
						      page_length);
		else
			ret = __copy_to_user(user_data,
					     vaddr + shmem_page_offset,
					     page_length);
		kunmap(page);

		mutex_lock(&dev->struct_mutex);
next_page:
		mark_page_accessed(page);
		page_cache_release(page);

		if (ret) {
			ret = -EFAULT;
			goto out;
		}

		remain -= page_length;
		user_data += page_length;
		offset += page_length;
	}

out:
	if (hit_slowpath) {
		/* Fixup: Kill any reinstated backing storage pages */
		if (obj->madv == __I915_MADV_PURGED)
			i915_gem_object_truncate(obj);
	}

	return ret;
}

/**
 * Reads data from the object referenced by handle.
 *
 * On error, the contents of *data are undefined.
 */
int
i915_gem_pread_ioctl(struct drm_device *dev, void *data,
		     struct drm_file *file)
{
	struct drm_i915_gem_pread *args = data;
	struct drm_i915_gem_object *obj;
	int ret = 0;

	if (args->size == 0)
		return 0;

	if (!access_ok(VERIFY_WRITE,
		       (char __user *)(uintptr_t)args->data_ptr,
		       args->size))
		return -EFAULT;

	ret = fault_in_pages_writeable((char __user *)(uintptr_t)args->data_ptr,
				       args->size);
	if (ret)
		return -EFAULT;

	ret = i915_mutex_lock_interruptible(dev);
	if (ret)
		return ret;

	obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
	if (&obj->base == NULL) {
		ret = -ENOENT;
		goto unlock;
	}

	/* Bounds check source. */
	if (args->offset > obj->base.size ||
	    args->size > obj->base.size - args->offset) {
		ret = -EINVAL;
		goto out;
	}

	trace_i915_gem_object_pread(obj, args->offset, args->size);

	ret = i915_gem_shmem_pread(dev, obj, args, file);

out:
	drm_gem_object_unreference(&obj->base);
unlock:
	mutex_unlock(&dev->struct_mutex);
	return ret;
}

/* This is the fast write path which cannot handle
 * page faults in the source data
 */

static inline int
fast_user_write(struct io_mapping *mapping,
		loff_t page_base, int page_offset,
		char __user *user_data,
		int length)
{
	char *vaddr_atomic;
	unsigned long unwritten;

	vaddr_atomic = io_mapping_map_atomic_wc(mapping, page_base);
	unwritten = __copy_from_user_inatomic_nocache(vaddr_atomic + page_offset,
						      user_data, length);
	io_mapping_unmap_atomic(vaddr_atomic);
	return unwritten;
}

/* Here's the write path which can sleep for
 * page faults
 */

static inline void
slow_kernel_write(struct io_mapping *mapping,
		  loff_t gtt_base, int gtt_offset,
		  struct page *user_page, int user_offset,
		  int length)
{
	char __iomem *dst_vaddr;
	char *src_vaddr;

	dst_vaddr = io_mapping_map_wc(mapping, gtt_base);
	src_vaddr = kmap(user_page);

	memcpy_toio(dst_vaddr + gtt_offset,
		    src_vaddr + user_offset,
		    length);

	kunmap(user_page);
	io_mapping_unmap(dst_vaddr);
}

/**
 * This is the fast pwrite path, where we copy the data directly from the
 * user into the GTT, uncached.
 */
static int
i915_gem_gtt_pwrite_fast(struct drm_device *dev,
			 struct drm_i915_gem_object *obj,
			 struct drm_i915_gem_pwrite *args,
			 struct drm_file *file)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	ssize_t remain;
	loff_t offset, page_base;
	char __user *user_data;
	int page_offset, page_length;

	user_data = (char __user *) (uintptr_t) args->data_ptr;
	remain = args->size;

	offset = obj->gtt_offset + args->offset;

	while (remain > 0) {
		/* Operation in this page
		 *
		 * page_base = page offset within aperture
		 * page_offset = offset within page
		 * page_length = bytes to copy for this page
		 */
		page_base = offset & PAGE_MASK;
		page_offset = offset_in_page(offset);
		page_length = remain;
		if ((page_offset + remain) > PAGE_SIZE)
			page_length = PAGE_SIZE - page_offset;

		/* If we get a fault while copying data, then (presumably) our
		 * source page isn't available. Return the error and we'll
		 * retry in the slow path.
		 */
		if (fast_user_write(dev_priv->mm.gtt_mapping, page_base,
				    page_offset, user_data, page_length))
			return -EFAULT;

		remain -= page_length;
		user_data += page_length;
		offset += page_length;
	}

	return 0;
}

/**
 * This is the fallback GTT pwrite path, which uses get_user_pages to pin
 * the memory and maps it using kmap_atomic for copying.
 *
 * This code resulted in x11perf -rgb10text consuming about 10% more CPU
 * than using i915_gem_gtt_pwrite_fast on a G45 (32-bit).
 */
static int
i915_gem_gtt_pwrite_slow(struct drm_device *dev,
			 struct drm_i915_gem_object *obj,
			 struct drm_i915_gem_pwrite *args,
			 struct drm_file *file)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	ssize_t remain;
	loff_t gtt_page_base, offset;
	loff_t first_data_page, last_data_page, num_pages;
	loff_t pinned_pages, i;
	struct page **user_pages;
	struct mm_struct *mm = current->mm;
	int gtt_page_offset, data_page_offset, data_page_index, page_length;
	int ret;
	uint64_t data_ptr = args->data_ptr;

	remain = args->size;

	/* Pin the user pages containing the data. We can't fault while
	 * holding the struct mutex, and all of the pwrite implementations
	 * want to hold it while dereferencing the user data.
	 */
	first_data_page = data_ptr / PAGE_SIZE;
	last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
	num_pages = last_data_page - first_data_page + 1;

	user_pages = drm_malloc_ab(num_pages, sizeof(struct page *));
	if (user_pages == NULL)
		return -ENOMEM;

	mutex_unlock(&dev->struct_mutex);
	down_read(&mm->mmap_sem);
	pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
				      num_pages, 0, 0, user_pages, NULL);
	up_read(&mm->mmap_sem);
	mutex_lock(&dev->struct_mutex);
	if (pinned_pages < num_pages) {
		ret = -EFAULT;
		goto out_unpin_pages;
	}

	ret = i915_gem_object_set_to_gtt_domain(obj, true);
	if (ret)
		goto out_unpin_pages;

	ret = i915_gem_object_put_fence(obj);
	if (ret)
		goto out_unpin_pages;

	offset = obj->gtt_offset + args->offset;

	while (remain > 0) {
		/* Operation in this page
		 *
		 * gtt_page_base = page offset within aperture
		 * gtt_page_offset = offset within page in aperture
		 * data_page_index = page number in get_user_pages return
		 * data_page_offset = offset within data_page_index page.
		 * page_length = bytes to copy for this page
		 */
		gtt_page_base = offset & PAGE_MASK;
		gtt_page_offset = offset_in_page(offset);
		data_page_index = data_ptr / PAGE_SIZE - first_data_page;
		data_page_offset = offset_in_page(data_ptr);

		page_length = remain;
		if ((gtt_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - gtt_page_offset;
		if ((data_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - data_page_offset;

		slow_kernel_write(dev_priv->mm.gtt_mapping,
				  gtt_page_base, gtt_page_offset,
				  user_pages[data_page_index],
				  data_page_offset,
				  page_length);

		remain -= page_length;
		offset += page_length;
		data_ptr += page_length;
	}

out_unpin_pages:
	for (i = 0; i < pinned_pages; i++)
		page_cache_release(user_pages[i]);
	drm_free_large(user_pages);

	return ret;
}

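/* Per-page pwrite into a shmem-backed object, mirroring the pread path:
 * try a non-faulting atomic copy while struct_mutex is held, and fall back
 * to a sleeping copy (with bit-17 swizzling where required) after dropping
 * the lock.  If the slow path was taken, purged backing pages are truncated
 * again and dirty cachelines are flushed before returning.
 */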
static int
i915_gem_shmem_pwrite(struct drm_device *dev,
		      struct drm_i915_gem_object *obj,
		      struct drm_i915_gem_pwrite *args,
		      struct drm_file *file)
{
	struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
	ssize_t remain;
	loff_t offset;
	char __user *user_data;
	int shmem_page_offset, page_length, ret = 0;
	int obj_do_bit17_swizzling, page_do_bit17_swizzling;
	int hit_slowpath = 0;

	user_data = (char __user *) (uintptr_t) args->data_ptr;
	remain = args->size;

	obj_do_bit17_swizzling = i915_gem_object_needs_bit17_swizzle(obj);

	offset = args->offset;
	obj->dirty = 1;

	while (remain > 0) {
		struct page *page;
		char *vaddr;

		/* Operation in this page
		 *
		 * shmem_page_offset = offset within page in shmem file
		 * page_length = bytes to copy for this page
		 */
		shmem_page_offset = offset_in_page(offset);

		page_length = remain;
		if ((shmem_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - shmem_page_offset;

		page = shmem_read_mapping_page(mapping, offset >> PAGE_SHIFT);
		if (IS_ERR(page)) {
			ret = PTR_ERR(page);
			goto out;
		}

		page_do_bit17_swizzling = obj_do_bit17_swizzling &&
			(page_to_phys(page) & (1 << 17)) != 0;

		if (!page_do_bit17_swizzling) {
			vaddr = kmap_atomic(page);
			ret = __copy_from_user_inatomic(vaddr + shmem_page_offset,
							user_data,
							page_length);
			kunmap_atomic(vaddr);

			if (ret == 0)
				goto next_page;
		}

		hit_slowpath = 1;

		mutex_unlock(&dev->struct_mutex);

		vaddr = kmap(page);
		if (page_do_bit17_swizzling)
			ret = __copy_from_user_swizzled(vaddr, shmem_page_offset,
							user_data,
							page_length);
		else
			ret = __copy_from_user(vaddr + shmem_page_offset,
					       user_data,
					       page_length);
		kunmap(page);

		mutex_lock(&dev->struct_mutex);
next_page:
		set_page_dirty(page);
		mark_page_accessed(page);
		page_cache_release(page);

		if (ret) {
			ret = -EFAULT;
			goto out;
		}

		remain -= page_length;
		user_data += page_length;
		offset += page_length;
	}

out:
	if (hit_slowpath) {
		/* Fixup: Kill any reinstated backing storage pages */
		if (obj->madv == __I915_MADV_PURGED)
			i915_gem_object_truncate(obj);
		/* and flush dirty cachelines in case the object isn't in the cpu write
		 * domain anymore. */
		if (obj->base.write_domain != I915_GEM_DOMAIN_CPU) {
			i915_gem_clflush_object(obj);
			intel_gtt_chipset_flush();
		}
	}

	return ret;
}

/**
 * Writes data to the object referenced by handle.
 *
 * On error, the contents of the buffer that were to be modified are undefined.
 */
int
i915_gem_pwrite_ioctl(struct drm_device *dev, void *data,
		      struct drm_file *file)
{
	struct drm_i915_gem_pwrite *args = data;
	struct drm_i915_gem_object *obj;
	int ret;

	if (args->size == 0)
		return 0;

	if (!access_ok(VERIFY_READ,
		       (char __user *)(uintptr_t)args->data_ptr,
		       args->size))
		return -EFAULT;

	ret = fault_in_pages_readable((char __user *)(uintptr_t)args->data_ptr,
				      args->size);
	if (ret)
		return -EFAULT;

	ret = i915_mutex_lock_interruptible(dev);
	if (ret)
		return ret;

	obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
	if (&obj->base == NULL) {
		ret = -ENOENT;
		goto unlock;
	}

	/* Bounds check destination. */
	if (args->offset > obj->base.size ||
	    args->size > obj->base.size - args->offset) {
		ret = -EINVAL;
		goto out;
	}

	trace_i915_gem_object_pwrite(obj, args->offset, args->size);

	/* We can only do the GTT pwrite on untiled buffers, as otherwise
	 * it would end up going through the fenced access, and we'll get
	 * different detiling behavior between reading and writing.
	 * pread/pwrite currently are reading and writing from the CPU
	 * perspective, requiring manual detiling by the client.
	 */
	if (obj->phys_obj) {
		ret = i915_gem_phys_pwrite(dev, obj, args, file);
		goto out;
	}

	if (obj->gtt_space &&
	    obj->base.write_domain != I915_GEM_DOMAIN_CPU) {
		ret = i915_gem_object_pin(obj, 0, true);
		if (ret)
			goto out;

		ret = i915_gem_object_set_to_gtt_domain(obj, true);
		if (ret)
			goto out_unpin;

		ret = i915_gem_object_put_fence(obj);
		if (ret)
			goto out_unpin;

		ret = i915_gem_gtt_pwrite_fast(dev, obj, args, file);
		if (ret == -EFAULT)
			ret = i915_gem_gtt_pwrite_slow(dev, obj, args, file);

out_unpin:
		i915_gem_object_unpin(obj);

		if (ret != -EFAULT)
			goto out;
		/* Fall through to the shmfs paths because the gtt paths might
		 * fail with non-page-backed user pointers (e.g. gtt mappings
		 * when moving data between textures). */
	}

	ret = i915_gem_object_set_to_cpu_domain(obj, 1);
	if (ret)
		goto out;

	ret = i915_gem_shmem_pwrite(dev, obj, args, file);

out:
	drm_gem_object_unreference(&obj->base);
unlock:
	mutex_unlock(&dev->struct_mutex);
	return ret;
}

/**
 * Called when user space prepares to use an object with the CPU, either
 * through the mmap ioctl's mapping or a GTT mapping.
 */
int
i915_gem_set_domain_ioctl(struct drm_device *dev, void *data,
			  struct drm_file *file)
{
	struct drm_i915_gem_set_domain *args = data;
	struct drm_i915_gem_object *obj;
	uint32_t read_domains = args->read_domains;
	uint32_t write_domain = args->write_domain;
	int ret;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	/* Only handle setting domains to types used by the CPU. */
	if (write_domain & I915_GEM_GPU_DOMAINS)
		return -EINVAL;

	if (read_domains & I915_GEM_GPU_DOMAINS)
		return -EINVAL;

	/* Having something in the write domain implies it's in the read
	 * domain, and only that read domain. Enforce that in the request.
	 */
	if (write_domain != 0 && read_domains != write_domain)
		return -EINVAL;

	ret = i915_mutex_lock_interruptible(dev);
	if (ret)
		return ret;

	obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
	if (&obj->base == NULL) {
		ret = -ENOENT;
		goto unlock;
	}

	if (read_domains & I915_GEM_DOMAIN_GTT) {
		ret = i915_gem_object_set_to_gtt_domain(obj, write_domain != 0);

		/* Silently promote "you're not bound, there was nothing to do"
		 * to success, since the client was just asking us to
		 * make sure everything was done.
		 */
		if (ret == -EINVAL)
			ret = 0;
	} else {
		ret = i915_gem_object_set_to_cpu_domain(obj, write_domain != 0);
	}

	drm_gem_object_unreference(&obj->base);
unlock:
	mutex_unlock(&dev->struct_mutex);
	return ret;
}

/**
 * Called when user space has done writes to this buffer
 */
int
i915_gem_sw_finish_ioctl(struct drm_device *dev, void *data,
			 struct drm_file *file)
{
	struct drm_i915_gem_sw_finish *args = data;
	struct drm_i915_gem_object *obj;
	int ret = 0;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	ret = i915_mutex_lock_interruptible(dev);
	if (ret)
		return ret;

	obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
	if (&obj->base == NULL) {
		ret = -ENOENT;
		goto unlock;
	}

	/* Pinned buffers may be scanout, so flush the cache */
	if (obj->pin_count)
		i915_gem_object_flush_cpu_write_domain(obj);

	drm_gem_object_unreference(&obj->base);
unlock:
	mutex_unlock(&dev->struct_mutex);
	return ret;
}

/**
 * Maps the contents of an object, returning the address it is mapped
 * into.
 *
 * While the mapping holds a reference on the contents of the object, it doesn't
 * imply a ref on the object itself.
 */
int
i915_gem_mmap_ioctl(struct drm_device *dev, void *data,
		    struct drm_file *file)
{
	struct drm_i915_gem_mmap *args = data;
	struct drm_gem_object *obj;
	unsigned long addr;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	obj = drm_gem_object_lookup(dev, file, args->handle);
	if (obj == NULL)
		return -ENOENT;

	down_write(&current->mm->mmap_sem);
	addr = do_mmap(obj->filp, 0, args->size,
		       PROT_READ | PROT_WRITE, MAP_SHARED,
		       args->offset);
	up_write(&current->mm->mmap_sem);
	drm_gem_object_unreference_unlocked(obj);
	if (IS_ERR((void *)addr))
		return addr;

	args->addr_ptr = (uint64_t) addr;

	return 0;
}

/**
 * i915_gem_fault - fault a page into the GTT
 * vma: VMA in question
 * vmf: fault info
 *
 * The fault handler is set up by drm_gem_mmap() when an object is GTT mapped
 * from userspace. The fault handler takes care of binding the object to
 * the GTT (if needed), allocating and programming a fence register (again,
 * only if needed based on whether the old reg is still valid or the object
 * is tiled) and inserting a new PTE into the faulting process.
 *
 * Note that the faulting process may involve evicting existing objects
 * from the GTT and/or fence registers to make room. So performance may
 * suffer if the GTT working set is large or there are few fence registers
 * left.
 */
int i915_gem_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
{
	struct drm_i915_gem_object *obj = to_intel_bo(vma->vm_private_data);
	struct drm_device *dev = obj->base.dev;
	drm_i915_private_t *dev_priv = dev->dev_private;
	pgoff_t page_offset;
	unsigned long pfn;
	int ret = 0;
	bool write = !!(vmf->flags & FAULT_FLAG_WRITE);

	/* We don't use vmf->pgoff since that has the fake offset */
	page_offset = ((unsigned long)vmf->virtual_address - vma->vm_start) >>
		PAGE_SHIFT;

	ret = i915_mutex_lock_interruptible(dev);
	if (ret)
		goto out;

	trace_i915_gem_object_fault(obj, page_offset, true, write);

	/* Now bind it into the GTT if needed */
	if (!obj->map_and_fenceable) {
		ret = i915_gem_object_unbind(obj);
		if (ret)
			goto unlock;
	}
	if (!obj->gtt_space) {
		ret = i915_gem_object_bind_to_gtt(obj, 0, true);
		if (ret)
			goto unlock;

		ret = i915_gem_object_set_to_gtt_domain(obj, write);
		if (ret)
			goto unlock;
	}

	if (!obj->has_global_gtt_mapping)
		i915_gem_gtt_bind_object(obj, obj->cache_level);

	if (obj->tiling_mode == I915_TILING_NONE)
		ret = i915_gem_object_put_fence(obj);
	else
		ret = i915_gem_object_get_fence(obj, NULL);
	if (ret)
		goto unlock;

	if (i915_gem_object_is_inactive(obj))
		list_move_tail(&obj->mm_list, &dev_priv->mm.inactive_list);

	obj->fault_mappable = true;

	pfn = ((dev->agp->base + obj->gtt_offset) >> PAGE_SHIFT) +
		page_offset;

	/* Finally, remap it using the new GTT offset */
	ret = vm_insert_pfn(vma, (unsigned long)vmf->virtual_address, pfn);
unlock:
	mutex_unlock(&dev->struct_mutex);
out:
	switch (ret) {
	case -EIO:
	case -EAGAIN:
		/* Give the error handler a chance to run and move the
		 * objects off the GPU active list. Next time we service the
		 * fault, we should be able to transition the page into the
		 * GTT without touching the GPU (and so avoid further
		 * EIO/EAGAIN). If the GPU is wedged, then there is no issue
		 * with coherency, just lost writes.
		 */
		set_need_resched();
	case 0:
	case -ERESTARTSYS:
	case -EINTR:
		return VM_FAULT_NOPAGE;
	case -ENOMEM:
		return VM_FAULT_OOM;
	default:
		return VM_FAULT_SIGBUS;
	}
}

/**
 * i915_gem_release_mmap - remove physical page mappings
 * @obj: obj in question
 *
 * Preserve the reservation of the mmapping with the DRM core code, but
 * relinquish ownership of the pages back to the system.
 *
 * It is vital that we remove the page mapping if we have mapped a tiled
 * object through the GTT and then lose the fence register due to
 * resource pressure. Similarly if the object has been moved out of the
 * aperture, then pages mapped into userspace must be revoked. Removing the
 * mapping will then trigger a page fault on the next user access, allowing
 * fixup by i915_gem_fault().
 */
void
i915_gem_release_mmap(struct drm_i915_gem_object *obj)
{
	if (!obj->fault_mappable)
		return;

	if (obj->base.dev->dev_mapping)
		unmap_mapping_range(obj->base.dev->dev_mapping,
				    (loff_t)obj->base.map_list.hash.key<<PAGE_SHIFT,
				    obj->base.size, 1);

	obj->fault_mappable = false;
}

static uint32_t
i915_gem_get_gtt_size(struct drm_device *dev, uint32_t size, int tiling_mode)
{
	uint32_t gtt_size;

	if (INTEL_INFO(dev)->gen >= 4 ||
	    tiling_mode == I915_TILING_NONE)
		return size;

	/* Previous chips need a power-of-two fence region when tiling */
	if (INTEL_INFO(dev)->gen == 3)
		gtt_size = 1024*1024;
	else
		gtt_size = 512*1024;

	while (gtt_size < size)
		gtt_size <<= 1;

	return gtt_size;
}

/**
 * i915_gem_get_gtt_alignment - return required GTT alignment for an object
 * @dev: the device
 * @size: size of the object
 * @tiling_mode: tiling mode of the object
 *
 * Return the required GTT alignment for an object, taking into account
 * potential fence register mapping.
 */
static uint32_t
i915_gem_get_gtt_alignment(struct drm_device *dev,
			   uint32_t size,
			   int tiling_mode)
{
	/*
	 * Minimum alignment is 4k (GTT page size), but might be greater
	 * if a fence register is needed for the object.
	 */
	if (INTEL_INFO(dev)->gen >= 4 ||
	    tiling_mode == I915_TILING_NONE)
		return 4096;

	/*
	 * Previous chips need to be aligned to the size of the smallest
	 * fence register that can contain the object.
	 */
	return i915_gem_get_gtt_size(dev, size, tiling_mode);
}

/**
 * i915_gem_get_unfenced_gtt_alignment - return required GTT alignment for an
 *					 unfenced object
 * @dev: the device
 * @size: size of the object
 * @tiling_mode: tiling mode of the object
 *
 * Return the required GTT alignment for an object, only taking into account
 * unfenced tiled surface requirements.
 */
uint32_t
i915_gem_get_unfenced_gtt_alignment(struct drm_device *dev,
				    uint32_t size,
				    int tiling_mode)
{
	/*
	 * Minimum alignment is 4k (GTT page size) for sane hw.
	 */
	if (INTEL_INFO(dev)->gen >= 4 || IS_G33(dev) ||
	    tiling_mode == I915_TILING_NONE)
		return 4096;

	/* Previous hardware however needs to be aligned to a power-of-two
	 * tile height. The simplest method for determining this is to reuse
	 * the power-of-two object size.
	 */
	return i915_gem_get_gtt_size(dev, size, tiling_mode);
}

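/* Look up the object for the given handle and return the fake offset through
 * which userspace can mmap it via the GTT, creating the mmap offset on first
 * use.  Purgeable objects and objects larger than the mappable aperture are
 * rejected.
 */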
int
i915_gem_mmap_gtt(struct drm_file *file,
		  struct drm_device *dev,
		  uint32_t handle,
		  uint64_t *offset)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_gem_object *obj;
	int ret;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	ret = i915_mutex_lock_interruptible(dev);
	if (ret)
		return ret;

	obj = to_intel_bo(drm_gem_object_lookup(dev, file, handle));
	if (&obj->base == NULL) {
		ret = -ENOENT;
		goto unlock;
	}

	if (obj->base.size > dev_priv->mm.gtt_mappable_end) {
		ret = -E2BIG;
		goto out;
	}

	if (obj->madv != I915_MADV_WILLNEED) {
		DRM_ERROR("Attempting to mmap a purgeable buffer\n");
		ret = -EINVAL;
		goto out;
	}

	if (!obj->base.map_list.map) {
		ret = drm_gem_create_mmap_offset(&obj->base);
		if (ret)
			goto out;
	}

	*offset = (u64)obj->base.map_list.hash.key << PAGE_SHIFT;

out:
	drm_gem_object_unreference(&obj->base);
unlock:
	mutex_unlock(&dev->struct_mutex);
	return ret;
}

Dave Airlieff72145b2011-02-07 12:16:14 +10001231/**
1232 * i915_gem_mmap_gtt_ioctl - prepare an object for GTT mmap'ing
1233 * @dev: DRM device
1234 * @data: GTT mapping ioctl data
		1235	 * @file: DRM file holding the GEM handle
1236 *
1237 * Simply returns the fake offset to userspace so it can mmap it.
1238 * The mmap call will end up in drm_gem_mmap(), which will set things
1239 * up so we can get faults in the handler above.
1240 *
1241 * The fault handler will take care of binding the object into the GTT
1242 * (since it may have been evicted to make room for something), allocating
1243 * a fence register, and mapping the appropriate aperture address into
1244 * userspace.
1245 */
1246int
1247i915_gem_mmap_gtt_ioctl(struct drm_device *dev, void *data,
1248 struct drm_file *file)
1249{
1250 struct drm_i915_gem_mmap_gtt *args = data;
1251
1252 if (!(dev->driver->driver_features & DRIVER_GEM))
1253 return -ENODEV;
1254
1255 return i915_gem_mmap_gtt(file, dev, args->handle, &args->offset);
1256}
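/*
 * Usage sketch for the GTT mmap ioctl above: userspace typically fetches the
 * fake offset through DRM_IOCTL_I915_GEM_MMAP_GTT and passes it straight to
 * mmap() on the DRM fd, roughly:
 *
 *	struct drm_i915_gem_mmap_gtt arg = { .handle = handle };
 *	ioctl(fd, DRM_IOCTL_I915_GEM_MMAP_GTT, &arg);
 *	ptr = mmap(NULL, size, PROT_READ | PROT_WRITE, MAP_SHARED,
 *		   fd, arg.offset);
 *
 * The actual GTT binding then happens lazily in the fault handler.
 */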
1257
1258
Chris Wilsone5281cc2010-10-28 13:45:36 +01001259static int
Chris Wilson05394f32010-11-08 19:18:58 +00001260i915_gem_object_get_pages_gtt(struct drm_i915_gem_object *obj,
Chris Wilsone5281cc2010-10-28 13:45:36 +01001261 gfp_t gfpmask)
1262{
Chris Wilsone5281cc2010-10-28 13:45:36 +01001263 int page_count, i;
1264 struct address_space *mapping;
1265 struct inode *inode;
1266 struct page *page;
1267
1268 /* Get the list of pages out of our struct file. They'll be pinned
1269 * at this point until we release them.
1270 */
Chris Wilson05394f32010-11-08 19:18:58 +00001271 page_count = obj->base.size / PAGE_SIZE;
1272 BUG_ON(obj->pages != NULL);
1273 obj->pages = drm_malloc_ab(page_count, sizeof(struct page *));
1274 if (obj->pages == NULL)
Chris Wilsone5281cc2010-10-28 13:45:36 +01001275 return -ENOMEM;
1276
Chris Wilson05394f32010-11-08 19:18:58 +00001277 inode = obj->base.filp->f_path.dentry->d_inode;
Chris Wilsone5281cc2010-10-28 13:45:36 +01001278 mapping = inode->i_mapping;
Hugh Dickins5949eac2011-06-27 16:18:18 -07001279 gfpmask |= mapping_gfp_mask(mapping);
1280
Chris Wilsone5281cc2010-10-28 13:45:36 +01001281 for (i = 0; i < page_count; i++) {
Hugh Dickins5949eac2011-06-27 16:18:18 -07001282 page = shmem_read_mapping_page_gfp(mapping, i, gfpmask);
Chris Wilsone5281cc2010-10-28 13:45:36 +01001283 if (IS_ERR(page))
1284 goto err_pages;
1285
Chris Wilson05394f32010-11-08 19:18:58 +00001286 obj->pages[i] = page;
Chris Wilsone5281cc2010-10-28 13:45:36 +01001287 }
1288
Daniel Vetter6dacfd22011-09-12 21:30:02 +02001289 if (i915_gem_object_needs_bit17_swizzle(obj))
Chris Wilsone5281cc2010-10-28 13:45:36 +01001290 i915_gem_object_do_bit_17_swizzle(obj);
1291
1292 return 0;
1293
1294err_pages:
1295 while (i--)
Chris Wilson05394f32010-11-08 19:18:58 +00001296 page_cache_release(obj->pages[i]);
Chris Wilsone5281cc2010-10-28 13:45:36 +01001297
Chris Wilson05394f32010-11-08 19:18:58 +00001298 drm_free_large(obj->pages);
1299 obj->pages = NULL;
Chris Wilsone5281cc2010-10-28 13:45:36 +01001300 return PTR_ERR(page);
1301}
1302
Chris Wilson5cdf5882010-09-27 15:51:07 +01001303static void
Chris Wilson05394f32010-11-08 19:18:58 +00001304i915_gem_object_put_pages_gtt(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07001305{
Chris Wilson05394f32010-11-08 19:18:58 +00001306 int page_count = obj->base.size / PAGE_SIZE;
Eric Anholt673a3942008-07-30 12:06:12 -07001307 int i;
1308
Chris Wilson05394f32010-11-08 19:18:58 +00001309 BUG_ON(obj->madv == __I915_MADV_PURGED);
Eric Anholt856fa192009-03-19 14:10:50 -07001310
Daniel Vetter6dacfd22011-09-12 21:30:02 +02001311 if (i915_gem_object_needs_bit17_swizzle(obj))
Eric Anholt280b7132009-03-12 16:56:27 -07001312 i915_gem_object_save_bit_17_swizzle(obj);
1313
Chris Wilson05394f32010-11-08 19:18:58 +00001314 if (obj->madv == I915_MADV_DONTNEED)
1315 obj->dirty = 0;
Chris Wilson3ef94da2009-09-14 16:50:29 +01001316
1317 for (i = 0; i < page_count; i++) {
Chris Wilson05394f32010-11-08 19:18:58 +00001318 if (obj->dirty)
1319 set_page_dirty(obj->pages[i]);
Chris Wilson3ef94da2009-09-14 16:50:29 +01001320
Chris Wilson05394f32010-11-08 19:18:58 +00001321 if (obj->madv == I915_MADV_WILLNEED)
1322 mark_page_accessed(obj->pages[i]);
Chris Wilson3ef94da2009-09-14 16:50:29 +01001323
Chris Wilson05394f32010-11-08 19:18:58 +00001324 page_cache_release(obj->pages[i]);
Chris Wilson3ef94da2009-09-14 16:50:29 +01001325 }
Chris Wilson05394f32010-11-08 19:18:58 +00001326 obj->dirty = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001327
Chris Wilson05394f32010-11-08 19:18:58 +00001328 drm_free_large(obj->pages);
1329 obj->pages = NULL;
Eric Anholt673a3942008-07-30 12:06:12 -07001330}
1331
Chris Wilson54cf91d2010-11-25 18:00:26 +00001332void
Chris Wilson05394f32010-11-08 19:18:58 +00001333i915_gem_object_move_to_active(struct drm_i915_gem_object *obj,
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001334 struct intel_ring_buffer *ring,
1335 u32 seqno)
Eric Anholt673a3942008-07-30 12:06:12 -07001336{
Chris Wilson05394f32010-11-08 19:18:58 +00001337 struct drm_device *dev = obj->base.dev;
Chris Wilson69dc4982010-10-19 10:36:51 +01001338 struct drm_i915_private *dev_priv = dev->dev_private;
Daniel Vetter617dbe22010-02-11 22:16:02 +01001339
Zou Nan hai852835f2010-05-21 09:08:56 +08001340 BUG_ON(ring == NULL);
Chris Wilson05394f32010-11-08 19:18:58 +00001341 obj->ring = ring;
Eric Anholt673a3942008-07-30 12:06:12 -07001342
1343 /* Add a reference if we're newly entering the active list. */
Chris Wilson05394f32010-11-08 19:18:58 +00001344 if (!obj->active) {
1345 drm_gem_object_reference(&obj->base);
1346 obj->active = 1;
Eric Anholt673a3942008-07-30 12:06:12 -07001347 }
Daniel Vettere35a41d2010-02-11 22:13:59 +01001348
Eric Anholt673a3942008-07-30 12:06:12 -07001349 /* Move from whatever list we were on to the tail of execution. */
Chris Wilson05394f32010-11-08 19:18:58 +00001350 list_move_tail(&obj->mm_list, &dev_priv->mm.active_list);
1351 list_move_tail(&obj->ring_list, &ring->active_list);
Chris Wilsoncaea7472010-11-12 13:53:37 +00001352
Chris Wilson05394f32010-11-08 19:18:58 +00001353 obj->last_rendering_seqno = seqno;
Chris Wilsoncaea7472010-11-12 13:53:37 +00001354 if (obj->fenced_gpu_access) {
1355 struct drm_i915_fence_reg *reg;
1356
1357 BUG_ON(obj->fence_reg == I915_FENCE_REG_NONE);
1358
1359 obj->last_fenced_seqno = seqno;
1360 obj->last_fenced_ring = ring;
1361
1362 reg = &dev_priv->fence_regs[obj->fence_reg];
1363 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
1364 }
1365}
1366
1367static void
1368i915_gem_object_move_off_active(struct drm_i915_gem_object *obj)
1369{
1370 list_del_init(&obj->ring_list);
1371 obj->last_rendering_seqno = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001372}
1373
Eric Anholtce44b0e2008-11-06 16:00:31 -08001374static void
Chris Wilson05394f32010-11-08 19:18:58 +00001375i915_gem_object_move_to_flushing(struct drm_i915_gem_object *obj)
Eric Anholtce44b0e2008-11-06 16:00:31 -08001376{
Chris Wilson05394f32010-11-08 19:18:58 +00001377 struct drm_device *dev = obj->base.dev;
Eric Anholtce44b0e2008-11-06 16:00:31 -08001378 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholtce44b0e2008-11-06 16:00:31 -08001379
Chris Wilson05394f32010-11-08 19:18:58 +00001380 BUG_ON(!obj->active);
1381 list_move_tail(&obj->mm_list, &dev_priv->mm.flushing_list);
Chris Wilsoncaea7472010-11-12 13:53:37 +00001382
1383 i915_gem_object_move_off_active(obj);
1384}
1385
1386static void
1387i915_gem_object_move_to_inactive(struct drm_i915_gem_object *obj)
1388{
1389 struct drm_device *dev = obj->base.dev;
1390 struct drm_i915_private *dev_priv = dev->dev_private;
1391
1392 if (obj->pin_count != 0)
1393 list_move_tail(&obj->mm_list, &dev_priv->mm.pinned_list);
1394 else
1395 list_move_tail(&obj->mm_list, &dev_priv->mm.inactive_list);
1396
1397 BUG_ON(!list_empty(&obj->gpu_write_list));
1398 BUG_ON(!obj->active);
1399 obj->ring = NULL;
1400
1401 i915_gem_object_move_off_active(obj);
1402 obj->fenced_gpu_access = false;
Chris Wilsoncaea7472010-11-12 13:53:37 +00001403
1404 obj->active = 0;
Chris Wilson87ca9c82010-12-02 09:42:56 +00001405 obj->pending_gpu_write = false;
Chris Wilsoncaea7472010-11-12 13:53:37 +00001406 drm_gem_object_unreference(&obj->base);
1407
1408 WARN_ON(i915_verify_lists(dev));
Eric Anholtce44b0e2008-11-06 16:00:31 -08001409}
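/*
 * Summary of the transitions above: an object gains a reference and joins
 * the active list when the GPU starts using it, is moved to the flushing
 * list while it still has a pending GPU write domain, and finally lands on
 * the inactive (or pinned) list, dropping that reference, once all
 * rendering to it has retired.
 */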
Eric Anholt673a3942008-07-30 12:06:12 -07001410
Chris Wilson963b4832009-09-20 23:03:54 +01001411/* Immediately discard the backing storage */
1412static void
Chris Wilson05394f32010-11-08 19:18:58 +00001413i915_gem_object_truncate(struct drm_i915_gem_object *obj)
Chris Wilson963b4832009-09-20 23:03:54 +01001414{
Chris Wilsonbb6baf72009-09-22 14:24:13 +01001415 struct inode *inode;
Chris Wilson963b4832009-09-20 23:03:54 +01001416
Chris Wilsonae9fed62010-08-07 11:01:30 +01001417 /* Our goal here is to return as much of the memory as
		1418	 * possible back to the system, since we are called from OOM.
1419 * To do this we must instruct the shmfs to drop all of its
Hugh Dickinse2377fe2011-06-27 16:18:19 -07001420 * backing pages, *now*.
Chris Wilsonae9fed62010-08-07 11:01:30 +01001421 */
Chris Wilson05394f32010-11-08 19:18:58 +00001422 inode = obj->base.filp->f_path.dentry->d_inode;
Hugh Dickinse2377fe2011-06-27 16:18:19 -07001423 shmem_truncate_range(inode, 0, (loff_t)-1);
Chris Wilsonbb6baf72009-09-22 14:24:13 +01001424
Chris Wilsona14917e2012-02-24 21:13:38 +00001425 if (obj->base.map_list.map)
1426 drm_gem_free_mmap_offset(&obj->base);
1427
Chris Wilson05394f32010-11-08 19:18:58 +00001428 obj->madv = __I915_MADV_PURGED;
Chris Wilson963b4832009-09-20 23:03:54 +01001429}
1430
1431static inline int
Chris Wilson05394f32010-11-08 19:18:58 +00001432i915_gem_object_is_purgeable(struct drm_i915_gem_object *obj)
Chris Wilson963b4832009-09-20 23:03:54 +01001433{
Chris Wilson05394f32010-11-08 19:18:58 +00001434 return obj->madv == I915_MADV_DONTNEED;
Chris Wilson963b4832009-09-20 23:03:54 +01001435}
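/*
 * An object is purgeable when userspace has marked it I915_MADV_DONTNEED;
 * once the backing store has actually been discarded by the truncate above,
 * the object is flagged __I915_MADV_PURGED and its contents are gone for
 * good.
 */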
1436
Eric Anholt673a3942008-07-30 12:06:12 -07001437static void
Chris Wilsondb53a302011-02-03 11:57:46 +00001438i915_gem_process_flushing_list(struct intel_ring_buffer *ring,
1439 uint32_t flush_domains)
Daniel Vetter63560392010-02-19 11:51:59 +01001440{
Chris Wilson05394f32010-11-08 19:18:58 +00001441 struct drm_i915_gem_object *obj, *next;
Daniel Vetter63560392010-02-19 11:51:59 +01001442
Chris Wilson05394f32010-11-08 19:18:58 +00001443 list_for_each_entry_safe(obj, next,
Chris Wilson64193402010-10-24 12:38:05 +01001444 &ring->gpu_write_list,
Daniel Vetter63560392010-02-19 11:51:59 +01001445 gpu_write_list) {
Chris Wilson05394f32010-11-08 19:18:58 +00001446 if (obj->base.write_domain & flush_domains) {
1447 uint32_t old_write_domain = obj->base.write_domain;
Daniel Vetter63560392010-02-19 11:51:59 +01001448
Chris Wilson05394f32010-11-08 19:18:58 +00001449 obj->base.write_domain = 0;
1450 list_del_init(&obj->gpu_write_list);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001451 i915_gem_object_move_to_active(obj, ring,
Chris Wilsondb53a302011-02-03 11:57:46 +00001452 i915_gem_next_request_seqno(ring));
Daniel Vetter63560392010-02-19 11:51:59 +01001453
Daniel Vetter63560392010-02-19 11:51:59 +01001454 trace_i915_gem_object_change_domain(obj,
Chris Wilson05394f32010-11-08 19:18:58 +00001455 obj->base.read_domains,
Daniel Vetter63560392010-02-19 11:51:59 +01001456 old_write_domain);
1457 }
1458 }
1459}
Zou Nan hai8187a2b2010-05-21 09:08:55 +08001460
Daniel Vetter53d227f2012-01-25 16:32:49 +01001461static u32
1462i915_gem_get_seqno(struct drm_device *dev)
1463{
1464 drm_i915_private_t *dev_priv = dev->dev_private;
1465 u32 seqno = dev_priv->next_seqno;
1466
1467 /* reserve 0 for non-seqno */
1468 if (++dev_priv->next_seqno == 0)
1469 dev_priv->next_seqno = 1;
1470
1471 return seqno;
1472}
1473
1474u32
1475i915_gem_next_request_seqno(struct intel_ring_buffer *ring)
1476{
1477 if (ring->outstanding_lazy_request == 0)
1478 ring->outstanding_lazy_request = i915_gem_get_seqno(ring->dev);
1479
1480 return ring->outstanding_lazy_request;
1481}
1482
Chris Wilson3cce4692010-10-27 16:11:02 +01001483int
Chris Wilsondb53a302011-02-03 11:57:46 +00001484i915_add_request(struct intel_ring_buffer *ring,
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001485 struct drm_file *file,
Chris Wilsondb53a302011-02-03 11:57:46 +00001486 struct drm_i915_gem_request *request)
Eric Anholt673a3942008-07-30 12:06:12 -07001487{
Chris Wilsondb53a302011-02-03 11:57:46 +00001488 drm_i915_private_t *dev_priv = ring->dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07001489 uint32_t seqno;
Chris Wilsona71d8d92012-02-15 11:25:36 +00001490 u32 request_ring_position;
Eric Anholt673a3942008-07-30 12:06:12 -07001491 int was_empty;
Chris Wilson3cce4692010-10-27 16:11:02 +01001492 int ret;
1493
1494 BUG_ON(request == NULL);
Daniel Vetter53d227f2012-01-25 16:32:49 +01001495 seqno = i915_gem_next_request_seqno(ring);
Eric Anholt673a3942008-07-30 12:06:12 -07001496
Chris Wilsona71d8d92012-02-15 11:25:36 +00001497 /* Record the position of the start of the request so that
1498 * should we detect the updated seqno part-way through the
1499 * GPU processing the request, we never over-estimate the
1500 * position of the head.
1501 */
1502 request_ring_position = intel_ring_get_tail(ring);
1503
Chris Wilson3cce4692010-10-27 16:11:02 +01001504 ret = ring->add_request(ring, &seqno);
1505 if (ret)
1506 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07001507
Chris Wilsondb53a302011-02-03 11:57:46 +00001508 trace_i915_gem_request_add(ring, seqno);
Eric Anholt673a3942008-07-30 12:06:12 -07001509
1510 request->seqno = seqno;
Zou Nan hai852835f2010-05-21 09:08:56 +08001511 request->ring = ring;
Chris Wilsona71d8d92012-02-15 11:25:36 +00001512 request->tail = request_ring_position;
Eric Anholt673a3942008-07-30 12:06:12 -07001513 request->emitted_jiffies = jiffies;
Zou Nan hai852835f2010-05-21 09:08:56 +08001514 was_empty = list_empty(&ring->request_list);
1515 list_add_tail(&request->list, &ring->request_list);
1516
Chris Wilsondb53a302011-02-03 11:57:46 +00001517 if (file) {
1518 struct drm_i915_file_private *file_priv = file->driver_priv;
1519
Chris Wilson1c255952010-09-26 11:03:27 +01001520 spin_lock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001521 request->file_priv = file_priv;
Eric Anholtb9624422009-06-03 07:27:35 +00001522 list_add_tail(&request->client_list,
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001523 &file_priv->mm.request_list);
Chris Wilson1c255952010-09-26 11:03:27 +01001524 spin_unlock(&file_priv->mm.lock);
Eric Anholtb9624422009-06-03 07:27:35 +00001525 }
Eric Anholt673a3942008-07-30 12:06:12 -07001526
Daniel Vetter5391d0c2012-01-25 14:03:57 +01001527 ring->outstanding_lazy_request = 0;
Chris Wilsondb53a302011-02-03 11:57:46 +00001528
Ben Gamarif65d9422009-09-14 17:48:44 -04001529 if (!dev_priv->mm.suspended) {
Ben Widawsky3e0dc6b2011-06-29 10:26:42 -07001530 if (i915_enable_hangcheck) {
1531 mod_timer(&dev_priv->hangcheck_timer,
1532 jiffies +
1533 msecs_to_jiffies(DRM_I915_HANGCHECK_PERIOD));
1534 }
Ben Gamarif65d9422009-09-14 17:48:44 -04001535 if (was_empty)
Chris Wilsonb3b079d2010-09-13 23:44:34 +01001536 queue_delayed_work(dev_priv->wq,
1537 &dev_priv->mm.retire_work, HZ);
Ben Gamarif65d9422009-09-14 17:48:44 -04001538 }
Chris Wilson3cce4692010-10-27 16:11:02 +01001539 return 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001540}
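/*
 * Typical i915_add_request() caller pattern (cf. the retire work handler
 * below): the request is allocated by the caller and ownership passes to
 * the ring on success, so it must be freed on failure, roughly:
 *
 *	request = kzalloc(sizeof(*request), GFP_KERNEL);
 *	if (request == NULL || i915_add_request(ring, NULL, request))
 *		kfree(request);
 */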
1541
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001542static inline void
1543i915_gem_request_remove_from_client(struct drm_i915_gem_request *request)
Eric Anholt673a3942008-07-30 12:06:12 -07001544{
Chris Wilson1c255952010-09-26 11:03:27 +01001545 struct drm_i915_file_private *file_priv = request->file_priv;
Eric Anholt673a3942008-07-30 12:06:12 -07001546
Chris Wilson1c255952010-09-26 11:03:27 +01001547 if (!file_priv)
1548 return;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01001549
Chris Wilson1c255952010-09-26 11:03:27 +01001550 spin_lock(&file_priv->mm.lock);
Herton Ronaldo Krzesinski09bfa512011-03-17 13:45:12 +00001551 if (request->file_priv) {
1552 list_del(&request->client_list);
1553 request->file_priv = NULL;
1554 }
Chris Wilson1c255952010-09-26 11:03:27 +01001555 spin_unlock(&file_priv->mm.lock);
Eric Anholt673a3942008-07-30 12:06:12 -07001556}
1557
Chris Wilsondfaae392010-09-22 10:31:52 +01001558static void i915_gem_reset_ring_lists(struct drm_i915_private *dev_priv,
1559 struct intel_ring_buffer *ring)
Chris Wilson9375e442010-09-19 12:21:28 +01001560{
Chris Wilsondfaae392010-09-22 10:31:52 +01001561 while (!list_empty(&ring->request_list)) {
1562 struct drm_i915_gem_request *request;
Chris Wilson9375e442010-09-19 12:21:28 +01001563
Chris Wilsondfaae392010-09-22 10:31:52 +01001564 request = list_first_entry(&ring->request_list,
1565 struct drm_i915_gem_request,
1566 list);
1567
1568 list_del(&request->list);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001569 i915_gem_request_remove_from_client(request);
Chris Wilsondfaae392010-09-22 10:31:52 +01001570 kfree(request);
1571 }
1572
1573 while (!list_empty(&ring->active_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001574 struct drm_i915_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07001575
Chris Wilson05394f32010-11-08 19:18:58 +00001576 obj = list_first_entry(&ring->active_list,
1577 struct drm_i915_gem_object,
1578 ring_list);
Eric Anholt673a3942008-07-30 12:06:12 -07001579
Chris Wilson05394f32010-11-08 19:18:58 +00001580 obj->base.write_domain = 0;
1581 list_del_init(&obj->gpu_write_list);
1582 i915_gem_object_move_to_inactive(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001583 }
Eric Anholt673a3942008-07-30 12:06:12 -07001584}
1585
Chris Wilson312817a2010-11-22 11:50:11 +00001586static void i915_gem_reset_fences(struct drm_device *dev)
1587{
1588 struct drm_i915_private *dev_priv = dev->dev_private;
1589 int i;
1590
Daniel Vetter4b9de732011-10-09 21:52:02 +02001591 for (i = 0; i < dev_priv->num_fence_regs; i++) {
Chris Wilson312817a2010-11-22 11:50:11 +00001592 struct drm_i915_fence_reg *reg = &dev_priv->fence_regs[i];
Chris Wilson7d2cb392010-11-27 17:38:29 +00001593 struct drm_i915_gem_object *obj = reg->obj;
1594
1595 if (!obj)
1596 continue;
1597
1598 if (obj->tiling_mode)
1599 i915_gem_release_mmap(obj);
1600
Chris Wilsond9e86c02010-11-10 16:40:20 +00001601 reg->obj->fence_reg = I915_FENCE_REG_NONE;
1602 reg->obj->fenced_gpu_access = false;
1603 reg->obj->last_fenced_seqno = 0;
1604 reg->obj->last_fenced_ring = NULL;
1605 i915_gem_clear_fence_reg(dev, reg);
Chris Wilson312817a2010-11-22 11:50:11 +00001606 }
1607}
1608
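/*
 * i915_gem_reset - clean up GEM bookkeeping after a GPU reset: drop all
 * outstanding requests, move active and flushing objects to the inactive
 * list (their contents are assumed lost), and invalidate every fence
 * register.
 */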
Chris Wilson069efc12010-09-30 16:53:18 +01001609void i915_gem_reset(struct drm_device *dev)
Eric Anholt673a3942008-07-30 12:06:12 -07001610{
Chris Wilsondfaae392010-09-22 10:31:52 +01001611 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00001612 struct drm_i915_gem_object *obj;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001613 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07001614
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001615 for (i = 0; i < I915_NUM_RINGS; i++)
1616 i915_gem_reset_ring_lists(dev_priv, &dev_priv->ring[i]);
Chris Wilsondfaae392010-09-22 10:31:52 +01001617
1618 /* Remove anything from the flushing lists. The GPU cache is likely
1619 * to be lost on reset along with the data, so simply move the
1620 * lost bo to the inactive list.
1621 */
1622 while (!list_empty(&dev_priv->mm.flushing_list)) {
Akshay Joshi0206e352011-08-16 15:34:10 -04001623 obj = list_first_entry(&dev_priv->mm.flushing_list,
Chris Wilson05394f32010-11-08 19:18:58 +00001624 struct drm_i915_gem_object,
1625 mm_list);
Chris Wilson9375e442010-09-19 12:21:28 +01001626
Chris Wilson05394f32010-11-08 19:18:58 +00001627 obj->base.write_domain = 0;
1628 list_del_init(&obj->gpu_write_list);
1629 i915_gem_object_move_to_inactive(obj);
Chris Wilson9375e442010-09-19 12:21:28 +01001630 }
Chris Wilson9375e442010-09-19 12:21:28 +01001631
Chris Wilsondfaae392010-09-22 10:31:52 +01001632 /* Move everything out of the GPU domains to ensure we do any
1633 * necessary invalidation upon reuse.
1634 */
Chris Wilson05394f32010-11-08 19:18:58 +00001635 list_for_each_entry(obj,
Chris Wilson77f01232010-09-19 12:31:36 +01001636 &dev_priv->mm.inactive_list,
Chris Wilson69dc4982010-10-19 10:36:51 +01001637 mm_list)
Chris Wilson77f01232010-09-19 12:31:36 +01001638 {
Chris Wilson05394f32010-11-08 19:18:58 +00001639 obj->base.read_domains &= ~I915_GEM_GPU_DOMAINS;
Chris Wilson77f01232010-09-19 12:31:36 +01001640 }
Chris Wilson069efc12010-09-30 16:53:18 +01001641
1642 /* The fence registers are invalidated so clear them out */
Chris Wilson312817a2010-11-22 11:50:11 +00001643 i915_gem_reset_fences(dev);
Eric Anholt673a3942008-07-30 12:06:12 -07001644}
1645
1646/**
1647 * This function clears the request list as sequence numbers are passed.
1648 */
Chris Wilsona71d8d92012-02-15 11:25:36 +00001649void
Chris Wilsondb53a302011-02-03 11:57:46 +00001650i915_gem_retire_requests_ring(struct intel_ring_buffer *ring)
Eric Anholt673a3942008-07-30 12:06:12 -07001651{
Eric Anholt673a3942008-07-30 12:06:12 -07001652 uint32_t seqno;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001653 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07001654
Chris Wilsondb53a302011-02-03 11:57:46 +00001655 if (list_empty(&ring->request_list))
Karsten Wiese6c0594a2009-02-23 15:07:57 +01001656 return;
1657
Chris Wilsondb53a302011-02-03 11:57:46 +00001658 WARN_ON(i915_verify_lists(ring->dev));
Eric Anholt673a3942008-07-30 12:06:12 -07001659
Chris Wilson78501ea2010-10-27 12:18:21 +01001660 seqno = ring->get_seqno(ring);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001661
Chris Wilson076e2c02011-01-21 10:07:18 +00001662 for (i = 0; i < ARRAY_SIZE(ring->sync_seqno); i++)
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001663 if (seqno >= ring->sync_seqno[i])
1664 ring->sync_seqno[i] = 0;
1665
Zou Nan hai852835f2010-05-21 09:08:56 +08001666 while (!list_empty(&ring->request_list)) {
Eric Anholt673a3942008-07-30 12:06:12 -07001667 struct drm_i915_gem_request *request;
Eric Anholt673a3942008-07-30 12:06:12 -07001668
Zou Nan hai852835f2010-05-21 09:08:56 +08001669 request = list_first_entry(&ring->request_list,
Eric Anholt673a3942008-07-30 12:06:12 -07001670 struct drm_i915_gem_request,
1671 list);
Eric Anholt673a3942008-07-30 12:06:12 -07001672
Chris Wilsondfaae392010-09-22 10:31:52 +01001673 if (!i915_seqno_passed(seqno, request->seqno))
Eric Anholt673a3942008-07-30 12:06:12 -07001674 break;
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001675
Chris Wilsondb53a302011-02-03 11:57:46 +00001676 trace_i915_gem_request_retire(ring, request->seqno);
Chris Wilsona71d8d92012-02-15 11:25:36 +00001677 /* We know the GPU must have read the request to have
1678 * sent us the seqno + interrupt, so use the position
		1679	 * of the tail of the request to update the last known position
1680 * of the GPU head.
1681 */
1682 ring->last_retired_head = request->tail;
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001683
1684 list_del(&request->list);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001685 i915_gem_request_remove_from_client(request);
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001686 kfree(request);
1687 }
1688
1689 /* Move any buffers on the active list that are no longer referenced
1690 * by the ringbuffer to the flushing/inactive lists as appropriate.
1691 */
1692 while (!list_empty(&ring->active_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001693 struct drm_i915_gem_object *obj;
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001694
Akshay Joshi0206e352011-08-16 15:34:10 -04001695 obj = list_first_entry(&ring->active_list,
Chris Wilson05394f32010-11-08 19:18:58 +00001696 struct drm_i915_gem_object,
1697 ring_list);
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001698
Chris Wilson05394f32010-11-08 19:18:58 +00001699 if (!i915_seqno_passed(seqno, obj->last_rendering_seqno))
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001700 break;
1701
Chris Wilson05394f32010-11-08 19:18:58 +00001702 if (obj->base.write_domain != 0)
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001703 i915_gem_object_move_to_flushing(obj);
1704 else
1705 i915_gem_object_move_to_inactive(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001706 }
Chris Wilson9d34e5d2009-09-24 05:26:06 +01001707
Chris Wilsondb53a302011-02-03 11:57:46 +00001708 if (unlikely(ring->trace_irq_seqno &&
1709 i915_seqno_passed(seqno, ring->trace_irq_seqno))) {
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001710 ring->irq_put(ring);
Chris Wilsondb53a302011-02-03 11:57:46 +00001711 ring->trace_irq_seqno = 0;
Chris Wilson9d34e5d2009-09-24 05:26:06 +01001712 }
Chris Wilson23bc5982010-09-29 16:10:57 +01001713
Chris Wilsondb53a302011-02-03 11:57:46 +00001714 WARN_ON(i915_verify_lists(ring->dev));
Eric Anholt673a3942008-07-30 12:06:12 -07001715}
1716
1717void
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001718i915_gem_retire_requests(struct drm_device *dev)
1719{
1720 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001721 int i;
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001722
Chris Wilsonbe726152010-07-23 23:18:50 +01001723 if (!list_empty(&dev_priv->mm.deferred_free_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001724 struct drm_i915_gem_object *obj, *next;
Chris Wilsonbe726152010-07-23 23:18:50 +01001725
1726 /* We must be careful that during unbind() we do not
1727 * accidentally infinitely recurse into retire requests.
1728 * Currently:
1729 * retire -> free -> unbind -> wait -> retire_ring
1730 */
Chris Wilson05394f32010-11-08 19:18:58 +00001731 list_for_each_entry_safe(obj, next,
Chris Wilsonbe726152010-07-23 23:18:50 +01001732 &dev_priv->mm.deferred_free_list,
Chris Wilson69dc4982010-10-19 10:36:51 +01001733 mm_list)
Chris Wilson05394f32010-11-08 19:18:58 +00001734 i915_gem_free_object_tail(obj);
Chris Wilsonbe726152010-07-23 23:18:50 +01001735 }
1736
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001737 for (i = 0; i < I915_NUM_RINGS; i++)
Chris Wilsondb53a302011-02-03 11:57:46 +00001738 i915_gem_retire_requests_ring(&dev_priv->ring[i]);
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001739}
1740
Daniel Vetter75ef9da2010-08-21 00:25:16 +02001741static void
Eric Anholt673a3942008-07-30 12:06:12 -07001742i915_gem_retire_work_handler(struct work_struct *work)
1743{
1744 drm_i915_private_t *dev_priv;
1745 struct drm_device *dev;
Chris Wilson0a587052011-01-09 21:05:44 +00001746 bool idle;
1747 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07001748
1749 dev_priv = container_of(work, drm_i915_private_t,
1750 mm.retire_work.work);
1751 dev = dev_priv->dev;
1752
Chris Wilson891b48c2010-09-29 12:26:37 +01001753 /* Come back later if the device is busy... */
1754 if (!mutex_trylock(&dev->struct_mutex)) {
1755 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, HZ);
1756 return;
1757 }
1758
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001759 i915_gem_retire_requests(dev);
Zou Nan haid1b851f2010-05-21 09:08:57 +08001760
Chris Wilson0a587052011-01-09 21:05:44 +00001761 /* Send a periodic flush down the ring so we don't hold onto GEM
1762 * objects indefinitely.
1763 */
1764 idle = true;
1765 for (i = 0; i < I915_NUM_RINGS; i++) {
1766 struct intel_ring_buffer *ring = &dev_priv->ring[i];
1767
1768 if (!list_empty(&ring->gpu_write_list)) {
1769 struct drm_i915_gem_request *request;
1770 int ret;
1771
Chris Wilsondb53a302011-02-03 11:57:46 +00001772 ret = i915_gem_flush_ring(ring,
1773 0, I915_GEM_GPU_DOMAINS);
Chris Wilson0a587052011-01-09 21:05:44 +00001774 request = kzalloc(sizeof(*request), GFP_KERNEL);
1775 if (ret || request == NULL ||
Chris Wilsondb53a302011-02-03 11:57:46 +00001776 i915_add_request(ring, NULL, request))
Chris Wilson0a587052011-01-09 21:05:44 +00001777 kfree(request);
1778 }
1779
1780 idle &= list_empty(&ring->request_list);
1781 }
1782
1783 if (!dev_priv->mm.suspended && !idle)
Eric Anholt9c9fe1f2009-08-03 16:09:16 -07001784 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, HZ);
Chris Wilson0a587052011-01-09 21:05:44 +00001785
Eric Anholt673a3942008-07-30 12:06:12 -07001786 mutex_unlock(&dev->struct_mutex);
1787}
1788
Chris Wilsondb53a302011-02-03 11:57:46 +00001789/**
1790 * Waits for a sequence number to be signaled, and cleans up the
1791 * request and object lists appropriately for that event.
1792 */
Daniel Vetter5a5a0c62009-09-15 22:57:36 +02001793int
Chris Wilsondb53a302011-02-03 11:57:46 +00001794i915_wait_request(struct intel_ring_buffer *ring,
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08001795 uint32_t seqno,
1796 bool do_retire)
Eric Anholt673a3942008-07-30 12:06:12 -07001797{
Chris Wilsondb53a302011-02-03 11:57:46 +00001798 drm_i915_private_t *dev_priv = ring->dev->dev_private;
Jesse Barnes802c7eb2009-05-05 16:03:48 -07001799 u32 ier;
Eric Anholt673a3942008-07-30 12:06:12 -07001800 int ret = 0;
1801
1802 BUG_ON(seqno == 0);
1803
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001804 if (atomic_read(&dev_priv->mm.wedged)) {
1805 struct completion *x = &dev_priv->error_completion;
1806 bool recovery_complete;
1807 unsigned long flags;
1808
1809 /* Give the error handler a chance to run. */
1810 spin_lock_irqsave(&x->wait.lock, flags);
1811 recovery_complete = x->done > 0;
1812 spin_unlock_irqrestore(&x->wait.lock, flags);
1813
1814 return recovery_complete ? -EIO : -EAGAIN;
1815 }
Ben Gamariffed1d02009-09-14 17:48:41 -04001816
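	/*
	 * If we are asked to wait on the ring's outstanding lazy request,
	 * nothing has actually been submitted to the hardware yet; emit a
	 * real request now so there is a seqno to wait for.
	 */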
Chris Wilson5d97eb62010-11-10 20:40:02 +00001817 if (seqno == ring->outstanding_lazy_request) {
Chris Wilson3cce4692010-10-27 16:11:02 +01001818 struct drm_i915_gem_request *request;
1819
1820 request = kzalloc(sizeof(*request), GFP_KERNEL);
1821 if (request == NULL)
Daniel Vettere35a41d2010-02-11 22:13:59 +01001822 return -ENOMEM;
Chris Wilson3cce4692010-10-27 16:11:02 +01001823
Chris Wilsondb53a302011-02-03 11:57:46 +00001824 ret = i915_add_request(ring, NULL, request);
Chris Wilson3cce4692010-10-27 16:11:02 +01001825 if (ret) {
1826 kfree(request);
1827 return ret;
1828 }
1829
1830 seqno = request->seqno;
Daniel Vettere35a41d2010-02-11 22:13:59 +01001831 }
1832
Chris Wilson78501ea2010-10-27 12:18:21 +01001833 if (!i915_seqno_passed(ring->get_seqno(ring), seqno)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00001834 if (HAS_PCH_SPLIT(ring->dev))
Zhenyu Wang036a4a72009-06-08 14:40:19 +08001835 ier = I915_READ(DEIER) | I915_READ(GTIER);
1836 else
1837 ier = I915_READ(IER);
Jesse Barnes802c7eb2009-05-05 16:03:48 -07001838 if (!ier) {
1839 DRM_ERROR("something (likely vbetool) disabled "
1840 "interrupts, re-enabling\n");
Chris Wilsonf01c22f2011-06-28 11:48:51 +01001841 ring->dev->driver->irq_preinstall(ring->dev);
1842 ring->dev->driver->irq_postinstall(ring->dev);
Jesse Barnes802c7eb2009-05-05 16:03:48 -07001843 }
1844
Chris Wilsondb53a302011-02-03 11:57:46 +00001845 trace_i915_gem_request_wait_begin(ring, seqno);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01001846
Chris Wilsonb2223492010-10-27 15:27:33 +01001847 ring->waiting_seqno = seqno;
Chris Wilsonb13c2b92010-12-13 16:54:50 +00001848 if (ring->irq_get(ring)) {
Chris Wilsonce453d82011-02-21 14:43:56 +00001849 if (dev_priv->mm.interruptible)
Chris Wilsonb13c2b92010-12-13 16:54:50 +00001850 ret = wait_event_interruptible(ring->irq_queue,
1851 i915_seqno_passed(ring->get_seqno(ring), seqno)
1852 || atomic_read(&dev_priv->mm.wedged));
1853 else
1854 wait_event(ring->irq_queue,
1855 i915_seqno_passed(ring->get_seqno(ring), seqno)
1856 || atomic_read(&dev_priv->mm.wedged));
Daniel Vetter48764bf2009-09-15 22:57:32 +02001857
Chris Wilsonb13c2b92010-12-13 16:54:50 +00001858 ring->irq_put(ring);
Eric Anholte959b5d2011-12-22 14:55:01 -08001859 } else if (wait_for_atomic(i915_seqno_passed(ring->get_seqno(ring),
1860 seqno) ||
1861 atomic_read(&dev_priv->mm.wedged), 3000))
Chris Wilsonb5ba1772010-12-14 12:17:15 +00001862 ret = -EBUSY;
Chris Wilsonb2223492010-10-27 15:27:33 +01001863 ring->waiting_seqno = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01001864
Chris Wilsondb53a302011-02-03 11:57:46 +00001865 trace_i915_gem_request_wait_end(ring, seqno);
Eric Anholt673a3942008-07-30 12:06:12 -07001866 }
Ben Gamariba1234d2009-09-14 17:48:47 -04001867 if (atomic_read(&dev_priv->mm.wedged))
Chris Wilson30dbf0c2010-09-25 10:19:17 +01001868 ret = -EAGAIN;
Eric Anholt673a3942008-07-30 12:06:12 -07001869
Eric Anholt673a3942008-07-30 12:06:12 -07001870 /* Directly dispatch request retiring. While we have the work queue
1871 * to handle this, the waiter on a request often wants an associated
1872 * buffer to have made it to the inactive list, and we would need
1873 * a separate wait queue to handle that.
1874 */
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08001875 if (ret == 0 && do_retire)
Chris Wilsondb53a302011-02-03 11:57:46 +00001876 i915_gem_retire_requests_ring(ring);
Eric Anholt673a3942008-07-30 12:06:12 -07001877
1878 return ret;
1879}
1880
Daniel Vetter48764bf2009-09-15 22:57:32 +02001881/**
Eric Anholt673a3942008-07-30 12:06:12 -07001882 * Ensures that all rendering to the object has completed and the object is
1883 * safe to unbind from the GTT or access from the CPU.
1884 */
Chris Wilson54cf91d2010-11-25 18:00:26 +00001885int
Chris Wilsonce453d82011-02-21 14:43:56 +00001886i915_gem_object_wait_rendering(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07001887{
Eric Anholt673a3942008-07-30 12:06:12 -07001888 int ret;
1889
Eric Anholte47c68e2008-11-14 13:35:19 -08001890 /* This function only exists to support waiting for existing rendering,
1891 * not for emitting required flushes.
Eric Anholt673a3942008-07-30 12:06:12 -07001892 */
Chris Wilson05394f32010-11-08 19:18:58 +00001893 BUG_ON((obj->base.write_domain & I915_GEM_GPU_DOMAINS) != 0);
Eric Anholt673a3942008-07-30 12:06:12 -07001894
1895 /* If there is rendering queued on the buffer being evicted, wait for
1896 * it.
1897 */
Chris Wilson05394f32010-11-08 19:18:58 +00001898 if (obj->active) {
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08001899 ret = i915_wait_request(obj->ring, obj->last_rendering_seqno,
1900 true);
Chris Wilson2cf34d72010-09-14 13:03:28 +01001901 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07001902 return ret;
1903 }
1904
1905 return 0;
1906}
1907
Chris Wilsonb5ffc9b2011-04-13 22:06:03 +01001908static void i915_gem_object_finish_gtt(struct drm_i915_gem_object *obj)
1909{
1910 u32 old_write_domain, old_read_domains;
1911
Chris Wilsonb5ffc9b2011-04-13 22:06:03 +01001912	/* Act as a barrier for all accesses through the GTT */
1913 mb();
1914
1915 /* Force a pagefault for domain tracking on next user access */
1916 i915_gem_release_mmap(obj);
1917
Keith Packardb97c3d92011-06-24 21:02:59 -07001918 if ((obj->base.read_domains & I915_GEM_DOMAIN_GTT) == 0)
1919 return;
1920
Chris Wilsonb5ffc9b2011-04-13 22:06:03 +01001921 old_read_domains = obj->base.read_domains;
1922 old_write_domain = obj->base.write_domain;
1923
1924 obj->base.read_domains &= ~I915_GEM_DOMAIN_GTT;
1925 obj->base.write_domain &= ~I915_GEM_DOMAIN_GTT;
1926
1927 trace_i915_gem_object_change_domain(obj,
1928 old_read_domains,
1929 old_write_domain);
1930}
1931
Eric Anholt673a3942008-07-30 12:06:12 -07001932/**
1933 * Unbinds an object from the GTT aperture.
1934 */
Jesse Barnes0f973f22009-01-26 17:10:45 -08001935int
Chris Wilson05394f32010-11-08 19:18:58 +00001936i915_gem_object_unbind(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07001937{
Daniel Vetter7bddb012012-02-09 17:15:47 +01001938 drm_i915_private_t *dev_priv = obj->base.dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07001939 int ret = 0;
1940
Chris Wilson05394f32010-11-08 19:18:58 +00001941 if (obj->gtt_space == NULL)
Eric Anholt673a3942008-07-30 12:06:12 -07001942 return 0;
1943
Chris Wilson05394f32010-11-08 19:18:58 +00001944 if (obj->pin_count != 0) {
Eric Anholt673a3942008-07-30 12:06:12 -07001945 DRM_ERROR("Attempting to unbind pinned buffer\n");
1946 return -EINVAL;
1947 }
1948
Chris Wilsona8198ee2011-04-13 22:04:09 +01001949 ret = i915_gem_object_finish_gpu(obj);
Chris Wilson8dc17752010-07-23 23:18:51 +01001950 if (ret == -ERESTARTSYS)
Eric Anholt673a3942008-07-30 12:06:12 -07001951 return ret;
Chris Wilson8dc17752010-07-23 23:18:51 +01001952	/* Continue on if we fail due to EIO: the GPU is hung, so we
		1953	 * should be safe, and we need to clean up or else we might
		1954	 * cause memory corruption through use-after-free.
1955 */
Chris Wilsona8198ee2011-04-13 22:04:09 +01001956
Chris Wilsonb5ffc9b2011-04-13 22:06:03 +01001957 i915_gem_object_finish_gtt(obj);
Chris Wilsona8198ee2011-04-13 22:04:09 +01001958
1959 /* Move the object to the CPU domain to ensure that
1960 * any possible CPU writes while it's not in the GTT
1961 * are flushed when we go to remap it.
1962 */
1963 if (ret == 0)
1964 ret = i915_gem_object_set_to_cpu_domain(obj, 1);
1965 if (ret == -ERESTARTSYS)
1966 return ret;
Chris Wilson812ed4922010-09-30 15:08:57 +01001967 if (ret) {
Chris Wilsona8198ee2011-04-13 22:04:09 +01001968 /* In the event of a disaster, abandon all caches and
1969 * hope for the best.
1970 */
Chris Wilson812ed4922010-09-30 15:08:57 +01001971 i915_gem_clflush_object(obj);
Chris Wilson05394f32010-11-08 19:18:58 +00001972 obj->base.read_domains = obj->base.write_domain = I915_GEM_DOMAIN_CPU;
Chris Wilson812ed4922010-09-30 15:08:57 +01001973 }
Eric Anholt673a3942008-07-30 12:06:12 -07001974
Daniel Vetter96b47b62009-12-15 17:50:00 +01001975 /* release the fence reg _after_ flushing */
Chris Wilsond9e86c02010-11-10 16:40:20 +00001976 ret = i915_gem_object_put_fence(obj);
1977 if (ret == -ERESTARTSYS)
1978 return ret;
Daniel Vetter96b47b62009-12-15 17:50:00 +01001979
Chris Wilsondb53a302011-02-03 11:57:46 +00001980 trace_i915_gem_object_unbind(obj);
1981
Daniel Vetter74898d72012-02-15 23:50:22 +01001982 if (obj->has_global_gtt_mapping)
1983 i915_gem_gtt_unbind_object(obj);
Daniel Vetter7bddb012012-02-09 17:15:47 +01001984 if (obj->has_aliasing_ppgtt_mapping) {
1985 i915_ppgtt_unbind_object(dev_priv->mm.aliasing_ppgtt, obj);
1986 obj->has_aliasing_ppgtt_mapping = 0;
1987 }
Daniel Vetter74163902012-02-15 23:50:21 +01001988 i915_gem_gtt_finish_object(obj);
Daniel Vetter7bddb012012-02-09 17:15:47 +01001989
Chris Wilsone5281cc2010-10-28 13:45:36 +01001990 i915_gem_object_put_pages_gtt(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001991
Chris Wilson6299f992010-11-24 12:23:44 +00001992 list_del_init(&obj->gtt_list);
Chris Wilson05394f32010-11-08 19:18:58 +00001993 list_del_init(&obj->mm_list);
Daniel Vetter75e9e912010-11-04 17:11:09 +01001994 /* Avoid an unnecessary call to unbind on rebind. */
Chris Wilson05394f32010-11-08 19:18:58 +00001995 obj->map_and_fenceable = true;
Eric Anholt673a3942008-07-30 12:06:12 -07001996
Chris Wilson05394f32010-11-08 19:18:58 +00001997 drm_mm_put_block(obj->gtt_space);
1998 obj->gtt_space = NULL;
1999 obj->gtt_offset = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07002000
Chris Wilson05394f32010-11-08 19:18:58 +00002001 if (i915_gem_object_is_purgeable(obj))
Chris Wilson963b4832009-09-20 23:03:54 +01002002 i915_gem_object_truncate(obj);
2003
Chris Wilson8dc17752010-07-23 23:18:51 +01002004 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07002005}
2006
Chris Wilson88241782011-01-07 17:09:48 +00002007int
Chris Wilsondb53a302011-02-03 11:57:46 +00002008i915_gem_flush_ring(struct intel_ring_buffer *ring,
Chris Wilson54cf91d2010-11-25 18:00:26 +00002009 uint32_t invalidate_domains,
2010 uint32_t flush_domains)
2011{
Chris Wilson88241782011-01-07 17:09:48 +00002012 int ret;
2013
Chris Wilson36d527d2011-03-19 22:26:49 +00002014 if (((invalidate_domains | flush_domains) & I915_GEM_GPU_DOMAINS) == 0)
2015 return 0;
2016
Chris Wilsondb53a302011-02-03 11:57:46 +00002017 trace_i915_gem_ring_flush(ring, invalidate_domains, flush_domains);
2018
Chris Wilson88241782011-01-07 17:09:48 +00002019 ret = ring->flush(ring, invalidate_domains, flush_domains);
2020 if (ret)
2021 return ret;
2022
Chris Wilson36d527d2011-03-19 22:26:49 +00002023 if (flush_domains & I915_GEM_GPU_DOMAINS)
2024 i915_gem_process_flushing_list(ring, flush_domains);
2025
Chris Wilson88241782011-01-07 17:09:48 +00002026 return 0;
Chris Wilson54cf91d2010-11-25 18:00:26 +00002027}
2028
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08002029static int i915_ring_idle(struct intel_ring_buffer *ring, bool do_retire)
Chris Wilsona56ba562010-09-28 10:07:56 +01002030{
Chris Wilson88241782011-01-07 17:09:48 +00002031 int ret;
2032
Chris Wilson395b70b2010-10-28 21:28:46 +01002033 if (list_empty(&ring->gpu_write_list) && list_empty(&ring->active_list))
Chris Wilson64193402010-10-24 12:38:05 +01002034 return 0;
2035
Chris Wilson88241782011-01-07 17:09:48 +00002036 if (!list_empty(&ring->gpu_write_list)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002037 ret = i915_gem_flush_ring(ring,
Chris Wilson0ac74c62010-12-06 14:36:02 +00002038 I915_GEM_GPU_DOMAINS, I915_GEM_GPU_DOMAINS);
Chris Wilson88241782011-01-07 17:09:48 +00002039 if (ret)
2040 return ret;
2041 }
2042
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08002043 return i915_wait_request(ring, i915_gem_next_request_seqno(ring),
2044 do_retire);
Chris Wilsona56ba562010-09-28 10:07:56 +01002045}
2046
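/*
 * i915_gpu_idle - flush and drain every ring, waiting for the most recent
 * request on each to complete; when do_retire is set, completed requests
 * are also retired on the spot.
 */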
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08002047int i915_gpu_idle(struct drm_device *dev, bool do_retire)
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002048{
2049 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00002050 int ret, i;
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002051
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002052 /* Flush everything onto the inactive list. */
Chris Wilson1ec14ad2010-12-04 11:30:53 +00002053 for (i = 0; i < I915_NUM_RINGS; i++) {
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08002054 ret = i915_ring_idle(&dev_priv->ring[i], do_retire);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00002055 if (ret)
2056 return ret;
2057 }
Zou Nan haid1b851f2010-05-21 09:08:57 +08002058
Daniel Vetter8a1a49f2010-02-11 22:29:04 +01002059 return 0;
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002060}
2061
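/*
 * The helpers below program one fence register in the layout each hardware
 * generation expects.  The pitch field encodes the stride in tile widths:
 * gen6 and i965 store it directly, e.g. (illustrative numbers) an 8192 byte
 * stride with 128 byte tiles becomes 8192/128 - 1 = 63, while the i915 and
 * i830 paths store its log2, e.g. ffs(8) - 1 = 3 for a stride of eight
 * tiles.
 */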
Daniel Vetterc6642782010-11-12 13:46:18 +00002062static int sandybridge_write_fence_reg(struct drm_i915_gem_object *obj,
2063 struct intel_ring_buffer *pipelined)
Eric Anholt4e901fd2009-10-26 16:44:17 -07002064{
Chris Wilson05394f32010-11-08 19:18:58 +00002065 struct drm_device *dev = obj->base.dev;
Eric Anholt4e901fd2009-10-26 16:44:17 -07002066 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002067 u32 size = obj->gtt_space->size;
2068 int regnum = obj->fence_reg;
Eric Anholt4e901fd2009-10-26 16:44:17 -07002069 uint64_t val;
2070
Chris Wilson05394f32010-11-08 19:18:58 +00002071 val = (uint64_t)((obj->gtt_offset + size - 4096) &
Daniel Vetterc6642782010-11-12 13:46:18 +00002072 0xfffff000) << 32;
Chris Wilson05394f32010-11-08 19:18:58 +00002073 val |= obj->gtt_offset & 0xfffff000;
2074 val |= (uint64_t)((obj->stride / 128) - 1) <<
Eric Anholt4e901fd2009-10-26 16:44:17 -07002075 SANDYBRIDGE_FENCE_PITCH_SHIFT;
2076
Chris Wilson05394f32010-11-08 19:18:58 +00002077 if (obj->tiling_mode == I915_TILING_Y)
Eric Anholt4e901fd2009-10-26 16:44:17 -07002078 val |= 1 << I965_FENCE_TILING_Y_SHIFT;
2079 val |= I965_FENCE_REG_VALID;
2080
Daniel Vetterc6642782010-11-12 13:46:18 +00002081 if (pipelined) {
2082 int ret = intel_ring_begin(pipelined, 6);
2083 if (ret)
2084 return ret;
2085
2086 intel_ring_emit(pipelined, MI_NOOP);
2087 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(2));
2088 intel_ring_emit(pipelined, FENCE_REG_SANDYBRIDGE_0 + regnum*8);
2089 intel_ring_emit(pipelined, (u32)val);
2090 intel_ring_emit(pipelined, FENCE_REG_SANDYBRIDGE_0 + regnum*8 + 4);
2091 intel_ring_emit(pipelined, (u32)(val >> 32));
2092 intel_ring_advance(pipelined);
2093 } else
2094 I915_WRITE64(FENCE_REG_SANDYBRIDGE_0 + regnum * 8, val);
2095
2096 return 0;
Eric Anholt4e901fd2009-10-26 16:44:17 -07002097}
2098
Daniel Vetterc6642782010-11-12 13:46:18 +00002099static int i965_write_fence_reg(struct drm_i915_gem_object *obj,
2100 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002101{
Chris Wilson05394f32010-11-08 19:18:58 +00002102 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002103 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002104 u32 size = obj->gtt_space->size;
2105 int regnum = obj->fence_reg;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002106 uint64_t val;
2107
Chris Wilson05394f32010-11-08 19:18:58 +00002108 val = (uint64_t)((obj->gtt_offset + size - 4096) &
Jesse Barnesde151cf2008-11-12 10:03:55 -08002109 0xfffff000) << 32;
Chris Wilson05394f32010-11-08 19:18:58 +00002110 val |= obj->gtt_offset & 0xfffff000;
2111 val |= ((obj->stride / 128) - 1) << I965_FENCE_PITCH_SHIFT;
2112 if (obj->tiling_mode == I915_TILING_Y)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002113 val |= 1 << I965_FENCE_TILING_Y_SHIFT;
2114 val |= I965_FENCE_REG_VALID;
2115
Daniel Vetterc6642782010-11-12 13:46:18 +00002116 if (pipelined) {
2117 int ret = intel_ring_begin(pipelined, 6);
2118 if (ret)
2119 return ret;
2120
2121 intel_ring_emit(pipelined, MI_NOOP);
2122 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(2));
2123 intel_ring_emit(pipelined, FENCE_REG_965_0 + regnum*8);
2124 intel_ring_emit(pipelined, (u32)val);
2125 intel_ring_emit(pipelined, FENCE_REG_965_0 + regnum*8 + 4);
2126 intel_ring_emit(pipelined, (u32)(val >> 32));
2127 intel_ring_advance(pipelined);
2128 } else
2129 I915_WRITE64(FENCE_REG_965_0 + regnum * 8, val);
2130
2131 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002132}
2133
Daniel Vetterc6642782010-11-12 13:46:18 +00002134static int i915_write_fence_reg(struct drm_i915_gem_object *obj,
2135 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002136{
Chris Wilson05394f32010-11-08 19:18:58 +00002137 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002138 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002139 u32 size = obj->gtt_space->size;
Daniel Vetterc6642782010-11-12 13:46:18 +00002140 u32 fence_reg, val, pitch_val;
Jesse Barnes0f973f22009-01-26 17:10:45 -08002141 int tile_width;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002142
Daniel Vetterc6642782010-11-12 13:46:18 +00002143 if (WARN((obj->gtt_offset & ~I915_FENCE_START_MASK) ||
2144 (size & -size) != size ||
2145 (obj->gtt_offset & (size - 1)),
2146 "object 0x%08x [fenceable? %d] not 1M or pot-size (0x%08x) aligned\n",
2147 obj->gtt_offset, obj->map_and_fenceable, size))
2148 return -EINVAL;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002149
Daniel Vetterc6642782010-11-12 13:46:18 +00002150 if (obj->tiling_mode == I915_TILING_Y && HAS_128_BYTE_Y_TILING(dev))
Jesse Barnes0f973f22009-01-26 17:10:45 -08002151 tile_width = 128;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002152 else
Jesse Barnes0f973f22009-01-26 17:10:45 -08002153 tile_width = 512;
2154
		2155	/* Note: the pitch must be a power-of-two number of tile widths */
Chris Wilson05394f32010-11-08 19:18:58 +00002156 pitch_val = obj->stride / tile_width;
Jesse Barnes0f973f22009-01-26 17:10:45 -08002157 pitch_val = ffs(pitch_val) - 1;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002158
Chris Wilson05394f32010-11-08 19:18:58 +00002159 val = obj->gtt_offset;
2160 if (obj->tiling_mode == I915_TILING_Y)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002161 val |= 1 << I830_FENCE_TILING_Y_SHIFT;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002162 val |= I915_FENCE_SIZE_BITS(size);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002163 val |= pitch_val << I830_FENCE_PITCH_SHIFT;
2164 val |= I830_FENCE_REG_VALID;
2165
Chris Wilson05394f32010-11-08 19:18:58 +00002166 fence_reg = obj->fence_reg;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002167 if (fence_reg < 8)
2168 fence_reg = FENCE_REG_830_0 + fence_reg * 4;
Eric Anholtdc529a42009-03-10 22:34:49 -07002169 else
Chris Wilsona00b10c2010-09-24 21:15:47 +01002170 fence_reg = FENCE_REG_945_8 + (fence_reg - 8) * 4;
Daniel Vetterc6642782010-11-12 13:46:18 +00002171
2172 if (pipelined) {
2173 int ret = intel_ring_begin(pipelined, 4);
2174 if (ret)
2175 return ret;
2176
2177 intel_ring_emit(pipelined, MI_NOOP);
2178 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(1));
2179 intel_ring_emit(pipelined, fence_reg);
2180 intel_ring_emit(pipelined, val);
2181 intel_ring_advance(pipelined);
2182 } else
2183 I915_WRITE(fence_reg, val);
2184
2185 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002186}
2187
Daniel Vetterc6642782010-11-12 13:46:18 +00002188static int i830_write_fence_reg(struct drm_i915_gem_object *obj,
2189 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002190{
Chris Wilson05394f32010-11-08 19:18:58 +00002191 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002192 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002193 u32 size = obj->gtt_space->size;
2194 int regnum = obj->fence_reg;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002195 uint32_t val;
2196 uint32_t pitch_val;
2197
Daniel Vetterc6642782010-11-12 13:46:18 +00002198 if (WARN((obj->gtt_offset & ~I830_FENCE_START_MASK) ||
2199 (size & -size) != size ||
2200 (obj->gtt_offset & (size - 1)),
2201 "object 0x%08x not 512K or pot-size 0x%08x aligned\n",
2202 obj->gtt_offset, size))
2203 return -EINVAL;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002204
Chris Wilson05394f32010-11-08 19:18:58 +00002205 pitch_val = obj->stride / 128;
Eric Anholte76a16d2009-05-26 17:44:56 -07002206 pitch_val = ffs(pitch_val) - 1;
Eric Anholte76a16d2009-05-26 17:44:56 -07002207
Chris Wilson05394f32010-11-08 19:18:58 +00002208 val = obj->gtt_offset;
2209 if (obj->tiling_mode == I915_TILING_Y)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002210 val |= 1 << I830_FENCE_TILING_Y_SHIFT;
Daniel Vetterc6642782010-11-12 13:46:18 +00002211 val |= I830_FENCE_SIZE_BITS(size);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002212 val |= pitch_val << I830_FENCE_PITCH_SHIFT;
2213 val |= I830_FENCE_REG_VALID;
2214
Daniel Vetterc6642782010-11-12 13:46:18 +00002215 if (pipelined) {
2216 int ret = intel_ring_begin(pipelined, 4);
2217 if (ret)
2218 return ret;
2219
2220 intel_ring_emit(pipelined, MI_NOOP);
2221 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(1));
2222 intel_ring_emit(pipelined, FENCE_REG_830_0 + regnum*4);
2223 intel_ring_emit(pipelined, val);
2224 intel_ring_advance(pipelined);
2225 } else
2226 I915_WRITE(FENCE_REG_830_0 + regnum * 4, val);
2227
2228 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002229}
2230
Chris Wilsond9e86c02010-11-10 16:40:20 +00002231static bool ring_passed_seqno(struct intel_ring_buffer *ring, u32 seqno)
2232{
2233 return i915_seqno_passed(ring->get_seqno(ring), seqno);
2234}
2235
2236static int
2237i915_gem_object_flush_fence(struct drm_i915_gem_object *obj,
Chris Wilsonce453d82011-02-21 14:43:56 +00002238 struct intel_ring_buffer *pipelined)
Chris Wilsond9e86c02010-11-10 16:40:20 +00002239{
2240 int ret;
2241
2242 if (obj->fenced_gpu_access) {
Chris Wilson88241782011-01-07 17:09:48 +00002243 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002244 ret = i915_gem_flush_ring(obj->last_fenced_ring,
Chris Wilson88241782011-01-07 17:09:48 +00002245 0, obj->base.write_domain);
2246 if (ret)
2247 return ret;
2248 }
Chris Wilsond9e86c02010-11-10 16:40:20 +00002249
2250 obj->fenced_gpu_access = false;
2251 }
2252
2253 if (obj->last_fenced_seqno && pipelined != obj->last_fenced_ring) {
2254 if (!ring_passed_seqno(obj->last_fenced_ring,
2255 obj->last_fenced_seqno)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002256 ret = i915_wait_request(obj->last_fenced_ring,
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08002257 obj->last_fenced_seqno,
2258 true);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002259 if (ret)
2260 return ret;
2261 }
2262
2263 obj->last_fenced_seqno = 0;
2264 obj->last_fenced_ring = NULL;
2265 }
2266
Chris Wilson63256ec2011-01-04 18:42:07 +00002267 /* Ensure that all CPU reads are completed before installing a fence
2268 * and all writes before removing the fence.
2269 */
2270 if (obj->base.read_domains & I915_GEM_DOMAIN_GTT)
2271 mb();
2272
Chris Wilsond9e86c02010-11-10 16:40:20 +00002273 return 0;
2274}
2275
2276int
2277i915_gem_object_put_fence(struct drm_i915_gem_object *obj)
2278{
2279 int ret;
2280
2281 if (obj->tiling_mode)
2282 i915_gem_release_mmap(obj);
2283
Chris Wilsonce453d82011-02-21 14:43:56 +00002284 ret = i915_gem_object_flush_fence(obj, NULL);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002285 if (ret)
2286 return ret;
2287
2288 if (obj->fence_reg != I915_FENCE_REG_NONE) {
2289 struct drm_i915_private *dev_priv = obj->base.dev->dev_private;
Chris Wilson1690e1e2011-12-14 13:57:08 +01002290
2291 WARN_ON(dev_priv->fence_regs[obj->fence_reg].pin_count);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002292 i915_gem_clear_fence_reg(obj->base.dev,
2293 &dev_priv->fence_regs[obj->fence_reg]);
2294
2295 obj->fence_reg = I915_FENCE_REG_NONE;
2296 }
2297
2298 return 0;
2299}
2300
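/*
 * Fence register selection policy used below: prefer a completely free
 * register, then an unpinned one whose current owner was last fenced on the
 * requested ring (or on no ring at all), and only as a last resort steal the
 * first unpinned register on the LRU list.
 */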
2301static struct drm_i915_fence_reg *
2302i915_find_fence_reg(struct drm_device *dev,
2303 struct intel_ring_buffer *pipelined)
Daniel Vetterae3db242010-02-19 11:51:58 +01002304{
Daniel Vetterae3db242010-02-19 11:51:58 +01002305 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002306 struct drm_i915_fence_reg *reg, *first, *avail;
2307 int i;
Daniel Vetterae3db242010-02-19 11:51:58 +01002308
2309 /* First try to find a free reg */
Chris Wilsond9e86c02010-11-10 16:40:20 +00002310 avail = NULL;
Daniel Vetterae3db242010-02-19 11:51:58 +01002311 for (i = dev_priv->fence_reg_start; i < dev_priv->num_fence_regs; i++) {
2312 reg = &dev_priv->fence_regs[i];
2313 if (!reg->obj)
Chris Wilsond9e86c02010-11-10 16:40:20 +00002314 return reg;
Daniel Vetterae3db242010-02-19 11:51:58 +01002315
Chris Wilson1690e1e2011-12-14 13:57:08 +01002316 if (!reg->pin_count)
Chris Wilsond9e86c02010-11-10 16:40:20 +00002317 avail = reg;
Daniel Vetterae3db242010-02-19 11:51:58 +01002318 }
2319
Chris Wilsond9e86c02010-11-10 16:40:20 +00002320 if (avail == NULL)
2321 return NULL;
Daniel Vetterae3db242010-02-19 11:51:58 +01002322
2323 /* None available, try to steal one or wait for a user to finish */
Chris Wilsond9e86c02010-11-10 16:40:20 +00002324 avail = first = NULL;
2325 list_for_each_entry(reg, &dev_priv->mm.fence_list, lru_list) {
Chris Wilson1690e1e2011-12-14 13:57:08 +01002326 if (reg->pin_count)
Daniel Vetterae3db242010-02-19 11:51:58 +01002327 continue;
2328
Chris Wilsond9e86c02010-11-10 16:40:20 +00002329 if (first == NULL)
2330 first = reg;
2331
2332 if (!pipelined ||
2333 !reg->obj->last_fenced_ring ||
2334 reg->obj->last_fenced_ring == pipelined) {
2335 avail = reg;
2336 break;
2337 }
Daniel Vetterae3db242010-02-19 11:51:58 +01002338 }
2339
Chris Wilsond9e86c02010-11-10 16:40:20 +00002340 if (avail == NULL)
2341 avail = first;
Daniel Vetterae3db242010-02-19 11:51:58 +01002342
Chris Wilsona00b10c2010-09-24 21:15:47 +01002343 return avail;
Daniel Vetterae3db242010-02-19 11:51:58 +01002344}
2345
Jesse Barnesde151cf2008-11-12 10:03:55 -08002346/**
Chris Wilsond9e86c02010-11-10 16:40:20 +00002347 * i915_gem_object_get_fence - set up a fence reg for an object
Jesse Barnesde151cf2008-11-12 10:03:55 -08002348 * @obj: object to map through a fence reg
Chris Wilsond9e86c02010-11-10 16:40:20 +00002349 * @pipelined: ring on which to queue the change, or NULL for CPU access
2350 * @interruptible: must we wait uninterruptibly for the register to retire?
Jesse Barnesde151cf2008-11-12 10:03:55 -08002351 *
2352 * When mapping objects through the GTT, userspace wants to be able to write
2353 * to them without having to worry about swizzling if the object is tiled.
2354 *
2355 * This function walks the fence regs looking for a free one for @obj,
2356 * stealing one if it can't find any.
2357 *
2358 * It then sets up the reg based on the object's properties: address, pitch
2359 * and tiling format.
2360 */
Chris Wilson8c4b8c32009-06-17 22:08:52 +01002361int
Chris Wilsond9e86c02010-11-10 16:40:20 +00002362i915_gem_object_get_fence(struct drm_i915_gem_object *obj,
Chris Wilsonce453d82011-02-21 14:43:56 +00002363 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002364{
Chris Wilson05394f32010-11-08 19:18:58 +00002365 struct drm_device *dev = obj->base.dev;
Jesse Barnes79e53942008-11-07 14:24:08 -08002366 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002367 struct drm_i915_fence_reg *reg;
Daniel Vetterae3db242010-02-19 11:51:58 +01002368 int ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002369
Chris Wilson6bda10d2010-12-05 21:04:18 +00002370 /* XXX disable pipelining. There are bugs. Shocking. */
2371 pipelined = NULL;
2372
Chris Wilsond9e86c02010-11-10 16:40:20 +00002373 /* Just update our place in the LRU if our fence is getting reused. */
Chris Wilson05394f32010-11-08 19:18:58 +00002374 if (obj->fence_reg != I915_FENCE_REG_NONE) {
2375 reg = &dev_priv->fence_regs[obj->fence_reg];
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002376 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002377
Chris Wilson29c5a582011-03-17 15:23:22 +00002378 if (obj->tiling_changed) {
2379 ret = i915_gem_object_flush_fence(obj, pipelined);
2380 if (ret)
2381 return ret;
2382
2383 if (!obj->fenced_gpu_access && !obj->last_fenced_seqno)
2384 pipelined = NULL;
2385
2386 if (pipelined) {
2387 reg->setup_seqno =
2388 i915_gem_next_request_seqno(pipelined);
2389 obj->last_fenced_seqno = reg->setup_seqno;
2390 obj->last_fenced_ring = pipelined;
2391 }
2392
2393 goto update;
2394 }
Chris Wilsond9e86c02010-11-10 16:40:20 +00002395
2396 if (!pipelined) {
2397 if (reg->setup_seqno) {
2398 if (!ring_passed_seqno(obj->last_fenced_ring,
2399 reg->setup_seqno)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002400 ret = i915_wait_request(obj->last_fenced_ring,
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08002401 reg->setup_seqno,
2402 true);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002403 if (ret)
2404 return ret;
2405 }
2406
2407 reg->setup_seqno = 0;
2408 }
2409 } else if (obj->last_fenced_ring &&
2410 obj->last_fenced_ring != pipelined) {
Chris Wilsonce453d82011-02-21 14:43:56 +00002411 ret = i915_gem_object_flush_fence(obj, pipelined);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002412 if (ret)
2413 return ret;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002414 }
2415
Eric Anholta09ba7f2009-08-29 12:49:51 -07002416 return 0;
2417 }
2418
Chris Wilsond9e86c02010-11-10 16:40:20 +00002419 reg = i915_find_fence_reg(dev, pipelined);
2420 if (reg == NULL)
Daniel Vetter39965b32011-12-14 13:57:09 +01002421 return -EDEADLK;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002422
Chris Wilsonce453d82011-02-21 14:43:56 +00002423 ret = i915_gem_object_flush_fence(obj, pipelined);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002424 if (ret)
Daniel Vetterae3db242010-02-19 11:51:58 +01002425 return ret;
Chris Wilsonfc7170b2009-02-11 14:26:46 +00002426
Chris Wilsond9e86c02010-11-10 16:40:20 +00002427 if (reg->obj) {
2428 struct drm_i915_gem_object *old = reg->obj;
2429
2430 drm_gem_object_reference(&old->base);
2431
2432 if (old->tiling_mode)
2433 i915_gem_release_mmap(old);
2434
Chris Wilsonce453d82011-02-21 14:43:56 +00002435 ret = i915_gem_object_flush_fence(old, pipelined);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002436 if (ret) {
2437 drm_gem_object_unreference(&old->base);
2438 return ret;
2439 }
2440
2441 if (old->last_fenced_seqno == 0 && obj->last_fenced_seqno == 0)
2442 pipelined = NULL;
2443
2444 old->fence_reg = I915_FENCE_REG_NONE;
2445 old->last_fenced_ring = pipelined;
2446 old->last_fenced_seqno =
Chris Wilsondb53a302011-02-03 11:57:46 +00002447 pipelined ? i915_gem_next_request_seqno(pipelined) : 0;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002448
2449 drm_gem_object_unreference(&old->base);
2450 } else if (obj->last_fenced_seqno == 0)
2451 pipelined = NULL;
Eric Anholta09ba7f2009-08-29 12:49:51 -07002452
Jesse Barnesde151cf2008-11-12 10:03:55 -08002453 reg->obj = obj;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002454 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
2455 obj->fence_reg = reg - dev_priv->fence_regs;
2456 obj->last_fenced_ring = pipelined;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002457
Chris Wilsond9e86c02010-11-10 16:40:20 +00002458 reg->setup_seqno =
Chris Wilsondb53a302011-02-03 11:57:46 +00002459 pipelined ? i915_gem_next_request_seqno(pipelined) : 0;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002460 obj->last_fenced_seqno = reg->setup_seqno;
2461
2462update:
2463 obj->tiling_changed = false;
Chris Wilsone259bef2010-09-17 00:32:02 +01002464 switch (INTEL_INFO(dev)->gen) {
Eric Anholt25aebfc32011-05-06 13:55:53 -07002465 case 7:
Chris Wilsone259bef2010-09-17 00:32:02 +01002466 case 6:
Daniel Vetterc6642782010-11-12 13:46:18 +00002467 ret = sandybridge_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002468 break;
2469 case 5:
2470 case 4:
Daniel Vetterc6642782010-11-12 13:46:18 +00002471 ret = i965_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002472 break;
2473 case 3:
Daniel Vetterc6642782010-11-12 13:46:18 +00002474 ret = i915_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002475 break;
2476 case 2:
Daniel Vetterc6642782010-11-12 13:46:18 +00002477 ret = i830_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002478 break;
2479 }
Eric Anholtd9ddcb92009-01-27 10:33:49 -08002480
Daniel Vetterc6642782010-11-12 13:46:18 +00002481 return ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002482}
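
/*
 * Editor's note: an illustrative sketch, not part of the original file, of
 * how a caller typically pairs pinning with fence setup for a tiled object
 * that will be accessed through a GTT mapping. The wrapper name
 * example_prepare_tiled_gtt_access() is hypothetical; the calls inside it
 * are the functions defined in this file.
 */
#if 0	/* illustrative only, not compiled */
static int example_prepare_tiled_gtt_access(struct drm_i915_gem_object *obj)
{
	int ret;

	/* Bind into the mappable aperture with fencing allowed. */
	ret = i915_gem_object_pin(obj, 0, true);
	if (ret)
		return ret;

	/* Claim (or reuse) a fence register so tiled CPU access through the
	 * GTT is detiled by the hardware; NULL means the change is not
	 * pipelined on a ring.
	 */
	ret = i915_gem_object_get_fence(obj, NULL);
	if (ret)
		i915_gem_object_unpin(obj);

	return ret;
}
#endif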
2483
2484/**
2485 * i915_gem_clear_fence_reg - clear out fence register info
 2486 * @reg: fence register to clear
2487 *
2488 * Zeroes out the fence register itself and clears out the associated
Chris Wilson05394f32010-11-08 19:18:58 +00002489 * data structures in dev_priv and obj.
Jesse Barnesde151cf2008-11-12 10:03:55 -08002490 */
2491static void
Chris Wilsond9e86c02010-11-10 16:40:20 +00002492i915_gem_clear_fence_reg(struct drm_device *dev,
2493 struct drm_i915_fence_reg *reg)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002494{
Jesse Barnes79e53942008-11-07 14:24:08 -08002495 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002496 uint32_t fence_reg = reg - dev_priv->fence_regs;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002497
Chris Wilsone259bef2010-09-17 00:32:02 +01002498 switch (INTEL_INFO(dev)->gen) {
Eric Anholt25aebfc32011-05-06 13:55:53 -07002499 case 7:
Chris Wilsone259bef2010-09-17 00:32:02 +01002500 case 6:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002501 I915_WRITE64(FENCE_REG_SANDYBRIDGE_0 + fence_reg*8, 0);
Chris Wilsone259bef2010-09-17 00:32:02 +01002502 break;
2503 case 5:
2504 case 4:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002505 I915_WRITE64(FENCE_REG_965_0 + fence_reg*8, 0);
Chris Wilsone259bef2010-09-17 00:32:02 +01002506 break;
2507 case 3:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002508 if (fence_reg >= 8)
2509 fence_reg = FENCE_REG_945_8 + (fence_reg - 8) * 4;
Eric Anholtdc529a42009-03-10 22:34:49 -07002510 else
Chris Wilsone259bef2010-09-17 00:32:02 +01002511 case 2:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002512 fence_reg = FENCE_REG_830_0 + fence_reg * 4;
Eric Anholtdc529a42009-03-10 22:34:49 -07002513
2514 I915_WRITE(fence_reg, 0);
Chris Wilsone259bef2010-09-17 00:32:02 +01002515 break;
Eric Anholtdc529a42009-03-10 22:34:49 -07002516 }
Jesse Barnesde151cf2008-11-12 10:03:55 -08002517
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002518 list_del_init(&reg->lru_list);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002519 reg->obj = NULL;
2520 reg->setup_seqno = 0;
Chris Wilson1690e1e2011-12-14 13:57:08 +01002521 reg->pin_count = 0;
Chris Wilson52dc7d32009-06-06 09:46:01 +01002522}
2523
2524/**
Eric Anholt673a3942008-07-30 12:06:12 -07002525 * Finds free space in the GTT aperture and binds the object there.
2526 */
2527static int
Chris Wilson05394f32010-11-08 19:18:58 +00002528i915_gem_object_bind_to_gtt(struct drm_i915_gem_object *obj,
Daniel Vetter920afa72010-09-16 17:54:23 +02002529 unsigned alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01002530 bool map_and_fenceable)
Eric Anholt673a3942008-07-30 12:06:12 -07002531{
Chris Wilson05394f32010-11-08 19:18:58 +00002532 struct drm_device *dev = obj->base.dev;
Eric Anholt673a3942008-07-30 12:06:12 -07002533 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07002534 struct drm_mm_node *free_space;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002535 gfp_t gfpmask = __GFP_NORETRY | __GFP_NOWARN;
Daniel Vetter5e783302010-11-14 22:32:36 +01002536 u32 size, fence_size, fence_alignment, unfenced_alignment;
Daniel Vetter75e9e912010-11-04 17:11:09 +01002537 bool mappable, fenceable;
Chris Wilson07f73f62009-09-14 16:50:30 +01002538 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07002539
Chris Wilson05394f32010-11-08 19:18:58 +00002540 if (obj->madv != I915_MADV_WILLNEED) {
Chris Wilson3ef94da2009-09-14 16:50:29 +01002541 DRM_ERROR("Attempting to bind a purgeable object\n");
2542 return -EINVAL;
2543 }
2544
Chris Wilsone28f8712011-07-18 13:11:49 -07002545 fence_size = i915_gem_get_gtt_size(dev,
2546 obj->base.size,
2547 obj->tiling_mode);
2548 fence_alignment = i915_gem_get_gtt_alignment(dev,
2549 obj->base.size,
2550 obj->tiling_mode);
2551 unfenced_alignment =
2552 i915_gem_get_unfenced_gtt_alignment(dev,
2553 obj->base.size,
2554 obj->tiling_mode);
Chris Wilsona00b10c2010-09-24 21:15:47 +01002555
Eric Anholt673a3942008-07-30 12:06:12 -07002556 if (alignment == 0)
Daniel Vetter5e783302010-11-14 22:32:36 +01002557 alignment = map_and_fenceable ? fence_alignment :
2558 unfenced_alignment;
Daniel Vetter75e9e912010-11-04 17:11:09 +01002559 if (map_and_fenceable && alignment & (fence_alignment - 1)) {
Eric Anholt673a3942008-07-30 12:06:12 -07002560 DRM_ERROR("Invalid object alignment requested %u\n", alignment);
2561 return -EINVAL;
2562 }
2563
Chris Wilson05394f32010-11-08 19:18:58 +00002564 size = map_and_fenceable ? fence_size : obj->base.size;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002565
Chris Wilson654fc602010-05-27 13:18:21 +01002566 /* If the object is bigger than the entire aperture, reject it early
2567 * before evicting everything in a vain attempt to find space.
2568 */
Chris Wilson05394f32010-11-08 19:18:58 +00002569 if (obj->base.size >
Daniel Vetter75e9e912010-11-04 17:11:09 +01002570 (map_and_fenceable ? dev_priv->mm.gtt_mappable_end : dev_priv->mm.gtt_total)) {
Chris Wilson654fc602010-05-27 13:18:21 +01002571 DRM_ERROR("Attempting to bind an object larger than the aperture\n");
2572 return -E2BIG;
2573 }
2574
Eric Anholt673a3942008-07-30 12:06:12 -07002575 search_free:
Daniel Vetter75e9e912010-11-04 17:11:09 +01002576 if (map_and_fenceable)
Daniel Vetter920afa72010-09-16 17:54:23 +02002577 free_space =
2578 drm_mm_search_free_in_range(&dev_priv->mm.gtt_space,
Chris Wilsona00b10c2010-09-24 21:15:47 +01002579 size, alignment, 0,
Daniel Vetter920afa72010-09-16 17:54:23 +02002580 dev_priv->mm.gtt_mappable_end,
2581 0);
2582 else
2583 free_space = drm_mm_search_free(&dev_priv->mm.gtt_space,
Chris Wilsona00b10c2010-09-24 21:15:47 +01002584 size, alignment, 0);
Daniel Vetter920afa72010-09-16 17:54:23 +02002585
2586 if (free_space != NULL) {
Daniel Vetter75e9e912010-11-04 17:11:09 +01002587 if (map_and_fenceable)
Chris Wilson05394f32010-11-08 19:18:58 +00002588 obj->gtt_space =
Daniel Vetter920afa72010-09-16 17:54:23 +02002589 drm_mm_get_block_range_generic(free_space,
Chris Wilsona00b10c2010-09-24 21:15:47 +01002590 size, alignment, 0,
Daniel Vetter920afa72010-09-16 17:54:23 +02002591 dev_priv->mm.gtt_mappable_end,
2592 0);
2593 else
Chris Wilson05394f32010-11-08 19:18:58 +00002594 obj->gtt_space =
Chris Wilsona00b10c2010-09-24 21:15:47 +01002595 drm_mm_get_block(free_space, size, alignment);
Daniel Vetter920afa72010-09-16 17:54:23 +02002596 }
Chris Wilson05394f32010-11-08 19:18:58 +00002597 if (obj->gtt_space == NULL) {
Eric Anholt673a3942008-07-30 12:06:12 -07002598 /* If the gtt is empty and we're still having trouble
2599 * fitting our object in, we're out of memory.
2600 */
Daniel Vetter75e9e912010-11-04 17:11:09 +01002601 ret = i915_gem_evict_something(dev, size, alignment,
2602 map_and_fenceable);
Chris Wilson97311292009-09-21 00:22:34 +01002603 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07002604 return ret;
Chris Wilson97311292009-09-21 00:22:34 +01002605
Eric Anholt673a3942008-07-30 12:06:12 -07002606 goto search_free;
2607 }
2608
Chris Wilsone5281cc2010-10-28 13:45:36 +01002609 ret = i915_gem_object_get_pages_gtt(obj, gfpmask);
Eric Anholt673a3942008-07-30 12:06:12 -07002610 if (ret) {
Chris Wilson05394f32010-11-08 19:18:58 +00002611 drm_mm_put_block(obj->gtt_space);
2612 obj->gtt_space = NULL;
Chris Wilson07f73f62009-09-14 16:50:30 +01002613
2614 if (ret == -ENOMEM) {
Chris Wilson809b6332011-01-10 17:33:15 +00002615 /* first try to reclaim some memory by clearing the GTT */
2616 ret = i915_gem_evict_everything(dev, false);
Chris Wilson07f73f62009-09-14 16:50:30 +01002617 if (ret) {
Chris Wilson07f73f62009-09-14 16:50:30 +01002618 /* now try to shrink everyone else */
Chris Wilson4bdadb92010-01-27 13:36:32 +00002619 if (gfpmask) {
2620 gfpmask = 0;
2621 goto search_free;
Chris Wilson07f73f62009-09-14 16:50:30 +01002622 }
2623
Chris Wilson809b6332011-01-10 17:33:15 +00002624 return -ENOMEM;
Chris Wilson07f73f62009-09-14 16:50:30 +01002625 }
2626
2627 goto search_free;
2628 }
2629
Eric Anholt673a3942008-07-30 12:06:12 -07002630 return ret;
2631 }
2632
Daniel Vetter74163902012-02-15 23:50:21 +01002633 ret = i915_gem_gtt_prepare_object(obj);
Daniel Vetter7c2e6fd2010-11-06 10:10:47 +01002634 if (ret) {
Chris Wilsone5281cc2010-10-28 13:45:36 +01002635 i915_gem_object_put_pages_gtt(obj);
Chris Wilson05394f32010-11-08 19:18:58 +00002636 drm_mm_put_block(obj->gtt_space);
2637 obj->gtt_space = NULL;
Chris Wilson07f73f62009-09-14 16:50:30 +01002638
Chris Wilson809b6332011-01-10 17:33:15 +00002639 if (i915_gem_evict_everything(dev, false))
Chris Wilson07f73f62009-09-14 16:50:30 +01002640 return ret;
Chris Wilson07f73f62009-09-14 16:50:30 +01002641
2642 goto search_free;
Eric Anholt673a3942008-07-30 12:06:12 -07002643 }
Daniel Vetter0ebb9822012-02-15 23:50:24 +01002644
2645 if (!dev_priv->mm.aliasing_ppgtt)
2646 i915_gem_gtt_bind_object(obj, obj->cache_level);
Eric Anholt673a3942008-07-30 12:06:12 -07002647
Chris Wilson6299f992010-11-24 12:23:44 +00002648 list_add_tail(&obj->gtt_list, &dev_priv->mm.gtt_list);
Chris Wilson05394f32010-11-08 19:18:58 +00002649 list_add_tail(&obj->mm_list, &dev_priv->mm.inactive_list);
Chris Wilsonbf1a1092010-08-07 11:01:20 +01002650
Eric Anholt673a3942008-07-30 12:06:12 -07002651 /* Assert that the object is not currently in any GPU domain. As it
2652 * wasn't in the GTT, there shouldn't be any way it could have been in
2653 * a GPU cache
2654 */
Chris Wilson05394f32010-11-08 19:18:58 +00002655 BUG_ON(obj->base.read_domains & I915_GEM_GPU_DOMAINS);
2656 BUG_ON(obj->base.write_domain & I915_GEM_GPU_DOMAINS);
Eric Anholt673a3942008-07-30 12:06:12 -07002657
Chris Wilson6299f992010-11-24 12:23:44 +00002658 obj->gtt_offset = obj->gtt_space->start;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002659
Daniel Vetter75e9e912010-11-04 17:11:09 +01002660 fenceable =
Chris Wilson05394f32010-11-08 19:18:58 +00002661 obj->gtt_space->size == fence_size &&
Akshay Joshi0206e352011-08-16 15:34:10 -04002662 (obj->gtt_space->start & (fence_alignment - 1)) == 0;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002663
Daniel Vetter75e9e912010-11-04 17:11:09 +01002664 mappable =
Chris Wilson05394f32010-11-08 19:18:58 +00002665 obj->gtt_offset + obj->base.size <= dev_priv->mm.gtt_mappable_end;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002666
Chris Wilson05394f32010-11-08 19:18:58 +00002667 obj->map_and_fenceable = mappable && fenceable;
Daniel Vetter75e9e912010-11-04 17:11:09 +01002668
Chris Wilsondb53a302011-02-03 11:57:46 +00002669 trace_i915_gem_object_bind(obj, map_and_fenceable);
Eric Anholt673a3942008-07-30 12:06:12 -07002670 return 0;
2671}
2672
2673void
Chris Wilson05394f32010-11-08 19:18:58 +00002674i915_gem_clflush_object(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07002675{
Eric Anholt673a3942008-07-30 12:06:12 -07002676 /* If we don't have a page list set up, then we're not pinned
2677 * to GPU, and we can ignore the cache flush because it'll happen
2678 * again at bind time.
2679 */
Chris Wilson05394f32010-11-08 19:18:58 +00002680 if (obj->pages == NULL)
Eric Anholt673a3942008-07-30 12:06:12 -07002681 return;
2682
Chris Wilson9c23f7f2011-03-29 16:59:52 -07002683 /* If the GPU is snooping the contents of the CPU cache,
2684 * we do not need to manually clear the CPU cache lines. However,
2685 * the caches are only snooped when the render cache is
2686 * flushed/invalidated. As we always have to emit invalidations
2687 * and flushes when moving into and out of the RENDER domain, correct
2688 * snooping behaviour occurs naturally as the result of our domain
2689 * tracking.
2690 */
2691 if (obj->cache_level != I915_CACHE_NONE)
2692 return;
2693
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002694 trace_i915_gem_object_clflush(obj);
Eric Anholtcfa16a02009-05-26 18:46:16 -07002695
Chris Wilson05394f32010-11-08 19:18:58 +00002696 drm_clflush_pages(obj->pages, obj->base.size / PAGE_SIZE);
Eric Anholt673a3942008-07-30 12:06:12 -07002697}
2698
Eric Anholte47c68e2008-11-14 13:35:19 -08002699/** Flushes any GPU write domain for the object if it's dirty. */
Chris Wilson88241782011-01-07 17:09:48 +00002700static int
Chris Wilson3619df02010-11-28 15:37:17 +00002701i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08002702{
Chris Wilson05394f32010-11-08 19:18:58 +00002703 if ((obj->base.write_domain & I915_GEM_GPU_DOMAINS) == 0)
Chris Wilson88241782011-01-07 17:09:48 +00002704 return 0;
Eric Anholte47c68e2008-11-14 13:35:19 -08002705
2706 /* Queue the GPU write cache flushing we need. */
Chris Wilsondb53a302011-02-03 11:57:46 +00002707 return i915_gem_flush_ring(obj->ring, 0, obj->base.write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002708}
2709
2710/** Flushes the GTT write domain for the object if it's dirty. */
2711static void
Chris Wilson05394f32010-11-08 19:18:58 +00002712i915_gem_object_flush_gtt_write_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08002713{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002714 uint32_t old_write_domain;
2715
Chris Wilson05394f32010-11-08 19:18:58 +00002716 if (obj->base.write_domain != I915_GEM_DOMAIN_GTT)
Eric Anholte47c68e2008-11-14 13:35:19 -08002717 return;
2718
Chris Wilson63256ec2011-01-04 18:42:07 +00002719 /* No actual flushing is required for the GTT write domain. Writes
Eric Anholte47c68e2008-11-14 13:35:19 -08002720 * to it immediately go to main memory as far as we know, so there's
2721 * no chipset flush. It also doesn't land in render cache.
Chris Wilson63256ec2011-01-04 18:42:07 +00002722 *
2723 * However, we do have to enforce the order so that all writes through
2724 * the GTT land before any writes to the device, such as updates to
2725 * the GATT itself.
Eric Anholte47c68e2008-11-14 13:35:19 -08002726 */
Chris Wilson63256ec2011-01-04 18:42:07 +00002727 wmb();
2728
Chris Wilson05394f32010-11-08 19:18:58 +00002729 old_write_domain = obj->base.write_domain;
2730 obj->base.write_domain = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002731
2732 trace_i915_gem_object_change_domain(obj,
Chris Wilson05394f32010-11-08 19:18:58 +00002733 obj->base.read_domains,
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002734 old_write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002735}
2736
2737/** Flushes the CPU write domain for the object if it's dirty. */
2738static void
Chris Wilson05394f32010-11-08 19:18:58 +00002739i915_gem_object_flush_cpu_write_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08002740{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002741 uint32_t old_write_domain;
Eric Anholte47c68e2008-11-14 13:35:19 -08002742
Chris Wilson05394f32010-11-08 19:18:58 +00002743 if (obj->base.write_domain != I915_GEM_DOMAIN_CPU)
Eric Anholte47c68e2008-11-14 13:35:19 -08002744 return;
2745
2746 i915_gem_clflush_object(obj);
Daniel Vetter40ce6572010-11-05 18:12:18 +01002747 intel_gtt_chipset_flush();
Chris Wilson05394f32010-11-08 19:18:58 +00002748 old_write_domain = obj->base.write_domain;
2749 obj->base.write_domain = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002750
2751 trace_i915_gem_object_change_domain(obj,
Chris Wilson05394f32010-11-08 19:18:58 +00002752 obj->base.read_domains,
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002753 old_write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002754}
2755
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002756/**
2757 * Moves a single object to the GTT read, and possibly write domain.
2758 *
2759 * This function returns when the move is complete, including waiting on
2760 * flushes to occur.
2761 */
Jesse Barnes79e53942008-11-07 14:24:08 -08002762int
Chris Wilson20217462010-11-23 15:26:33 +00002763i915_gem_object_set_to_gtt_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002764{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002765 uint32_t old_write_domain, old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08002766 int ret;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002767
Eric Anholt02354392008-11-26 13:58:13 -08002768 /* Not valid to be called on unbound objects. */
Chris Wilson05394f32010-11-08 19:18:58 +00002769 if (obj->gtt_space == NULL)
Eric Anholt02354392008-11-26 13:58:13 -08002770 return -EINVAL;
2771
Chris Wilson8d7e3de2011-02-07 15:23:02 +00002772 if (obj->base.write_domain == I915_GEM_DOMAIN_GTT)
2773 return 0;
2774
Chris Wilson88241782011-01-07 17:09:48 +00002775 ret = i915_gem_object_flush_gpu_write_domain(obj);
2776 if (ret)
2777 return ret;
2778
Chris Wilson87ca9c82010-12-02 09:42:56 +00002779 if (obj->pending_gpu_write || write) {
Chris Wilsonce453d82011-02-21 14:43:56 +00002780 ret = i915_gem_object_wait_rendering(obj);
Chris Wilson87ca9c82010-12-02 09:42:56 +00002781 if (ret)
2782 return ret;
2783 }
Chris Wilson2dafb1e2010-06-07 14:03:05 +01002784
Chris Wilson72133422010-09-13 23:56:38 +01002785 i915_gem_object_flush_cpu_write_domain(obj);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002786
Chris Wilson05394f32010-11-08 19:18:58 +00002787 old_write_domain = obj->base.write_domain;
2788 old_read_domains = obj->base.read_domains;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002789
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002790 /* It should now be out of any other write domains, and we can update
2791 * the domain values for our changes.
2792 */
Chris Wilson05394f32010-11-08 19:18:58 +00002793 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
2794 obj->base.read_domains |= I915_GEM_DOMAIN_GTT;
Eric Anholte47c68e2008-11-14 13:35:19 -08002795 if (write) {
Chris Wilson05394f32010-11-08 19:18:58 +00002796 obj->base.read_domains = I915_GEM_DOMAIN_GTT;
2797 obj->base.write_domain = I915_GEM_DOMAIN_GTT;
2798 obj->dirty = 1;
Eric Anholte47c68e2008-11-14 13:35:19 -08002799 }
2800
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002801 trace_i915_gem_object_change_domain(obj,
2802 old_read_domains,
2803 old_write_domain);
2804
Eric Anholte47c68e2008-11-14 13:35:19 -08002805 return 0;
2806}
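
/*
 * Editor's note: an illustrative sketch, not part of the original file, of
 * the usual calling pattern around set_to_gtt_domain(). A caller about to
 * write an object through its GTT mapping moves it to the GTT write domain
 * first, so any CPU dirt is flushed and the GPU caches are invalidated on
 * next use. The wrapper name is hypothetical.
 */
#if 0	/* illustrative only, not compiled */
static int example_write_through_gtt(struct drm_i915_gem_object *obj)
{
	int ret;

	/* The object must be bound; pinning guarantees that. */
	ret = i915_gem_object_pin(obj, 0, true);
	if (ret)
		return ret;

	ret = i915_gem_object_set_to_gtt_domain(obj, true);
	if (ret == 0) {
		/* ... writes via an io mapping at obj->gtt_offset ... */
	}

	i915_gem_object_unpin(obj);
	return ret;
}
#endif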
2807
Chris Wilsone4ffd172011-04-04 09:44:39 +01002808int i915_gem_object_set_cache_level(struct drm_i915_gem_object *obj,
2809 enum i915_cache_level cache_level)
2810{
Daniel Vetter7bddb012012-02-09 17:15:47 +01002811 struct drm_device *dev = obj->base.dev;
2812 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilsone4ffd172011-04-04 09:44:39 +01002813 int ret;
2814
2815 if (obj->cache_level == cache_level)
2816 return 0;
2817
2818 if (obj->pin_count) {
2819 DRM_DEBUG("can not change the cache level of pinned objects\n");
2820 return -EBUSY;
2821 }
2822
2823 if (obj->gtt_space) {
2824 ret = i915_gem_object_finish_gpu(obj);
2825 if (ret)
2826 return ret;
2827
2828 i915_gem_object_finish_gtt(obj);
2829
2830 /* Before SandyBridge, you could not use tiling or fence
2831 * registers with snooped memory, so relinquish any fences
2832 * currently pointing to our region in the aperture.
2833 */
2834 if (INTEL_INFO(obj->base.dev)->gen < 6) {
2835 ret = i915_gem_object_put_fence(obj);
2836 if (ret)
2837 return ret;
2838 }
2839
Daniel Vetter74898d72012-02-15 23:50:22 +01002840 if (obj->has_global_gtt_mapping)
2841 i915_gem_gtt_bind_object(obj, cache_level);
Daniel Vetter7bddb012012-02-09 17:15:47 +01002842 if (obj->has_aliasing_ppgtt_mapping)
2843 i915_ppgtt_bind_object(dev_priv->mm.aliasing_ppgtt,
2844 obj, cache_level);
Chris Wilsone4ffd172011-04-04 09:44:39 +01002845 }
2846
2847 if (cache_level == I915_CACHE_NONE) {
2848 u32 old_read_domains, old_write_domain;
2849
2850 /* If we're coming from LLC cached, then we haven't
2851 * actually been tracking whether the data is in the
2852 * CPU cache or not, since we only allow one bit set
2853 * in obj->write_domain and have been skipping the clflushes.
2854 * Just set it to the CPU cache for now.
2855 */
2856 WARN_ON(obj->base.write_domain & ~I915_GEM_DOMAIN_CPU);
2857 WARN_ON(obj->base.read_domains & ~I915_GEM_DOMAIN_CPU);
2858
2859 old_read_domains = obj->base.read_domains;
2860 old_write_domain = obj->base.write_domain;
2861
2862 obj->base.read_domains = I915_GEM_DOMAIN_CPU;
2863 obj->base.write_domain = I915_GEM_DOMAIN_CPU;
2864
2865 trace_i915_gem_object_change_domain(obj,
2866 old_read_domains,
2867 old_write_domain);
2868 }
2869
2870 obj->cache_level = cache_level;
2871 return 0;
2872}
2873
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002874/*
Chris Wilson2da3b9b2011-04-14 09:41:17 +01002875 * Prepare buffer for display plane (scanout, cursors, etc).
2876 * Can be called from an uninterruptible phase (modesetting) and allows
2877 * any flushes to be pipelined (for pageflips).
2878 *
2879 * For the display plane, we want to be in the GTT but out of any write
2880 * domains. So in many ways this looks like set_to_gtt_domain() apart from the
2881 * ability to pipeline the waits, pinning and any additional subtleties
2882 * that may differentiate the display plane from ordinary buffers.
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002883 */
2884int
Chris Wilson2da3b9b2011-04-14 09:41:17 +01002885i915_gem_object_pin_to_display_plane(struct drm_i915_gem_object *obj,
2886 u32 alignment,
Chris Wilson919926a2010-11-12 13:42:53 +00002887 struct intel_ring_buffer *pipelined)
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002888{
Chris Wilson2da3b9b2011-04-14 09:41:17 +01002889 u32 old_read_domains, old_write_domain;
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002890 int ret;
2891
Chris Wilson88241782011-01-07 17:09:48 +00002892 ret = i915_gem_object_flush_gpu_write_domain(obj);
2893 if (ret)
2894 return ret;
2895
Chris Wilson0be73282010-12-06 14:36:27 +00002896 if (pipelined != obj->ring) {
Chris Wilsonce453d82011-02-21 14:43:56 +00002897 ret = i915_gem_object_wait_rendering(obj);
Keith Packardf0b69ef2011-07-19 16:21:40 -07002898 if (ret == -ERESTARTSYS)
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002899 return ret;
2900 }
2901
Eric Anholta7ef0642011-03-29 16:59:54 -07002902 /* The display engine is not coherent with the LLC cache on gen6. As
2903 * a result, we make sure that the pinning that is about to occur is
2904 * done with uncached PTEs. This is lowest common denominator for all
2905 * chipsets.
2906 *
2907 * However for gen6+, we could do better by using the GFDT bit instead
2908 * of uncaching, which would allow us to flush all the LLC-cached data
2909 * with that bit in the PTE to main memory with just one PIPE_CONTROL.
2910 */
2911 ret = i915_gem_object_set_cache_level(obj, I915_CACHE_NONE);
2912 if (ret)
2913 return ret;
2914
Chris Wilson2da3b9b2011-04-14 09:41:17 +01002915 /* As the user may map the buffer once pinned in the display plane
2916 * (e.g. libkms for the bootup splash), we have to ensure that we
2917 * always use map_and_fenceable for all scanout buffers.
2918 */
2919 ret = i915_gem_object_pin(obj, alignment, true);
2920 if (ret)
2921 return ret;
2922
Chris Wilsonb118c1e2010-05-27 13:18:14 +01002923 i915_gem_object_flush_cpu_write_domain(obj);
2924
Chris Wilson2da3b9b2011-04-14 09:41:17 +01002925 old_write_domain = obj->base.write_domain;
Chris Wilson05394f32010-11-08 19:18:58 +00002926 old_read_domains = obj->base.read_domains;
Chris Wilson2da3b9b2011-04-14 09:41:17 +01002927
2928 /* It should now be out of any other write domains, and we can update
2929 * the domain values for our changes.
2930 */
2931 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
Chris Wilson05394f32010-11-08 19:18:58 +00002932 obj->base.read_domains |= I915_GEM_DOMAIN_GTT;
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002933
2934 trace_i915_gem_object_change_domain(obj,
2935 old_read_domains,
Chris Wilson2da3b9b2011-04-14 09:41:17 +01002936 old_write_domain);
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002937
2938 return 0;
2939}
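
/*
 * Editor's note: a hedged sketch, not part of the original file, of how the
 * modesetting path is expected to use pin_to_display_plane() when placing a
 * framebuffer on a scanout plane. The wrapper name is hypothetical and the
 * alignment is left to the caller, since the real value depends on the
 * generation and tiling mode.
 */
#if 0	/* illustrative only, not compiled */
static int example_pin_scanout(struct drm_i915_gem_object *obj,
			       u32 alignment,
			       struct intel_ring_buffer *pipelined)
{
	int ret;

	ret = i915_gem_object_pin_to_display_plane(obj, alignment, pipelined);
	if (ret)
		return ret;

	/* Tiled scanout buffers also want a fence so that CPU access
	 * through the GTT stays detiled.
	 */
	return i915_gem_object_get_fence(obj, pipelined);
}
#endif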
2940
Chris Wilson85345512010-11-13 09:49:11 +00002941int
Chris Wilsona8198ee2011-04-13 22:04:09 +01002942i915_gem_object_finish_gpu(struct drm_i915_gem_object *obj)
Chris Wilson85345512010-11-13 09:49:11 +00002943{
Chris Wilson88241782011-01-07 17:09:48 +00002944 int ret;
2945
Chris Wilsona8198ee2011-04-13 22:04:09 +01002946 if ((obj->base.read_domains & I915_GEM_GPU_DOMAINS) == 0)
Chris Wilson85345512010-11-13 09:49:11 +00002947 return 0;
2948
Chris Wilson88241782011-01-07 17:09:48 +00002949 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002950 ret = i915_gem_flush_ring(obj->ring, 0, obj->base.write_domain);
Chris Wilson88241782011-01-07 17:09:48 +00002951 if (ret)
2952 return ret;
2953 }
Chris Wilson85345512010-11-13 09:49:11 +00002954
Chris Wilsonc501ae72011-12-14 13:57:23 +01002955 ret = i915_gem_object_wait_rendering(obj);
2956 if (ret)
2957 return ret;
2958
Chris Wilsona8198ee2011-04-13 22:04:09 +01002959 /* Ensure that we invalidate the GPU's caches and TLBs. */
2960 obj->base.read_domains &= ~I915_GEM_GPU_DOMAINS;
Chris Wilsonc501ae72011-12-14 13:57:23 +01002961 return 0;
Chris Wilson85345512010-11-13 09:49:11 +00002962}
2963
Eric Anholte47c68e2008-11-14 13:35:19 -08002964/**
2965 * Moves a single object to the CPU read, and possibly write domain.
2966 *
2967 * This function returns when the move is complete, including waiting on
2968 * flushes to occur.
2969 */
Chris Wilsondabdfe02012-03-26 10:10:27 +02002970int
Chris Wilson919926a2010-11-12 13:42:53 +00002971i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholte47c68e2008-11-14 13:35:19 -08002972{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002973 uint32_t old_write_domain, old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08002974 int ret;
2975
Chris Wilson8d7e3de2011-02-07 15:23:02 +00002976 if (obj->base.write_domain == I915_GEM_DOMAIN_CPU)
2977 return 0;
2978
Chris Wilson88241782011-01-07 17:09:48 +00002979 ret = i915_gem_object_flush_gpu_write_domain(obj);
2980 if (ret)
2981 return ret;
2982
Chris Wilsonce453d82011-02-21 14:43:56 +00002983 ret = i915_gem_object_wait_rendering(obj);
Daniel Vetterde18a292010-11-27 22:30:41 +01002984 if (ret)
Eric Anholte47c68e2008-11-14 13:35:19 -08002985 return ret;
2986
2987 i915_gem_object_flush_gtt_write_domain(obj);
2988
Chris Wilson05394f32010-11-08 19:18:58 +00002989 old_write_domain = obj->base.write_domain;
2990 old_read_domains = obj->base.read_domains;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002991
Eric Anholte47c68e2008-11-14 13:35:19 -08002992 /* Flush the CPU cache if it's still invalid. */
Chris Wilson05394f32010-11-08 19:18:58 +00002993 if ((obj->base.read_domains & I915_GEM_DOMAIN_CPU) == 0) {
Eric Anholte47c68e2008-11-14 13:35:19 -08002994 i915_gem_clflush_object(obj);
Eric Anholte47c68e2008-11-14 13:35:19 -08002995
Chris Wilson05394f32010-11-08 19:18:58 +00002996 obj->base.read_domains |= I915_GEM_DOMAIN_CPU;
Eric Anholte47c68e2008-11-14 13:35:19 -08002997 }
2998
2999 /* It should now be out of any other write domains, and we can update
3000 * the domain values for our changes.
3001 */
Chris Wilson05394f32010-11-08 19:18:58 +00003002 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_CPU) != 0);
Eric Anholte47c68e2008-11-14 13:35:19 -08003003
3004 /* If we're writing through the CPU, then the GPU read domains will
3005 * need to be invalidated at next use.
3006 */
3007 if (write) {
Chris Wilson05394f32010-11-08 19:18:58 +00003008 obj->base.read_domains = I915_GEM_DOMAIN_CPU;
3009 obj->base.write_domain = I915_GEM_DOMAIN_CPU;
Eric Anholte47c68e2008-11-14 13:35:19 -08003010 }
Eric Anholt2ef7eea2008-11-10 10:53:25 -08003011
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003012 trace_i915_gem_object_change_domain(obj,
3013 old_read_domains,
3014 old_write_domain);
3015
Eric Anholt2ef7eea2008-11-10 10:53:25 -08003016 return 0;
3017}
3018
Eric Anholt673a3942008-07-30 12:06:12 -07003019/* Throttle our rendering by waiting until the ring has completed our requests
3020 * emitted over 20 msec ago.
3021 *
Eric Anholtb9624422009-06-03 07:27:35 +00003022 * Note that if we were to use the current jiffies each time around the loop,
3023 * we wouldn't escape the function with any frames outstanding if the time to
3024 * render a frame was over 20ms.
3025 *
Eric Anholt673a3942008-07-30 12:06:12 -07003026 * This should get us reasonable parallelism between CPU and GPU but also
3027 * relatively low latency when blocking on a particular request to finish.
3028 */
3029static int
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003030i915_gem_ring_throttle(struct drm_device *dev, struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003031{
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003032 struct drm_i915_private *dev_priv = dev->dev_private;
3033 struct drm_i915_file_private *file_priv = file->driver_priv;
Eric Anholtb9624422009-06-03 07:27:35 +00003034 unsigned long recent_enough = jiffies - msecs_to_jiffies(20);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003035 struct drm_i915_gem_request *request;
3036 struct intel_ring_buffer *ring = NULL;
3037 u32 seqno = 0;
3038 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003039
Chris Wilsone110e8d2011-01-26 15:39:14 +00003040 if (atomic_read(&dev_priv->mm.wedged))
3041 return -EIO;
3042
Chris Wilson1c255952010-09-26 11:03:27 +01003043 spin_lock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003044 list_for_each_entry(request, &file_priv->mm.request_list, client_list) {
Eric Anholtb9624422009-06-03 07:27:35 +00003045 if (time_after_eq(request->emitted_jiffies, recent_enough))
3046 break;
3047
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003048 ring = request->ring;
3049 seqno = request->seqno;
Eric Anholtb9624422009-06-03 07:27:35 +00003050 }
Chris Wilson1c255952010-09-26 11:03:27 +01003051 spin_unlock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003052
3053 if (seqno == 0)
3054 return 0;
3055
3056 ret = 0;
Chris Wilson78501ea2010-10-27 12:18:21 +01003057 if (!i915_seqno_passed(ring->get_seqno(ring), seqno)) {
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003058		 /* And wait for the seqno to pass, without holding any locks and
3059 * causing extra latency for others. This is safe as the irq
3060 * generation is designed to be run atomically and so is
3061 * lockless.
3062 */
Chris Wilsonb13c2b92010-12-13 16:54:50 +00003063 if (ring->irq_get(ring)) {
3064 ret = wait_event_interruptible(ring->irq_queue,
3065 i915_seqno_passed(ring->get_seqno(ring), seqno)
3066 || atomic_read(&dev_priv->mm.wedged));
3067 ring->irq_put(ring);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003068
Chris Wilsonb13c2b92010-12-13 16:54:50 +00003069 if (ret == 0 && atomic_read(&dev_priv->mm.wedged))
3070 ret = -EIO;
Eric Anholte959b5d2011-12-22 14:55:01 -08003071 } else if (wait_for_atomic(i915_seqno_passed(ring->get_seqno(ring),
3072 seqno) ||
Eric Anholt7ea29b12011-12-22 14:54:59 -08003073 atomic_read(&dev_priv->mm.wedged), 3000)) {
3074 ret = -EBUSY;
Chris Wilsonb13c2b92010-12-13 16:54:50 +00003075 }
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003076 }
3077
3078 if (ret == 0)
3079 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, 0);
Eric Anholtb9624422009-06-03 07:27:35 +00003080
Eric Anholt673a3942008-07-30 12:06:12 -07003081 return ret;
3082}
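
/*
 * Editor's note: a hedged user-space sketch, not part of this kernel file,
 * showing the intended use of the throttle ioctl serviced by the function
 * above: calling it once per frame bounds how far the CPU runs ahead of the
 * GPU without blocking on any particular buffer. Include paths for the
 * libdrm headers may vary.
 */
#if 0	/* user-space illustration, not compiled here */
#include <sys/ioctl.h>
#include <i915_drm.h>

static void example_frame_loop(int drm_fd)
{
	for (;;) {
		/* Blocks until this fd's requests emitted more than ~20ms
		 * ago have completed.
		 */
		ioctl(drm_fd, DRM_IOCTL_I915_GEM_THROTTLE, NULL);

		/* ... build and submit the next frame ... */
	}
}
#endif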
3083
Eric Anholt673a3942008-07-30 12:06:12 -07003084int
Chris Wilson05394f32010-11-08 19:18:58 +00003085i915_gem_object_pin(struct drm_i915_gem_object *obj,
3086 uint32_t alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01003087 bool map_and_fenceable)
Eric Anholt673a3942008-07-30 12:06:12 -07003088{
Chris Wilson05394f32010-11-08 19:18:58 +00003089 struct drm_device *dev = obj->base.dev;
Chris Wilsonf13d3f72010-09-20 17:36:15 +01003090 struct drm_i915_private *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07003091 int ret;
3092
Chris Wilson05394f32010-11-08 19:18:58 +00003093 BUG_ON(obj->pin_count == DRM_I915_GEM_OBJECT_MAX_PIN_COUNT);
Chris Wilson23bc5982010-09-29 16:10:57 +01003094 WARN_ON(i915_verify_lists(dev));
Chris Wilsonac0c6b52010-05-27 13:18:18 +01003095
Chris Wilson05394f32010-11-08 19:18:58 +00003096 if (obj->gtt_space != NULL) {
3097 if ((alignment && obj->gtt_offset & (alignment - 1)) ||
3098 (map_and_fenceable && !obj->map_and_fenceable)) {
3099 WARN(obj->pin_count,
Chris Wilsonae7d49d2010-08-04 12:37:41 +01003100 "bo is already pinned with incorrect alignment:"
Daniel Vetter75e9e912010-11-04 17:11:09 +01003101 " offset=%x, req.alignment=%x, req.map_and_fenceable=%d,"
3102 " obj->map_and_fenceable=%d\n",
Chris Wilson05394f32010-11-08 19:18:58 +00003103 obj->gtt_offset, alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01003104 map_and_fenceable,
Chris Wilson05394f32010-11-08 19:18:58 +00003105 obj->map_and_fenceable);
Chris Wilsonac0c6b52010-05-27 13:18:18 +01003106 ret = i915_gem_object_unbind(obj);
3107 if (ret)
3108 return ret;
3109 }
3110 }
3111
Chris Wilson05394f32010-11-08 19:18:58 +00003112 if (obj->gtt_space == NULL) {
Chris Wilsona00b10c2010-09-24 21:15:47 +01003113 ret = i915_gem_object_bind_to_gtt(obj, alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01003114 map_and_fenceable);
Chris Wilson97311292009-09-21 00:22:34 +01003115 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07003116 return ret;
Chris Wilson22c344e2009-02-11 14:26:45 +00003117 }
Jesse Barnes76446ca2009-12-17 22:05:42 -05003118
Daniel Vetter74898d72012-02-15 23:50:22 +01003119 if (!obj->has_global_gtt_mapping && map_and_fenceable)
3120 i915_gem_gtt_bind_object(obj, obj->cache_level);
3121
Chris Wilson05394f32010-11-08 19:18:58 +00003122 if (obj->pin_count++ == 0) {
Chris Wilson05394f32010-11-08 19:18:58 +00003123 if (!obj->active)
3124 list_move_tail(&obj->mm_list,
Chris Wilsonf13d3f72010-09-20 17:36:15 +01003125 &dev_priv->mm.pinned_list);
Eric Anholt673a3942008-07-30 12:06:12 -07003126 }
Chris Wilson6299f992010-11-24 12:23:44 +00003127 obj->pin_mappable |= map_and_fenceable;
Eric Anholt673a3942008-07-30 12:06:12 -07003128
Chris Wilson23bc5982010-09-29 16:10:57 +01003129 WARN_ON(i915_verify_lists(dev));
Eric Anholt673a3942008-07-30 12:06:12 -07003130 return 0;
3131}
3132
3133void
Chris Wilson05394f32010-11-08 19:18:58 +00003134i915_gem_object_unpin(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07003135{
Chris Wilson05394f32010-11-08 19:18:58 +00003136 struct drm_device *dev = obj->base.dev;
Eric Anholt673a3942008-07-30 12:06:12 -07003137 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07003138
Chris Wilson23bc5982010-09-29 16:10:57 +01003139 WARN_ON(i915_verify_lists(dev));
Chris Wilson05394f32010-11-08 19:18:58 +00003140 BUG_ON(obj->pin_count == 0);
3141 BUG_ON(obj->gtt_space == NULL);
Eric Anholt673a3942008-07-30 12:06:12 -07003142
Chris Wilson05394f32010-11-08 19:18:58 +00003143 if (--obj->pin_count == 0) {
3144 if (!obj->active)
3145 list_move_tail(&obj->mm_list,
Eric Anholt673a3942008-07-30 12:06:12 -07003146 &dev_priv->mm.inactive_list);
Chris Wilson6299f992010-11-24 12:23:44 +00003147 obj->pin_mappable = false;
Eric Anholt673a3942008-07-30 12:06:12 -07003148 }
Chris Wilson23bc5982010-09-29 16:10:57 +01003149 WARN_ON(i915_verify_lists(dev));
Eric Anholt673a3942008-07-30 12:06:12 -07003150}
3151
3152int
3153i915_gem_pin_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00003154 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003155{
3156 struct drm_i915_gem_pin *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003157 struct drm_i915_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07003158 int ret;
3159
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003160 ret = i915_mutex_lock_interruptible(dev);
3161 if (ret)
3162 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003163
Chris Wilson05394f32010-11-08 19:18:58 +00003164 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00003165 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003166 ret = -ENOENT;
3167 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07003168 }
Eric Anholt673a3942008-07-30 12:06:12 -07003169
Chris Wilson05394f32010-11-08 19:18:58 +00003170 if (obj->madv != I915_MADV_WILLNEED) {
Chris Wilsonbb6baf72009-09-22 14:24:13 +01003171 DRM_ERROR("Attempting to pin a purgeable buffer\n");
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003172 ret = -EINVAL;
3173 goto out;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003174 }
3175
Chris Wilson05394f32010-11-08 19:18:58 +00003176 if (obj->pin_filp != NULL && obj->pin_filp != file) {
Jesse Barnes79e53942008-11-07 14:24:08 -08003177 DRM_ERROR("Already pinned in i915_gem_pin_ioctl(): %d\n",
3178 args->handle);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003179 ret = -EINVAL;
3180 goto out;
Jesse Barnes79e53942008-11-07 14:24:08 -08003181 }
3182
Chris Wilson05394f32010-11-08 19:18:58 +00003183 obj->user_pin_count++;
3184 obj->pin_filp = file;
3185 if (obj->user_pin_count == 1) {
Daniel Vetter75e9e912010-11-04 17:11:09 +01003186 ret = i915_gem_object_pin(obj, args->alignment, true);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003187 if (ret)
3188 goto out;
Eric Anholt673a3942008-07-30 12:06:12 -07003189 }
3190
3191 /* XXX - flush the CPU caches for pinned objects
3192 * as the X server doesn't manage domains yet
3193 */
Eric Anholte47c68e2008-11-14 13:35:19 -08003194 i915_gem_object_flush_cpu_write_domain(obj);
Chris Wilson05394f32010-11-08 19:18:58 +00003195 args->offset = obj->gtt_offset;
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003196out:
Chris Wilson05394f32010-11-08 19:18:58 +00003197 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003198unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07003199 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003200 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003201}
3202
3203int
3204i915_gem_unpin_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00003205 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003206{
3207 struct drm_i915_gem_pin *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003208 struct drm_i915_gem_object *obj;
Chris Wilson76c1dec2010-09-25 11:22:51 +01003209 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003210
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003211 ret = i915_mutex_lock_interruptible(dev);
3212 if (ret)
3213 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003214
Chris Wilson05394f32010-11-08 19:18:58 +00003215 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00003216 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003217 ret = -ENOENT;
3218 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07003219 }
Chris Wilson76c1dec2010-09-25 11:22:51 +01003220
Chris Wilson05394f32010-11-08 19:18:58 +00003221 if (obj->pin_filp != file) {
Jesse Barnes79e53942008-11-07 14:24:08 -08003222 DRM_ERROR("Not pinned by caller in i915_gem_pin_ioctl(): %d\n",
3223 args->handle);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003224 ret = -EINVAL;
3225 goto out;
Jesse Barnes79e53942008-11-07 14:24:08 -08003226 }
Chris Wilson05394f32010-11-08 19:18:58 +00003227 obj->user_pin_count--;
3228 if (obj->user_pin_count == 0) {
3229 obj->pin_filp = NULL;
Jesse Barnes79e53942008-11-07 14:24:08 -08003230 i915_gem_object_unpin(obj);
3231 }
Eric Anholt673a3942008-07-30 12:06:12 -07003232
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003233out:
Chris Wilson05394f32010-11-08 19:18:58 +00003234 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003235unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07003236 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003237 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003238}
3239
3240int
3241i915_gem_busy_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00003242 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003243{
3244 struct drm_i915_gem_busy *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003245 struct drm_i915_gem_object *obj;
Chris Wilson30dbf0c2010-09-25 10:19:17 +01003246 int ret;
3247
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003248 ret = i915_mutex_lock_interruptible(dev);
3249 if (ret)
3250 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003251
Chris Wilson05394f32010-11-08 19:18:58 +00003252 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00003253 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003254 ret = -ENOENT;
3255 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07003256 }
Zou Nan haid1b851f2010-05-21 09:08:57 +08003257
Chris Wilson0be555b2010-08-04 15:36:30 +01003258 /* Count all active objects as busy, even if they are currently not used
3259 * by the gpu. Users of this interface expect objects to eventually
3260 * become non-busy without any further actions, therefore emit any
3261 * necessary flushes here.
Eric Anholtc4de0a52008-12-14 19:05:04 -08003262 */
Chris Wilson05394f32010-11-08 19:18:58 +00003263 args->busy = obj->active;
Chris Wilson0be555b2010-08-04 15:36:30 +01003264 if (args->busy) {
3265 /* Unconditionally flush objects, even when the gpu still uses this
3266 * object. Userspace calling this function indicates that it wants to
 3267		 * use this buffer sooner rather than later, so issuing the required
3268 * flush earlier is beneficial.
3269 */
Chris Wilson1a1c6972010-12-07 23:00:20 +00003270 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00003271 ret = i915_gem_flush_ring(obj->ring,
Chris Wilson88241782011-01-07 17:09:48 +00003272 0, obj->base.write_domain);
Chris Wilson1a1c6972010-12-07 23:00:20 +00003273 } else if (obj->ring->outstanding_lazy_request ==
3274 obj->last_rendering_seqno) {
3275 struct drm_i915_gem_request *request;
3276
Chris Wilson7a194872010-12-07 10:38:40 +00003277 /* This ring is not being cleared by active usage,
3278 * so emit a request to do so.
3279 */
Chris Wilson1a1c6972010-12-07 23:00:20 +00003280 request = kzalloc(sizeof(*request), GFP_KERNEL);
Rakib Mullick457eafc2011-11-16 00:49:28 +06003281 if (request) {
Akshay Joshi0206e352011-08-16 15:34:10 -04003282 ret = i915_add_request(obj->ring, NULL, request);
Rakib Mullick457eafc2011-11-16 00:49:28 +06003283 if (ret)
3284 kfree(request);
3285 } else
Chris Wilson7a194872010-12-07 10:38:40 +00003286 ret = -ENOMEM;
3287 }
Chris Wilson0be555b2010-08-04 15:36:30 +01003288
3289 /* Update the active list for the hardware's current position.
3290 * Otherwise this only updates on a delayed timer or when irqs
3291 * are actually unmasked, and our working set ends up being
3292 * larger than required.
3293 */
Chris Wilsondb53a302011-02-03 11:57:46 +00003294 i915_gem_retire_requests_ring(obj->ring);
Chris Wilson0be555b2010-08-04 15:36:30 +01003295
Chris Wilson05394f32010-11-08 19:18:58 +00003296 args->busy = obj->active;
Chris Wilson0be555b2010-08-04 15:36:30 +01003297 }
Eric Anholt673a3942008-07-30 12:06:12 -07003298
Chris Wilson05394f32010-11-08 19:18:58 +00003299 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003300unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07003301 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003302 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003303}
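
/*
 * Editor's note: a hedged user-space sketch, not part of this kernel file,
 * of the polling pattern the comment above anticipates: a buffer cache
 * checks BUSY before reusing a buffer and relies on the kernel to emit any
 * required flushes so busy buffers become idle without further action.
 */
#if 0	/* user-space illustration, not compiled here */
#include <sys/ioctl.h>
#include <string.h>
#include <i915_drm.h>

static int example_bo_busy(int drm_fd, unsigned int handle)
{
	struct drm_i915_gem_busy busy;

	memset(&busy, 0, sizeof(busy));
	busy.handle = handle;

	if (ioctl(drm_fd, DRM_IOCTL_I915_GEM_BUSY, &busy))
		return -1;

	return busy.busy != 0;
}
#endif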
3304
3305int
3306i915_gem_throttle_ioctl(struct drm_device *dev, void *data,
3307 struct drm_file *file_priv)
3308{
Akshay Joshi0206e352011-08-16 15:34:10 -04003309 return i915_gem_ring_throttle(dev, file_priv);
Eric Anholt673a3942008-07-30 12:06:12 -07003310}
3311
Chris Wilson3ef94da2009-09-14 16:50:29 +01003312int
3313i915_gem_madvise_ioctl(struct drm_device *dev, void *data,
3314 struct drm_file *file_priv)
3315{
3316 struct drm_i915_gem_madvise *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003317 struct drm_i915_gem_object *obj;
Chris Wilson76c1dec2010-09-25 11:22:51 +01003318 int ret;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003319
3320 switch (args->madv) {
3321 case I915_MADV_DONTNEED:
3322 case I915_MADV_WILLNEED:
3323 break;
3324 default:
3325 return -EINVAL;
3326 }
3327
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003328 ret = i915_mutex_lock_interruptible(dev);
3329 if (ret)
3330 return ret;
3331
Chris Wilson05394f32010-11-08 19:18:58 +00003332 obj = to_intel_bo(drm_gem_object_lookup(dev, file_priv, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00003333 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003334 ret = -ENOENT;
3335 goto unlock;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003336 }
Chris Wilson3ef94da2009-09-14 16:50:29 +01003337
Chris Wilson05394f32010-11-08 19:18:58 +00003338 if (obj->pin_count) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003339 ret = -EINVAL;
3340 goto out;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003341 }
3342
Chris Wilson05394f32010-11-08 19:18:58 +00003343 if (obj->madv != __I915_MADV_PURGED)
3344 obj->madv = args->madv;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003345
Chris Wilson2d7ef392009-09-20 23:13:10 +01003346 /* if the object is no longer bound, discard its backing storage */
Chris Wilson05394f32010-11-08 19:18:58 +00003347 if (i915_gem_object_is_purgeable(obj) &&
3348 obj->gtt_space == NULL)
Chris Wilson2d7ef392009-09-20 23:13:10 +01003349 i915_gem_object_truncate(obj);
3350
Chris Wilson05394f32010-11-08 19:18:58 +00003351 args->retained = obj->madv != __I915_MADV_PURGED;
Chris Wilsonbb6baf72009-09-22 14:24:13 +01003352
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003353out:
Chris Wilson05394f32010-11-08 19:18:58 +00003354 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003355unlock:
Chris Wilson3ef94da2009-09-14 16:50:29 +01003356 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003357 return ret;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003358}
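
/*
 * Editor's note: a hedged user-space sketch, not part of this kernel file,
 * of how a buffer cache built on GEM uses the madvise ioctl above: buffers
 * parked in the cache are marked DONTNEED so the shrinker may reap their
 * pages, and are reused only if the kernel reports the storage was retained.
 */
#if 0	/* user-space illustration, not compiled here */
#include <sys/ioctl.h>
#include <string.h>
#include <i915_drm.h>

static int example_bo_madvise(int drm_fd, unsigned int handle,
			      unsigned int state)
{
	struct drm_i915_gem_madvise madv;

	memset(&madv, 0, sizeof(madv));
	madv.handle = handle;
	madv.madv = state;	/* I915_MADV_WILLNEED or I915_MADV_DONTNEED */

	if (ioctl(drm_fd, DRM_IOCTL_I915_GEM_MADVISE, &madv))
		return -1;

	/* 0 means the backing storage had already been purged. */
	return madv.retained;
}
#endif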
3359
Chris Wilson05394f32010-11-08 19:18:58 +00003360struct drm_i915_gem_object *i915_gem_alloc_object(struct drm_device *dev,
3361 size_t size)
Daniel Vetterac52bc52010-04-09 19:05:06 +00003362{
Chris Wilson73aa8082010-09-30 11:46:12 +01003363 struct drm_i915_private *dev_priv = dev->dev_private;
Daniel Vetterc397b902010-04-09 19:05:07 +00003364 struct drm_i915_gem_object *obj;
Hugh Dickins5949eac2011-06-27 16:18:18 -07003365 struct address_space *mapping;
Daniel Vetterc397b902010-04-09 19:05:07 +00003366
3367 obj = kzalloc(sizeof(*obj), GFP_KERNEL);
3368 if (obj == NULL)
3369 return NULL;
3370
3371 if (drm_gem_object_init(dev, &obj->base, size) != 0) {
3372 kfree(obj);
3373 return NULL;
3374 }
3375
Hugh Dickins5949eac2011-06-27 16:18:18 -07003376 mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
3377 mapping_set_gfp_mask(mapping, GFP_HIGHUSER | __GFP_RECLAIMABLE);
3378
Chris Wilson73aa8082010-09-30 11:46:12 +01003379 i915_gem_info_add_obj(dev_priv, size);
3380
Daniel Vetterc397b902010-04-09 19:05:07 +00003381 obj->base.write_domain = I915_GEM_DOMAIN_CPU;
3382 obj->base.read_domains = I915_GEM_DOMAIN_CPU;
3383
Eugeni Dodonov3d29b842012-01-17 14:43:53 -02003384 if (HAS_LLC(dev)) {
3385 /* On some devices, we can have the GPU use the LLC (the CPU
Eric Anholta1871112011-03-29 16:59:55 -07003386 * cache) for about a 10% performance improvement
3387 * compared to uncached. Graphics requests other than
3388 * display scanout are coherent with the CPU in
3389 * accessing this cache. This means in this mode we
3390 * don't need to clflush on the CPU side, and on the
3391 * GPU side we only need to flush internal caches to
3392 * get data visible to the CPU.
3393 *
3394 * However, we maintain the display planes as UC, and so
3395 * need to rebind when first used as such.
3396 */
3397 obj->cache_level = I915_CACHE_LLC;
3398 } else
3399 obj->cache_level = I915_CACHE_NONE;
3400
Daniel Vetter62b8b212010-04-09 19:05:08 +00003401 obj->base.driver_private = NULL;
Daniel Vetterc397b902010-04-09 19:05:07 +00003402 obj->fence_reg = I915_FENCE_REG_NONE;
Chris Wilson69dc4982010-10-19 10:36:51 +01003403 INIT_LIST_HEAD(&obj->mm_list);
Daniel Vetter93a37f22010-11-05 20:24:53 +01003404 INIT_LIST_HEAD(&obj->gtt_list);
Chris Wilson69dc4982010-10-19 10:36:51 +01003405 INIT_LIST_HEAD(&obj->ring_list);
Chris Wilson432e58e2010-11-25 19:32:06 +00003406 INIT_LIST_HEAD(&obj->exec_list);
Daniel Vetterc397b902010-04-09 19:05:07 +00003407 INIT_LIST_HEAD(&obj->gpu_write_list);
Daniel Vetterc397b902010-04-09 19:05:07 +00003408 obj->madv = I915_MADV_WILLNEED;
Daniel Vetter75e9e912010-11-04 17:11:09 +01003409 /* Avoid an unnecessary call to unbind on the first bind. */
3410 obj->map_and_fenceable = true;
Daniel Vetterc397b902010-04-09 19:05:07 +00003411
Chris Wilson05394f32010-11-08 19:18:58 +00003412 return obj;
Daniel Vetterac52bc52010-04-09 19:05:06 +00003413}
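
/*
 * Editor's note: an illustrative sketch, not part of the original file, of
 * how other parts of the driver are expected to allocate and place a
 * kernel-owned object with the helper above; the wrapper name, alignment
 * and pin flags are hypothetical.
 */
#if 0	/* illustrative only, not compiled */
static struct drm_i915_gem_object *
example_alloc_pinned(struct drm_device *dev, size_t size)
{
	struct drm_i915_gem_object *obj;

	obj = i915_gem_alloc_object(dev, size);
	if (obj == NULL)
		return NULL;

	/* Objects only ever touched by the GPU can stay out of the
	 * mappable aperture.
	 */
	if (i915_gem_object_pin(obj, 4096, false)) {
		drm_gem_object_unreference(&obj->base);
		return NULL;
	}

	return obj;
}
#endif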
3414
Eric Anholt673a3942008-07-30 12:06:12 -07003415int i915_gem_init_object(struct drm_gem_object *obj)
3416{
Daniel Vetterc397b902010-04-09 19:05:07 +00003417 BUG();
Jesse Barnesde151cf2008-11-12 10:03:55 -08003418
Eric Anholt673a3942008-07-30 12:06:12 -07003419 return 0;
3420}
3421
Chris Wilson05394f32010-11-08 19:18:58 +00003422static void i915_gem_free_object_tail(struct drm_i915_gem_object *obj)
Chris Wilsonbe726152010-07-23 23:18:50 +01003423{
Chris Wilson05394f32010-11-08 19:18:58 +00003424 struct drm_device *dev = obj->base.dev;
Chris Wilsonbe726152010-07-23 23:18:50 +01003425 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilsonbe726152010-07-23 23:18:50 +01003426 int ret;
3427
3428 ret = i915_gem_object_unbind(obj);
3429 if (ret == -ERESTARTSYS) {
Chris Wilson05394f32010-11-08 19:18:58 +00003430 list_move(&obj->mm_list,
Chris Wilsonbe726152010-07-23 23:18:50 +01003431 &dev_priv->mm.deferred_free_list);
3432 return;
3433 }
3434
Chris Wilson26e12f82011-03-20 11:20:19 +00003435 trace_i915_gem_object_destroy(obj);
3436
Chris Wilson05394f32010-11-08 19:18:58 +00003437 if (obj->base.map_list.map)
Rob Clarkb464e9a2011-08-10 08:09:08 -05003438 drm_gem_free_mmap_offset(&obj->base);
Chris Wilsonbe726152010-07-23 23:18:50 +01003439
Chris Wilson05394f32010-11-08 19:18:58 +00003440 drm_gem_object_release(&obj->base);
3441 i915_gem_info_remove_obj(dev_priv, obj->base.size);
Chris Wilsonbe726152010-07-23 23:18:50 +01003442
Chris Wilson05394f32010-11-08 19:18:58 +00003443 kfree(obj->bit_17);
3444 kfree(obj);
Chris Wilsonbe726152010-07-23 23:18:50 +01003445}
3446
Chris Wilson05394f32010-11-08 19:18:58 +00003447void i915_gem_free_object(struct drm_gem_object *gem_obj)
Eric Anholt673a3942008-07-30 12:06:12 -07003448{
Chris Wilson05394f32010-11-08 19:18:58 +00003449 struct drm_i915_gem_object *obj = to_intel_bo(gem_obj);
3450 struct drm_device *dev = obj->base.dev;
Eric Anholt673a3942008-07-30 12:06:12 -07003451
Chris Wilson05394f32010-11-08 19:18:58 +00003452 while (obj->pin_count > 0)
Eric Anholt673a3942008-07-30 12:06:12 -07003453 i915_gem_object_unpin(obj);
3454
Chris Wilson05394f32010-11-08 19:18:58 +00003455 if (obj->phys_obj)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003456 i915_gem_detach_phys_object(dev, obj);
3457
Chris Wilsonbe726152010-07-23 23:18:50 +01003458 i915_gem_free_object_tail(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07003459}
3460
Jesse Barnes5669fca2009-02-17 15:13:31 -08003461int
Eric Anholt673a3942008-07-30 12:06:12 -07003462i915_gem_idle(struct drm_device *dev)
3463{
3464 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson29105cc2010-01-07 10:39:13 +00003465 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003466
Keith Packard6dbe2772008-10-14 21:41:13 -07003467 mutex_lock(&dev->struct_mutex);
3468
Chris Wilson87acb0a2010-10-19 10:13:00 +01003469 if (dev_priv->mm.suspended) {
Keith Packard6dbe2772008-10-14 21:41:13 -07003470 mutex_unlock(&dev->struct_mutex);
Eric Anholt673a3942008-07-30 12:06:12 -07003471 return 0;
Keith Packard6dbe2772008-10-14 21:41:13 -07003472 }
Eric Anholt673a3942008-07-30 12:06:12 -07003473
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08003474 ret = i915_gpu_idle(dev, true);
Keith Packard6dbe2772008-10-14 21:41:13 -07003475 if (ret) {
3476 mutex_unlock(&dev->struct_mutex);
Eric Anholt673a3942008-07-30 12:06:12 -07003477 return ret;
Keith Packard6dbe2772008-10-14 21:41:13 -07003478 }
Eric Anholt673a3942008-07-30 12:06:12 -07003479
Chris Wilson29105cc2010-01-07 10:39:13 +00003480 /* Under UMS, be paranoid and evict. */
3481 if (!drm_core_check_feature(dev, DRIVER_MODESET)) {
Chris Wilson5eac3ab2010-10-31 08:49:47 +00003482 ret = i915_gem_evict_inactive(dev, false);
Chris Wilson29105cc2010-01-07 10:39:13 +00003483 if (ret) {
3484 mutex_unlock(&dev->struct_mutex);
3485 return ret;
3486 }
3487 }
3488
Chris Wilson312817a2010-11-22 11:50:11 +00003489 i915_gem_reset_fences(dev);
3490
Chris Wilson29105cc2010-01-07 10:39:13 +00003491 /* Hack! Don't let anybody do execbuf while we don't control the chip.
3492 * We need to replace this with a semaphore, or something.
3493 * And not confound mm.suspended!
3494 */
3495 dev_priv->mm.suspended = 1;
Daniel Vetterbc0c7f12010-08-20 18:18:48 +02003496 del_timer_sync(&dev_priv->hangcheck_timer);
Chris Wilson29105cc2010-01-07 10:39:13 +00003497
3498 i915_kernel_lost_context(dev);
Keith Packard6dbe2772008-10-14 21:41:13 -07003499 i915_gem_cleanup_ringbuffer(dev);
Chris Wilson29105cc2010-01-07 10:39:13 +00003500
Keith Packard6dbe2772008-10-14 21:41:13 -07003501 mutex_unlock(&dev->struct_mutex);
3502
Chris Wilson29105cc2010-01-07 10:39:13 +00003503 /* Cancel the retire work handler, which should be idle now. */
3504 cancel_delayed_work_sync(&dev_priv->mm.retire_work);
3505
Eric Anholt673a3942008-07-30 12:06:12 -07003506 return 0;
3507}
3508
Daniel Vetterf691e2f2012-02-02 09:58:12 +01003509void i915_gem_init_swizzling(struct drm_device *dev)
3510{
3511 drm_i915_private_t *dev_priv = dev->dev_private;
3512
Daniel Vetter11782b02012-01-31 16:47:55 +01003513 if (INTEL_INFO(dev)->gen < 5 ||
Daniel Vetterf691e2f2012-02-02 09:58:12 +01003514 dev_priv->mm.bit_6_swizzle_x == I915_BIT_6_SWIZZLE_NONE)
3515 return;
3516
3517 I915_WRITE(DISP_ARB_CTL, I915_READ(DISP_ARB_CTL) |
3518 DISP_TILE_SURFACE_SWIZZLING);
3519
Daniel Vetter11782b02012-01-31 16:47:55 +01003520 if (IS_GEN5(dev))
3521 return;
3522
Daniel Vetterf691e2f2012-02-02 09:58:12 +01003523 I915_WRITE(TILECTL, I915_READ(TILECTL) | TILECTL_SWZCTL);
3524 if (IS_GEN6(dev))
3525 I915_WRITE(ARB_MODE, ARB_MODE_ENABLE(ARB_MODE_SWIZZLE_SNB));
3526 else
3527 I915_WRITE(ARB_MODE, ARB_MODE_ENABLE(ARB_MODE_SWIZZLE_IVB));
3528}
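
/*
 * Aside, illustrative only: ARB_MODE, GFX_MODE and the per-ring
 * RING_MODE_GEN7 registers written in this file use the hardware's
 * "masked write" layout, where bits 31:16 select which of bits 15:0 are
 * actually updated.  The ARB_MODE_ENABLE()/GFX_MODE_ENABLE() macros used
 * above are assumed to expand to this pattern; the helpers below only
 * spell the convention out and are not part of the driver.
 */
#define MASKED_BIT_ENABLE_SKETCH(bit)	(((bit) << 16) | (bit))	/* set bit */
#define MASKED_BIT_DISABLE_SKETCH(bit)	((bit) << 16)		/* clear bit */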
Daniel Vettere21af882012-02-09 20:53:27 +01003529
3530void i915_gem_init_ppgtt(struct drm_device *dev)
3531{
3532 drm_i915_private_t *dev_priv = dev->dev_private;
3533 uint32_t pd_offset;
3534 struct intel_ring_buffer *ring;
3535 int i;
3536
3537 if (!dev_priv->mm.aliasing_ppgtt)
3538 return;
3539
3540 pd_offset = dev_priv->mm.aliasing_ppgtt->pd_offset;
3541	pd_offset /= 64; /* in cachelines */
3542 pd_offset <<= 16;
3543
3544 if (INTEL_INFO(dev)->gen == 6) {
3545 uint32_t ecochk = I915_READ(GAM_ECOCHK);
3546 I915_WRITE(GAM_ECOCHK, ecochk | ECOCHK_SNB_BIT |
3547 ECOCHK_PPGTT_CACHE64B);
3548 I915_WRITE(GFX_MODE, GFX_MODE_ENABLE(GFX_PPGTT_ENABLE));
3549 } else if (INTEL_INFO(dev)->gen >= 7) {
3550 I915_WRITE(GAM_ECOCHK, ECOCHK_PPGTT_CACHE64B);
3551 /* GFX_MODE is per-ring on gen7+ */
3552 }
3553
3554 for (i = 0; i < I915_NUM_RINGS; i++) {
3555 ring = &dev_priv->ring[i];
3556
3557 if (INTEL_INFO(dev)->gen >= 7)
3558 I915_WRITE(RING_MODE_GEN7(ring),
3559 GFX_MODE_ENABLE(GFX_PPGTT_ENABLE));
3560
3561 I915_WRITE(RING_PP_DIR_DCLV(ring), PP_DIR_DCLV_2G);
3562 I915_WRITE(RING_PP_DIR_BASE(ring), pd_offset);
3563 }
3564}
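
/*
 * Illustrative helper, not in the driver: this is the encoding the loop
 * above performs before writing RING_PP_DIR_BASE.  The page-directory
 * offset starts out in bytes, is converted to 64-byte GTT cachelines and
 * then shifted into place.  E.g. a page directory at byte offset 0x10000
 * encodes as (0x10000 / 64) << 16 = 0x04000000; the helper name and the
 * example offset are assumptions.
 */
static inline uint32_t pp_dir_base_encode_sketch(uint32_t pd_byte_offset)
{
	return (pd_byte_offset / 64) << 16;	/* cachelines, shifted into position */
}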
3565
Eric Anholt673a3942008-07-30 12:06:12 -07003566int
Daniel Vetterf691e2f2012-02-02 09:58:12 +01003567i915_gem_init_hw(struct drm_device *dev)
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003568{
3569 drm_i915_private_t *dev_priv = dev->dev_private;
3570 int ret;
Chris Wilson68f95ba2010-05-27 13:18:22 +01003571
Daniel Vetterf691e2f2012-02-02 09:58:12 +01003572 i915_gem_init_swizzling(dev);
3573
Xiang, Haihao5c1143b2010-09-16 10:43:11 +08003574 ret = intel_init_render_ring_buffer(dev);
Chris Wilson68f95ba2010-05-27 13:18:22 +01003575 if (ret)
Chris Wilsonb6913e42010-11-12 10:46:37 +00003576 return ret;
Chris Wilson68f95ba2010-05-27 13:18:22 +01003577
3578 if (HAS_BSD(dev)) {
Xiang, Haihao5c1143b2010-09-16 10:43:11 +08003579 ret = intel_init_bsd_ring_buffer(dev);
Chris Wilson68f95ba2010-05-27 13:18:22 +01003580 if (ret)
3581 goto cleanup_render_ring;
Zou Nan haid1b851f2010-05-21 09:08:57 +08003582 }
Chris Wilson68f95ba2010-05-27 13:18:22 +01003583
Chris Wilson549f7362010-10-19 11:19:32 +01003584 if (HAS_BLT(dev)) {
3585 ret = intel_init_blt_ring_buffer(dev);
3586 if (ret)
3587 goto cleanup_bsd_ring;
3588 }
3589
Chris Wilson6f392d52010-08-07 11:01:22 +01003590 dev_priv->next_seqno = 1;
3591
Daniel Vettere21af882012-02-09 20:53:27 +01003592 i915_gem_init_ppgtt(dev);
3593
Chris Wilson68f95ba2010-05-27 13:18:22 +01003594 return 0;
3595
Chris Wilson549f7362010-10-19 11:19:32 +01003596cleanup_bsd_ring:
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003597 intel_cleanup_ring_buffer(&dev_priv->ring[VCS]);
Chris Wilson68f95ba2010-05-27 13:18:22 +01003598cleanup_render_ring:
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003599 intel_cleanup_ring_buffer(&dev_priv->ring[RCS]);
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003600 return ret;
3601}
3602
3603void
3604i915_gem_cleanup_ringbuffer(struct drm_device *dev)
3605{
3606 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003607 int i;
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003608
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003609 for (i = 0; i < I915_NUM_RINGS; i++)
3610 intel_cleanup_ring_buffer(&dev_priv->ring[i]);
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003611}
3612
3613int
Eric Anholt673a3942008-07-30 12:06:12 -07003614i915_gem_entervt_ioctl(struct drm_device *dev, void *data,
3615 struct drm_file *file_priv)
3616{
3617 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003618 int ret, i;
Eric Anholt673a3942008-07-30 12:06:12 -07003619
Jesse Barnes79e53942008-11-07 14:24:08 -08003620 if (drm_core_check_feature(dev, DRIVER_MODESET))
3621 return 0;
3622
Ben Gamariba1234d2009-09-14 17:48:47 -04003623 if (atomic_read(&dev_priv->mm.wedged)) {
Eric Anholt673a3942008-07-30 12:06:12 -07003624 DRM_ERROR("Reenabling wedged hardware, good luck\n");
Ben Gamariba1234d2009-09-14 17:48:47 -04003625 atomic_set(&dev_priv->mm.wedged, 0);
Eric Anholt673a3942008-07-30 12:06:12 -07003626 }
3627
Eric Anholt673a3942008-07-30 12:06:12 -07003628 mutex_lock(&dev->struct_mutex);
Eric Anholt9bb2d6f2008-12-23 18:42:32 -08003629 dev_priv->mm.suspended = 0;
3630
Daniel Vetterf691e2f2012-02-02 09:58:12 +01003631 ret = i915_gem_init_hw(dev);
Wu Fengguangd816f6a2009-04-18 10:43:32 +08003632 if (ret != 0) {
3633 mutex_unlock(&dev->struct_mutex);
Eric Anholt9bb2d6f2008-12-23 18:42:32 -08003634 return ret;
Wu Fengguangd816f6a2009-04-18 10:43:32 +08003635 }
Eric Anholt9bb2d6f2008-12-23 18:42:32 -08003636
Chris Wilson69dc4982010-10-19 10:36:51 +01003637 BUG_ON(!list_empty(&dev_priv->mm.active_list));
Eric Anholt673a3942008-07-30 12:06:12 -07003638 BUG_ON(!list_empty(&dev_priv->mm.flushing_list));
3639 BUG_ON(!list_empty(&dev_priv->mm.inactive_list));
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003640 for (i = 0; i < I915_NUM_RINGS; i++) {
3641 BUG_ON(!list_empty(&dev_priv->ring[i].active_list));
3642 BUG_ON(!list_empty(&dev_priv->ring[i].request_list));
3643 }
Eric Anholt673a3942008-07-30 12:06:12 -07003644 mutex_unlock(&dev->struct_mutex);
Kristian Høgsbergdbb19d32008-08-20 11:04:27 -04003645
Chris Wilson5f353082010-06-07 14:03:03 +01003646 ret = drm_irq_install(dev);
3647 if (ret)
3648 goto cleanup_ringbuffer;
Kristian Høgsbergdbb19d32008-08-20 11:04:27 -04003649
Eric Anholt673a3942008-07-30 12:06:12 -07003650 return 0;
Chris Wilson5f353082010-06-07 14:03:03 +01003651
3652cleanup_ringbuffer:
3653 mutex_lock(&dev->struct_mutex);
3654 i915_gem_cleanup_ringbuffer(dev);
3655 dev_priv->mm.suspended = 1;
3656 mutex_unlock(&dev->struct_mutex);
3657
3658 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003659}
3660
3661int
3662i915_gem_leavevt_ioctl(struct drm_device *dev, void *data,
3663 struct drm_file *file_priv)
3664{
Jesse Barnes79e53942008-11-07 14:24:08 -08003665 if (drm_core_check_feature(dev, DRIVER_MODESET))
3666 return 0;
3667
Kristian Høgsbergdbb19d32008-08-20 11:04:27 -04003668 drm_irq_uninstall(dev);
Linus Torvaldse6890f62009-09-08 17:09:24 -07003669 return i915_gem_idle(dev);
Eric Anholt673a3942008-07-30 12:06:12 -07003670}
3671
3672void
3673i915_gem_lastclose(struct drm_device *dev)
3674{
3675 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003676
Eric Anholte806b492009-01-22 09:56:58 -08003677 if (drm_core_check_feature(dev, DRIVER_MODESET))
3678 return;
3679
Keith Packard6dbe2772008-10-14 21:41:13 -07003680 ret = i915_gem_idle(dev);
3681 if (ret)
3682 DRM_ERROR("failed to idle hardware: %d\n", ret);
Eric Anholt673a3942008-07-30 12:06:12 -07003683}
3684
Chris Wilson64193402010-10-24 12:38:05 +01003685static void
3686init_ring_lists(struct intel_ring_buffer *ring)
3687{
3688 INIT_LIST_HEAD(&ring->active_list);
3689 INIT_LIST_HEAD(&ring->request_list);
3690 INIT_LIST_HEAD(&ring->gpu_write_list);
3691}
3692
Eric Anholt673a3942008-07-30 12:06:12 -07003693void
3694i915_gem_load(struct drm_device *dev)
3695{
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003696 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07003697 drm_i915_private_t *dev_priv = dev->dev_private;
3698
Chris Wilson69dc4982010-10-19 10:36:51 +01003699 INIT_LIST_HEAD(&dev_priv->mm.active_list);
Eric Anholt673a3942008-07-30 12:06:12 -07003700 INIT_LIST_HEAD(&dev_priv->mm.flushing_list);
3701 INIT_LIST_HEAD(&dev_priv->mm.inactive_list);
Chris Wilsonf13d3f72010-09-20 17:36:15 +01003702 INIT_LIST_HEAD(&dev_priv->mm.pinned_list);
Eric Anholta09ba7f2009-08-29 12:49:51 -07003703 INIT_LIST_HEAD(&dev_priv->mm.fence_list);
Chris Wilsonbe726152010-07-23 23:18:50 +01003704 INIT_LIST_HEAD(&dev_priv->mm.deferred_free_list);
Daniel Vetter93a37f22010-11-05 20:24:53 +01003705 INIT_LIST_HEAD(&dev_priv->mm.gtt_list);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003706 for (i = 0; i < I915_NUM_RINGS; i++)
3707 init_ring_lists(&dev_priv->ring[i]);
Daniel Vetter4b9de732011-10-09 21:52:02 +02003708 for (i = 0; i < I915_MAX_NUM_FENCES; i++)
Daniel Vetter007cc8a2010-04-28 11:02:31 +02003709 INIT_LIST_HEAD(&dev_priv->fence_regs[i].lru_list);
Eric Anholt673a3942008-07-30 12:06:12 -07003710 INIT_DELAYED_WORK(&dev_priv->mm.retire_work,
3711 i915_gem_retire_work_handler);
Chris Wilson30dbf0c2010-09-25 10:19:17 +01003712 init_completion(&dev_priv->error_completion);
Chris Wilson31169712009-09-14 16:50:28 +01003713
Dave Airlie94400122010-07-20 13:15:31 +10003714 /* On GEN3 we really need to make sure the ARB C3 LP bit is set */
3715 if (IS_GEN3(dev)) {
3716 u32 tmp = I915_READ(MI_ARB_STATE);
3717 if (!(tmp & MI_ARB_C3_LP_WRITE_ENABLE)) {
3718 /* arb state is a masked write, so set bit + bit in mask */
3719 tmp = MI_ARB_C3_LP_WRITE_ENABLE | (MI_ARB_C3_LP_WRITE_ENABLE << MI_ARB_MASK_SHIFT);
3720 I915_WRITE(MI_ARB_STATE, tmp);
3721 }
3722 }
3723
Chris Wilson72bfa192010-12-19 11:42:05 +00003724 dev_priv->relative_constants_mode = I915_EXEC_CONSTANTS_REL_GENERAL;
3725
Jesse Barnesde151cf2008-11-12 10:03:55 -08003726 /* Old X drivers will take 0-2 for front, back, depth buffers */
Eric Anholtb397c832010-01-26 09:43:10 -08003727 if (!drm_core_check_feature(dev, DRIVER_MODESET))
3728 dev_priv->fence_reg_start = 3;
Jesse Barnesde151cf2008-11-12 10:03:55 -08003729
Chris Wilsona6c45cf2010-09-17 00:32:17 +01003730 if (INTEL_INFO(dev)->gen >= 4 || IS_I945G(dev) || IS_I945GM(dev) || IS_G33(dev))
Jesse Barnesde151cf2008-11-12 10:03:55 -08003731 dev_priv->num_fence_regs = 16;
3732 else
3733 dev_priv->num_fence_regs = 8;
3734
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003735 /* Initialize fence registers to zero */
Eric Anholt10ed13e2011-05-06 13:53:49 -07003736 for (i = 0; i < dev_priv->num_fence_regs; i++) {
3737 i915_gem_clear_fence_reg(dev, &dev_priv->fence_regs[i]);
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003738 }
Eric Anholt10ed13e2011-05-06 13:53:49 -07003739
Eric Anholt673a3942008-07-30 12:06:12 -07003740 i915_gem_detect_bit_6_swizzle(dev);
Kristian Høgsberg6b95a202009-11-18 11:25:18 -05003741 init_waitqueue_head(&dev_priv->pending_flip_queue);
Chris Wilson17250b72010-10-28 12:51:39 +01003742
Chris Wilsonce453d82011-02-21 14:43:56 +00003743 dev_priv->mm.interruptible = true;
3744
Chris Wilson17250b72010-10-28 12:51:39 +01003745 dev_priv->mm.inactive_shrinker.shrink = i915_gem_inactive_shrink;
3746 dev_priv->mm.inactive_shrinker.seeks = DEFAULT_SEEKS;
3747 register_shrinker(&dev_priv->mm.inactive_shrinker);
Eric Anholt673a3942008-07-30 12:06:12 -07003748}
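
/*
 * Illustrative sketch, not part of this file: the retire_work initialized
 * in i915_gem_load() above is a delayed work item that the rest of the
 * driver re-arms whenever requests are outstanding, roughly as below, so
 * completed buffers migrate to the inactive list without further ioctls.
 * The one-second period and the use of dev_priv->wq are assumptions here.
 */
static void i915_gem_arm_retire_work_sketch(drm_i915_private_t *dev_priv)
{
	queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, HZ);
}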
Dave Airlie71acb5e2008-12-30 20:31:46 +10003749
3750/*
3751 * Create a physically contiguous memory object for this object,
3752 * e.g. for cursor or overlay registers.
3753 */
Chris Wilson995b6762010-08-20 13:23:26 +01003754static int i915_gem_init_phys_object(struct drm_device *dev,
3755 int id, int size, int align)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003756{
3757 drm_i915_private_t *dev_priv = dev->dev_private;
3758 struct drm_i915_gem_phys_object *phys_obj;
3759 int ret;
3760
3761 if (dev_priv->mm.phys_objs[id - 1] || !size)
3762 return 0;
3763
Eric Anholt9a298b22009-03-24 12:23:04 -07003764 phys_obj = kzalloc(sizeof(struct drm_i915_gem_phys_object), GFP_KERNEL);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003765 if (!phys_obj)
3766 return -ENOMEM;
3767
3768 phys_obj->id = id;
3769
Chris Wilson6eeefaf2010-08-07 11:01:39 +01003770 phys_obj->handle = drm_pci_alloc(dev, size, align);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003771 if (!phys_obj->handle) {
3772 ret = -ENOMEM;
3773 goto kfree_obj;
3774 }
3775#ifdef CONFIG_X86
3776 set_memory_wc((unsigned long)phys_obj->handle->vaddr, phys_obj->handle->size / PAGE_SIZE);
3777#endif
3778
3779 dev_priv->mm.phys_objs[id - 1] = phys_obj;
3780
3781 return 0;
3782kfree_obj:
Eric Anholt9a298b22009-03-24 12:23:04 -07003783 kfree(phys_obj);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003784 return ret;
3785}
3786
Chris Wilson995b6762010-08-20 13:23:26 +01003787static void i915_gem_free_phys_object(struct drm_device *dev, int id)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003788{
3789 drm_i915_private_t *dev_priv = dev->dev_private;
3790 struct drm_i915_gem_phys_object *phys_obj;
3791
3792 if (!dev_priv->mm.phys_objs[id - 1])
3793 return;
3794
3795 phys_obj = dev_priv->mm.phys_objs[id - 1];
3796 if (phys_obj->cur_obj) {
3797 i915_gem_detach_phys_object(dev, phys_obj->cur_obj);
3798 }
3799
3800#ifdef CONFIG_X86
3801 set_memory_wb((unsigned long)phys_obj->handle->vaddr, phys_obj->handle->size / PAGE_SIZE);
3802#endif
3803 drm_pci_free(dev, phys_obj->handle);
3804 kfree(phys_obj);
3805 dev_priv->mm.phys_objs[id - 1] = NULL;
3806}
3807
3808void i915_gem_free_all_phys_object(struct drm_device *dev)
3809{
3810 int i;
3811
Dave Airlie260883c2009-01-22 17:58:49 +10003812 for (i = I915_GEM_PHYS_CURSOR_0; i <= I915_MAX_PHYS_OBJECT; i++)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003813 i915_gem_free_phys_object(dev, i);
3814}
3815
3816void i915_gem_detach_phys_object(struct drm_device *dev,
Chris Wilson05394f32010-11-08 19:18:58 +00003817 struct drm_i915_gem_object *obj)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003818{
Chris Wilson05394f32010-11-08 19:18:58 +00003819 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Chris Wilsone5281cc2010-10-28 13:45:36 +01003820 char *vaddr;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003821 int i;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003822 int page_count;
3823
Chris Wilson05394f32010-11-08 19:18:58 +00003824 if (!obj->phys_obj)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003825 return;
Chris Wilson05394f32010-11-08 19:18:58 +00003826 vaddr = obj->phys_obj->handle->vaddr;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003827
Chris Wilson05394f32010-11-08 19:18:58 +00003828 page_count = obj->base.size / PAGE_SIZE;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003829 for (i = 0; i < page_count; i++) {
Hugh Dickins5949eac2011-06-27 16:18:18 -07003830 struct page *page = shmem_read_mapping_page(mapping, i);
Chris Wilsone5281cc2010-10-28 13:45:36 +01003831 if (!IS_ERR(page)) {
3832 char *dst = kmap_atomic(page);
3833 memcpy(dst, vaddr + i*PAGE_SIZE, PAGE_SIZE);
3834 kunmap_atomic(dst);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003835
Chris Wilsone5281cc2010-10-28 13:45:36 +01003836 drm_clflush_pages(&page, 1);
3837
3838 set_page_dirty(page);
3839 mark_page_accessed(page);
3840 page_cache_release(page);
3841 }
Dave Airlie71acb5e2008-12-30 20:31:46 +10003842 }
Daniel Vetter40ce6572010-11-05 18:12:18 +01003843 intel_gtt_chipset_flush();
Chris Wilsond78b47b2009-06-17 21:52:49 +01003844
Chris Wilson05394f32010-11-08 19:18:58 +00003845 obj->phys_obj->cur_obj = NULL;
3846 obj->phys_obj = NULL;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003847}
3848
3849int
3850i915_gem_attach_phys_object(struct drm_device *dev,
Chris Wilson05394f32010-11-08 19:18:58 +00003851 struct drm_i915_gem_object *obj,
Chris Wilson6eeefaf2010-08-07 11:01:39 +01003852 int id,
3853 int align)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003854{
Chris Wilson05394f32010-11-08 19:18:58 +00003855 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003856 drm_i915_private_t *dev_priv = dev->dev_private;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003857 int ret = 0;
3858 int page_count;
3859 int i;
3860
3861 if (id > I915_MAX_PHYS_OBJECT)
3862 return -EINVAL;
3863
Chris Wilson05394f32010-11-08 19:18:58 +00003864 if (obj->phys_obj) {
3865 if (obj->phys_obj->id == id)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003866 return 0;
3867 i915_gem_detach_phys_object(dev, obj);
3868 }
3869
Dave Airlie71acb5e2008-12-30 20:31:46 +10003870 /* create a new object */
3871 if (!dev_priv->mm.phys_objs[id - 1]) {
3872 ret = i915_gem_init_phys_object(dev, id,
Chris Wilson05394f32010-11-08 19:18:58 +00003873 obj->base.size, align);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003874 if (ret) {
Chris Wilson05394f32010-11-08 19:18:58 +00003875 DRM_ERROR("failed to init phys object %d size: %zu\n",
3876 id, obj->base.size);
Chris Wilsone5281cc2010-10-28 13:45:36 +01003877 return ret;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003878 }
3879 }
3880
3881 /* bind to the object */
Chris Wilson05394f32010-11-08 19:18:58 +00003882 obj->phys_obj = dev_priv->mm.phys_objs[id - 1];
3883 obj->phys_obj->cur_obj = obj;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003884
Chris Wilson05394f32010-11-08 19:18:58 +00003885 page_count = obj->base.size / PAGE_SIZE;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003886
3887 for (i = 0; i < page_count; i++) {
Chris Wilsone5281cc2010-10-28 13:45:36 +01003888 struct page *page;
3889 char *dst, *src;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003890
Hugh Dickins5949eac2011-06-27 16:18:18 -07003891 page = shmem_read_mapping_page(mapping, i);
Chris Wilsone5281cc2010-10-28 13:45:36 +01003892 if (IS_ERR(page))
3893 return PTR_ERR(page);
3894
Chris Wilsonff75b9b2010-10-30 22:52:31 +01003895 src = kmap_atomic(page);
Chris Wilson05394f32010-11-08 19:18:58 +00003896 dst = obj->phys_obj->handle->vaddr + (i * PAGE_SIZE);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003897 memcpy(dst, src, PAGE_SIZE);
Peter Zijlstra3e4d3af2010-10-26 14:21:51 -07003898 kunmap_atomic(src);
Chris Wilsone5281cc2010-10-28 13:45:36 +01003899
3900 mark_page_accessed(page);
3901 page_cache_release(page);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003902 }
3903
3904 return 0;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003905}
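
/*
 * Illustrative usage, assumed call site rather than code from this file:
 * the cursor code is the typical consumer of the phys-object path on
 * chips whose cursor must be physically contiguous, e.g.
 *
 *	ret = i915_gem_attach_phys_object(dev, obj,
 *					  I915_GEM_PHYS_CURSOR_0 + pipe,
 *					  align);
 *
 * where "pipe" and "align" come from the caller.  Once attached, writes
 * are routed through i915_gem_phys_pwrite() below instead of the normal
 * shmem-backed pwrite path.
 */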
3906
3907static int
Chris Wilson05394f32010-11-08 19:18:58 +00003908i915_gem_phys_pwrite(struct drm_device *dev,
3909 struct drm_i915_gem_object *obj,
Dave Airlie71acb5e2008-12-30 20:31:46 +10003910 struct drm_i915_gem_pwrite *args,
3911 struct drm_file *file_priv)
3912{
Chris Wilson05394f32010-11-08 19:18:58 +00003913 void *vaddr = obj->phys_obj->handle->vaddr + args->offset;
Chris Wilsonb47b30c2010-11-08 01:12:29 +00003914 char __user *user_data = (char __user *) (uintptr_t) args->data_ptr;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003915
Chris Wilsonb47b30c2010-11-08 01:12:29 +00003916 if (__copy_from_user_inatomic_nocache(vaddr, user_data, args->size)) {
3917 unsigned long unwritten;
3918
3919 /* The physical object once assigned is fixed for the lifetime
3920 * of the obj, so we can safely drop the lock and continue
3921 * to access vaddr.
3922 */
3923 mutex_unlock(&dev->struct_mutex);
3924 unwritten = copy_from_user(vaddr, user_data, args->size);
3925 mutex_lock(&dev->struct_mutex);
3926 if (unwritten)
3927 return -EFAULT;
3928 }
Dave Airlie71acb5e2008-12-30 20:31:46 +10003929
Daniel Vetter40ce6572010-11-05 18:12:18 +01003930 intel_gtt_chipset_flush();
Dave Airlie71acb5e2008-12-30 20:31:46 +10003931 return 0;
3932}
Eric Anholtb9624422009-06-03 07:27:35 +00003933
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003934void i915_gem_release(struct drm_device *dev, struct drm_file *file)
Eric Anholtb9624422009-06-03 07:27:35 +00003935{
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003936 struct drm_i915_file_private *file_priv = file->driver_priv;
Eric Anholtb9624422009-06-03 07:27:35 +00003937
3938 /* Clean up our request list when the client is going away, so that
3939 * later retire_requests won't dereference our soon-to-be-gone
3940 * file_priv.
3941 */
Chris Wilson1c255952010-09-26 11:03:27 +01003942 spin_lock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003943 while (!list_empty(&file_priv->mm.request_list)) {
3944 struct drm_i915_gem_request *request;
3945
3946 request = list_first_entry(&file_priv->mm.request_list,
3947 struct drm_i915_gem_request,
3948 client_list);
3949 list_del(&request->client_list);
3950 request->file_priv = NULL;
3951 }
Chris Wilson1c255952010-09-26 11:03:27 +01003952 spin_unlock(&file_priv->mm.lock);
Eric Anholtb9624422009-06-03 07:27:35 +00003953}
Chris Wilson31169712009-09-14 16:50:28 +01003954
Chris Wilson31169712009-09-14 16:50:28 +01003955static int
Chris Wilson1637ef42010-04-20 17:10:35 +01003956i915_gpu_is_active(struct drm_device *dev)
3957{
3958 drm_i915_private_t *dev_priv = dev->dev_private;
3959 int lists_empty;
3960
Chris Wilson1637ef42010-04-20 17:10:35 +01003961 lists_empty = list_empty(&dev_priv->mm.flushing_list) &&
Chris Wilson17250b72010-10-28 12:51:39 +01003962 list_empty(&dev_priv->mm.active_list);
Chris Wilson1637ef42010-04-20 17:10:35 +01003963
3964 return !lists_empty;
3965}
3966
3967static int
Ying Han1495f232011-05-24 17:12:27 -07003968i915_gem_inactive_shrink(struct shrinker *shrinker, struct shrink_control *sc)
Chris Wilson31169712009-09-14 16:50:28 +01003969{
Chris Wilson17250b72010-10-28 12:51:39 +01003970 struct drm_i915_private *dev_priv =
3971 container_of(shrinker,
3972 struct drm_i915_private,
3973 mm.inactive_shrinker);
3974 struct drm_device *dev = dev_priv->dev;
3975 struct drm_i915_gem_object *obj, *next;
Ying Han1495f232011-05-24 17:12:27 -07003976 int nr_to_scan = sc->nr_to_scan;
Chris Wilson17250b72010-10-28 12:51:39 +01003977 int cnt;
3978
3979 if (!mutex_trylock(&dev->struct_mutex))
Chris Wilsonbbe2e112010-10-28 22:35:07 +01003980 return 0;
Chris Wilson31169712009-09-14 16:50:28 +01003981
3982 /* "fast-path" to count number of available objects */
3983 if (nr_to_scan == 0) {
Chris Wilson17250b72010-10-28 12:51:39 +01003984 cnt = 0;
3985 list_for_each_entry(obj,
3986 &dev_priv->mm.inactive_list,
3987 mm_list)
3988 cnt++;
3989 mutex_unlock(&dev->struct_mutex);
3990 return cnt / 100 * sysctl_vfs_cache_pressure;
Chris Wilson31169712009-09-14 16:50:28 +01003991 }
3992
Chris Wilson1637ef42010-04-20 17:10:35 +01003993rescan:
Chris Wilson31169712009-09-14 16:50:28 +01003994 /* first scan for clean buffers */
Chris Wilson17250b72010-10-28 12:51:39 +01003995 i915_gem_retire_requests(dev);
Chris Wilson31169712009-09-14 16:50:28 +01003996
Chris Wilson17250b72010-10-28 12:51:39 +01003997 list_for_each_entry_safe(obj, next,
3998 &dev_priv->mm.inactive_list,
3999 mm_list) {
4000 if (i915_gem_object_is_purgeable(obj)) {
Chris Wilson20217462010-11-23 15:26:33 +00004001 if (i915_gem_object_unbind(obj) == 0 &&
4002 --nr_to_scan == 0)
Chris Wilson17250b72010-10-28 12:51:39 +01004003 break;
Chris Wilson31169712009-09-14 16:50:28 +01004004 }
Chris Wilson31169712009-09-14 16:50:28 +01004005 }
4006
4007 /* second pass, evict/count anything still on the inactive list */
Chris Wilson17250b72010-10-28 12:51:39 +01004008 cnt = 0;
4009 list_for_each_entry_safe(obj, next,
4010 &dev_priv->mm.inactive_list,
4011 mm_list) {
Chris Wilson20217462010-11-23 15:26:33 +00004012 if (nr_to_scan &&
4013 i915_gem_object_unbind(obj) == 0)
Chris Wilson17250b72010-10-28 12:51:39 +01004014 nr_to_scan--;
Chris Wilson20217462010-11-23 15:26:33 +00004015 else
Chris Wilson17250b72010-10-28 12:51:39 +01004016 cnt++;
Chris Wilson31169712009-09-14 16:50:28 +01004017 }
4018
Chris Wilson17250b72010-10-28 12:51:39 +01004019 if (nr_to_scan && i915_gpu_is_active(dev)) {
Chris Wilson1637ef42010-04-20 17:10:35 +01004020 /*
4021 * We are desperate for pages, so as a last resort, wait
4022 * for the GPU to finish and discard whatever we can.
4023		 * This dramatically reduces the number of OOM-killer
4024		 * events whilst running the GPU aggressively.
4025 */
Ben Widawskyb93f9cf2012-01-25 15:39:34 -08004026 if (i915_gpu_idle(dev, true) == 0)
Chris Wilson1637ef42010-04-20 17:10:35 +01004027 goto rescan;
4028 }
Chris Wilson17250b72010-10-28 12:51:39 +01004029 mutex_unlock(&dev->struct_mutex);
4030 return cnt / 100 * sysctl_vfs_cache_pressure;
Chris Wilson31169712009-09-14 16:50:28 +01004031}
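
/*
 * Aside on the shrinker protocol used above (the numbers are illustrative
 * assumptions): the core MM calls this hook with sc->nr_to_scan == 0 just
 * to ask how much could be freed, and with a non-zero nr_to_scan to do the
 * actual reclaim.  Both return paths scale the object count by
 * sysctl_vfs_cache_pressure, so with the default pressure of 100 and 300
 * objects on the inactive list the count phase reports
 * 300 / 100 * 100 = 300 potential victims.
 */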