blob: 6026817372da0cb024504f4af7a95ed4585cff1b [file] [log] [blame]
Eric Anholt673a3942008-07-30 12:06:12 -07001/*
2 * Copyright © 2008 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 * Authors:
24 * Eric Anholt <eric@anholt.net>
25 *
26 */
27
28#include "drmP.h"
29#include "drm.h"
30#include "i915_drm.h"
31#include "i915_drv.h"
Chris Wilson1c5d22f2009-08-25 11:15:50 +010032#include "i915_trace.h"
Jesse Barnes652c3932009-08-17 13:31:43 -070033#include "intel_drv.h"
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090034#include <linux/slab.h>
Eric Anholt673a3942008-07-30 12:06:12 -070035#include <linux/swap.h>
Jesse Barnes79e53942008-11-07 14:24:08 -080036#include <linux/pci.h>
Eric Anholt673a3942008-07-30 12:06:12 -070037
Chris Wilson88241782011-01-07 17:09:48 +000038static __must_check int i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *obj);
Chris Wilson05394f32010-11-08 19:18:58 +000039static void i915_gem_object_flush_gtt_write_domain(struct drm_i915_gem_object *obj);
40static void i915_gem_object_flush_cpu_write_domain(struct drm_i915_gem_object *obj);
Chris Wilson88241782011-01-07 17:09:48 +000041static __must_check int i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj,
42 bool write);
43static __must_check int i915_gem_object_set_cpu_read_domain_range(struct drm_i915_gem_object *obj,
44 uint64_t offset,
45 uint64_t size);
Chris Wilson05394f32010-11-08 19:18:58 +000046static void i915_gem_object_set_to_full_cpu_read_domain(struct drm_i915_gem_object *obj);
Chris Wilson88241782011-01-07 17:09:48 +000047static __must_check int i915_gem_object_bind_to_gtt(struct drm_i915_gem_object *obj,
48 unsigned alignment,
49 bool map_and_fenceable);
Chris Wilsond9e86c02010-11-10 16:40:20 +000050static void i915_gem_clear_fence_reg(struct drm_device *dev,
51 struct drm_i915_fence_reg *reg);
Chris Wilson05394f32010-11-08 19:18:58 +000052static int i915_gem_phys_pwrite(struct drm_device *dev,
53 struct drm_i915_gem_object *obj,
Dave Airlie71acb5e2008-12-30 20:31:46 +100054 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +000055 struct drm_file *file);
56static void i915_gem_free_object_tail(struct drm_i915_gem_object *obj);
Eric Anholt673a3942008-07-30 12:06:12 -070057
Chris Wilson17250b72010-10-28 12:51:39 +010058static int i915_gem_inactive_shrink(struct shrinker *shrinker,
Ying Han1495f232011-05-24 17:12:27 -070059 struct shrink_control *sc);
Chris Wilson31169712009-09-14 16:50:28 +010060
Chris Wilson73aa8082010-09-30 11:46:12 +010061/* some bookkeeping */
62static void i915_gem_info_add_obj(struct drm_i915_private *dev_priv,
63 size_t size)
64{
65 dev_priv->mm.object_count++;
66 dev_priv->mm.object_memory += size;
67}
68
69static void i915_gem_info_remove_obj(struct drm_i915_private *dev_priv,
70 size_t size)
71{
72 dev_priv->mm.object_count--;
73 dev_priv->mm.object_memory -= size;
74}
75
Chris Wilson21dd3732011-01-26 15:55:56 +000076static int
77i915_gem_wait_for_error(struct drm_device *dev)
Chris Wilson30dbf0c2010-09-25 10:19:17 +010078{
79 struct drm_i915_private *dev_priv = dev->dev_private;
80 struct completion *x = &dev_priv->error_completion;
81 unsigned long flags;
82 int ret;
83
84 if (!atomic_read(&dev_priv->mm.wedged))
85 return 0;
86
87 ret = wait_for_completion_interruptible(x);
88 if (ret)
89 return ret;
90
Chris Wilson21dd3732011-01-26 15:55:56 +000091 if (atomic_read(&dev_priv->mm.wedged)) {
92 /* GPU is hung, bump the completion count to account for
93 * the token we just consumed so that we never hit zero and
94 * end up waiting upon a subsequent completion event that
95 * will never happen.
96 */
97 spin_lock_irqsave(&x->wait.lock, flags);
98 x->done++;
99 spin_unlock_irqrestore(&x->wait.lock, flags);
100 }
101 return 0;
Chris Wilson30dbf0c2010-09-25 10:19:17 +0100102}
103
Chris Wilson54cf91d2010-11-25 18:00:26 +0000104int i915_mutex_lock_interruptible(struct drm_device *dev)
Chris Wilson76c1dec2010-09-25 11:22:51 +0100105{
Chris Wilson76c1dec2010-09-25 11:22:51 +0100106 int ret;
107
Chris Wilson21dd3732011-01-26 15:55:56 +0000108 ret = i915_gem_wait_for_error(dev);
Chris Wilson76c1dec2010-09-25 11:22:51 +0100109 if (ret)
110 return ret;
111
112 ret = mutex_lock_interruptible(&dev->struct_mutex);
113 if (ret)
114 return ret;
115
Chris Wilson23bc5982010-09-29 16:10:57 +0100116 WARN_ON(i915_verify_lists(dev));
Chris Wilson76c1dec2010-09-25 11:22:51 +0100117 return 0;
118}
Chris Wilson30dbf0c2010-09-25 10:19:17 +0100119
Chris Wilson7d1c4802010-08-07 21:45:03 +0100120static inline bool
Chris Wilson05394f32010-11-08 19:18:58 +0000121i915_gem_object_is_inactive(struct drm_i915_gem_object *obj)
Chris Wilson7d1c4802010-08-07 21:45:03 +0100122{
Chris Wilson05394f32010-11-08 19:18:58 +0000123 return obj->gtt_space && !obj->active && obj->pin_count == 0;
Chris Wilson7d1c4802010-08-07 21:45:03 +0100124}
125
Chris Wilson20217462010-11-23 15:26:33 +0000126void i915_gem_do_init(struct drm_device *dev,
127 unsigned long start,
128 unsigned long mappable_end,
129 unsigned long end)
Jesse Barnes79e53942008-11-07 14:24:08 -0800130{
131 drm_i915_private_t *dev_priv = dev->dev_private;
132
Chris Wilsonbee4a182011-01-21 10:54:32 +0000133 drm_mm_init(&dev_priv->mm.gtt_space, start, end - start);
Jesse Barnes79e53942008-11-07 14:24:08 -0800134
Chris Wilsonbee4a182011-01-21 10:54:32 +0000135 dev_priv->mm.gtt_start = start;
136 dev_priv->mm.gtt_mappable_end = mappable_end;
137 dev_priv->mm.gtt_end = end;
Chris Wilson73aa8082010-09-30 11:46:12 +0100138 dev_priv->mm.gtt_total = end - start;
Daniel Vetterfb7d5162010-10-01 22:05:20 +0200139 dev_priv->mm.mappable_gtt_total = min(end, mappable_end) - start;
Chris Wilsonbee4a182011-01-21 10:54:32 +0000140
141 /* Take over this portion of the GTT */
142 intel_gtt_clear_range(start / PAGE_SIZE, (end-start) / PAGE_SIZE);
Jesse Barnes79e53942008-11-07 14:24:08 -0800143}
Keith Packard6dbe2772008-10-14 21:41:13 -0700144
Eric Anholt673a3942008-07-30 12:06:12 -0700145int
146i915_gem_init_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +0000147 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700148{
Eric Anholt673a3942008-07-30 12:06:12 -0700149 struct drm_i915_gem_init *args = data;
Chris Wilson20217462010-11-23 15:26:33 +0000150
151 if (args->gtt_start >= args->gtt_end ||
152 (args->gtt_end | args->gtt_start) & (PAGE_SIZE - 1))
153 return -EINVAL;
Eric Anholt673a3942008-07-30 12:06:12 -0700154
155 mutex_lock(&dev->struct_mutex);
Chris Wilson20217462010-11-23 15:26:33 +0000156 i915_gem_do_init(dev, args->gtt_start, args->gtt_end, args->gtt_end);
Eric Anholt673a3942008-07-30 12:06:12 -0700157 mutex_unlock(&dev->struct_mutex);
158
Chris Wilson20217462010-11-23 15:26:33 +0000159 return 0;
Eric Anholt673a3942008-07-30 12:06:12 -0700160}
161
Eric Anholt5a125c32008-10-22 21:40:13 -0700162int
163i915_gem_get_aperture_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +0000164 struct drm_file *file)
Eric Anholt5a125c32008-10-22 21:40:13 -0700165{
Chris Wilson73aa8082010-09-30 11:46:12 +0100166 struct drm_i915_private *dev_priv = dev->dev_private;
Eric Anholt5a125c32008-10-22 21:40:13 -0700167 struct drm_i915_gem_get_aperture *args = data;
Chris Wilson6299f992010-11-24 12:23:44 +0000168 struct drm_i915_gem_object *obj;
169 size_t pinned;
Eric Anholt5a125c32008-10-22 21:40:13 -0700170
171 if (!(dev->driver->driver_features & DRIVER_GEM))
172 return -ENODEV;
173
Chris Wilson6299f992010-11-24 12:23:44 +0000174 pinned = 0;
Chris Wilson73aa8082010-09-30 11:46:12 +0100175 mutex_lock(&dev->struct_mutex);
Chris Wilson6299f992010-11-24 12:23:44 +0000176 list_for_each_entry(obj, &dev_priv->mm.pinned_list, mm_list)
177 pinned += obj->gtt_space->size;
Chris Wilson73aa8082010-09-30 11:46:12 +0100178 mutex_unlock(&dev->struct_mutex);
Eric Anholt5a125c32008-10-22 21:40:13 -0700179
Chris Wilson6299f992010-11-24 12:23:44 +0000180 args->aper_size = dev_priv->mm.gtt_total;
181 args->aper_available_size = args->aper_size -pinned;
182
Eric Anholt5a125c32008-10-22 21:40:13 -0700183 return 0;
184}
185
Dave Airlieff72145b2011-02-07 12:16:14 +1000186static int
187i915_gem_create(struct drm_file *file,
188 struct drm_device *dev,
189 uint64_t size,
190 uint32_t *handle_p)
Eric Anholt673a3942008-07-30 12:06:12 -0700191{
Chris Wilson05394f32010-11-08 19:18:58 +0000192 struct drm_i915_gem_object *obj;
Pekka Paalanena1a2d1d2009-08-23 12:40:55 +0300193 int ret;
194 u32 handle;
Eric Anholt673a3942008-07-30 12:06:12 -0700195
Dave Airlieff72145b2011-02-07 12:16:14 +1000196 size = roundup(size, PAGE_SIZE);
Eric Anholt673a3942008-07-30 12:06:12 -0700197
198 /* Allocate the new object */
Dave Airlieff72145b2011-02-07 12:16:14 +1000199 obj = i915_gem_alloc_object(dev, size);
Eric Anholt673a3942008-07-30 12:06:12 -0700200 if (obj == NULL)
201 return -ENOMEM;
202
Chris Wilson05394f32010-11-08 19:18:58 +0000203 ret = drm_gem_handle_create(file, &obj->base, &handle);
Chris Wilson1dfd9752010-09-06 14:44:14 +0100204 if (ret) {
Chris Wilson05394f32010-11-08 19:18:58 +0000205 drm_gem_object_release(&obj->base);
206 i915_gem_info_remove_obj(dev->dev_private, obj->base.size);
Chris Wilson202f2fe2010-10-14 13:20:40 +0100207 kfree(obj);
Eric Anholt673a3942008-07-30 12:06:12 -0700208 return ret;
Chris Wilson1dfd9752010-09-06 14:44:14 +0100209 }
210
Chris Wilson202f2fe2010-10-14 13:20:40 +0100211 /* drop reference from allocate - handle holds it now */
Chris Wilson05394f32010-11-08 19:18:58 +0000212 drm_gem_object_unreference(&obj->base);
Chris Wilson202f2fe2010-10-14 13:20:40 +0100213 trace_i915_gem_object_create(obj);
214
Dave Airlieff72145b2011-02-07 12:16:14 +1000215 *handle_p = handle;
Eric Anholt673a3942008-07-30 12:06:12 -0700216 return 0;
217}
218
Dave Airlieff72145b2011-02-07 12:16:14 +1000219int
220i915_gem_dumb_create(struct drm_file *file,
221 struct drm_device *dev,
222 struct drm_mode_create_dumb *args)
223{
224 /* have to work out size/pitch and return them */
Chris Wilsoned0291f2011-03-19 08:21:45 +0000225 args->pitch = ALIGN(args->width * ((args->bpp + 7) / 8), 64);
Dave Airlieff72145b2011-02-07 12:16:14 +1000226 args->size = args->pitch * args->height;
227 return i915_gem_create(file, dev,
228 args->size, &args->handle);
229}
230
231int i915_gem_dumb_destroy(struct drm_file *file,
232 struct drm_device *dev,
233 uint32_t handle)
234{
235 return drm_gem_handle_delete(file, handle);
236}
237
238/**
239 * Creates a new mm object and returns a handle to it.
240 */
241int
242i915_gem_create_ioctl(struct drm_device *dev, void *data,
243 struct drm_file *file)
244{
245 struct drm_i915_gem_create *args = data;
246 return i915_gem_create(file, dev,
247 args->size, &args->handle);
248}
249
Chris Wilson05394f32010-11-08 19:18:58 +0000250static int i915_gem_object_needs_bit17_swizzle(struct drm_i915_gem_object *obj)
Eric Anholt280b7132009-03-12 16:56:27 -0700251{
Chris Wilson05394f32010-11-08 19:18:58 +0000252 drm_i915_private_t *dev_priv = obj->base.dev->dev_private;
Eric Anholt280b7132009-03-12 16:56:27 -0700253
254 return dev_priv->mm.bit_6_swizzle_x == I915_BIT_6_SWIZZLE_9_10_17 &&
Chris Wilson05394f32010-11-08 19:18:58 +0000255 obj->tiling_mode != I915_TILING_NONE;
Eric Anholt280b7132009-03-12 16:56:27 -0700256}
257
Chris Wilson99a03df2010-05-27 14:15:34 +0100258static inline void
Eric Anholt40123c12009-03-09 13:42:30 -0700259slow_shmem_copy(struct page *dst_page,
260 int dst_offset,
261 struct page *src_page,
262 int src_offset,
263 int length)
264{
265 char *dst_vaddr, *src_vaddr;
266
Chris Wilson99a03df2010-05-27 14:15:34 +0100267 dst_vaddr = kmap(dst_page);
268 src_vaddr = kmap(src_page);
Eric Anholt40123c12009-03-09 13:42:30 -0700269
270 memcpy(dst_vaddr + dst_offset, src_vaddr + src_offset, length);
271
Chris Wilson99a03df2010-05-27 14:15:34 +0100272 kunmap(src_page);
273 kunmap(dst_page);
Eric Anholt40123c12009-03-09 13:42:30 -0700274}
275
Chris Wilson99a03df2010-05-27 14:15:34 +0100276static inline void
Eric Anholt280b7132009-03-12 16:56:27 -0700277slow_shmem_bit17_copy(struct page *gpu_page,
278 int gpu_offset,
279 struct page *cpu_page,
280 int cpu_offset,
281 int length,
282 int is_read)
283{
284 char *gpu_vaddr, *cpu_vaddr;
285
286 /* Use the unswizzled path if this page isn't affected. */
287 if ((page_to_phys(gpu_page) & (1 << 17)) == 0) {
288 if (is_read)
289 return slow_shmem_copy(cpu_page, cpu_offset,
290 gpu_page, gpu_offset, length);
291 else
292 return slow_shmem_copy(gpu_page, gpu_offset,
293 cpu_page, cpu_offset, length);
294 }
295
Chris Wilson99a03df2010-05-27 14:15:34 +0100296 gpu_vaddr = kmap(gpu_page);
297 cpu_vaddr = kmap(cpu_page);
Eric Anholt280b7132009-03-12 16:56:27 -0700298
299 /* Copy the data, XORing A6 with A17 (1). The user already knows he's
300 * XORing with the other bits (A9 for Y, A9 and A10 for X)
301 */
302 while (length > 0) {
303 int cacheline_end = ALIGN(gpu_offset + 1, 64);
304 int this_length = min(cacheline_end - gpu_offset, length);
305 int swizzled_gpu_offset = gpu_offset ^ 64;
306
307 if (is_read) {
308 memcpy(cpu_vaddr + cpu_offset,
309 gpu_vaddr + swizzled_gpu_offset,
310 this_length);
311 } else {
312 memcpy(gpu_vaddr + swizzled_gpu_offset,
313 cpu_vaddr + cpu_offset,
314 this_length);
315 }
316 cpu_offset += this_length;
317 gpu_offset += this_length;
318 length -= this_length;
319 }
320
Chris Wilson99a03df2010-05-27 14:15:34 +0100321 kunmap(cpu_page);
322 kunmap(gpu_page);
Eric Anholt280b7132009-03-12 16:56:27 -0700323}
324
Eric Anholt673a3942008-07-30 12:06:12 -0700325/**
Eric Anholteb014592009-03-10 11:44:52 -0700326 * This is the fast shmem pread path, which attempts to copy_from_user directly
327 * from the backing pages of the object to the user's address space. On a
328 * fault, it fails so we can fall back to i915_gem_shmem_pwrite_slow().
329 */
330static int
Chris Wilson05394f32010-11-08 19:18:58 +0000331i915_gem_shmem_pread_fast(struct drm_device *dev,
332 struct drm_i915_gem_object *obj,
Eric Anholteb014592009-03-10 11:44:52 -0700333 struct drm_i915_gem_pread *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000334 struct drm_file *file)
Eric Anholteb014592009-03-10 11:44:52 -0700335{
Chris Wilson05394f32010-11-08 19:18:58 +0000336 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Eric Anholteb014592009-03-10 11:44:52 -0700337 ssize_t remain;
Chris Wilsone5281cc2010-10-28 13:45:36 +0100338 loff_t offset;
Eric Anholteb014592009-03-10 11:44:52 -0700339 char __user *user_data;
340 int page_offset, page_length;
Eric Anholteb014592009-03-10 11:44:52 -0700341
342 user_data = (char __user *) (uintptr_t) args->data_ptr;
343 remain = args->size;
344
Eric Anholteb014592009-03-10 11:44:52 -0700345 offset = args->offset;
346
347 while (remain > 0) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100348 struct page *page;
349 char *vaddr;
350 int ret;
351
Eric Anholteb014592009-03-10 11:44:52 -0700352 /* Operation in this page
353 *
Eric Anholteb014592009-03-10 11:44:52 -0700354 * page_offset = offset within page
355 * page_length = bytes to copy for this page
356 */
Chris Wilsonc8cbbb82011-05-12 22:17:11 +0100357 page_offset = offset_in_page(offset);
Eric Anholteb014592009-03-10 11:44:52 -0700358 page_length = remain;
359 if ((page_offset + remain) > PAGE_SIZE)
360 page_length = PAGE_SIZE - page_offset;
361
Chris Wilsone5281cc2010-10-28 13:45:36 +0100362 page = read_cache_page_gfp(mapping, offset >> PAGE_SHIFT,
363 GFP_HIGHUSER | __GFP_RECLAIMABLE);
364 if (IS_ERR(page))
365 return PTR_ERR(page);
366
367 vaddr = kmap_atomic(page);
368 ret = __copy_to_user_inatomic(user_data,
369 vaddr + page_offset,
370 page_length);
371 kunmap_atomic(vaddr);
372
373 mark_page_accessed(page);
374 page_cache_release(page);
375 if (ret)
Chris Wilson4f27b752010-10-14 15:26:45 +0100376 return -EFAULT;
Eric Anholteb014592009-03-10 11:44:52 -0700377
378 remain -= page_length;
379 user_data += page_length;
380 offset += page_length;
381 }
382
Chris Wilson4f27b752010-10-14 15:26:45 +0100383 return 0;
Eric Anholteb014592009-03-10 11:44:52 -0700384}
385
386/**
387 * This is the fallback shmem pread path, which allocates temporary storage
388 * in kernel space to copy_to_user into outside of the struct_mutex, so we
389 * can copy out of the object's backing pages while holding the struct mutex
390 * and not take page faults.
391 */
392static int
Chris Wilson05394f32010-11-08 19:18:58 +0000393i915_gem_shmem_pread_slow(struct drm_device *dev,
394 struct drm_i915_gem_object *obj,
Eric Anholteb014592009-03-10 11:44:52 -0700395 struct drm_i915_gem_pread *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000396 struct drm_file *file)
Eric Anholteb014592009-03-10 11:44:52 -0700397{
Chris Wilson05394f32010-11-08 19:18:58 +0000398 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Eric Anholteb014592009-03-10 11:44:52 -0700399 struct mm_struct *mm = current->mm;
400 struct page **user_pages;
401 ssize_t remain;
402 loff_t offset, pinned_pages, i;
403 loff_t first_data_page, last_data_page, num_pages;
Chris Wilsone5281cc2010-10-28 13:45:36 +0100404 int shmem_page_offset;
405 int data_page_index, data_page_offset;
Eric Anholteb014592009-03-10 11:44:52 -0700406 int page_length;
407 int ret;
408 uint64_t data_ptr = args->data_ptr;
Eric Anholt280b7132009-03-12 16:56:27 -0700409 int do_bit17_swizzling;
Eric Anholteb014592009-03-10 11:44:52 -0700410
411 remain = args->size;
412
413 /* Pin the user pages containing the data. We can't fault while
414 * holding the struct mutex, yet we want to hold it while
415 * dereferencing the user data.
416 */
417 first_data_page = data_ptr / PAGE_SIZE;
418 last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
419 num_pages = last_data_page - first_data_page + 1;
420
Chris Wilson4f27b752010-10-14 15:26:45 +0100421 user_pages = drm_malloc_ab(num_pages, sizeof(struct page *));
Eric Anholteb014592009-03-10 11:44:52 -0700422 if (user_pages == NULL)
423 return -ENOMEM;
424
Chris Wilson4f27b752010-10-14 15:26:45 +0100425 mutex_unlock(&dev->struct_mutex);
Eric Anholteb014592009-03-10 11:44:52 -0700426 down_read(&mm->mmap_sem);
427 pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
Eric Anholte5e9ecd2009-04-07 16:01:22 -0700428 num_pages, 1, 0, user_pages, NULL);
Eric Anholteb014592009-03-10 11:44:52 -0700429 up_read(&mm->mmap_sem);
Chris Wilson4f27b752010-10-14 15:26:45 +0100430 mutex_lock(&dev->struct_mutex);
Eric Anholteb014592009-03-10 11:44:52 -0700431 if (pinned_pages < num_pages) {
432 ret = -EFAULT;
Chris Wilson4f27b752010-10-14 15:26:45 +0100433 goto out;
Eric Anholteb014592009-03-10 11:44:52 -0700434 }
435
Chris Wilson4f27b752010-10-14 15:26:45 +0100436 ret = i915_gem_object_set_cpu_read_domain_range(obj,
437 args->offset,
Eric Anholteb014592009-03-10 11:44:52 -0700438 args->size);
Chris Wilson4f27b752010-10-14 15:26:45 +0100439 if (ret)
440 goto out;
441
442 do_bit17_swizzling = i915_gem_object_needs_bit17_swizzle(obj);
Eric Anholteb014592009-03-10 11:44:52 -0700443
Eric Anholteb014592009-03-10 11:44:52 -0700444 offset = args->offset;
445
446 while (remain > 0) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100447 struct page *page;
448
Eric Anholteb014592009-03-10 11:44:52 -0700449 /* Operation in this page
450 *
Eric Anholteb014592009-03-10 11:44:52 -0700451 * shmem_page_offset = offset within page in shmem file
452 * data_page_index = page number in get_user_pages return
453 * data_page_offset = offset with data_page_index page.
454 * page_length = bytes to copy for this page
455 */
Chris Wilsonc8cbbb82011-05-12 22:17:11 +0100456 shmem_page_offset = offset_in_page(offset);
Eric Anholteb014592009-03-10 11:44:52 -0700457 data_page_index = data_ptr / PAGE_SIZE - first_data_page;
Chris Wilsonc8cbbb82011-05-12 22:17:11 +0100458 data_page_offset = offset_in_page(data_ptr);
Eric Anholteb014592009-03-10 11:44:52 -0700459
460 page_length = remain;
461 if ((shmem_page_offset + page_length) > PAGE_SIZE)
462 page_length = PAGE_SIZE - shmem_page_offset;
463 if ((data_page_offset + page_length) > PAGE_SIZE)
464 page_length = PAGE_SIZE - data_page_offset;
465
Chris Wilsone5281cc2010-10-28 13:45:36 +0100466 page = read_cache_page_gfp(mapping, offset >> PAGE_SHIFT,
467 GFP_HIGHUSER | __GFP_RECLAIMABLE);
Jesper Juhlb65552f2011-06-12 20:53:44 +0000468 if (IS_ERR(page)) {
469 ret = PTR_ERR(page);
470 goto out;
471 }
Chris Wilsone5281cc2010-10-28 13:45:36 +0100472
Eric Anholt280b7132009-03-12 16:56:27 -0700473 if (do_bit17_swizzling) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100474 slow_shmem_bit17_copy(page,
Eric Anholt280b7132009-03-12 16:56:27 -0700475 shmem_page_offset,
Chris Wilson99a03df2010-05-27 14:15:34 +0100476 user_pages[data_page_index],
477 data_page_offset,
478 page_length,
479 1);
480 } else {
481 slow_shmem_copy(user_pages[data_page_index],
482 data_page_offset,
Chris Wilsone5281cc2010-10-28 13:45:36 +0100483 page,
Chris Wilson99a03df2010-05-27 14:15:34 +0100484 shmem_page_offset,
485 page_length);
Eric Anholt280b7132009-03-12 16:56:27 -0700486 }
Eric Anholteb014592009-03-10 11:44:52 -0700487
Chris Wilsone5281cc2010-10-28 13:45:36 +0100488 mark_page_accessed(page);
489 page_cache_release(page);
490
Eric Anholteb014592009-03-10 11:44:52 -0700491 remain -= page_length;
492 data_ptr += page_length;
493 offset += page_length;
494 }
495
Chris Wilson4f27b752010-10-14 15:26:45 +0100496out:
Eric Anholteb014592009-03-10 11:44:52 -0700497 for (i = 0; i < pinned_pages; i++) {
498 SetPageDirty(user_pages[i]);
Chris Wilsone5281cc2010-10-28 13:45:36 +0100499 mark_page_accessed(user_pages[i]);
Eric Anholteb014592009-03-10 11:44:52 -0700500 page_cache_release(user_pages[i]);
501 }
Jesse Barnes8e7d2b22009-05-08 16:13:25 -0700502 drm_free_large(user_pages);
Eric Anholteb014592009-03-10 11:44:52 -0700503
504 return ret;
505}
506
Eric Anholt673a3942008-07-30 12:06:12 -0700507/**
508 * Reads data from the object referenced by handle.
509 *
510 * On error, the contents of *data are undefined.
511 */
512int
513i915_gem_pread_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +0000514 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700515{
516 struct drm_i915_gem_pread *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +0000517 struct drm_i915_gem_object *obj;
Chris Wilson35b62a82010-09-26 20:23:38 +0100518 int ret = 0;
Eric Anholt673a3942008-07-30 12:06:12 -0700519
Chris Wilson51311d02010-11-17 09:10:42 +0000520 if (args->size == 0)
521 return 0;
522
523 if (!access_ok(VERIFY_WRITE,
524 (char __user *)(uintptr_t)args->data_ptr,
525 args->size))
526 return -EFAULT;
527
528 ret = fault_in_pages_writeable((char __user *)(uintptr_t)args->data_ptr,
529 args->size);
530 if (ret)
531 return -EFAULT;
532
Chris Wilson4f27b752010-10-14 15:26:45 +0100533 ret = i915_mutex_lock_interruptible(dev);
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100534 if (ret)
Chris Wilson4f27b752010-10-14 15:26:45 +0100535 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -0700536
Chris Wilson05394f32010-11-08 19:18:58 +0000537 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +0000538 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100539 ret = -ENOENT;
540 goto unlock;
Chris Wilson4f27b752010-10-14 15:26:45 +0100541 }
Eric Anholt673a3942008-07-30 12:06:12 -0700542
Chris Wilson7dcd2492010-09-26 20:21:44 +0100543 /* Bounds check source. */
Chris Wilson05394f32010-11-08 19:18:58 +0000544 if (args->offset > obj->base.size ||
545 args->size > obj->base.size - args->offset) {
Chris Wilsonce9d4192010-09-26 20:50:05 +0100546 ret = -EINVAL;
Chris Wilson35b62a82010-09-26 20:23:38 +0100547 goto out;
Chris Wilsonce9d4192010-09-26 20:50:05 +0100548 }
549
Chris Wilsondb53a302011-02-03 11:57:46 +0000550 trace_i915_gem_object_pread(obj, args->offset, args->size);
551
Chris Wilson4f27b752010-10-14 15:26:45 +0100552 ret = i915_gem_object_set_cpu_read_domain_range(obj,
553 args->offset,
554 args->size);
555 if (ret)
Chris Wilsone5281cc2010-10-28 13:45:36 +0100556 goto out;
Chris Wilson4f27b752010-10-14 15:26:45 +0100557
558 ret = -EFAULT;
559 if (!i915_gem_object_needs_bit17_swizzle(obj))
Chris Wilson05394f32010-11-08 19:18:58 +0000560 ret = i915_gem_shmem_pread_fast(dev, obj, args, file);
Chris Wilson4f27b752010-10-14 15:26:45 +0100561 if (ret == -EFAULT)
Chris Wilson05394f32010-11-08 19:18:58 +0000562 ret = i915_gem_shmem_pread_slow(dev, obj, args, file);
Eric Anholt673a3942008-07-30 12:06:12 -0700563
Chris Wilson35b62a82010-09-26 20:23:38 +0100564out:
Chris Wilson05394f32010-11-08 19:18:58 +0000565 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100566unlock:
Chris Wilson4f27b752010-10-14 15:26:45 +0100567 mutex_unlock(&dev->struct_mutex);
Eric Anholteb014592009-03-10 11:44:52 -0700568 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -0700569}
570
Keith Packard0839ccb2008-10-30 19:38:48 -0700571/* This is the fast write path which cannot handle
572 * page faults in the source data
Linus Torvalds9b7530cc2008-10-20 14:16:43 -0700573 */
Linus Torvalds9b7530cc2008-10-20 14:16:43 -0700574
Keith Packard0839ccb2008-10-30 19:38:48 -0700575static inline int
576fast_user_write(struct io_mapping *mapping,
577 loff_t page_base, int page_offset,
578 char __user *user_data,
579 int length)
580{
581 char *vaddr_atomic;
582 unsigned long unwritten;
583
Peter Zijlstra3e4d3af2010-10-26 14:21:51 -0700584 vaddr_atomic = io_mapping_map_atomic_wc(mapping, page_base);
Keith Packard0839ccb2008-10-30 19:38:48 -0700585 unwritten = __copy_from_user_inatomic_nocache(vaddr_atomic + page_offset,
586 user_data, length);
Peter Zijlstra3e4d3af2010-10-26 14:21:51 -0700587 io_mapping_unmap_atomic(vaddr_atomic);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100588 return unwritten;
Keith Packard0839ccb2008-10-30 19:38:48 -0700589}
590
591/* Here's the write path which can sleep for
592 * page faults
593 */
594
Chris Wilsonab34c222010-05-27 14:15:35 +0100595static inline void
Eric Anholt3de09aa2009-03-09 09:42:23 -0700596slow_kernel_write(struct io_mapping *mapping,
597 loff_t gtt_base, int gtt_offset,
598 struct page *user_page, int user_offset,
599 int length)
Keith Packard0839ccb2008-10-30 19:38:48 -0700600{
Chris Wilsonab34c222010-05-27 14:15:35 +0100601 char __iomem *dst_vaddr;
602 char *src_vaddr;
Keith Packard0839ccb2008-10-30 19:38:48 -0700603
Chris Wilsonab34c222010-05-27 14:15:35 +0100604 dst_vaddr = io_mapping_map_wc(mapping, gtt_base);
605 src_vaddr = kmap(user_page);
606
607 memcpy_toio(dst_vaddr + gtt_offset,
608 src_vaddr + user_offset,
609 length);
610
611 kunmap(user_page);
612 io_mapping_unmap(dst_vaddr);
Linus Torvalds9b7530cc2008-10-20 14:16:43 -0700613}
614
Eric Anholt3de09aa2009-03-09 09:42:23 -0700615/**
616 * This is the fast pwrite path, where we copy the data directly from the
617 * user into the GTT, uncached.
618 */
Eric Anholt673a3942008-07-30 12:06:12 -0700619static int
Chris Wilson05394f32010-11-08 19:18:58 +0000620i915_gem_gtt_pwrite_fast(struct drm_device *dev,
621 struct drm_i915_gem_object *obj,
Eric Anholt3de09aa2009-03-09 09:42:23 -0700622 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000623 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700624{
Keith Packard0839ccb2008-10-30 19:38:48 -0700625 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -0700626 ssize_t remain;
Keith Packard0839ccb2008-10-30 19:38:48 -0700627 loff_t offset, page_base;
Eric Anholt673a3942008-07-30 12:06:12 -0700628 char __user *user_data;
Keith Packard0839ccb2008-10-30 19:38:48 -0700629 int page_offset, page_length;
Eric Anholt673a3942008-07-30 12:06:12 -0700630
631 user_data = (char __user *) (uintptr_t) args->data_ptr;
632 remain = args->size;
Eric Anholt673a3942008-07-30 12:06:12 -0700633
Chris Wilson05394f32010-11-08 19:18:58 +0000634 offset = obj->gtt_offset + args->offset;
Eric Anholt673a3942008-07-30 12:06:12 -0700635
636 while (remain > 0) {
637 /* Operation in this page
638 *
Keith Packard0839ccb2008-10-30 19:38:48 -0700639 * page_base = page offset within aperture
640 * page_offset = offset within page
641 * page_length = bytes to copy for this page
Eric Anholt673a3942008-07-30 12:06:12 -0700642 */
Chris Wilsonc8cbbb82011-05-12 22:17:11 +0100643 page_base = offset & PAGE_MASK;
644 page_offset = offset_in_page(offset);
Keith Packard0839ccb2008-10-30 19:38:48 -0700645 page_length = remain;
646 if ((page_offset + remain) > PAGE_SIZE)
647 page_length = PAGE_SIZE - page_offset;
Eric Anholt673a3942008-07-30 12:06:12 -0700648
Keith Packard0839ccb2008-10-30 19:38:48 -0700649 /* If we get a fault while copying data, then (presumably) our
Eric Anholt3de09aa2009-03-09 09:42:23 -0700650 * source page isn't available. Return the error and we'll
651 * retry in the slow path.
Keith Packard0839ccb2008-10-30 19:38:48 -0700652 */
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100653 if (fast_user_write(dev_priv->mm.gtt_mapping, page_base,
654 page_offset, user_data, page_length))
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100655 return -EFAULT;
Eric Anholt673a3942008-07-30 12:06:12 -0700656
Keith Packard0839ccb2008-10-30 19:38:48 -0700657 remain -= page_length;
658 user_data += page_length;
659 offset += page_length;
Eric Anholt673a3942008-07-30 12:06:12 -0700660 }
Eric Anholt673a3942008-07-30 12:06:12 -0700661
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100662 return 0;
Eric Anholt673a3942008-07-30 12:06:12 -0700663}
664
Eric Anholt3de09aa2009-03-09 09:42:23 -0700665/**
666 * This is the fallback GTT pwrite path, which uses get_user_pages to pin
667 * the memory and maps it using kmap_atomic for copying.
668 *
669 * This code resulted in x11perf -rgb10text consuming about 10% more CPU
670 * than using i915_gem_gtt_pwrite_fast on a G45 (32-bit).
671 */
Eric Anholt3043c602008-10-02 12:24:47 -0700672static int
Chris Wilson05394f32010-11-08 19:18:58 +0000673i915_gem_gtt_pwrite_slow(struct drm_device *dev,
674 struct drm_i915_gem_object *obj,
Eric Anholt3de09aa2009-03-09 09:42:23 -0700675 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000676 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700677{
Eric Anholt3de09aa2009-03-09 09:42:23 -0700678 drm_i915_private_t *dev_priv = dev->dev_private;
679 ssize_t remain;
680 loff_t gtt_page_base, offset;
681 loff_t first_data_page, last_data_page, num_pages;
682 loff_t pinned_pages, i;
683 struct page **user_pages;
684 struct mm_struct *mm = current->mm;
685 int gtt_page_offset, data_page_offset, data_page_index, page_length;
Eric Anholt673a3942008-07-30 12:06:12 -0700686 int ret;
Eric Anholt3de09aa2009-03-09 09:42:23 -0700687 uint64_t data_ptr = args->data_ptr;
688
689 remain = args->size;
690
691 /* Pin the user pages containing the data. We can't fault while
692 * holding the struct mutex, and all of the pwrite implementations
693 * want to hold it while dereferencing the user data.
694 */
695 first_data_page = data_ptr / PAGE_SIZE;
696 last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
697 num_pages = last_data_page - first_data_page + 1;
698
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100699 user_pages = drm_malloc_ab(num_pages, sizeof(struct page *));
Eric Anholt3de09aa2009-03-09 09:42:23 -0700700 if (user_pages == NULL)
701 return -ENOMEM;
702
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100703 mutex_unlock(&dev->struct_mutex);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700704 down_read(&mm->mmap_sem);
705 pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
706 num_pages, 0, 0, user_pages, NULL);
707 up_read(&mm->mmap_sem);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100708 mutex_lock(&dev->struct_mutex);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700709 if (pinned_pages < num_pages) {
710 ret = -EFAULT;
711 goto out_unpin_pages;
712 }
713
Chris Wilsond9e86c02010-11-10 16:40:20 +0000714 ret = i915_gem_object_set_to_gtt_domain(obj, true);
715 if (ret)
716 goto out_unpin_pages;
717
718 ret = i915_gem_object_put_fence(obj);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700719 if (ret)
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100720 goto out_unpin_pages;
Eric Anholt3de09aa2009-03-09 09:42:23 -0700721
Chris Wilson05394f32010-11-08 19:18:58 +0000722 offset = obj->gtt_offset + args->offset;
Eric Anholt3de09aa2009-03-09 09:42:23 -0700723
724 while (remain > 0) {
725 /* Operation in this page
726 *
727 * gtt_page_base = page offset within aperture
728 * gtt_page_offset = offset within page in aperture
729 * data_page_index = page number in get_user_pages return
730 * data_page_offset = offset with data_page_index page.
731 * page_length = bytes to copy for this page
732 */
733 gtt_page_base = offset & PAGE_MASK;
Chris Wilsonc8cbbb82011-05-12 22:17:11 +0100734 gtt_page_offset = offset_in_page(offset);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700735 data_page_index = data_ptr / PAGE_SIZE - first_data_page;
Chris Wilsonc8cbbb82011-05-12 22:17:11 +0100736 data_page_offset = offset_in_page(data_ptr);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700737
738 page_length = remain;
739 if ((gtt_page_offset + page_length) > PAGE_SIZE)
740 page_length = PAGE_SIZE - gtt_page_offset;
741 if ((data_page_offset + page_length) > PAGE_SIZE)
742 page_length = PAGE_SIZE - data_page_offset;
743
Chris Wilsonab34c222010-05-27 14:15:35 +0100744 slow_kernel_write(dev_priv->mm.gtt_mapping,
745 gtt_page_base, gtt_page_offset,
746 user_pages[data_page_index],
747 data_page_offset,
748 page_length);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700749
750 remain -= page_length;
751 offset += page_length;
752 data_ptr += page_length;
753 }
754
Eric Anholt3de09aa2009-03-09 09:42:23 -0700755out_unpin_pages:
756 for (i = 0; i < pinned_pages; i++)
757 page_cache_release(user_pages[i]);
Jesse Barnes8e7d2b22009-05-08 16:13:25 -0700758 drm_free_large(user_pages);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700759
760 return ret;
761}
762
Eric Anholt40123c12009-03-09 13:42:30 -0700763/**
764 * This is the fast shmem pwrite path, which attempts to directly
765 * copy_from_user into the kmapped pages backing the object.
766 */
Eric Anholt673a3942008-07-30 12:06:12 -0700767static int
Chris Wilson05394f32010-11-08 19:18:58 +0000768i915_gem_shmem_pwrite_fast(struct drm_device *dev,
769 struct drm_i915_gem_object *obj,
Eric Anholt40123c12009-03-09 13:42:30 -0700770 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000771 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700772{
Chris Wilson05394f32010-11-08 19:18:58 +0000773 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Eric Anholt40123c12009-03-09 13:42:30 -0700774 ssize_t remain;
Chris Wilsone5281cc2010-10-28 13:45:36 +0100775 loff_t offset;
Eric Anholt40123c12009-03-09 13:42:30 -0700776 char __user *user_data;
777 int page_offset, page_length;
Eric Anholt40123c12009-03-09 13:42:30 -0700778
779 user_data = (char __user *) (uintptr_t) args->data_ptr;
780 remain = args->size;
Eric Anholt673a3942008-07-30 12:06:12 -0700781
Eric Anholt673a3942008-07-30 12:06:12 -0700782 offset = args->offset;
Chris Wilson05394f32010-11-08 19:18:58 +0000783 obj->dirty = 1;
Eric Anholt673a3942008-07-30 12:06:12 -0700784
Eric Anholt40123c12009-03-09 13:42:30 -0700785 while (remain > 0) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100786 struct page *page;
787 char *vaddr;
788 int ret;
789
Eric Anholt40123c12009-03-09 13:42:30 -0700790 /* Operation in this page
791 *
Eric Anholt40123c12009-03-09 13:42:30 -0700792 * page_offset = offset within page
793 * page_length = bytes to copy for this page
794 */
Chris Wilsonc8cbbb82011-05-12 22:17:11 +0100795 page_offset = offset_in_page(offset);
Eric Anholt40123c12009-03-09 13:42:30 -0700796 page_length = remain;
797 if ((page_offset + remain) > PAGE_SIZE)
798 page_length = PAGE_SIZE - page_offset;
799
Chris Wilsone5281cc2010-10-28 13:45:36 +0100800 page = read_cache_page_gfp(mapping, offset >> PAGE_SHIFT,
801 GFP_HIGHUSER | __GFP_RECLAIMABLE);
802 if (IS_ERR(page))
803 return PTR_ERR(page);
804
805 vaddr = kmap_atomic(page, KM_USER0);
806 ret = __copy_from_user_inatomic(vaddr + page_offset,
807 user_data,
808 page_length);
809 kunmap_atomic(vaddr, KM_USER0);
810
811 set_page_dirty(page);
812 mark_page_accessed(page);
813 page_cache_release(page);
814
815 /* If we get a fault while copying data, then (presumably) our
816 * source page isn't available. Return the error and we'll
817 * retry in the slow path.
818 */
819 if (ret)
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100820 return -EFAULT;
Eric Anholt40123c12009-03-09 13:42:30 -0700821
822 remain -= page_length;
823 user_data += page_length;
824 offset += page_length;
Eric Anholt673a3942008-07-30 12:06:12 -0700825 }
826
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100827 return 0;
Eric Anholt40123c12009-03-09 13:42:30 -0700828}
829
830/**
831 * This is the fallback shmem pwrite path, which uses get_user_pages to pin
832 * the memory and maps it using kmap_atomic for copying.
833 *
834 * This avoids taking mmap_sem for faulting on the user's address while the
835 * struct_mutex is held.
836 */
837static int
Chris Wilson05394f32010-11-08 19:18:58 +0000838i915_gem_shmem_pwrite_slow(struct drm_device *dev,
839 struct drm_i915_gem_object *obj,
Eric Anholt40123c12009-03-09 13:42:30 -0700840 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000841 struct drm_file *file)
Eric Anholt40123c12009-03-09 13:42:30 -0700842{
Chris Wilson05394f32010-11-08 19:18:58 +0000843 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Eric Anholt40123c12009-03-09 13:42:30 -0700844 struct mm_struct *mm = current->mm;
845 struct page **user_pages;
846 ssize_t remain;
847 loff_t offset, pinned_pages, i;
848 loff_t first_data_page, last_data_page, num_pages;
Chris Wilsone5281cc2010-10-28 13:45:36 +0100849 int shmem_page_offset;
Eric Anholt40123c12009-03-09 13:42:30 -0700850 int data_page_index, data_page_offset;
851 int page_length;
852 int ret;
853 uint64_t data_ptr = args->data_ptr;
Eric Anholt280b7132009-03-12 16:56:27 -0700854 int do_bit17_swizzling;
Eric Anholt40123c12009-03-09 13:42:30 -0700855
856 remain = args->size;
857
858 /* Pin the user pages containing the data. We can't fault while
859 * holding the struct mutex, and all of the pwrite implementations
860 * want to hold it while dereferencing the user data.
861 */
862 first_data_page = data_ptr / PAGE_SIZE;
863 last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
864 num_pages = last_data_page - first_data_page + 1;
865
Chris Wilson4f27b752010-10-14 15:26:45 +0100866 user_pages = drm_malloc_ab(num_pages, sizeof(struct page *));
Eric Anholt40123c12009-03-09 13:42:30 -0700867 if (user_pages == NULL)
868 return -ENOMEM;
869
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100870 mutex_unlock(&dev->struct_mutex);
Eric Anholt40123c12009-03-09 13:42:30 -0700871 down_read(&mm->mmap_sem);
872 pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
873 num_pages, 0, 0, user_pages, NULL);
874 up_read(&mm->mmap_sem);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100875 mutex_lock(&dev->struct_mutex);
Eric Anholt40123c12009-03-09 13:42:30 -0700876 if (pinned_pages < num_pages) {
877 ret = -EFAULT;
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100878 goto out;
Eric Anholt40123c12009-03-09 13:42:30 -0700879 }
880
Eric Anholt40123c12009-03-09 13:42:30 -0700881 ret = i915_gem_object_set_to_cpu_domain(obj, 1);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100882 if (ret)
883 goto out;
884
885 do_bit17_swizzling = i915_gem_object_needs_bit17_swizzle(obj);
Eric Anholt40123c12009-03-09 13:42:30 -0700886
Eric Anholt40123c12009-03-09 13:42:30 -0700887 offset = args->offset;
Chris Wilson05394f32010-11-08 19:18:58 +0000888 obj->dirty = 1;
Eric Anholt40123c12009-03-09 13:42:30 -0700889
890 while (remain > 0) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100891 struct page *page;
892
Eric Anholt40123c12009-03-09 13:42:30 -0700893 /* Operation in this page
894 *
Eric Anholt40123c12009-03-09 13:42:30 -0700895 * shmem_page_offset = offset within page in shmem file
896 * data_page_index = page number in get_user_pages return
897 * data_page_offset = offset with data_page_index page.
898 * page_length = bytes to copy for this page
899 */
Chris Wilsonc8cbbb82011-05-12 22:17:11 +0100900 shmem_page_offset = offset_in_page(offset);
Eric Anholt40123c12009-03-09 13:42:30 -0700901 data_page_index = data_ptr / PAGE_SIZE - first_data_page;
Chris Wilsonc8cbbb82011-05-12 22:17:11 +0100902 data_page_offset = offset_in_page(data_ptr);
Eric Anholt40123c12009-03-09 13:42:30 -0700903
904 page_length = remain;
905 if ((shmem_page_offset + page_length) > PAGE_SIZE)
906 page_length = PAGE_SIZE - shmem_page_offset;
907 if ((data_page_offset + page_length) > PAGE_SIZE)
908 page_length = PAGE_SIZE - data_page_offset;
909
Chris Wilsone5281cc2010-10-28 13:45:36 +0100910 page = read_cache_page_gfp(mapping, offset >> PAGE_SHIFT,
911 GFP_HIGHUSER | __GFP_RECLAIMABLE);
912 if (IS_ERR(page)) {
913 ret = PTR_ERR(page);
914 goto out;
915 }
916
Eric Anholt280b7132009-03-12 16:56:27 -0700917 if (do_bit17_swizzling) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100918 slow_shmem_bit17_copy(page,
Eric Anholt280b7132009-03-12 16:56:27 -0700919 shmem_page_offset,
920 user_pages[data_page_index],
921 data_page_offset,
Chris Wilson99a03df2010-05-27 14:15:34 +0100922 page_length,
923 0);
924 } else {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100925 slow_shmem_copy(page,
Chris Wilson99a03df2010-05-27 14:15:34 +0100926 shmem_page_offset,
927 user_pages[data_page_index],
928 data_page_offset,
929 page_length);
Eric Anholt280b7132009-03-12 16:56:27 -0700930 }
Eric Anholt40123c12009-03-09 13:42:30 -0700931
Chris Wilsone5281cc2010-10-28 13:45:36 +0100932 set_page_dirty(page);
933 mark_page_accessed(page);
934 page_cache_release(page);
935
Eric Anholt40123c12009-03-09 13:42:30 -0700936 remain -= page_length;
937 data_ptr += page_length;
938 offset += page_length;
939 }
940
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100941out:
Eric Anholt40123c12009-03-09 13:42:30 -0700942 for (i = 0; i < pinned_pages; i++)
943 page_cache_release(user_pages[i]);
Jesse Barnes8e7d2b22009-05-08 16:13:25 -0700944 drm_free_large(user_pages);
Eric Anholt40123c12009-03-09 13:42:30 -0700945
946 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -0700947}
948
949/**
950 * Writes data to the object referenced by handle.
951 *
952 * On error, the contents of the buffer that were to be modified are undefined.
953 */
954int
955i915_gem_pwrite_ioctl(struct drm_device *dev, void *data,
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100956 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700957{
958 struct drm_i915_gem_pwrite *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +0000959 struct drm_i915_gem_object *obj;
Chris Wilson51311d02010-11-17 09:10:42 +0000960 int ret;
961
962 if (args->size == 0)
963 return 0;
964
965 if (!access_ok(VERIFY_READ,
966 (char __user *)(uintptr_t)args->data_ptr,
967 args->size))
968 return -EFAULT;
969
970 ret = fault_in_pages_readable((char __user *)(uintptr_t)args->data_ptr,
971 args->size);
972 if (ret)
973 return -EFAULT;
Eric Anholt673a3942008-07-30 12:06:12 -0700974
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100975 ret = i915_mutex_lock_interruptible(dev);
976 if (ret)
977 return ret;
978
Chris Wilson05394f32010-11-08 19:18:58 +0000979 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +0000980 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100981 ret = -ENOENT;
982 goto unlock;
983 }
Eric Anholt673a3942008-07-30 12:06:12 -0700984
Chris Wilson7dcd2492010-09-26 20:21:44 +0100985 /* Bounds check destination. */
Chris Wilson05394f32010-11-08 19:18:58 +0000986 if (args->offset > obj->base.size ||
987 args->size > obj->base.size - args->offset) {
Chris Wilsonce9d4192010-09-26 20:50:05 +0100988 ret = -EINVAL;
Chris Wilson35b62a82010-09-26 20:23:38 +0100989 goto out;
Chris Wilsonce9d4192010-09-26 20:50:05 +0100990 }
991
Chris Wilsondb53a302011-02-03 11:57:46 +0000992 trace_i915_gem_object_pwrite(obj, args->offset, args->size);
993
Eric Anholt673a3942008-07-30 12:06:12 -0700994 /* We can only do the GTT pwrite on untiled buffers, as otherwise
995 * it would end up going through the fenced access, and we'll get
996 * different detiling behavior between reading and writing.
997 * pread/pwrite currently are reading and writing from the CPU
998 * perspective, requiring manual detiling by the client.
999 */
Chris Wilson05394f32010-11-08 19:18:58 +00001000 if (obj->phys_obj)
Chris Wilsonfbd5a262010-10-14 15:03:58 +01001001 ret = i915_gem_phys_pwrite(dev, obj, args, file);
Chris Wilsond9e86c02010-11-10 16:40:20 +00001002 else if (obj->gtt_space &&
Chris Wilson05394f32010-11-08 19:18:58 +00001003 obj->base.write_domain != I915_GEM_DOMAIN_CPU) {
Daniel Vetter75e9e912010-11-04 17:11:09 +01001004 ret = i915_gem_object_pin(obj, 0, true);
Chris Wilsonfbd5a262010-10-14 15:03:58 +01001005 if (ret)
1006 goto out;
1007
Chris Wilsond9e86c02010-11-10 16:40:20 +00001008 ret = i915_gem_object_set_to_gtt_domain(obj, true);
1009 if (ret)
1010 goto out_unpin;
1011
1012 ret = i915_gem_object_put_fence(obj);
Chris Wilsonfbd5a262010-10-14 15:03:58 +01001013 if (ret)
1014 goto out_unpin;
1015
1016 ret = i915_gem_gtt_pwrite_fast(dev, obj, args, file);
1017 if (ret == -EFAULT)
1018 ret = i915_gem_gtt_pwrite_slow(dev, obj, args, file);
1019
1020out_unpin:
1021 i915_gem_object_unpin(obj);
Eric Anholt40123c12009-03-09 13:42:30 -07001022 } else {
Chris Wilsonfbd5a262010-10-14 15:03:58 +01001023 ret = i915_gem_object_set_to_cpu_domain(obj, 1);
1024 if (ret)
Chris Wilsone5281cc2010-10-28 13:45:36 +01001025 goto out;
Chris Wilsonfbd5a262010-10-14 15:03:58 +01001026
1027 ret = -EFAULT;
1028 if (!i915_gem_object_needs_bit17_swizzle(obj))
1029 ret = i915_gem_shmem_pwrite_fast(dev, obj, args, file);
1030 if (ret == -EFAULT)
1031 ret = i915_gem_shmem_pwrite_slow(dev, obj, args, file);
Eric Anholt40123c12009-03-09 13:42:30 -07001032 }
Eric Anholt673a3942008-07-30 12:06:12 -07001033
Chris Wilson35b62a82010-09-26 20:23:38 +01001034out:
Chris Wilson05394f32010-11-08 19:18:58 +00001035 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001036unlock:
Chris Wilsonfbd5a262010-10-14 15:03:58 +01001037 mutex_unlock(&dev->struct_mutex);
Eric Anholt673a3942008-07-30 12:06:12 -07001038 return ret;
1039}
1040
1041/**
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001042 * Called when user space prepares to use an object with the CPU, either
1043 * through the mmap ioctl's mapping or a GTT mapping.
Eric Anholt673a3942008-07-30 12:06:12 -07001044 */
1045int
1046i915_gem_set_domain_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00001047 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07001048{
1049 struct drm_i915_gem_set_domain *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00001050 struct drm_i915_gem_object *obj;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001051 uint32_t read_domains = args->read_domains;
1052 uint32_t write_domain = args->write_domain;
Eric Anholt673a3942008-07-30 12:06:12 -07001053 int ret;
1054
1055 if (!(dev->driver->driver_features & DRIVER_GEM))
1056 return -ENODEV;
1057
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001058 /* Only handle setting domains to types used by the CPU. */
Chris Wilson21d509e2009-06-06 09:46:02 +01001059 if (write_domain & I915_GEM_GPU_DOMAINS)
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001060 return -EINVAL;
1061
Chris Wilson21d509e2009-06-06 09:46:02 +01001062 if (read_domains & I915_GEM_GPU_DOMAINS)
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001063 return -EINVAL;
1064
1065 /* Having something in the write domain implies it's in the read
1066 * domain, and only that read domain. Enforce that in the request.
1067 */
1068 if (write_domain != 0 && read_domains != write_domain)
1069 return -EINVAL;
1070
Chris Wilson76c1dec2010-09-25 11:22:51 +01001071 ret = i915_mutex_lock_interruptible(dev);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001072 if (ret)
Chris Wilson76c1dec2010-09-25 11:22:51 +01001073 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07001074
Chris Wilson05394f32010-11-08 19:18:58 +00001075 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00001076 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001077 ret = -ENOENT;
1078 goto unlock;
Chris Wilson76c1dec2010-09-25 11:22:51 +01001079 }
Jesse Barnes652c3932009-08-17 13:31:43 -07001080
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001081 if (read_domains & I915_GEM_DOMAIN_GTT) {
1082 ret = i915_gem_object_set_to_gtt_domain(obj, write_domain != 0);
Eric Anholt02354392008-11-26 13:58:13 -08001083
1084 /* Silently promote "you're not bound, there was nothing to do"
1085 * to success, since the client was just asking us to
1086 * make sure everything was done.
1087 */
1088 if (ret == -EINVAL)
1089 ret = 0;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001090 } else {
Eric Anholte47c68e2008-11-14 13:35:19 -08001091 ret = i915_gem_object_set_to_cpu_domain(obj, write_domain != 0);
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001092 }
1093
Chris Wilson05394f32010-11-08 19:18:58 +00001094 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001095unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07001096 mutex_unlock(&dev->struct_mutex);
1097 return ret;
1098}
1099
1100/**
1101 * Called when user space has done writes to this buffer
1102 */
1103int
1104i915_gem_sw_finish_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00001105 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07001106{
1107 struct drm_i915_gem_sw_finish *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00001108 struct drm_i915_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07001109 int ret = 0;
1110
1111 if (!(dev->driver->driver_features & DRIVER_GEM))
1112 return -ENODEV;
1113
Chris Wilson76c1dec2010-09-25 11:22:51 +01001114 ret = i915_mutex_lock_interruptible(dev);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001115 if (ret)
Chris Wilson76c1dec2010-09-25 11:22:51 +01001116 return ret;
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001117
Chris Wilson05394f32010-11-08 19:18:58 +00001118 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00001119 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001120 ret = -ENOENT;
1121 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07001122 }
1123
Eric Anholt673a3942008-07-30 12:06:12 -07001124 /* Pinned buffers may be scanout, so flush the cache */
Chris Wilson05394f32010-11-08 19:18:58 +00001125 if (obj->pin_count)
Eric Anholte47c68e2008-11-14 13:35:19 -08001126 i915_gem_object_flush_cpu_write_domain(obj);
1127
Chris Wilson05394f32010-11-08 19:18:58 +00001128 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001129unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07001130 mutex_unlock(&dev->struct_mutex);
1131 return ret;
1132}
1133
1134/**
1135 * Maps the contents of an object, returning the address it is mapped
1136 * into.
1137 *
1138 * While the mapping holds a reference on the contents of the object, it doesn't
1139 * imply a ref on the object itself.
1140 */
1141int
1142i915_gem_mmap_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00001143 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07001144{
Chris Wilsonda761a62010-10-27 17:37:08 +01001145 struct drm_i915_private *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07001146 struct drm_i915_gem_mmap *args = data;
1147 struct drm_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07001148 unsigned long addr;
1149
1150 if (!(dev->driver->driver_features & DRIVER_GEM))
1151 return -ENODEV;
1152
Chris Wilson05394f32010-11-08 19:18:58 +00001153 obj = drm_gem_object_lookup(dev, file, args->handle);
Eric Anholt673a3942008-07-30 12:06:12 -07001154 if (obj == NULL)
Chris Wilsonbf79cb92010-08-04 14:19:46 +01001155 return -ENOENT;
Eric Anholt673a3942008-07-30 12:06:12 -07001156
Chris Wilsonda761a62010-10-27 17:37:08 +01001157 if (obj->size > dev_priv->mm.gtt_mappable_end) {
1158 drm_gem_object_unreference_unlocked(obj);
1159 return -E2BIG;
1160 }
1161
Eric Anholt673a3942008-07-30 12:06:12 -07001162 down_write(&current->mm->mmap_sem);
1163 addr = do_mmap(obj->filp, 0, args->size,
1164 PROT_READ | PROT_WRITE, MAP_SHARED,
1165 args->offset);
1166 up_write(&current->mm->mmap_sem);
Luca Barbieribc9025b2010-02-09 05:49:12 +00001167 drm_gem_object_unreference_unlocked(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001168 if (IS_ERR((void *)addr))
1169 return addr;
1170
1171 args->addr_ptr = (uint64_t) addr;
1172
1173 return 0;
1174}
1175
Jesse Barnesde151cf2008-11-12 10:03:55 -08001176/**
1177 * i915_gem_fault - fault a page into the GTT
1178 * vma: VMA in question
1179 * vmf: fault info
1180 *
1181 * The fault handler is set up by drm_gem_mmap() when a object is GTT mapped
1182 * from userspace. The fault handler takes care of binding the object to
1183 * the GTT (if needed), allocating and programming a fence register (again,
1184 * only if needed based on whether the old reg is still valid or the object
1185 * is tiled) and inserting a new PTE into the faulting process.
1186 *
1187 * Note that the faulting process may involve evicting existing objects
1188 * from the GTT and/or fence registers to make room. So performance may
1189 * suffer if the GTT working set is large or there are few fence registers
1190 * left.
1191 */
1192int i915_gem_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
1193{
Chris Wilson05394f32010-11-08 19:18:58 +00001194 struct drm_i915_gem_object *obj = to_intel_bo(vma->vm_private_data);
1195 struct drm_device *dev = obj->base.dev;
Chris Wilson7d1c4802010-08-07 21:45:03 +01001196 drm_i915_private_t *dev_priv = dev->dev_private;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001197 pgoff_t page_offset;
1198 unsigned long pfn;
1199 int ret = 0;
Jesse Barnes0f973f22009-01-26 17:10:45 -08001200 bool write = !!(vmf->flags & FAULT_FLAG_WRITE);
Jesse Barnesde151cf2008-11-12 10:03:55 -08001201
1202 /* We don't use vmf->pgoff since that has the fake offset */
1203 page_offset = ((unsigned long)vmf->virtual_address - vma->vm_start) >>
1204 PAGE_SHIFT;
1205
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001206 ret = i915_mutex_lock_interruptible(dev);
1207 if (ret)
1208 goto out;
Chris Wilsona00b10c2010-09-24 21:15:47 +01001209
Chris Wilsondb53a302011-02-03 11:57:46 +00001210 trace_i915_gem_object_fault(obj, page_offset, true, write);
1211
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001212 /* Now bind it into the GTT if needed */
Chris Wilson919926a2010-11-12 13:42:53 +00001213 if (!obj->map_and_fenceable) {
1214 ret = i915_gem_object_unbind(obj);
1215 if (ret)
1216 goto unlock;
Chris Wilsona00b10c2010-09-24 21:15:47 +01001217 }
Chris Wilson05394f32010-11-08 19:18:58 +00001218 if (!obj->gtt_space) {
Daniel Vetter75e9e912010-11-04 17:11:09 +01001219 ret = i915_gem_object_bind_to_gtt(obj, 0, true);
Chris Wilsonc7150892009-09-23 00:43:56 +01001220 if (ret)
1221 goto unlock;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001222
Eric Anholte92d03b2011-06-14 16:43:09 -07001223 ret = i915_gem_object_set_to_gtt_domain(obj, write);
1224 if (ret)
1225 goto unlock;
1226 }
Chris Wilson4a684a42010-10-28 14:44:08 +01001227
Chris Wilsond9e86c02010-11-10 16:40:20 +00001228 if (obj->tiling_mode == I915_TILING_NONE)
1229 ret = i915_gem_object_put_fence(obj);
1230 else
Chris Wilsonce453d82011-02-21 14:43:56 +00001231 ret = i915_gem_object_get_fence(obj, NULL);
Chris Wilsond9e86c02010-11-10 16:40:20 +00001232 if (ret)
1233 goto unlock;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001234
Chris Wilson05394f32010-11-08 19:18:58 +00001235 if (i915_gem_object_is_inactive(obj))
1236 list_move_tail(&obj->mm_list, &dev_priv->mm.inactive_list);
Chris Wilson7d1c4802010-08-07 21:45:03 +01001237
Chris Wilson6299f992010-11-24 12:23:44 +00001238 obj->fault_mappable = true;
1239
Chris Wilson05394f32010-11-08 19:18:58 +00001240 pfn = ((dev->agp->base + obj->gtt_offset) >> PAGE_SHIFT) +
Jesse Barnesde151cf2008-11-12 10:03:55 -08001241 page_offset;
1242
1243 /* Finally, remap it using the new GTT offset */
1244 ret = vm_insert_pfn(vma, (unsigned long)vmf->virtual_address, pfn);
Chris Wilsonc7150892009-09-23 00:43:56 +01001245unlock:
Jesse Barnesde151cf2008-11-12 10:03:55 -08001246 mutex_unlock(&dev->struct_mutex);
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001247out:
Jesse Barnesde151cf2008-11-12 10:03:55 -08001248 switch (ret) {
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001249 case -EIO:
Chris Wilson045e7692010-11-07 09:18:22 +00001250 case -EAGAIN:
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001251 /* Give the error handler a chance to run and move the
1252 * objects off the GPU active list. Next time we service the
1253 * fault, we should be able to transition the page into the
1254 * GTT without touching the GPU (and so avoid further
1255 * EIO/EGAIN). If the GPU is wedged, then there is no issue
1256 * with coherency, just lost writes.
1257 */
Chris Wilson045e7692010-11-07 09:18:22 +00001258 set_need_resched();
Chris Wilsonc7150892009-09-23 00:43:56 +01001259 case 0:
1260 case -ERESTARTSYS:
Chris Wilsonbed636a2011-02-11 20:31:19 +00001261 case -EINTR:
Chris Wilsonc7150892009-09-23 00:43:56 +01001262 return VM_FAULT_NOPAGE;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001263 case -ENOMEM:
Jesse Barnesde151cf2008-11-12 10:03:55 -08001264 return VM_FAULT_OOM;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001265 default:
Chris Wilsonc7150892009-09-23 00:43:56 +01001266 return VM_FAULT_SIGBUS;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001267 }
1268}
1269
1270/**
1271 * i915_gem_create_mmap_offset - create a fake mmap offset for an object
1272 * @obj: obj in question
1273 *
1274 * GEM memory mapping works by handing back to userspace a fake mmap offset
1275 * it can use in a subsequent mmap(2) call. The DRM core code then looks
1276 * up the object based on the offset and sets up the various memory mapping
1277 * structures.
1278 *
1279 * This routine allocates and attaches a fake offset for @obj.
1280 */
1281static int
Chris Wilson05394f32010-11-08 19:18:58 +00001282i915_gem_create_mmap_offset(struct drm_i915_gem_object *obj)
Jesse Barnesde151cf2008-11-12 10:03:55 -08001283{
Chris Wilson05394f32010-11-08 19:18:58 +00001284 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001285 struct drm_gem_mm *mm = dev->mm_private;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001286 struct drm_map_list *list;
Benjamin Herrenschmidtf77d3902009-02-02 16:55:46 +11001287 struct drm_local_map *map;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001288 int ret = 0;
1289
1290 /* Set the object up for mmap'ing */
Chris Wilson05394f32010-11-08 19:18:58 +00001291 list = &obj->base.map_list;
Eric Anholt9a298b22009-03-24 12:23:04 -07001292 list->map = kzalloc(sizeof(struct drm_map_list), GFP_KERNEL);
Jesse Barnesde151cf2008-11-12 10:03:55 -08001293 if (!list->map)
1294 return -ENOMEM;
1295
1296 map = list->map;
1297 map->type = _DRM_GEM;
Chris Wilson05394f32010-11-08 19:18:58 +00001298 map->size = obj->base.size;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001299 map->handle = obj;
1300
1301 /* Get a DRM GEM mmap offset allocated... */
1302 list->file_offset_node = drm_mm_search_free(&mm->offset_manager,
Chris Wilson05394f32010-11-08 19:18:58 +00001303 obj->base.size / PAGE_SIZE,
1304 0, 0);
Jesse Barnesde151cf2008-11-12 10:03:55 -08001305 if (!list->file_offset_node) {
Chris Wilson05394f32010-11-08 19:18:58 +00001306 DRM_ERROR("failed to allocate offset for bo %d\n",
1307 obj->base.name);
Chris Wilson9e0ae5342010-09-21 15:05:24 +01001308 ret = -ENOSPC;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001309 goto out_free_list;
1310 }
1311
1312 list->file_offset_node = drm_mm_get_block(list->file_offset_node,
Chris Wilson05394f32010-11-08 19:18:58 +00001313 obj->base.size / PAGE_SIZE,
1314 0);
Jesse Barnesde151cf2008-11-12 10:03:55 -08001315 if (!list->file_offset_node) {
1316 ret = -ENOMEM;
1317 goto out_free_list;
1318 }
1319
1320 list->hash.key = list->file_offset_node->start;
Chris Wilson9e0ae5342010-09-21 15:05:24 +01001321 ret = drm_ht_insert_item(&mm->offset_hash, &list->hash);
1322 if (ret) {
Jesse Barnesde151cf2008-11-12 10:03:55 -08001323 DRM_ERROR("failed to add to map hash\n");
1324 goto out_free_mm;
1325 }
1326
Jesse Barnesde151cf2008-11-12 10:03:55 -08001327 return 0;
1328
1329out_free_mm:
1330 drm_mm_put_block(list->file_offset_node);
1331out_free_list:
Eric Anholt9a298b22009-03-24 12:23:04 -07001332 kfree(list->map);
Chris Wilson39a01d12010-10-28 13:03:06 +01001333 list->map = NULL;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001334
1335 return ret;
1336}
1337
Chris Wilson901782b2009-07-10 08:18:50 +01001338/**
1339 * i915_gem_release_mmap - remove physical page mappings
1340 * @obj: obj in question
1341 *
André Goddard Rosaaf901ca2009-11-14 13:09:05 -02001342 * Preserve the reservation of the mmapping with the DRM core code, but
Chris Wilson901782b2009-07-10 08:18:50 +01001343 * relinquish ownership of the pages back to the system.
1344 *
1345 * It is vital that we remove the page mapping if we have mapped a tiled
1346 * object through the GTT and then lose the fence register due to
1347 * resource pressure. Similarly if the object has been moved out of the
1348 * aperture, than pages mapped into userspace must be revoked. Removing the
1349 * mapping will then trigger a page fault on the next user access, allowing
1350 * fixup by i915_gem_fault().
1351 */
Eric Anholtd05ca302009-07-10 13:02:26 -07001352void
Chris Wilson05394f32010-11-08 19:18:58 +00001353i915_gem_release_mmap(struct drm_i915_gem_object *obj)
Chris Wilson901782b2009-07-10 08:18:50 +01001354{
Chris Wilson6299f992010-11-24 12:23:44 +00001355 if (!obj->fault_mappable)
1356 return;
Chris Wilson901782b2009-07-10 08:18:50 +01001357
Chris Wilsonf6e47882011-03-20 21:09:12 +00001358 if (obj->base.dev->dev_mapping)
1359 unmap_mapping_range(obj->base.dev->dev_mapping,
1360 (loff_t)obj->base.map_list.hash.key<<PAGE_SHIFT,
1361 obj->base.size, 1);
Daniel Vetterfb7d5162010-10-01 22:05:20 +02001362
Chris Wilson6299f992010-11-24 12:23:44 +00001363 obj->fault_mappable = false;
Chris Wilson901782b2009-07-10 08:18:50 +01001364}
1365
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001366static void
Chris Wilson05394f32010-11-08 19:18:58 +00001367i915_gem_free_mmap_offset(struct drm_i915_gem_object *obj)
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001368{
Chris Wilson05394f32010-11-08 19:18:58 +00001369 struct drm_device *dev = obj->base.dev;
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001370 struct drm_gem_mm *mm = dev->mm_private;
Chris Wilson05394f32010-11-08 19:18:58 +00001371 struct drm_map_list *list = &obj->base.map_list;
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001372
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001373 drm_ht_remove_item(&mm->offset_hash, &list->hash);
Chris Wilson39a01d12010-10-28 13:03:06 +01001374 drm_mm_put_block(list->file_offset_node);
1375 kfree(list->map);
1376 list->map = NULL;
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001377}
1378
Chris Wilson92b88ae2010-11-09 11:47:32 +00001379static uint32_t
1380i915_gem_get_gtt_size(struct drm_i915_gem_object *obj)
1381{
1382 struct drm_device *dev = obj->base.dev;
1383 uint32_t size;
1384
1385 if (INTEL_INFO(dev)->gen >= 4 ||
1386 obj->tiling_mode == I915_TILING_NONE)
1387 return obj->base.size;
1388
1389 /* Previous chips need a power-of-two fence region when tiling */
1390 if (INTEL_INFO(dev)->gen == 3)
1391 size = 1024*1024;
1392 else
1393 size = 512*1024;
1394
1395 while (size < obj->base.size)
1396 size <<= 1;
1397
1398 return size;
1399}
1400
Jesse Barnesde151cf2008-11-12 10:03:55 -08001401/**
1402 * i915_gem_get_gtt_alignment - return required GTT alignment for an object
1403 * @obj: object to check
1404 *
1405 * Return the required GTT alignment for an object, taking into account
Daniel Vetter5e783302010-11-14 22:32:36 +01001406 * potential fence register mapping.
Jesse Barnesde151cf2008-11-12 10:03:55 -08001407 */
1408static uint32_t
Chris Wilson05394f32010-11-08 19:18:58 +00001409i915_gem_get_gtt_alignment(struct drm_i915_gem_object *obj)
Jesse Barnesde151cf2008-11-12 10:03:55 -08001410{
Chris Wilson05394f32010-11-08 19:18:58 +00001411 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001412
1413 /*
1414 * Minimum alignment is 4k (GTT page size), but might be greater
1415 * if a fence register is needed for the object.
1416 */
Chris Wilsona00b10c2010-09-24 21:15:47 +01001417 if (INTEL_INFO(dev)->gen >= 4 ||
Chris Wilson05394f32010-11-08 19:18:58 +00001418 obj->tiling_mode == I915_TILING_NONE)
Jesse Barnesde151cf2008-11-12 10:03:55 -08001419 return 4096;
1420
1421 /*
1422 * Previous chips need to be aligned to the size of the smallest
1423 * fence register that can contain the object.
1424 */
Chris Wilson05394f32010-11-08 19:18:58 +00001425 return i915_gem_get_gtt_size(obj);
Chris Wilsona00b10c2010-09-24 21:15:47 +01001426}
1427
Daniel Vetter5e783302010-11-14 22:32:36 +01001428/**
1429 * i915_gem_get_unfenced_gtt_alignment - return required GTT alignment for an
1430 * unfenced object
1431 * @obj: object to check
1432 *
1433 * Return the required GTT alignment for an object, only taking into account
1434 * unfenced tiled surface requirements.
1435 */
Chris Wilson467cffb2011-03-07 10:42:03 +00001436uint32_t
Chris Wilson05394f32010-11-08 19:18:58 +00001437i915_gem_get_unfenced_gtt_alignment(struct drm_i915_gem_object *obj)
Daniel Vetter5e783302010-11-14 22:32:36 +01001438{
Chris Wilson05394f32010-11-08 19:18:58 +00001439 struct drm_device *dev = obj->base.dev;
Daniel Vetter5e783302010-11-14 22:32:36 +01001440 int tile_height;
1441
1442 /*
1443 * Minimum alignment is 4k (GTT page size) for sane hw.
1444 */
1445 if (INTEL_INFO(dev)->gen >= 4 || IS_G33(dev) ||
Chris Wilson05394f32010-11-08 19:18:58 +00001446 obj->tiling_mode == I915_TILING_NONE)
Daniel Vetter5e783302010-11-14 22:32:36 +01001447 return 4096;
1448
1449 /*
1450 * Older chips need unfenced tiled buffers to be aligned to the left
1451 * edge of an even tile row (where tile rows are counted as if the bo is
1452 * placed in a fenced gtt region).
1453 */
Daniel Vetterc8ebc2b2011-05-12 22:17:20 +01001454 if (IS_GEN2(dev))
1455 tile_height = 16;
1456 else if (obj->tiling_mode == I915_TILING_Y && HAS_128_BYTE_Y_TILING(dev))
Daniel Vetter5e783302010-11-14 22:32:36 +01001457 tile_height = 32;
1458 else
1459 tile_height = 8;
1460
Chris Wilson05394f32010-11-08 19:18:58 +00001461 return tile_height * obj->stride * 2;
Daniel Vetter5e783302010-11-14 22:32:36 +01001462}
1463
Jesse Barnesde151cf2008-11-12 10:03:55 -08001464int
Dave Airlieff72145b2011-02-07 12:16:14 +10001465i915_gem_mmap_gtt(struct drm_file *file,
1466 struct drm_device *dev,
1467 uint32_t handle,
1468 uint64_t *offset)
Jesse Barnesde151cf2008-11-12 10:03:55 -08001469{
Chris Wilsonda761a62010-10-27 17:37:08 +01001470 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00001471 struct drm_i915_gem_object *obj;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001472 int ret;
1473
1474 if (!(dev->driver->driver_features & DRIVER_GEM))
1475 return -ENODEV;
1476
Chris Wilson76c1dec2010-09-25 11:22:51 +01001477 ret = i915_mutex_lock_interruptible(dev);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001478 if (ret)
Chris Wilson76c1dec2010-09-25 11:22:51 +01001479 return ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001480
Dave Airlieff72145b2011-02-07 12:16:14 +10001481 obj = to_intel_bo(drm_gem_object_lookup(dev, file, handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00001482 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001483 ret = -ENOENT;
1484 goto unlock;
1485 }
Jesse Barnesde151cf2008-11-12 10:03:55 -08001486
Chris Wilson05394f32010-11-08 19:18:58 +00001487 if (obj->base.size > dev_priv->mm.gtt_mappable_end) {
Chris Wilsonda761a62010-10-27 17:37:08 +01001488 ret = -E2BIG;
1489 goto unlock;
1490 }
1491
Chris Wilson05394f32010-11-08 19:18:58 +00001492 if (obj->madv != I915_MADV_WILLNEED) {
Chris Wilsonab182822009-09-22 18:46:17 +01001493 DRM_ERROR("Attempting to mmap a purgeable buffer\n");
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001494 ret = -EINVAL;
1495 goto out;
Chris Wilsonab182822009-09-22 18:46:17 +01001496 }
1497
Chris Wilson05394f32010-11-08 19:18:58 +00001498 if (!obj->base.map_list.map) {
Jesse Barnesde151cf2008-11-12 10:03:55 -08001499 ret = i915_gem_create_mmap_offset(obj);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001500 if (ret)
1501 goto out;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001502 }
1503
Dave Airlieff72145b2011-02-07 12:16:14 +10001504 *offset = (u64)obj->base.map_list.hash.key << PAGE_SHIFT;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001505
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001506out:
Chris Wilson05394f32010-11-08 19:18:58 +00001507 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001508unlock:
Jesse Barnesde151cf2008-11-12 10:03:55 -08001509 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001510 return ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001511}
1512
Dave Airlieff72145b2011-02-07 12:16:14 +10001513/**
1514 * i915_gem_mmap_gtt_ioctl - prepare an object for GTT mmap'ing
1515 * @dev: DRM device
1516 * @data: GTT mapping ioctl data
1517 * @file: GEM object info
1518 *
1519 * Simply returns the fake offset to userspace so it can mmap it.
1520 * The mmap call will end up in drm_gem_mmap(), which will set things
1521 * up so we can get faults in the handler above.
1522 *
1523 * The fault handler will take care of binding the object into the GTT
1524 * (since it may have been evicted to make room for something), allocating
1525 * a fence register, and mapping the appropriate aperture address into
1526 * userspace.
1527 */
1528int
1529i915_gem_mmap_gtt_ioctl(struct drm_device *dev, void *data,
1530 struct drm_file *file)
1531{
1532 struct drm_i915_gem_mmap_gtt *args = data;
1533
1534 if (!(dev->driver->driver_features & DRIVER_GEM))
1535 return -ENODEV;
1536
1537 return i915_gem_mmap_gtt(file, dev, args->handle, &args->offset);
1538}
1539
1540
Chris Wilsone5281cc2010-10-28 13:45:36 +01001541static int
Chris Wilson05394f32010-11-08 19:18:58 +00001542i915_gem_object_get_pages_gtt(struct drm_i915_gem_object *obj,
Chris Wilsone5281cc2010-10-28 13:45:36 +01001543 gfp_t gfpmask)
1544{
Chris Wilsone5281cc2010-10-28 13:45:36 +01001545 int page_count, i;
1546 struct address_space *mapping;
1547 struct inode *inode;
1548 struct page *page;
1549
1550 /* Get the list of pages out of our struct file. They'll be pinned
1551 * at this point until we release them.
1552 */
Chris Wilson05394f32010-11-08 19:18:58 +00001553 page_count = obj->base.size / PAGE_SIZE;
1554 BUG_ON(obj->pages != NULL);
1555 obj->pages = drm_malloc_ab(page_count, sizeof(struct page *));
1556 if (obj->pages == NULL)
Chris Wilsone5281cc2010-10-28 13:45:36 +01001557 return -ENOMEM;
1558
Chris Wilson05394f32010-11-08 19:18:58 +00001559 inode = obj->base.filp->f_path.dentry->d_inode;
Chris Wilsone5281cc2010-10-28 13:45:36 +01001560 mapping = inode->i_mapping;
1561 for (i = 0; i < page_count; i++) {
1562 page = read_cache_page_gfp(mapping, i,
1563 GFP_HIGHUSER |
1564 __GFP_COLD |
1565 __GFP_RECLAIMABLE |
1566 gfpmask);
1567 if (IS_ERR(page))
1568 goto err_pages;
1569
Chris Wilson05394f32010-11-08 19:18:58 +00001570 obj->pages[i] = page;
Chris Wilsone5281cc2010-10-28 13:45:36 +01001571 }
1572
Chris Wilson05394f32010-11-08 19:18:58 +00001573 if (obj->tiling_mode != I915_TILING_NONE)
Chris Wilsone5281cc2010-10-28 13:45:36 +01001574 i915_gem_object_do_bit_17_swizzle(obj);
1575
1576 return 0;
1577
1578err_pages:
1579 while (i--)
Chris Wilson05394f32010-11-08 19:18:58 +00001580 page_cache_release(obj->pages[i]);
Chris Wilsone5281cc2010-10-28 13:45:36 +01001581
Chris Wilson05394f32010-11-08 19:18:58 +00001582 drm_free_large(obj->pages);
1583 obj->pages = NULL;
Chris Wilsone5281cc2010-10-28 13:45:36 +01001584 return PTR_ERR(page);
1585}
1586
Chris Wilson5cdf5882010-09-27 15:51:07 +01001587static void
Chris Wilson05394f32010-11-08 19:18:58 +00001588i915_gem_object_put_pages_gtt(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07001589{
Chris Wilson05394f32010-11-08 19:18:58 +00001590 int page_count = obj->base.size / PAGE_SIZE;
Eric Anholt673a3942008-07-30 12:06:12 -07001591 int i;
1592
Chris Wilson05394f32010-11-08 19:18:58 +00001593 BUG_ON(obj->madv == __I915_MADV_PURGED);
Eric Anholt856fa192009-03-19 14:10:50 -07001594
Chris Wilson05394f32010-11-08 19:18:58 +00001595 if (obj->tiling_mode != I915_TILING_NONE)
Eric Anholt280b7132009-03-12 16:56:27 -07001596 i915_gem_object_save_bit_17_swizzle(obj);
1597
Chris Wilson05394f32010-11-08 19:18:58 +00001598 if (obj->madv == I915_MADV_DONTNEED)
1599 obj->dirty = 0;
Chris Wilson3ef94da2009-09-14 16:50:29 +01001600
1601 for (i = 0; i < page_count; i++) {
Chris Wilson05394f32010-11-08 19:18:58 +00001602 if (obj->dirty)
1603 set_page_dirty(obj->pages[i]);
Chris Wilson3ef94da2009-09-14 16:50:29 +01001604
Chris Wilson05394f32010-11-08 19:18:58 +00001605 if (obj->madv == I915_MADV_WILLNEED)
1606 mark_page_accessed(obj->pages[i]);
Chris Wilson3ef94da2009-09-14 16:50:29 +01001607
Chris Wilson05394f32010-11-08 19:18:58 +00001608 page_cache_release(obj->pages[i]);
Chris Wilson3ef94da2009-09-14 16:50:29 +01001609 }
Chris Wilson05394f32010-11-08 19:18:58 +00001610 obj->dirty = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001611
Chris Wilson05394f32010-11-08 19:18:58 +00001612 drm_free_large(obj->pages);
1613 obj->pages = NULL;
Eric Anholt673a3942008-07-30 12:06:12 -07001614}
1615
Chris Wilson54cf91d2010-11-25 18:00:26 +00001616void
Chris Wilson05394f32010-11-08 19:18:58 +00001617i915_gem_object_move_to_active(struct drm_i915_gem_object *obj,
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001618 struct intel_ring_buffer *ring,
1619 u32 seqno)
Eric Anholt673a3942008-07-30 12:06:12 -07001620{
Chris Wilson05394f32010-11-08 19:18:58 +00001621 struct drm_device *dev = obj->base.dev;
Chris Wilson69dc4982010-10-19 10:36:51 +01001622 struct drm_i915_private *dev_priv = dev->dev_private;
Daniel Vetter617dbe22010-02-11 22:16:02 +01001623
Zou Nan hai852835f2010-05-21 09:08:56 +08001624 BUG_ON(ring == NULL);
Chris Wilson05394f32010-11-08 19:18:58 +00001625 obj->ring = ring;
Eric Anholt673a3942008-07-30 12:06:12 -07001626
1627 /* Add a reference if we're newly entering the active list. */
Chris Wilson05394f32010-11-08 19:18:58 +00001628 if (!obj->active) {
1629 drm_gem_object_reference(&obj->base);
1630 obj->active = 1;
Eric Anholt673a3942008-07-30 12:06:12 -07001631 }
Daniel Vettere35a41d2010-02-11 22:13:59 +01001632
Eric Anholt673a3942008-07-30 12:06:12 -07001633 /* Move from whatever list we were on to the tail of execution. */
Chris Wilson05394f32010-11-08 19:18:58 +00001634 list_move_tail(&obj->mm_list, &dev_priv->mm.active_list);
1635 list_move_tail(&obj->ring_list, &ring->active_list);
Chris Wilsoncaea7472010-11-12 13:53:37 +00001636
Chris Wilson05394f32010-11-08 19:18:58 +00001637 obj->last_rendering_seqno = seqno;
Chris Wilsoncaea7472010-11-12 13:53:37 +00001638 if (obj->fenced_gpu_access) {
1639 struct drm_i915_fence_reg *reg;
1640
1641 BUG_ON(obj->fence_reg == I915_FENCE_REG_NONE);
1642
1643 obj->last_fenced_seqno = seqno;
1644 obj->last_fenced_ring = ring;
1645
1646 reg = &dev_priv->fence_regs[obj->fence_reg];
1647 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
1648 }
1649}
1650
1651static void
1652i915_gem_object_move_off_active(struct drm_i915_gem_object *obj)
1653{
1654 list_del_init(&obj->ring_list);
1655 obj->last_rendering_seqno = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001656}
1657
Eric Anholtce44b0e2008-11-06 16:00:31 -08001658static void
Chris Wilson05394f32010-11-08 19:18:58 +00001659i915_gem_object_move_to_flushing(struct drm_i915_gem_object *obj)
Eric Anholtce44b0e2008-11-06 16:00:31 -08001660{
Chris Wilson05394f32010-11-08 19:18:58 +00001661 struct drm_device *dev = obj->base.dev;
Eric Anholtce44b0e2008-11-06 16:00:31 -08001662 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholtce44b0e2008-11-06 16:00:31 -08001663
Chris Wilson05394f32010-11-08 19:18:58 +00001664 BUG_ON(!obj->active);
1665 list_move_tail(&obj->mm_list, &dev_priv->mm.flushing_list);
Chris Wilsoncaea7472010-11-12 13:53:37 +00001666
1667 i915_gem_object_move_off_active(obj);
1668}
1669
1670static void
1671i915_gem_object_move_to_inactive(struct drm_i915_gem_object *obj)
1672{
1673 struct drm_device *dev = obj->base.dev;
1674 struct drm_i915_private *dev_priv = dev->dev_private;
1675
1676 if (obj->pin_count != 0)
1677 list_move_tail(&obj->mm_list, &dev_priv->mm.pinned_list);
1678 else
1679 list_move_tail(&obj->mm_list, &dev_priv->mm.inactive_list);
1680
1681 BUG_ON(!list_empty(&obj->gpu_write_list));
1682 BUG_ON(!obj->active);
1683 obj->ring = NULL;
1684
1685 i915_gem_object_move_off_active(obj);
1686 obj->fenced_gpu_access = false;
Chris Wilsoncaea7472010-11-12 13:53:37 +00001687
1688 obj->active = 0;
Chris Wilson87ca9c82010-12-02 09:42:56 +00001689 obj->pending_gpu_write = false;
Chris Wilsoncaea7472010-11-12 13:53:37 +00001690 drm_gem_object_unreference(&obj->base);
1691
1692 WARN_ON(i915_verify_lists(dev));
Eric Anholtce44b0e2008-11-06 16:00:31 -08001693}
Eric Anholt673a3942008-07-30 12:06:12 -07001694
Chris Wilson963b4832009-09-20 23:03:54 +01001695/* Immediately discard the backing storage */
1696static void
Chris Wilson05394f32010-11-08 19:18:58 +00001697i915_gem_object_truncate(struct drm_i915_gem_object *obj)
Chris Wilson963b4832009-09-20 23:03:54 +01001698{
Chris Wilsonbb6baf72009-09-22 14:24:13 +01001699 struct inode *inode;
Chris Wilson963b4832009-09-20 23:03:54 +01001700
Chris Wilsonae9fed62010-08-07 11:01:30 +01001701 /* Our goal here is to return as much of the memory as
1702 * is possible back to the system as we are called from OOM.
1703 * To do this we must instruct the shmfs to drop all of its
1704 * backing pages, *now*. Here we mirror the actions taken
1705 * when by shmem_delete_inode() to release the backing store.
1706 */
Chris Wilson05394f32010-11-08 19:18:58 +00001707 inode = obj->base.filp->f_path.dentry->d_inode;
Chris Wilsonae9fed62010-08-07 11:01:30 +01001708 truncate_inode_pages(inode->i_mapping, 0);
1709 if (inode->i_op->truncate_range)
1710 inode->i_op->truncate_range(inode, 0, (loff_t)-1);
Chris Wilsonbb6baf72009-09-22 14:24:13 +01001711
Chris Wilson05394f32010-11-08 19:18:58 +00001712 obj->madv = __I915_MADV_PURGED;
Chris Wilson963b4832009-09-20 23:03:54 +01001713}
1714
1715static inline int
Chris Wilson05394f32010-11-08 19:18:58 +00001716i915_gem_object_is_purgeable(struct drm_i915_gem_object *obj)
Chris Wilson963b4832009-09-20 23:03:54 +01001717{
Chris Wilson05394f32010-11-08 19:18:58 +00001718 return obj->madv == I915_MADV_DONTNEED;
Chris Wilson963b4832009-09-20 23:03:54 +01001719}
1720
Eric Anholt673a3942008-07-30 12:06:12 -07001721static void
Chris Wilsondb53a302011-02-03 11:57:46 +00001722i915_gem_process_flushing_list(struct intel_ring_buffer *ring,
1723 uint32_t flush_domains)
Daniel Vetter63560392010-02-19 11:51:59 +01001724{
Chris Wilson05394f32010-11-08 19:18:58 +00001725 struct drm_i915_gem_object *obj, *next;
Daniel Vetter63560392010-02-19 11:51:59 +01001726
Chris Wilson05394f32010-11-08 19:18:58 +00001727 list_for_each_entry_safe(obj, next,
Chris Wilson64193402010-10-24 12:38:05 +01001728 &ring->gpu_write_list,
Daniel Vetter63560392010-02-19 11:51:59 +01001729 gpu_write_list) {
Chris Wilson05394f32010-11-08 19:18:58 +00001730 if (obj->base.write_domain & flush_domains) {
1731 uint32_t old_write_domain = obj->base.write_domain;
Daniel Vetter63560392010-02-19 11:51:59 +01001732
Chris Wilson05394f32010-11-08 19:18:58 +00001733 obj->base.write_domain = 0;
1734 list_del_init(&obj->gpu_write_list);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001735 i915_gem_object_move_to_active(obj, ring,
Chris Wilsondb53a302011-02-03 11:57:46 +00001736 i915_gem_next_request_seqno(ring));
Daniel Vetter63560392010-02-19 11:51:59 +01001737
Daniel Vetter63560392010-02-19 11:51:59 +01001738 trace_i915_gem_object_change_domain(obj,
Chris Wilson05394f32010-11-08 19:18:58 +00001739 obj->base.read_domains,
Daniel Vetter63560392010-02-19 11:51:59 +01001740 old_write_domain);
1741 }
1742 }
1743}
Zou Nan hai8187a2b2010-05-21 09:08:55 +08001744
Chris Wilson3cce4692010-10-27 16:11:02 +01001745int
Chris Wilsondb53a302011-02-03 11:57:46 +00001746i915_add_request(struct intel_ring_buffer *ring,
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001747 struct drm_file *file,
Chris Wilsondb53a302011-02-03 11:57:46 +00001748 struct drm_i915_gem_request *request)
Eric Anholt673a3942008-07-30 12:06:12 -07001749{
Chris Wilsondb53a302011-02-03 11:57:46 +00001750 drm_i915_private_t *dev_priv = ring->dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07001751 uint32_t seqno;
1752 int was_empty;
Chris Wilson3cce4692010-10-27 16:11:02 +01001753 int ret;
1754
1755 BUG_ON(request == NULL);
Eric Anholt673a3942008-07-30 12:06:12 -07001756
Chris Wilson3cce4692010-10-27 16:11:02 +01001757 ret = ring->add_request(ring, &seqno);
1758 if (ret)
1759 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07001760
Chris Wilsondb53a302011-02-03 11:57:46 +00001761 trace_i915_gem_request_add(ring, seqno);
Eric Anholt673a3942008-07-30 12:06:12 -07001762
1763 request->seqno = seqno;
Zou Nan hai852835f2010-05-21 09:08:56 +08001764 request->ring = ring;
Eric Anholt673a3942008-07-30 12:06:12 -07001765 request->emitted_jiffies = jiffies;
Zou Nan hai852835f2010-05-21 09:08:56 +08001766 was_empty = list_empty(&ring->request_list);
1767 list_add_tail(&request->list, &ring->request_list);
1768
Chris Wilsondb53a302011-02-03 11:57:46 +00001769 if (file) {
1770 struct drm_i915_file_private *file_priv = file->driver_priv;
1771
Chris Wilson1c255952010-09-26 11:03:27 +01001772 spin_lock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001773 request->file_priv = file_priv;
Eric Anholtb9624422009-06-03 07:27:35 +00001774 list_add_tail(&request->client_list,
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001775 &file_priv->mm.request_list);
Chris Wilson1c255952010-09-26 11:03:27 +01001776 spin_unlock(&file_priv->mm.lock);
Eric Anholtb9624422009-06-03 07:27:35 +00001777 }
Eric Anholt673a3942008-07-30 12:06:12 -07001778
Chris Wilsondb53a302011-02-03 11:57:46 +00001779 ring->outstanding_lazy_request = false;
1780
Ben Gamarif65d9422009-09-14 17:48:44 -04001781 if (!dev_priv->mm.suspended) {
Chris Wilsonb3b079d2010-09-13 23:44:34 +01001782 mod_timer(&dev_priv->hangcheck_timer,
1783 jiffies + msecs_to_jiffies(DRM_I915_HANGCHECK_PERIOD));
Ben Gamarif65d9422009-09-14 17:48:44 -04001784 if (was_empty)
Chris Wilsonb3b079d2010-09-13 23:44:34 +01001785 queue_delayed_work(dev_priv->wq,
1786 &dev_priv->mm.retire_work, HZ);
Ben Gamarif65d9422009-09-14 17:48:44 -04001787 }
Chris Wilson3cce4692010-10-27 16:11:02 +01001788 return 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001789}
1790
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001791static inline void
1792i915_gem_request_remove_from_client(struct drm_i915_gem_request *request)
Eric Anholt673a3942008-07-30 12:06:12 -07001793{
Chris Wilson1c255952010-09-26 11:03:27 +01001794 struct drm_i915_file_private *file_priv = request->file_priv;
Eric Anholt673a3942008-07-30 12:06:12 -07001795
Chris Wilson1c255952010-09-26 11:03:27 +01001796 if (!file_priv)
1797 return;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01001798
Chris Wilson1c255952010-09-26 11:03:27 +01001799 spin_lock(&file_priv->mm.lock);
Herton Ronaldo Krzesinski09bfa512011-03-17 13:45:12 +00001800 if (request->file_priv) {
1801 list_del(&request->client_list);
1802 request->file_priv = NULL;
1803 }
Chris Wilson1c255952010-09-26 11:03:27 +01001804 spin_unlock(&file_priv->mm.lock);
Eric Anholt673a3942008-07-30 12:06:12 -07001805}
1806
Chris Wilsondfaae392010-09-22 10:31:52 +01001807static void i915_gem_reset_ring_lists(struct drm_i915_private *dev_priv,
1808 struct intel_ring_buffer *ring)
Chris Wilson9375e442010-09-19 12:21:28 +01001809{
Chris Wilsondfaae392010-09-22 10:31:52 +01001810 while (!list_empty(&ring->request_list)) {
1811 struct drm_i915_gem_request *request;
Chris Wilson9375e442010-09-19 12:21:28 +01001812
Chris Wilsondfaae392010-09-22 10:31:52 +01001813 request = list_first_entry(&ring->request_list,
1814 struct drm_i915_gem_request,
1815 list);
1816
1817 list_del(&request->list);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001818 i915_gem_request_remove_from_client(request);
Chris Wilsondfaae392010-09-22 10:31:52 +01001819 kfree(request);
1820 }
1821
1822 while (!list_empty(&ring->active_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001823 struct drm_i915_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07001824
Chris Wilson05394f32010-11-08 19:18:58 +00001825 obj = list_first_entry(&ring->active_list,
1826 struct drm_i915_gem_object,
1827 ring_list);
Eric Anholt673a3942008-07-30 12:06:12 -07001828
Chris Wilson05394f32010-11-08 19:18:58 +00001829 obj->base.write_domain = 0;
1830 list_del_init(&obj->gpu_write_list);
1831 i915_gem_object_move_to_inactive(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001832 }
Eric Anholt673a3942008-07-30 12:06:12 -07001833}
1834
Chris Wilson312817a2010-11-22 11:50:11 +00001835static void i915_gem_reset_fences(struct drm_device *dev)
1836{
1837 struct drm_i915_private *dev_priv = dev->dev_private;
1838 int i;
1839
1840 for (i = 0; i < 16; i++) {
1841 struct drm_i915_fence_reg *reg = &dev_priv->fence_regs[i];
Chris Wilson7d2cb392010-11-27 17:38:29 +00001842 struct drm_i915_gem_object *obj = reg->obj;
1843
1844 if (!obj)
1845 continue;
1846
1847 if (obj->tiling_mode)
1848 i915_gem_release_mmap(obj);
1849
Chris Wilsond9e86c02010-11-10 16:40:20 +00001850 reg->obj->fence_reg = I915_FENCE_REG_NONE;
1851 reg->obj->fenced_gpu_access = false;
1852 reg->obj->last_fenced_seqno = 0;
1853 reg->obj->last_fenced_ring = NULL;
1854 i915_gem_clear_fence_reg(dev, reg);
Chris Wilson312817a2010-11-22 11:50:11 +00001855 }
1856}
1857
Chris Wilson069efc12010-09-30 16:53:18 +01001858void i915_gem_reset(struct drm_device *dev)
Eric Anholt673a3942008-07-30 12:06:12 -07001859{
Chris Wilsondfaae392010-09-22 10:31:52 +01001860 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00001861 struct drm_i915_gem_object *obj;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001862 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07001863
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001864 for (i = 0; i < I915_NUM_RINGS; i++)
1865 i915_gem_reset_ring_lists(dev_priv, &dev_priv->ring[i]);
Chris Wilsondfaae392010-09-22 10:31:52 +01001866
1867 /* Remove anything from the flushing lists. The GPU cache is likely
1868 * to be lost on reset along with the data, so simply move the
1869 * lost bo to the inactive list.
1870 */
1871 while (!list_empty(&dev_priv->mm.flushing_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001872 obj= list_first_entry(&dev_priv->mm.flushing_list,
1873 struct drm_i915_gem_object,
1874 mm_list);
Chris Wilson9375e442010-09-19 12:21:28 +01001875
Chris Wilson05394f32010-11-08 19:18:58 +00001876 obj->base.write_domain = 0;
1877 list_del_init(&obj->gpu_write_list);
1878 i915_gem_object_move_to_inactive(obj);
Chris Wilson9375e442010-09-19 12:21:28 +01001879 }
Chris Wilson9375e442010-09-19 12:21:28 +01001880
Chris Wilsondfaae392010-09-22 10:31:52 +01001881 /* Move everything out of the GPU domains to ensure we do any
1882 * necessary invalidation upon reuse.
1883 */
Chris Wilson05394f32010-11-08 19:18:58 +00001884 list_for_each_entry(obj,
Chris Wilson77f01232010-09-19 12:31:36 +01001885 &dev_priv->mm.inactive_list,
Chris Wilson69dc4982010-10-19 10:36:51 +01001886 mm_list)
Chris Wilson77f01232010-09-19 12:31:36 +01001887 {
Chris Wilson05394f32010-11-08 19:18:58 +00001888 obj->base.read_domains &= ~I915_GEM_GPU_DOMAINS;
Chris Wilson77f01232010-09-19 12:31:36 +01001889 }
Chris Wilson069efc12010-09-30 16:53:18 +01001890
1891 /* The fence registers are invalidated so clear them out */
Chris Wilson312817a2010-11-22 11:50:11 +00001892 i915_gem_reset_fences(dev);
Eric Anholt673a3942008-07-30 12:06:12 -07001893}
1894
1895/**
1896 * This function clears the request list as sequence numbers are passed.
1897 */
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001898static void
Chris Wilsondb53a302011-02-03 11:57:46 +00001899i915_gem_retire_requests_ring(struct intel_ring_buffer *ring)
Eric Anholt673a3942008-07-30 12:06:12 -07001900{
Eric Anholt673a3942008-07-30 12:06:12 -07001901 uint32_t seqno;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001902 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07001903
Chris Wilsondb53a302011-02-03 11:57:46 +00001904 if (list_empty(&ring->request_list))
Karsten Wiese6c0594a2009-02-23 15:07:57 +01001905 return;
1906
Chris Wilsondb53a302011-02-03 11:57:46 +00001907 WARN_ON(i915_verify_lists(ring->dev));
Eric Anholt673a3942008-07-30 12:06:12 -07001908
Chris Wilson78501ea2010-10-27 12:18:21 +01001909 seqno = ring->get_seqno(ring);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001910
Chris Wilson076e2c02011-01-21 10:07:18 +00001911 for (i = 0; i < ARRAY_SIZE(ring->sync_seqno); i++)
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001912 if (seqno >= ring->sync_seqno[i])
1913 ring->sync_seqno[i] = 0;
1914
Zou Nan hai852835f2010-05-21 09:08:56 +08001915 while (!list_empty(&ring->request_list)) {
Eric Anholt673a3942008-07-30 12:06:12 -07001916 struct drm_i915_gem_request *request;
Eric Anholt673a3942008-07-30 12:06:12 -07001917
Zou Nan hai852835f2010-05-21 09:08:56 +08001918 request = list_first_entry(&ring->request_list,
Eric Anholt673a3942008-07-30 12:06:12 -07001919 struct drm_i915_gem_request,
1920 list);
Eric Anholt673a3942008-07-30 12:06:12 -07001921
Chris Wilsondfaae392010-09-22 10:31:52 +01001922 if (!i915_seqno_passed(seqno, request->seqno))
Eric Anholt673a3942008-07-30 12:06:12 -07001923 break;
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001924
Chris Wilsondb53a302011-02-03 11:57:46 +00001925 trace_i915_gem_request_retire(ring, request->seqno);
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001926
1927 list_del(&request->list);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001928 i915_gem_request_remove_from_client(request);
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001929 kfree(request);
1930 }
1931
1932 /* Move any buffers on the active list that are no longer referenced
1933 * by the ringbuffer to the flushing/inactive lists as appropriate.
1934 */
1935 while (!list_empty(&ring->active_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001936 struct drm_i915_gem_object *obj;
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001937
Chris Wilson05394f32010-11-08 19:18:58 +00001938 obj= list_first_entry(&ring->active_list,
1939 struct drm_i915_gem_object,
1940 ring_list);
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001941
Chris Wilson05394f32010-11-08 19:18:58 +00001942 if (!i915_seqno_passed(seqno, obj->last_rendering_seqno))
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001943 break;
1944
Chris Wilson05394f32010-11-08 19:18:58 +00001945 if (obj->base.write_domain != 0)
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001946 i915_gem_object_move_to_flushing(obj);
1947 else
1948 i915_gem_object_move_to_inactive(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001949 }
Chris Wilson9d34e5d2009-09-24 05:26:06 +01001950
Chris Wilsondb53a302011-02-03 11:57:46 +00001951 if (unlikely(ring->trace_irq_seqno &&
1952 i915_seqno_passed(seqno, ring->trace_irq_seqno))) {
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001953 ring->irq_put(ring);
Chris Wilsondb53a302011-02-03 11:57:46 +00001954 ring->trace_irq_seqno = 0;
Chris Wilson9d34e5d2009-09-24 05:26:06 +01001955 }
Chris Wilson23bc5982010-09-29 16:10:57 +01001956
Chris Wilsondb53a302011-02-03 11:57:46 +00001957 WARN_ON(i915_verify_lists(ring->dev));
Eric Anholt673a3942008-07-30 12:06:12 -07001958}
1959
1960void
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001961i915_gem_retire_requests(struct drm_device *dev)
1962{
1963 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001964 int i;
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001965
Chris Wilsonbe726152010-07-23 23:18:50 +01001966 if (!list_empty(&dev_priv->mm.deferred_free_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001967 struct drm_i915_gem_object *obj, *next;
Chris Wilsonbe726152010-07-23 23:18:50 +01001968
1969 /* We must be careful that during unbind() we do not
1970 * accidentally infinitely recurse into retire requests.
1971 * Currently:
1972 * retire -> free -> unbind -> wait -> retire_ring
1973 */
Chris Wilson05394f32010-11-08 19:18:58 +00001974 list_for_each_entry_safe(obj, next,
Chris Wilsonbe726152010-07-23 23:18:50 +01001975 &dev_priv->mm.deferred_free_list,
Chris Wilson69dc4982010-10-19 10:36:51 +01001976 mm_list)
Chris Wilson05394f32010-11-08 19:18:58 +00001977 i915_gem_free_object_tail(obj);
Chris Wilsonbe726152010-07-23 23:18:50 +01001978 }
1979
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001980 for (i = 0; i < I915_NUM_RINGS; i++)
Chris Wilsondb53a302011-02-03 11:57:46 +00001981 i915_gem_retire_requests_ring(&dev_priv->ring[i]);
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001982}
1983
Daniel Vetter75ef9da2010-08-21 00:25:16 +02001984static void
Eric Anholt673a3942008-07-30 12:06:12 -07001985i915_gem_retire_work_handler(struct work_struct *work)
1986{
1987 drm_i915_private_t *dev_priv;
1988 struct drm_device *dev;
Chris Wilson0a587052011-01-09 21:05:44 +00001989 bool idle;
1990 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07001991
1992 dev_priv = container_of(work, drm_i915_private_t,
1993 mm.retire_work.work);
1994 dev = dev_priv->dev;
1995
Chris Wilson891b48c2010-09-29 12:26:37 +01001996 /* Come back later if the device is busy... */
1997 if (!mutex_trylock(&dev->struct_mutex)) {
1998 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, HZ);
1999 return;
2000 }
2001
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01002002 i915_gem_retire_requests(dev);
Zou Nan haid1b851f2010-05-21 09:08:57 +08002003
Chris Wilson0a587052011-01-09 21:05:44 +00002004 /* Send a periodic flush down the ring so we don't hold onto GEM
2005 * objects indefinitely.
2006 */
2007 idle = true;
2008 for (i = 0; i < I915_NUM_RINGS; i++) {
2009 struct intel_ring_buffer *ring = &dev_priv->ring[i];
2010
2011 if (!list_empty(&ring->gpu_write_list)) {
2012 struct drm_i915_gem_request *request;
2013 int ret;
2014
Chris Wilsondb53a302011-02-03 11:57:46 +00002015 ret = i915_gem_flush_ring(ring,
2016 0, I915_GEM_GPU_DOMAINS);
Chris Wilson0a587052011-01-09 21:05:44 +00002017 request = kzalloc(sizeof(*request), GFP_KERNEL);
2018 if (ret || request == NULL ||
Chris Wilsondb53a302011-02-03 11:57:46 +00002019 i915_add_request(ring, NULL, request))
Chris Wilson0a587052011-01-09 21:05:44 +00002020 kfree(request);
2021 }
2022
2023 idle &= list_empty(&ring->request_list);
2024 }
2025
2026 if (!dev_priv->mm.suspended && !idle)
Eric Anholt9c9fe1f2009-08-03 16:09:16 -07002027 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, HZ);
Chris Wilson0a587052011-01-09 21:05:44 +00002028
Eric Anholt673a3942008-07-30 12:06:12 -07002029 mutex_unlock(&dev->struct_mutex);
2030}
2031
Chris Wilsondb53a302011-02-03 11:57:46 +00002032/**
2033 * Waits for a sequence number to be signaled, and cleans up the
2034 * request and object lists appropriately for that event.
2035 */
Daniel Vetter5a5a0c62009-09-15 22:57:36 +02002036int
Chris Wilsondb53a302011-02-03 11:57:46 +00002037i915_wait_request(struct intel_ring_buffer *ring,
Chris Wilsonce453d82011-02-21 14:43:56 +00002038 uint32_t seqno)
Eric Anholt673a3942008-07-30 12:06:12 -07002039{
Chris Wilsondb53a302011-02-03 11:57:46 +00002040 drm_i915_private_t *dev_priv = ring->dev->dev_private;
Jesse Barnes802c7eb2009-05-05 16:03:48 -07002041 u32 ier;
Eric Anholt673a3942008-07-30 12:06:12 -07002042 int ret = 0;
2043
2044 BUG_ON(seqno == 0);
2045
Chris Wilsond9bc7e92011-02-07 13:09:31 +00002046 if (atomic_read(&dev_priv->mm.wedged)) {
2047 struct completion *x = &dev_priv->error_completion;
2048 bool recovery_complete;
2049 unsigned long flags;
2050
2051 /* Give the error handler a chance to run. */
2052 spin_lock_irqsave(&x->wait.lock, flags);
2053 recovery_complete = x->done > 0;
2054 spin_unlock_irqrestore(&x->wait.lock, flags);
2055
2056 return recovery_complete ? -EIO : -EAGAIN;
2057 }
Ben Gamariffed1d02009-09-14 17:48:41 -04002058
Chris Wilson5d97eb62010-11-10 20:40:02 +00002059 if (seqno == ring->outstanding_lazy_request) {
Chris Wilson3cce4692010-10-27 16:11:02 +01002060 struct drm_i915_gem_request *request;
2061
2062 request = kzalloc(sizeof(*request), GFP_KERNEL);
2063 if (request == NULL)
Daniel Vettere35a41d2010-02-11 22:13:59 +01002064 return -ENOMEM;
Chris Wilson3cce4692010-10-27 16:11:02 +01002065
Chris Wilsondb53a302011-02-03 11:57:46 +00002066 ret = i915_add_request(ring, NULL, request);
Chris Wilson3cce4692010-10-27 16:11:02 +01002067 if (ret) {
2068 kfree(request);
2069 return ret;
2070 }
2071
2072 seqno = request->seqno;
Daniel Vettere35a41d2010-02-11 22:13:59 +01002073 }
2074
Chris Wilson78501ea2010-10-27 12:18:21 +01002075 if (!i915_seqno_passed(ring->get_seqno(ring), seqno)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002076 if (HAS_PCH_SPLIT(ring->dev))
Zhenyu Wang036a4a72009-06-08 14:40:19 +08002077 ier = I915_READ(DEIER) | I915_READ(GTIER);
2078 else
2079 ier = I915_READ(IER);
Jesse Barnes802c7eb2009-05-05 16:03:48 -07002080 if (!ier) {
2081 DRM_ERROR("something (likely vbetool) disabled "
2082 "interrupts, re-enabling\n");
Chris Wilsondb53a302011-02-03 11:57:46 +00002083 i915_driver_irq_preinstall(ring->dev);
2084 i915_driver_irq_postinstall(ring->dev);
Jesse Barnes802c7eb2009-05-05 16:03:48 -07002085 }
2086
Chris Wilsondb53a302011-02-03 11:57:46 +00002087 trace_i915_gem_request_wait_begin(ring, seqno);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002088
Chris Wilsonb2223492010-10-27 15:27:33 +01002089 ring->waiting_seqno = seqno;
Chris Wilsonb13c2b92010-12-13 16:54:50 +00002090 if (ring->irq_get(ring)) {
Chris Wilsonce453d82011-02-21 14:43:56 +00002091 if (dev_priv->mm.interruptible)
Chris Wilsonb13c2b92010-12-13 16:54:50 +00002092 ret = wait_event_interruptible(ring->irq_queue,
2093 i915_seqno_passed(ring->get_seqno(ring), seqno)
2094 || atomic_read(&dev_priv->mm.wedged));
2095 else
2096 wait_event(ring->irq_queue,
2097 i915_seqno_passed(ring->get_seqno(ring), seqno)
2098 || atomic_read(&dev_priv->mm.wedged));
Daniel Vetter48764bf2009-09-15 22:57:32 +02002099
Chris Wilsonb13c2b92010-12-13 16:54:50 +00002100 ring->irq_put(ring);
Chris Wilsonb5ba1772010-12-14 12:17:15 +00002101 } else if (wait_for(i915_seqno_passed(ring->get_seqno(ring),
2102 seqno) ||
2103 atomic_read(&dev_priv->mm.wedged), 3000))
2104 ret = -EBUSY;
Chris Wilsonb2223492010-10-27 15:27:33 +01002105 ring->waiting_seqno = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002106
Chris Wilsondb53a302011-02-03 11:57:46 +00002107 trace_i915_gem_request_wait_end(ring, seqno);
Eric Anholt673a3942008-07-30 12:06:12 -07002108 }
Ben Gamariba1234d2009-09-14 17:48:47 -04002109 if (atomic_read(&dev_priv->mm.wedged))
Chris Wilson30dbf0c2010-09-25 10:19:17 +01002110 ret = -EAGAIN;
Eric Anholt673a3942008-07-30 12:06:12 -07002111
2112 if (ret && ret != -ERESTARTSYS)
Daniel Vetter8bff9172010-02-11 22:19:40 +01002113 DRM_ERROR("%s returns %d (awaiting %d at %d, next %d)\n",
Chris Wilson78501ea2010-10-27 12:18:21 +01002114 __func__, ret, seqno, ring->get_seqno(ring),
Daniel Vetter8bff9172010-02-11 22:19:40 +01002115 dev_priv->next_seqno);
Eric Anholt673a3942008-07-30 12:06:12 -07002116
2117 /* Directly dispatch request retiring. While we have the work queue
2118 * to handle this, the waiter on a request often wants an associated
2119 * buffer to have made it to the inactive list, and we would need
2120 * a separate wait queue to handle that.
2121 */
2122 if (ret == 0)
Chris Wilsondb53a302011-02-03 11:57:46 +00002123 i915_gem_retire_requests_ring(ring);
Eric Anholt673a3942008-07-30 12:06:12 -07002124
2125 return ret;
2126}
2127
Daniel Vetter48764bf2009-09-15 22:57:32 +02002128/**
Eric Anholt673a3942008-07-30 12:06:12 -07002129 * Ensures that all rendering to the object has completed and the object is
2130 * safe to unbind from the GTT or access from the CPU.
2131 */
Chris Wilson54cf91d2010-11-25 18:00:26 +00002132int
Chris Wilsonce453d82011-02-21 14:43:56 +00002133i915_gem_object_wait_rendering(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07002134{
Eric Anholt673a3942008-07-30 12:06:12 -07002135 int ret;
2136
Eric Anholte47c68e2008-11-14 13:35:19 -08002137 /* This function only exists to support waiting for existing rendering,
2138 * not for emitting required flushes.
Eric Anholt673a3942008-07-30 12:06:12 -07002139 */
Chris Wilson05394f32010-11-08 19:18:58 +00002140 BUG_ON((obj->base.write_domain & I915_GEM_GPU_DOMAINS) != 0);
Eric Anholt673a3942008-07-30 12:06:12 -07002141
2142 /* If there is rendering queued on the buffer being evicted, wait for
2143 * it.
2144 */
Chris Wilson05394f32010-11-08 19:18:58 +00002145 if (obj->active) {
Chris Wilsonce453d82011-02-21 14:43:56 +00002146 ret = i915_wait_request(obj->ring, obj->last_rendering_seqno);
Chris Wilson2cf34d72010-09-14 13:03:28 +01002147 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07002148 return ret;
2149 }
2150
2151 return 0;
2152}
2153
Chris Wilsonb5ffc9b2011-04-13 22:06:03 +01002154static void i915_gem_object_finish_gtt(struct drm_i915_gem_object *obj)
2155{
2156 u32 old_write_domain, old_read_domains;
2157
Chris Wilsonb5ffc9b2011-04-13 22:06:03 +01002158 /* Act a barrier for all accesses through the GTT */
2159 mb();
2160
2161 /* Force a pagefault for domain tracking on next user access */
2162 i915_gem_release_mmap(obj);
2163
Keith Packardb97c3d92011-06-24 21:02:59 -07002164 if ((obj->base.read_domains & I915_GEM_DOMAIN_GTT) == 0)
2165 return;
2166
Chris Wilsonb5ffc9b2011-04-13 22:06:03 +01002167 old_read_domains = obj->base.read_domains;
2168 old_write_domain = obj->base.write_domain;
2169
2170 obj->base.read_domains &= ~I915_GEM_DOMAIN_GTT;
2171 obj->base.write_domain &= ~I915_GEM_DOMAIN_GTT;
2172
2173 trace_i915_gem_object_change_domain(obj,
2174 old_read_domains,
2175 old_write_domain);
2176}
2177
Eric Anholt673a3942008-07-30 12:06:12 -07002178/**
2179 * Unbinds an object from the GTT aperture.
2180 */
Jesse Barnes0f973f22009-01-26 17:10:45 -08002181int
Chris Wilson05394f32010-11-08 19:18:58 +00002182i915_gem_object_unbind(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07002183{
Eric Anholt673a3942008-07-30 12:06:12 -07002184 int ret = 0;
2185
Chris Wilson05394f32010-11-08 19:18:58 +00002186 if (obj->gtt_space == NULL)
Eric Anholt673a3942008-07-30 12:06:12 -07002187 return 0;
2188
Chris Wilson05394f32010-11-08 19:18:58 +00002189 if (obj->pin_count != 0) {
Eric Anholt673a3942008-07-30 12:06:12 -07002190 DRM_ERROR("Attempting to unbind pinned buffer\n");
2191 return -EINVAL;
2192 }
2193
Chris Wilsona8198ee2011-04-13 22:04:09 +01002194 ret = i915_gem_object_finish_gpu(obj);
Chris Wilson8dc17752010-07-23 23:18:51 +01002195 if (ret == -ERESTARTSYS)
Eric Anholt673a3942008-07-30 12:06:12 -07002196 return ret;
Chris Wilson8dc17752010-07-23 23:18:51 +01002197 /* Continue on if we fail due to EIO, the GPU is hung so we
2198 * should be safe and we need to cleanup or else we might
2199 * cause memory corruption through use-after-free.
2200 */
Chris Wilsona8198ee2011-04-13 22:04:09 +01002201
Chris Wilsonb5ffc9b2011-04-13 22:06:03 +01002202 i915_gem_object_finish_gtt(obj);
Chris Wilsona8198ee2011-04-13 22:04:09 +01002203
2204 /* Move the object to the CPU domain to ensure that
2205 * any possible CPU writes while it's not in the GTT
2206 * are flushed when we go to remap it.
2207 */
2208 if (ret == 0)
2209 ret = i915_gem_object_set_to_cpu_domain(obj, 1);
2210 if (ret == -ERESTARTSYS)
2211 return ret;
Chris Wilson812ed4922010-09-30 15:08:57 +01002212 if (ret) {
Chris Wilsona8198ee2011-04-13 22:04:09 +01002213 /* In the event of a disaster, abandon all caches and
2214 * hope for the best.
2215 */
Chris Wilson812ed4922010-09-30 15:08:57 +01002216 i915_gem_clflush_object(obj);
Chris Wilson05394f32010-11-08 19:18:58 +00002217 obj->base.read_domains = obj->base.write_domain = I915_GEM_DOMAIN_CPU;
Chris Wilson812ed4922010-09-30 15:08:57 +01002218 }
Eric Anholt673a3942008-07-30 12:06:12 -07002219
Daniel Vetter96b47b62009-12-15 17:50:00 +01002220 /* release the fence reg _after_ flushing */
Chris Wilsond9e86c02010-11-10 16:40:20 +00002221 ret = i915_gem_object_put_fence(obj);
2222 if (ret == -ERESTARTSYS)
2223 return ret;
Daniel Vetter96b47b62009-12-15 17:50:00 +01002224
Chris Wilsondb53a302011-02-03 11:57:46 +00002225 trace_i915_gem_object_unbind(obj);
2226
Daniel Vetter7c2e6fd2010-11-06 10:10:47 +01002227 i915_gem_gtt_unbind_object(obj);
Chris Wilsone5281cc2010-10-28 13:45:36 +01002228 i915_gem_object_put_pages_gtt(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07002229
Chris Wilson6299f992010-11-24 12:23:44 +00002230 list_del_init(&obj->gtt_list);
Chris Wilson05394f32010-11-08 19:18:58 +00002231 list_del_init(&obj->mm_list);
Daniel Vetter75e9e912010-11-04 17:11:09 +01002232 /* Avoid an unnecessary call to unbind on rebind. */
Chris Wilson05394f32010-11-08 19:18:58 +00002233 obj->map_and_fenceable = true;
Eric Anholt673a3942008-07-30 12:06:12 -07002234
Chris Wilson05394f32010-11-08 19:18:58 +00002235 drm_mm_put_block(obj->gtt_space);
2236 obj->gtt_space = NULL;
2237 obj->gtt_offset = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07002238
Chris Wilson05394f32010-11-08 19:18:58 +00002239 if (i915_gem_object_is_purgeable(obj))
Chris Wilson963b4832009-09-20 23:03:54 +01002240 i915_gem_object_truncate(obj);
2241
Chris Wilson8dc17752010-07-23 23:18:51 +01002242 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07002243}
2244
Chris Wilson88241782011-01-07 17:09:48 +00002245int
Chris Wilsondb53a302011-02-03 11:57:46 +00002246i915_gem_flush_ring(struct intel_ring_buffer *ring,
Chris Wilson54cf91d2010-11-25 18:00:26 +00002247 uint32_t invalidate_domains,
2248 uint32_t flush_domains)
2249{
Chris Wilson88241782011-01-07 17:09:48 +00002250 int ret;
2251
Chris Wilson36d527d2011-03-19 22:26:49 +00002252 if (((invalidate_domains | flush_domains) & I915_GEM_GPU_DOMAINS) == 0)
2253 return 0;
2254
Chris Wilsondb53a302011-02-03 11:57:46 +00002255 trace_i915_gem_ring_flush(ring, invalidate_domains, flush_domains);
2256
Chris Wilson88241782011-01-07 17:09:48 +00002257 ret = ring->flush(ring, invalidate_domains, flush_domains);
2258 if (ret)
2259 return ret;
2260
Chris Wilson36d527d2011-03-19 22:26:49 +00002261 if (flush_domains & I915_GEM_GPU_DOMAINS)
2262 i915_gem_process_flushing_list(ring, flush_domains);
2263
Chris Wilson88241782011-01-07 17:09:48 +00002264 return 0;
Chris Wilson54cf91d2010-11-25 18:00:26 +00002265}
2266
Chris Wilsondb53a302011-02-03 11:57:46 +00002267static int i915_ring_idle(struct intel_ring_buffer *ring)
Chris Wilsona56ba562010-09-28 10:07:56 +01002268{
Chris Wilson88241782011-01-07 17:09:48 +00002269 int ret;
2270
Chris Wilson395b70b2010-10-28 21:28:46 +01002271 if (list_empty(&ring->gpu_write_list) && list_empty(&ring->active_list))
Chris Wilson64193402010-10-24 12:38:05 +01002272 return 0;
2273
Chris Wilson88241782011-01-07 17:09:48 +00002274 if (!list_empty(&ring->gpu_write_list)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002275 ret = i915_gem_flush_ring(ring,
Chris Wilson0ac74c62010-12-06 14:36:02 +00002276 I915_GEM_GPU_DOMAINS, I915_GEM_GPU_DOMAINS);
Chris Wilson88241782011-01-07 17:09:48 +00002277 if (ret)
2278 return ret;
2279 }
2280
Chris Wilsonce453d82011-02-21 14:43:56 +00002281 return i915_wait_request(ring, i915_gem_next_request_seqno(ring));
Chris Wilsona56ba562010-09-28 10:07:56 +01002282}
2283
Chris Wilsonb47eb4a2010-08-07 11:01:23 +01002284int
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002285i915_gpu_idle(struct drm_device *dev)
2286{
2287 drm_i915_private_t *dev_priv = dev->dev_private;
2288 bool lists_empty;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00002289 int ret, i;
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002290
Zou Nan haid1b851f2010-05-21 09:08:57 +08002291 lists_empty = (list_empty(&dev_priv->mm.flushing_list) &&
Chris Wilson395b70b2010-10-28 21:28:46 +01002292 list_empty(&dev_priv->mm.active_list));
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002293 if (lists_empty)
2294 return 0;
2295
2296 /* Flush everything onto the inactive list. */
Chris Wilson1ec14ad2010-12-04 11:30:53 +00002297 for (i = 0; i < I915_NUM_RINGS; i++) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002298 ret = i915_ring_idle(&dev_priv->ring[i]);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00002299 if (ret)
2300 return ret;
2301 }
Zou Nan haid1b851f2010-05-21 09:08:57 +08002302
Daniel Vetter8a1a49f2010-02-11 22:29:04 +01002303 return 0;
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002304}
2305
Daniel Vetterc6642782010-11-12 13:46:18 +00002306static int sandybridge_write_fence_reg(struct drm_i915_gem_object *obj,
2307 struct intel_ring_buffer *pipelined)
Eric Anholt4e901fd2009-10-26 16:44:17 -07002308{
Chris Wilson05394f32010-11-08 19:18:58 +00002309 struct drm_device *dev = obj->base.dev;
Eric Anholt4e901fd2009-10-26 16:44:17 -07002310 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002311 u32 size = obj->gtt_space->size;
2312 int regnum = obj->fence_reg;
Eric Anholt4e901fd2009-10-26 16:44:17 -07002313 uint64_t val;
2314
Chris Wilson05394f32010-11-08 19:18:58 +00002315 val = (uint64_t)((obj->gtt_offset + size - 4096) &
Daniel Vetterc6642782010-11-12 13:46:18 +00002316 0xfffff000) << 32;
Chris Wilson05394f32010-11-08 19:18:58 +00002317 val |= obj->gtt_offset & 0xfffff000;
2318 val |= (uint64_t)((obj->stride / 128) - 1) <<
Eric Anholt4e901fd2009-10-26 16:44:17 -07002319 SANDYBRIDGE_FENCE_PITCH_SHIFT;
2320
Chris Wilson05394f32010-11-08 19:18:58 +00002321 if (obj->tiling_mode == I915_TILING_Y)
Eric Anholt4e901fd2009-10-26 16:44:17 -07002322 val |= 1 << I965_FENCE_TILING_Y_SHIFT;
2323 val |= I965_FENCE_REG_VALID;
2324
Daniel Vetterc6642782010-11-12 13:46:18 +00002325 if (pipelined) {
2326 int ret = intel_ring_begin(pipelined, 6);
2327 if (ret)
2328 return ret;
2329
2330 intel_ring_emit(pipelined, MI_NOOP);
2331 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(2));
2332 intel_ring_emit(pipelined, FENCE_REG_SANDYBRIDGE_0 + regnum*8);
2333 intel_ring_emit(pipelined, (u32)val);
2334 intel_ring_emit(pipelined, FENCE_REG_SANDYBRIDGE_0 + regnum*8 + 4);
2335 intel_ring_emit(pipelined, (u32)(val >> 32));
2336 intel_ring_advance(pipelined);
2337 } else
2338 I915_WRITE64(FENCE_REG_SANDYBRIDGE_0 + regnum * 8, val);
2339
2340 return 0;
Eric Anholt4e901fd2009-10-26 16:44:17 -07002341}
2342
Daniel Vetterc6642782010-11-12 13:46:18 +00002343static int i965_write_fence_reg(struct drm_i915_gem_object *obj,
2344 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002345{
Chris Wilson05394f32010-11-08 19:18:58 +00002346 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002347 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002348 u32 size = obj->gtt_space->size;
2349 int regnum = obj->fence_reg;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002350 uint64_t val;
2351
Chris Wilson05394f32010-11-08 19:18:58 +00002352 val = (uint64_t)((obj->gtt_offset + size - 4096) &
Jesse Barnesde151cf2008-11-12 10:03:55 -08002353 0xfffff000) << 32;
Chris Wilson05394f32010-11-08 19:18:58 +00002354 val |= obj->gtt_offset & 0xfffff000;
2355 val |= ((obj->stride / 128) - 1) << I965_FENCE_PITCH_SHIFT;
2356 if (obj->tiling_mode == I915_TILING_Y)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002357 val |= 1 << I965_FENCE_TILING_Y_SHIFT;
2358 val |= I965_FENCE_REG_VALID;
2359
Daniel Vetterc6642782010-11-12 13:46:18 +00002360 if (pipelined) {
2361 int ret = intel_ring_begin(pipelined, 6);
2362 if (ret)
2363 return ret;
2364
2365 intel_ring_emit(pipelined, MI_NOOP);
2366 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(2));
2367 intel_ring_emit(pipelined, FENCE_REG_965_0 + regnum*8);
2368 intel_ring_emit(pipelined, (u32)val);
2369 intel_ring_emit(pipelined, FENCE_REG_965_0 + regnum*8 + 4);
2370 intel_ring_emit(pipelined, (u32)(val >> 32));
2371 intel_ring_advance(pipelined);
2372 } else
2373 I915_WRITE64(FENCE_REG_965_0 + regnum * 8, val);
2374
2375 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002376}
2377
Daniel Vetterc6642782010-11-12 13:46:18 +00002378static int i915_write_fence_reg(struct drm_i915_gem_object *obj,
2379 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002380{
Chris Wilson05394f32010-11-08 19:18:58 +00002381 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002382 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002383 u32 size = obj->gtt_space->size;
Daniel Vetterc6642782010-11-12 13:46:18 +00002384 u32 fence_reg, val, pitch_val;
Jesse Barnes0f973f22009-01-26 17:10:45 -08002385 int tile_width;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002386
Daniel Vetterc6642782010-11-12 13:46:18 +00002387 if (WARN((obj->gtt_offset & ~I915_FENCE_START_MASK) ||
2388 (size & -size) != size ||
2389 (obj->gtt_offset & (size - 1)),
2390 "object 0x%08x [fenceable? %d] not 1M or pot-size (0x%08x) aligned\n",
2391 obj->gtt_offset, obj->map_and_fenceable, size))
2392 return -EINVAL;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002393
Daniel Vetterc6642782010-11-12 13:46:18 +00002394 if (obj->tiling_mode == I915_TILING_Y && HAS_128_BYTE_Y_TILING(dev))
Jesse Barnes0f973f22009-01-26 17:10:45 -08002395 tile_width = 128;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002396 else
Jesse Barnes0f973f22009-01-26 17:10:45 -08002397 tile_width = 512;
2398
2399 /* Note: pitch better be a power of two tile widths */
Chris Wilson05394f32010-11-08 19:18:58 +00002400 pitch_val = obj->stride / tile_width;
Jesse Barnes0f973f22009-01-26 17:10:45 -08002401 pitch_val = ffs(pitch_val) - 1;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002402
Chris Wilson05394f32010-11-08 19:18:58 +00002403 val = obj->gtt_offset;
2404 if (obj->tiling_mode == I915_TILING_Y)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002405 val |= 1 << I830_FENCE_TILING_Y_SHIFT;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002406 val |= I915_FENCE_SIZE_BITS(size);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002407 val |= pitch_val << I830_FENCE_PITCH_SHIFT;
2408 val |= I830_FENCE_REG_VALID;
2409
Chris Wilson05394f32010-11-08 19:18:58 +00002410 fence_reg = obj->fence_reg;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002411 if (fence_reg < 8)
2412 fence_reg = FENCE_REG_830_0 + fence_reg * 4;
Eric Anholtdc529a42009-03-10 22:34:49 -07002413 else
Chris Wilsona00b10c2010-09-24 21:15:47 +01002414 fence_reg = FENCE_REG_945_8 + (fence_reg - 8) * 4;
Daniel Vetterc6642782010-11-12 13:46:18 +00002415
2416 if (pipelined) {
2417 int ret = intel_ring_begin(pipelined, 4);
2418 if (ret)
2419 return ret;
2420
2421 intel_ring_emit(pipelined, MI_NOOP);
2422 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(1));
2423 intel_ring_emit(pipelined, fence_reg);
2424 intel_ring_emit(pipelined, val);
2425 intel_ring_advance(pipelined);
2426 } else
2427 I915_WRITE(fence_reg, val);
2428
2429 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002430}
2431
Daniel Vetterc6642782010-11-12 13:46:18 +00002432static int i830_write_fence_reg(struct drm_i915_gem_object *obj,
2433 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002434{
Chris Wilson05394f32010-11-08 19:18:58 +00002435 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002436 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002437 u32 size = obj->gtt_space->size;
2438 int regnum = obj->fence_reg;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002439 uint32_t val;
2440 uint32_t pitch_val;
2441
Daniel Vetterc6642782010-11-12 13:46:18 +00002442 if (WARN((obj->gtt_offset & ~I830_FENCE_START_MASK) ||
2443 (size & -size) != size ||
2444 (obj->gtt_offset & (size - 1)),
2445 "object 0x%08x not 512K or pot-size 0x%08x aligned\n",
2446 obj->gtt_offset, size))
2447 return -EINVAL;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002448
Chris Wilson05394f32010-11-08 19:18:58 +00002449 pitch_val = obj->stride / 128;
Eric Anholte76a16d2009-05-26 17:44:56 -07002450 pitch_val = ffs(pitch_val) - 1;
Eric Anholte76a16d2009-05-26 17:44:56 -07002451
Chris Wilson05394f32010-11-08 19:18:58 +00002452 val = obj->gtt_offset;
2453 if (obj->tiling_mode == I915_TILING_Y)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002454 val |= 1 << I830_FENCE_TILING_Y_SHIFT;
Daniel Vetterc6642782010-11-12 13:46:18 +00002455 val |= I830_FENCE_SIZE_BITS(size);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002456 val |= pitch_val << I830_FENCE_PITCH_SHIFT;
2457 val |= I830_FENCE_REG_VALID;
2458
Daniel Vetterc6642782010-11-12 13:46:18 +00002459 if (pipelined) {
2460 int ret = intel_ring_begin(pipelined, 4);
2461 if (ret)
2462 return ret;
2463
2464 intel_ring_emit(pipelined, MI_NOOP);
2465 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(1));
2466 intel_ring_emit(pipelined, FENCE_REG_830_0 + regnum*4);
2467 intel_ring_emit(pipelined, val);
2468 intel_ring_advance(pipelined);
2469 } else
2470 I915_WRITE(FENCE_REG_830_0 + regnum * 4, val);
2471
2472 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002473}
2474
Chris Wilsond9e86c02010-11-10 16:40:20 +00002475static bool ring_passed_seqno(struct intel_ring_buffer *ring, u32 seqno)
2476{
2477 return i915_seqno_passed(ring->get_seqno(ring), seqno);
2478}
2479
2480static int
2481i915_gem_object_flush_fence(struct drm_i915_gem_object *obj,
Chris Wilsonce453d82011-02-21 14:43:56 +00002482 struct intel_ring_buffer *pipelined)
Chris Wilsond9e86c02010-11-10 16:40:20 +00002483{
2484 int ret;
2485
2486 if (obj->fenced_gpu_access) {
Chris Wilson88241782011-01-07 17:09:48 +00002487 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002488 ret = i915_gem_flush_ring(obj->last_fenced_ring,
Chris Wilson88241782011-01-07 17:09:48 +00002489 0, obj->base.write_domain);
2490 if (ret)
2491 return ret;
2492 }
Chris Wilsond9e86c02010-11-10 16:40:20 +00002493
2494 obj->fenced_gpu_access = false;
2495 }
2496
2497 if (obj->last_fenced_seqno && pipelined != obj->last_fenced_ring) {
2498 if (!ring_passed_seqno(obj->last_fenced_ring,
2499 obj->last_fenced_seqno)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002500 ret = i915_wait_request(obj->last_fenced_ring,
Chris Wilsonce453d82011-02-21 14:43:56 +00002501 obj->last_fenced_seqno);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002502 if (ret)
2503 return ret;
2504 }
2505
2506 obj->last_fenced_seqno = 0;
2507 obj->last_fenced_ring = NULL;
2508 }
2509
Chris Wilson63256ec2011-01-04 18:42:07 +00002510 /* Ensure that all CPU reads are completed before installing a fence
2511 * and all writes before removing the fence.
2512 */
2513 if (obj->base.read_domains & I915_GEM_DOMAIN_GTT)
2514 mb();
2515
Chris Wilsond9e86c02010-11-10 16:40:20 +00002516 return 0;
2517}
2518
2519int
2520i915_gem_object_put_fence(struct drm_i915_gem_object *obj)
2521{
2522 int ret;
2523
2524 if (obj->tiling_mode)
2525 i915_gem_release_mmap(obj);
2526
Chris Wilsonce453d82011-02-21 14:43:56 +00002527 ret = i915_gem_object_flush_fence(obj, NULL);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002528 if (ret)
2529 return ret;
2530
2531 if (obj->fence_reg != I915_FENCE_REG_NONE) {
2532 struct drm_i915_private *dev_priv = obj->base.dev->dev_private;
2533 i915_gem_clear_fence_reg(obj->base.dev,
2534 &dev_priv->fence_regs[obj->fence_reg]);
2535
2536 obj->fence_reg = I915_FENCE_REG_NONE;
2537 }
2538
2539 return 0;
2540}
2541
2542static struct drm_i915_fence_reg *
2543i915_find_fence_reg(struct drm_device *dev,
2544 struct intel_ring_buffer *pipelined)
Daniel Vetterae3db242010-02-19 11:51:58 +01002545{
Daniel Vetterae3db242010-02-19 11:51:58 +01002546 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002547 struct drm_i915_fence_reg *reg, *first, *avail;
2548 int i;
Daniel Vetterae3db242010-02-19 11:51:58 +01002549
2550 /* First try to find a free reg */
Chris Wilsond9e86c02010-11-10 16:40:20 +00002551 avail = NULL;
Daniel Vetterae3db242010-02-19 11:51:58 +01002552 for (i = dev_priv->fence_reg_start; i < dev_priv->num_fence_regs; i++) {
2553 reg = &dev_priv->fence_regs[i];
2554 if (!reg->obj)
Chris Wilsond9e86c02010-11-10 16:40:20 +00002555 return reg;
Daniel Vetterae3db242010-02-19 11:51:58 +01002556
Chris Wilson05394f32010-11-08 19:18:58 +00002557 if (!reg->obj->pin_count)
Chris Wilsond9e86c02010-11-10 16:40:20 +00002558 avail = reg;
Daniel Vetterae3db242010-02-19 11:51:58 +01002559 }
2560
Chris Wilsond9e86c02010-11-10 16:40:20 +00002561 if (avail == NULL)
2562 return NULL;
Daniel Vetterae3db242010-02-19 11:51:58 +01002563
2564 /* None available, try to steal one or wait for a user to finish */
Chris Wilsond9e86c02010-11-10 16:40:20 +00002565 avail = first = NULL;
2566 list_for_each_entry(reg, &dev_priv->mm.fence_list, lru_list) {
2567 if (reg->obj->pin_count)
Daniel Vetterae3db242010-02-19 11:51:58 +01002568 continue;
2569
Chris Wilsond9e86c02010-11-10 16:40:20 +00002570 if (first == NULL)
2571 first = reg;
2572
2573 if (!pipelined ||
2574 !reg->obj->last_fenced_ring ||
2575 reg->obj->last_fenced_ring == pipelined) {
2576 avail = reg;
2577 break;
2578 }
Daniel Vetterae3db242010-02-19 11:51:58 +01002579 }
2580
Chris Wilsond9e86c02010-11-10 16:40:20 +00002581 if (avail == NULL)
2582 avail = first;
Daniel Vetterae3db242010-02-19 11:51:58 +01002583
Chris Wilsona00b10c2010-09-24 21:15:47 +01002584 return avail;
Daniel Vetterae3db242010-02-19 11:51:58 +01002585}
2586
Jesse Barnesde151cf2008-11-12 10:03:55 -08002587/**
Chris Wilsond9e86c02010-11-10 16:40:20 +00002588 * i915_gem_object_get_fence - set up a fence reg for an object
Jesse Barnesde151cf2008-11-12 10:03:55 -08002589 * @obj: object to map through a fence reg
Chris Wilsond9e86c02010-11-10 16:40:20 +00002590 * @pipelined: ring on which to queue the change, or NULL for CPU access
2591 * @interruptible: must we wait uninterruptibly for the register to retire?
Jesse Barnesde151cf2008-11-12 10:03:55 -08002592 *
2593 * When mapping objects through the GTT, userspace wants to be able to write
2594 * to them without having to worry about swizzling if the object is tiled.
2595 *
2596 * This function walks the fence regs looking for a free one for @obj,
2597 * stealing one if it can't find any.
2598 *
2599 * It then sets up the reg based on the object's properties: address, pitch
2600 * and tiling format.
2601 */
Chris Wilson8c4b8c32009-06-17 22:08:52 +01002602int
Chris Wilsond9e86c02010-11-10 16:40:20 +00002603i915_gem_object_get_fence(struct drm_i915_gem_object *obj,
Chris Wilsonce453d82011-02-21 14:43:56 +00002604 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002605{
Chris Wilson05394f32010-11-08 19:18:58 +00002606 struct drm_device *dev = obj->base.dev;
Jesse Barnes79e53942008-11-07 14:24:08 -08002607 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002608 struct drm_i915_fence_reg *reg;
Daniel Vetterae3db242010-02-19 11:51:58 +01002609 int ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002610
Chris Wilson6bda10d2010-12-05 21:04:18 +00002611 /* XXX disable pipelining. There are bugs. Shocking. */
2612 pipelined = NULL;
2613
Chris Wilsond9e86c02010-11-10 16:40:20 +00002614 /* Just update our place in the LRU if our fence is getting reused. */
Chris Wilson05394f32010-11-08 19:18:58 +00002615 if (obj->fence_reg != I915_FENCE_REG_NONE) {
2616 reg = &dev_priv->fence_regs[obj->fence_reg];
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002617 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002618
Chris Wilson29c5a582011-03-17 15:23:22 +00002619 if (obj->tiling_changed) {
2620 ret = i915_gem_object_flush_fence(obj, pipelined);
2621 if (ret)
2622 return ret;
2623
2624 if (!obj->fenced_gpu_access && !obj->last_fenced_seqno)
2625 pipelined = NULL;
2626
2627 if (pipelined) {
2628 reg->setup_seqno =
2629 i915_gem_next_request_seqno(pipelined);
2630 obj->last_fenced_seqno = reg->setup_seqno;
2631 obj->last_fenced_ring = pipelined;
2632 }
2633
2634 goto update;
2635 }
Chris Wilsond9e86c02010-11-10 16:40:20 +00002636
2637 if (!pipelined) {
2638 if (reg->setup_seqno) {
2639 if (!ring_passed_seqno(obj->last_fenced_ring,
2640 reg->setup_seqno)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002641 ret = i915_wait_request(obj->last_fenced_ring,
Chris Wilsonce453d82011-02-21 14:43:56 +00002642 reg->setup_seqno);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002643 if (ret)
2644 return ret;
2645 }
2646
2647 reg->setup_seqno = 0;
2648 }
2649 } else if (obj->last_fenced_ring &&
2650 obj->last_fenced_ring != pipelined) {
Chris Wilsonce453d82011-02-21 14:43:56 +00002651 ret = i915_gem_object_flush_fence(obj, pipelined);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002652 if (ret)
2653 return ret;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002654 }
2655
Eric Anholta09ba7f2009-08-29 12:49:51 -07002656 return 0;
2657 }
2658
Chris Wilsond9e86c02010-11-10 16:40:20 +00002659 reg = i915_find_fence_reg(dev, pipelined);
2660 if (reg == NULL)
2661 return -ENOSPC;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002662
Chris Wilsonce453d82011-02-21 14:43:56 +00002663 ret = i915_gem_object_flush_fence(obj, pipelined);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002664 if (ret)
Daniel Vetterae3db242010-02-19 11:51:58 +01002665 return ret;
Chris Wilsonfc7170b2009-02-11 14:26:46 +00002666
Chris Wilsond9e86c02010-11-10 16:40:20 +00002667 if (reg->obj) {
2668 struct drm_i915_gem_object *old = reg->obj;
2669
2670 drm_gem_object_reference(&old->base);
2671
2672 if (old->tiling_mode)
2673 i915_gem_release_mmap(old);
2674
Chris Wilsonce453d82011-02-21 14:43:56 +00002675 ret = i915_gem_object_flush_fence(old, pipelined);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002676 if (ret) {
2677 drm_gem_object_unreference(&old->base);
2678 return ret;
2679 }
2680
2681 if (old->last_fenced_seqno == 0 && obj->last_fenced_seqno == 0)
2682 pipelined = NULL;
2683
2684 old->fence_reg = I915_FENCE_REG_NONE;
2685 old->last_fenced_ring = pipelined;
2686 old->last_fenced_seqno =
Chris Wilsondb53a302011-02-03 11:57:46 +00002687 pipelined ? i915_gem_next_request_seqno(pipelined) : 0;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002688
2689 drm_gem_object_unreference(&old->base);
2690 } else if (obj->last_fenced_seqno == 0)
2691 pipelined = NULL;
Eric Anholta09ba7f2009-08-29 12:49:51 -07002692
Jesse Barnesde151cf2008-11-12 10:03:55 -08002693 reg->obj = obj;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002694 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
2695 obj->fence_reg = reg - dev_priv->fence_regs;
2696 obj->last_fenced_ring = pipelined;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002697
Chris Wilsond9e86c02010-11-10 16:40:20 +00002698 reg->setup_seqno =
Chris Wilsondb53a302011-02-03 11:57:46 +00002699 pipelined ? i915_gem_next_request_seqno(pipelined) : 0;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002700 obj->last_fenced_seqno = reg->setup_seqno;
2701
2702update:
2703 obj->tiling_changed = false;
Chris Wilsone259bef2010-09-17 00:32:02 +01002704 switch (INTEL_INFO(dev)->gen) {
Eric Anholt25aebfc32011-05-06 13:55:53 -07002705 case 7:
Chris Wilsone259bef2010-09-17 00:32:02 +01002706 case 6:
Daniel Vetterc6642782010-11-12 13:46:18 +00002707 ret = sandybridge_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002708 break;
2709 case 5:
2710 case 4:
Daniel Vetterc6642782010-11-12 13:46:18 +00002711 ret = i965_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002712 break;
2713 case 3:
Daniel Vetterc6642782010-11-12 13:46:18 +00002714 ret = i915_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002715 break;
2716 case 2:
Daniel Vetterc6642782010-11-12 13:46:18 +00002717 ret = i830_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002718 break;
2719 }
Eric Anholtd9ddcb92009-01-27 10:33:49 -08002720
Daniel Vetterc6642782010-11-12 13:46:18 +00002721 return ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002722}
2723
2724/**
2725 * i915_gem_clear_fence_reg - clear out fence register info
2726 * @obj: object to clear
2727 *
2728 * Zeroes out the fence register itself and clears out the associated
Chris Wilson05394f32010-11-08 19:18:58 +00002729 * data structures in dev_priv and obj.
Jesse Barnesde151cf2008-11-12 10:03:55 -08002730 */
2731static void
Chris Wilsond9e86c02010-11-10 16:40:20 +00002732i915_gem_clear_fence_reg(struct drm_device *dev,
2733 struct drm_i915_fence_reg *reg)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002734{
Jesse Barnes79e53942008-11-07 14:24:08 -08002735 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002736 uint32_t fence_reg = reg - dev_priv->fence_regs;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002737
Chris Wilsone259bef2010-09-17 00:32:02 +01002738 switch (INTEL_INFO(dev)->gen) {
Eric Anholt25aebfc32011-05-06 13:55:53 -07002739 case 7:
Chris Wilsone259bef2010-09-17 00:32:02 +01002740 case 6:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002741 I915_WRITE64(FENCE_REG_SANDYBRIDGE_0 + fence_reg*8, 0);
Chris Wilsone259bef2010-09-17 00:32:02 +01002742 break;
2743 case 5:
2744 case 4:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002745 I915_WRITE64(FENCE_REG_965_0 + fence_reg*8, 0);
Chris Wilsone259bef2010-09-17 00:32:02 +01002746 break;
2747 case 3:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002748 if (fence_reg >= 8)
2749 fence_reg = FENCE_REG_945_8 + (fence_reg - 8) * 4;
Eric Anholtdc529a42009-03-10 22:34:49 -07002750 else
Chris Wilsone259bef2010-09-17 00:32:02 +01002751 case 2:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002752 fence_reg = FENCE_REG_830_0 + fence_reg * 4;
Eric Anholtdc529a42009-03-10 22:34:49 -07002753
2754 I915_WRITE(fence_reg, 0);
Chris Wilsone259bef2010-09-17 00:32:02 +01002755 break;
Eric Anholtdc529a42009-03-10 22:34:49 -07002756 }
Jesse Barnesde151cf2008-11-12 10:03:55 -08002757
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002758 list_del_init(&reg->lru_list);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002759 reg->obj = NULL;
2760 reg->setup_seqno = 0;
Chris Wilson52dc7d32009-06-06 09:46:01 +01002761}
2762
2763/**
Eric Anholt673a3942008-07-30 12:06:12 -07002764 * Finds free space in the GTT aperture and binds the object there.
2765 */
2766static int
Chris Wilson05394f32010-11-08 19:18:58 +00002767i915_gem_object_bind_to_gtt(struct drm_i915_gem_object *obj,
Daniel Vetter920afa72010-09-16 17:54:23 +02002768 unsigned alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01002769 bool map_and_fenceable)
Eric Anholt673a3942008-07-30 12:06:12 -07002770{
Chris Wilson05394f32010-11-08 19:18:58 +00002771 struct drm_device *dev = obj->base.dev;
Eric Anholt673a3942008-07-30 12:06:12 -07002772 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07002773 struct drm_mm_node *free_space;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002774 gfp_t gfpmask = __GFP_NORETRY | __GFP_NOWARN;
Daniel Vetter5e783302010-11-14 22:32:36 +01002775 u32 size, fence_size, fence_alignment, unfenced_alignment;
Daniel Vetter75e9e912010-11-04 17:11:09 +01002776 bool mappable, fenceable;
Chris Wilson07f73f62009-09-14 16:50:30 +01002777 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07002778
Chris Wilson05394f32010-11-08 19:18:58 +00002779 if (obj->madv != I915_MADV_WILLNEED) {
Chris Wilson3ef94da2009-09-14 16:50:29 +01002780 DRM_ERROR("Attempting to bind a purgeable object\n");
2781 return -EINVAL;
2782 }
2783
Chris Wilson05394f32010-11-08 19:18:58 +00002784 fence_size = i915_gem_get_gtt_size(obj);
2785 fence_alignment = i915_gem_get_gtt_alignment(obj);
2786 unfenced_alignment = i915_gem_get_unfenced_gtt_alignment(obj);
Chris Wilsona00b10c2010-09-24 21:15:47 +01002787
Eric Anholt673a3942008-07-30 12:06:12 -07002788 if (alignment == 0)
Daniel Vetter5e783302010-11-14 22:32:36 +01002789 alignment = map_and_fenceable ? fence_alignment :
2790 unfenced_alignment;
Daniel Vetter75e9e912010-11-04 17:11:09 +01002791 if (map_and_fenceable && alignment & (fence_alignment - 1)) {
Eric Anholt673a3942008-07-30 12:06:12 -07002792 DRM_ERROR("Invalid object alignment requested %u\n", alignment);
2793 return -EINVAL;
2794 }
2795
Chris Wilson05394f32010-11-08 19:18:58 +00002796 size = map_and_fenceable ? fence_size : obj->base.size;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002797
Chris Wilson654fc602010-05-27 13:18:21 +01002798 /* If the object is bigger than the entire aperture, reject it early
2799 * before evicting everything in a vain attempt to find space.
2800 */
Chris Wilson05394f32010-11-08 19:18:58 +00002801 if (obj->base.size >
Daniel Vetter75e9e912010-11-04 17:11:09 +01002802 (map_and_fenceable ? dev_priv->mm.gtt_mappable_end : dev_priv->mm.gtt_total)) {
Chris Wilson654fc602010-05-27 13:18:21 +01002803 DRM_ERROR("Attempting to bind an object larger than the aperture\n");
2804 return -E2BIG;
2805 }
2806
Eric Anholt673a3942008-07-30 12:06:12 -07002807 search_free:
Daniel Vetter75e9e912010-11-04 17:11:09 +01002808 if (map_and_fenceable)
Daniel Vetter920afa72010-09-16 17:54:23 +02002809 free_space =
2810 drm_mm_search_free_in_range(&dev_priv->mm.gtt_space,
Chris Wilsona00b10c2010-09-24 21:15:47 +01002811 size, alignment, 0,
Daniel Vetter920afa72010-09-16 17:54:23 +02002812 dev_priv->mm.gtt_mappable_end,
2813 0);
2814 else
2815 free_space = drm_mm_search_free(&dev_priv->mm.gtt_space,
Chris Wilsona00b10c2010-09-24 21:15:47 +01002816 size, alignment, 0);
Daniel Vetter920afa72010-09-16 17:54:23 +02002817
2818 if (free_space != NULL) {
Daniel Vetter75e9e912010-11-04 17:11:09 +01002819 if (map_and_fenceable)
Chris Wilson05394f32010-11-08 19:18:58 +00002820 obj->gtt_space =
Daniel Vetter920afa72010-09-16 17:54:23 +02002821 drm_mm_get_block_range_generic(free_space,
Chris Wilsona00b10c2010-09-24 21:15:47 +01002822 size, alignment, 0,
Daniel Vetter920afa72010-09-16 17:54:23 +02002823 dev_priv->mm.gtt_mappable_end,
2824 0);
2825 else
Chris Wilson05394f32010-11-08 19:18:58 +00002826 obj->gtt_space =
Chris Wilsona00b10c2010-09-24 21:15:47 +01002827 drm_mm_get_block(free_space, size, alignment);
Daniel Vetter920afa72010-09-16 17:54:23 +02002828 }
Chris Wilson05394f32010-11-08 19:18:58 +00002829 if (obj->gtt_space == NULL) {
Eric Anholt673a3942008-07-30 12:06:12 -07002830 /* If the gtt is empty and we're still having trouble
2831 * fitting our object in, we're out of memory.
2832 */
Daniel Vetter75e9e912010-11-04 17:11:09 +01002833 ret = i915_gem_evict_something(dev, size, alignment,
2834 map_and_fenceable);
Chris Wilson97311292009-09-21 00:22:34 +01002835 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07002836 return ret;
Chris Wilson97311292009-09-21 00:22:34 +01002837
Eric Anholt673a3942008-07-30 12:06:12 -07002838 goto search_free;
2839 }
2840
Chris Wilsone5281cc2010-10-28 13:45:36 +01002841 ret = i915_gem_object_get_pages_gtt(obj, gfpmask);
Eric Anholt673a3942008-07-30 12:06:12 -07002842 if (ret) {
Chris Wilson05394f32010-11-08 19:18:58 +00002843 drm_mm_put_block(obj->gtt_space);
2844 obj->gtt_space = NULL;
Chris Wilson07f73f62009-09-14 16:50:30 +01002845
2846 if (ret == -ENOMEM) {
Chris Wilson809b6332011-01-10 17:33:15 +00002847 /* first try to reclaim some memory by clearing the GTT */
2848 ret = i915_gem_evict_everything(dev, false);
Chris Wilson07f73f62009-09-14 16:50:30 +01002849 if (ret) {
Chris Wilson07f73f62009-09-14 16:50:30 +01002850 /* now try to shrink everyone else */
Chris Wilson4bdadb92010-01-27 13:36:32 +00002851 if (gfpmask) {
2852 gfpmask = 0;
2853 goto search_free;
Chris Wilson07f73f62009-09-14 16:50:30 +01002854 }
2855
Chris Wilson809b6332011-01-10 17:33:15 +00002856 return -ENOMEM;
Chris Wilson07f73f62009-09-14 16:50:30 +01002857 }
2858
2859 goto search_free;
2860 }
2861
Eric Anholt673a3942008-07-30 12:06:12 -07002862 return ret;
2863 }
2864
Daniel Vetter7c2e6fd2010-11-06 10:10:47 +01002865 ret = i915_gem_gtt_bind_object(obj);
2866 if (ret) {
Chris Wilsone5281cc2010-10-28 13:45:36 +01002867 i915_gem_object_put_pages_gtt(obj);
Chris Wilson05394f32010-11-08 19:18:58 +00002868 drm_mm_put_block(obj->gtt_space);
2869 obj->gtt_space = NULL;
Chris Wilson07f73f62009-09-14 16:50:30 +01002870
Chris Wilson809b6332011-01-10 17:33:15 +00002871 if (i915_gem_evict_everything(dev, false))
Chris Wilson07f73f62009-09-14 16:50:30 +01002872 return ret;
Chris Wilson07f73f62009-09-14 16:50:30 +01002873
2874 goto search_free;
Eric Anholt673a3942008-07-30 12:06:12 -07002875 }
Eric Anholt673a3942008-07-30 12:06:12 -07002876
Chris Wilson6299f992010-11-24 12:23:44 +00002877 list_add_tail(&obj->gtt_list, &dev_priv->mm.gtt_list);
Chris Wilson05394f32010-11-08 19:18:58 +00002878 list_add_tail(&obj->mm_list, &dev_priv->mm.inactive_list);
Chris Wilsonbf1a1092010-08-07 11:01:20 +01002879
Eric Anholt673a3942008-07-30 12:06:12 -07002880 /* Assert that the object is not currently in any GPU domain. As it
2881 * wasn't in the GTT, there shouldn't be any way it could have been in
2882 * a GPU cache
2883 */
Chris Wilson05394f32010-11-08 19:18:58 +00002884 BUG_ON(obj->base.read_domains & I915_GEM_GPU_DOMAINS);
2885 BUG_ON(obj->base.write_domain & I915_GEM_GPU_DOMAINS);
Eric Anholt673a3942008-07-30 12:06:12 -07002886
Chris Wilson6299f992010-11-24 12:23:44 +00002887 obj->gtt_offset = obj->gtt_space->start;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002888
Daniel Vetter75e9e912010-11-04 17:11:09 +01002889 fenceable =
Chris Wilson05394f32010-11-08 19:18:58 +00002890 obj->gtt_space->size == fence_size &&
2891 (obj->gtt_space->start & (fence_alignment -1)) == 0;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002892
Daniel Vetter75e9e912010-11-04 17:11:09 +01002893 mappable =
Chris Wilson05394f32010-11-08 19:18:58 +00002894 obj->gtt_offset + obj->base.size <= dev_priv->mm.gtt_mappable_end;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002895
Chris Wilson05394f32010-11-08 19:18:58 +00002896 obj->map_and_fenceable = mappable && fenceable;
Daniel Vetter75e9e912010-11-04 17:11:09 +01002897
Chris Wilsondb53a302011-02-03 11:57:46 +00002898 trace_i915_gem_object_bind(obj, map_and_fenceable);
Eric Anholt673a3942008-07-30 12:06:12 -07002899 return 0;
2900}
2901
2902void
Chris Wilson05394f32010-11-08 19:18:58 +00002903i915_gem_clflush_object(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07002904{
Eric Anholt673a3942008-07-30 12:06:12 -07002905 /* If we don't have a page list set up, then we're not pinned
2906 * to GPU, and we can ignore the cache flush because it'll happen
2907 * again at bind time.
2908 */
Chris Wilson05394f32010-11-08 19:18:58 +00002909 if (obj->pages == NULL)
Eric Anholt673a3942008-07-30 12:06:12 -07002910 return;
2911
Chris Wilson9c23f7f2011-03-29 16:59:52 -07002912 /* If the GPU is snooping the contents of the CPU cache,
2913 * we do not need to manually clear the CPU cache lines. However,
2914 * the caches are only snooped when the render cache is
2915 * flushed/invalidated. As we always have to emit invalidations
2916 * and flushes when moving into and out of the RENDER domain, correct
2917 * snooping behaviour occurs naturally as the result of our domain
2918 * tracking.
2919 */
2920 if (obj->cache_level != I915_CACHE_NONE)
2921 return;
2922
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002923 trace_i915_gem_object_clflush(obj);
Eric Anholtcfa16a02009-05-26 18:46:16 -07002924
Chris Wilson05394f32010-11-08 19:18:58 +00002925 drm_clflush_pages(obj->pages, obj->base.size / PAGE_SIZE);
Eric Anholt673a3942008-07-30 12:06:12 -07002926}
2927
Eric Anholte47c68e2008-11-14 13:35:19 -08002928/** Flushes any GPU write domain for the object if it's dirty. */
Chris Wilson88241782011-01-07 17:09:48 +00002929static int
Chris Wilson3619df02010-11-28 15:37:17 +00002930i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08002931{
Chris Wilson05394f32010-11-08 19:18:58 +00002932 if ((obj->base.write_domain & I915_GEM_GPU_DOMAINS) == 0)
Chris Wilson88241782011-01-07 17:09:48 +00002933 return 0;
Eric Anholte47c68e2008-11-14 13:35:19 -08002934
2935 /* Queue the GPU write cache flushing we need. */
Chris Wilsondb53a302011-02-03 11:57:46 +00002936 return i915_gem_flush_ring(obj->ring, 0, obj->base.write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002937}
2938
2939/** Flushes the GTT write domain for the object if it's dirty. */
2940static void
Chris Wilson05394f32010-11-08 19:18:58 +00002941i915_gem_object_flush_gtt_write_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08002942{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002943 uint32_t old_write_domain;
2944
Chris Wilson05394f32010-11-08 19:18:58 +00002945 if (obj->base.write_domain != I915_GEM_DOMAIN_GTT)
Eric Anholte47c68e2008-11-14 13:35:19 -08002946 return;
2947
Chris Wilson63256ec2011-01-04 18:42:07 +00002948 /* No actual flushing is required for the GTT write domain. Writes
Eric Anholte47c68e2008-11-14 13:35:19 -08002949 * to it immediately go to main memory as far as we know, so there's
2950 * no chipset flush. It also doesn't land in render cache.
Chris Wilson63256ec2011-01-04 18:42:07 +00002951 *
2952 * However, we do have to enforce the order so that all writes through
2953 * the GTT land before any writes to the device, such as updates to
2954 * the GATT itself.
Eric Anholte47c68e2008-11-14 13:35:19 -08002955 */
Chris Wilson63256ec2011-01-04 18:42:07 +00002956 wmb();
2957
Chris Wilson05394f32010-11-08 19:18:58 +00002958 old_write_domain = obj->base.write_domain;
2959 obj->base.write_domain = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002960
2961 trace_i915_gem_object_change_domain(obj,
Chris Wilson05394f32010-11-08 19:18:58 +00002962 obj->base.read_domains,
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002963 old_write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002964}
2965
2966/** Flushes the CPU write domain for the object if it's dirty. */
2967static void
Chris Wilson05394f32010-11-08 19:18:58 +00002968i915_gem_object_flush_cpu_write_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08002969{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002970 uint32_t old_write_domain;
Eric Anholte47c68e2008-11-14 13:35:19 -08002971
Chris Wilson05394f32010-11-08 19:18:58 +00002972 if (obj->base.write_domain != I915_GEM_DOMAIN_CPU)
Eric Anholte47c68e2008-11-14 13:35:19 -08002973 return;
2974
2975 i915_gem_clflush_object(obj);
Daniel Vetter40ce6572010-11-05 18:12:18 +01002976 intel_gtt_chipset_flush();
Chris Wilson05394f32010-11-08 19:18:58 +00002977 old_write_domain = obj->base.write_domain;
2978 obj->base.write_domain = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002979
2980 trace_i915_gem_object_change_domain(obj,
Chris Wilson05394f32010-11-08 19:18:58 +00002981 obj->base.read_domains,
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002982 old_write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002983}
2984
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002985/**
2986 * Moves a single object to the GTT read, and possibly write domain.
2987 *
2988 * This function returns when the move is complete, including waiting on
2989 * flushes to occur.
2990 */
Jesse Barnes79e53942008-11-07 14:24:08 -08002991int
Chris Wilson20217462010-11-23 15:26:33 +00002992i915_gem_object_set_to_gtt_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002993{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002994 uint32_t old_write_domain, old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08002995 int ret;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002996
Eric Anholt02354392008-11-26 13:58:13 -08002997 /* Not valid to be called on unbound objects. */
Chris Wilson05394f32010-11-08 19:18:58 +00002998 if (obj->gtt_space == NULL)
Eric Anholt02354392008-11-26 13:58:13 -08002999 return -EINVAL;
3000
Chris Wilson8d7e3de2011-02-07 15:23:02 +00003001 if (obj->base.write_domain == I915_GEM_DOMAIN_GTT)
3002 return 0;
3003
Chris Wilson88241782011-01-07 17:09:48 +00003004 ret = i915_gem_object_flush_gpu_write_domain(obj);
3005 if (ret)
3006 return ret;
3007
Chris Wilson87ca9c82010-12-02 09:42:56 +00003008 if (obj->pending_gpu_write || write) {
Chris Wilsonce453d82011-02-21 14:43:56 +00003009 ret = i915_gem_object_wait_rendering(obj);
Chris Wilson87ca9c82010-12-02 09:42:56 +00003010 if (ret)
3011 return ret;
3012 }
Chris Wilson2dafb1e2010-06-07 14:03:05 +01003013
Chris Wilson72133422010-09-13 23:56:38 +01003014 i915_gem_object_flush_cpu_write_domain(obj);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003015
Chris Wilson05394f32010-11-08 19:18:58 +00003016 old_write_domain = obj->base.write_domain;
3017 old_read_domains = obj->base.read_domains;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08003018
Eric Anholt2ef7eea2008-11-10 10:53:25 -08003019 /* It should now be out of any other write domains, and we can update
3020 * the domain values for our changes.
3021 */
Chris Wilson05394f32010-11-08 19:18:58 +00003022 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
3023 obj->base.read_domains |= I915_GEM_DOMAIN_GTT;
Eric Anholte47c68e2008-11-14 13:35:19 -08003024 if (write) {
Chris Wilson05394f32010-11-08 19:18:58 +00003025 obj->base.read_domains = I915_GEM_DOMAIN_GTT;
3026 obj->base.write_domain = I915_GEM_DOMAIN_GTT;
3027 obj->dirty = 1;
Eric Anholte47c68e2008-11-14 13:35:19 -08003028 }
3029
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003030 trace_i915_gem_object_change_domain(obj,
3031 old_read_domains,
3032 old_write_domain);
3033
Eric Anholte47c68e2008-11-14 13:35:19 -08003034 return 0;
3035}
3036
Chris Wilsone4ffd172011-04-04 09:44:39 +01003037int i915_gem_object_set_cache_level(struct drm_i915_gem_object *obj,
3038 enum i915_cache_level cache_level)
3039{
3040 int ret;
3041
3042 if (obj->cache_level == cache_level)
3043 return 0;
3044
3045 if (obj->pin_count) {
3046 DRM_DEBUG("can not change the cache level of pinned objects\n");
3047 return -EBUSY;
3048 }
3049
3050 if (obj->gtt_space) {
3051 ret = i915_gem_object_finish_gpu(obj);
3052 if (ret)
3053 return ret;
3054
3055 i915_gem_object_finish_gtt(obj);
3056
3057 /* Before SandyBridge, you could not use tiling or fence
3058 * registers with snooped memory, so relinquish any fences
3059 * currently pointing to our region in the aperture.
3060 */
3061 if (INTEL_INFO(obj->base.dev)->gen < 6) {
3062 ret = i915_gem_object_put_fence(obj);
3063 if (ret)
3064 return ret;
3065 }
3066
3067 i915_gem_gtt_rebind_object(obj, cache_level);
3068 }
3069
3070 if (cache_level == I915_CACHE_NONE) {
3071 u32 old_read_domains, old_write_domain;
3072
3073 /* If we're coming from LLC cached, then we haven't
3074 * actually been tracking whether the data is in the
3075 * CPU cache or not, since we only allow one bit set
3076 * in obj->write_domain and have been skipping the clflushes.
3077 * Just set it to the CPU cache for now.
3078 */
3079 WARN_ON(obj->base.write_domain & ~I915_GEM_DOMAIN_CPU);
3080 WARN_ON(obj->base.read_domains & ~I915_GEM_DOMAIN_CPU);
3081
3082 old_read_domains = obj->base.read_domains;
3083 old_write_domain = obj->base.write_domain;
3084
3085 obj->base.read_domains = I915_GEM_DOMAIN_CPU;
3086 obj->base.write_domain = I915_GEM_DOMAIN_CPU;
3087
3088 trace_i915_gem_object_change_domain(obj,
3089 old_read_domains,
3090 old_write_domain);
3091 }
3092
3093 obj->cache_level = cache_level;
3094 return 0;
3095}
3096
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08003097/*
Chris Wilson2da3b9b2011-04-14 09:41:17 +01003098 * Prepare buffer for display plane (scanout, cursors, etc).
3099 * Can be called from an uninterruptible phase (modesetting) and allows
3100 * any flushes to be pipelined (for pageflips).
3101 *
3102 * For the display plane, we want to be in the GTT but out of any write
3103 * domains. So in many ways this looks like set_to_gtt_domain() apart from the
3104 * ability to pipeline the waits, pinning and any additional subtleties
3105 * that may differentiate the display plane from ordinary buffers.
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08003106 */
3107int
Chris Wilson2da3b9b2011-04-14 09:41:17 +01003108i915_gem_object_pin_to_display_plane(struct drm_i915_gem_object *obj,
3109 u32 alignment,
Chris Wilson919926a2010-11-12 13:42:53 +00003110 struct intel_ring_buffer *pipelined)
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08003111{
Chris Wilson2da3b9b2011-04-14 09:41:17 +01003112 u32 old_read_domains, old_write_domain;
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08003113 int ret;
3114
Chris Wilson88241782011-01-07 17:09:48 +00003115 ret = i915_gem_object_flush_gpu_write_domain(obj);
3116 if (ret)
3117 return ret;
3118
Chris Wilson0be73282010-12-06 14:36:27 +00003119 if (pipelined != obj->ring) {
Chris Wilsonce453d82011-02-21 14:43:56 +00003120 ret = i915_gem_object_wait_rendering(obj);
Chris Wilsonced270f2010-09-26 22:47:46 +01003121 if (ret)
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08003122 return ret;
3123 }
3124
Eric Anholta7ef0642011-03-29 16:59:54 -07003125 /* The display engine is not coherent with the LLC cache on gen6. As
3126 * a result, we make sure that the pinning that is about to occur is
3127 * done with uncached PTEs. This is lowest common denominator for all
3128 * chipsets.
3129 *
3130 * However for gen6+, we could do better by using the GFDT bit instead
3131 * of uncaching, which would allow us to flush all the LLC-cached data
3132 * with that bit in the PTE to main memory with just one PIPE_CONTROL.
3133 */
3134 ret = i915_gem_object_set_cache_level(obj, I915_CACHE_NONE);
3135 if (ret)
3136 return ret;
3137
Chris Wilson2da3b9b2011-04-14 09:41:17 +01003138 /* As the user may map the buffer once pinned in the display plane
3139 * (e.g. libkms for the bootup splash), we have to ensure that we
3140 * always use map_and_fenceable for all scanout buffers.
3141 */
3142 ret = i915_gem_object_pin(obj, alignment, true);
3143 if (ret)
3144 return ret;
3145
Chris Wilsonb118c1e2010-05-27 13:18:14 +01003146 i915_gem_object_flush_cpu_write_domain(obj);
3147
Chris Wilson2da3b9b2011-04-14 09:41:17 +01003148 old_write_domain = obj->base.write_domain;
Chris Wilson05394f32010-11-08 19:18:58 +00003149 old_read_domains = obj->base.read_domains;
Chris Wilson2da3b9b2011-04-14 09:41:17 +01003150
3151 /* It should now be out of any other write domains, and we can update
3152 * the domain values for our changes.
3153 */
3154 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
Chris Wilson05394f32010-11-08 19:18:58 +00003155 obj->base.read_domains |= I915_GEM_DOMAIN_GTT;
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08003156
3157 trace_i915_gem_object_change_domain(obj,
3158 old_read_domains,
Chris Wilson2da3b9b2011-04-14 09:41:17 +01003159 old_write_domain);
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08003160
3161 return 0;
3162}
3163
Chris Wilson85345512010-11-13 09:49:11 +00003164int
Chris Wilsona8198ee2011-04-13 22:04:09 +01003165i915_gem_object_finish_gpu(struct drm_i915_gem_object *obj)
Chris Wilson85345512010-11-13 09:49:11 +00003166{
Chris Wilson88241782011-01-07 17:09:48 +00003167 int ret;
3168
Chris Wilsona8198ee2011-04-13 22:04:09 +01003169 if ((obj->base.read_domains & I915_GEM_GPU_DOMAINS) == 0)
Chris Wilson85345512010-11-13 09:49:11 +00003170 return 0;
3171
Chris Wilson88241782011-01-07 17:09:48 +00003172 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00003173 ret = i915_gem_flush_ring(obj->ring, 0, obj->base.write_domain);
Chris Wilson88241782011-01-07 17:09:48 +00003174 if (ret)
3175 return ret;
3176 }
Chris Wilson85345512010-11-13 09:49:11 +00003177
Chris Wilsona8198ee2011-04-13 22:04:09 +01003178 /* Ensure that we invalidate the GPU's caches and TLBs. */
3179 obj->base.read_domains &= ~I915_GEM_GPU_DOMAINS;
3180
Chris Wilsonce453d82011-02-21 14:43:56 +00003181 return i915_gem_object_wait_rendering(obj);
Chris Wilson85345512010-11-13 09:49:11 +00003182}
3183
Eric Anholte47c68e2008-11-14 13:35:19 -08003184/**
3185 * Moves a single object to the CPU read, and possibly write domain.
3186 *
3187 * This function returns when the move is complete, including waiting on
3188 * flushes to occur.
3189 */
3190static int
Chris Wilson919926a2010-11-12 13:42:53 +00003191i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholte47c68e2008-11-14 13:35:19 -08003192{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003193 uint32_t old_write_domain, old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08003194 int ret;
3195
Chris Wilson8d7e3de2011-02-07 15:23:02 +00003196 if (obj->base.write_domain == I915_GEM_DOMAIN_CPU)
3197 return 0;
3198
Chris Wilson88241782011-01-07 17:09:48 +00003199 ret = i915_gem_object_flush_gpu_write_domain(obj);
3200 if (ret)
3201 return ret;
3202
Chris Wilsonce453d82011-02-21 14:43:56 +00003203 ret = i915_gem_object_wait_rendering(obj);
Daniel Vetterde18a292010-11-27 22:30:41 +01003204 if (ret)
Eric Anholte47c68e2008-11-14 13:35:19 -08003205 return ret;
3206
3207 i915_gem_object_flush_gtt_write_domain(obj);
3208
3209 /* If we have a partially-valid cache of the object in the CPU,
3210 * finish invalidating it and free the per-page flags.
3211 */
3212 i915_gem_object_set_to_full_cpu_read_domain(obj);
3213
Chris Wilson05394f32010-11-08 19:18:58 +00003214 old_write_domain = obj->base.write_domain;
3215 old_read_domains = obj->base.read_domains;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003216
Eric Anholte47c68e2008-11-14 13:35:19 -08003217 /* Flush the CPU cache if it's still invalid. */
Chris Wilson05394f32010-11-08 19:18:58 +00003218 if ((obj->base.read_domains & I915_GEM_DOMAIN_CPU) == 0) {
Eric Anholte47c68e2008-11-14 13:35:19 -08003219 i915_gem_clflush_object(obj);
Eric Anholte47c68e2008-11-14 13:35:19 -08003220
Chris Wilson05394f32010-11-08 19:18:58 +00003221 obj->base.read_domains |= I915_GEM_DOMAIN_CPU;
Eric Anholte47c68e2008-11-14 13:35:19 -08003222 }
3223
3224 /* It should now be out of any other write domains, and we can update
3225 * the domain values for our changes.
3226 */
Chris Wilson05394f32010-11-08 19:18:58 +00003227 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_CPU) != 0);
Eric Anholte47c68e2008-11-14 13:35:19 -08003228
3229 /* If we're writing through the CPU, then the GPU read domains will
3230 * need to be invalidated at next use.
3231 */
3232 if (write) {
Chris Wilson05394f32010-11-08 19:18:58 +00003233 obj->base.read_domains = I915_GEM_DOMAIN_CPU;
3234 obj->base.write_domain = I915_GEM_DOMAIN_CPU;
Eric Anholte47c68e2008-11-14 13:35:19 -08003235 }
Eric Anholt2ef7eea2008-11-10 10:53:25 -08003236
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003237 trace_i915_gem_object_change_domain(obj,
3238 old_read_domains,
3239 old_write_domain);
3240
Eric Anholt2ef7eea2008-11-10 10:53:25 -08003241 return 0;
3242}
3243
Eric Anholt673a3942008-07-30 12:06:12 -07003244/**
Eric Anholte47c68e2008-11-14 13:35:19 -08003245 * Moves the object from a partially CPU read to a full one.
Eric Anholt673a3942008-07-30 12:06:12 -07003246 *
Eric Anholte47c68e2008-11-14 13:35:19 -08003247 * Note that this only resolves i915_gem_object_set_cpu_read_domain_range(),
3248 * and doesn't handle transitioning from !(read_domains & I915_GEM_DOMAIN_CPU).
3249 */
3250static void
Chris Wilson05394f32010-11-08 19:18:58 +00003251i915_gem_object_set_to_full_cpu_read_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08003252{
Chris Wilson05394f32010-11-08 19:18:58 +00003253 if (!obj->page_cpu_valid)
Eric Anholte47c68e2008-11-14 13:35:19 -08003254 return;
3255
3256 /* If we're partially in the CPU read domain, finish moving it in.
3257 */
Chris Wilson05394f32010-11-08 19:18:58 +00003258 if (obj->base.read_domains & I915_GEM_DOMAIN_CPU) {
Eric Anholte47c68e2008-11-14 13:35:19 -08003259 int i;
3260
Chris Wilson05394f32010-11-08 19:18:58 +00003261 for (i = 0; i <= (obj->base.size - 1) / PAGE_SIZE; i++) {
3262 if (obj->page_cpu_valid[i])
Eric Anholte47c68e2008-11-14 13:35:19 -08003263 continue;
Chris Wilson05394f32010-11-08 19:18:58 +00003264 drm_clflush_pages(obj->pages + i, 1);
Eric Anholte47c68e2008-11-14 13:35:19 -08003265 }
Eric Anholte47c68e2008-11-14 13:35:19 -08003266 }
3267
3268 /* Free the page_cpu_valid mappings which are now stale, whether
3269 * or not we've got I915_GEM_DOMAIN_CPU.
3270 */
Chris Wilson05394f32010-11-08 19:18:58 +00003271 kfree(obj->page_cpu_valid);
3272 obj->page_cpu_valid = NULL;
Eric Anholte47c68e2008-11-14 13:35:19 -08003273}
3274
3275/**
3276 * Set the CPU read domain on a range of the object.
3277 *
3278 * The object ends up with I915_GEM_DOMAIN_CPU in its read flags although it's
3279 * not entirely valid. The page_cpu_valid member of the object flags which
3280 * pages have been flushed, and will be respected by
3281 * i915_gem_object_set_to_cpu_domain() if it's called on to get a valid mapping
3282 * of the whole object.
3283 *
3284 * This function returns when the move is complete, including waiting on
3285 * flushes to occur.
Eric Anholt673a3942008-07-30 12:06:12 -07003286 */
3287static int
Chris Wilson05394f32010-11-08 19:18:58 +00003288i915_gem_object_set_cpu_read_domain_range(struct drm_i915_gem_object *obj,
Eric Anholte47c68e2008-11-14 13:35:19 -08003289 uint64_t offset, uint64_t size)
Eric Anholt673a3942008-07-30 12:06:12 -07003290{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003291 uint32_t old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08003292 int i, ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003293
Chris Wilson05394f32010-11-08 19:18:58 +00003294 if (offset == 0 && size == obj->base.size)
Eric Anholte47c68e2008-11-14 13:35:19 -08003295 return i915_gem_object_set_to_cpu_domain(obj, 0);
3296
Chris Wilson88241782011-01-07 17:09:48 +00003297 ret = i915_gem_object_flush_gpu_write_domain(obj);
3298 if (ret)
3299 return ret;
3300
Chris Wilsonce453d82011-02-21 14:43:56 +00003301 ret = i915_gem_object_wait_rendering(obj);
Daniel Vetterde18a292010-11-27 22:30:41 +01003302 if (ret)
Eric Anholte47c68e2008-11-14 13:35:19 -08003303 return ret;
Daniel Vetterde18a292010-11-27 22:30:41 +01003304
Eric Anholte47c68e2008-11-14 13:35:19 -08003305 i915_gem_object_flush_gtt_write_domain(obj);
3306
3307 /* If we're already fully in the CPU read domain, we're done. */
Chris Wilson05394f32010-11-08 19:18:58 +00003308 if (obj->page_cpu_valid == NULL &&
3309 (obj->base.read_domains & I915_GEM_DOMAIN_CPU) != 0)
Eric Anholt673a3942008-07-30 12:06:12 -07003310 return 0;
3311
Eric Anholte47c68e2008-11-14 13:35:19 -08003312 /* Otherwise, create/clear the per-page CPU read domain flag if we're
3313 * newly adding I915_GEM_DOMAIN_CPU
3314 */
Chris Wilson05394f32010-11-08 19:18:58 +00003315 if (obj->page_cpu_valid == NULL) {
3316 obj->page_cpu_valid = kzalloc(obj->base.size / PAGE_SIZE,
3317 GFP_KERNEL);
3318 if (obj->page_cpu_valid == NULL)
Eric Anholte47c68e2008-11-14 13:35:19 -08003319 return -ENOMEM;
Chris Wilson05394f32010-11-08 19:18:58 +00003320 } else if ((obj->base.read_domains & I915_GEM_DOMAIN_CPU) == 0)
3321 memset(obj->page_cpu_valid, 0, obj->base.size / PAGE_SIZE);
Eric Anholt673a3942008-07-30 12:06:12 -07003322
3323 /* Flush the cache on any pages that are still invalid from the CPU's
3324 * perspective.
3325 */
Eric Anholte47c68e2008-11-14 13:35:19 -08003326 for (i = offset / PAGE_SIZE; i <= (offset + size - 1) / PAGE_SIZE;
3327 i++) {
Chris Wilson05394f32010-11-08 19:18:58 +00003328 if (obj->page_cpu_valid[i])
Eric Anholt673a3942008-07-30 12:06:12 -07003329 continue;
3330
Chris Wilson05394f32010-11-08 19:18:58 +00003331 drm_clflush_pages(obj->pages + i, 1);
Eric Anholt673a3942008-07-30 12:06:12 -07003332
Chris Wilson05394f32010-11-08 19:18:58 +00003333 obj->page_cpu_valid[i] = 1;
Eric Anholt673a3942008-07-30 12:06:12 -07003334 }
3335
Eric Anholte47c68e2008-11-14 13:35:19 -08003336 /* It should now be out of any other write domains, and we can update
3337 * the domain values for our changes.
3338 */
Chris Wilson05394f32010-11-08 19:18:58 +00003339 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_CPU) != 0);
Eric Anholte47c68e2008-11-14 13:35:19 -08003340
Chris Wilson05394f32010-11-08 19:18:58 +00003341 old_read_domains = obj->base.read_domains;
3342 obj->base.read_domains |= I915_GEM_DOMAIN_CPU;
Eric Anholte47c68e2008-11-14 13:35:19 -08003343
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003344 trace_i915_gem_object_change_domain(obj,
3345 old_read_domains,
Chris Wilson05394f32010-11-08 19:18:58 +00003346 obj->base.write_domain);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003347
Eric Anholt673a3942008-07-30 12:06:12 -07003348 return 0;
3349}
3350
Eric Anholt673a3942008-07-30 12:06:12 -07003351/* Throttle our rendering by waiting until the ring has completed our requests
3352 * emitted over 20 msec ago.
3353 *
Eric Anholtb9624422009-06-03 07:27:35 +00003354 * Note that if we were to use the current jiffies each time around the loop,
3355 * we wouldn't escape the function with any frames outstanding if the time to
3356 * render a frame was over 20ms.
3357 *
Eric Anholt673a3942008-07-30 12:06:12 -07003358 * This should get us reasonable parallelism between CPU and GPU but also
3359 * relatively low latency when blocking on a particular request to finish.
3360 */
3361static int
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003362i915_gem_ring_throttle(struct drm_device *dev, struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003363{
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003364 struct drm_i915_private *dev_priv = dev->dev_private;
3365 struct drm_i915_file_private *file_priv = file->driver_priv;
Eric Anholtb9624422009-06-03 07:27:35 +00003366 unsigned long recent_enough = jiffies - msecs_to_jiffies(20);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003367 struct drm_i915_gem_request *request;
3368 struct intel_ring_buffer *ring = NULL;
3369 u32 seqno = 0;
3370 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003371
Chris Wilsone110e8d2011-01-26 15:39:14 +00003372 if (atomic_read(&dev_priv->mm.wedged))
3373 return -EIO;
3374
Chris Wilson1c255952010-09-26 11:03:27 +01003375 spin_lock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003376 list_for_each_entry(request, &file_priv->mm.request_list, client_list) {
Eric Anholtb9624422009-06-03 07:27:35 +00003377 if (time_after_eq(request->emitted_jiffies, recent_enough))
3378 break;
3379
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003380 ring = request->ring;
3381 seqno = request->seqno;
Eric Anholtb9624422009-06-03 07:27:35 +00003382 }
Chris Wilson1c255952010-09-26 11:03:27 +01003383 spin_unlock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003384
3385 if (seqno == 0)
3386 return 0;
3387
3388 ret = 0;
Chris Wilson78501ea2010-10-27 12:18:21 +01003389 if (!i915_seqno_passed(ring->get_seqno(ring), seqno)) {
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003390 /* And wait for the seqno passing without holding any locks and
3391 * causing extra latency for others. This is safe as the irq
3392 * generation is designed to be run atomically and so is
3393 * lockless.
3394 */
Chris Wilsonb13c2b92010-12-13 16:54:50 +00003395 if (ring->irq_get(ring)) {
3396 ret = wait_event_interruptible(ring->irq_queue,
3397 i915_seqno_passed(ring->get_seqno(ring), seqno)
3398 || atomic_read(&dev_priv->mm.wedged));
3399 ring->irq_put(ring);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003400
Chris Wilsonb13c2b92010-12-13 16:54:50 +00003401 if (ret == 0 && atomic_read(&dev_priv->mm.wedged))
3402 ret = -EIO;
3403 }
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003404 }
3405
3406 if (ret == 0)
3407 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, 0);
Eric Anholtb9624422009-06-03 07:27:35 +00003408
Eric Anholt673a3942008-07-30 12:06:12 -07003409 return ret;
3410}
3411
Eric Anholt673a3942008-07-30 12:06:12 -07003412int
Chris Wilson05394f32010-11-08 19:18:58 +00003413i915_gem_object_pin(struct drm_i915_gem_object *obj,
3414 uint32_t alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01003415 bool map_and_fenceable)
Eric Anholt673a3942008-07-30 12:06:12 -07003416{
Chris Wilson05394f32010-11-08 19:18:58 +00003417 struct drm_device *dev = obj->base.dev;
Chris Wilsonf13d3f72010-09-20 17:36:15 +01003418 struct drm_i915_private *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07003419 int ret;
3420
Chris Wilson05394f32010-11-08 19:18:58 +00003421 BUG_ON(obj->pin_count == DRM_I915_GEM_OBJECT_MAX_PIN_COUNT);
Chris Wilson23bc5982010-09-29 16:10:57 +01003422 WARN_ON(i915_verify_lists(dev));
Chris Wilsonac0c6b52010-05-27 13:18:18 +01003423
Chris Wilson05394f32010-11-08 19:18:58 +00003424 if (obj->gtt_space != NULL) {
3425 if ((alignment && obj->gtt_offset & (alignment - 1)) ||
3426 (map_and_fenceable && !obj->map_and_fenceable)) {
3427 WARN(obj->pin_count,
Chris Wilsonae7d49d2010-08-04 12:37:41 +01003428 "bo is already pinned with incorrect alignment:"
Daniel Vetter75e9e912010-11-04 17:11:09 +01003429 " offset=%x, req.alignment=%x, req.map_and_fenceable=%d,"
3430 " obj->map_and_fenceable=%d\n",
Chris Wilson05394f32010-11-08 19:18:58 +00003431 obj->gtt_offset, alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01003432 map_and_fenceable,
Chris Wilson05394f32010-11-08 19:18:58 +00003433 obj->map_and_fenceable);
Chris Wilsonac0c6b52010-05-27 13:18:18 +01003434 ret = i915_gem_object_unbind(obj);
3435 if (ret)
3436 return ret;
3437 }
3438 }
3439
Chris Wilson05394f32010-11-08 19:18:58 +00003440 if (obj->gtt_space == NULL) {
Chris Wilsona00b10c2010-09-24 21:15:47 +01003441 ret = i915_gem_object_bind_to_gtt(obj, alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01003442 map_and_fenceable);
Chris Wilson97311292009-09-21 00:22:34 +01003443 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07003444 return ret;
Chris Wilson22c344e2009-02-11 14:26:45 +00003445 }
Jesse Barnes76446ca2009-12-17 22:05:42 -05003446
Chris Wilson05394f32010-11-08 19:18:58 +00003447 if (obj->pin_count++ == 0) {
Chris Wilson05394f32010-11-08 19:18:58 +00003448 if (!obj->active)
3449 list_move_tail(&obj->mm_list,
Chris Wilsonf13d3f72010-09-20 17:36:15 +01003450 &dev_priv->mm.pinned_list);
Eric Anholt673a3942008-07-30 12:06:12 -07003451 }
Chris Wilson6299f992010-11-24 12:23:44 +00003452 obj->pin_mappable |= map_and_fenceable;
Eric Anholt673a3942008-07-30 12:06:12 -07003453
Chris Wilson23bc5982010-09-29 16:10:57 +01003454 WARN_ON(i915_verify_lists(dev));
Eric Anholt673a3942008-07-30 12:06:12 -07003455 return 0;
3456}
3457
3458void
Chris Wilson05394f32010-11-08 19:18:58 +00003459i915_gem_object_unpin(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07003460{
Chris Wilson05394f32010-11-08 19:18:58 +00003461 struct drm_device *dev = obj->base.dev;
Eric Anholt673a3942008-07-30 12:06:12 -07003462 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07003463
Chris Wilson23bc5982010-09-29 16:10:57 +01003464 WARN_ON(i915_verify_lists(dev));
Chris Wilson05394f32010-11-08 19:18:58 +00003465 BUG_ON(obj->pin_count == 0);
3466 BUG_ON(obj->gtt_space == NULL);
Eric Anholt673a3942008-07-30 12:06:12 -07003467
Chris Wilson05394f32010-11-08 19:18:58 +00003468 if (--obj->pin_count == 0) {
3469 if (!obj->active)
3470 list_move_tail(&obj->mm_list,
Eric Anholt673a3942008-07-30 12:06:12 -07003471 &dev_priv->mm.inactive_list);
Chris Wilson6299f992010-11-24 12:23:44 +00003472 obj->pin_mappable = false;
Eric Anholt673a3942008-07-30 12:06:12 -07003473 }
Chris Wilson23bc5982010-09-29 16:10:57 +01003474 WARN_ON(i915_verify_lists(dev));
Eric Anholt673a3942008-07-30 12:06:12 -07003475}
3476
3477int
3478i915_gem_pin_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00003479 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003480{
3481 struct drm_i915_gem_pin *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003482 struct drm_i915_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07003483 int ret;
3484
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003485 ret = i915_mutex_lock_interruptible(dev);
3486 if (ret)
3487 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003488
Chris Wilson05394f32010-11-08 19:18:58 +00003489 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00003490 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003491 ret = -ENOENT;
3492 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07003493 }
Eric Anholt673a3942008-07-30 12:06:12 -07003494
Chris Wilson05394f32010-11-08 19:18:58 +00003495 if (obj->madv != I915_MADV_WILLNEED) {
Chris Wilsonbb6baf72009-09-22 14:24:13 +01003496 DRM_ERROR("Attempting to pin a purgeable buffer\n");
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003497 ret = -EINVAL;
3498 goto out;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003499 }
3500
Chris Wilson05394f32010-11-08 19:18:58 +00003501 if (obj->pin_filp != NULL && obj->pin_filp != file) {
Jesse Barnes79e53942008-11-07 14:24:08 -08003502 DRM_ERROR("Already pinned in i915_gem_pin_ioctl(): %d\n",
3503 args->handle);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003504 ret = -EINVAL;
3505 goto out;
Jesse Barnes79e53942008-11-07 14:24:08 -08003506 }
3507
Chris Wilson05394f32010-11-08 19:18:58 +00003508 obj->user_pin_count++;
3509 obj->pin_filp = file;
3510 if (obj->user_pin_count == 1) {
Daniel Vetter75e9e912010-11-04 17:11:09 +01003511 ret = i915_gem_object_pin(obj, args->alignment, true);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003512 if (ret)
3513 goto out;
Eric Anholt673a3942008-07-30 12:06:12 -07003514 }
3515
3516 /* XXX - flush the CPU caches for pinned objects
3517 * as the X server doesn't manage domains yet
3518 */
Eric Anholte47c68e2008-11-14 13:35:19 -08003519 i915_gem_object_flush_cpu_write_domain(obj);
Chris Wilson05394f32010-11-08 19:18:58 +00003520 args->offset = obj->gtt_offset;
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003521out:
Chris Wilson05394f32010-11-08 19:18:58 +00003522 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003523unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07003524 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003525 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003526}
3527
3528int
3529i915_gem_unpin_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00003530 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003531{
3532 struct drm_i915_gem_pin *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003533 struct drm_i915_gem_object *obj;
Chris Wilson76c1dec2010-09-25 11:22:51 +01003534 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003535
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003536 ret = i915_mutex_lock_interruptible(dev);
3537 if (ret)
3538 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003539
Chris Wilson05394f32010-11-08 19:18:58 +00003540 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00003541 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003542 ret = -ENOENT;
3543 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07003544 }
Chris Wilson76c1dec2010-09-25 11:22:51 +01003545
Chris Wilson05394f32010-11-08 19:18:58 +00003546 if (obj->pin_filp != file) {
Jesse Barnes79e53942008-11-07 14:24:08 -08003547 DRM_ERROR("Not pinned by caller in i915_gem_pin_ioctl(): %d\n",
3548 args->handle);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003549 ret = -EINVAL;
3550 goto out;
Jesse Barnes79e53942008-11-07 14:24:08 -08003551 }
Chris Wilson05394f32010-11-08 19:18:58 +00003552 obj->user_pin_count--;
3553 if (obj->user_pin_count == 0) {
3554 obj->pin_filp = NULL;
Jesse Barnes79e53942008-11-07 14:24:08 -08003555 i915_gem_object_unpin(obj);
3556 }
Eric Anholt673a3942008-07-30 12:06:12 -07003557
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003558out:
Chris Wilson05394f32010-11-08 19:18:58 +00003559 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003560unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07003561 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003562 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003563}
3564
3565int
3566i915_gem_busy_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00003567 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003568{
3569 struct drm_i915_gem_busy *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003570 struct drm_i915_gem_object *obj;
Chris Wilson30dbf0c2010-09-25 10:19:17 +01003571 int ret;
3572
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003573 ret = i915_mutex_lock_interruptible(dev);
3574 if (ret)
3575 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003576
Chris Wilson05394f32010-11-08 19:18:58 +00003577 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00003578 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003579 ret = -ENOENT;
3580 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07003581 }
Zou Nan haid1b851f2010-05-21 09:08:57 +08003582
Chris Wilson0be555b2010-08-04 15:36:30 +01003583 /* Count all active objects as busy, even if they are currently not used
3584 * by the gpu. Users of this interface expect objects to eventually
3585 * become non-busy without any further actions, therefore emit any
3586 * necessary flushes here.
Eric Anholtc4de0a52008-12-14 19:05:04 -08003587 */
Chris Wilson05394f32010-11-08 19:18:58 +00003588 args->busy = obj->active;
Chris Wilson0be555b2010-08-04 15:36:30 +01003589 if (args->busy) {
3590 /* Unconditionally flush objects, even when the gpu still uses this
3591 * object. Userspace calling this function indicates that it wants to
3592 * use this buffer rather sooner than later, so issuing the required
3593 * flush earlier is beneficial.
3594 */
Chris Wilson1a1c6972010-12-07 23:00:20 +00003595 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00003596 ret = i915_gem_flush_ring(obj->ring,
Chris Wilson88241782011-01-07 17:09:48 +00003597 0, obj->base.write_domain);
Chris Wilson1a1c6972010-12-07 23:00:20 +00003598 } else if (obj->ring->outstanding_lazy_request ==
3599 obj->last_rendering_seqno) {
3600 struct drm_i915_gem_request *request;
3601
Chris Wilson7a194872010-12-07 10:38:40 +00003602 /* This ring is not being cleared by active usage,
3603 * so emit a request to do so.
3604 */
Chris Wilson1a1c6972010-12-07 23:00:20 +00003605 request = kzalloc(sizeof(*request), GFP_KERNEL);
3606 if (request)
Chris Wilsondb53a302011-02-03 11:57:46 +00003607 ret = i915_add_request(obj->ring, NULL,request);
Chris Wilson1a1c6972010-12-07 23:00:20 +00003608 else
Chris Wilson7a194872010-12-07 10:38:40 +00003609 ret = -ENOMEM;
3610 }
Chris Wilson0be555b2010-08-04 15:36:30 +01003611
3612 /* Update the active list for the hardware's current position.
3613 * Otherwise this only updates on a delayed timer or when irqs
3614 * are actually unmasked, and our working set ends up being
3615 * larger than required.
3616 */
Chris Wilsondb53a302011-02-03 11:57:46 +00003617 i915_gem_retire_requests_ring(obj->ring);
Chris Wilson0be555b2010-08-04 15:36:30 +01003618
Chris Wilson05394f32010-11-08 19:18:58 +00003619 args->busy = obj->active;
Chris Wilson0be555b2010-08-04 15:36:30 +01003620 }
Eric Anholt673a3942008-07-30 12:06:12 -07003621
Chris Wilson05394f32010-11-08 19:18:58 +00003622 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003623unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07003624 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003625 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003626}
3627
3628int
3629i915_gem_throttle_ioctl(struct drm_device *dev, void *data,
3630 struct drm_file *file_priv)
3631{
3632 return i915_gem_ring_throttle(dev, file_priv);
3633}
3634
Chris Wilson3ef94da2009-09-14 16:50:29 +01003635int
3636i915_gem_madvise_ioctl(struct drm_device *dev, void *data,
3637 struct drm_file *file_priv)
3638{
3639 struct drm_i915_gem_madvise *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003640 struct drm_i915_gem_object *obj;
Chris Wilson76c1dec2010-09-25 11:22:51 +01003641 int ret;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003642
3643 switch (args->madv) {
3644 case I915_MADV_DONTNEED:
3645 case I915_MADV_WILLNEED:
3646 break;
3647 default:
3648 return -EINVAL;
3649 }
3650
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003651 ret = i915_mutex_lock_interruptible(dev);
3652 if (ret)
3653 return ret;
3654
Chris Wilson05394f32010-11-08 19:18:58 +00003655 obj = to_intel_bo(drm_gem_object_lookup(dev, file_priv, args->handle));
Chris Wilsonc8725222011-02-19 11:31:06 +00003656 if (&obj->base == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003657 ret = -ENOENT;
3658 goto unlock;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003659 }
Chris Wilson3ef94da2009-09-14 16:50:29 +01003660
Chris Wilson05394f32010-11-08 19:18:58 +00003661 if (obj->pin_count) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003662 ret = -EINVAL;
3663 goto out;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003664 }
3665
Chris Wilson05394f32010-11-08 19:18:58 +00003666 if (obj->madv != __I915_MADV_PURGED)
3667 obj->madv = args->madv;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003668
Chris Wilson2d7ef392009-09-20 23:13:10 +01003669 /* if the object is no longer bound, discard its backing storage */
Chris Wilson05394f32010-11-08 19:18:58 +00003670 if (i915_gem_object_is_purgeable(obj) &&
3671 obj->gtt_space == NULL)
Chris Wilson2d7ef392009-09-20 23:13:10 +01003672 i915_gem_object_truncate(obj);
3673
Chris Wilson05394f32010-11-08 19:18:58 +00003674 args->retained = obj->madv != __I915_MADV_PURGED;
Chris Wilsonbb6baf72009-09-22 14:24:13 +01003675
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003676out:
Chris Wilson05394f32010-11-08 19:18:58 +00003677 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003678unlock:
Chris Wilson3ef94da2009-09-14 16:50:29 +01003679 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003680 return ret;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003681}
3682
Chris Wilson05394f32010-11-08 19:18:58 +00003683struct drm_i915_gem_object *i915_gem_alloc_object(struct drm_device *dev,
3684 size_t size)
Daniel Vetterac52bc52010-04-09 19:05:06 +00003685{
Chris Wilson73aa8082010-09-30 11:46:12 +01003686 struct drm_i915_private *dev_priv = dev->dev_private;
Daniel Vetterc397b902010-04-09 19:05:07 +00003687 struct drm_i915_gem_object *obj;
3688
3689 obj = kzalloc(sizeof(*obj), GFP_KERNEL);
3690 if (obj == NULL)
3691 return NULL;
3692
3693 if (drm_gem_object_init(dev, &obj->base, size) != 0) {
3694 kfree(obj);
3695 return NULL;
3696 }
3697
Chris Wilson73aa8082010-09-30 11:46:12 +01003698 i915_gem_info_add_obj(dev_priv, size);
3699
Daniel Vetterc397b902010-04-09 19:05:07 +00003700 obj->base.write_domain = I915_GEM_DOMAIN_CPU;
3701 obj->base.read_domains = I915_GEM_DOMAIN_CPU;
3702
Eric Anholta1871112011-03-29 16:59:55 -07003703 if (IS_GEN6(dev)) {
3704 /* On Gen6, we can have the GPU use the LLC (the CPU
3705 * cache) for about a 10% performance improvement
3706 * compared to uncached. Graphics requests other than
3707 * display scanout are coherent with the CPU in
3708 * accessing this cache. This means in this mode we
3709 * don't need to clflush on the CPU side, and on the
3710 * GPU side we only need to flush internal caches to
3711 * get data visible to the CPU.
3712 *
3713 * However, we maintain the display planes as UC, and so
3714 * need to rebind when first used as such.
3715 */
3716 obj->cache_level = I915_CACHE_LLC;
3717 } else
3718 obj->cache_level = I915_CACHE_NONE;
3719
Daniel Vetter62b8b212010-04-09 19:05:08 +00003720 obj->base.driver_private = NULL;
Daniel Vetterc397b902010-04-09 19:05:07 +00003721 obj->fence_reg = I915_FENCE_REG_NONE;
Chris Wilson69dc4982010-10-19 10:36:51 +01003722 INIT_LIST_HEAD(&obj->mm_list);
Daniel Vetter93a37f22010-11-05 20:24:53 +01003723 INIT_LIST_HEAD(&obj->gtt_list);
Chris Wilson69dc4982010-10-19 10:36:51 +01003724 INIT_LIST_HEAD(&obj->ring_list);
Chris Wilson432e58e2010-11-25 19:32:06 +00003725 INIT_LIST_HEAD(&obj->exec_list);
Daniel Vetterc397b902010-04-09 19:05:07 +00003726 INIT_LIST_HEAD(&obj->gpu_write_list);
Daniel Vetterc397b902010-04-09 19:05:07 +00003727 obj->madv = I915_MADV_WILLNEED;
Daniel Vetter75e9e912010-11-04 17:11:09 +01003728 /* Avoid an unnecessary call to unbind on the first bind. */
3729 obj->map_and_fenceable = true;
Daniel Vetterc397b902010-04-09 19:05:07 +00003730
Chris Wilson05394f32010-11-08 19:18:58 +00003731 return obj;
Daniel Vetterac52bc52010-04-09 19:05:06 +00003732}
3733
Eric Anholt673a3942008-07-30 12:06:12 -07003734int i915_gem_init_object(struct drm_gem_object *obj)
3735{
Daniel Vetterc397b902010-04-09 19:05:07 +00003736 BUG();
Jesse Barnesde151cf2008-11-12 10:03:55 -08003737
Eric Anholt673a3942008-07-30 12:06:12 -07003738 return 0;
3739}
3740
Chris Wilson05394f32010-11-08 19:18:58 +00003741static void i915_gem_free_object_tail(struct drm_i915_gem_object *obj)
Chris Wilsonbe726152010-07-23 23:18:50 +01003742{
Chris Wilson05394f32010-11-08 19:18:58 +00003743 struct drm_device *dev = obj->base.dev;
Chris Wilsonbe726152010-07-23 23:18:50 +01003744 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilsonbe726152010-07-23 23:18:50 +01003745 int ret;
3746
3747 ret = i915_gem_object_unbind(obj);
3748 if (ret == -ERESTARTSYS) {
Chris Wilson05394f32010-11-08 19:18:58 +00003749 list_move(&obj->mm_list,
Chris Wilsonbe726152010-07-23 23:18:50 +01003750 &dev_priv->mm.deferred_free_list);
3751 return;
3752 }
3753
Chris Wilson26e12f892011-03-20 11:20:19 +00003754 trace_i915_gem_object_destroy(obj);
3755
Chris Wilson05394f32010-11-08 19:18:58 +00003756 if (obj->base.map_list.map)
Chris Wilsonbe726152010-07-23 23:18:50 +01003757 i915_gem_free_mmap_offset(obj);
3758
Chris Wilson05394f32010-11-08 19:18:58 +00003759 drm_gem_object_release(&obj->base);
3760 i915_gem_info_remove_obj(dev_priv, obj->base.size);
Chris Wilsonbe726152010-07-23 23:18:50 +01003761
Chris Wilson05394f32010-11-08 19:18:58 +00003762 kfree(obj->page_cpu_valid);
3763 kfree(obj->bit_17);
3764 kfree(obj);
Chris Wilsonbe726152010-07-23 23:18:50 +01003765}
3766
Chris Wilson05394f32010-11-08 19:18:58 +00003767void i915_gem_free_object(struct drm_gem_object *gem_obj)
Eric Anholt673a3942008-07-30 12:06:12 -07003768{
Chris Wilson05394f32010-11-08 19:18:58 +00003769 struct drm_i915_gem_object *obj = to_intel_bo(gem_obj);
3770 struct drm_device *dev = obj->base.dev;
Eric Anholt673a3942008-07-30 12:06:12 -07003771
Chris Wilson05394f32010-11-08 19:18:58 +00003772 while (obj->pin_count > 0)
Eric Anholt673a3942008-07-30 12:06:12 -07003773 i915_gem_object_unpin(obj);
3774
Chris Wilson05394f32010-11-08 19:18:58 +00003775 if (obj->phys_obj)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003776 i915_gem_detach_phys_object(dev, obj);
3777
Chris Wilsonbe726152010-07-23 23:18:50 +01003778 i915_gem_free_object_tail(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07003779}
3780
Jesse Barnes5669fca2009-02-17 15:13:31 -08003781int
Eric Anholt673a3942008-07-30 12:06:12 -07003782i915_gem_idle(struct drm_device *dev)
3783{
3784 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson29105cc2010-01-07 10:39:13 +00003785 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003786
Keith Packard6dbe2772008-10-14 21:41:13 -07003787 mutex_lock(&dev->struct_mutex);
3788
Chris Wilson87acb0a2010-10-19 10:13:00 +01003789 if (dev_priv->mm.suspended) {
Keith Packard6dbe2772008-10-14 21:41:13 -07003790 mutex_unlock(&dev->struct_mutex);
Eric Anholt673a3942008-07-30 12:06:12 -07003791 return 0;
Keith Packard6dbe2772008-10-14 21:41:13 -07003792 }
Eric Anholt673a3942008-07-30 12:06:12 -07003793
Chris Wilson29105cc2010-01-07 10:39:13 +00003794 ret = i915_gpu_idle(dev);
Keith Packard6dbe2772008-10-14 21:41:13 -07003795 if (ret) {
3796 mutex_unlock(&dev->struct_mutex);
Eric Anholt673a3942008-07-30 12:06:12 -07003797 return ret;
Keith Packard6dbe2772008-10-14 21:41:13 -07003798 }
Eric Anholt673a3942008-07-30 12:06:12 -07003799
Chris Wilson29105cc2010-01-07 10:39:13 +00003800 /* Under UMS, be paranoid and evict. */
3801 if (!drm_core_check_feature(dev, DRIVER_MODESET)) {
Chris Wilson5eac3ab2010-10-31 08:49:47 +00003802 ret = i915_gem_evict_inactive(dev, false);
Chris Wilson29105cc2010-01-07 10:39:13 +00003803 if (ret) {
3804 mutex_unlock(&dev->struct_mutex);
3805 return ret;
3806 }
3807 }
3808
Chris Wilson312817a2010-11-22 11:50:11 +00003809 i915_gem_reset_fences(dev);
3810
Chris Wilson29105cc2010-01-07 10:39:13 +00003811 /* Hack! Don't let anybody do execbuf while we don't control the chip.
3812 * We need to replace this with a semaphore, or something.
3813 * And not confound mm.suspended!
3814 */
3815 dev_priv->mm.suspended = 1;
Daniel Vetterbc0c7f12010-08-20 18:18:48 +02003816 del_timer_sync(&dev_priv->hangcheck_timer);
Chris Wilson29105cc2010-01-07 10:39:13 +00003817
3818 i915_kernel_lost_context(dev);
Keith Packard6dbe2772008-10-14 21:41:13 -07003819 i915_gem_cleanup_ringbuffer(dev);
Chris Wilson29105cc2010-01-07 10:39:13 +00003820
Keith Packard6dbe2772008-10-14 21:41:13 -07003821 mutex_unlock(&dev->struct_mutex);
3822
Chris Wilson29105cc2010-01-07 10:39:13 +00003823 /* Cancel the retire work handler, which should be idle now. */
3824 cancel_delayed_work_sync(&dev_priv->mm.retire_work);
3825
Eric Anholt673a3942008-07-30 12:06:12 -07003826 return 0;
3827}
3828
Eric Anholt673a3942008-07-30 12:06:12 -07003829int
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003830i915_gem_init_ringbuffer(struct drm_device *dev)
3831{
3832 drm_i915_private_t *dev_priv = dev->dev_private;
3833 int ret;
Chris Wilson68f95ba2010-05-27 13:18:22 +01003834
Xiang, Haihao5c1143b2010-09-16 10:43:11 +08003835 ret = intel_init_render_ring_buffer(dev);
Chris Wilson68f95ba2010-05-27 13:18:22 +01003836 if (ret)
Chris Wilsonb6913e42010-11-12 10:46:37 +00003837 return ret;
Chris Wilson68f95ba2010-05-27 13:18:22 +01003838
3839 if (HAS_BSD(dev)) {
Xiang, Haihao5c1143b2010-09-16 10:43:11 +08003840 ret = intel_init_bsd_ring_buffer(dev);
Chris Wilson68f95ba2010-05-27 13:18:22 +01003841 if (ret)
3842 goto cleanup_render_ring;
Zou Nan haid1b851f2010-05-21 09:08:57 +08003843 }
Chris Wilson68f95ba2010-05-27 13:18:22 +01003844
Chris Wilson549f7362010-10-19 11:19:32 +01003845 if (HAS_BLT(dev)) {
3846 ret = intel_init_blt_ring_buffer(dev);
3847 if (ret)
3848 goto cleanup_bsd_ring;
3849 }
3850
Chris Wilson6f392d5482010-08-07 11:01:22 +01003851 dev_priv->next_seqno = 1;
3852
Chris Wilson68f95ba2010-05-27 13:18:22 +01003853 return 0;
3854
Chris Wilson549f7362010-10-19 11:19:32 +01003855cleanup_bsd_ring:
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003856 intel_cleanup_ring_buffer(&dev_priv->ring[VCS]);
Chris Wilson68f95ba2010-05-27 13:18:22 +01003857cleanup_render_ring:
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003858 intel_cleanup_ring_buffer(&dev_priv->ring[RCS]);
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003859 return ret;
3860}
3861
3862void
3863i915_gem_cleanup_ringbuffer(struct drm_device *dev)
3864{
3865 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003866 int i;
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003867
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003868 for (i = 0; i < I915_NUM_RINGS; i++)
3869 intel_cleanup_ring_buffer(&dev_priv->ring[i]);
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003870}
3871
3872int
Eric Anholt673a3942008-07-30 12:06:12 -07003873i915_gem_entervt_ioctl(struct drm_device *dev, void *data,
3874 struct drm_file *file_priv)
3875{
3876 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003877 int ret, i;
Eric Anholt673a3942008-07-30 12:06:12 -07003878
Jesse Barnes79e53942008-11-07 14:24:08 -08003879 if (drm_core_check_feature(dev, DRIVER_MODESET))
3880 return 0;
3881
Ben Gamariba1234d2009-09-14 17:48:47 -04003882 if (atomic_read(&dev_priv->mm.wedged)) {
Eric Anholt673a3942008-07-30 12:06:12 -07003883 DRM_ERROR("Reenabling wedged hardware, good luck\n");
Ben Gamariba1234d2009-09-14 17:48:47 -04003884 atomic_set(&dev_priv->mm.wedged, 0);
Eric Anholt673a3942008-07-30 12:06:12 -07003885 }
3886
Eric Anholt673a3942008-07-30 12:06:12 -07003887 mutex_lock(&dev->struct_mutex);
Eric Anholt9bb2d6f2008-12-23 18:42:32 -08003888 dev_priv->mm.suspended = 0;
3889
3890 ret = i915_gem_init_ringbuffer(dev);
Wu Fengguangd816f6a2009-04-18 10:43:32 +08003891 if (ret != 0) {
3892 mutex_unlock(&dev->struct_mutex);
Eric Anholt9bb2d6f2008-12-23 18:42:32 -08003893 return ret;
Wu Fengguangd816f6a2009-04-18 10:43:32 +08003894 }
Eric Anholt9bb2d6f2008-12-23 18:42:32 -08003895
Chris Wilson69dc4982010-10-19 10:36:51 +01003896 BUG_ON(!list_empty(&dev_priv->mm.active_list));
Eric Anholt673a3942008-07-30 12:06:12 -07003897 BUG_ON(!list_empty(&dev_priv->mm.flushing_list));
3898 BUG_ON(!list_empty(&dev_priv->mm.inactive_list));
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003899 for (i = 0; i < I915_NUM_RINGS; i++) {
3900 BUG_ON(!list_empty(&dev_priv->ring[i].active_list));
3901 BUG_ON(!list_empty(&dev_priv->ring[i].request_list));
3902 }
Eric Anholt673a3942008-07-30 12:06:12 -07003903 mutex_unlock(&dev->struct_mutex);
Kristian Høgsbergdbb19d32008-08-20 11:04:27 -04003904
Chris Wilson5f353082010-06-07 14:03:03 +01003905 ret = drm_irq_install(dev);
3906 if (ret)
3907 goto cleanup_ringbuffer;
Kristian Høgsbergdbb19d32008-08-20 11:04:27 -04003908
Eric Anholt673a3942008-07-30 12:06:12 -07003909 return 0;
Chris Wilson5f353082010-06-07 14:03:03 +01003910
3911cleanup_ringbuffer:
3912 mutex_lock(&dev->struct_mutex);
3913 i915_gem_cleanup_ringbuffer(dev);
3914 dev_priv->mm.suspended = 1;
3915 mutex_unlock(&dev->struct_mutex);
3916
3917 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003918}
3919
3920int
3921i915_gem_leavevt_ioctl(struct drm_device *dev, void *data,
3922 struct drm_file *file_priv)
3923{
Jesse Barnes79e53942008-11-07 14:24:08 -08003924 if (drm_core_check_feature(dev, DRIVER_MODESET))
3925 return 0;
3926
Kristian Høgsbergdbb19d32008-08-20 11:04:27 -04003927 drm_irq_uninstall(dev);
Linus Torvaldse6890f62009-09-08 17:09:24 -07003928 return i915_gem_idle(dev);
Eric Anholt673a3942008-07-30 12:06:12 -07003929}
3930
3931void
3932i915_gem_lastclose(struct drm_device *dev)
3933{
3934 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003935
Eric Anholte806b492009-01-22 09:56:58 -08003936 if (drm_core_check_feature(dev, DRIVER_MODESET))
3937 return;
3938
Keith Packard6dbe2772008-10-14 21:41:13 -07003939 ret = i915_gem_idle(dev);
3940 if (ret)
3941 DRM_ERROR("failed to idle hardware: %d\n", ret);
Eric Anholt673a3942008-07-30 12:06:12 -07003942}
3943
Chris Wilson64193402010-10-24 12:38:05 +01003944static void
3945init_ring_lists(struct intel_ring_buffer *ring)
3946{
3947 INIT_LIST_HEAD(&ring->active_list);
3948 INIT_LIST_HEAD(&ring->request_list);
3949 INIT_LIST_HEAD(&ring->gpu_write_list);
3950}
3951
Eric Anholt673a3942008-07-30 12:06:12 -07003952void
3953i915_gem_load(struct drm_device *dev)
3954{
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003955 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07003956 drm_i915_private_t *dev_priv = dev->dev_private;
3957
Chris Wilson69dc4982010-10-19 10:36:51 +01003958 INIT_LIST_HEAD(&dev_priv->mm.active_list);
Eric Anholt673a3942008-07-30 12:06:12 -07003959 INIT_LIST_HEAD(&dev_priv->mm.flushing_list);
3960 INIT_LIST_HEAD(&dev_priv->mm.inactive_list);
Chris Wilsonf13d3f72010-09-20 17:36:15 +01003961 INIT_LIST_HEAD(&dev_priv->mm.pinned_list);
Eric Anholta09ba7f2009-08-29 12:49:51 -07003962 INIT_LIST_HEAD(&dev_priv->mm.fence_list);
Chris Wilsonbe726152010-07-23 23:18:50 +01003963 INIT_LIST_HEAD(&dev_priv->mm.deferred_free_list);
Daniel Vetter93a37f22010-11-05 20:24:53 +01003964 INIT_LIST_HEAD(&dev_priv->mm.gtt_list);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003965 for (i = 0; i < I915_NUM_RINGS; i++)
3966 init_ring_lists(&dev_priv->ring[i]);
Daniel Vetter007cc8a2010-04-28 11:02:31 +02003967 for (i = 0; i < 16; i++)
3968 INIT_LIST_HEAD(&dev_priv->fence_regs[i].lru_list);
Eric Anholt673a3942008-07-30 12:06:12 -07003969 INIT_DELAYED_WORK(&dev_priv->mm.retire_work,
3970 i915_gem_retire_work_handler);
Chris Wilson30dbf0c2010-09-25 10:19:17 +01003971 init_completion(&dev_priv->error_completion);
Chris Wilson31169712009-09-14 16:50:28 +01003972
Dave Airlie94400122010-07-20 13:15:31 +10003973 /* On GEN3 we really need to make sure the ARB C3 LP bit is set */
3974 if (IS_GEN3(dev)) {
3975 u32 tmp = I915_READ(MI_ARB_STATE);
3976 if (!(tmp & MI_ARB_C3_LP_WRITE_ENABLE)) {
3977 /* arb state is a masked write, so set bit + bit in mask */
3978 tmp = MI_ARB_C3_LP_WRITE_ENABLE | (MI_ARB_C3_LP_WRITE_ENABLE << MI_ARB_MASK_SHIFT);
3979 I915_WRITE(MI_ARB_STATE, tmp);
3980 }
3981 }
3982
Chris Wilson72bfa192010-12-19 11:42:05 +00003983 dev_priv->relative_constants_mode = I915_EXEC_CONSTANTS_REL_GENERAL;
3984
Jesse Barnesde151cf2008-11-12 10:03:55 -08003985 /* Old X drivers will take 0-2 for front, back, depth buffers */
Eric Anholtb397c832010-01-26 09:43:10 -08003986 if (!drm_core_check_feature(dev, DRIVER_MODESET))
3987 dev_priv->fence_reg_start = 3;
Jesse Barnesde151cf2008-11-12 10:03:55 -08003988
Chris Wilsona6c45cf2010-09-17 00:32:17 +01003989 if (INTEL_INFO(dev)->gen >= 4 || IS_I945G(dev) || IS_I945GM(dev) || IS_G33(dev))
Jesse Barnesde151cf2008-11-12 10:03:55 -08003990 dev_priv->num_fence_regs = 16;
3991 else
3992 dev_priv->num_fence_regs = 8;
3993
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003994 /* Initialize fence registers to zero */
Eric Anholt10ed13e2011-05-06 13:53:49 -07003995 for (i = 0; i < dev_priv->num_fence_regs; i++) {
3996 i915_gem_clear_fence_reg(dev, &dev_priv->fence_regs[i]);
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003997 }
Eric Anholt10ed13e2011-05-06 13:53:49 -07003998
Eric Anholt673a3942008-07-30 12:06:12 -07003999 i915_gem_detect_bit_6_swizzle(dev);
Kristian Høgsberg6b95a202009-11-18 11:25:18 -05004000 init_waitqueue_head(&dev_priv->pending_flip_queue);
Chris Wilson17250b72010-10-28 12:51:39 +01004001
Chris Wilsonce453d82011-02-21 14:43:56 +00004002 dev_priv->mm.interruptible = true;
4003
Chris Wilson17250b72010-10-28 12:51:39 +01004004 dev_priv->mm.inactive_shrinker.shrink = i915_gem_inactive_shrink;
4005 dev_priv->mm.inactive_shrinker.seeks = DEFAULT_SEEKS;
4006 register_shrinker(&dev_priv->mm.inactive_shrinker);
Eric Anholt673a3942008-07-30 12:06:12 -07004007}
Dave Airlie71acb5e2008-12-30 20:31:46 +10004008
4009/*
4010 * Create a physically contiguous memory object for this object
4011 * e.g. for cursor + overlay regs
4012 */
Chris Wilson995b6762010-08-20 13:23:26 +01004013static int i915_gem_init_phys_object(struct drm_device *dev,
4014 int id, int size, int align)
Dave Airlie71acb5e2008-12-30 20:31:46 +10004015{
4016 drm_i915_private_t *dev_priv = dev->dev_private;
4017 struct drm_i915_gem_phys_object *phys_obj;
4018 int ret;
4019
4020 if (dev_priv->mm.phys_objs[id - 1] || !size)
4021 return 0;
4022
Eric Anholt9a298b22009-03-24 12:23:04 -07004023 phys_obj = kzalloc(sizeof(struct drm_i915_gem_phys_object), GFP_KERNEL);
Dave Airlie71acb5e2008-12-30 20:31:46 +10004024 if (!phys_obj)
4025 return -ENOMEM;
4026
4027 phys_obj->id = id;
4028
Chris Wilson6eeefaf2010-08-07 11:01:39 +01004029 phys_obj->handle = drm_pci_alloc(dev, size, align);
Dave Airlie71acb5e2008-12-30 20:31:46 +10004030 if (!phys_obj->handle) {
4031 ret = -ENOMEM;
4032 goto kfree_obj;
4033 }
4034#ifdef CONFIG_X86
4035 set_memory_wc((unsigned long)phys_obj->handle->vaddr, phys_obj->handle->size / PAGE_SIZE);
4036#endif
4037
4038 dev_priv->mm.phys_objs[id - 1] = phys_obj;
4039
4040 return 0;
4041kfree_obj:
Eric Anholt9a298b22009-03-24 12:23:04 -07004042 kfree(phys_obj);
Dave Airlie71acb5e2008-12-30 20:31:46 +10004043 return ret;
4044}
4045
Chris Wilson995b6762010-08-20 13:23:26 +01004046static void i915_gem_free_phys_object(struct drm_device *dev, int id)
Dave Airlie71acb5e2008-12-30 20:31:46 +10004047{
4048 drm_i915_private_t *dev_priv = dev->dev_private;
4049 struct drm_i915_gem_phys_object *phys_obj;
4050
4051 if (!dev_priv->mm.phys_objs[id - 1])
4052 return;
4053
4054 phys_obj = dev_priv->mm.phys_objs[id - 1];
4055 if (phys_obj->cur_obj) {
4056 i915_gem_detach_phys_object(dev, phys_obj->cur_obj);
4057 }
4058
4059#ifdef CONFIG_X86
4060 set_memory_wb((unsigned long)phys_obj->handle->vaddr, phys_obj->handle->size / PAGE_SIZE);
4061#endif
4062 drm_pci_free(dev, phys_obj->handle);
4063 kfree(phys_obj);
4064 dev_priv->mm.phys_objs[id - 1] = NULL;
4065}
4066
4067void i915_gem_free_all_phys_object(struct drm_device *dev)
4068{
4069 int i;
4070
Dave Airlie260883c2009-01-22 17:58:49 +10004071 for (i = I915_GEM_PHYS_CURSOR_0; i <= I915_MAX_PHYS_OBJECT; i++)
Dave Airlie71acb5e2008-12-30 20:31:46 +10004072 i915_gem_free_phys_object(dev, i);
4073}
4074
4075void i915_gem_detach_phys_object(struct drm_device *dev,
Chris Wilson05394f32010-11-08 19:18:58 +00004076 struct drm_i915_gem_object *obj)
Dave Airlie71acb5e2008-12-30 20:31:46 +10004077{
Chris Wilson05394f32010-11-08 19:18:58 +00004078 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Chris Wilsone5281cc2010-10-28 13:45:36 +01004079 char *vaddr;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004080 int i;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004081 int page_count;
4082
Chris Wilson05394f32010-11-08 19:18:58 +00004083 if (!obj->phys_obj)
Dave Airlie71acb5e2008-12-30 20:31:46 +10004084 return;
Chris Wilson05394f32010-11-08 19:18:58 +00004085 vaddr = obj->phys_obj->handle->vaddr;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004086
Chris Wilson05394f32010-11-08 19:18:58 +00004087 page_count = obj->base.size / PAGE_SIZE;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004088 for (i = 0; i < page_count; i++) {
Chris Wilsone5281cc2010-10-28 13:45:36 +01004089 struct page *page = read_cache_page_gfp(mapping, i,
4090 GFP_HIGHUSER | __GFP_RECLAIMABLE);
4091 if (!IS_ERR(page)) {
4092 char *dst = kmap_atomic(page);
4093 memcpy(dst, vaddr + i*PAGE_SIZE, PAGE_SIZE);
4094 kunmap_atomic(dst);
Dave Airlie71acb5e2008-12-30 20:31:46 +10004095
Chris Wilsone5281cc2010-10-28 13:45:36 +01004096 drm_clflush_pages(&page, 1);
4097
4098 set_page_dirty(page);
4099 mark_page_accessed(page);
4100 page_cache_release(page);
4101 }
Dave Airlie71acb5e2008-12-30 20:31:46 +10004102 }
Daniel Vetter40ce6572010-11-05 18:12:18 +01004103 intel_gtt_chipset_flush();
Chris Wilsond78b47b2009-06-17 21:52:49 +01004104
Chris Wilson05394f32010-11-08 19:18:58 +00004105 obj->phys_obj->cur_obj = NULL;
4106 obj->phys_obj = NULL;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004107}
4108
4109int
4110i915_gem_attach_phys_object(struct drm_device *dev,
Chris Wilson05394f32010-11-08 19:18:58 +00004111 struct drm_i915_gem_object *obj,
Chris Wilson6eeefaf2010-08-07 11:01:39 +01004112 int id,
4113 int align)
Dave Airlie71acb5e2008-12-30 20:31:46 +10004114{
Chris Wilson05394f32010-11-08 19:18:58 +00004115 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004116 drm_i915_private_t *dev_priv = dev->dev_private;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004117 int ret = 0;
4118 int page_count;
4119 int i;
4120
4121 if (id > I915_MAX_PHYS_OBJECT)
4122 return -EINVAL;
4123
Chris Wilson05394f32010-11-08 19:18:58 +00004124 if (obj->phys_obj) {
4125 if (obj->phys_obj->id == id)
Dave Airlie71acb5e2008-12-30 20:31:46 +10004126 return 0;
4127 i915_gem_detach_phys_object(dev, obj);
4128 }
4129
Dave Airlie71acb5e2008-12-30 20:31:46 +10004130 /* create a new object */
4131 if (!dev_priv->mm.phys_objs[id - 1]) {
4132 ret = i915_gem_init_phys_object(dev, id,
Chris Wilson05394f32010-11-08 19:18:58 +00004133 obj->base.size, align);
Dave Airlie71acb5e2008-12-30 20:31:46 +10004134 if (ret) {
Chris Wilson05394f32010-11-08 19:18:58 +00004135 DRM_ERROR("failed to init phys object %d size: %zu\n",
4136 id, obj->base.size);
Chris Wilsone5281cc2010-10-28 13:45:36 +01004137 return ret;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004138 }
4139 }
4140
4141 /* bind to the object */
Chris Wilson05394f32010-11-08 19:18:58 +00004142 obj->phys_obj = dev_priv->mm.phys_objs[id - 1];
4143 obj->phys_obj->cur_obj = obj;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004144
Chris Wilson05394f32010-11-08 19:18:58 +00004145 page_count = obj->base.size / PAGE_SIZE;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004146
4147 for (i = 0; i < page_count; i++) {
Chris Wilsone5281cc2010-10-28 13:45:36 +01004148 struct page *page;
4149 char *dst, *src;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004150
Chris Wilsone5281cc2010-10-28 13:45:36 +01004151 page = read_cache_page_gfp(mapping, i,
4152 GFP_HIGHUSER | __GFP_RECLAIMABLE);
4153 if (IS_ERR(page))
4154 return PTR_ERR(page);
4155
Chris Wilsonff75b9b2010-10-30 22:52:31 +01004156 src = kmap_atomic(page);
Chris Wilson05394f32010-11-08 19:18:58 +00004157 dst = obj->phys_obj->handle->vaddr + (i * PAGE_SIZE);
Dave Airlie71acb5e2008-12-30 20:31:46 +10004158 memcpy(dst, src, PAGE_SIZE);
Peter Zijlstra3e4d3af2010-10-26 14:21:51 -07004159 kunmap_atomic(src);
Chris Wilsone5281cc2010-10-28 13:45:36 +01004160
4161 mark_page_accessed(page);
4162 page_cache_release(page);
Dave Airlie71acb5e2008-12-30 20:31:46 +10004163 }
4164
4165 return 0;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004166}
4167
4168static int
Chris Wilson05394f32010-11-08 19:18:58 +00004169i915_gem_phys_pwrite(struct drm_device *dev,
4170 struct drm_i915_gem_object *obj,
Dave Airlie71acb5e2008-12-30 20:31:46 +10004171 struct drm_i915_gem_pwrite *args,
4172 struct drm_file *file_priv)
4173{
Chris Wilson05394f32010-11-08 19:18:58 +00004174 void *vaddr = obj->phys_obj->handle->vaddr + args->offset;
Chris Wilsonb47b30c2010-11-08 01:12:29 +00004175 char __user *user_data = (char __user *) (uintptr_t) args->data_ptr;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004176
Chris Wilsonb47b30c2010-11-08 01:12:29 +00004177 if (__copy_from_user_inatomic_nocache(vaddr, user_data, args->size)) {
4178 unsigned long unwritten;
4179
4180 /* The physical object once assigned is fixed for the lifetime
4181 * of the obj, so we can safely drop the lock and continue
4182 * to access vaddr.
4183 */
4184 mutex_unlock(&dev->struct_mutex);
4185 unwritten = copy_from_user(vaddr, user_data, args->size);
4186 mutex_lock(&dev->struct_mutex);
4187 if (unwritten)
4188 return -EFAULT;
4189 }
Dave Airlie71acb5e2008-12-30 20:31:46 +10004190
Daniel Vetter40ce6572010-11-05 18:12:18 +01004191 intel_gtt_chipset_flush();
Dave Airlie71acb5e2008-12-30 20:31:46 +10004192 return 0;
4193}
Eric Anholtb9624422009-06-03 07:27:35 +00004194
Chris Wilsonf787a5f2010-09-24 16:02:42 +01004195void i915_gem_release(struct drm_device *dev, struct drm_file *file)
Eric Anholtb9624422009-06-03 07:27:35 +00004196{
Chris Wilsonf787a5f2010-09-24 16:02:42 +01004197 struct drm_i915_file_private *file_priv = file->driver_priv;
Eric Anholtb9624422009-06-03 07:27:35 +00004198
4199 /* Clean up our request list when the client is going away, so that
4200 * later retire_requests won't dereference our soon-to-be-gone
4201 * file_priv.
4202 */
Chris Wilson1c255952010-09-26 11:03:27 +01004203 spin_lock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01004204 while (!list_empty(&file_priv->mm.request_list)) {
4205 struct drm_i915_gem_request *request;
4206
4207 request = list_first_entry(&file_priv->mm.request_list,
4208 struct drm_i915_gem_request,
4209 client_list);
4210 list_del(&request->client_list);
4211 request->file_priv = NULL;
4212 }
Chris Wilson1c255952010-09-26 11:03:27 +01004213 spin_unlock(&file_priv->mm.lock);
Eric Anholtb9624422009-06-03 07:27:35 +00004214}
Chris Wilson31169712009-09-14 16:50:28 +01004215
Chris Wilson31169712009-09-14 16:50:28 +01004216static int
Chris Wilson1637ef42010-04-20 17:10:35 +01004217i915_gpu_is_active(struct drm_device *dev)
4218{
4219 drm_i915_private_t *dev_priv = dev->dev_private;
4220 int lists_empty;
4221
Chris Wilson1637ef42010-04-20 17:10:35 +01004222 lists_empty = list_empty(&dev_priv->mm.flushing_list) &&
Chris Wilson17250b72010-10-28 12:51:39 +01004223 list_empty(&dev_priv->mm.active_list);
Chris Wilson1637ef42010-04-20 17:10:35 +01004224
4225 return !lists_empty;
4226}
4227
4228static int
Ying Han1495f232011-05-24 17:12:27 -07004229i915_gem_inactive_shrink(struct shrinker *shrinker, struct shrink_control *sc)
Chris Wilson31169712009-09-14 16:50:28 +01004230{
Chris Wilson17250b72010-10-28 12:51:39 +01004231 struct drm_i915_private *dev_priv =
4232 container_of(shrinker,
4233 struct drm_i915_private,
4234 mm.inactive_shrinker);
4235 struct drm_device *dev = dev_priv->dev;
4236 struct drm_i915_gem_object *obj, *next;
Ying Han1495f232011-05-24 17:12:27 -07004237 int nr_to_scan = sc->nr_to_scan;
Chris Wilson17250b72010-10-28 12:51:39 +01004238 int cnt;
4239
4240 if (!mutex_trylock(&dev->struct_mutex))
Chris Wilsonbbe2e112010-10-28 22:35:07 +01004241 return 0;
Chris Wilson31169712009-09-14 16:50:28 +01004242
4243 /* "fast-path" to count number of available objects */
4244 if (nr_to_scan == 0) {
Chris Wilson17250b72010-10-28 12:51:39 +01004245 cnt = 0;
4246 list_for_each_entry(obj,
4247 &dev_priv->mm.inactive_list,
4248 mm_list)
4249 cnt++;
4250 mutex_unlock(&dev->struct_mutex);
4251 return cnt / 100 * sysctl_vfs_cache_pressure;
Chris Wilson31169712009-09-14 16:50:28 +01004252 }
4253
Chris Wilson1637ef42010-04-20 17:10:35 +01004254rescan:
Chris Wilson31169712009-09-14 16:50:28 +01004255 /* first scan for clean buffers */
Chris Wilson17250b72010-10-28 12:51:39 +01004256 i915_gem_retire_requests(dev);
Chris Wilson31169712009-09-14 16:50:28 +01004257
Chris Wilson17250b72010-10-28 12:51:39 +01004258 list_for_each_entry_safe(obj, next,
4259 &dev_priv->mm.inactive_list,
4260 mm_list) {
4261 if (i915_gem_object_is_purgeable(obj)) {
Chris Wilson20217462010-11-23 15:26:33 +00004262 if (i915_gem_object_unbind(obj) == 0 &&
4263 --nr_to_scan == 0)
Chris Wilson17250b72010-10-28 12:51:39 +01004264 break;
Chris Wilson31169712009-09-14 16:50:28 +01004265 }
Chris Wilson31169712009-09-14 16:50:28 +01004266 }
4267
4268 /* second pass, evict/count anything still on the inactive list */
Chris Wilson17250b72010-10-28 12:51:39 +01004269 cnt = 0;
4270 list_for_each_entry_safe(obj, next,
4271 &dev_priv->mm.inactive_list,
4272 mm_list) {
Chris Wilson20217462010-11-23 15:26:33 +00004273 if (nr_to_scan &&
4274 i915_gem_object_unbind(obj) == 0)
Chris Wilson17250b72010-10-28 12:51:39 +01004275 nr_to_scan--;
Chris Wilson20217462010-11-23 15:26:33 +00004276 else
Chris Wilson17250b72010-10-28 12:51:39 +01004277 cnt++;
Chris Wilson31169712009-09-14 16:50:28 +01004278 }
4279
Chris Wilson17250b72010-10-28 12:51:39 +01004280 if (nr_to_scan && i915_gpu_is_active(dev)) {
Chris Wilson1637ef42010-04-20 17:10:35 +01004281 /*
4282 * We are desperate for pages, so as a last resort, wait
4283 * for the GPU to finish and discard whatever we can.
4284 * This has a dramatic impact to reduce the number of
4285 * OOM-killer events whilst running the GPU aggressively.
4286 */
Chris Wilson17250b72010-10-28 12:51:39 +01004287 if (i915_gpu_idle(dev) == 0)
Chris Wilson1637ef42010-04-20 17:10:35 +01004288 goto rescan;
4289 }
Chris Wilson17250b72010-10-28 12:51:39 +01004290 mutex_unlock(&dev->struct_mutex);
4291 return cnt / 100 * sysctl_vfs_cache_pressure;
Chris Wilson31169712009-09-14 16:50:28 +01004292}