/*
 * Copyright © 2008 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 *
 * Authors:
 *    Eric Anholt <eric@anholt.net>
 *
 */

#include "drmP.h"
#include "drm.h"
#include "i915_drm.h"
#include "i915_drv.h"
#include "i915_trace.h"
#include "intel_drv.h"
#include <linux/slab.h>
#include <linux/swap.h>
#include <linux/pci.h>

static void i915_gem_object_flush_gpu_write_domain(struct drm_gem_object *obj);
static void i915_gem_object_flush_gtt_write_domain(struct drm_gem_object *obj);
static void i915_gem_object_flush_cpu_write_domain(struct drm_gem_object *obj);
static int i915_gem_object_set_to_cpu_domain(struct drm_gem_object *obj,
					     int write);
static int i915_gem_object_set_cpu_read_domain_range(struct drm_gem_object *obj,
						      uint64_t offset,
						      uint64_t size);
static void i915_gem_object_set_to_full_cpu_read_domain(struct drm_gem_object *obj);
static int i915_gem_object_wait_rendering(struct drm_gem_object *obj);
static int i915_gem_object_bind_to_gtt(struct drm_gem_object *obj,
				       unsigned alignment);
static void i915_gem_clear_fence_reg(struct drm_gem_object *obj);
static int i915_gem_evict_something(struct drm_device *dev, int min_size);
static int i915_gem_evict_from_inactive_list(struct drm_device *dev);
static int i915_gem_phys_pwrite(struct drm_device *dev, struct drm_gem_object *obj,
				struct drm_i915_gem_pwrite *args,
				struct drm_file *file_priv);

static LIST_HEAD(shrink_list);
static DEFINE_SPINLOCK(shrink_list_lock);

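/**
 * i915_gem_do_init - set up the GEM range of the GTT
 * @dev: DRM device
 * @start: first byte of the aperture range reserved for GEM
 * @end: first byte past the GEM range
 *
 * Initializes the drm_mm allocator that hands out GTT space for objects
 * and records the total GTT size.  Both @start and @end must be page
 * aligned, and @start must lie below @end.
 */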
int i915_gem_do_init(struct drm_device *dev, unsigned long start,
		     unsigned long end)
{
	drm_i915_private_t *dev_priv = dev->dev_private;

	if (start >= end ||
	    (start & (PAGE_SIZE - 1)) != 0 ||
	    (end & (PAGE_SIZE - 1)) != 0) {
		return -EINVAL;
	}

	drm_mm_init(&dev_priv->mm.gtt_space, start,
		    end - start);

	dev->gtt_total = (uint32_t) (end - start);

	return 0;
}

int
i915_gem_init_ioctl(struct drm_device *dev, void *data,
		    struct drm_file *file_priv)
{
	struct drm_i915_gem_init *args = data;
	int ret;

	mutex_lock(&dev->struct_mutex);
	ret = i915_gem_do_init(dev, args->gtt_start, args->gtt_end);
	mutex_unlock(&dev->struct_mutex);

	return ret;
}

int
i915_gem_get_aperture_ioctl(struct drm_device *dev, void *data,
			    struct drm_file *file_priv)
{
	struct drm_i915_gem_get_aperture *args = data;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	args->aper_size = dev->gtt_total;
	args->aper_available_size = (args->aper_size -
				     atomic_read(&dev->pin_memory));

	return 0;
}

/**
 * Creates a new mm object and returns a handle to it.
 */
int
i915_gem_create_ioctl(struct drm_device *dev, void *data,
		      struct drm_file *file_priv)
{
	struct drm_i915_gem_create *args = data;
	struct drm_gem_object *obj;
	int ret;
	u32 handle;

	args->size = roundup(args->size, PAGE_SIZE);

	/* Allocate the new object */
	obj = i915_gem_alloc_object(dev, args->size);
	if (obj == NULL)
		return -ENOMEM;

	ret = drm_gem_handle_create(file_priv, obj, &handle);
	drm_gem_object_handle_unreference_unlocked(obj);

	if (ret)
		return ret;

	args->handle = handle;

	return 0;
}

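/* Copies @length bytes from a kmapped shmem backing page out to user space
 * without sleeping; returns -EFAULT if touching the user page would fault,
 * letting the caller fall back to the slow pread path.
 */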
static inline int
fast_shmem_read(struct page **pages,
		loff_t page_base, int page_offset,
		char __user *data,
		int length)
{
	char __iomem *vaddr;
	int unwritten;

	vaddr = kmap_atomic(pages[page_base >> PAGE_SHIFT], KM_USER0);
	if (vaddr == NULL)
		return -ENOMEM;
	unwritten = __copy_to_user_inatomic(data, vaddr + page_offset, length);
	kunmap_atomic(vaddr, KM_USER0);

	if (unwritten)
		return -EFAULT;

	return 0;
}

static int i915_gem_object_needs_bit17_swizzle(struct drm_gem_object *obj)
{
	drm_i915_private_t *dev_priv = obj->dev->dev_private;
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);

	return dev_priv->mm.bit_6_swizzle_x == I915_BIT_6_SWIZZLE_9_10_17 &&
		obj_priv->tiling_mode != I915_TILING_NONE;
}

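/* Page-to-page copy used by the slow pread/pwrite paths: both pages are
 * already pinned, so the kmap_atomic sections cannot fault.
 */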
static inline int
slow_shmem_copy(struct page *dst_page,
		int dst_offset,
		struct page *src_page,
		int src_offset,
		int length)
{
	char *dst_vaddr, *src_vaddr;

	dst_vaddr = kmap_atomic(dst_page, KM_USER0);
	if (dst_vaddr == NULL)
		return -ENOMEM;

	src_vaddr = kmap_atomic(src_page, KM_USER1);
	if (src_vaddr == NULL) {
		kunmap_atomic(dst_vaddr, KM_USER0);
		return -ENOMEM;
	}

	memcpy(dst_vaddr + dst_offset, src_vaddr + src_offset, length);

	kunmap_atomic(src_vaddr, KM_USER1);
	kunmap_atomic(dst_vaddr, KM_USER0);

	return 0;
}

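/* Variant of slow_shmem_copy for objects using bit-17 swizzling: for GPU
 * pages whose physical address has bit 17 set, the copy is done in 64-byte
 * cachelines with bit 6 of the offset flipped, so the CPU view matches the
 * GPU's swizzled layout.
 */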
static inline int
slow_shmem_bit17_copy(struct page *gpu_page,
		      int gpu_offset,
		      struct page *cpu_page,
		      int cpu_offset,
		      int length,
		      int is_read)
{
	char *gpu_vaddr, *cpu_vaddr;

	/* Use the unswizzled path if this page isn't affected. */
	if ((page_to_phys(gpu_page) & (1 << 17)) == 0) {
		if (is_read)
			return slow_shmem_copy(cpu_page, cpu_offset,
					       gpu_page, gpu_offset, length);
		else
			return slow_shmem_copy(gpu_page, gpu_offset,
					       cpu_page, cpu_offset, length);
	}

	gpu_vaddr = kmap_atomic(gpu_page, KM_USER0);
	if (gpu_vaddr == NULL)
		return -ENOMEM;

	cpu_vaddr = kmap_atomic(cpu_page, KM_USER1);
	if (cpu_vaddr == NULL) {
		kunmap_atomic(gpu_vaddr, KM_USER0);
		return -ENOMEM;
	}

	/* Copy the data, XORing A6 with A17 (1). The user already knows he's
	 * XORing with the other bits (A9 for Y, A9 and A10 for X)
	 */
	while (length > 0) {
		int cacheline_end = ALIGN(gpu_offset + 1, 64);
		int this_length = min(cacheline_end - gpu_offset, length);
		int swizzled_gpu_offset = gpu_offset ^ 64;

		if (is_read) {
			memcpy(cpu_vaddr + cpu_offset,
			       gpu_vaddr + swizzled_gpu_offset,
			       this_length);
		} else {
			memcpy(gpu_vaddr + swizzled_gpu_offset,
			       cpu_vaddr + cpu_offset,
			       this_length);
		}
		cpu_offset += this_length;
		gpu_offset += this_length;
		length -= this_length;
	}

	kunmap_atomic(cpu_vaddr, KM_USER1);
	kunmap_atomic(gpu_vaddr, KM_USER0);

	return 0;
}

/**
 * This is the fast shmem pread path, which attempts to copy_to_user directly
 * from the backing pages of the object to the user's address space.  On a
 * fault, it fails so we can fall back to i915_gem_shmem_pread_slow().
 */
static int
i915_gem_shmem_pread_fast(struct drm_device *dev, struct drm_gem_object *obj,
			  struct drm_i915_gem_pread *args,
			  struct drm_file *file_priv)
{
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	ssize_t remain;
	loff_t offset, page_base;
	char __user *user_data;
	int page_offset, page_length;
	int ret;

	user_data = (char __user *) (uintptr_t) args->data_ptr;
	remain = args->size;

	mutex_lock(&dev->struct_mutex);

	ret = i915_gem_object_get_pages(obj, 0);
	if (ret != 0)
		goto fail_unlock;

	ret = i915_gem_object_set_cpu_read_domain_range(obj, args->offset,
							args->size);
	if (ret != 0)
		goto fail_put_pages;

	obj_priv = to_intel_bo(obj);
	offset = args->offset;

	while (remain > 0) {
		/* Operation in this page
		 *
		 * page_base = page offset within the object
		 * page_offset = offset within page
		 * page_length = bytes to copy for this page
		 */
		page_base = (offset & ~(PAGE_SIZE-1));
		page_offset = offset & (PAGE_SIZE-1);
		page_length = remain;
		if ((page_offset + remain) > PAGE_SIZE)
			page_length = PAGE_SIZE - page_offset;

		ret = fast_shmem_read(obj_priv->pages,
				      page_base, page_offset,
				      user_data, page_length);
		if (ret)
			goto fail_put_pages;

		remain -= page_length;
		user_data += page_length;
		offset += page_length;
	}

fail_put_pages:
	i915_gem_object_put_pages(obj);
fail_unlock:
	mutex_unlock(&dev->struct_mutex);

	return ret;
}

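/* Wrapper around i915_gem_object_get_pages that, on -ENOMEM, tries to make
 * room by evicting an old buffer from the GTT before retrying the
 * allocation once with the default gfp flags.
 */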
static int
i915_gem_object_get_pages_or_evict(struct drm_gem_object *obj)
{
	int ret;

	ret = i915_gem_object_get_pages(obj, __GFP_NORETRY | __GFP_NOWARN);

	/* If we've insufficient memory to map in the pages, attempt
	 * to make some space by throwing out some old buffers.
	 */
	if (ret == -ENOMEM) {
		struct drm_device *dev = obj->dev;

		ret = i915_gem_evict_something(dev, obj->size);
		if (ret)
			return ret;

		ret = i915_gem_object_get_pages(obj, 0);
	}

	return ret;
}

/**
 * This is the fallback shmem pread path, which uses get_user_pages to pin
 * the user pages so we can copy out of the object's backing pages while
 * holding the struct_mutex and not take page faults.
 */
static int
i915_gem_shmem_pread_slow(struct drm_device *dev, struct drm_gem_object *obj,
			  struct drm_i915_gem_pread *args,
			  struct drm_file *file_priv)
{
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	struct mm_struct *mm = current->mm;
	struct page **user_pages;
	ssize_t remain;
	loff_t offset, pinned_pages, i;
	loff_t first_data_page, last_data_page, num_pages;
	int shmem_page_index, shmem_page_offset;
	int data_page_index, data_page_offset;
	int page_length;
	int ret;
	uint64_t data_ptr = args->data_ptr;
	int do_bit17_swizzling;

	remain = args->size;

	/* Pin the user pages containing the data. We can't fault while
	 * holding the struct mutex, yet we want to hold it while
	 * dereferencing the user data.
	 */
	first_data_page = data_ptr / PAGE_SIZE;
	last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
	num_pages = last_data_page - first_data_page + 1;

	user_pages = drm_calloc_large(num_pages, sizeof(struct page *));
	if (user_pages == NULL)
		return -ENOMEM;

	down_read(&mm->mmap_sem);
	pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
				      num_pages, 1, 0, user_pages, NULL);
	up_read(&mm->mmap_sem);
	if (pinned_pages < num_pages) {
		ret = -EFAULT;
		goto fail_put_user_pages;
	}

	do_bit17_swizzling = i915_gem_object_needs_bit17_swizzle(obj);

	mutex_lock(&dev->struct_mutex);

	ret = i915_gem_object_get_pages_or_evict(obj);
	if (ret)
		goto fail_unlock;

	ret = i915_gem_object_set_cpu_read_domain_range(obj, args->offset,
							args->size);
	if (ret != 0)
		goto fail_put_pages;

	obj_priv = to_intel_bo(obj);
	offset = args->offset;

	while (remain > 0) {
		/* Operation in this page
		 *
		 * shmem_page_index = page number within shmem file
		 * shmem_page_offset = offset within page in shmem file
		 * data_page_index = page number in get_user_pages return
		 * data_page_offset = offset within data_page_index page.
		 * page_length = bytes to copy for this page
		 */
		shmem_page_index = offset / PAGE_SIZE;
		shmem_page_offset = offset & ~PAGE_MASK;
		data_page_index = data_ptr / PAGE_SIZE - first_data_page;
		data_page_offset = data_ptr & ~PAGE_MASK;

		page_length = remain;
		if ((shmem_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - shmem_page_offset;
		if ((data_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - data_page_offset;

		if (do_bit17_swizzling) {
			ret = slow_shmem_bit17_copy(obj_priv->pages[shmem_page_index],
						    shmem_page_offset,
						    user_pages[data_page_index],
						    data_page_offset,
						    page_length,
						    1);
		} else {
			ret = slow_shmem_copy(user_pages[data_page_index],
					      data_page_offset,
					      obj_priv->pages[shmem_page_index],
					      shmem_page_offset,
					      page_length);
		}
		if (ret)
			goto fail_put_pages;

		remain -= page_length;
		data_ptr += page_length;
		offset += page_length;
	}

fail_put_pages:
	i915_gem_object_put_pages(obj);
fail_unlock:
	mutex_unlock(&dev->struct_mutex);
fail_put_user_pages:
	for (i = 0; i < pinned_pages; i++) {
		SetPageDirty(user_pages[i]);
		page_cache_release(user_pages[i]);
	}
	drm_free_large(user_pages);

	return ret;
}

/**
 * Reads data from the object referenced by handle.
 *
 * On error, the contents of *data are undefined.
 */
int
i915_gem_pread_ioctl(struct drm_device *dev, void *data,
		     struct drm_file *file_priv)
{
	struct drm_i915_gem_pread *args = data;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;
	int ret;

	obj = drm_gem_object_lookup(dev, file_priv, args->handle);
	if (obj == NULL)
		return -EBADF;
	obj_priv = to_intel_bo(obj);

	/* Bounds check source.
	 *
	 * XXX: This could use review for overflow issues...
	 */
	if (args->offset > obj->size || args->size > obj->size ||
	    args->offset + args->size > obj->size) {
		drm_gem_object_unreference_unlocked(obj);
		return -EINVAL;
	}

	if (i915_gem_object_needs_bit17_swizzle(obj)) {
		ret = i915_gem_shmem_pread_slow(dev, obj, args, file_priv);
	} else {
		ret = i915_gem_shmem_pread_fast(dev, obj, args, file_priv);
		if (ret != 0)
			ret = i915_gem_shmem_pread_slow(dev, obj, args,
							file_priv);
	}

	drm_gem_object_unreference_unlocked(obj);

	return ret;
}

/* This is the fast write path which cannot handle
 * page faults in the source data
 */

static inline int
fast_user_write(struct io_mapping *mapping,
		loff_t page_base, int page_offset,
		char __user *user_data,
		int length)
{
	char *vaddr_atomic;
	unsigned long unwritten;

	vaddr_atomic = io_mapping_map_atomic_wc(mapping, page_base);
	unwritten = __copy_from_user_inatomic_nocache(vaddr_atomic + page_offset,
						      user_data, length);
	io_mapping_unmap_atomic(vaddr_atomic);
	if (unwritten)
		return -EFAULT;
	return 0;
}

/* Here's the write path which can sleep for
 * page faults
 */

static inline int
slow_kernel_write(struct io_mapping *mapping,
		  loff_t gtt_base, int gtt_offset,
		  struct page *user_page, int user_offset,
		  int length)
{
	char *src_vaddr, *dst_vaddr;
	unsigned long unwritten;

	dst_vaddr = io_mapping_map_atomic_wc(mapping, gtt_base);
	src_vaddr = kmap_atomic(user_page, KM_USER1);
	unwritten = __copy_from_user_inatomic_nocache(dst_vaddr + gtt_offset,
						      src_vaddr + user_offset,
						      length);
	kunmap_atomic(src_vaddr, KM_USER1);
	io_mapping_unmap_atomic(dst_vaddr);
	if (unwritten)
		return -EFAULT;
	return 0;
}

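/* Non-faulting counterpart of fast_shmem_read for the pwrite path: copies
 * user data into a kmapped shmem backing page, returning -EFAULT so the
 * caller can fall back to the slow path if the source would fault.
 */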
static inline int
fast_shmem_write(struct page **pages,
		 loff_t page_base, int page_offset,
		 char __user *data,
		 int length)
{
	char __iomem *vaddr;
	unsigned long unwritten;

	vaddr = kmap_atomic(pages[page_base >> PAGE_SHIFT], KM_USER0);
	if (vaddr == NULL)
		return -ENOMEM;
	unwritten = __copy_from_user_inatomic(vaddr + page_offset, data, length);
	kunmap_atomic(vaddr, KM_USER0);

	if (unwritten)
		return -EFAULT;
	return 0;
}

/**
 * This is the fast pwrite path, where we copy the data directly from the
 * user into the GTT, uncached.
 */
static int
i915_gem_gtt_pwrite_fast(struct drm_device *dev, struct drm_gem_object *obj,
			 struct drm_i915_gem_pwrite *args,
			 struct drm_file *file_priv)
{
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	drm_i915_private_t *dev_priv = dev->dev_private;
	ssize_t remain;
	loff_t offset, page_base;
	char __user *user_data;
	int page_offset, page_length;
	int ret;

	user_data = (char __user *) (uintptr_t) args->data_ptr;
	remain = args->size;
	if (!access_ok(VERIFY_READ, user_data, remain))
		return -EFAULT;

	mutex_lock(&dev->struct_mutex);
	ret = i915_gem_object_pin(obj, 0);
	if (ret) {
		mutex_unlock(&dev->struct_mutex);
		return ret;
	}
	ret = i915_gem_object_set_to_gtt_domain(obj, 1);
	if (ret)
		goto fail;

	obj_priv = to_intel_bo(obj);
	offset = obj_priv->gtt_offset + args->offset;

	while (remain > 0) {
		/* Operation in this page
		 *
		 * page_base = page offset within aperture
		 * page_offset = offset within page
		 * page_length = bytes to copy for this page
		 */
		page_base = (offset & ~(PAGE_SIZE-1));
		page_offset = offset & (PAGE_SIZE-1);
		page_length = remain;
		if ((page_offset + remain) > PAGE_SIZE)
			page_length = PAGE_SIZE - page_offset;

		ret = fast_user_write(dev_priv->mm.gtt_mapping, page_base,
				      page_offset, user_data, page_length);

		/* If we get a fault while copying data, then (presumably) our
		 * source page isn't available.  Return the error and we'll
		 * retry in the slow path.
		 */
		if (ret)
			goto fail;

		remain -= page_length;
		user_data += page_length;
		offset += page_length;
	}

fail:
	i915_gem_object_unpin(obj);
	mutex_unlock(&dev->struct_mutex);

	return ret;
}

/**
 * This is the fallback GTT pwrite path, which uses get_user_pages to pin
 * the memory and maps it using kmap_atomic for copying.
 *
 * This code resulted in x11perf -rgb10text consuming about 10% more CPU
 * than using i915_gem_gtt_pwrite_fast on a G45 (32-bit).
 */
static int
i915_gem_gtt_pwrite_slow(struct drm_device *dev, struct drm_gem_object *obj,
			 struct drm_i915_gem_pwrite *args,
			 struct drm_file *file_priv)
{
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	drm_i915_private_t *dev_priv = dev->dev_private;
	ssize_t remain;
	loff_t gtt_page_base, offset;
	loff_t first_data_page, last_data_page, num_pages;
	loff_t pinned_pages, i;
	struct page **user_pages;
	struct mm_struct *mm = current->mm;
	int gtt_page_offset, data_page_offset, data_page_index, page_length;
	int ret;
	uint64_t data_ptr = args->data_ptr;

	remain = args->size;

	/* Pin the user pages containing the data. We can't fault while
	 * holding the struct mutex, and all of the pwrite implementations
	 * want to hold it while dereferencing the user data.
	 */
	first_data_page = data_ptr / PAGE_SIZE;
	last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
	num_pages = last_data_page - first_data_page + 1;

	user_pages = drm_calloc_large(num_pages, sizeof(struct page *));
	if (user_pages == NULL)
		return -ENOMEM;

	down_read(&mm->mmap_sem);
	pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
				      num_pages, 0, 0, user_pages, NULL);
	up_read(&mm->mmap_sem);
	if (pinned_pages < num_pages) {
		ret = -EFAULT;
		goto out_unpin_pages;
	}

	mutex_lock(&dev->struct_mutex);
	ret = i915_gem_object_pin(obj, 0);
	if (ret)
		goto out_unlock;

	ret = i915_gem_object_set_to_gtt_domain(obj, 1);
	if (ret)
		goto out_unpin_object;

	obj_priv = to_intel_bo(obj);
	offset = obj_priv->gtt_offset + args->offset;

	while (remain > 0) {
		/* Operation in this page
		 *
		 * gtt_page_base = page offset within aperture
		 * gtt_page_offset = offset within page in aperture
		 * data_page_index = page number in get_user_pages return
		 * data_page_offset = offset within data_page_index page.
		 * page_length = bytes to copy for this page
		 */
		gtt_page_base = offset & PAGE_MASK;
		gtt_page_offset = offset & ~PAGE_MASK;
		data_page_index = data_ptr / PAGE_SIZE - first_data_page;
		data_page_offset = data_ptr & ~PAGE_MASK;

		page_length = remain;
		if ((gtt_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - gtt_page_offset;
		if ((data_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - data_page_offset;

		ret = slow_kernel_write(dev_priv->mm.gtt_mapping,
					gtt_page_base, gtt_page_offset,
					user_pages[data_page_index],
					data_page_offset,
					page_length);

		/* If we get a fault while copying data, then (presumably) our
		 * source page isn't available.  Return the error and we'll
		 * retry in the slow path.
		 */
		if (ret)
			goto out_unpin_object;

		remain -= page_length;
		offset += page_length;
		data_ptr += page_length;
	}

out_unpin_object:
	i915_gem_object_unpin(obj);
out_unlock:
	mutex_unlock(&dev->struct_mutex);
out_unpin_pages:
	for (i = 0; i < pinned_pages; i++)
		page_cache_release(user_pages[i]);
	drm_free_large(user_pages);

	return ret;
}

/**
 * This is the fast shmem pwrite path, which attempts to directly
 * copy_from_user into the kmapped pages backing the object.
 */
static int
i915_gem_shmem_pwrite_fast(struct drm_device *dev, struct drm_gem_object *obj,
			   struct drm_i915_gem_pwrite *args,
			   struct drm_file *file_priv)
{
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	ssize_t remain;
	loff_t offset, page_base;
	char __user *user_data;
	int page_offset, page_length;
	int ret;

	user_data = (char __user *) (uintptr_t) args->data_ptr;
	remain = args->size;

	mutex_lock(&dev->struct_mutex);

	ret = i915_gem_object_get_pages(obj, 0);
	if (ret != 0)
		goto fail_unlock;

	ret = i915_gem_object_set_to_cpu_domain(obj, 1);
	if (ret != 0)
		goto fail_put_pages;

	obj_priv = to_intel_bo(obj);
	offset = args->offset;
	obj_priv->dirty = 1;

	while (remain > 0) {
		/* Operation in this page
		 *
		 * page_base = page offset within the object
		 * page_offset = offset within page
		 * page_length = bytes to copy for this page
		 */
		page_base = (offset & ~(PAGE_SIZE-1));
		page_offset = offset & (PAGE_SIZE-1);
		page_length = remain;
		if ((page_offset + remain) > PAGE_SIZE)
			page_length = PAGE_SIZE - page_offset;

		ret = fast_shmem_write(obj_priv->pages,
				       page_base, page_offset,
				       user_data, page_length);
		if (ret)
			goto fail_put_pages;

		remain -= page_length;
		user_data += page_length;
		offset += page_length;
	}

fail_put_pages:
	i915_gem_object_put_pages(obj);
fail_unlock:
	mutex_unlock(&dev->struct_mutex);

	return ret;
}

/**
 * This is the fallback shmem pwrite path, which uses get_user_pages to pin
 * the memory and maps it using kmap_atomic for copying.
 *
 * This avoids taking mmap_sem for faulting on the user's address while the
 * struct_mutex is held.
 */
static int
i915_gem_shmem_pwrite_slow(struct drm_device *dev, struct drm_gem_object *obj,
			   struct drm_i915_gem_pwrite *args,
			   struct drm_file *file_priv)
{
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	struct mm_struct *mm = current->mm;
	struct page **user_pages;
	ssize_t remain;
	loff_t offset, pinned_pages, i;
	loff_t first_data_page, last_data_page, num_pages;
	int shmem_page_index, shmem_page_offset;
	int data_page_index, data_page_offset;
	int page_length;
	int ret;
	uint64_t data_ptr = args->data_ptr;
	int do_bit17_swizzling;

	remain = args->size;

	/* Pin the user pages containing the data. We can't fault while
	 * holding the struct mutex, and all of the pwrite implementations
	 * want to hold it while dereferencing the user data.
	 */
	first_data_page = data_ptr / PAGE_SIZE;
	last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
	num_pages = last_data_page - first_data_page + 1;

	user_pages = drm_calloc_large(num_pages, sizeof(struct page *));
	if (user_pages == NULL)
		return -ENOMEM;

	down_read(&mm->mmap_sem);
	pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
				      num_pages, 0, 0, user_pages, NULL);
	up_read(&mm->mmap_sem);
	if (pinned_pages < num_pages) {
		ret = -EFAULT;
		goto fail_put_user_pages;
	}

	do_bit17_swizzling = i915_gem_object_needs_bit17_swizzle(obj);

	mutex_lock(&dev->struct_mutex);

	ret = i915_gem_object_get_pages_or_evict(obj);
	if (ret)
		goto fail_unlock;

	ret = i915_gem_object_set_to_cpu_domain(obj, 1);
	if (ret != 0)
		goto fail_put_pages;

	obj_priv = to_intel_bo(obj);
	offset = args->offset;
	obj_priv->dirty = 1;

	while (remain > 0) {
		/* Operation in this page
		 *
		 * shmem_page_index = page number within shmem file
		 * shmem_page_offset = offset within page in shmem file
		 * data_page_index = page number in get_user_pages return
		 * data_page_offset = offset within data_page_index page.
		 * page_length = bytes to copy for this page
		 */
		shmem_page_index = offset / PAGE_SIZE;
		shmem_page_offset = offset & ~PAGE_MASK;
		data_page_index = data_ptr / PAGE_SIZE - first_data_page;
		data_page_offset = data_ptr & ~PAGE_MASK;

		page_length = remain;
		if ((shmem_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - shmem_page_offset;
		if ((data_page_offset + page_length) > PAGE_SIZE)
			page_length = PAGE_SIZE - data_page_offset;

		if (do_bit17_swizzling) {
			ret = slow_shmem_bit17_copy(obj_priv->pages[shmem_page_index],
						    shmem_page_offset,
						    user_pages[data_page_index],
						    data_page_offset,
						    page_length,
						    0);
		} else {
			ret = slow_shmem_copy(obj_priv->pages[shmem_page_index],
					      shmem_page_offset,
					      user_pages[data_page_index],
					      data_page_offset,
					      page_length);
		}
		if (ret)
			goto fail_put_pages;

		remain -= page_length;
		data_ptr += page_length;
		offset += page_length;
	}

fail_put_pages:
	i915_gem_object_put_pages(obj);
fail_unlock:
	mutex_unlock(&dev->struct_mutex);
fail_put_user_pages:
	for (i = 0; i < pinned_pages; i++)
		page_cache_release(user_pages[i]);
	drm_free_large(user_pages);

	return ret;
}

937 * Writes data to the object referenced by handle.
938 *
939 * On error, the contents of the buffer that were to be modified are undefined.
940 */
941int
942i915_gem_pwrite_ioctl(struct drm_device *dev, void *data,
943 struct drm_file *file_priv)
944{
945 struct drm_i915_gem_pwrite *args = data;
946 struct drm_gem_object *obj;
947 struct drm_i915_gem_object *obj_priv;
948 int ret = 0;
949
950 obj = drm_gem_object_lookup(dev, file_priv, args->handle);
951 if (obj == NULL)
952 return -EBADF;
Daniel Vetter23010e42010-03-08 13:35:02 +0100953 obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -0700954
955 /* Bounds check destination.
956 *
957 * XXX: This could use review for overflow issues...
958 */
959 if (args->offset > obj->size || args->size > obj->size ||
960 args->offset + args->size > obj->size) {
Luca Barbieribc9025b2010-02-09 05:49:12 +0000961 drm_gem_object_unreference_unlocked(obj);
Eric Anholt673a3942008-07-30 12:06:12 -0700962 return -EINVAL;
963 }
964
965 /* We can only do the GTT pwrite on untiled buffers, as otherwise
966 * it would end up going through the fenced access, and we'll get
967 * different detiling behavior between reading and writing.
968 * pread/pwrite currently are reading and writing from the CPU
969 * perspective, requiring manual detiling by the client.
970 */
Dave Airlie71acb5e2008-12-30 20:31:46 +1000971 if (obj_priv->phys_obj)
972 ret = i915_gem_phys_pwrite(dev, obj, args, file_priv);
973 else if (obj_priv->tiling_mode == I915_TILING_NONE &&
Eric Anholt3de09aa2009-03-09 09:42:23 -0700974 dev->gtt_total != 0) {
975 ret = i915_gem_gtt_pwrite_fast(dev, obj, args, file_priv);
976 if (ret == -EFAULT) {
977 ret = i915_gem_gtt_pwrite_slow(dev, obj, args,
978 file_priv);
979 }
Eric Anholt280b7132009-03-12 16:56:27 -0700980 } else if (i915_gem_object_needs_bit17_swizzle(obj)) {
981 ret = i915_gem_shmem_pwrite_slow(dev, obj, args, file_priv);
Eric Anholt40123c12009-03-09 13:42:30 -0700982 } else {
983 ret = i915_gem_shmem_pwrite_fast(dev, obj, args, file_priv);
984 if (ret == -EFAULT) {
985 ret = i915_gem_shmem_pwrite_slow(dev, obj, args,
986 file_priv);
987 }
988 }
Eric Anholt673a3942008-07-30 12:06:12 -0700989
990#if WATCH_PWRITE
991 if (ret)
992 DRM_INFO("pwrite failed %d\n", ret);
993#endif
994
Luca Barbieribc9025b2010-02-09 05:49:12 +0000995 drm_gem_object_unreference_unlocked(obj);
Eric Anholt673a3942008-07-30 12:06:12 -0700996
997 return ret;
998}
999
/**
 * Called when user space prepares to use an object with the CPU, either
 * through the mmap ioctl's mapping or a GTT mapping.
 */
int
i915_gem_set_domain_ioctl(struct drm_device *dev, void *data,
			  struct drm_file *file_priv)
{
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_gem_set_domain *args = data;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;
	uint32_t read_domains = args->read_domains;
	uint32_t write_domain = args->write_domain;
	int ret;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	/* Only handle setting domains to types used by the CPU. */
	if (write_domain & I915_GEM_GPU_DOMAINS)
		return -EINVAL;

	if (read_domains & I915_GEM_GPU_DOMAINS)
		return -EINVAL;

	/* Having something in the write domain implies it's in the read
	 * domain, and only that read domain.  Enforce that in the request.
	 */
	if (write_domain != 0 && read_domains != write_domain)
		return -EINVAL;

	obj = drm_gem_object_lookup(dev, file_priv, args->handle);
	if (obj == NULL)
		return -EBADF;
	obj_priv = to_intel_bo(obj);

	mutex_lock(&dev->struct_mutex);

	intel_mark_busy(dev, obj);

#if WATCH_BUF
	DRM_INFO("set_domain_ioctl %p(%zd), %08x %08x\n",
		 obj, obj->size, read_domains, write_domain);
#endif
	if (read_domains & I915_GEM_DOMAIN_GTT) {
		ret = i915_gem_object_set_to_gtt_domain(obj, write_domain != 0);

		/* Update the LRU on the fence for the CPU access that's
		 * about to occur.
		 */
		if (obj_priv->fence_reg != I915_FENCE_REG_NONE) {
			struct drm_i915_fence_reg *reg =
				&dev_priv->fence_regs[obj_priv->fence_reg];
			list_move_tail(&reg->lru_list,
				       &dev_priv->mm.fence_list);
		}

		/* Silently promote "you're not bound, there was nothing to do"
		 * to success, since the client was just asking us to
		 * make sure everything was done.
		 */
		if (ret == -EINVAL)
			ret = 0;
	} else {
		ret = i915_gem_object_set_to_cpu_domain(obj, write_domain != 0);
	}

	drm_gem_object_unreference(obj);
	mutex_unlock(&dev->struct_mutex);
	return ret;
}

/**
 * Called when user space has done writes to this buffer
 */
int
i915_gem_sw_finish_ioctl(struct drm_device *dev, void *data,
			 struct drm_file *file_priv)
{
	struct drm_i915_gem_sw_finish *args = data;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;
	int ret = 0;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	mutex_lock(&dev->struct_mutex);
	obj = drm_gem_object_lookup(dev, file_priv, args->handle);
	if (obj == NULL) {
		mutex_unlock(&dev->struct_mutex);
		return -EBADF;
	}

#if WATCH_BUF
	DRM_INFO("%s: sw_finish %d (%p %zd)\n",
		 __func__, args->handle, obj, obj->size);
#endif
	obj_priv = to_intel_bo(obj);

	/* Pinned buffers may be scanout, so flush the cache */
	if (obj_priv->pin_count)
		i915_gem_object_flush_cpu_write_domain(obj);

	drm_gem_object_unreference(obj);
	mutex_unlock(&dev->struct_mutex);
	return ret;
}

/**
 * Maps the contents of an object, returning the address it is mapped
 * into.
 *
 * While the mapping holds a reference on the contents of the object, it
 * doesn't imply a ref on the object itself.
 */
int
i915_gem_mmap_ioctl(struct drm_device *dev, void *data,
		    struct drm_file *file_priv)
{
	struct drm_i915_gem_mmap *args = data;
	struct drm_gem_object *obj;
	loff_t offset;
	unsigned long addr;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	obj = drm_gem_object_lookup(dev, file_priv, args->handle);
	if (obj == NULL)
		return -EBADF;

	offset = args->offset;

	down_write(&current->mm->mmap_sem);
	addr = do_mmap(obj->filp, 0, args->size,
		       PROT_READ | PROT_WRITE, MAP_SHARED,
		       args->offset);
	up_write(&current->mm->mmap_sem);
	drm_gem_object_unreference_unlocked(obj);
	if (IS_ERR((void *)addr))
		return addr;

	args->addr_ptr = (uint64_t) addr;

	return 0;
}

/**
 * i915_gem_fault - fault a page into the GTT
 * @vma: VMA in question
 * @vmf: fault info
 *
 * The fault handler is set up by drm_gem_mmap() when an object is GTT mapped
 * from userspace.  The fault handler takes care of binding the object to
 * the GTT (if needed), allocating and programming a fence register (again,
 * only if needed based on whether the old reg is still valid or the object
 * is tiled) and inserting a new PTE into the faulting process.
 *
 * Note that the faulting process may involve evicting existing objects
 * from the GTT and/or fence registers to make room.  So performance may
 * suffer if the GTT working set is large or there are few fence registers
 * left.
 */
int i915_gem_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
{
	struct drm_gem_object *obj = vma->vm_private_data;
	struct drm_device *dev = obj->dev;
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	pgoff_t page_offset;
	unsigned long pfn;
	int ret = 0;
	bool write = !!(vmf->flags & FAULT_FLAG_WRITE);

	/* We don't use vmf->pgoff since that has the fake offset */
	page_offset = ((unsigned long)vmf->virtual_address - vma->vm_start) >>
		PAGE_SHIFT;

	/* Now bind it into the GTT if needed */
	mutex_lock(&dev->struct_mutex);
	if (!obj_priv->gtt_space) {
		ret = i915_gem_object_bind_to_gtt(obj, 0);
		if (ret)
			goto unlock;

		list_add_tail(&obj_priv->list, &dev_priv->mm.inactive_list);

		ret = i915_gem_object_set_to_gtt_domain(obj, write);
		if (ret)
			goto unlock;
	}

	/* Need a new fence register? */
	if (obj_priv->tiling_mode != I915_TILING_NONE) {
		ret = i915_gem_object_get_fence_reg(obj);
		if (ret)
			goto unlock;
	}

	pfn = ((dev->agp->base + obj_priv->gtt_offset) >> PAGE_SHIFT) +
		page_offset;

	/* Finally, remap it using the new GTT offset */
	ret = vm_insert_pfn(vma, (unsigned long)vmf->virtual_address, pfn);
unlock:
	mutex_unlock(&dev->struct_mutex);

	switch (ret) {
	case 0:
	case -ERESTARTSYS:
		return VM_FAULT_NOPAGE;
	case -ENOMEM:
	case -EAGAIN:
		return VM_FAULT_OOM;
	default:
		return VM_FAULT_SIGBUS;
	}
}

/**
 * i915_gem_create_mmap_offset - create a fake mmap offset for an object
 * @obj: obj in question
 *
 * GEM memory mapping works by handing back to userspace a fake mmap offset
 * it can use in a subsequent mmap(2) call.  The DRM core code then looks
 * up the object based on the offset and sets up the various memory mapping
 * structures.
 *
 * This routine allocates and attaches a fake offset for @obj.
 */
static int
i915_gem_create_mmap_offset(struct drm_gem_object *obj)
{
	struct drm_device *dev = obj->dev;
	struct drm_gem_mm *mm = dev->mm_private;
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	struct drm_map_list *list;
	struct drm_local_map *map;
	int ret = 0;

	/* Set the object up for mmap'ing */
	list = &obj->map_list;
	list->map = kzalloc(sizeof(struct drm_map_list), GFP_KERNEL);
	if (!list->map)
		return -ENOMEM;

	map = list->map;
	map->type = _DRM_GEM;
	map->size = obj->size;
	map->handle = obj;

	/* Get a DRM GEM mmap offset allocated... */
	list->file_offset_node = drm_mm_search_free(&mm->offset_manager,
						    obj->size / PAGE_SIZE, 0, 0);
	if (!list->file_offset_node) {
		DRM_ERROR("failed to allocate offset for bo %d\n", obj->name);
		ret = -ENOMEM;
		goto out_free_list;
	}

	list->file_offset_node = drm_mm_get_block(list->file_offset_node,
						  obj->size / PAGE_SIZE, 0);
	if (!list->file_offset_node) {
		ret = -ENOMEM;
		goto out_free_list;
	}

	list->hash.key = list->file_offset_node->start;
	if (drm_ht_insert_item(&mm->offset_hash, &list->hash)) {
		DRM_ERROR("failed to add to map hash\n");
		ret = -ENOMEM;
		goto out_free_mm;
	}

	/* By now we should be all set, any drm_mmap request on the offset
	 * below will get to our mmap & fault handler */
	obj_priv->mmap_offset = ((uint64_t) list->hash.key) << PAGE_SHIFT;

	return 0;

out_free_mm:
	drm_mm_put_block(list->file_offset_node);
out_free_list:
	kfree(list->map);

	return ret;
}

/**
 * i915_gem_release_mmap - remove physical page mappings
 * @obj: obj in question
 *
 * Preserve the reservation of the mmapping with the DRM core code, but
 * relinquish ownership of the pages back to the system.
 *
 * It is vital that we remove the page mapping if we have mapped a tiled
 * object through the GTT and then lose the fence register due to
 * resource pressure.  Similarly if the object has been moved out of the
 * aperture, then pages mapped into userspace must be revoked.  Removing the
 * mapping will then trigger a page fault on the next user access, allowing
 * fixup by i915_gem_fault().
 */
void
i915_gem_release_mmap(struct drm_gem_object *obj)
{
	struct drm_device *dev = obj->dev;
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);

	if (dev->dev_mapping)
		unmap_mapping_range(dev->dev_mapping,
				    obj_priv->mmap_offset, obj->size, 1);
}

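/* Tears down the fake mmap offset set up by i915_gem_create_mmap_offset:
 * removes the hash entry, returns the offset range to the DRM mm manager
 * and frees the map list entry.
 */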
static void
i915_gem_free_mmap_offset(struct drm_gem_object *obj)
{
	struct drm_device *dev = obj->dev;
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	struct drm_gem_mm *mm = dev->mm_private;
	struct drm_map_list *list;

	list = &obj->map_list;
	drm_ht_remove_item(&mm->offset_hash, &list->hash);

	if (list->file_offset_node) {
		drm_mm_put_block(list->file_offset_node);
		list->file_offset_node = NULL;
	}

	if (list->map) {
		kfree(list->map);
		list->map = NULL;
	}

	obj_priv->mmap_offset = 0;
}

/**
 * i915_gem_get_gtt_alignment - return required GTT alignment for an object
 * @obj: object to check
 *
 * Return the required GTT alignment for an object, taking into account
 * potential fence register mapping if needed.
 */
static uint32_t
i915_gem_get_gtt_alignment(struct drm_gem_object *obj)
{
	struct drm_device *dev = obj->dev;
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	int start, i;

	/*
	 * Minimum alignment is 4k (GTT page size), but might be greater
	 * if a fence register is needed for the object.
	 */
	if (IS_I965G(dev) || obj_priv->tiling_mode == I915_TILING_NONE)
		return 4096;

	/*
	 * Previous chips need to be aligned to the size of the smallest
	 * fence register that can contain the object.
	 */
	if (IS_I9XX(dev))
		start = 1024*1024;
	else
		start = 512*1024;

	for (i = start; i < obj->size; i <<= 1)
		;

	return i;
}

/**
 * i915_gem_mmap_gtt_ioctl - prepare an object for GTT mmap'ing
 * @dev: DRM device
 * @data: GTT mapping ioctl data
 * @file_priv: GEM object info
 *
 * Simply returns the fake offset to userspace so it can mmap it.
 * The mmap call will end up in drm_gem_mmap(), which will set things
 * up so we can get faults in the handler above.
 *
 * The fault handler will take care of binding the object into the GTT
 * (since it may have been evicted to make room for something), allocating
 * a fence register, and mapping the appropriate aperture address into
 * userspace.
 */
int
i915_gem_mmap_gtt_ioctl(struct drm_device *dev, void *data,
			struct drm_file *file_priv)
{
	struct drm_i915_gem_mmap_gtt *args = data;
	struct drm_i915_private *dev_priv = dev->dev_private;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;
	int ret;

	if (!(dev->driver->driver_features & DRIVER_GEM))
		return -ENODEV;

	obj = drm_gem_object_lookup(dev, file_priv, args->handle);
	if (obj == NULL)
		return -EBADF;

	mutex_lock(&dev->struct_mutex);

	obj_priv = to_intel_bo(obj);

	if (obj_priv->madv != I915_MADV_WILLNEED) {
		DRM_ERROR("Attempting to mmap a purgeable buffer\n");
		drm_gem_object_unreference(obj);
		mutex_unlock(&dev->struct_mutex);
		return -EINVAL;
	}

	if (!obj_priv->mmap_offset) {
		ret = i915_gem_create_mmap_offset(obj);
		if (ret) {
			drm_gem_object_unreference(obj);
			mutex_unlock(&dev->struct_mutex);
			return ret;
		}
	}

	args->offset = obj_priv->mmap_offset;

	/*
	 * Pull it into the GTT so that we have a page list (makes the
	 * initial fault faster and any subsequent flushing possible).
	 */
	if (!obj_priv->agp_mem) {
		ret = i915_gem_object_bind_to_gtt(obj, 0);
		if (ret) {
			drm_gem_object_unreference(obj);
			mutex_unlock(&dev->struct_mutex);
			return ret;
		}
		list_add_tail(&obj_priv->list, &dev_priv->mm.inactive_list);
	}

	drm_gem_object_unreference(obj);
	mutex_unlock(&dev->struct_mutex);

	return 0;
}

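/* Drops a reference on the object's backing pages; on the last reference
 * the pages are marked dirty/accessed as appropriate and released back to
 * the shmem file.
 */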
void
i915_gem_object_put_pages(struct drm_gem_object *obj)
{
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	int page_count = obj->size / PAGE_SIZE;
	int i;

	BUG_ON(obj_priv->pages_refcount == 0);
	BUG_ON(obj_priv->madv == __I915_MADV_PURGED);

	if (--obj_priv->pages_refcount != 0)
		return;

	if (obj_priv->tiling_mode != I915_TILING_NONE)
		i915_gem_object_save_bit_17_swizzle(obj);

	if (obj_priv->madv == I915_MADV_DONTNEED)
		obj_priv->dirty = 0;

	for (i = 0; i < page_count; i++) {
		if (obj_priv->dirty)
			set_page_dirty(obj_priv->pages[i]);

		if (obj_priv->madv == I915_MADV_WILLNEED)
			mark_page_accessed(obj_priv->pages[i]);

		page_cache_release(obj_priv->pages[i]);
	}
	obj_priv->dirty = 0;

	drm_free_large(obj_priv->pages);
	obj_priv->pages = NULL;
}

1484static void
Zou Nan hai852835f2010-05-21 09:08:56 +08001485i915_gem_object_move_to_active(struct drm_gem_object *obj, uint32_t seqno,
1486 struct intel_ring_buffer *ring)
Eric Anholt673a3942008-07-30 12:06:12 -07001487{
1488 struct drm_device *dev = obj->dev;
1489 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01001490 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Zou Nan hai852835f2010-05-21 09:08:56 +08001491 BUG_ON(ring == NULL);
1492 obj_priv->ring = ring;
Eric Anholt673a3942008-07-30 12:06:12 -07001493
1494 /* Add a reference if we're newly entering the active list. */
1495 if (!obj_priv->active) {
1496 drm_gem_object_reference(obj);
1497 obj_priv->active = 1;
1498 }
1499 /* Move from whatever list we were on to the tail of execution. */
Carl Worth5e118f42009-03-20 11:54:25 -07001500 spin_lock(&dev_priv->mm.active_list_lock);
Zou Nan hai852835f2010-05-21 09:08:56 +08001501 list_move_tail(&obj_priv->list, &ring->active_list);
Carl Worth5e118f42009-03-20 11:54:25 -07001502 spin_unlock(&dev_priv->mm.active_list_lock);
Eric Anholtce44b0e2008-11-06 16:00:31 -08001503 obj_priv->last_rendering_seqno = seqno;
Eric Anholt673a3942008-07-30 12:06:12 -07001504}
1505
Eric Anholtce44b0e2008-11-06 16:00:31 -08001506static void
1507i915_gem_object_move_to_flushing(struct drm_gem_object *obj)
1508{
1509 struct drm_device *dev = obj->dev;
1510 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01001511 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholtce44b0e2008-11-06 16:00:31 -08001512
1513 BUG_ON(!obj_priv->active);
1514 list_move_tail(&obj_priv->list, &dev_priv->mm.flushing_list);
1515 obj_priv->last_rendering_seqno = 0;
1516}
Eric Anholt673a3942008-07-30 12:06:12 -07001517
Chris Wilson963b4832009-09-20 23:03:54 +01001518/* Immediately discard the backing storage */
1519static void
1520i915_gem_object_truncate(struct drm_gem_object *obj)
1521{
Daniel Vetter23010e42010-03-08 13:35:02 +01001522 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Chris Wilsonbb6baf72009-09-22 14:24:13 +01001523 struct inode *inode;
Chris Wilson963b4832009-09-20 23:03:54 +01001524
Chris Wilsonbb6baf72009-09-22 14:24:13 +01001525 inode = obj->filp->f_path.dentry->d_inode;
1526 if (inode->i_op->truncate)
 1527		inode->i_op->truncate(inode);
1528
1529 obj_priv->madv = __I915_MADV_PURGED;
Chris Wilson963b4832009-09-20 23:03:54 +01001530}
1531
1532static inline int
1533i915_gem_object_is_purgeable(struct drm_i915_gem_object *obj_priv)
1534{
1535 return obj_priv->madv == I915_MADV_DONTNEED;
1536}
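/*
 * Note: i915_gem_object_truncate() and the predicate above implement a
 * three-state madvise lifecycle:
 *
 *   I915_MADV_WILLNEED -> I915_MADV_DONTNEED  (userspace hint)
 *   I915_MADV_DONTNEED -> __I915_MADV_PURGED  (kernel truncated the
 *                                              backing store)
 *
 * Only DONTNEED objects are eligible for truncation; once purged the
 * pages are gone for good and mapping attempts are rejected (see the
 * WILLNEED check in i915_gem_mmap_gtt_ioctl() above).
 */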
1537
Eric Anholt673a3942008-07-30 12:06:12 -07001538static void
1539i915_gem_object_move_to_inactive(struct drm_gem_object *obj)
1540{
1541 struct drm_device *dev = obj->dev;
1542 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01001543 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001544
1545 i915_verify_inactive(dev, __FILE__, __LINE__);
1546 if (obj_priv->pin_count != 0)
1547 list_del_init(&obj_priv->list);
1548 else
1549 list_move_tail(&obj_priv->list, &dev_priv->mm.inactive_list);
1550
Daniel Vetter99fcb762010-02-07 16:20:18 +01001551 BUG_ON(!list_empty(&obj_priv->gpu_write_list));
1552
Eric Anholtce44b0e2008-11-06 16:00:31 -08001553 obj_priv->last_rendering_seqno = 0;
Zou Nan hai852835f2010-05-21 09:08:56 +08001554 obj_priv->ring = NULL;
Eric Anholt673a3942008-07-30 12:06:12 -07001555 if (obj_priv->active) {
1556 obj_priv->active = 0;
1557 drm_gem_object_unreference(obj);
1558 }
1559 i915_verify_inactive(dev, __FILE__, __LINE__);
1560}
1561
Daniel Vetter63560392010-02-19 11:51:59 +01001562static void
1563i915_gem_process_flushing_list(struct drm_device *dev,
Zou Nan hai852835f2010-05-21 09:08:56 +08001564 uint32_t flush_domains, uint32_t seqno,
1565 struct intel_ring_buffer *ring)
Daniel Vetter63560392010-02-19 11:51:59 +01001566{
1567 drm_i915_private_t *dev_priv = dev->dev_private;
1568 struct drm_i915_gem_object *obj_priv, *next;
1569
1570 list_for_each_entry_safe(obj_priv, next,
1571 &dev_priv->mm.gpu_write_list,
1572 gpu_write_list) {
Daniel Vettera8089e82010-04-09 19:05:09 +00001573 struct drm_gem_object *obj = &obj_priv->base;
Daniel Vetter63560392010-02-19 11:51:59 +01001574
1575 if ((obj->write_domain & flush_domains) ==
Zou Nan hai852835f2010-05-21 09:08:56 +08001576 obj->write_domain &&
1577 obj_priv->ring->ring_flag == ring->ring_flag) {
Daniel Vetter63560392010-02-19 11:51:59 +01001578 uint32_t old_write_domain = obj->write_domain;
1579
1580 obj->write_domain = 0;
1581 list_del_init(&obj_priv->gpu_write_list);
Zou Nan hai852835f2010-05-21 09:08:56 +08001582 i915_gem_object_move_to_active(obj, seqno, ring);
Daniel Vetter63560392010-02-19 11:51:59 +01001583
 1584			/* Update the fence LRU list */
Daniel Vetter007cc8a2010-04-28 11:02:31 +02001585 if (obj_priv->fence_reg != I915_FENCE_REG_NONE) {
1586 struct drm_i915_fence_reg *reg =
1587 &dev_priv->fence_regs[obj_priv->fence_reg];
1588 list_move_tail(&reg->lru_list,
Daniel Vetter63560392010-02-19 11:51:59 +01001589 &dev_priv->mm.fence_list);
Daniel Vetter007cc8a2010-04-28 11:02:31 +02001590 }
Daniel Vetter63560392010-02-19 11:51:59 +01001591
1592 trace_i915_gem_object_change_domain(obj,
1593 obj->read_domains,
1594 old_write_domain);
1595 }
1596 }
1597}
Zou Nan hai8187a2b2010-05-21 09:08:55 +08001598
Daniel Vetter5a5a0c62009-09-15 22:57:36 +02001599uint32_t
Eric Anholtb9624422009-06-03 07:27:35 +00001600i915_add_request(struct drm_device *dev, struct drm_file *file_priv,
Zou Nan hai852835f2010-05-21 09:08:56 +08001601 uint32_t flush_domains, struct intel_ring_buffer *ring)
Eric Anholt673a3942008-07-30 12:06:12 -07001602{
1603 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholtb9624422009-06-03 07:27:35 +00001604 struct drm_i915_file_private *i915_file_priv = NULL;
Eric Anholt673a3942008-07-30 12:06:12 -07001605 struct drm_i915_gem_request *request;
1606 uint32_t seqno;
1607 int was_empty;
Eric Anholt673a3942008-07-30 12:06:12 -07001608
Eric Anholtb9624422009-06-03 07:27:35 +00001609 if (file_priv != NULL)
1610 i915_file_priv = file_priv->driver_priv;
1611
Eric Anholt9a298b22009-03-24 12:23:04 -07001612 request = kzalloc(sizeof(*request), GFP_KERNEL);
Eric Anholt673a3942008-07-30 12:06:12 -07001613 if (request == NULL)
1614 return 0;
1615
Zou Nan hai852835f2010-05-21 09:08:56 +08001616 seqno = ring->add_request(dev, ring, file_priv, flush_domains);
Eric Anholt673a3942008-07-30 12:06:12 -07001617
1618 request->seqno = seqno;
Zou Nan hai852835f2010-05-21 09:08:56 +08001619 request->ring = ring;
Eric Anholt673a3942008-07-30 12:06:12 -07001620 request->emitted_jiffies = jiffies;
Zou Nan hai852835f2010-05-21 09:08:56 +08001621 was_empty = list_empty(&ring->request_list);
1622 list_add_tail(&request->list, &ring->request_list);
1623
Eric Anholtb9624422009-06-03 07:27:35 +00001624 if (i915_file_priv) {
1625 list_add_tail(&request->client_list,
1626 &i915_file_priv->mm.request_list);
1627 } else {
1628 INIT_LIST_HEAD(&request->client_list);
1629 }
Eric Anholt673a3942008-07-30 12:06:12 -07001630
Eric Anholtce44b0e2008-11-06 16:00:31 -08001631 /* Associate any objects on the flushing list matching the write
1632 * domain we're flushing with our flush.
1633 */
Daniel Vetter63560392010-02-19 11:51:59 +01001634 if (flush_domains != 0)
Zou Nan hai852835f2010-05-21 09:08:56 +08001635 i915_gem_process_flushing_list(dev, flush_domains, seqno, ring);
Eric Anholtce44b0e2008-11-06 16:00:31 -08001636
Ben Gamarif65d9422009-09-14 17:48:44 -04001637 if (!dev_priv->mm.suspended) {
1638 mod_timer(&dev_priv->hangcheck_timer, jiffies + DRM_I915_HANGCHECK_PERIOD);
1639 if (was_empty)
1640 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, HZ);
1641 }
Eric Anholt673a3942008-07-30 12:06:12 -07001642 return seqno;
1643}
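/*
 * Note: besides emitting the seqno into the ring, each new request
 * re-arms the hangcheck timer and, if the ring was previously idle,
 * schedules the retire work one second (HZ) out, so completed requests
 * are reaped even if no further submissions arrive.
 */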
1644
1645/**
1646 * Command execution barrier
1647 *
1648 * Ensures that all commands in the ring are finished
1649 * before signalling the CPU
1650 */
Eric Anholt3043c602008-10-02 12:24:47 -07001651static uint32_t
Zou Nan hai852835f2010-05-21 09:08:56 +08001652i915_retire_commands(struct drm_device *dev, struct intel_ring_buffer *ring)
Eric Anholt673a3942008-07-30 12:06:12 -07001653{
Eric Anholt673a3942008-07-30 12:06:12 -07001654 uint32_t flush_domains = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001655
1656 /* The sampler always gets flushed on i965 (sigh) */
1657 if (IS_I965G(dev))
1658 flush_domains |= I915_GEM_DOMAIN_SAMPLER;
Zou Nan hai852835f2010-05-21 09:08:56 +08001659
1660 ring->flush(dev, ring,
1661 I915_GEM_DOMAIN_COMMAND, flush_domains);
Eric Anholt673a3942008-07-30 12:06:12 -07001662 return flush_domains;
1663}
1664
1665/**
 1666 * Moves buffers associated only with the given active seqno from the active
 1667 * list to the flushing or inactive lists as appropriate, potentially freeing them.
1668 */
1669static void
1670i915_gem_retire_request(struct drm_device *dev,
1671 struct drm_i915_gem_request *request)
1672{
1673 drm_i915_private_t *dev_priv = dev->dev_private;
1674
Chris Wilson1c5d22f2009-08-25 11:15:50 +01001675 trace_i915_gem_request_retire(dev, request->seqno);
1676
Eric Anholt673a3942008-07-30 12:06:12 -07001677 /* Move any buffers on the active list that are no longer referenced
1678 * by the ringbuffer to the flushing/inactive lists as appropriate.
1679 */
Carl Worth5e118f42009-03-20 11:54:25 -07001680 spin_lock(&dev_priv->mm.active_list_lock);
Zou Nan hai852835f2010-05-21 09:08:56 +08001681 while (!list_empty(&request->ring->active_list)) {
Eric Anholt673a3942008-07-30 12:06:12 -07001682 struct drm_gem_object *obj;
1683 struct drm_i915_gem_object *obj_priv;
1684
Zou Nan hai852835f2010-05-21 09:08:56 +08001685 obj_priv = list_first_entry(&request->ring->active_list,
Eric Anholt673a3942008-07-30 12:06:12 -07001686 struct drm_i915_gem_object,
1687 list);
Daniel Vettera8089e82010-04-09 19:05:09 +00001688 obj = &obj_priv->base;
Eric Anholt673a3942008-07-30 12:06:12 -07001689
1690 /* If the seqno being retired doesn't match the oldest in the
1691 * list, then the oldest in the list must still be newer than
1692 * this seqno.
1693 */
1694 if (obj_priv->last_rendering_seqno != request->seqno)
Carl Worth5e118f42009-03-20 11:54:25 -07001695 goto out;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001696
Eric Anholt673a3942008-07-30 12:06:12 -07001697#if WATCH_LRU
1698 DRM_INFO("%s: retire %d moves to inactive list %p\n",
1699 __func__, request->seqno, obj);
1700#endif
1701
Eric Anholtce44b0e2008-11-06 16:00:31 -08001702 if (obj->write_domain != 0)
1703 i915_gem_object_move_to_flushing(obj);
Shaohua Li68c84342009-04-08 10:58:23 +08001704 else {
1705 /* Take a reference on the object so it won't be
1706 * freed while the spinlock is held. The list
1707 * protection for this spinlock is safe when breaking
1708 * the lock like this since the next thing we do
1709 * is just get the head of the list again.
1710 */
1711 drm_gem_object_reference(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001712 i915_gem_object_move_to_inactive(obj);
Shaohua Li68c84342009-04-08 10:58:23 +08001713 spin_unlock(&dev_priv->mm.active_list_lock);
1714 drm_gem_object_unreference(obj);
1715 spin_lock(&dev_priv->mm.active_list_lock);
1716 }
Eric Anholt673a3942008-07-30 12:06:12 -07001717 }
Carl Worth5e118f42009-03-20 11:54:25 -07001718out:
1719 spin_unlock(&dev_priv->mm.active_list_lock);
Eric Anholt673a3942008-07-30 12:06:12 -07001720}
1721
1722/**
 1723 * Returns true if seq1 is at or after seq2, using wraparound-safe arithmetic.
1724 */
Ben Gamari22be1722009-09-14 17:48:43 -04001725bool
Eric Anholt673a3942008-07-30 12:06:12 -07001726i915_seqno_passed(uint32_t seq1, uint32_t seq2)
1727{
1728 return (int32_t)(seq1 - seq2) >= 0;
1729}
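/*
 * Note: the signed difference above is wraparound safe as long as the
 * two seqnos are within 2^31 of each other, and it treats equal seqnos
 * as "passed".
 */
#if 0
/* Illustrative self-checks (hypothetical values): */
static void example_seqno_wrap_check(void)
{
	BUG_ON(!i915_seqno_passed(0x00000002, 0xfffffffe));	/* wrapped */
	BUG_ON(!i915_seqno_passed(10, 10));			/* equal   */
	BUG_ON(i915_seqno_passed(5, 6));			/* not yet */
}
#endif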
1730
1731uint32_t
Zou Nan hai852835f2010-05-21 09:08:56 +08001732i915_get_gem_seqno(struct drm_device *dev,
1733 struct intel_ring_buffer *ring)
Eric Anholt673a3942008-07-30 12:06:12 -07001734{
Zou Nan hai852835f2010-05-21 09:08:56 +08001735 return ring->get_gem_seqno(dev, ring);
Eric Anholt673a3942008-07-30 12:06:12 -07001736}
1737
1738/**
1739 * This function clears the request list as sequence numbers are passed.
1740 */
1741void
Zou Nan hai852835f2010-05-21 09:08:56 +08001742i915_gem_retire_requests(struct drm_device *dev,
1743 struct intel_ring_buffer *ring)
Eric Anholt673a3942008-07-30 12:06:12 -07001744{
1745 drm_i915_private_t *dev_priv = dev->dev_private;
1746 uint32_t seqno;
1747
Zou Nan hai8187a2b2010-05-21 09:08:55 +08001748 if (!ring->status_page.page_addr
Zou Nan hai852835f2010-05-21 09:08:56 +08001749 || list_empty(&ring->request_list))
Karsten Wiese6c0594a2009-02-23 15:07:57 +01001750 return;
1751
Zou Nan hai852835f2010-05-21 09:08:56 +08001752 seqno = i915_get_gem_seqno(dev, ring);
Eric Anholt673a3942008-07-30 12:06:12 -07001753
Zou Nan hai852835f2010-05-21 09:08:56 +08001754 while (!list_empty(&ring->request_list)) {
Eric Anholt673a3942008-07-30 12:06:12 -07001755 struct drm_i915_gem_request *request;
1756 uint32_t retiring_seqno;
1757
Zou Nan hai852835f2010-05-21 09:08:56 +08001758 request = list_first_entry(&ring->request_list,
Eric Anholt673a3942008-07-30 12:06:12 -07001759 struct drm_i915_gem_request,
1760 list);
1761 retiring_seqno = request->seqno;
1762
1763 if (i915_seqno_passed(seqno, retiring_seqno) ||
Ben Gamariba1234d2009-09-14 17:48:47 -04001764 atomic_read(&dev_priv->mm.wedged)) {
Eric Anholt673a3942008-07-30 12:06:12 -07001765 i915_gem_retire_request(dev, request);
1766
1767 list_del(&request->list);
Eric Anholtb9624422009-06-03 07:27:35 +00001768 list_del(&request->client_list);
Eric Anholt9a298b22009-03-24 12:23:04 -07001769 kfree(request);
Eric Anholt673a3942008-07-30 12:06:12 -07001770 } else
1771 break;
1772 }
Chris Wilson9d34e5d2009-09-24 05:26:06 +01001773
 1774	if (unlikely(dev_priv->trace_irq_seqno &&
1775 i915_seqno_passed(dev_priv->trace_irq_seqno, seqno))) {
Zou Nan hai8187a2b2010-05-21 09:08:55 +08001776
1777 ring->user_irq_put(dev, ring);
Chris Wilson9d34e5d2009-09-24 05:26:06 +01001778 dev_priv->trace_irq_seqno = 0;
1779 }
Eric Anholt673a3942008-07-30 12:06:12 -07001780}
1781
1782void
1783i915_gem_retire_work_handler(struct work_struct *work)
1784{
1785 drm_i915_private_t *dev_priv;
1786 struct drm_device *dev;
1787
1788 dev_priv = container_of(work, drm_i915_private_t,
1789 mm.retire_work.work);
1790 dev = dev_priv->dev;
1791
1792 mutex_lock(&dev->struct_mutex);
Zou Nan hai852835f2010-05-21 09:08:56 +08001793 i915_gem_retire_requests(dev, &dev_priv->render_ring);
1794
Keith Packard6dbe2772008-10-14 21:41:13 -07001795 if (!dev_priv->mm.suspended &&
Zou Nan hai852835f2010-05-21 09:08:56 +08001796 (!list_empty(&dev_priv->render_ring.request_list)))
Eric Anholt9c9fe1f2009-08-03 16:09:16 -07001797 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, HZ);
Eric Anholt673a3942008-07-30 12:06:12 -07001798 mutex_unlock(&dev->struct_mutex);
1799}
1800
Daniel Vetter5a5a0c62009-09-15 22:57:36 +02001801int
Zou Nan hai852835f2010-05-21 09:08:56 +08001802i915_do_wait_request(struct drm_device *dev, uint32_t seqno,
1803 int interruptible, struct intel_ring_buffer *ring)
Eric Anholt673a3942008-07-30 12:06:12 -07001804{
1805 drm_i915_private_t *dev_priv = dev->dev_private;
Jesse Barnes802c7eb2009-05-05 16:03:48 -07001806 u32 ier;
Eric Anholt673a3942008-07-30 12:06:12 -07001807 int ret = 0;
1808
1809 BUG_ON(seqno == 0);
1810
Ben Gamariba1234d2009-09-14 17:48:47 -04001811 if (atomic_read(&dev_priv->mm.wedged))
Ben Gamariffed1d02009-09-14 17:48:41 -04001812 return -EIO;
1813
Zou Nan hai852835f2010-05-21 09:08:56 +08001814 if (!i915_seqno_passed(ring->get_gem_seqno(dev, ring), seqno)) {
Eric Anholtbad720f2009-10-22 16:11:14 -07001815 if (HAS_PCH_SPLIT(dev))
Zhenyu Wang036a4a72009-06-08 14:40:19 +08001816 ier = I915_READ(DEIER) | I915_READ(GTIER);
1817 else
1818 ier = I915_READ(IER);
Jesse Barnes802c7eb2009-05-05 16:03:48 -07001819 if (!ier) {
1820 DRM_ERROR("something (likely vbetool) disabled "
1821 "interrupts, re-enabling\n");
1822 i915_driver_irq_preinstall(dev);
1823 i915_driver_irq_postinstall(dev);
1824 }
1825
Chris Wilson1c5d22f2009-08-25 11:15:50 +01001826 trace_i915_gem_request_wait_begin(dev, seqno);
1827
Zou Nan hai852835f2010-05-21 09:08:56 +08001828 ring->waiting_gem_seqno = seqno;
Zou Nan hai8187a2b2010-05-21 09:08:55 +08001829 ring->user_irq_get(dev, ring);
Daniel Vetter48764bf2009-09-15 22:57:32 +02001830 if (interruptible)
Zou Nan hai852835f2010-05-21 09:08:56 +08001831 ret = wait_event_interruptible(ring->irq_queue,
1832 i915_seqno_passed(
1833 ring->get_gem_seqno(dev, ring), seqno)
1834 || atomic_read(&dev_priv->mm.wedged));
Daniel Vetter48764bf2009-09-15 22:57:32 +02001835 else
Zou Nan hai852835f2010-05-21 09:08:56 +08001836 wait_event(ring->irq_queue,
1837 i915_seqno_passed(
1838 ring->get_gem_seqno(dev, ring), seqno)
1839 || atomic_read(&dev_priv->mm.wedged));
Daniel Vetter48764bf2009-09-15 22:57:32 +02001840
Zou Nan hai8187a2b2010-05-21 09:08:55 +08001841 ring->user_irq_put(dev, ring);
Zou Nan hai852835f2010-05-21 09:08:56 +08001842 ring->waiting_gem_seqno = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01001843
1844 trace_i915_gem_request_wait_end(dev, seqno);
Eric Anholt673a3942008-07-30 12:06:12 -07001845 }
Ben Gamariba1234d2009-09-14 17:48:47 -04001846 if (atomic_read(&dev_priv->mm.wedged))
Eric Anholt673a3942008-07-30 12:06:12 -07001847 ret = -EIO;
1848
1849 if (ret && ret != -ERESTARTSYS)
1850 DRM_ERROR("%s returns %d (awaiting %d at %d)\n",
Zou Nan hai852835f2010-05-21 09:08:56 +08001851 __func__, ret, seqno, ring->get_gem_seqno(dev, ring));
Eric Anholt673a3942008-07-30 12:06:12 -07001852
1853 /* Directly dispatch request retiring. While we have the work queue
1854 * to handle this, the waiter on a request often wants an associated
1855 * buffer to have made it to the inactive list, and we would need
1856 * a separate wait queue to handle that.
1857 */
1858 if (ret == 0)
Zou Nan hai852835f2010-05-21 09:08:56 +08001859 i915_gem_retire_requests(dev, ring);
Eric Anholt673a3942008-07-30 12:06:12 -07001860
1861 return ret;
1862}
1863
Daniel Vetter48764bf2009-09-15 22:57:32 +02001864/**
1865 * Waits for a sequence number to be signaled, and cleans up the
1866 * request and object lists appropriately for that event.
1867 */
1868static int
Zou Nan hai852835f2010-05-21 09:08:56 +08001869i915_wait_request(struct drm_device *dev, uint32_t seqno,
1870 struct intel_ring_buffer *ring)
Daniel Vetter48764bf2009-09-15 22:57:32 +02001871{
Zou Nan hai852835f2010-05-21 09:08:56 +08001872 return i915_do_wait_request(dev, seqno, 1, ring);
Daniel Vetter48764bf2009-09-15 22:57:32 +02001873}
1874
Zou Nan hai8187a2b2010-05-21 09:08:55 +08001875static void
1876i915_gem_flush(struct drm_device *dev,
1877 uint32_t invalidate_domains,
1878 uint32_t flush_domains)
1879{
1880 drm_i915_private_t *dev_priv = dev->dev_private;
1881 if (flush_domains & I915_GEM_DOMAIN_CPU)
1882 drm_agp_chipset_flush(dev);
1883 dev_priv->render_ring.flush(dev, &dev_priv->render_ring,
1884 invalidate_domains,
1885 flush_domains);
1886}
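/*
 * Note: i915_gem_flush() above is the legacy, render-ring-only entry
 * point; i915_gem_flush_ring() below takes the target ring explicitly.
 * Both handle the CPU domain with a chipset flush, which the GPU rings
 * cannot perform themselves.
 */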
1887
Zou Nan hai852835f2010-05-21 09:08:56 +08001888static void
1889i915_gem_flush_ring(struct drm_device *dev,
1890 uint32_t invalidate_domains,
1891 uint32_t flush_domains,
1892 struct intel_ring_buffer *ring)
1893{
1894 if (flush_domains & I915_GEM_DOMAIN_CPU)
1895 drm_agp_chipset_flush(dev);
1896 ring->flush(dev, ring,
1897 invalidate_domains,
1898 flush_domains);
1899}
1900
Eric Anholt673a3942008-07-30 12:06:12 -07001901/**
1902 * Ensures that all rendering to the object has completed and the object is
1903 * safe to unbind from the GTT or access from the CPU.
1904 */
1905static int
1906i915_gem_object_wait_rendering(struct drm_gem_object *obj)
1907{
1908 struct drm_device *dev = obj->dev;
Daniel Vetter23010e42010-03-08 13:35:02 +01001909 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001910 int ret;
1911
Eric Anholte47c68e2008-11-14 13:35:19 -08001912 /* This function only exists to support waiting for existing rendering,
1913 * not for emitting required flushes.
Eric Anholt673a3942008-07-30 12:06:12 -07001914 */
Eric Anholte47c68e2008-11-14 13:35:19 -08001915 BUG_ON((obj->write_domain & I915_GEM_GPU_DOMAINS) != 0);
Eric Anholt673a3942008-07-30 12:06:12 -07001916
1917 /* If there is rendering queued on the buffer being evicted, wait for
1918 * it.
1919 */
1920 if (obj_priv->active) {
1921#if WATCH_BUF
1922 DRM_INFO("%s: object %p wait for seqno %08x\n",
1923 __func__, obj, obj_priv->last_rendering_seqno);
1924#endif
Zou Nan hai852835f2010-05-21 09:08:56 +08001925 ret = i915_wait_request(dev,
1926 obj_priv->last_rendering_seqno, obj_priv->ring);
Eric Anholt673a3942008-07-30 12:06:12 -07001927 if (ret != 0)
1928 return ret;
1929 }
1930
1931 return 0;
1932}
1933
1934/**
1935 * Unbinds an object from the GTT aperture.
1936 */
Jesse Barnes0f973f22009-01-26 17:10:45 -08001937int
Eric Anholt673a3942008-07-30 12:06:12 -07001938i915_gem_object_unbind(struct drm_gem_object *obj)
1939{
1940 struct drm_device *dev = obj->dev;
Daniel Vetter4a87b8c2010-02-19 11:51:57 +01001941 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01001942 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001943 int ret = 0;
1944
1945#if WATCH_BUF
1946 DRM_INFO("%s:%d %p\n", __func__, __LINE__, obj);
1947 DRM_INFO("gtt_space %p\n", obj_priv->gtt_space);
1948#endif
1949 if (obj_priv->gtt_space == NULL)
1950 return 0;
1951
1952 if (obj_priv->pin_count != 0) {
1953 DRM_ERROR("Attempting to unbind pinned buffer\n");
1954 return -EINVAL;
1955 }
1956
Eric Anholt5323fd02009-09-09 11:50:45 -07001957 /* blow away mappings if mapped through GTT */
1958 i915_gem_release_mmap(obj);
1959
Eric Anholt673a3942008-07-30 12:06:12 -07001960 /* Move the object to the CPU domain to ensure that
1961 * any possible CPU writes while it's not in the GTT
1962 * are flushed when we go to remap it. This will
1963 * also ensure that all pending GPU writes are finished
1964 * before we unbind.
1965 */
Eric Anholte47c68e2008-11-14 13:35:19 -08001966 ret = i915_gem_object_set_to_cpu_domain(obj, 1);
Eric Anholt673a3942008-07-30 12:06:12 -07001967 if (ret) {
Eric Anholte47c68e2008-11-14 13:35:19 -08001968 if (ret != -ERESTARTSYS)
1969 DRM_ERROR("set_domain failed: %d\n", ret);
Eric Anholt673a3942008-07-30 12:06:12 -07001970 return ret;
1971 }
1972
Eric Anholt5323fd02009-09-09 11:50:45 -07001973 BUG_ON(obj_priv->active);
1974
Daniel Vetter96b47b62009-12-15 17:50:00 +01001975 /* release the fence reg _after_ flushing */
1976 if (obj_priv->fence_reg != I915_FENCE_REG_NONE)
1977 i915_gem_clear_fence_reg(obj);
1978
Eric Anholt673a3942008-07-30 12:06:12 -07001979 if (obj_priv->agp_mem != NULL) {
1980 drm_unbind_agp(obj_priv->agp_mem);
1981 drm_free_agp(obj_priv->agp_mem, obj->size / PAGE_SIZE);
1982 obj_priv->agp_mem = NULL;
1983 }
1984
Eric Anholt856fa192009-03-19 14:10:50 -07001985 i915_gem_object_put_pages(obj);
Chris Wilsona32808c2009-09-20 21:29:47 +01001986 BUG_ON(obj_priv->pages_refcount);
Eric Anholt673a3942008-07-30 12:06:12 -07001987
1988 if (obj_priv->gtt_space) {
1989 atomic_dec(&dev->gtt_count);
1990 atomic_sub(obj->size, &dev->gtt_memory);
1991
1992 drm_mm_put_block(obj_priv->gtt_space);
1993 obj_priv->gtt_space = NULL;
1994 }
1995
1996 /* Remove ourselves from the LRU list if present. */
Daniel Vetter4a87b8c2010-02-19 11:51:57 +01001997 spin_lock(&dev_priv->mm.active_list_lock);
Eric Anholt673a3942008-07-30 12:06:12 -07001998 if (!list_empty(&obj_priv->list))
1999 list_del_init(&obj_priv->list);
Daniel Vetter4a87b8c2010-02-19 11:51:57 +01002000 spin_unlock(&dev_priv->mm.active_list_lock);
Eric Anholt673a3942008-07-30 12:06:12 -07002001
Chris Wilson963b4832009-09-20 23:03:54 +01002002 if (i915_gem_object_is_purgeable(obj_priv))
2003 i915_gem_object_truncate(obj);
2004
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002005 trace_i915_gem_object_unbind(obj);
2006
Eric Anholt673a3942008-07-30 12:06:12 -07002007 return 0;
2008}
2009
Chris Wilson07f73f62009-09-14 16:50:30 +01002010static struct drm_gem_object *
2011i915_gem_find_inactive_object(struct drm_device *dev, int min_size)
2012{
2013 drm_i915_private_t *dev_priv = dev->dev_private;
2014 struct drm_i915_gem_object *obj_priv;
2015 struct drm_gem_object *best = NULL;
2016 struct drm_gem_object *first = NULL;
2017
2018 /* Try to find the smallest clean object */
2019 list_for_each_entry(obj_priv, &dev_priv->mm.inactive_list, list) {
Daniel Vettera8089e82010-04-09 19:05:09 +00002020 struct drm_gem_object *obj = &obj_priv->base;
Chris Wilson07f73f62009-09-14 16:50:30 +01002021 if (obj->size >= min_size) {
Chris Wilson963b4832009-09-20 23:03:54 +01002022 if ((!obj_priv->dirty ||
2023 i915_gem_object_is_purgeable(obj_priv)) &&
Chris Wilson07f73f62009-09-14 16:50:30 +01002024 (!best || obj->size < best->size)) {
2025 best = obj;
2026 if (best->size == min_size)
2027 return best;
2028 }
2029 if (!first)
2030 first = obj;
2031 }
2032 }
2033
2034 return best ? best : first;
2035}
2036
Eric Anholt673a3942008-07-30 12:06:12 -07002037static int
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002038i915_gpu_idle(struct drm_device *dev)
2039{
2040 drm_i915_private_t *dev_priv = dev->dev_private;
2041 bool lists_empty;
2042 uint32_t seqno;
Zou Nan hai852835f2010-05-21 09:08:56 +08002043 int ret;
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002044
2045 spin_lock(&dev_priv->mm.active_list_lock);
2046 lists_empty = list_empty(&dev_priv->mm.flushing_list) &&
Zou Nan hai852835f2010-05-21 09:08:56 +08002047 list_empty(&dev_priv->render_ring.active_list);
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002048 spin_unlock(&dev_priv->mm.active_list_lock);
2049
2050 if (lists_empty)
2051 return 0;
2052
2053 /* Flush everything onto the inactive list. */
2054 i915_gem_flush(dev, I915_GEM_GPU_DOMAINS, I915_GEM_GPU_DOMAINS);
Zou Nan hai852835f2010-05-21 09:08:56 +08002055 seqno = i915_add_request(dev, NULL, I915_GEM_GPU_DOMAINS,
2056 &dev_priv->render_ring);
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002057 if (seqno == 0)
2058 return -ENOMEM;
Zou Nan hai852835f2010-05-21 09:08:56 +08002059 ret = i915_wait_request(dev, seqno, &dev_priv->render_ring);
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002060
Zou Nan hai852835f2010-05-21 09:08:56 +08002061 return ret;
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002062}
2063
2064static int
Chris Wilson07f73f62009-09-14 16:50:30 +01002065i915_gem_evict_everything(struct drm_device *dev)
2066{
2067 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson07f73f62009-09-14 16:50:30 +01002068 int ret;
2069 bool lists_empty;
2070
Chris Wilson07f73f62009-09-14 16:50:30 +01002071 spin_lock(&dev_priv->mm.active_list_lock);
2072 lists_empty = (list_empty(&dev_priv->mm.inactive_list) &&
2073 list_empty(&dev_priv->mm.flushing_list) &&
Zou Nan hai852835f2010-05-21 09:08:56 +08002074 list_empty(&dev_priv->render_ring.active_list));
Chris Wilson07f73f62009-09-14 16:50:30 +01002075 spin_unlock(&dev_priv->mm.active_list_lock);
2076
Chris Wilson97311292009-09-21 00:22:34 +01002077 if (lists_empty)
Chris Wilson07f73f62009-09-14 16:50:30 +01002078 return -ENOSPC;
Chris Wilson07f73f62009-09-14 16:50:30 +01002079
2080 /* Flush everything (on to the inactive lists) and evict */
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002081 ret = i915_gpu_idle(dev);
Chris Wilson07f73f62009-09-14 16:50:30 +01002082 if (ret)
2083 return ret;
2084
Daniel Vetter99fcb762010-02-07 16:20:18 +01002085 BUG_ON(!list_empty(&dev_priv->mm.flushing_list));
2086
Chris Wilsonab5ee572009-09-20 19:25:47 +01002087 ret = i915_gem_evict_from_inactive_list(dev);
Chris Wilson07f73f62009-09-14 16:50:30 +01002088 if (ret)
2089 return ret;
2090
2091 spin_lock(&dev_priv->mm.active_list_lock);
2092 lists_empty = (list_empty(&dev_priv->mm.inactive_list) &&
2093 list_empty(&dev_priv->mm.flushing_list) &&
Zou Nan hai852835f2010-05-21 09:08:56 +08002094 list_empty(&dev_priv->render_ring.active_list));
Chris Wilson07f73f62009-09-14 16:50:30 +01002095 spin_unlock(&dev_priv->mm.active_list_lock);
2096 BUG_ON(!lists_empty);
2097
Eric Anholt673a3942008-07-30 12:06:12 -07002098 return 0;
2099}
2100
2101static int
Chris Wilson07f73f62009-09-14 16:50:30 +01002102i915_gem_evict_something(struct drm_device *dev, int min_size)
Eric Anholt673a3942008-07-30 12:06:12 -07002103{
2104 drm_i915_private_t *dev_priv = dev->dev_private;
2105 struct drm_gem_object *obj;
Chris Wilson07f73f62009-09-14 16:50:30 +01002106 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07002107
Zou Nan hai852835f2010-05-21 09:08:56 +08002108 struct intel_ring_buffer *render_ring = &dev_priv->render_ring;
Eric Anholt673a3942008-07-30 12:06:12 -07002109 for (;;) {
Zou Nan hai852835f2010-05-21 09:08:56 +08002110 i915_gem_retire_requests(dev, render_ring);
Chris Wilson07f73f62009-09-14 16:50:30 +01002111
Eric Anholt673a3942008-07-30 12:06:12 -07002112 /* If there's an inactive buffer available now, grab it
2113 * and be done.
2114 */
Chris Wilson07f73f62009-09-14 16:50:30 +01002115 obj = i915_gem_find_inactive_object(dev, min_size);
2116 if (obj) {
2117 struct drm_i915_gem_object *obj_priv;
2118
Eric Anholt673a3942008-07-30 12:06:12 -07002119#if WATCH_LRU
2120 DRM_INFO("%s: evicting %p\n", __func__, obj);
2121#endif
Daniel Vetter23010e42010-03-08 13:35:02 +01002122 obj_priv = to_intel_bo(obj);
Chris Wilson07f73f62009-09-14 16:50:30 +01002123 BUG_ON(obj_priv->pin_count != 0);
Eric Anholt673a3942008-07-30 12:06:12 -07002124 BUG_ON(obj_priv->active);
2125
2126 /* Wait on the rendering and unbind the buffer. */
Chris Wilson07f73f62009-09-14 16:50:30 +01002127 return i915_gem_object_unbind(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07002128 }
2129
2130 /* If we didn't get anything, but the ring is still processing
Chris Wilson07f73f62009-09-14 16:50:30 +01002131		 * things, wait for the next request to finish; that should
 2132		 * leave us a buffer to evict.
Eric Anholt673a3942008-07-30 12:06:12 -07002133 */
Zou Nan hai852835f2010-05-21 09:08:56 +08002134 if (!list_empty(&render_ring->request_list)) {
Eric Anholt673a3942008-07-30 12:06:12 -07002135 struct drm_i915_gem_request *request;
2136
Zou Nan hai852835f2010-05-21 09:08:56 +08002137 request = list_first_entry(&render_ring->request_list,
Eric Anholt673a3942008-07-30 12:06:12 -07002138 struct drm_i915_gem_request,
2139 list);
2140
Zou Nan hai852835f2010-05-21 09:08:56 +08002141 ret = i915_wait_request(dev,
2142 request->seqno, request->ring);
Eric Anholt673a3942008-07-30 12:06:12 -07002143 if (ret)
Chris Wilson07f73f62009-09-14 16:50:30 +01002144 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07002145
Chris Wilson07f73f62009-09-14 16:50:30 +01002146 continue;
Eric Anholt673a3942008-07-30 12:06:12 -07002147 }
2148
2149 /* If we didn't have anything on the request list but there
2150 * are buffers awaiting a flush, emit one and try again.
2151 * When we wait on it, those buffers waiting for that flush
2152 * will get moved to inactive.
2153 */
2154 if (!list_empty(&dev_priv->mm.flushing_list)) {
Chris Wilson07f73f62009-09-14 16:50:30 +01002155 struct drm_i915_gem_object *obj_priv;
Eric Anholt673a3942008-07-30 12:06:12 -07002156
Chris Wilson9a1e2582009-09-20 20:16:50 +01002157 /* Find an object that we can immediately reuse */
2158 list_for_each_entry(obj_priv, &dev_priv->mm.flushing_list, list) {
Daniel Vettera8089e82010-04-09 19:05:09 +00002159 obj = &obj_priv->base;
Chris Wilson9a1e2582009-09-20 20:16:50 +01002160 if (obj->size >= min_size)
2161 break;
Eric Anholt673a3942008-07-30 12:06:12 -07002162
Chris Wilson9a1e2582009-09-20 20:16:50 +01002163 obj = NULL;
2164 }
Eric Anholt673a3942008-07-30 12:06:12 -07002165
Chris Wilson9a1e2582009-09-20 20:16:50 +01002166 if (obj != NULL) {
2167 uint32_t seqno;
Chris Wilson07f73f62009-09-14 16:50:30 +01002168
Zou Nan hai852835f2010-05-21 09:08:56 +08002169 i915_gem_flush_ring(dev,
Chris Wilson9a1e2582009-09-20 20:16:50 +01002170 obj->write_domain,
Zou Nan hai852835f2010-05-21 09:08:56 +08002171 obj->write_domain,
2172 obj_priv->ring);
2173 seqno = i915_add_request(dev, NULL,
2174 obj->write_domain,
2175 obj_priv->ring);
Chris Wilson9a1e2582009-09-20 20:16:50 +01002176 if (seqno == 0)
2177 return -ENOMEM;
Chris Wilson9a1e2582009-09-20 20:16:50 +01002178 continue;
2179 }
Eric Anholt673a3942008-07-30 12:06:12 -07002180 }
2181
Chris Wilson07f73f62009-09-14 16:50:30 +01002182 /* If we didn't do any of the above, there's no single buffer
2183 * large enough to swap out for the new one, so just evict
2184 * everything and start again. (This should be rare.)
Eric Anholt673a3942008-07-30 12:06:12 -07002185 */
Chris Wilson97311292009-09-21 00:22:34 +01002186 if (!list_empty (&dev_priv->mm.inactive_list))
Chris Wilsonab5ee572009-09-20 19:25:47 +01002187 return i915_gem_evict_from_inactive_list(dev);
Chris Wilson97311292009-09-21 00:22:34 +01002188 else
Chris Wilson07f73f62009-09-14 16:50:30 +01002189 return i915_gem_evict_everything(dev);
Eric Anholt673a3942008-07-30 12:06:12 -07002190 }
Keith Packardac94a962008-11-20 23:30:27 -08002191}
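/*
 * Note: the eviction loop above escalates in stages — (1) grab a
 * suitable inactive buffer, (2) wait on the oldest outstanding request,
 * (3) flush a big-enough buffer off the flushing list and retry,
 * (4) fall back to evicting the whole inactive list or, failing that,
 * everything. Each iteration re-runs request retirement, so the loop
 * makes forward progress unless the GPU is wedged.
 */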
2192
Ben Gamari6911a9b2009-04-02 11:24:54 -07002193int
Chris Wilson4bdadb92010-01-27 13:36:32 +00002194i915_gem_object_get_pages(struct drm_gem_object *obj,
2195 gfp_t gfpmask)
Eric Anholt673a3942008-07-30 12:06:12 -07002196{
Daniel Vetter23010e42010-03-08 13:35:02 +01002197 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07002198 int page_count, i;
2199 struct address_space *mapping;
2200 struct inode *inode;
2201 struct page *page;
Eric Anholt673a3942008-07-30 12:06:12 -07002202
Eric Anholt856fa192009-03-19 14:10:50 -07002203 if (obj_priv->pages_refcount++ != 0)
Eric Anholt673a3942008-07-30 12:06:12 -07002204 return 0;
2205
2206 /* Get the list of pages out of our struct file. They'll be pinned
2207 * at this point until we release them.
2208 */
2209 page_count = obj->size / PAGE_SIZE;
Eric Anholt856fa192009-03-19 14:10:50 -07002210 BUG_ON(obj_priv->pages != NULL);
Jesse Barnes8e7d2b22009-05-08 16:13:25 -07002211 obj_priv->pages = drm_calloc_large(page_count, sizeof(struct page *));
Eric Anholt856fa192009-03-19 14:10:50 -07002212 if (obj_priv->pages == NULL) {
Eric Anholt856fa192009-03-19 14:10:50 -07002213 obj_priv->pages_refcount--;
Eric Anholt673a3942008-07-30 12:06:12 -07002214 return -ENOMEM;
2215 }
2216
2217 inode = obj->filp->f_path.dentry->d_inode;
2218 mapping = inode->i_mapping;
2219 for (i = 0; i < page_count; i++) {
Chris Wilson4bdadb92010-01-27 13:36:32 +00002220 page = read_cache_page_gfp(mapping, i,
 2221					   mapping_gfp_mask(mapping) |
2222 __GFP_COLD |
2223 gfpmask);
Chris Wilson1f2b1012010-03-12 19:52:55 +00002224 if (IS_ERR(page))
2225 goto err_pages;
2226
Eric Anholt856fa192009-03-19 14:10:50 -07002227 obj_priv->pages[i] = page;
Eric Anholt673a3942008-07-30 12:06:12 -07002228 }
Eric Anholt280b7132009-03-12 16:56:27 -07002229
2230 if (obj_priv->tiling_mode != I915_TILING_NONE)
2231 i915_gem_object_do_bit_17_swizzle(obj);
2232
Eric Anholt673a3942008-07-30 12:06:12 -07002233 return 0;
Chris Wilson1f2b1012010-03-12 19:52:55 +00002234
2235err_pages:
2236 while (i--)
2237 page_cache_release(obj_priv->pages[i]);
2238
2239 drm_free_large(obj_priv->pages);
2240 obj_priv->pages = NULL;
2241 obj_priv->pages_refcount--;
2242 return PTR_ERR(page);
Eric Anholt673a3942008-07-30 12:06:12 -07002243}
2244
Eric Anholt4e901fd2009-10-26 16:44:17 -07002245static void sandybridge_write_fence_reg(struct drm_i915_fence_reg *reg)
2246{
2247 struct drm_gem_object *obj = reg->obj;
2248 struct drm_device *dev = obj->dev;
2249 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01002250 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholt4e901fd2009-10-26 16:44:17 -07002251 int regnum = obj_priv->fence_reg;
2252 uint64_t val;
2253
2254 val = (uint64_t)((obj_priv->gtt_offset + obj->size - 4096) &
2255 0xfffff000) << 32;
2256 val |= obj_priv->gtt_offset & 0xfffff000;
2257 val |= (uint64_t)((obj_priv->stride / 128) - 1) <<
2258 SANDYBRIDGE_FENCE_PITCH_SHIFT;
2259
2260 if (obj_priv->tiling_mode == I915_TILING_Y)
2261 val |= 1 << I965_FENCE_TILING_Y_SHIFT;
2262 val |= I965_FENCE_REG_VALID;
2263
2264 I915_WRITE64(FENCE_REG_SANDYBRIDGE_0 + (regnum * 8), val);
2265}
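/*
 * Worked example (hypothetical numbers): for a 1MB object at GTT offset
 * 0x01000000 with a 4096-byte stride, the 64-bit fence value above
 * packs as
 *
 *   bits 63:32: (0x01000000 + 0x100000 - 4096) & 0xfffff000 = 0x010ff000
 *   bits 31:0:   0x01000000 & 0xfffff000
 *   pitch field: (4096 / 128) - 1 = 31, shifted by
 *                SANDYBRIDGE_FENCE_PITCH_SHIFT
 *
 * plus the tiling and valid bits.
 */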
2266
Jesse Barnesde151cf2008-11-12 10:03:55 -08002267static void i965_write_fence_reg(struct drm_i915_fence_reg *reg)
2268{
2269 struct drm_gem_object *obj = reg->obj;
2270 struct drm_device *dev = obj->dev;
2271 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01002272 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002273 int regnum = obj_priv->fence_reg;
2274 uint64_t val;
2275
2276 val = (uint64_t)((obj_priv->gtt_offset + obj->size - 4096) &
2277 0xfffff000) << 32;
2278 val |= obj_priv->gtt_offset & 0xfffff000;
2279 val |= ((obj_priv->stride / 128) - 1) << I965_FENCE_PITCH_SHIFT;
2280 if (obj_priv->tiling_mode == I915_TILING_Y)
2281 val |= 1 << I965_FENCE_TILING_Y_SHIFT;
2282 val |= I965_FENCE_REG_VALID;
2283
2284 I915_WRITE64(FENCE_REG_965_0 + (regnum * 8), val);
2285}
2286
2287static void i915_write_fence_reg(struct drm_i915_fence_reg *reg)
2288{
2289 struct drm_gem_object *obj = reg->obj;
2290 struct drm_device *dev = obj->dev;
2291 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01002292 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002293 int regnum = obj_priv->fence_reg;
Jesse Barnes0f973f22009-01-26 17:10:45 -08002294 int tile_width;
Eric Anholtdc529a42009-03-10 22:34:49 -07002295 uint32_t fence_reg, val;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002296 uint32_t pitch_val;
2297
2298 if ((obj_priv->gtt_offset & ~I915_FENCE_START_MASK) ||
2299 (obj_priv->gtt_offset & (obj->size - 1))) {
Linus Torvaldsf06da262009-02-09 08:57:29 -08002300 WARN(1, "%s: object 0x%08x not 1M or size (0x%zx) aligned\n",
Jesse Barnes0f973f22009-01-26 17:10:45 -08002301 __func__, obj_priv->gtt_offset, obj->size);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002302 return;
2303 }
2304
Jesse Barnes0f973f22009-01-26 17:10:45 -08002305 if (obj_priv->tiling_mode == I915_TILING_Y &&
2306 HAS_128_BYTE_Y_TILING(dev))
2307 tile_width = 128;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002308 else
Jesse Barnes0f973f22009-01-26 17:10:45 -08002309 tile_width = 512;
2310
2311 /* Note: pitch better be a power of two tile widths */
2312 pitch_val = obj_priv->stride / tile_width;
2313 pitch_val = ffs(pitch_val) - 1;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002314
Daniel Vetterc36a2a62010-04-17 15:12:03 +02002315 if (obj_priv->tiling_mode == I915_TILING_Y &&
2316 HAS_128_BYTE_Y_TILING(dev))
2317 WARN_ON(pitch_val > I830_FENCE_MAX_PITCH_VAL);
2318 else
2319 WARN_ON(pitch_val > I915_FENCE_MAX_PITCH_VAL);
2320
Jesse Barnesde151cf2008-11-12 10:03:55 -08002321 val = obj_priv->gtt_offset;
2322 if (obj_priv->tiling_mode == I915_TILING_Y)
2323 val |= 1 << I830_FENCE_TILING_Y_SHIFT;
2324 val |= I915_FENCE_SIZE_BITS(obj->size);
2325 val |= pitch_val << I830_FENCE_PITCH_SHIFT;
2326 val |= I830_FENCE_REG_VALID;
2327
Eric Anholtdc529a42009-03-10 22:34:49 -07002328 if (regnum < 8)
2329 fence_reg = FENCE_REG_830_0 + (regnum * 4);
2330 else
2331 fence_reg = FENCE_REG_945_8 + ((regnum - 8) * 4);
2332 I915_WRITE(fence_reg, val);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002333}
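/*
 * Worked example (hypothetical values): pitch_val above is log2 of the
 * stride in tile widths. On a 512-byte-tile chip, a 4096-byte stride is
 * 4096 / 512 = 8 tile widths, and ffs(8) - 1 = 3, so 3 is written to
 * the fence register's pitch field.
 */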
2334
2335static void i830_write_fence_reg(struct drm_i915_fence_reg *reg)
2336{
2337 struct drm_gem_object *obj = reg->obj;
2338 struct drm_device *dev = obj->dev;
2339 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01002340 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002341 int regnum = obj_priv->fence_reg;
2342 uint32_t val;
2343 uint32_t pitch_val;
Daniel Vetter8d7773a2009-03-29 14:09:41 +02002344 uint32_t fence_size_bits;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002345
Daniel Vetter8d7773a2009-03-29 14:09:41 +02002346 if ((obj_priv->gtt_offset & ~I830_FENCE_START_MASK) ||
Jesse Barnesde151cf2008-11-12 10:03:55 -08002347 (obj_priv->gtt_offset & (obj->size - 1))) {
Daniel Vetter8d7773a2009-03-29 14:09:41 +02002348 WARN(1, "%s: object 0x%08x not 512K or size aligned\n",
Jesse Barnes0f973f22009-01-26 17:10:45 -08002349 __func__, obj_priv->gtt_offset);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002350 return;
2351 }
2352
Eric Anholte76a16d2009-05-26 17:44:56 -07002353 pitch_val = obj_priv->stride / 128;
2354 pitch_val = ffs(pitch_val) - 1;
2355 WARN_ON(pitch_val > I830_FENCE_MAX_PITCH_VAL);
2356
Jesse Barnesde151cf2008-11-12 10:03:55 -08002357 val = obj_priv->gtt_offset;
2358 if (obj_priv->tiling_mode == I915_TILING_Y)
2359 val |= 1 << I830_FENCE_TILING_Y_SHIFT;
Daniel Vetter8d7773a2009-03-29 14:09:41 +02002360 fence_size_bits = I830_FENCE_SIZE_BITS(obj->size);
2361 WARN_ON(fence_size_bits & ~0x00000f00);
2362 val |= fence_size_bits;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002363 val |= pitch_val << I830_FENCE_PITCH_SHIFT;
2364 val |= I830_FENCE_REG_VALID;
2365
2366 I915_WRITE(FENCE_REG_830_0 + (regnum * 4), val);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002367}
2368
Daniel Vetterae3db242010-02-19 11:51:58 +01002369static int i915_find_fence_reg(struct drm_device *dev)
2370{
2371 struct drm_i915_fence_reg *reg = NULL;
2372 struct drm_i915_gem_object *obj_priv = NULL;
2373 struct drm_i915_private *dev_priv = dev->dev_private;
2374 struct drm_gem_object *obj = NULL;
2375 int i, avail, ret;
2376
2377 /* First try to find a free reg */
2378 avail = 0;
2379 for (i = dev_priv->fence_reg_start; i < dev_priv->num_fence_regs; i++) {
2380 reg = &dev_priv->fence_regs[i];
2381 if (!reg->obj)
2382 return i;
2383
Daniel Vetter23010e42010-03-08 13:35:02 +01002384 obj_priv = to_intel_bo(reg->obj);
Daniel Vetterae3db242010-02-19 11:51:58 +01002385 if (!obj_priv->pin_count)
2386 avail++;
2387 }
2388
2389 if (avail == 0)
2390 return -ENOSPC;
2391
2392 /* None available, try to steal one or wait for a user to finish */
2393 i = I915_FENCE_REG_NONE;
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002394 list_for_each_entry(reg, &dev_priv->mm.fence_list,
2395 lru_list) {
2396 obj = reg->obj;
2397 obj_priv = to_intel_bo(obj);
Daniel Vetterae3db242010-02-19 11:51:58 +01002398
2399 if (obj_priv->pin_count)
2400 continue;
2401
2402 /* found one! */
2403 i = obj_priv->fence_reg;
2404 break;
2405 }
2406
2407 BUG_ON(i == I915_FENCE_REG_NONE);
2408
2409 /* We only have a reference on obj from the active list. put_fence_reg
 2410	 * might drop that one, causing a use-after-free. So hold a
2411 * private reference to obj like the other callers of put_fence_reg
2412 * (set_tiling ioctl) do. */
2413 drm_gem_object_reference(obj);
2414 ret = i915_gem_object_put_fence_reg(obj);
2415 drm_gem_object_unreference(obj);
2416 if (ret != 0)
2417 return ret;
2418
2419 return i;
2420}
2421
Jesse Barnesde151cf2008-11-12 10:03:55 -08002422/**
2423 * i915_gem_object_get_fence_reg - set up a fence reg for an object
2424 * @obj: object to map through a fence reg
2425 *
2426 * When mapping objects through the GTT, userspace wants to be able to write
2427 * to them without having to worry about swizzling if the object is tiled.
2428 *
2429 * This function walks the fence regs looking for a free one for @obj,
2430 * stealing one if it can't find any.
2431 *
2432 * It then sets up the reg based on the object's properties: address, pitch
2433 * and tiling format.
2434 */
Chris Wilson8c4b8c32009-06-17 22:08:52 +01002435int
2436i915_gem_object_get_fence_reg(struct drm_gem_object *obj)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002437{
2438 struct drm_device *dev = obj->dev;
Jesse Barnes79e53942008-11-07 14:24:08 -08002439 struct drm_i915_private *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01002440 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002441 struct drm_i915_fence_reg *reg = NULL;
Daniel Vetterae3db242010-02-19 11:51:58 +01002442 int ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002443
Eric Anholta09ba7f2009-08-29 12:49:51 -07002444 /* Just update our place in the LRU if our fence is getting used. */
2445 if (obj_priv->fence_reg != I915_FENCE_REG_NONE) {
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002446 reg = &dev_priv->fence_regs[obj_priv->fence_reg];
2447 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
Eric Anholta09ba7f2009-08-29 12:49:51 -07002448 return 0;
2449 }
2450
Jesse Barnesde151cf2008-11-12 10:03:55 -08002451 switch (obj_priv->tiling_mode) {
2452 case I915_TILING_NONE:
2453 WARN(1, "allocating a fence for non-tiled object?\n");
2454 break;
2455 case I915_TILING_X:
Jesse Barnes0f973f22009-01-26 17:10:45 -08002456 if (!obj_priv->stride)
2457 return -EINVAL;
2458 WARN((obj_priv->stride & (512 - 1)),
2459 "object 0x%08x is X tiled but has non-512B pitch\n",
2460 obj_priv->gtt_offset);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002461 break;
2462 case I915_TILING_Y:
Jesse Barnes0f973f22009-01-26 17:10:45 -08002463 if (!obj_priv->stride)
2464 return -EINVAL;
2465 WARN((obj_priv->stride & (128 - 1)),
2466 "object 0x%08x is Y tiled but has non-128B pitch\n",
2467 obj_priv->gtt_offset);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002468 break;
2469 }
2470
Daniel Vetterae3db242010-02-19 11:51:58 +01002471 ret = i915_find_fence_reg(dev);
2472 if (ret < 0)
2473 return ret;
Chris Wilsonfc7170b2009-02-11 14:26:46 +00002474
Daniel Vetterae3db242010-02-19 11:51:58 +01002475 obj_priv->fence_reg = ret;
2476 reg = &dev_priv->fence_regs[obj_priv->fence_reg];
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002477 list_add_tail(&reg->lru_list, &dev_priv->mm.fence_list);
Eric Anholta09ba7f2009-08-29 12:49:51 -07002478
Jesse Barnesde151cf2008-11-12 10:03:55 -08002479 reg->obj = obj;
2480
Eric Anholt4e901fd2009-10-26 16:44:17 -07002481 if (IS_GEN6(dev))
2482 sandybridge_write_fence_reg(reg);
2483 else if (IS_I965G(dev))
Jesse Barnesde151cf2008-11-12 10:03:55 -08002484 i965_write_fence_reg(reg);
2485 else if (IS_I9XX(dev))
2486 i915_write_fence_reg(reg);
2487 else
2488 i830_write_fence_reg(reg);
Eric Anholtd9ddcb92009-01-27 10:33:49 -08002489
Daniel Vetterae3db242010-02-19 11:51:58 +01002490 trace_i915_gem_object_get_fence(obj, obj_priv->fence_reg,
2491 obj_priv->tiling_mode);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002492
Eric Anholtd9ddcb92009-01-27 10:33:49 -08002493 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002494}
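/*
 * Illustrative sketch (simplified caller, error handling elided): a
 * typical caller maps a tiled object through the GTT only after
 * securing a fence, e.g.
 *
 *	if (obj_priv->tiling_mode != I915_TILING_NONE) {
 *		ret = i915_gem_object_get_fence_reg(obj);
 *		if (ret)
 *			return ret;
 *	}
 *
 * so that CPU access through the aperture is detiled correctly.
 */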
2495
2496/**
2497 * i915_gem_clear_fence_reg - clear out fence register info
2498 * @obj: object to clear
2499 *
2500 * Zeroes out the fence register itself and clears out the associated
2501 * data structures in dev_priv and obj_priv.
2502 */
2503static void
2504i915_gem_clear_fence_reg(struct drm_gem_object *obj)
2505{
2506 struct drm_device *dev = obj->dev;
Jesse Barnes79e53942008-11-07 14:24:08 -08002507 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01002508 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002509 struct drm_i915_fence_reg *reg =
2510 &dev_priv->fence_regs[obj_priv->fence_reg];
Jesse Barnesde151cf2008-11-12 10:03:55 -08002511
Eric Anholt4e901fd2009-10-26 16:44:17 -07002512 if (IS_GEN6(dev)) {
2513 I915_WRITE64(FENCE_REG_SANDYBRIDGE_0 +
2514 (obj_priv->fence_reg * 8), 0);
2515 } else if (IS_I965G(dev)) {
Jesse Barnesde151cf2008-11-12 10:03:55 -08002516 I915_WRITE64(FENCE_REG_965_0 + (obj_priv->fence_reg * 8), 0);
Eric Anholt4e901fd2009-10-26 16:44:17 -07002517 } else {
Eric Anholtdc529a42009-03-10 22:34:49 -07002518 uint32_t fence_reg;
2519
2520 if (obj_priv->fence_reg < 8)
2521 fence_reg = FENCE_REG_830_0 + obj_priv->fence_reg * 4;
2522 else
2523 fence_reg = FENCE_REG_945_8 + (obj_priv->fence_reg -
2524 8) * 4;
2525
2526 I915_WRITE(fence_reg, 0);
2527 }
Jesse Barnesde151cf2008-11-12 10:03:55 -08002528
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002529 reg->obj = NULL;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002530 obj_priv->fence_reg = I915_FENCE_REG_NONE;
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002531 list_del_init(&reg->lru_list);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002532}
2533
Eric Anholt673a3942008-07-30 12:06:12 -07002534/**
Chris Wilson52dc7d32009-06-06 09:46:01 +01002535 * i915_gem_object_put_fence_reg - waits on outstanding fenced access
2536 * to the buffer to finish, and then resets the fence register.
2537 * @obj: tiled object holding a fence register.
2538 *
2539 * Zeroes out the fence register itself and clears out the associated
2540 * data structures in dev_priv and obj_priv.
2541 */
2542int
2543i915_gem_object_put_fence_reg(struct drm_gem_object *obj)
2544{
2545 struct drm_device *dev = obj->dev;
Daniel Vetter23010e42010-03-08 13:35:02 +01002546 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Chris Wilson52dc7d32009-06-06 09:46:01 +01002547
2548 if (obj_priv->fence_reg == I915_FENCE_REG_NONE)
2549 return 0;
2550
Daniel Vetter10ae9bd2010-02-01 13:59:17 +01002551 /* If we've changed tiling, GTT-mappings of the object
2552 * need to re-fault to ensure that the correct fence register
2553 * setup is in place.
2554 */
2555 i915_gem_release_mmap(obj);
2556
Chris Wilson52dc7d32009-06-06 09:46:01 +01002557 /* On the i915, GPU access to tiled buffers is via a fence,
2558 * therefore we must wait for any outstanding access to complete
2559 * before clearing the fence.
2560 */
2561 if (!IS_I965G(dev)) {
2562 int ret;
2563
2564 i915_gem_object_flush_gpu_write_domain(obj);
Chris Wilson52dc7d32009-06-06 09:46:01 +01002565 ret = i915_gem_object_wait_rendering(obj);
2566 if (ret != 0)
2567 return ret;
2568 }
2569
Daniel Vetter4a726612010-02-01 13:59:16 +01002570 i915_gem_object_flush_gtt_write_domain(obj);
Chris Wilson52dc7d32009-06-06 09:46:01 +01002571	i915_gem_clear_fence_reg(obj);
2572
2573 return 0;
2574}
2575
2576/**
Eric Anholt673a3942008-07-30 12:06:12 -07002577 * Finds free space in the GTT aperture and binds the object there.
2578 */
2579static int
2580i915_gem_object_bind_to_gtt(struct drm_gem_object *obj, unsigned alignment)
2581{
2582 struct drm_device *dev = obj->dev;
2583 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01002584 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07002585 struct drm_mm_node *free_space;
Chris Wilson4bdadb92010-01-27 13:36:32 +00002586 gfp_t gfpmask = __GFP_NORETRY | __GFP_NOWARN;
Chris Wilson07f73f62009-09-14 16:50:30 +01002587 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07002588
Chris Wilsonbb6baf72009-09-22 14:24:13 +01002589 if (obj_priv->madv != I915_MADV_WILLNEED) {
Chris Wilson3ef94da2009-09-14 16:50:29 +01002590 DRM_ERROR("Attempting to bind a purgeable object\n");
2591 return -EINVAL;
2592 }
2593
Eric Anholt673a3942008-07-30 12:06:12 -07002594 if (alignment == 0)
Jesse Barnes0f973f22009-01-26 17:10:45 -08002595 alignment = i915_gem_get_gtt_alignment(obj);
Daniel Vetter8d7773a2009-03-29 14:09:41 +02002596 if (alignment & (i915_gem_get_gtt_alignment(obj) - 1)) {
Eric Anholt673a3942008-07-30 12:06:12 -07002597 DRM_ERROR("Invalid object alignment requested %u\n", alignment);
2598 return -EINVAL;
2599 }
2600
2601 search_free:
2602 free_space = drm_mm_search_free(&dev_priv->mm.gtt_space,
2603 obj->size, alignment, 0);
2604 if (free_space != NULL) {
2605 obj_priv->gtt_space = drm_mm_get_block(free_space, obj->size,
2606 alignment);
2607 if (obj_priv->gtt_space != NULL) {
2608 obj_priv->gtt_space->private = obj;
2609 obj_priv->gtt_offset = obj_priv->gtt_space->start;
2610 }
2611 }
2612 if (obj_priv->gtt_space == NULL) {
 2613		/* If the GTT is empty and we're still having trouble
2614 * fitting our object in, we're out of memory.
2615 */
2616#if WATCH_LRU
2617 DRM_INFO("%s: GTT full, evicting something\n", __func__);
2618#endif
Chris Wilson07f73f62009-09-14 16:50:30 +01002619 ret = i915_gem_evict_something(dev, obj->size);
Chris Wilson97311292009-09-21 00:22:34 +01002620 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07002621 return ret;
Chris Wilson97311292009-09-21 00:22:34 +01002622
Eric Anholt673a3942008-07-30 12:06:12 -07002623 goto search_free;
2624 }
2625
2626#if WATCH_BUF
Krzysztof Halasacfd43c02009-06-20 00:31:28 +02002627 DRM_INFO("Binding object of size %zd at 0x%08x\n",
Eric Anholt673a3942008-07-30 12:06:12 -07002628 obj->size, obj_priv->gtt_offset);
2629#endif
Chris Wilson4bdadb92010-01-27 13:36:32 +00002630 ret = i915_gem_object_get_pages(obj, gfpmask);
Eric Anholt673a3942008-07-30 12:06:12 -07002631 if (ret) {
2632 drm_mm_put_block(obj_priv->gtt_space);
2633 obj_priv->gtt_space = NULL;
Chris Wilson07f73f62009-09-14 16:50:30 +01002634
2635 if (ret == -ENOMEM) {
2636 /* first try to clear up some space from the GTT */
2637 ret = i915_gem_evict_something(dev, obj->size);
2638 if (ret) {
Chris Wilson07f73f62009-09-14 16:50:30 +01002639 /* now try to shrink everyone else */
Chris Wilson4bdadb92010-01-27 13:36:32 +00002640 if (gfpmask) {
2641 gfpmask = 0;
2642 goto search_free;
Chris Wilson07f73f62009-09-14 16:50:30 +01002643 }
2644
2645 return ret;
2646 }
2647
2648 goto search_free;
2649 }
2650
Eric Anholt673a3942008-07-30 12:06:12 -07002651 return ret;
2652 }
2653
Eric Anholt673a3942008-07-30 12:06:12 -07002654 /* Create an AGP memory structure pointing at our pages, and bind it
2655 * into the GTT.
2656 */
2657 obj_priv->agp_mem = drm_agp_bind_pages(dev,
Eric Anholt856fa192009-03-19 14:10:50 -07002658 obj_priv->pages,
Chris Wilson07f73f62009-09-14 16:50:30 +01002659 obj->size >> PAGE_SHIFT,
Keith Packardba1eb1d2008-10-14 19:55:10 -07002660 obj_priv->gtt_offset,
2661 obj_priv->agp_type);
Eric Anholt673a3942008-07-30 12:06:12 -07002662 if (obj_priv->agp_mem == NULL) {
Eric Anholt856fa192009-03-19 14:10:50 -07002663 i915_gem_object_put_pages(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07002664 drm_mm_put_block(obj_priv->gtt_space);
2665 obj_priv->gtt_space = NULL;
Chris Wilson07f73f62009-09-14 16:50:30 +01002666
2667 ret = i915_gem_evict_something(dev, obj->size);
Chris Wilson97311292009-09-21 00:22:34 +01002668 if (ret)
Chris Wilson07f73f62009-09-14 16:50:30 +01002669 return ret;
Chris Wilson07f73f62009-09-14 16:50:30 +01002670
2671 goto search_free;
Eric Anholt673a3942008-07-30 12:06:12 -07002672 }
2673 atomic_inc(&dev->gtt_count);
2674 atomic_add(obj->size, &dev->gtt_memory);
2675
2676 /* Assert that the object is not currently in any GPU domain. As it
2677 * wasn't in the GTT, there shouldn't be any way it could have been in
2678 * a GPU cache
2679 */
Chris Wilson21d509e2009-06-06 09:46:02 +01002680 BUG_ON(obj->read_domains & I915_GEM_GPU_DOMAINS);
2681 BUG_ON(obj->write_domain & I915_GEM_GPU_DOMAINS);
Eric Anholt673a3942008-07-30 12:06:12 -07002682
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002683 trace_i915_gem_object_bind(obj, obj_priv->gtt_offset);
2684
Eric Anholt673a3942008-07-30 12:06:12 -07002685 return 0;
2686}
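/*
 * Note: binding retries in stages. If the GTT has no suitable hole,
 * evict and retry the search; if page allocation then fails with
 * -ENOMEM, try to evict again, and when even that fails drop the
 * __GFP_NORETRY | __GFP_NOWARN mask (gfpmask = 0) so the allocator may
 * block and reclaim, trading latency for reliability.
 */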
2687
2688void
2689i915_gem_clflush_object(struct drm_gem_object *obj)
2690{
Daniel Vetter23010e42010-03-08 13:35:02 +01002691 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07002692
2693 /* If we don't have a page list set up, then we're not pinned
2694 * to GPU, and we can ignore the cache flush because it'll happen
2695 * again at bind time.
2696 */
Eric Anholt856fa192009-03-19 14:10:50 -07002697 if (obj_priv->pages == NULL)
Eric Anholt673a3942008-07-30 12:06:12 -07002698 return;
2699
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002700 trace_i915_gem_object_clflush(obj);
Eric Anholtcfa16a02009-05-26 18:46:16 -07002701
Eric Anholt856fa192009-03-19 14:10:50 -07002702 drm_clflush_pages(obj_priv->pages, obj->size / PAGE_SIZE);
Eric Anholt673a3942008-07-30 12:06:12 -07002703}
2704
Eric Anholte47c68e2008-11-14 13:35:19 -08002705/** Flushes any GPU write domain for the object if it's dirty. */
2706static void
2707i915_gem_object_flush_gpu_write_domain(struct drm_gem_object *obj)
2708{
2709 struct drm_device *dev = obj->dev;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002710 uint32_t old_write_domain;
Zou Nan hai852835f2010-05-21 09:08:56 +08002711 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholte47c68e2008-11-14 13:35:19 -08002712
2713 if ((obj->write_domain & I915_GEM_GPU_DOMAINS) == 0)
2714 return;
2715
2716 /* Queue the GPU write cache flushing we need. */
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002717 old_write_domain = obj->write_domain;
Eric Anholte47c68e2008-11-14 13:35:19 -08002718 i915_gem_flush(dev, 0, obj->write_domain);
Zou Nan hai852835f2010-05-21 09:08:56 +08002719 (void) i915_add_request(dev, NULL, obj->write_domain, obj_priv->ring);
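	/* i915_add_request() processes the gpu_write_list for the flushed
	 * domains, which should clear this object's write domain; the
	 * BUG_ON below asserts that actually happened.
	 */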
Daniel Vetter99fcb762010-02-07 16:20:18 +01002720 BUG_ON(obj->write_domain);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002721
2722 trace_i915_gem_object_change_domain(obj,
2723 obj->read_domains,
2724 old_write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002725}
2726
2727/** Flushes the GTT write domain for the object if it's dirty. */
2728static void
2729i915_gem_object_flush_gtt_write_domain(struct drm_gem_object *obj)
2730{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002731 uint32_t old_write_domain;
2732
Eric Anholte47c68e2008-11-14 13:35:19 -08002733 if (obj->write_domain != I915_GEM_DOMAIN_GTT)
2734 return;
2735
2736 /* No actual flushing is required for the GTT write domain. Writes
2737 * to it immediately go to main memory as far as we know, so there's
2738 * no chipset flush. It also doesn't land in render cache.
2739 */
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002740 old_write_domain = obj->write_domain;
Eric Anholte47c68e2008-11-14 13:35:19 -08002741 obj->write_domain = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002742
2743 trace_i915_gem_object_change_domain(obj,
2744 obj->read_domains,
2745 old_write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002746}
2747
2748/** Flushes the CPU write domain for the object if it's dirty. */
2749static void
2750i915_gem_object_flush_cpu_write_domain(struct drm_gem_object *obj)
2751{
2752 struct drm_device *dev = obj->dev;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002753 uint32_t old_write_domain;
Eric Anholte47c68e2008-11-14 13:35:19 -08002754
2755 if (obj->write_domain != I915_GEM_DOMAIN_CPU)
2756 return;
2757
2758 i915_gem_clflush_object(obj);
2759 drm_agp_chipset_flush(dev);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002760 old_write_domain = obj->write_domain;
Eric Anholte47c68e2008-11-14 13:35:19 -08002761 obj->write_domain = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002762
2763 trace_i915_gem_object_change_domain(obj,
2764 obj->read_domains,
2765 old_write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002766}
2767
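/** Flushes whatever write domain the object currently has dirty,
 * dispatching to the GTT, CPU or GPU flush path as appropriate.
 */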
Kristian Høgsberg6b95a202009-11-18 11:25:18 -05002768void
2769i915_gem_object_flush_write_domain(struct drm_gem_object *obj)
2770{
2771 switch (obj->write_domain) {
2772 case I915_GEM_DOMAIN_GTT:
2773 i915_gem_object_flush_gtt_write_domain(obj);
2774 break;
2775 case I915_GEM_DOMAIN_CPU:
2776 i915_gem_object_flush_cpu_write_domain(obj);
2777 break;
2778 default:
2779 i915_gem_object_flush_gpu_write_domain(obj);
2780 break;
2781 }
2782}
2783
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002784/**
2785 * Moves a single object to the GTT read, and possibly write domain.
2786 *
2787 * This function returns when the move is complete, including waiting on
2788 * flushes to occur.
2789 */
Jesse Barnes79e53942008-11-07 14:24:08 -08002790int
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002791i915_gem_object_set_to_gtt_domain(struct drm_gem_object *obj, int write)
2792{
Daniel Vetter23010e42010-03-08 13:35:02 +01002793 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002794 uint32_t old_write_domain, old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08002795 int ret;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002796
Eric Anholt02354392008-11-26 13:58:13 -08002797 /* Not valid to be called on unbound objects. */
2798 if (obj_priv->gtt_space == NULL)
2799 return -EINVAL;
2800
Eric Anholte47c68e2008-11-14 13:35:19 -08002801 i915_gem_object_flush_gpu_write_domain(obj);
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002802 /* Wait on any GPU rendering and flushing to occur. */
Eric Anholte47c68e2008-11-14 13:35:19 -08002803 ret = i915_gem_object_wait_rendering(obj);
2804 if (ret != 0)
2805 return ret;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002806
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002807 old_write_domain = obj->write_domain;
2808 old_read_domains = obj->read_domains;
2809
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002810 /* If we're writing through the GTT domain, then CPU and GPU caches
2811 * will need to be invalidated at next use.
2812 */
2813 if (write)
Eric Anholte47c68e2008-11-14 13:35:19 -08002814 obj->read_domains &= I915_GEM_DOMAIN_GTT;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002815
Eric Anholte47c68e2008-11-14 13:35:19 -08002816 i915_gem_object_flush_cpu_write_domain(obj);
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002817
2818 /* It should now be out of any other write domains, and we can update
2819 * the domain values for our changes.
2820 */
2821 BUG_ON((obj->write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
2822 obj->read_domains |= I915_GEM_DOMAIN_GTT;
Eric Anholte47c68e2008-11-14 13:35:19 -08002823 if (write) {
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002824 obj->write_domain = I915_GEM_DOMAIN_GTT;
Eric Anholte47c68e2008-11-14 13:35:19 -08002825 obj_priv->dirty = 1;
2826 }
2827
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002828 trace_i915_gem_object_change_domain(obj,
2829 old_read_domains,
2830 old_write_domain);
2831
Eric Anholte47c68e2008-11-14 13:35:19 -08002832 return 0;
2833}
2834
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002835/*
 2836 * Prepare the buffer for use as a display plane. Use an uninterruptible
 2837 * wait for any required flush, since during modesetting we're not
 * supposed to be interrupted.
2838 */
2839int
2840i915_gem_object_set_to_display_plane(struct drm_gem_object *obj)
2841{
2842 struct drm_device *dev = obj->dev;
Daniel Vetter23010e42010-03-08 13:35:02 +01002843 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002844 uint32_t old_write_domain, old_read_domains;
2845 int ret;
2846
2847 /* Not valid to be called on unbound objects. */
2848 if (obj_priv->gtt_space == NULL)
2849 return -EINVAL;
2850
2851 i915_gem_object_flush_gpu_write_domain(obj);
2852
2853 /* Wait on any GPU rendering and flushing to occur. */
2854 if (obj_priv->active) {
2855#if WATCH_BUF
2856 DRM_INFO("%s: object %p wait for seqno %08x\n",
2857 __func__, obj, obj_priv->last_rendering_seqno);
2858#endif
Zou Nan hai852835f2010-05-21 09:08:56 +08002859 ret = i915_do_wait_request(dev,
2860 obj_priv->last_rendering_seqno,
2861 0,
2862 obj_priv->ring);
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002863 if (ret != 0)
2864 return ret;
2865 }
2866
2867 old_write_domain = obj->write_domain;
2868 old_read_domains = obj->read_domains;
2869
2870 obj->read_domains &= I915_GEM_DOMAIN_GTT;
2871
2872 i915_gem_object_flush_cpu_write_domain(obj);
2873
2874 /* It should now be out of any other write domains, and we can update
2875 * the domain values for our changes.
2876 */
2877 BUG_ON((obj->write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
2878 obj->read_domains |= I915_GEM_DOMAIN_GTT;
2879 obj->write_domain = I915_GEM_DOMAIN_GTT;
2880 obj_priv->dirty = 1;
2881
2882 trace_i915_gem_object_change_domain(obj,
2883 old_read_domains,
2884 old_write_domain);
2885
2886 return 0;
2887}
2888
Eric Anholte47c68e2008-11-14 13:35:19 -08002889/**
2890 * Moves a single object to the CPU read, and possibly write domain.
2891 *
2892 * This function returns when the move is complete, including waiting on
2893 * flushes to occur.
2894 */
2895static int
2896i915_gem_object_set_to_cpu_domain(struct drm_gem_object *obj, int write)
2897{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002898 uint32_t old_write_domain, old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08002899 int ret;
2900
2901 i915_gem_object_flush_gpu_write_domain(obj);
2902 /* Wait on any GPU rendering and flushing to occur. */
2903 ret = i915_gem_object_wait_rendering(obj);
2904 if (ret != 0)
2905 return ret;
2906
2907 i915_gem_object_flush_gtt_write_domain(obj);
2908
2909 /* If we have a partially-valid cache of the object in the CPU,
2910 * finish invalidating it and free the per-page flags.
2911 */
2912 i915_gem_object_set_to_full_cpu_read_domain(obj);
2913
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002914 old_write_domain = obj->write_domain;
2915 old_read_domains = obj->read_domains;
2916
Eric Anholte47c68e2008-11-14 13:35:19 -08002917 /* Flush the CPU cache if it's still invalid. */
2918 if ((obj->read_domains & I915_GEM_DOMAIN_CPU) == 0) {
2919 i915_gem_clflush_object(obj);
Eric Anholte47c68e2008-11-14 13:35:19 -08002920
2921 obj->read_domains |= I915_GEM_DOMAIN_CPU;
2922 }
2923
2924 /* It should now be out of any other write domains, and we can update
2925 * the domain values for our changes.
2926 */
2927 BUG_ON((obj->write_domain & ~I915_GEM_DOMAIN_CPU) != 0);
2928
2929 /* If we're writing through the CPU, then the GPU read domains will
2930 * need to be invalidated at next use.
2931 */
2932 if (write) {
2933 obj->read_domains &= I915_GEM_DOMAIN_CPU;
2934 obj->write_domain = I915_GEM_DOMAIN_CPU;
2935 }
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002936
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002937 trace_i915_gem_object_change_domain(obj,
2938 old_read_domains,
2939 old_write_domain);
2940
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002941 return 0;
2942}
2943
Eric Anholt673a3942008-07-30 12:06:12 -07002944/*
2945 * Set the next domain for the specified object. This
 2946 * may not actually perform the necessary flushing/invalidating though,
2947 * as that may want to be batched with other set_domain operations
2948 *
2949 * This is (we hope) the only really tricky part of gem. The goal
2950 * is fairly simple -- track which caches hold bits of the object
2951 * and make sure they remain coherent. A few concrete examples may
2952 * help to explain how it works. For shorthand, we use the notation
2953 * (read_domains, write_domain), e.g. (CPU, CPU) to indicate the
2954 * a pair of read and write domain masks.
2955 *
2956 * Case 1: the batch buffer
2957 *
2958 * 1. Allocated
2959 * 2. Written by CPU
2960 * 3. Mapped to GTT
2961 * 4. Read by GPU
2962 * 5. Unmapped from GTT
2963 * 6. Freed
2964 *
2965 * Let's take these a step at a time
2966 *
2967 * 1. Allocated
2968 * Pages allocated from the kernel may still have
2969 * cache contents, so we set them to (CPU, CPU) always.
2970 * 2. Written by CPU (using pwrite)
2971 * The pwrite function calls set_domain (CPU, CPU) and
2972 * this function does nothing (as nothing changes)
 2973 * 3. Mapped to GTT
2974 * This function asserts that the object is not
2975 * currently in any GPU-based read or write domains
2976 * 4. Read by GPU
2977 * i915_gem_execbuffer calls set_domain (COMMAND, 0).
2978 * As write_domain is zero, this function adds in the
2979 * current read domains (CPU+COMMAND, 0).
2980 * flush_domains is set to CPU.
2981 * invalidate_domains is set to COMMAND
2982 * clflush is run to get data out of the CPU caches
2983 * then i915_dev_set_domain calls i915_gem_flush to
2984 * emit an MI_FLUSH and drm_agp_chipset_flush
2985 * 5. Unmapped from GTT
2986 * i915_gem_object_unbind calls set_domain (CPU, CPU)
2987 * flush_domains and invalidate_domains end up both zero
2988 * so no flushing/invalidating happens
2989 * 6. Freed
2990 * yay, done
2991 *
2992 * Case 2: The shared render buffer
2993 *
2994 * 1. Allocated
2995 * 2. Mapped to GTT
2996 * 3. Read/written by GPU
2997 * 4. set_domain to (CPU,CPU)
2998 * 5. Read/written by CPU
2999 * 6. Read/written by GPU
3000 *
3001 * 1. Allocated
3002 * Same as last example, (CPU, CPU)
3003 * 2. Mapped to GTT
3004 * Nothing changes (assertions find that it is not in the GPU)
3005 * 3. Read/written by GPU
3006 * execbuffer calls set_domain (RENDER, RENDER)
3007 * flush_domains gets CPU
3008 * invalidate_domains gets GPU
3009 * clflush (obj)
3010 * MI_FLUSH and drm_agp_chipset_flush
3011 * 4. set_domain (CPU, CPU)
3012 * flush_domains gets GPU
3013 * invalidate_domains gets CPU
3014 * wait_rendering (obj) to make sure all drawing is complete.
3015 * This will include an MI_FLUSH to get the data from GPU
3016 * to memory
3017 * clflush (obj) to invalidate the CPU cache
3018 * Another MI_FLUSH in i915_gem_flush (eliminate this somehow?)
3019 * 5. Read/written by CPU
3020 * cache lines are loaded and dirtied
 3021 * 6. Read/written by GPU
3022 * Same as last GPU access
3023 *
3024 * Case 3: The constant buffer
3025 *
3026 * 1. Allocated
3027 * 2. Written by CPU
3028 * 3. Read by GPU
3029 * 4. Updated (written) by CPU again
3030 * 5. Read by GPU
3031 *
3032 * 1. Allocated
3033 * (CPU, CPU)
3034 * 2. Written by CPU
3035 * (CPU, CPU)
3036 * 3. Read by GPU
3037 * (CPU+RENDER, 0)
3038 * flush_domains = CPU
3039 * invalidate_domains = RENDER
3040 * clflush (obj)
3041 * MI_FLUSH
3042 * drm_agp_chipset_flush
3043 * 4. Updated (written) by CPU again
3044 * (CPU, CPU)
3045 * flush_domains = 0 (no previous write domain)
3046 * invalidate_domains = 0 (no new read domains)
3047 * 5. Read by GPU
3048 * (CPU+RENDER, 0)
3049 * flush_domains = CPU
3050 * invalidate_domains = RENDER
3051 * clflush (obj)
3052 * MI_FLUSH
3053 * drm_agp_chipset_flush
3054 */
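/*
 * A concrete instance of the bookkeeping below: in Case 1 step 4 the
 * object sits in (CPU, CPU) and enters the batch as (COMMAND, 0), so
 * flush_domains collects the old CPU write domain while
 * invalidate_domains collects the new COMMAND read domain, matching the
 * clflush + MI_FLUSH sequence described above.
 */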
Keith Packardc0d90822008-11-20 23:11:08 -08003055static void
Eric Anholt8b0e3782009-02-19 14:40:50 -08003056i915_gem_object_set_to_gpu_domain(struct drm_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07003057{
3058 struct drm_device *dev = obj->dev;
Daniel Vetter23010e42010-03-08 13:35:02 +01003059 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07003060 uint32_t invalidate_domains = 0;
3061 uint32_t flush_domains = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003062 uint32_t old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08003063
Eric Anholt8b0e3782009-02-19 14:40:50 -08003064 BUG_ON(obj->pending_read_domains & I915_GEM_DOMAIN_CPU);
3065 BUG_ON(obj->pending_write_domain == I915_GEM_DOMAIN_CPU);
Eric Anholt673a3942008-07-30 12:06:12 -07003066
Jesse Barnes652c3932009-08-17 13:31:43 -07003067 intel_mark_busy(dev, obj);
3068
Eric Anholt673a3942008-07-30 12:06:12 -07003069#if WATCH_BUF
3070 DRM_INFO("%s: object %p read %08x -> %08x write %08x -> %08x\n",
3071 __func__, obj,
Eric Anholt8b0e3782009-02-19 14:40:50 -08003072 obj->read_domains, obj->pending_read_domains,
3073 obj->write_domain, obj->pending_write_domain);
Eric Anholt673a3942008-07-30 12:06:12 -07003074#endif
3075 /*
3076 * If the object isn't moving to a new write domain,
3077 * let the object stay in multiple read domains
3078 */
Eric Anholt8b0e3782009-02-19 14:40:50 -08003079 if (obj->pending_write_domain == 0)
3080 obj->pending_read_domains |= obj->read_domains;
Eric Anholt673a3942008-07-30 12:06:12 -07003081 else
3082 obj_priv->dirty = 1;
3083
3084 /*
3085 * Flush the current write domain if
3086 * the new read domains don't match. Invalidate
3087 * any read domains which differ from the old
3088 * write domain
3089 */
Eric Anholt8b0e3782009-02-19 14:40:50 -08003090 if (obj->write_domain &&
3091 obj->write_domain != obj->pending_read_domains) {
Eric Anholt673a3942008-07-30 12:06:12 -07003092 flush_domains |= obj->write_domain;
Eric Anholt8b0e3782009-02-19 14:40:50 -08003093 invalidate_domains |=
3094 obj->pending_read_domains & ~obj->write_domain;
Eric Anholt673a3942008-07-30 12:06:12 -07003095 }
3096 /*
3097 * Invalidate any read caches which may have
3098 * stale data. That is, any new read domains.
3099 */
Eric Anholt8b0e3782009-02-19 14:40:50 -08003100 invalidate_domains |= obj->pending_read_domains & ~obj->read_domains;
Eric Anholt673a3942008-07-30 12:06:12 -07003101 if ((flush_domains | invalidate_domains) & I915_GEM_DOMAIN_CPU) {
3102#if WATCH_BUF
3103 DRM_INFO("%s: CPU domain flush %08x invalidate %08x\n",
3104 __func__, flush_domains, invalidate_domains);
3105#endif
Eric Anholt673a3942008-07-30 12:06:12 -07003106 i915_gem_clflush_object(obj);
3107 }
3108
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003109 old_read_domains = obj->read_domains;
3110
Eric Anholtefbeed92009-02-19 14:54:51 -08003111 /* The actual obj->write_domain will be updated with
3112 * pending_write_domain after we emit the accumulated flush for all
3113 * of our domain changes in execbuffers (which clears objects'
3114 * write_domains). So if we have a current write domain that we
3115 * aren't changing, set pending_write_domain to that.
3116 */
3117 if (flush_domains == 0 && obj->pending_write_domain == 0)
3118 obj->pending_write_domain = obj->write_domain;
Eric Anholt8b0e3782009-02-19 14:40:50 -08003119 obj->read_domains = obj->pending_read_domains;
Eric Anholt673a3942008-07-30 12:06:12 -07003120
3121 dev->invalidate_domains |= invalidate_domains;
3122 dev->flush_domains |= flush_domains;
3123#if WATCH_BUF
3124 DRM_INFO("%s: read %08x write %08x invalidate %08x flush %08x\n",
3125 __func__,
3126 obj->read_domains, obj->write_domain,
3127 dev->invalidate_domains, dev->flush_domains);
3128#endif
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003129
3130 trace_i915_gem_object_change_domain(obj,
3131 old_read_domains,
3132 obj->write_domain);
Eric Anholt673a3942008-07-30 12:06:12 -07003133}
3134
3135/**
Eric Anholte47c68e2008-11-14 13:35:19 -08003136 * Moves the object from a partially valid CPU read domain to a fully valid one.
Eric Anholt673a3942008-07-30 12:06:12 -07003137 *
Eric Anholte47c68e2008-11-14 13:35:19 -08003138 * Note that this only resolves i915_gem_object_set_cpu_read_domain_range(),
3139 * and doesn't handle transitioning from !(read_domains & I915_GEM_DOMAIN_CPU).
3140 */
3141static void
3142i915_gem_object_set_to_full_cpu_read_domain(struct drm_gem_object *obj)
3143{
Daniel Vetter23010e42010-03-08 13:35:02 +01003144 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholte47c68e2008-11-14 13:35:19 -08003145
3146 if (!obj_priv->page_cpu_valid)
3147 return;
3148
3149 /* If we're partially in the CPU read domain, finish moving it in.
3150 */
3151 if (obj->read_domains & I915_GEM_DOMAIN_CPU) {
3152 int i;
3153
3154 for (i = 0; i <= (obj->size - 1) / PAGE_SIZE; i++) {
3155 if (obj_priv->page_cpu_valid[i])
3156 continue;
Eric Anholt856fa192009-03-19 14:10:50 -07003157 drm_clflush_pages(obj_priv->pages + i, 1);
Eric Anholte47c68e2008-11-14 13:35:19 -08003158 }
Eric Anholte47c68e2008-11-14 13:35:19 -08003159 }
3160
3161 /* Free the page_cpu_valid mappings which are now stale, whether
3162 * or not we've got I915_GEM_DOMAIN_CPU.
3163 */
Eric Anholt9a298b22009-03-24 12:23:04 -07003164 kfree(obj_priv->page_cpu_valid);
Eric Anholte47c68e2008-11-14 13:35:19 -08003165 obj_priv->page_cpu_valid = NULL;
3166}
3167
3168/**
3169 * Set the CPU read domain on a range of the object.
3170 *
3171 * The object ends up with I915_GEM_DOMAIN_CPU in its read flags although it's
3172 * not entirely valid. The page_cpu_valid member of the object flags which
3173 * pages have been flushed, and will be respected by
3174 * i915_gem_object_set_to_cpu_domain() if it's called on to get a valid mapping
3175 * of the whole object.
3176 *
3177 * This function returns when the move is complete, including waiting on
3178 * flushes to occur.
Eric Anholt673a3942008-07-30 12:06:12 -07003179 */
3180static int
Eric Anholte47c68e2008-11-14 13:35:19 -08003181i915_gem_object_set_cpu_read_domain_range(struct drm_gem_object *obj,
3182 uint64_t offset, uint64_t size)
Eric Anholt673a3942008-07-30 12:06:12 -07003183{
Daniel Vetter23010e42010-03-08 13:35:02 +01003184 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003185 uint32_t old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08003186 int i, ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003187
Eric Anholte47c68e2008-11-14 13:35:19 -08003188 if (offset == 0 && size == obj->size)
3189 return i915_gem_object_set_to_cpu_domain(obj, 0);
3190
3191 i915_gem_object_flush_gpu_write_domain(obj);
3192 /* Wait on any GPU rendering and flushing to occur. */
3193 ret = i915_gem_object_wait_rendering(obj);
3194 if (ret != 0)
3195 return ret;
3196 i915_gem_object_flush_gtt_write_domain(obj);
3197
3198 /* If we're already fully in the CPU read domain, we're done. */
3199 if (obj_priv->page_cpu_valid == NULL &&
3200 (obj->read_domains & I915_GEM_DOMAIN_CPU) != 0)
Eric Anholt673a3942008-07-30 12:06:12 -07003201 return 0;
3202
Eric Anholte47c68e2008-11-14 13:35:19 -08003203 /* Otherwise, create/clear the per-page CPU read domain flag if we're
3204 * newly adding I915_GEM_DOMAIN_CPU
3205 */
Eric Anholt673a3942008-07-30 12:06:12 -07003206 if (obj_priv->page_cpu_valid == NULL) {
Eric Anholt9a298b22009-03-24 12:23:04 -07003207 obj_priv->page_cpu_valid = kzalloc(obj->size / PAGE_SIZE,
3208 GFP_KERNEL);
Eric Anholte47c68e2008-11-14 13:35:19 -08003209 if (obj_priv->page_cpu_valid == NULL)
3210 return -ENOMEM;
3211 } else if ((obj->read_domains & I915_GEM_DOMAIN_CPU) == 0)
3212 memset(obj_priv->page_cpu_valid, 0, obj->size / PAGE_SIZE);
Eric Anholt673a3942008-07-30 12:06:12 -07003213
3214 /* Flush the cache on any pages that are still invalid from the CPU's
3215 * perspective.
3216 */
Eric Anholte47c68e2008-11-14 13:35:19 -08003217 for (i = offset / PAGE_SIZE; i <= (offset + size - 1) / PAGE_SIZE;
3218 i++) {
Eric Anholt673a3942008-07-30 12:06:12 -07003219 if (obj_priv->page_cpu_valid[i])
3220 continue;
3221
Eric Anholt856fa192009-03-19 14:10:50 -07003222 drm_clflush_pages(obj_priv->pages + i, 1);
Eric Anholt673a3942008-07-30 12:06:12 -07003223
3224 obj_priv->page_cpu_valid[i] = 1;
3225 }
3226
Eric Anholte47c68e2008-11-14 13:35:19 -08003227 /* It should now be out of any other write domains, and we can update
3228 * the domain values for our changes.
3229 */
3230 BUG_ON((obj->write_domain & ~I915_GEM_DOMAIN_CPU) != 0);
3231
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003232 old_read_domains = obj->read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08003233 obj->read_domains |= I915_GEM_DOMAIN_CPU;
3234
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003235 trace_i915_gem_object_change_domain(obj,
3236 old_read_domains,
3237 obj->write_domain);
3238
Eric Anholt673a3942008-07-30 12:06:12 -07003239 return 0;
3240}
3241
3242/**
Eric Anholt673a3942008-07-30 12:06:12 -07003243 * Pin an object to the GTT and evaluate the relocations landing in it.
3244 */
3245static int
3246i915_gem_object_pin_and_relocate(struct drm_gem_object *obj,
3247 struct drm_file *file_priv,
Jesse Barnes76446ca2009-12-17 22:05:42 -05003248 struct drm_i915_gem_exec_object2 *entry,
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003249 struct drm_i915_gem_relocation_entry *relocs)
Eric Anholt673a3942008-07-30 12:06:12 -07003250{
3251 struct drm_device *dev = obj->dev;
Keith Packard0839ccb2008-10-30 19:38:48 -07003252 drm_i915_private_t *dev_priv = dev->dev_private;
Daniel Vetter23010e42010-03-08 13:35:02 +01003253 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07003254 int i, ret;
Keith Packard0839ccb2008-10-30 19:38:48 -07003255 void __iomem *reloc_page;
Jesse Barnes76446ca2009-12-17 22:05:42 -05003256 bool need_fence;
3257
3258 need_fence = entry->flags & EXEC_OBJECT_NEEDS_FENCE &&
3259 obj_priv->tiling_mode != I915_TILING_NONE;
3260
3261 /* Check fence reg constraints and rebind if necessary */
Owain Ainsworthf590d272010-02-18 15:33:00 +00003262 if (need_fence && !i915_gem_object_fence_offset_ok(obj,
3263 obj_priv->tiling_mode))
Jesse Barnes76446ca2009-12-17 22:05:42 -05003264 i915_gem_object_unbind(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07003265
3266 /* Choose the GTT offset for our buffer and put it there. */
3267 ret = i915_gem_object_pin(obj, (uint32_t) entry->alignment);
3268 if (ret)
3269 return ret;
3270
Jesse Barnes76446ca2009-12-17 22:05:42 -05003271 /*
3272 * Pre-965 chips need a fence register set up in order to
3273 * properly handle blits to/from tiled surfaces.
3274 */
3275 if (need_fence) {
3276 ret = i915_gem_object_get_fence_reg(obj);
3277 if (ret != 0) {
3278 if (ret != -EBUSY && ret != -ERESTARTSYS)
3279 DRM_ERROR("Failure to install fence: %d\n",
3280 ret);
3281 i915_gem_object_unpin(obj);
3282 return ret;
3283 }
3284 }
3285
Eric Anholt673a3942008-07-30 12:06:12 -07003286 entry->offset = obj_priv->gtt_offset;
3287
Eric Anholt673a3942008-07-30 12:06:12 -07003288 /* Apply the relocations, using the GTT aperture to avoid cache
3289 * flushing requirements.
3290 */
3291 for (i = 0; i < entry->relocation_count; i++) {
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003292		struct drm_i915_gem_relocation_entry *reloc = &relocs[i];
Eric Anholt673a3942008-07-30 12:06:12 -07003293 struct drm_gem_object *target_obj;
3294 struct drm_i915_gem_object *target_obj_priv;
Eric Anholt3043c602008-10-02 12:24:47 -07003295 uint32_t reloc_val, reloc_offset;
3296 uint32_t __iomem *reloc_entry;
Eric Anholt673a3942008-07-30 12:06:12 -07003297
Eric Anholt673a3942008-07-30 12:06:12 -07003298 target_obj = drm_gem_object_lookup(obj->dev, file_priv,
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003299 reloc->target_handle);
Eric Anholt673a3942008-07-30 12:06:12 -07003300 if (target_obj == NULL) {
3301 i915_gem_object_unpin(obj);
3302 return -EBADF;
3303 }
Daniel Vetter23010e42010-03-08 13:35:02 +01003304 target_obj_priv = to_intel_bo(target_obj);
Eric Anholt673a3942008-07-30 12:06:12 -07003305
Chris Wilson8542a0b2009-09-09 21:15:15 +01003306#if WATCH_RELOC
3307 DRM_INFO("%s: obj %p offset %08x target %d "
3308 "read %08x write %08x gtt %08x "
3309 "presumed %08x delta %08x\n",
3310 __func__,
3311 obj,
3312 (int) reloc->offset,
3313 (int) reloc->target_handle,
3314 (int) reloc->read_domains,
3315 (int) reloc->write_domain,
3316 (int) target_obj_priv->gtt_offset,
3317 (int) reloc->presumed_offset,
3318 reloc->delta);
3319#endif
3320
Eric Anholt673a3942008-07-30 12:06:12 -07003321 /* The target buffer should have appeared before us in the
3322 * exec_object list, so it should have a GTT space bound by now.
3323 */
3324 if (target_obj_priv->gtt_space == NULL) {
3325 DRM_ERROR("No GTT space found for object %d\n",
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003326 reloc->target_handle);
Eric Anholt673a3942008-07-30 12:06:12 -07003327 drm_gem_object_unreference(target_obj);
3328 i915_gem_object_unpin(obj);
3329 return -EINVAL;
3330 }
3331
Chris Wilson8542a0b2009-09-09 21:15:15 +01003332 /* Validate that the target is in a valid r/w GPU domain */
Daniel Vetter16edd552010-02-19 11:52:02 +01003333 if (reloc->write_domain & (reloc->write_domain - 1)) {
3334 DRM_ERROR("reloc with multiple write domains: "
3335 "obj %p target %d offset %d "
3336 "read %08x write %08x",
3337 obj, reloc->target_handle,
3338 (int) reloc->offset,
3339 reloc->read_domains,
3340 reloc->write_domain);
			drm_gem_object_unreference(target_obj);
			i915_gem_object_unpin(obj);
 3341			return -EINVAL;
3342 }
Chris Wilson8542a0b2009-09-09 21:15:15 +01003343 if (reloc->write_domain & I915_GEM_DOMAIN_CPU ||
3344 reloc->read_domains & I915_GEM_DOMAIN_CPU) {
3345 DRM_ERROR("reloc with read/write CPU domains: "
3346 "obj %p target %d offset %d "
3347 "read %08x write %08x",
3348 obj, reloc->target_handle,
3349 (int) reloc->offset,
3350 reloc->read_domains,
3351 reloc->write_domain);
3352 drm_gem_object_unreference(target_obj);
3353 i915_gem_object_unpin(obj);
3354 return -EINVAL;
3355 }
3356 if (reloc->write_domain && target_obj->pending_write_domain &&
3357 reloc->write_domain != target_obj->pending_write_domain) {
3358 DRM_ERROR("Write domain conflict: "
3359 "obj %p target %d offset %d "
3360 "new %08x old %08x\n",
3361 obj, reloc->target_handle,
3362 (int) reloc->offset,
3363 reloc->write_domain,
3364 target_obj->pending_write_domain);
3365 drm_gem_object_unreference(target_obj);
3366 i915_gem_object_unpin(obj);
3367 return -EINVAL;
3368 }
3369
3370 target_obj->pending_read_domains |= reloc->read_domains;
3371 target_obj->pending_write_domain |= reloc->write_domain;
3372
3373 /* If the relocation already has the right value in it, no
3374 * more work needs to be done.
3375 */
3376 if (target_obj_priv->gtt_offset == reloc->presumed_offset) {
3377 drm_gem_object_unreference(target_obj);
3378 continue;
3379 }
3380
3381 /* Check that the relocation address is valid... */
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003382 if (reloc->offset > obj->size - 4) {
Eric Anholt673a3942008-07-30 12:06:12 -07003383 DRM_ERROR("Relocation beyond object bounds: "
3384 "obj %p target %d offset %d size %d.\n",
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003385 obj, reloc->target_handle,
3386 (int) reloc->offset, (int) obj->size);
Eric Anholt673a3942008-07-30 12:06:12 -07003387 drm_gem_object_unreference(target_obj);
3388 i915_gem_object_unpin(obj);
3389 return -EINVAL;
3390 }
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003391 if (reloc->offset & 3) {
Eric Anholt673a3942008-07-30 12:06:12 -07003392 DRM_ERROR("Relocation not 4-byte aligned: "
3393 "obj %p target %d offset %d.\n",
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003394 obj, reloc->target_handle,
3395 (int) reloc->offset);
Eric Anholt673a3942008-07-30 12:06:12 -07003396 drm_gem_object_unreference(target_obj);
3397 i915_gem_object_unpin(obj);
3398 return -EINVAL;
3399 }
3400
Chris Wilson8542a0b2009-09-09 21:15:15 +01003401 /* and points to somewhere within the target object. */
Chris Wilsoncd0b9fb2009-09-15 23:23:18 +01003402 if (reloc->delta >= target_obj->size) {
3403 DRM_ERROR("Relocation beyond target object bounds: "
3404 "obj %p target %d delta %d size %d.\n",
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003405 obj, reloc->target_handle,
Chris Wilsoncd0b9fb2009-09-15 23:23:18 +01003406 (int) reloc->delta, (int) target_obj->size);
Chris Wilson491152b2009-02-11 14:26:32 +00003407 drm_gem_object_unreference(target_obj);
3408 i915_gem_object_unpin(obj);
Eric Anholte47c68e2008-11-14 13:35:19 -08003409 return -EINVAL;
3410 }
3411
Eric Anholt2ef7eea2008-11-10 10:53:25 -08003412 ret = i915_gem_object_set_to_gtt_domain(obj, 1);
3413 if (ret != 0) {
3414 drm_gem_object_unreference(target_obj);
3415 i915_gem_object_unpin(obj);
 3416			return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003417 }
3418
3419 /* Map the page containing the relocation we're going to
3420 * perform.
3421 */
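		/* The mapping goes through the GTT aperture, so the writel()
		 * below lands in the object's backing pages without requiring
		 * any CPU cache flushing.
		 */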
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003422 reloc_offset = obj_priv->gtt_offset + reloc->offset;
Keith Packard0839ccb2008-10-30 19:38:48 -07003423 reloc_page = io_mapping_map_atomic_wc(dev_priv->mm.gtt_mapping,
3424 (reloc_offset &
3425 ~(PAGE_SIZE - 1)));
Eric Anholt3043c602008-10-02 12:24:47 -07003426 reloc_entry = (uint32_t __iomem *)(reloc_page +
Keith Packard0839ccb2008-10-30 19:38:48 -07003427 (reloc_offset & (PAGE_SIZE - 1)));
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003428 reloc_val = target_obj_priv->gtt_offset + reloc->delta;
Eric Anholt673a3942008-07-30 12:06:12 -07003429
3430#if WATCH_BUF
3431 DRM_INFO("Applied relocation: %p@0x%08x %08x -> %08x\n",
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003432 obj, (unsigned int) reloc->offset,
Eric Anholt673a3942008-07-30 12:06:12 -07003433 readl(reloc_entry), reloc_val);
3434#endif
3435 writel(reloc_val, reloc_entry);
Keith Packard0839ccb2008-10-30 19:38:48 -07003436 io_mapping_unmap_atomic(reloc_page);
Eric Anholt673a3942008-07-30 12:06:12 -07003437
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003438 /* The updated presumed offset for this entry will be
3439 * copied back out to the user.
Eric Anholt673a3942008-07-30 12:06:12 -07003440 */
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003441 reloc->presumed_offset = target_obj_priv->gtt_offset;
Eric Anholt673a3942008-07-30 12:06:12 -07003442
3443 drm_gem_object_unreference(target_obj);
3444 }
3445
Eric Anholt673a3942008-07-30 12:06:12 -07003446#if WATCH_BUF
3447 if (0)
3448 i915_gem_dump_object(obj, 128, __func__, ~0);
3449#endif
3450 return 0;
3451}
3452
Eric Anholt673a3942008-07-30 12:06:12 -07003453/* Throttle our rendering by waiting until the ring has completed our requests
3454 * emitted over 20 msec ago.
3455 *
Eric Anholtb9624422009-06-03 07:27:35 +00003456 * Note that if we were to use the current jiffies each time around the loop,
3457 * we wouldn't escape the function with any frames outstanding if the time to
3458 * render a frame was over 20ms.
3459 *
Eric Anholt673a3942008-07-30 12:06:12 -07003460 * This should get us reasonable parallelism between CPU and GPU but also
3461 * relatively low latency when blocking on a particular request to finish.
3462 */
3463static int
3464i915_gem_ring_throttle(struct drm_device *dev, struct drm_file *file_priv)
3465{
3466 struct drm_i915_file_private *i915_file_priv = file_priv->driver_priv;
3467 int ret = 0;
Eric Anholtb9624422009-06-03 07:27:35 +00003468 unsigned long recent_enough = jiffies - msecs_to_jiffies(20);
Eric Anholt673a3942008-07-30 12:06:12 -07003469
3470 mutex_lock(&dev->struct_mutex);
Eric Anholtb9624422009-06-03 07:27:35 +00003471 while (!list_empty(&i915_file_priv->mm.request_list)) {
3472 struct drm_i915_gem_request *request;
3473
3474 request = list_first_entry(&i915_file_priv->mm.request_list,
3475 struct drm_i915_gem_request,
3476 client_list);
3477
3478 if (time_after_eq(request->emitted_jiffies, recent_enough))
3479 break;
3480
Zou Nan hai852835f2010-05-21 09:08:56 +08003481 ret = i915_wait_request(dev, request->seqno, request->ring);
Eric Anholtb9624422009-06-03 07:27:35 +00003482 if (ret != 0)
3483 break;
3484 }
Eric Anholt673a3942008-07-30 12:06:12 -07003485 mutex_unlock(&dev->struct_mutex);
Eric Anholtb9624422009-06-03 07:27:35 +00003486
Eric Anholt673a3942008-07-30 12:06:12 -07003487 return ret;
3488}
3489
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003490static int
Jesse Barnes76446ca2009-12-17 22:05:42 -05003491i915_gem_get_relocs_from_user(struct drm_i915_gem_exec_object2 *exec_list,
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003492 uint32_t buffer_count,
3493 struct drm_i915_gem_relocation_entry **relocs)
3494{
3495 uint32_t reloc_count = 0, reloc_index = 0, i;
3496 int ret;
3497
3498 *relocs = NULL;
3499 for (i = 0; i < buffer_count; i++) {
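		/* Unsigned overflow check: a wrapped sum would let us
		 * allocate too small a relocation array below.
		 */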
3500 if (reloc_count + exec_list[i].relocation_count < reloc_count)
3501 return -EINVAL;
3502 reloc_count += exec_list[i].relocation_count;
3503 }
3504
Jesse Barnes8e7d2b22009-05-08 16:13:25 -07003505 *relocs = drm_calloc_large(reloc_count, sizeof(**relocs));
Jesse Barnes76446ca2009-12-17 22:05:42 -05003506 if (*relocs == NULL) {
3507 DRM_ERROR("failed to alloc relocs, count %d\n", reloc_count);
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003508 return -ENOMEM;
Jesse Barnes76446ca2009-12-17 22:05:42 -05003509 }
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003510
3511 for (i = 0; i < buffer_count; i++) {
3512 struct drm_i915_gem_relocation_entry __user *user_relocs;
3513
3514 user_relocs = (void __user *)(uintptr_t)exec_list[i].relocs_ptr;
3515
3516 ret = copy_from_user(&(*relocs)[reloc_index],
3517 user_relocs,
3518 exec_list[i].relocation_count *
3519 sizeof(**relocs));
3520 if (ret != 0) {
Jesse Barnes8e7d2b22009-05-08 16:13:25 -07003521 drm_free_large(*relocs);
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003522 *relocs = NULL;
Florian Mickler2bc43b52009-04-06 22:55:41 +02003523 return -EFAULT;
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003524 }
3525
3526 reloc_index += exec_list[i].relocation_count;
3527 }
3528
Florian Mickler2bc43b52009-04-06 22:55:41 +02003529 return 0;
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003530}
3531
3532static int
Jesse Barnes76446ca2009-12-17 22:05:42 -05003533i915_gem_put_relocs_to_user(struct drm_i915_gem_exec_object2 *exec_list,
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003534 uint32_t buffer_count,
3535 struct drm_i915_gem_relocation_entry *relocs)
3536{
3537 uint32_t reloc_count = 0, i;
Florian Mickler2bc43b52009-04-06 22:55:41 +02003538 int ret = 0;
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003539
Chris Wilson93533c22010-01-31 10:40:48 +00003540 if (relocs == NULL)
3541 return 0;
3542
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003543 for (i = 0; i < buffer_count; i++) {
3544 struct drm_i915_gem_relocation_entry __user *user_relocs;
Florian Mickler2bc43b52009-04-06 22:55:41 +02003545 int unwritten;
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003546
3547 user_relocs = (void __user *)(uintptr_t)exec_list[i].relocs_ptr;
3548
Florian Mickler2bc43b52009-04-06 22:55:41 +02003549 unwritten = copy_to_user(user_relocs,
3550 &relocs[reloc_count],
3551 exec_list[i].relocation_count *
3552 sizeof(*relocs));
3553
3554 if (unwritten) {
3555 ret = -EFAULT;
3556 goto err;
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003557 }
3558
3559 reloc_count += exec_list[i].relocation_count;
3560 }
3561
Florian Mickler2bc43b52009-04-06 22:55:41 +02003562err:
Jesse Barnes8e7d2b22009-05-08 16:13:25 -07003563 drm_free_large(relocs);
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003564
3565 return ret;
3566}
3567
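/* Sanity-check the batch range: both the effective start address and the
 * length must be 8-byte aligned, and the batch must not start at zero.
 */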
Chris Wilson83d60792009-06-06 09:45:57 +01003568static int
Jesse Barnes76446ca2009-12-17 22:05:42 -05003569i915_gem_check_execbuffer(struct drm_i915_gem_execbuffer2 *exec,
Chris Wilson83d60792009-06-06 09:45:57 +01003570 uint64_t exec_offset)
3571{
3572 uint32_t exec_start, exec_len;
3573
3574 exec_start = (uint32_t) exec_offset + exec->batch_start_offset;
3575 exec_len = (uint32_t) exec->batch_len;
3576
3577 if ((exec_start | exec_len) & 0x7)
3578 return -EINVAL;
3579
3580 if (!exec_start)
3581 return -EINVAL;
3582
3583 return 0;
3584}
3585
Kristian Høgsberg6b95a202009-11-18 11:25:18 -05003586static int
3587i915_gem_wait_for_pending_flip(struct drm_device *dev,
3588 struct drm_gem_object **object_list,
3589 int count)
3590{
3591 drm_i915_private_t *dev_priv = dev->dev_private;
3592 struct drm_i915_gem_object *obj_priv;
3593 DEFINE_WAIT(wait);
3594 int i, ret = 0;
3595
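	/* Classic wait-queue loop: register on the flip queue, re-check
	 * every object's pending_flip count, and sleep with struct_mutex
	 * dropped until no flips remain outstanding.
	 */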
3596 for (;;) {
3597 prepare_to_wait(&dev_priv->pending_flip_queue,
3598 &wait, TASK_INTERRUPTIBLE);
3599 for (i = 0; i < count; i++) {
Daniel Vetter23010e42010-03-08 13:35:02 +01003600 obj_priv = to_intel_bo(object_list[i]);
Kristian Høgsberg6b95a202009-11-18 11:25:18 -05003601 if (atomic_read(&obj_priv->pending_flip) > 0)
3602 break;
3603 }
3604 if (i == count)
3605 break;
3606
3607 if (!signal_pending(current)) {
3608 mutex_unlock(&dev->struct_mutex);
3609 schedule();
3610 mutex_lock(&dev->struct_mutex);
3611 continue;
3612 }
3613 ret = -ERESTARTSYS;
3614 break;
3615 }
3616 finish_wait(&dev_priv->pending_flip_queue, &wait);
3617
3618 return ret;
3619}
3620
Eric Anholt673a3942008-07-30 12:06:12 -07003621int
Jesse Barnes76446ca2009-12-17 22:05:42 -05003622i915_gem_do_execbuffer(struct drm_device *dev, void *data,
3623 struct drm_file *file_priv,
3624 struct drm_i915_gem_execbuffer2 *args,
3625 struct drm_i915_gem_exec_object2 *exec_list)
Eric Anholt673a3942008-07-30 12:06:12 -07003626{
3627 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07003628 struct drm_gem_object **object_list = NULL;
3629 struct drm_gem_object *batch_obj;
Kristian Høgsbergb70d11d2009-03-03 14:45:57 -05003630 struct drm_i915_gem_object *obj_priv;
Eric Anholt201361a2009-03-11 12:30:04 -07003631 struct drm_clip_rect *cliprects = NULL;
Chris Wilson93533c22010-01-31 10:40:48 +00003632 struct drm_i915_gem_relocation_entry *relocs = NULL;
Jesse Barnes76446ca2009-12-17 22:05:42 -05003633 int ret = 0, ret2, i, pinned = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07003634 uint64_t exec_offset;
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003635 uint32_t seqno, flush_domains, reloc_index;
Kristian Høgsberg6b95a202009-11-18 11:25:18 -05003636 int pin_tries, flips;
Eric Anholt673a3942008-07-30 12:06:12 -07003637
Zou Nan hai852835f2010-05-21 09:08:56 +08003638 struct intel_ring_buffer *ring = NULL;
3639
Eric Anholt673a3942008-07-30 12:06:12 -07003640#if WATCH_EXEC
3641 DRM_INFO("buffers_ptr %d buffer_count %d len %08x\n",
3642 (int) args->buffers_ptr, args->buffer_count, args->batch_len);
3643#endif
3644
Eric Anholt4f481ed2008-09-10 14:22:49 -07003645 if (args->buffer_count < 1) {
3646 DRM_ERROR("execbuf with %d buffers\n", args->buffer_count);
3647 return -EINVAL;
3648 }
Eric Anholtc8e0f932009-11-22 03:49:37 +01003649 object_list = drm_malloc_ab(sizeof(*object_list), args->buffer_count);
Jesse Barnes76446ca2009-12-17 22:05:42 -05003650 if (object_list == NULL) {
3651 DRM_ERROR("Failed to allocate object list for %d buffers\n",
Eric Anholt673a3942008-07-30 12:06:12 -07003652 args->buffer_count);
3653 ret = -ENOMEM;
3654 goto pre_mutex_err;
3655 }
Eric Anholt673a3942008-07-30 12:06:12 -07003656
Eric Anholt201361a2009-03-11 12:30:04 -07003657 if (args->num_cliprects != 0) {
Eric Anholt9a298b22009-03-24 12:23:04 -07003658 cliprects = kcalloc(args->num_cliprects, sizeof(*cliprects),
3659 GFP_KERNEL);
Owain Ainswortha40e8d32010-02-09 14:25:55 +00003660 if (cliprects == NULL) {
3661 ret = -ENOMEM;
Eric Anholt201361a2009-03-11 12:30:04 -07003662 goto pre_mutex_err;
Owain Ainswortha40e8d32010-02-09 14:25:55 +00003663 }
Eric Anholt201361a2009-03-11 12:30:04 -07003664
3665 ret = copy_from_user(cliprects,
3666 (struct drm_clip_rect __user *)
3667 (uintptr_t) args->cliprects_ptr,
3668 sizeof(*cliprects) * args->num_cliprects);
3669 if (ret != 0) {
3670 DRM_ERROR("copy %d cliprects failed: %d\n",
3671 args->num_cliprects, ret);
3672 goto pre_mutex_err;
3673 }
3674 }
3675
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003676 ret = i915_gem_get_relocs_from_user(exec_list, args->buffer_count,
3677 &relocs);
3678 if (ret != 0)
3679 goto pre_mutex_err;
3680
Eric Anholt673a3942008-07-30 12:06:12 -07003681 mutex_lock(&dev->struct_mutex);
3682
3683 i915_verify_inactive(dev, __FILE__, __LINE__);
3684
Ben Gamariba1234d2009-09-14 17:48:47 -04003685 if (atomic_read(&dev_priv->mm.wedged)) {
Eric Anholt673a3942008-07-30 12:06:12 -07003686 mutex_unlock(&dev->struct_mutex);
Chris Wilsona198bc82009-02-06 16:55:20 +00003687 ret = -EIO;
3688 goto pre_mutex_err;
Eric Anholt673a3942008-07-30 12:06:12 -07003689 }
3690
3691 if (dev_priv->mm.suspended) {
Eric Anholt673a3942008-07-30 12:06:12 -07003692 mutex_unlock(&dev->struct_mutex);
Chris Wilsona198bc82009-02-06 16:55:20 +00003693 ret = -EBUSY;
3694 goto pre_mutex_err;
Eric Anholt673a3942008-07-30 12:06:12 -07003695 }
3696
Zou Nan hai852835f2010-05-21 09:08:56 +08003697 ring = &dev_priv->render_ring;
3698
Keith Packardac94a962008-11-20 23:30:27 -08003699 /* Look up object handles */
Kristian Høgsberg6b95a202009-11-18 11:25:18 -05003700 flips = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07003701 for (i = 0; i < args->buffer_count; i++) {
3702 object_list[i] = drm_gem_object_lookup(dev, file_priv,
3703 exec_list[i].handle);
3704 if (object_list[i] == NULL) {
3705 DRM_ERROR("Invalid object handle %d at index %d\n",
3706 exec_list[i].handle, i);
Chris Wilson0ce907f2010-01-23 20:26:35 +00003707 /* prevent error path from reading uninitialized data */
3708 args->buffer_count = i + 1;
Eric Anholt673a3942008-07-30 12:06:12 -07003709 ret = -EBADF;
3710 goto err;
3711 }
Kristian Høgsbergb70d11d2009-03-03 14:45:57 -05003712
Daniel Vetter23010e42010-03-08 13:35:02 +01003713 obj_priv = to_intel_bo(object_list[i]);
Kristian Høgsbergb70d11d2009-03-03 14:45:57 -05003714 if (obj_priv->in_execbuffer) {
3715 DRM_ERROR("Object %p appears more than once in object list\n",
3716 object_list[i]);
Chris Wilson0ce907f2010-01-23 20:26:35 +00003717 /* prevent error path from reading uninitialized data */
3718 args->buffer_count = i + 1;
Kristian Høgsbergb70d11d2009-03-03 14:45:57 -05003719 ret = -EBADF;
3720 goto err;
3721 }
3722 obj_priv->in_execbuffer = true;
Kristian Høgsberg6b95a202009-11-18 11:25:18 -05003723 flips += atomic_read(&obj_priv->pending_flip);
3724 }
3725
3726 if (flips > 0) {
3727 ret = i915_gem_wait_for_pending_flip(dev, object_list,
3728 args->buffer_count);
3729 if (ret)
3730 goto err;
Keith Packardac94a962008-11-20 23:30:27 -08003731 }
Eric Anholt673a3942008-07-30 12:06:12 -07003732
Keith Packardac94a962008-11-20 23:30:27 -08003733 /* Pin and relocate */
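	/* First pass: try to pin and relocate every buffer in place. On
	 * -ENOSPC (aperture full) unpin everything, evict the whole GTT,
	 * and retry exactly once more before reporting failure.
	 */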
3734 for (pin_tries = 0; ; pin_tries++) {
3735 ret = 0;
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003736 reloc_index = 0;
3737
Keith Packardac94a962008-11-20 23:30:27 -08003738 for (i = 0; i < args->buffer_count; i++) {
3739 object_list[i]->pending_read_domains = 0;
3740 object_list[i]->pending_write_domain = 0;
3741 ret = i915_gem_object_pin_and_relocate(object_list[i],
3742 file_priv,
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003743 &exec_list[i],
3744 &relocs[reloc_index]);
Keith Packardac94a962008-11-20 23:30:27 -08003745 if (ret)
3746 break;
3747 pinned = i + 1;
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003748 reloc_index += exec_list[i].relocation_count;
Keith Packardac94a962008-11-20 23:30:27 -08003749 }
3750 /* success */
3751 if (ret == 0)
3752 break;
3753
3754 /* error other than GTT full, or we've already tried again */
Chris Wilson2939e1f2009-06-06 09:46:03 +01003755 if (ret != -ENOSPC || pin_tries >= 1) {
Chris Wilson07f73f62009-09-14 16:50:30 +01003756 if (ret != -ERESTARTSYS) {
3757 unsigned long long total_size = 0;
3758 for (i = 0; i < args->buffer_count; i++)
3759 total_size += object_list[i]->size;
3760 DRM_ERROR("Failed to pin buffer %d of %d, total %llu bytes: %d\n",
3761 pinned+1, args->buffer_count,
3762 total_size, ret);
3763 DRM_ERROR("%d objects [%d pinned], "
3764 "%d object bytes [%d pinned], "
3765 "%d/%d gtt bytes\n",
3766 atomic_read(&dev->object_count),
3767 atomic_read(&dev->pin_count),
3768 atomic_read(&dev->object_memory),
3769 atomic_read(&dev->pin_memory),
3770 atomic_read(&dev->gtt_memory),
3771 dev->gtt_total);
3772 }
Eric Anholt673a3942008-07-30 12:06:12 -07003773 goto err;
3774 }
Keith Packardac94a962008-11-20 23:30:27 -08003775
3776 /* unpin all of our buffers */
3777 for (i = 0; i < pinned; i++)
3778 i915_gem_object_unpin(object_list[i]);
Eric Anholtb1177632008-12-10 10:09:41 -08003779 pinned = 0;
Keith Packardac94a962008-11-20 23:30:27 -08003780
3781 /* evict everyone we can from the aperture */
3782 ret = i915_gem_evict_everything(dev);
Chris Wilson07f73f62009-09-14 16:50:30 +01003783 if (ret && ret != -ENOSPC)
Keith Packardac94a962008-11-20 23:30:27 -08003784 goto err;
Eric Anholt673a3942008-07-30 12:06:12 -07003785 }
3786
3787 /* Set the pending read domains for the batch buffer to COMMAND */
3788 batch_obj = object_list[args->buffer_count-1];
Chris Wilson5f26a2c2009-06-06 09:45:58 +01003789 if (batch_obj->pending_write_domain) {
3790 DRM_ERROR("Attempting to use self-modifying batch buffer\n");
3791 ret = -EINVAL;
3792 goto err;
3793 }
3794 batch_obj->pending_read_domains |= I915_GEM_DOMAIN_COMMAND;
Eric Anholt673a3942008-07-30 12:06:12 -07003795
Chris Wilson83d60792009-06-06 09:45:57 +01003796 /* Sanity check the batch buffer, prior to moving objects */
3797 exec_offset = exec_list[args->buffer_count - 1].offset;
 3798	ret = i915_gem_check_execbuffer(args, exec_offset);
3799 if (ret != 0) {
3800 DRM_ERROR("execbuf with invalid offset/length\n");
3801 goto err;
3802 }
3803
Eric Anholt673a3942008-07-30 12:06:12 -07003804 i915_verify_inactive(dev, __FILE__, __LINE__);
3805
Keith Packard646f0f62008-11-20 23:23:03 -08003806 /* Zero the global flush/invalidate flags. These
3807 * will be modified as new domains are computed
3808 * for each object
3809 */
3810 dev->invalidate_domains = 0;
3811 dev->flush_domains = 0;
3812
Eric Anholt673a3942008-07-30 12:06:12 -07003813 for (i = 0; i < args->buffer_count; i++) {
3814 struct drm_gem_object *obj = object_list[i];
Eric Anholt673a3942008-07-30 12:06:12 -07003815
Keith Packard646f0f62008-11-20 23:23:03 -08003816 /* Compute new gpu domains and update invalidate/flush */
Eric Anholt8b0e3782009-02-19 14:40:50 -08003817 i915_gem_object_set_to_gpu_domain(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07003818 }
3819
3820 i915_verify_inactive(dev, __FILE__, __LINE__);
3821
Keith Packard646f0f62008-11-20 23:23:03 -08003822 if (dev->invalidate_domains | dev->flush_domains) {
3823#if WATCH_EXEC
3824 DRM_INFO("%s: invalidate_domains %08x flush_domains %08x\n",
3825 __func__,
3826 dev->invalidate_domains,
3827 dev->flush_domains);
3828#endif
3829 i915_gem_flush(dev,
3830 dev->invalidate_domains,
3831 dev->flush_domains);
Zou Nan hai852835f2010-05-21 09:08:56 +08003832 if (dev->flush_domains & I915_GEM_GPU_DOMAINS) {
Eric Anholtb9624422009-06-03 07:27:35 +00003833 (void)i915_add_request(dev, file_priv,
Zou Nan hai852835f2010-05-21 09:08:56 +08003834 dev->flush_domains,
3835 &dev_priv->render_ring);
3836
3837 }
Keith Packard646f0f62008-11-20 23:23:03 -08003838 }
Eric Anholt673a3942008-07-30 12:06:12 -07003839
Eric Anholtefbeed92009-02-19 14:54:51 -08003840 for (i = 0; i < args->buffer_count; i++) {
3841 struct drm_gem_object *obj = object_list[i];
Daniel Vetter23010e42010-03-08 13:35:02 +01003842 struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003843 uint32_t old_write_domain = obj->write_domain;
Eric Anholtefbeed92009-02-19 14:54:51 -08003844
3845 obj->write_domain = obj->pending_write_domain;
Daniel Vetter99fcb762010-02-07 16:20:18 +01003846 if (obj->write_domain)
3847 list_move_tail(&obj_priv->gpu_write_list,
3848 &dev_priv->mm.gpu_write_list);
3849 else
3850 list_del_init(&obj_priv->gpu_write_list);
3851
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003852 trace_i915_gem_object_change_domain(obj,
3853 obj->read_domains,
3854 old_write_domain);
Eric Anholtefbeed92009-02-19 14:54:51 -08003855 }
3856
Eric Anholt673a3942008-07-30 12:06:12 -07003857 i915_verify_inactive(dev, __FILE__, __LINE__);
3858
3859#if WATCH_COHERENCY
3860 for (i = 0; i < args->buffer_count; i++) {
3861 i915_gem_object_check_coherency(object_list[i],
3862 exec_list[i].handle);
3863 }
3864#endif
3865
Eric Anholt673a3942008-07-30 12:06:12 -07003866#if WATCH_EXEC
Ben Gamari6911a9b2009-04-02 11:24:54 -07003867 i915_gem_dump_object(batch_obj,
Eric Anholt673a3942008-07-30 12:06:12 -07003868 args->batch_len,
3869 __func__,
3870 ~0);
3871#endif
3872
Eric Anholt673a3942008-07-30 12:06:12 -07003873 /* Exec the batchbuffer */
Zou Nan hai852835f2010-05-21 09:08:56 +08003874 ret = ring->dispatch_gem_execbuffer(dev, ring, args,
3875 cliprects, exec_offset);
Eric Anholt673a3942008-07-30 12:06:12 -07003876 if (ret) {
3877 DRM_ERROR("dispatch failed %d\n", ret);
3878 goto err;
3879 }
3880
3881 /*
3882 * Ensure that the commands in the batch buffer are
3883 * finished before the interrupt fires
3884 */
Zou Nan hai852835f2010-05-21 09:08:56 +08003885 flush_domains = i915_retire_commands(dev, ring);
Eric Anholt673a3942008-07-30 12:06:12 -07003886
3887 i915_verify_inactive(dev, __FILE__, __LINE__);
3888
3889 /*
3890 * Get a seqno representing the execution of the current buffer,
3891 * which we can wait on. We would like to mitigate these interrupts,
3892 * likely by only creating seqnos occasionally (so that we have
3893 * *some* interrupts representing completion of buffers that we can
3894 * wait on when trying to clear up gtt space).
3895 */
Zou Nan hai852835f2010-05-21 09:08:56 +08003896 seqno = i915_add_request(dev, file_priv, flush_domains, ring);
Eric Anholt673a3942008-07-30 12:06:12 -07003897 BUG_ON(seqno == 0);
Eric Anholt673a3942008-07-30 12:06:12 -07003898 for (i = 0; i < args->buffer_count; i++) {
3899 struct drm_gem_object *obj = object_list[i];
Zou Nan hai852835f2010-05-21 09:08:56 +08003900 obj_priv = to_intel_bo(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07003901
Zou Nan hai852835f2010-05-21 09:08:56 +08003902 i915_gem_object_move_to_active(obj, seqno, ring);
Eric Anholt673a3942008-07-30 12:06:12 -07003903#if WATCH_LRU
3904 DRM_INFO("%s: move to exec list %p\n", __func__, obj);
3905#endif
3906 }
3907#if WATCH_LRU
3908 i915_dump_lru(dev, __func__);
3909#endif
3910
3911 i915_verify_inactive(dev, __FILE__, __LINE__);
3912
Eric Anholt673a3942008-07-30 12:06:12 -07003913err:
Julia Lawallaad87df2008-12-21 16:28:47 +01003914 for (i = 0; i < pinned; i++)
3915 i915_gem_object_unpin(object_list[i]);
Eric Anholt673a3942008-07-30 12:06:12 -07003916
Kristian Høgsbergb70d11d2009-03-03 14:45:57 -05003917 for (i = 0; i < args->buffer_count; i++) {
3918 if (object_list[i]) {
Daniel Vetter23010e42010-03-08 13:35:02 +01003919 obj_priv = to_intel_bo(object_list[i]);
Kristian Høgsbergb70d11d2009-03-03 14:45:57 -05003920 obj_priv->in_execbuffer = false;
3921 }
Julia Lawallaad87df2008-12-21 16:28:47 +01003922 drm_gem_object_unreference(object_list[i]);
Kristian Høgsbergb70d11d2009-03-03 14:45:57 -05003923 }
Julia Lawallaad87df2008-12-21 16:28:47 +01003924
Eric Anholt673a3942008-07-30 12:06:12 -07003925 mutex_unlock(&dev->struct_mutex);
3926
Chris Wilson93533c22010-01-31 10:40:48 +00003927pre_mutex_err:
Eric Anholt40a5f0d2009-03-12 11:23:52 -07003928 /* Copy the updated relocations out regardless of current error
3929 * state. Failure to update the relocs would mean that the next
3930 * time userland calls execbuf, it would do so with presumed offset
3931 * state that didn't match the actual object state.
3932 */
3933 ret2 = i915_gem_put_relocs_to_user(exec_list, args->buffer_count,
3934 relocs);
3935 if (ret2 != 0) {
3936 DRM_ERROR("Failed to copy relocations back out: %d\n", ret2);
3937
3938 if (ret == 0)
3939 ret = ret2;
3940 }
3941
Jesse Barnes8e7d2b22009-05-08 16:13:25 -07003942 drm_free_large(object_list);
Eric Anholt9a298b22009-03-24 12:23:04 -07003943 kfree(cliprects);
Eric Anholt673a3942008-07-30 12:06:12 -07003944
3945 return ret;
3946}
3947
Jesse Barnes76446ca2009-12-17 22:05:42 -05003948/*
3949 * Legacy execbuffer just creates an exec2 list from the original exec object
3950 * list array and passes it to the real function.
3951 */
3952int
3953i915_gem_execbuffer(struct drm_device *dev, void *data,
3954 struct drm_file *file_priv)
3955{
3956 struct drm_i915_gem_execbuffer *args = data;
3957 struct drm_i915_gem_execbuffer2 exec2;
3958 struct drm_i915_gem_exec_object *exec_list = NULL;
3959 struct drm_i915_gem_exec_object2 *exec2_list = NULL;
3960 int ret, i;
3961
3962#if WATCH_EXEC
3963 DRM_INFO("buffers_ptr %d buffer_count %d len %08x\n",
3964 (int) args->buffers_ptr, args->buffer_count, args->batch_len);
3965#endif
3966
3967 if (args->buffer_count < 1) {
3968 DRM_ERROR("execbuf with %d buffers\n", args->buffer_count);
3969 return -EINVAL;
3970 }
3971
3972 /* Copy in the exec list from userland */
3973 exec_list = drm_malloc_ab(sizeof(*exec_list), args->buffer_count);
3974 exec2_list = drm_malloc_ab(sizeof(*exec2_list), args->buffer_count);
3975 if (exec_list == NULL || exec2_list == NULL) {
3976 DRM_ERROR("Failed to allocate exec list for %d buffers\n",
3977 args->buffer_count);
3978 drm_free_large(exec_list);
3979 drm_free_large(exec2_list);
3980 return -ENOMEM;
3981 }
3982 ret = copy_from_user(exec_list,
 3983			     (struct drm_i915_gem_exec_object __user *)
3984 (uintptr_t) args->buffers_ptr,
3985 sizeof(*exec_list) * args->buffer_count);
3986 if (ret != 0) {
3987 DRM_ERROR("copy %d exec entries failed %d\n",
3988 args->buffer_count, ret);
3989 drm_free_large(exec_list);
3990 drm_free_large(exec2_list);
3991 return -EFAULT;
3992 }
3993
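	/* Convert each legacy exec object to its exec2 equivalent. Pre-965
	 * hardware needs fence registers to blit tiled surfaces, so flag
	 * every buffer as needing a fence there; 965+ leaves it clear.
	 */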
3994 for (i = 0; i < args->buffer_count; i++) {
3995 exec2_list[i].handle = exec_list[i].handle;
3996 exec2_list[i].relocation_count = exec_list[i].relocation_count;
3997 exec2_list[i].relocs_ptr = exec_list[i].relocs_ptr;
3998 exec2_list[i].alignment = exec_list[i].alignment;
3999 exec2_list[i].offset = exec_list[i].offset;
4000 if (!IS_I965G(dev))
4001 exec2_list[i].flags = EXEC_OBJECT_NEEDS_FENCE;
4002 else
4003 exec2_list[i].flags = 0;
4004 }
4005
4006 exec2.buffers_ptr = args->buffers_ptr;
4007 exec2.buffer_count = args->buffer_count;
4008 exec2.batch_start_offset = args->batch_start_offset;
4009 exec2.batch_len = args->batch_len;
4010 exec2.DR1 = args->DR1;
4011 exec2.DR4 = args->DR4;
4012 exec2.num_cliprects = args->num_cliprects;
4013 exec2.cliprects_ptr = args->cliprects_ptr;
Zou Nan hai852835f2010-05-21 09:08:56 +08004014 exec2.flags = I915_EXEC_RENDER;
Jesse Barnes76446ca2009-12-17 22:05:42 -05004015
4016 ret = i915_gem_do_execbuffer(dev, data, file_priv, &exec2, exec2_list);
4017 if (!ret) {
4018 /* Copy the new buffer offsets back to the user's exec list. */
4019 for (i = 0; i < args->buffer_count; i++)
4020 exec_list[i].offset = exec2_list[i].offset;
4021 /* ... and back out to userspace */
 4022		ret = copy_to_user((struct drm_i915_gem_exec_object __user *)
4023 (uintptr_t) args->buffers_ptr,
4024 exec_list,
4025 sizeof(*exec_list) * args->buffer_count);
4026 if (ret) {
4027 ret = -EFAULT;
4028 DRM_ERROR("failed to copy %d exec entries "
4029 "back to user (%d)\n",
4030 args->buffer_count, ret);
4031 }
Jesse Barnes76446ca2009-12-17 22:05:42 -05004032 }

	drm_free_large(exec_list);
	drm_free_large(exec2_list);
	return ret;
}
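
/*
 * Note on the conversion above: the legacy interface has no per-object
 * flags, so the wrapper is deliberately conservative and marks every
 * buffer as needing a fence register on pre-965 chipsets, where tiled
 * access (e.g. by the blitter) has to go through a fence. On 965+ the
 * GPU can address tiled surfaces without fences, so the flag is left
 * clear and fences are only assigned where actually required.
 */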

int
i915_gem_execbuffer2(struct drm_device *dev, void *data,
		     struct drm_file *file_priv)
{
	struct drm_i915_gem_execbuffer2 *args = data;
	struct drm_i915_gem_exec_object2 *exec2_list = NULL;
	int ret;

#if WATCH_EXEC
	DRM_INFO("buffers_ptr %d buffer_count %d len %08x\n",
		 (int) args->buffers_ptr, args->buffer_count, args->batch_len);
#endif

	if (args->buffer_count < 1) {
		DRM_ERROR("execbuf2 with %d buffers\n", args->buffer_count);
		return -EINVAL;
	}

	exec2_list = drm_malloc_ab(sizeof(*exec2_list), args->buffer_count);
	if (exec2_list == NULL) {
		DRM_ERROR("Failed to allocate exec list for %d buffers\n",
			  args->buffer_count);
		return -ENOMEM;
	}
	ret = copy_from_user(exec2_list,
			     (struct drm_i915_gem_exec_object2 __user *)
			     (uintptr_t) args->buffers_ptr,
			     sizeof(*exec2_list) * args->buffer_count);
	if (ret != 0) {
		DRM_ERROR("copy %d exec entries failed %d\n",
			  args->buffer_count, ret);
		drm_free_large(exec2_list);
		return -EFAULT;
	}

	ret = i915_gem_do_execbuffer(dev, data, file_priv, args, exec2_list);
	if (!ret) {
		/* Copy the new buffer offsets back to the user's exec list. */
		ret = copy_to_user((struct drm_i915_gem_exec_object2 __user *)
				   (uintptr_t) args->buffers_ptr,
				   exec2_list,
				   sizeof(*exec2_list) * args->buffer_count);
		if (ret) {
			DRM_ERROR("failed to copy %d exec entries "
				  "back to user (%d)\n",
				  args->buffer_count, ret);
			ret = -EFAULT;
		}
	}

	drm_free_large(exec2_list);
	return ret;
}
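
/*
 * For reference, a minimal sketch of how userspace drives this ioctl
 * (libdrm-style; buffer setup, relocations and error handling omitted,
 * and the variable names are illustrative, not from any real client):
 *
 *	struct drm_i915_gem_exec_object2 objs[2] = {
 *		{ .handle = bo_handle },
 *		{ .handle = batch_handle },	// batch buffer goes last
 *	};
 *	struct drm_i915_gem_execbuffer2 execbuf = {
 *		.buffers_ptr = (uintptr_t)objs,
 *		.buffer_count = 2,
 *		.batch_len = batch_bytes,
 *		.flags = I915_EXEC_RENDER,
 *	};
 *	drmIoctl(fd, DRM_IOCTL_I915_GEM_EXECBUFFER2, &execbuf);
 *
 * On success the kernel writes each object's final GTT offset back into
 * objs[i].offset, which clients cache as the presumed offset for the
 * next submission.
 */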

int
i915_gem_object_pin(struct drm_gem_object *obj, uint32_t alignment)
{
	struct drm_device *dev = obj->dev;
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	int ret;

	i915_verify_inactive(dev, __FILE__, __LINE__);
	if (obj_priv->gtt_space == NULL) {
		ret = i915_gem_object_bind_to_gtt(obj, alignment);
		if (ret)
			return ret;
	}

	obj_priv->pin_count++;

	/* If the object is not active and not pending a flush,
	 * remove it from the inactive list
	 */
	if (obj_priv->pin_count == 1) {
		atomic_inc(&dev->pin_count);
		atomic_add(obj->size, &dev->pin_memory);
		if (!obj_priv->active &&
		    (obj->write_domain & I915_GEM_GPU_DOMAINS) == 0 &&
		    !list_empty(&obj_priv->list))
			list_del_init(&obj_priv->list);
	}
	i915_verify_inactive(dev, __FILE__, __LINE__);

	return 0;
}
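
/*
 * Pinning nails an object into the GTT at its current (or newly bound)
 * offset so the CPU or display hardware can rely on that address. The
 * pin count nests: only the first pin and the last unpin transition
 * move the object on and off the inactive list and update the global
 * pin accounting in dev->pin_count / dev->pin_memory.
 */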

void
i915_gem_object_unpin(struct drm_gem_object *obj)
{
	struct drm_device *dev = obj->dev;
	drm_i915_private_t *dev_priv = dev->dev_private;
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);

	i915_verify_inactive(dev, __FILE__, __LINE__);
	obj_priv->pin_count--;
	BUG_ON(obj_priv->pin_count < 0);
	BUG_ON(obj_priv->gtt_space == NULL);

	/* If the object is no longer pinned, and is
	 * neither active nor being flushed, then stick it on
	 * the inactive list
	 */
	if (obj_priv->pin_count == 0) {
		if (!obj_priv->active &&
		    (obj->write_domain & I915_GEM_GPU_DOMAINS) == 0)
			list_move_tail(&obj_priv->list,
				       &dev_priv->mm.inactive_list);
		atomic_dec(&dev->pin_count);
		atomic_sub(obj->size, &dev->pin_memory);
	}
	i915_verify_inactive(dev, __FILE__, __LINE__);
}

int
i915_gem_pin_ioctl(struct drm_device *dev, void *data,
		   struct drm_file *file_priv)
{
	struct drm_i915_gem_pin *args = data;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;
	int ret;

	mutex_lock(&dev->struct_mutex);

	obj = drm_gem_object_lookup(dev, file_priv, args->handle);
	if (obj == NULL) {
		DRM_ERROR("Bad handle in i915_gem_pin_ioctl(): %d\n",
			  args->handle);
		mutex_unlock(&dev->struct_mutex);
		return -EBADF;
	}
	obj_priv = to_intel_bo(obj);

	if (obj_priv->madv != I915_MADV_WILLNEED) {
		DRM_ERROR("Attempting to pin a purgeable buffer\n");
		drm_gem_object_unreference(obj);
		mutex_unlock(&dev->struct_mutex);
		return -EINVAL;
	}

	if (obj_priv->pin_filp != NULL && obj_priv->pin_filp != file_priv) {
		DRM_ERROR("Already pinned in i915_gem_pin_ioctl(): %d\n",
			  args->handle);
		drm_gem_object_unreference(obj);
		mutex_unlock(&dev->struct_mutex);
		return -EINVAL;
	}

	obj_priv->user_pin_count++;
	obj_priv->pin_filp = file_priv;
	if (obj_priv->user_pin_count == 1) {
		ret = i915_gem_object_pin(obj, args->alignment);
		if (ret != 0) {
			/* Undo the bookkeeping above, or a retry would
			 * wrongly skip the actual pin.
			 */
			obj_priv->user_pin_count--;
			obj_priv->pin_filp = NULL;
			drm_gem_object_unreference(obj);
			mutex_unlock(&dev->struct_mutex);
			return ret;
		}
	}

	/* XXX - flush the CPU caches for pinned objects
	 * as the X server doesn't manage domains yet
	 */
	i915_gem_object_flush_cpu_write_domain(obj);
	args->offset = obj_priv->gtt_offset;
	drm_gem_object_unreference(obj);
	mutex_unlock(&dev->struct_mutex);

	return 0;
}
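
/*
 * The pin/unpin ioctls exist mainly for old userland (the UMS X server)
 * that needs buffers such as scanout and cursor images at a stable GTT
 * offset. pin_filp records which client did the pinning, so only that
 * client may unpin and pins cannot be stacked across clients.
 */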

int
i915_gem_unpin_ioctl(struct drm_device *dev, void *data,
		     struct drm_file *file_priv)
{
	struct drm_i915_gem_pin *args = data;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;

	mutex_lock(&dev->struct_mutex);

	obj = drm_gem_object_lookup(dev, file_priv, args->handle);
	if (obj == NULL) {
		DRM_ERROR("Bad handle in i915_gem_unpin_ioctl(): %d\n",
			  args->handle);
		mutex_unlock(&dev->struct_mutex);
		return -EBADF;
	}

	obj_priv = to_intel_bo(obj);
	if (obj_priv->pin_filp != file_priv) {
		DRM_ERROR("Not pinned by caller in i915_gem_unpin_ioctl(): %d\n",
			  args->handle);
		drm_gem_object_unreference(obj);
		mutex_unlock(&dev->struct_mutex);
		return -EINVAL;
	}
	obj_priv->user_pin_count--;
	if (obj_priv->user_pin_count == 0) {
		obj_priv->pin_filp = NULL;
		i915_gem_object_unpin(obj);
	}

	drm_gem_object_unreference(obj);
	mutex_unlock(&dev->struct_mutex);
	return 0;
}

int
i915_gem_busy_ioctl(struct drm_device *dev, void *data,
		    struct drm_file *file_priv)
{
	struct drm_i915_gem_busy *args = data;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;
	drm_i915_private_t *dev_priv = dev->dev_private;

	obj = drm_gem_object_lookup(dev, file_priv, args->handle);
	if (obj == NULL) {
		DRM_ERROR("Bad handle in i915_gem_busy_ioctl(): %d\n",
			  args->handle);
		return -EBADF;
	}

	mutex_lock(&dev->struct_mutex);
	/* Update the active list for the hardware's current position.
	 * Otherwise this only updates on a delayed timer or when irqs are
	 * actually unmasked, and our working set ends up being larger than
	 * required.
	 */
	i915_gem_retire_requests(dev, &dev_priv->render_ring);

	obj_priv = to_intel_bo(obj);
	/* Don't count being on the flushing list against the object being
	 * done. Otherwise, a buffer left on the flushing list but not getting
	 * flushed (because nobody's flushing that domain) won't ever return
	 * unbusy and get reused by libdrm's bo cache. The other expected
	 * consumer of this interface, OpenGL's occlusion queries, also specs
	 * that the objects get unbusy "eventually" without any interference.
	 */
	args->busy = obj_priv->active && obj_priv->last_rendering_seqno != 0;

	drm_gem_object_unreference(obj);
	mutex_unlock(&dev->struct_mutex);
	return 0;
}
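
/*
 * Userspace typically polls this before recycling a buffer from its
 * cache, roughly along these lines (hypothetical client code):
 *
 *	struct drm_i915_gem_busy busy = { .handle = bo_handle };
 *	drmIoctl(fd, DRM_IOCTL_I915_GEM_BUSY, &busy);
 *	if (!busy.busy)
 *		reuse_buffer(bo_handle);	// safe: GPU is done with it
 */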

int
i915_gem_throttle_ioctl(struct drm_device *dev, void *data,
			struct drm_file *file_priv)
{
	return i915_gem_ring_throttle(dev, file_priv);
}

int
i915_gem_madvise_ioctl(struct drm_device *dev, void *data,
		       struct drm_file *file_priv)
{
	struct drm_i915_gem_madvise *args = data;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;

	switch (args->madv) {
	case I915_MADV_DONTNEED:
	case I915_MADV_WILLNEED:
		break;
	default:
		return -EINVAL;
	}

	obj = drm_gem_object_lookup(dev, file_priv, args->handle);
	if (obj == NULL) {
		DRM_ERROR("Bad handle in i915_gem_madvise_ioctl(): %d\n",
			  args->handle);
		return -EBADF;
	}

	mutex_lock(&dev->struct_mutex);
	obj_priv = to_intel_bo(obj);

	if (obj_priv->pin_count) {
		drm_gem_object_unreference(obj);
		mutex_unlock(&dev->struct_mutex);

		DRM_ERROR("Attempted i915_gem_madvise_ioctl() on a pinned object\n");
		return -EINVAL;
	}

	if (obj_priv->madv != __I915_MADV_PURGED)
		obj_priv->madv = args->madv;

	/* if the object is no longer bound, discard its backing storage */
	if (i915_gem_object_is_purgeable(obj_priv) &&
	    obj_priv->gtt_space == NULL)
		i915_gem_object_truncate(obj);

	args->retained = obj_priv->madv != __I915_MADV_PURGED;

	drm_gem_object_unreference(obj);
	mutex_unlock(&dev->struct_mutex);

	return 0;
}
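
/*
 * I915_MADV_DONTNEED marks an object's backing pages as discardable, so
 * the shrinker (or the truncate above, once the object is unbound) may
 * drop them under memory pressure; I915_MADV_WILLNEED revokes that.
 * args->retained tells the caller whether the pages survived: once an
 * object has been purged it stays __I915_MADV_PURGED and userspace must
 * treat the contents as lost.
 */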

struct drm_gem_object *i915_gem_alloc_object(struct drm_device *dev,
					     size_t size)
{
	struct drm_i915_gem_object *obj;

	obj = kzalloc(sizeof(*obj), GFP_KERNEL);
	if (obj == NULL)
		return NULL;

	if (drm_gem_object_init(dev, &obj->base, size) != 0) {
		kfree(obj);
		return NULL;
	}

	obj->base.write_domain = I915_GEM_DOMAIN_CPU;
	obj->base.read_domains = I915_GEM_DOMAIN_CPU;

	obj->agp_type = AGP_USER_MEMORY;
	obj->base.driver_private = NULL;
	obj->fence_reg = I915_FENCE_REG_NONE;
	INIT_LIST_HEAD(&obj->list);
	INIT_LIST_HEAD(&obj->gpu_write_list);
	obj->madv = I915_MADV_WILLNEED;

	trace_i915_gem_object_create(&obj->base);

	return &obj->base;
}
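
/*
 * Note the allocation pattern: struct drm_i915_gem_object embeds its
 * struct drm_gem_object as "base", so a single kzalloc() covers both
 * and to_intel_bo() is essentially a container_of() in the opposite
 * direction. Fresh objects start out CPU-domain, unbound and unfenced.
 */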

int i915_gem_init_object(struct drm_gem_object *obj)
{
	/* i915 objects are always created via i915_gem_alloc_object(),
	 * so the generic GEM init path must never be reached.
	 */
	BUG();

	return 0;
}

void i915_gem_free_object(struct drm_gem_object *obj)
{
	struct drm_device *dev = obj->dev;
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);

	trace_i915_gem_object_destroy(obj);

	while (obj_priv->pin_count > 0)
		i915_gem_object_unpin(obj);

	if (obj_priv->phys_obj)
		i915_gem_detach_phys_object(dev, obj);

	i915_gem_object_unbind(obj);

	if (obj_priv->mmap_offset)
		i915_gem_free_mmap_offset(obj);

	drm_gem_object_release(obj);

	kfree(obj_priv->page_cpu_valid);
	kfree(obj_priv->bit_17);
	kfree(obj_priv);
}

/** Unbinds all inactive objects. */
static int
i915_gem_evict_from_inactive_list(struct drm_device *dev)
{
	drm_i915_private_t *dev_priv = dev->dev_private;

	while (!list_empty(&dev_priv->mm.inactive_list)) {
		struct drm_gem_object *obj;
		int ret;

		obj = &list_first_entry(&dev_priv->mm.inactive_list,
					struct drm_i915_gem_object,
					list)->base;

		ret = i915_gem_object_unbind(obj);
		if (ret != 0) {
			DRM_ERROR("Error unbinding object: %d\n", ret);
			return ret;
		}
	}

	return 0;
}

int
i915_gem_idle(struct drm_device *dev)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	int ret;

	mutex_lock(&dev->struct_mutex);

	if (dev_priv->mm.suspended ||
	    dev_priv->render_ring.gem_object == NULL) {
		mutex_unlock(&dev->struct_mutex);
		return 0;
	}

	ret = i915_gpu_idle(dev);
	if (ret) {
		mutex_unlock(&dev->struct_mutex);
		return ret;
	}

	/* Under UMS, be paranoid and evict. */
	if (!drm_core_check_feature(dev, DRIVER_MODESET)) {
		ret = i915_gem_evict_from_inactive_list(dev);
		if (ret) {
			mutex_unlock(&dev->struct_mutex);
			return ret;
		}
	}

	/* Hack! Don't let anybody do execbuf while we don't control the chip.
	 * We need to replace this with a semaphore, or something.
	 * And not confound mm.suspended!
	 */
	dev_priv->mm.suspended = 1;
	del_timer(&dev_priv->hangcheck_timer);

	i915_kernel_lost_context(dev);
	i915_gem_cleanup_ringbuffer(dev);

	mutex_unlock(&dev->struct_mutex);

	/* Cancel the retire work handler, which should be idle now. */
	cancel_delayed_work_sync(&dev_priv->mm.retire_work);

	return 0;
}
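
/*
 * The ordering above matters: the GPU is drained first, mm.suspended is
 * set (making further execbuf calls fail) before the ring is torn down,
 * and the retire worker is only cancelled after struct_mutex is
 * dropped, since the worker itself takes that mutex and
 * cancel_delayed_work_sync() could otherwise deadlock against it.
 */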

/*
 * 965+ support PIPE_CONTROL commands, which provide finer grained control
 * over cache flushing.
 */
static int
i915_gem_init_pipe_control(struct drm_device *dev)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;
	int ret;

	obj = i915_gem_alloc_object(dev, 4096);
	if (obj == NULL) {
		DRM_ERROR("Failed to allocate seqno page\n");
		ret = -ENOMEM;
		goto err;
	}
	obj_priv = to_intel_bo(obj);
	obj_priv->agp_type = AGP_USER_CACHED_MEMORY;

	ret = i915_gem_object_pin(obj, 4096);
	if (ret)
		goto err_unref;

	dev_priv->seqno_gfx_addr = obj_priv->gtt_offset;
	dev_priv->seqno_page = kmap(obj_priv->pages[0]);
	if (dev_priv->seqno_page == NULL) {
		ret = -ENOMEM;
		goto err_unpin;
	}

	dev_priv->seqno_obj = obj;
	memset(dev_priv->seqno_page, 0, PAGE_SIZE);

	return 0;

err_unpin:
	i915_gem_object_unpin(obj);
err_unref:
	drm_gem_object_unreference(obj);
err:
	return ret;
}
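
/*
 * The page allocated above is the PIPE_CONTROL seqno page: on chipsets
 * where HAS_PIPE_CONTROL() holds, the request breadcrumb is written via
 * a PIPE_CONTROL command into this cached page at seqno_gfx_addr rather
 * than into the hardware status page, which sidesteps coherency
 * problems with MI_STORE_DWORD writes on those parts.
 */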

static void
i915_gem_cleanup_pipe_control(struct drm_device *dev)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	struct drm_gem_object *obj;
	struct drm_i915_gem_object *obj_priv;

	obj = dev_priv->seqno_obj;
	obj_priv = to_intel_bo(obj);
	kunmap(obj_priv->pages[0]);
	i915_gem_object_unpin(obj);
	drm_gem_object_unreference(obj);
	dev_priv->seqno_obj = NULL;

	dev_priv->seqno_page = NULL;
}

int
i915_gem_init_ringbuffer(struct drm_device *dev)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	int ret;

	dev_priv->render_ring = render_ring;

	if (!I915_NEED_GFX_HWS(dev)) {
		dev_priv->render_ring.status_page.page_addr
			= dev_priv->status_page_dmah->vaddr;
		memset(dev_priv->render_ring.status_page.page_addr,
		       0, PAGE_SIZE);
	}

	if (HAS_PIPE_CONTROL(dev)) {
		ret = i915_gem_init_pipe_control(dev);
		if (ret)
			return ret;
	}

	ret = intel_init_ring_buffer(dev, &dev_priv->render_ring);
	return ret;
}

void
i915_gem_cleanup_ringbuffer(struct drm_device *dev)
{
	drm_i915_private_t *dev_priv = dev->dev_private;

	intel_cleanup_ring_buffer(dev, &dev_priv->render_ring);
	if (HAS_PIPE_CONTROL(dev))
		i915_gem_cleanup_pipe_control(dev);
}

int
i915_gem_entervt_ioctl(struct drm_device *dev, void *data,
		       struct drm_file *file_priv)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	int ret;

	if (drm_core_check_feature(dev, DRIVER_MODESET))
		return 0;

	if (atomic_read(&dev_priv->mm.wedged)) {
		DRM_ERROR("Reenabling wedged hardware, good luck\n");
		atomic_set(&dev_priv->mm.wedged, 0);
	}

	mutex_lock(&dev->struct_mutex);
	dev_priv->mm.suspended = 0;

	ret = i915_gem_init_ringbuffer(dev);
	if (ret != 0) {
		mutex_unlock(&dev->struct_mutex);
		return ret;
	}

	spin_lock(&dev_priv->mm.active_list_lock);
	BUG_ON(!list_empty(&dev_priv->render_ring.active_list));
	spin_unlock(&dev_priv->mm.active_list_lock);

	BUG_ON(!list_empty(&dev_priv->mm.flushing_list));
	BUG_ON(!list_empty(&dev_priv->mm.inactive_list));
	BUG_ON(!list_empty(&dev_priv->render_ring.request_list));
	mutex_unlock(&dev->struct_mutex);

	drm_irq_install(dev);

	return 0;
}

int
i915_gem_leavevt_ioctl(struct drm_device *dev, void *data,
		       struct drm_file *file_priv)
{
	if (drm_core_check_feature(dev, DRIVER_MODESET))
		return 0;

	drm_irq_uninstall(dev);
	return i915_gem_idle(dev);
}

void
i915_gem_lastclose(struct drm_device *dev)
{
	int ret;

	if (drm_core_check_feature(dev, DRIVER_MODESET))
		return;

	ret = i915_gem_idle(dev);
	if (ret)
		DRM_ERROR("failed to idle hardware: %d\n", ret);
}

void
i915_gem_load(struct drm_device *dev)
{
	int i;
	drm_i915_private_t *dev_priv = dev->dev_private;

	spin_lock_init(&dev_priv->mm.active_list_lock);
	INIT_LIST_HEAD(&dev_priv->mm.flushing_list);
	INIT_LIST_HEAD(&dev_priv->mm.gpu_write_list);
	INIT_LIST_HEAD(&dev_priv->mm.inactive_list);
	INIT_LIST_HEAD(&dev_priv->mm.fence_list);
	INIT_LIST_HEAD(&dev_priv->render_ring.active_list);
	INIT_LIST_HEAD(&dev_priv->render_ring.request_list);
	for (i = 0; i < 16; i++)
		INIT_LIST_HEAD(&dev_priv->fence_regs[i].lru_list);
	INIT_DELAYED_WORK(&dev_priv->mm.retire_work,
			  i915_gem_retire_work_handler);
	spin_lock(&shrink_list_lock);
	list_add(&dev_priv->mm.shrink_list, &shrink_list);
	spin_unlock(&shrink_list_lock);

	/* Old X drivers will take 0-2 for front, back, depth buffers */
	if (!drm_core_check_feature(dev, DRIVER_MODESET))
		dev_priv->fence_reg_start = 3;

	if (IS_I965G(dev) || IS_I945G(dev) || IS_I945GM(dev) || IS_G33(dev))
		dev_priv->num_fence_regs = 16;
	else
		dev_priv->num_fence_regs = 8;

	/* Initialize fence registers to zero */
	if (IS_I965G(dev)) {
		for (i = 0; i < 16; i++)
			I915_WRITE64(FENCE_REG_965_0 + (i * 8), 0);
	} else {
		for (i = 0; i < 8; i++)
			I915_WRITE(FENCE_REG_830_0 + (i * 4), 0);
		if (IS_I945G(dev) || IS_I945GM(dev) || IS_G33(dev))
			for (i = 0; i < 8; i++)
				I915_WRITE(FENCE_REG_945_8 + (i * 4), 0);
	}
	i915_gem_detect_bit_6_swizzle(dev);
	init_waitqueue_head(&dev_priv->pending_flip_queue);
}
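
/*
 * Fence register layout, as reflected above: 965-class and 945/G33
 * chipsets expose 16 fences, older parts 8, with 945/G33 splitting
 * theirs across two register banks (FENCE_REG_830_0 and
 * FENCE_REG_945_8). Under UMS the first three fences are reserved for
 * the old X driver's front/back/depth buffers.
 */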

/*
 * Create a physically contiguous memory object for this object
 * e.g. for cursor + overlay regs
 */
int i915_gem_init_phys_object(struct drm_device *dev,
			      int id, int size)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	struct drm_i915_gem_phys_object *phys_obj;
	int ret;

	if (dev_priv->mm.phys_objs[id - 1] || !size)
		return 0;

	phys_obj = kzalloc(sizeof(struct drm_i915_gem_phys_object), GFP_KERNEL);
	if (!phys_obj)
		return -ENOMEM;

	phys_obj->id = id;

	phys_obj->handle = drm_pci_alloc(dev, size, 0);
	if (!phys_obj->handle) {
		ret = -ENOMEM;
		goto kfree_obj;
	}
#ifdef CONFIG_X86
	set_memory_wc((unsigned long)phys_obj->handle->vaddr, phys_obj->handle->size / PAGE_SIZE);
#endif

	dev_priv->mm.phys_objs[id - 1] = phys_obj;

	return 0;

kfree_obj:
	kfree(phys_obj);
	return ret;
}

void i915_gem_free_phys_object(struct drm_device *dev, int id)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	struct drm_i915_gem_phys_object *phys_obj;

	if (!dev_priv->mm.phys_objs[id - 1])
		return;

	phys_obj = dev_priv->mm.phys_objs[id - 1];
	if (phys_obj->cur_obj)
		i915_gem_detach_phys_object(dev, phys_obj->cur_obj);

#ifdef CONFIG_X86
	set_memory_wb((unsigned long)phys_obj->handle->vaddr, phys_obj->handle->size / PAGE_SIZE);
#endif
	drm_pci_free(dev, phys_obj->handle);
	kfree(phys_obj);
	dev_priv->mm.phys_objs[id - 1] = NULL;
}

void i915_gem_free_all_phys_object(struct drm_device *dev)
{
	int i;

	for (i = I915_GEM_PHYS_CURSOR_0; i <= I915_MAX_PHYS_OBJECT; i++)
		i915_gem_free_phys_object(dev, i);
}

void i915_gem_detach_phys_object(struct drm_device *dev,
				 struct drm_gem_object *obj)
{
	struct drm_i915_gem_object *obj_priv;
	int i;
	int ret;
	int page_count;

	obj_priv = to_intel_bo(obj);
	if (!obj_priv->phys_obj)
		return;

	ret = i915_gem_object_get_pages(obj, 0);
	if (ret)
		goto out;

	page_count = obj->size / PAGE_SIZE;

	for (i = 0; i < page_count; i++) {
		char *dst = kmap_atomic(obj_priv->pages[i], KM_USER0);
		char *src = obj_priv->phys_obj->handle->vaddr + (i * PAGE_SIZE);

		memcpy(dst, src, PAGE_SIZE);
		kunmap_atomic(dst, KM_USER0);
	}
	drm_clflush_pages(obj_priv->pages, page_count);
	drm_agp_chipset_flush(dev);

	i915_gem_object_put_pages(obj);
out:
	obj_priv->phys_obj->cur_obj = NULL;
	obj_priv->phys_obj = NULL;
}

int
i915_gem_attach_phys_object(struct drm_device *dev,
			    struct drm_gem_object *obj, int id)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	struct drm_i915_gem_object *obj_priv;
	int ret = 0;
	int page_count;
	int i;

	if (id > I915_MAX_PHYS_OBJECT)
		return -EINVAL;

	obj_priv = to_intel_bo(obj);

	if (obj_priv->phys_obj) {
		if (obj_priv->phys_obj->id == id)
			return 0;
		i915_gem_detach_phys_object(dev, obj);
	}

	/* create a new object */
	if (!dev_priv->mm.phys_objs[id - 1]) {
		ret = i915_gem_init_phys_object(dev, id,
						obj->size);
		if (ret) {
			DRM_ERROR("failed to init phys object %d size: %zu\n", id, obj->size);
			goto out;
		}
	}

	/* bind to the object */
	obj_priv->phys_obj = dev_priv->mm.phys_objs[id - 1];
	obj_priv->phys_obj->cur_obj = obj;

	ret = i915_gem_object_get_pages(obj, 0);
	if (ret) {
		DRM_ERROR("failed to get page list\n");
		goto out;
	}

	page_count = obj->size / PAGE_SIZE;

	for (i = 0; i < page_count; i++) {
		char *src = kmap_atomic(obj_priv->pages[i], KM_USER0);
		char *dst = obj_priv->phys_obj->handle->vaddr + (i * PAGE_SIZE);

		memcpy(dst, src, PAGE_SIZE);
		kunmap_atomic(src, KM_USER0);
	}

	i915_gem_object_put_pages(obj);

	return 0;
out:
	return ret;
}

static int
i915_gem_phys_pwrite(struct drm_device *dev, struct drm_gem_object *obj,
		     struct drm_i915_gem_pwrite *args,
		     struct drm_file *file_priv)
{
	struct drm_i915_gem_object *obj_priv = to_intel_bo(obj);
	void *obj_addr;
	int ret;
	char __user *user_data;

	user_data = (char __user *) (uintptr_t) args->data_ptr;
	obj_addr = obj_priv->phys_obj->handle->vaddr + args->offset;

	DRM_DEBUG_DRIVER("obj_addr %p, %lld\n", obj_addr, args->size);
	ret = copy_from_user(obj_addr, user_data, args->size);
	if (ret)
		return -EFAULT;

	drm_agp_chipset_flush(dev);
	return 0;
}
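
/*
 * Phys objects back the few buffers that some chipsets must read by
 * physical address (cursor images, overlay registers), so pwrite copies
 * straight into the contiguous drm_pci_alloc() block; the object's
 * shmem pages only hold a shadow copy that attach/detach sync in and
 * out.
 */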

void i915_gem_release(struct drm_device *dev, struct drm_file *file_priv)
{
	struct drm_i915_file_private *i915_file_priv = file_priv->driver_priv;

	/* Clean up our request list when the client is going away, so that
	 * later retire_requests won't dereference our soon-to-be-gone
	 * file_priv.
	 */
	mutex_lock(&dev->struct_mutex);
	while (!list_empty(&i915_file_priv->mm.request_list))
		list_del_init(i915_file_priv->mm.request_list.next);
	mutex_unlock(&dev->struct_mutex);
}

static int
i915_gpu_is_active(struct drm_device *dev)
{
	drm_i915_private_t *dev_priv = dev->dev_private;
	int lists_empty;

	spin_lock(&dev_priv->mm.active_list_lock);
	lists_empty = list_empty(&dev_priv->mm.flushing_list) &&
		      list_empty(&dev_priv->render_ring.active_list);
	spin_unlock(&dev_priv->mm.active_list_lock);

	return !lists_empty;
}

static int
i915_gem_shrink(int nr_to_scan, gfp_t gfp_mask)
{
	drm_i915_private_t *dev_priv, *next_dev;
	struct drm_i915_gem_object *obj_priv, *next_obj;
	int cnt = 0;
	int would_deadlock = 1;

	/* "fast-path" to count number of available objects */
	if (nr_to_scan == 0) {
		spin_lock(&shrink_list_lock);
		list_for_each_entry(dev_priv, &shrink_list, mm.shrink_list) {
			struct drm_device *dev = dev_priv->dev;

			if (mutex_trylock(&dev->struct_mutex)) {
				list_for_each_entry(obj_priv,
						    &dev_priv->mm.inactive_list,
						    list)
					cnt++;
				mutex_unlock(&dev->struct_mutex);
			}
		}
		spin_unlock(&shrink_list_lock);

		return (cnt / 100) * sysctl_vfs_cache_pressure;
	}

	spin_lock(&shrink_list_lock);

rescan:
	/* first scan for clean buffers */
	list_for_each_entry_safe(dev_priv, next_dev,
				 &shrink_list, mm.shrink_list) {
		struct drm_device *dev = dev_priv->dev;

		if (!mutex_trylock(&dev->struct_mutex))
			continue;

		spin_unlock(&shrink_list_lock);
		i915_gem_retire_requests(dev, &dev_priv->render_ring);

		list_for_each_entry_safe(obj_priv, next_obj,
					 &dev_priv->mm.inactive_list,
					 list) {
			if (i915_gem_object_is_purgeable(obj_priv)) {
				i915_gem_object_unbind(&obj_priv->base);
				if (--nr_to_scan <= 0)
					break;
			}
		}

		spin_lock(&shrink_list_lock);
		mutex_unlock(&dev->struct_mutex);

		would_deadlock = 0;

		if (nr_to_scan <= 0)
			break;
	}

	/* second pass, evict/count anything still on the inactive list */
	list_for_each_entry_safe(dev_priv, next_dev,
				 &shrink_list, mm.shrink_list) {
		struct drm_device *dev = dev_priv->dev;

		if (!mutex_trylock(&dev->struct_mutex))
			continue;

		spin_unlock(&shrink_list_lock);

		list_for_each_entry_safe(obj_priv, next_obj,
					 &dev_priv->mm.inactive_list,
					 list) {
			if (nr_to_scan > 0) {
				i915_gem_object_unbind(&obj_priv->base);
				nr_to_scan--;
			} else
				cnt++;
		}

		spin_lock(&shrink_list_lock);
		mutex_unlock(&dev->struct_mutex);

		would_deadlock = 0;
	}

	if (nr_to_scan) {
		int active = 0;

		/*
		 * We are desperate for pages, so as a last resort, wait
		 * for the GPU to finish and discard whatever we can.
		 * This has a dramatic impact to reduce the number of
		 * OOM-killer events whilst running the GPU aggressively.
		 */
		list_for_each_entry(dev_priv, &shrink_list, mm.shrink_list) {
			struct drm_device *dev = dev_priv->dev;

			if (!mutex_trylock(&dev->struct_mutex))
				continue;

			spin_unlock(&shrink_list_lock);

			if (i915_gpu_is_active(dev)) {
				i915_gpu_idle(dev);
				active++;
			}

			spin_lock(&shrink_list_lock);
			mutex_unlock(&dev->struct_mutex);
		}

		if (active)
			goto rescan;
	}

	spin_unlock(&shrink_list_lock);

	if (would_deadlock)
		return -1;
	else if (cnt > 0)
		return (cnt / 100) * sysctl_vfs_cache_pressure;
	else
		return 0;
}
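
/*
 * This follows the old shrinker contract: a call with nr_to_scan == 0
 * only asks for an estimate of freeable objects, a non-zero nr_to_scan
 * asks for that many objects to be evicted, and -1 reports that the
 * required locks could not be taken (shrinking now would risk
 * deadlock). The count is scaled by sysctl_vfs_cache_pressure, like the
 * VFS caches.
 */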

static struct shrinker shrinker = {
	.shrink = i915_gem_shrink,
	.seeks = DEFAULT_SEEKS,
};

__init void
i915_gem_shrinker_init(void)
{
	register_shrinker(&shrinker);
}

__exit void
i915_gem_shrinker_exit(void)
{
	unregister_shrinker(&shrinker);
}
5023}