blob: d409b26607f320dd8a1efdb76105e7fc4a99803d [file] [log] [blame]
Ben Skeggs6ee73862009-12-11 19:24:15 +10001/*
2 * Copyright 2007 Dave Airlied
3 * All Rights Reserved.
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * VA LINUX SYSTEMS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
23 */
24/*
25 * Authors: Dave Airlied <airlied@linux.ie>
26 * Ben Skeggs <darktama@iinet.net.au>
27 * Jeremy Kolb <jkolb@brandeis.edu>
28 */
29
Ben Skeggsfdb751e2014-08-10 04:10:23 +100030#include <linux/dma-mapping.h>
Chris Metcalf3e2b7562013-02-01 13:44:33 -050031#include <linux/swiotlb.h>
Ben Skeggs6ee73862009-12-11 19:24:15 +100032
Ben Skeggsebb945a2012-07-20 08:17:34 +100033#include "nouveau_drm.h"
Ben Skeggs6ee73862009-12-11 19:24:15 +100034#include "nouveau_dma.h"
Ben Skeggsd375e7d52012-04-30 13:30:00 +100035#include "nouveau_fence.h"
Ben Skeggs6ee73862009-12-11 19:24:15 +100036
Ben Skeggsebb945a2012-07-20 08:17:34 +100037#include "nouveau_bo.h"
38#include "nouveau_ttm.h"
39#include "nouveau_gem.h"
Maarten Maathuisa5106042009-12-26 21:46:36 +010040
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100041/*
42 * NV10-NV40 tiling helpers
43 */
44
45static void
Ben Skeggsebb945a2012-07-20 08:17:34 +100046nv10_bo_update_tile_region(struct drm_device *dev, struct nouveau_drm_tile *reg,
47 u32 addr, u32 size, u32 pitch, u32 flags)
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100048{
Ben Skeggs77145f12012-07-31 16:16:21 +100049 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggsebb945a2012-07-20 08:17:34 +100050 int i = reg - drm->tile.reg;
Ben Skeggs967e7bd2014-08-10 04:10:22 +100051 struct nouveau_fb *pfb = nvkm_fb(&drm->device);
Ben Skeggsebb945a2012-07-20 08:17:34 +100052 struct nouveau_fb_tile *tile = &pfb->tile.region[i];
53 struct nouveau_engine *engine;
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100054
Ben Skeggsebb945a2012-07-20 08:17:34 +100055 nouveau_fence_unref(&reg->fence);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100056
57 if (tile->pitch)
Ben Skeggsebb945a2012-07-20 08:17:34 +100058 pfb->tile.fini(pfb, i, tile);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100059
60 if (pitch)
Ben Skeggsebb945a2012-07-20 08:17:34 +100061 pfb->tile.init(pfb, i, addr, size, pitch, flags, tile);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100062
Ben Skeggsebb945a2012-07-20 08:17:34 +100063 pfb->tile.prog(pfb, i, tile);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100064
Ben Skeggsebb945a2012-07-20 08:17:34 +100065 if ((engine = nouveau_engine(pfb, NVDEV_ENGINE_GR)))
66 engine->tile_prog(engine, i);
67 if ((engine = nouveau_engine(pfb, NVDEV_ENGINE_MPEG)))
68 engine->tile_prog(engine, i);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100069}
70
Ben Skeggsebb945a2012-07-20 08:17:34 +100071static struct nouveau_drm_tile *
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100072nv10_bo_get_tile_region(struct drm_device *dev, int i)
73{
Ben Skeggs77145f12012-07-31 16:16:21 +100074 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggsebb945a2012-07-20 08:17:34 +100075 struct nouveau_drm_tile *tile = &drm->tile.reg[i];
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100076
Ben Skeggsebb945a2012-07-20 08:17:34 +100077 spin_lock(&drm->tile.lock);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100078
79 if (!tile->used &&
80 (!tile->fence || nouveau_fence_done(tile->fence)))
81 tile->used = true;
82 else
83 tile = NULL;
84
Ben Skeggsebb945a2012-07-20 08:17:34 +100085 spin_unlock(&drm->tile.lock);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100086 return tile;
87}
88
89static void
Ben Skeggsebb945a2012-07-20 08:17:34 +100090nv10_bo_put_tile_region(struct drm_device *dev, struct nouveau_drm_tile *tile,
Maarten Lankhorstf2c24b82014-04-02 17:14:48 +020091 struct fence *fence)
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100092{
Ben Skeggs77145f12012-07-31 16:16:21 +100093 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100094
95 if (tile) {
Ben Skeggsebb945a2012-07-20 08:17:34 +100096 spin_lock(&drm->tile.lock);
Maarten Lankhorst809e9442014-04-09 16:19:30 +020097 tile->fence = (struct nouveau_fence *)fence_get(fence);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100098 tile->used = false;
Ben Skeggsebb945a2012-07-20 08:17:34 +100099 spin_unlock(&drm->tile.lock);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000100 }
101}
102
Ben Skeggsebb945a2012-07-20 08:17:34 +1000103static struct nouveau_drm_tile *
104nv10_bo_set_tiling(struct drm_device *dev, u32 addr,
105 u32 size, u32 pitch, u32 flags)
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000106{
Ben Skeggs77145f12012-07-31 16:16:21 +1000107 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000108 struct nouveau_fb *pfb = nvkm_fb(&drm->device);
Ben Skeggsebb945a2012-07-20 08:17:34 +1000109 struct nouveau_drm_tile *tile, *found = NULL;
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000110 int i;
111
Ben Skeggsebb945a2012-07-20 08:17:34 +1000112 for (i = 0; i < pfb->tile.regions; i++) {
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000113 tile = nv10_bo_get_tile_region(dev, i);
114
115 if (pitch && !found) {
116 found = tile;
117 continue;
118
Ben Skeggsebb945a2012-07-20 08:17:34 +1000119 } else if (tile && pfb->tile.region[i].pitch) {
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000120 /* Kill an unused tile region. */
121 nv10_bo_update_tile_region(dev, tile, 0, 0, 0, 0);
122 }
123
124 nv10_bo_put_tile_region(dev, tile, NULL);
125 }
126
127 if (found)
128 nv10_bo_update_tile_region(dev, found, addr, size,
129 pitch, flags);
130 return found;
131}
132
Ben Skeggs6ee73862009-12-11 19:24:15 +1000133static void
134nouveau_bo_del_ttm(struct ttm_buffer_object *bo)
135{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000136 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
137 struct drm_device *dev = drm->dev;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000138 struct nouveau_bo *nvbo = nouveau_bo(bo);
139
David Herrmann55fb74a2013-10-02 10:15:17 +0200140 if (unlikely(nvbo->gem.filp))
Ben Skeggs6ee73862009-12-11 19:24:15 +1000141 DRM_ERROR("bo %p still attached to GEM object\n", bo);
Maarten Lankhorst4f385592013-07-07 10:37:35 +0200142 WARN_ON(nvbo->pin_refcnt > 0);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000143 nv10_bo_put_tile_region(dev, nvbo->tile, NULL);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000144 kfree(nvbo);
145}
146
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100147static void
Ben Skeggsdb5c8e22011-02-10 13:41:01 +1000148nouveau_bo_fixup_align(struct nouveau_bo *nvbo, u32 flags,
Ben Skeggsf91bac52011-06-06 14:15:46 +1000149 int *align, int *size)
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100150{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000151 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000152 struct nvif_device *device = &drm->device;
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100153
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000154 if (device->info.family < NV_DEVICE_INFO_V0_TESLA) {
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000155 if (nvbo->tile_mode) {
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000156 if (device->info.chipset >= 0x40) {
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100157 *align = 65536;
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000158 *size = roundup(*size, 64 * nvbo->tile_mode);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100159
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000160 } else if (device->info.chipset >= 0x30) {
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100161 *align = 32768;
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000162 *size = roundup(*size, 64 * nvbo->tile_mode);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100163
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000164 } else if (device->info.chipset >= 0x20) {
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100165 *align = 16384;
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000166 *size = roundup(*size, 64 * nvbo->tile_mode);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100167
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000168 } else if (device->info.chipset >= 0x10) {
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100169 *align = 16384;
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000170 *size = roundup(*size, 32 * nvbo->tile_mode);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100171 }
172 }
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000173 } else {
Ben Skeggsf91bac52011-06-06 14:15:46 +1000174 *size = roundup(*size, (1 << nvbo->page_shift));
175 *align = max((1 << nvbo->page_shift), *align);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100176 }
177
Maarten Maathuis1c7059e2009-12-25 18:51:17 +0100178 *size = roundup(*size, PAGE_SIZE);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100179}
180
Ben Skeggs6ee73862009-12-11 19:24:15 +1000181int
Ben Skeggs7375c952011-06-07 14:21:29 +1000182nouveau_bo_new(struct drm_device *dev, int size, int align,
183 uint32_t flags, uint32_t tile_mode, uint32_t tile_flags,
Maarten Lankhorstbb6178b2014-01-09 11:03:15 +0100184 struct sg_table *sg, struct reservation_object *robj,
Ben Skeggs7375c952011-06-07 14:21:29 +1000185 struct nouveau_bo **pnvbo)
Ben Skeggs6ee73862009-12-11 19:24:15 +1000186{
Ben Skeggs77145f12012-07-31 16:16:21 +1000187 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000188 struct nouveau_bo *nvbo;
Jerome Glisse57de4ba2011-11-11 15:42:57 -0500189 size_t acc_size;
Ben Skeggsf91bac52011-06-06 14:15:46 +1000190 int ret;
Dave Airlie22b33e82012-04-02 11:53:06 +0100191 int type = ttm_bo_type_device;
Maarten Lankhorst35095f72013-07-27 10:17:12 +0200192 int lpg_shift = 12;
193 int max_size;
194
Ben Skeggs3ee6f5b2014-08-10 04:10:20 +1000195 if (drm->client.vm)
196 lpg_shift = drm->client.vm->vmm->lpg_shift;
Maarten Lankhorst35095f72013-07-27 10:17:12 +0200197 max_size = INT_MAX & ~((1 << lpg_shift) - 1);
Maarten Lankhorst0108bc82013-07-07 10:40:19 +0200198
199 if (size <= 0 || size > max_size) {
Ben Skeggsfa2bade2014-08-10 04:10:22 +1000200 NV_WARN(drm, "skipped size %x\n", (u32)size);
Maarten Lankhorst0108bc82013-07-07 10:40:19 +0200201 return -EINVAL;
202 }
Dave Airlie22b33e82012-04-02 11:53:06 +0100203
204 if (sg)
205 type = ttm_bo_type_sg;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000206
207 nvbo = kzalloc(sizeof(struct nouveau_bo), GFP_KERNEL);
208 if (!nvbo)
209 return -ENOMEM;
210 INIT_LIST_HEAD(&nvbo->head);
211 INIT_LIST_HEAD(&nvbo->entry);
Ben Skeggsfd2871a2011-06-06 14:07:04 +1000212 INIT_LIST_HEAD(&nvbo->vma_list);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000213 nvbo->tile_mode = tile_mode;
214 nvbo->tile_flags = tile_flags;
Ben Skeggsebb945a2012-07-20 08:17:34 +1000215 nvbo->bo.bdev = &drm->ttm.bdev;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000216
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900217 if (!nv_device_is_cpu_coherent(nvkm_device(&drm->device)))
218 nvbo->force_coherent = flags & TTM_PL_FLAG_UNCACHED;
219
Ben Skeggsf91bac52011-06-06 14:15:46 +1000220 nvbo->page_shift = 12;
Ben Skeggs3ee6f5b2014-08-10 04:10:20 +1000221 if (drm->client.vm) {
Ben Skeggsf91bac52011-06-06 14:15:46 +1000222 if (!(flags & TTM_PL_FLAG_TT) && size > 256 * 1024)
Ben Skeggs3ee6f5b2014-08-10 04:10:20 +1000223 nvbo->page_shift = drm->client.vm->vmm->lpg_shift;
Ben Skeggsf91bac52011-06-06 14:15:46 +1000224 }
225
226 nouveau_bo_fixup_align(nvbo, flags, &align, &size);
Ben Skeggsfd2871a2011-06-06 14:07:04 +1000227 nvbo->bo.mem.num_pages = size >> PAGE_SHIFT;
228 nouveau_bo_placement_set(nvbo, flags, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000229
Ben Skeggsebb945a2012-07-20 08:17:34 +1000230 acc_size = ttm_bo_dma_acc_size(&drm->ttm.bdev, size,
Jerome Glisse57de4ba2011-11-11 15:42:57 -0500231 sizeof(struct nouveau_bo));
232
Ben Skeggsebb945a2012-07-20 08:17:34 +1000233 ret = ttm_bo_init(&drm->ttm.bdev, &nvbo->bo, size,
Dave Airlie22b33e82012-04-02 11:53:06 +0100234 type, &nvbo->placement,
Marcin Slusarz0b91c4a2012-11-06 21:49:51 +0000235 align >> PAGE_SHIFT, false, NULL, acc_size, sg,
Maarten Lankhorstbb6178b2014-01-09 11:03:15 +0100236 robj, nouveau_bo_del_ttm);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000237 if (ret) {
238 /* ttm will call nouveau_bo_del_ttm if it fails.. */
239 return ret;
240 }
241
Ben Skeggs6ee73862009-12-11 19:24:15 +1000242 *pnvbo = nvbo;
243 return 0;
244}
245
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100246static void
Christian Königf1217ed2014-08-27 13:16:04 +0200247set_placement_list(struct ttm_place *pl, unsigned *n, uint32_t type, uint32_t flags)
Ben Skeggs6ee73862009-12-11 19:24:15 +1000248{
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100249 *n = 0;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000250
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100251 if (type & TTM_PL_FLAG_VRAM)
Christian Königf1217ed2014-08-27 13:16:04 +0200252 pl[(*n)++].flags = TTM_PL_FLAG_VRAM | flags;
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100253 if (type & TTM_PL_FLAG_TT)
Christian Königf1217ed2014-08-27 13:16:04 +0200254 pl[(*n)++].flags = TTM_PL_FLAG_TT | flags;
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100255 if (type & TTM_PL_FLAG_SYSTEM)
Christian Königf1217ed2014-08-27 13:16:04 +0200256 pl[(*n)++].flags = TTM_PL_FLAG_SYSTEM | flags;
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100257}
Ben Skeggs37cb3e082009-12-16 16:22:42 +1000258
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200259static void
260set_placement_range(struct nouveau_bo *nvbo, uint32_t type)
261{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000262 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggsf392ec42014-08-10 04:10:28 +1000263 u32 vram_pages = drm->device.info.ram_size >> PAGE_SHIFT;
Christian Königf1217ed2014-08-27 13:16:04 +0200264 unsigned i, fpfn, lpfn;
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200265
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000266 if (drm->device.info.family == NV_DEVICE_INFO_V0_CELSIUS &&
Francisco Jerez812f2192011-02-03 01:49:33 +0100267 nvbo->tile_mode && (type & TTM_PL_FLAG_VRAM) &&
Francisco Jerez4beb1162011-11-06 21:21:28 +0100268 nvbo->bo.mem.num_pages < vram_pages / 4) {
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200269 /*
270 * Make sure that the color and depth buffers are handled
271 * by independent memory controller units. Up to a 9x
272 * speed up when alpha-blending and depth-test are enabled
273 * at the same time.
274 */
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200275 if (nvbo->tile_flags & NOUVEAU_GEM_TILE_ZETA) {
Christian Königf1217ed2014-08-27 13:16:04 +0200276 fpfn = vram_pages / 2;
277 lpfn = ~0;
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200278 } else {
Christian Königf1217ed2014-08-27 13:16:04 +0200279 fpfn = 0;
280 lpfn = vram_pages / 2;
281 }
282 for (i = 0; i < nvbo->placement.num_placement; ++i) {
283 nvbo->placements[i].fpfn = fpfn;
284 nvbo->placements[i].lpfn = lpfn;
285 }
286 for (i = 0; i < nvbo->placement.num_busy_placement; ++i) {
287 nvbo->busy_placements[i].fpfn = fpfn;
288 nvbo->busy_placements[i].lpfn = lpfn;
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200289 }
290 }
291}
292
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100293void
294nouveau_bo_placement_set(struct nouveau_bo *nvbo, uint32_t type, uint32_t busy)
295{
296 struct ttm_placement *pl = &nvbo->placement;
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900297 uint32_t flags = (nvbo->force_coherent ? TTM_PL_FLAG_UNCACHED :
298 TTM_PL_MASK_CACHING) |
299 (nvbo->pin_refcnt ? TTM_PL_FLAG_NO_EVICT : 0);
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100300
301 pl->placement = nvbo->placements;
302 set_placement_list(nvbo->placements, &pl->num_placement,
303 type, flags);
304
305 pl->busy_placement = nvbo->busy_placements;
306 set_placement_list(nvbo->busy_placements, &pl->num_busy_placement,
307 type | busy, flags);
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200308
309 set_placement_range(nvbo, type);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000310}
311
312int
313nouveau_bo_pin(struct nouveau_bo *nvbo, uint32_t memtype)
314{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000315 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000316 struct ttm_buffer_object *bo = &nvbo->bo;
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100317 int ret;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000318
Thierry Redingee3939e2014-07-21 13:15:51 +0200319 ret = ttm_bo_reserve(bo, false, false, false, NULL);
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100320 if (ret)
321 goto out;
322
Ben Skeggs6ee73862009-12-11 19:24:15 +1000323 if (nvbo->pin_refcnt && !(memtype & (1 << bo->mem.mem_type))) {
Ben Skeggsebb945a2012-07-20 08:17:34 +1000324 NV_ERROR(drm, "bo %p pinned elsewhere: 0x%08x vs 0x%08x\n", bo,
Ben Skeggs6ee73862009-12-11 19:24:15 +1000325 1 << bo->mem.mem_type, memtype);
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100326 ret = -EINVAL;
327 goto out;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000328 }
329
Alexandre Courbot5be5a152014-10-27 18:11:52 +0900330 if (nvbo->pin_refcnt)
331 goto ref_inc;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000332
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100333 nouveau_bo_placement_set(nvbo, memtype, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000334
Maarten Lankhorst97a875c2012-11-28 11:25:44 +0000335 ret = nouveau_bo_validate(nvbo, false, false);
Ben Skeggs6aac6ce2014-11-06 14:34:31 +1000336 if (ret)
337 goto out;
338
339 switch (bo->mem.mem_type) {
340 case TTM_PL_VRAM:
341 drm->gem.vram_available -= bo->mem.size;
342 break;
343 case TTM_PL_TT:
344 drm->gem.gart_available -= bo->mem.size;
345 break;
346 default:
347 break;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000348 }
Alexandre Courbot5be5a152014-10-27 18:11:52 +0900349
350ref_inc:
351 nvbo->pin_refcnt++;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000352out:
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100353 ttm_bo_unreserve(bo);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000354 return ret;
355}
356
357int
358nouveau_bo_unpin(struct nouveau_bo *nvbo)
359{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000360 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000361 struct ttm_buffer_object *bo = &nvbo->bo;
Maarten Lankhorst4f385592013-07-07 10:37:35 +0200362 int ret, ref;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000363
Thierry Redingee3939e2014-07-21 13:15:51 +0200364 ret = ttm_bo_reserve(bo, false, false, false, NULL);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000365 if (ret)
366 return ret;
367
Maarten Lankhorst4f385592013-07-07 10:37:35 +0200368 ref = --nvbo->pin_refcnt;
369 WARN_ON_ONCE(ref < 0);
370 if (ref)
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100371 goto out;
372
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100373 nouveau_bo_placement_set(nvbo, bo->mem.placement, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000374
Maarten Lankhorst97a875c2012-11-28 11:25:44 +0000375 ret = nouveau_bo_validate(nvbo, false, false);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000376 if (ret == 0) {
377 switch (bo->mem.mem_type) {
378 case TTM_PL_VRAM:
Ben Skeggsebb945a2012-07-20 08:17:34 +1000379 drm->gem.vram_available += bo->mem.size;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000380 break;
381 case TTM_PL_TT:
Ben Skeggsebb945a2012-07-20 08:17:34 +1000382 drm->gem.gart_available += bo->mem.size;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000383 break;
384 default:
385 break;
386 }
387 }
388
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100389out:
Ben Skeggs6ee73862009-12-11 19:24:15 +1000390 ttm_bo_unreserve(bo);
391 return ret;
392}
393
394int
395nouveau_bo_map(struct nouveau_bo *nvbo)
396{
397 int ret;
398
Thierry Redingee3939e2014-07-21 13:15:51 +0200399 ret = ttm_bo_reserve(&nvbo->bo, false, false, false, NULL);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000400 if (ret)
401 return ret;
402
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900403 /*
404 * TTM buffers allocated using the DMA API already have a mapping, let's
405 * use it instead.
406 */
407 if (!nvbo->force_coherent)
408 ret = ttm_bo_kmap(&nvbo->bo, 0, nvbo->bo.mem.num_pages,
409 &nvbo->kmap);
410
Ben Skeggs6ee73862009-12-11 19:24:15 +1000411 ttm_bo_unreserve(&nvbo->bo);
412 return ret;
413}
414
415void
416nouveau_bo_unmap(struct nouveau_bo *nvbo)
417{
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900418 if (!nvbo)
419 return;
420
421 /*
422 * TTM buffers allocated using the DMA API already had a coherent
423 * mapping which we used, no need to unmap.
424 */
425 if (!nvbo->force_coherent)
Ben Skeggs9d59e8a2010-08-27 13:04:41 +1000426 ttm_bo_kunmap(&nvbo->kmap);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000427}
428
Alexandre Courbotb22870b2014-10-27 18:49:19 +0900429void
430nouveau_bo_sync_for_device(struct nouveau_bo *nvbo)
431{
432 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
433 struct nouveau_device *device = nvkm_device(&drm->device);
434 struct ttm_dma_tt *ttm_dma = (struct ttm_dma_tt *)nvbo->bo.ttm;
435 int i;
436
437 if (!ttm_dma)
438 return;
439
440 /* Don't waste time looping if the object is coherent */
441 if (nvbo->force_coherent)
442 return;
443
444 for (i = 0; i < ttm_dma->ttm.num_pages; i++)
445 dma_sync_single_for_device(nv_device_base(device),
446 ttm_dma->dma_address[i], PAGE_SIZE, DMA_TO_DEVICE);
447}
448
449void
450nouveau_bo_sync_for_cpu(struct nouveau_bo *nvbo)
451{
452 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
453 struct nouveau_device *device = nvkm_device(&drm->device);
454 struct ttm_dma_tt *ttm_dma = (struct ttm_dma_tt *)nvbo->bo.ttm;
455 int i;
456
457 if (!ttm_dma)
458 return;
459
460 /* Don't waste time looping if the object is coherent */
461 if (nvbo->force_coherent)
462 return;
463
464 for (i = 0; i < ttm_dma->ttm.num_pages; i++)
465 dma_sync_single_for_cpu(nv_device_base(device),
466 ttm_dma->dma_address[i], PAGE_SIZE, DMA_FROM_DEVICE);
467}
468
Ben Skeggs7a45d762010-11-22 08:50:27 +1000469int
470nouveau_bo_validate(struct nouveau_bo *nvbo, bool interruptible,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +0000471 bool no_wait_gpu)
Ben Skeggs7a45d762010-11-22 08:50:27 +1000472{
473 int ret;
474
Maarten Lankhorst97a875c2012-11-28 11:25:44 +0000475 ret = ttm_bo_validate(&nvbo->bo, &nvbo->placement,
476 interruptible, no_wait_gpu);
Ben Skeggs7a45d762010-11-22 08:50:27 +1000477 if (ret)
478 return ret;
479
Alexandre Courbotb22870b2014-10-27 18:49:19 +0900480 nouveau_bo_sync_for_device(nvbo);
481
Ben Skeggs7a45d762010-11-22 08:50:27 +1000482 return 0;
483}
484
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900485static inline void *
486_nouveau_bo_mem_index(struct nouveau_bo *nvbo, unsigned index, void *mem, u8 sz)
487{
488 struct ttm_dma_tt *dma_tt;
489 u8 *m = mem;
490
491 index *= sz;
492
493 if (m) {
494 /* kmap'd address, return the corresponding offset */
495 m += index;
496 } else {
497 /* DMA-API mapping, lookup the right address */
498 dma_tt = (struct ttm_dma_tt *)nvbo->bo.ttm;
499 m = dma_tt->cpu_address[index / PAGE_SIZE];
500 m += index % PAGE_SIZE;
501 }
502
503 return m;
504}
505#define nouveau_bo_mem_index(o, i, m) _nouveau_bo_mem_index(o, i, m, sizeof(*m))
506
Ben Skeggs6ee73862009-12-11 19:24:15 +1000507u16
508nouveau_bo_rd16(struct nouveau_bo *nvbo, unsigned index)
509{
510 bool is_iomem;
511 u16 *mem = ttm_kmap_obj_virtual(&nvbo->kmap, &is_iomem);
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900512
513 mem = nouveau_bo_mem_index(nvbo, index, mem);
514
Ben Skeggs6ee73862009-12-11 19:24:15 +1000515 if (is_iomem)
516 return ioread16_native((void __force __iomem *)mem);
517 else
518 return *mem;
519}
520
521void
522nouveau_bo_wr16(struct nouveau_bo *nvbo, unsigned index, u16 val)
523{
524 bool is_iomem;
525 u16 *mem = ttm_kmap_obj_virtual(&nvbo->kmap, &is_iomem);
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900526
527 mem = nouveau_bo_mem_index(nvbo, index, mem);
528
Ben Skeggs6ee73862009-12-11 19:24:15 +1000529 if (is_iomem)
530 iowrite16_native(val, (void __force __iomem *)mem);
531 else
532 *mem = val;
533}
534
535u32
536nouveau_bo_rd32(struct nouveau_bo *nvbo, unsigned index)
537{
538 bool is_iomem;
539 u32 *mem = ttm_kmap_obj_virtual(&nvbo->kmap, &is_iomem);
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900540
541 mem = nouveau_bo_mem_index(nvbo, index, mem);
542
Ben Skeggs6ee73862009-12-11 19:24:15 +1000543 if (is_iomem)
544 return ioread32_native((void __force __iomem *)mem);
545 else
546 return *mem;
547}
548
549void
550nouveau_bo_wr32(struct nouveau_bo *nvbo, unsigned index, u32 val)
551{
552 bool is_iomem;
553 u32 *mem = ttm_kmap_obj_virtual(&nvbo->kmap, &is_iomem);
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900554
555 mem = nouveau_bo_mem_index(nvbo, index, mem);
556
Ben Skeggs6ee73862009-12-11 19:24:15 +1000557 if (is_iomem)
558 iowrite32_native(val, (void __force __iomem *)mem);
559 else
560 *mem = val;
561}
562
Jerome Glisse649bf3c2011-11-01 20:46:13 -0400563static struct ttm_tt *
Ben Skeggsebb945a2012-07-20 08:17:34 +1000564nouveau_ttm_tt_create(struct ttm_bo_device *bdev, unsigned long size,
565 uint32_t page_flags, struct page *dummy_read)
Ben Skeggs6ee73862009-12-11 19:24:15 +1000566{
Max Filippovdf1b4b92012-10-14 01:58:26 +0400567#if __OS_HAS_AGP
Ben Skeggsebb945a2012-07-20 08:17:34 +1000568 struct nouveau_drm *drm = nouveau_bdev(bdev);
569 struct drm_device *dev = drm->dev;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000570
Ben Skeggsebb945a2012-07-20 08:17:34 +1000571 if (drm->agp.stat == ENABLED) {
572 return ttm_agp_tt_create(bdev, dev->agp->bridge, size,
573 page_flags, dummy_read);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000574 }
Max Filippovdf1b4b92012-10-14 01:58:26 +0400575#endif
Ben Skeggs6ee73862009-12-11 19:24:15 +1000576
Ben Skeggsebb945a2012-07-20 08:17:34 +1000577 return nouveau_sgdma_create_ttm(bdev, size, page_flags, dummy_read);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000578}
579
580static int
581nouveau_bo_invalidate_caches(struct ttm_bo_device *bdev, uint32_t flags)
582{
583 /* We'll do this from user space. */
584 return 0;
585}
586
587static int
588nouveau_bo_init_mem_type(struct ttm_bo_device *bdev, uint32_t type,
589 struct ttm_mem_type_manager *man)
590{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000591 struct nouveau_drm *drm = nouveau_bdev(bdev);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000592
593 switch (type) {
594 case TTM_PL_SYSTEM:
595 man->flags = TTM_MEMTYPE_FLAG_MAPPABLE;
596 man->available_caching = TTM_PL_MASK_CACHING;
597 man->default_caching = TTM_PL_FLAG_CACHED;
598 break;
599 case TTM_PL_VRAM:
Alexandre Courbote2a4e782014-06-27 19:28:50 +0900600 man->flags = TTM_MEMTYPE_FLAG_FIXED |
601 TTM_MEMTYPE_FLAG_MAPPABLE;
602 man->available_caching = TTM_PL_FLAG_UNCACHED |
603 TTM_PL_FLAG_WC;
604 man->default_caching = TTM_PL_FLAG_WC;
605
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000606 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA) {
Alexandre Courbote2a4e782014-06-27 19:28:50 +0900607 /* Some BARs do not support being ioremapped WC */
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000608 if (nvkm_bar(&drm->device)->iomap_uncached) {
Alexandre Courbote2a4e782014-06-27 19:28:50 +0900609 man->available_caching = TTM_PL_FLAG_UNCACHED;
610 man->default_caching = TTM_PL_FLAG_UNCACHED;
611 }
612
Ben Skeggs573a2a32010-08-25 15:26:04 +1000613 man->func = &nouveau_vram_manager;
Ben Skeggsf869ef82010-11-15 11:53:16 +1000614 man->io_reserve_fastpath = false;
615 man->use_io_reserve_lru = true;
616 } else {
Ben Skeggs573a2a32010-08-25 15:26:04 +1000617 man->func = &ttm_bo_manager_func;
Ben Skeggsf869ef82010-11-15 11:53:16 +1000618 }
Ben Skeggs6ee73862009-12-11 19:24:15 +1000619 break;
620 case TTM_PL_TT:
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000621 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA)
Ben Skeggs26c0c9e2011-02-10 12:59:51 +1000622 man->func = &nouveau_gart_manager;
623 else
Ben Skeggsebb945a2012-07-20 08:17:34 +1000624 if (drm->agp.stat != ENABLED)
Ben Skeggs3863c9b2012-07-14 19:09:17 +1000625 man->func = &nv04_gart_manager;
626 else
Ben Skeggs26c0c9e2011-02-10 12:59:51 +1000627 man->func = &ttm_bo_manager_func;
Ben Skeggsebb945a2012-07-20 08:17:34 +1000628
629 if (drm->agp.stat == ENABLED) {
Jerome Glissef32f02f2010-04-09 14:39:25 +0200630 man->flags = TTM_MEMTYPE_FLAG_MAPPABLE;
Francisco Jereza3d487e2010-11-20 22:11:22 +0100631 man->available_caching = TTM_PL_FLAG_UNCACHED |
632 TTM_PL_FLAG_WC;
633 man->default_caching = TTM_PL_FLAG_WC;
Ben Skeggsebb945a2012-07-20 08:17:34 +1000634 } else {
Ben Skeggs6ee73862009-12-11 19:24:15 +1000635 man->flags = TTM_MEMTYPE_FLAG_MAPPABLE |
636 TTM_MEMTYPE_FLAG_CMA;
637 man->available_caching = TTM_PL_MASK_CACHING;
638 man->default_caching = TTM_PL_FLAG_CACHED;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000639 }
Ben Skeggsebb945a2012-07-20 08:17:34 +1000640
Ben Skeggs6ee73862009-12-11 19:24:15 +1000641 break;
642 default:
Ben Skeggs6ee73862009-12-11 19:24:15 +1000643 return -EINVAL;
644 }
645 return 0;
646}
647
648static void
649nouveau_bo_evict_flags(struct ttm_buffer_object *bo, struct ttm_placement *pl)
650{
651 struct nouveau_bo *nvbo = nouveau_bo(bo);
652
653 switch (bo->mem.mem_type) {
Francisco Jerez22fbd532009-12-11 18:40:17 +0100654 case TTM_PL_VRAM:
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100655 nouveau_bo_placement_set(nvbo, TTM_PL_FLAG_TT,
656 TTM_PL_FLAG_SYSTEM);
Francisco Jerez22fbd532009-12-11 18:40:17 +0100657 break;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000658 default:
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100659 nouveau_bo_placement_set(nvbo, TTM_PL_FLAG_SYSTEM, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000660 break;
661 }
Francisco Jerez22fbd532009-12-11 18:40:17 +0100662
663 *pl = nvbo->placement;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000664}
665
666
Ben Skeggs6ee73862009-12-11 19:24:15 +1000667static int
Ben Skeggs49981042012-08-06 19:38:25 +1000668nve0_bo_move_init(struct nouveau_channel *chan, u32 handle)
669{
670 int ret = RING_SPACE(chan, 2);
671 if (ret == 0) {
672 BEGIN_NVC0(chan, NvSubCopy, 0x0000, 1);
Ben Skeggs00fc6f62013-07-09 14:20:15 +1000673 OUT_RING (chan, handle & 0x0000ffff);
Ben Skeggs49981042012-08-06 19:38:25 +1000674 FIRE_RING (chan);
675 }
676 return ret;
677}
678
679static int
Ben Skeggsc6b7e892012-03-20 14:36:04 +1000680nve0_bo_move_copy(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
681 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
682{
683 struct nouveau_mem *node = old_mem->mm_node;
684 int ret = RING_SPACE(chan, 10);
685 if (ret == 0) {
Ben Skeggs6d597022012-04-01 21:09:13 +1000686 BEGIN_NVC0(chan, NvSubCopy, 0x0400, 8);
Ben Skeggsc6b7e892012-03-20 14:36:04 +1000687 OUT_RING (chan, upper_32_bits(node->vma[0].offset));
688 OUT_RING (chan, lower_32_bits(node->vma[0].offset));
689 OUT_RING (chan, upper_32_bits(node->vma[1].offset));
690 OUT_RING (chan, lower_32_bits(node->vma[1].offset));
691 OUT_RING (chan, PAGE_SIZE);
692 OUT_RING (chan, PAGE_SIZE);
693 OUT_RING (chan, PAGE_SIZE);
694 OUT_RING (chan, new_mem->num_pages);
Ben Skeggs6d597022012-04-01 21:09:13 +1000695 BEGIN_IMC0(chan, NvSubCopy, 0x0300, 0x0386);
Ben Skeggsc6b7e892012-03-20 14:36:04 +1000696 }
697 return ret;
698}
699
700static int
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000701nvc0_bo_move_init(struct nouveau_channel *chan, u32 handle)
702{
703 int ret = RING_SPACE(chan, 2);
704 if (ret == 0) {
705 BEGIN_NVC0(chan, NvSubCopy, 0x0000, 1);
706 OUT_RING (chan, handle);
707 }
708 return ret;
709}
710
711static int
Ben Skeggs1a460982012-05-04 15:17:28 +1000712nvc0_bo_move_copy(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
713 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
714{
715 struct nouveau_mem *node = old_mem->mm_node;
716 u64 src_offset = node->vma[0].offset;
717 u64 dst_offset = node->vma[1].offset;
718 u32 page_count = new_mem->num_pages;
719 int ret;
720
721 page_count = new_mem->num_pages;
722 while (page_count) {
723 int line_count = (page_count > 8191) ? 8191 : page_count;
724
725 ret = RING_SPACE(chan, 11);
726 if (ret)
727 return ret;
728
729 BEGIN_NVC0(chan, NvSubCopy, 0x030c, 8);
730 OUT_RING (chan, upper_32_bits(src_offset));
731 OUT_RING (chan, lower_32_bits(src_offset));
732 OUT_RING (chan, upper_32_bits(dst_offset));
733 OUT_RING (chan, lower_32_bits(dst_offset));
734 OUT_RING (chan, PAGE_SIZE);
735 OUT_RING (chan, PAGE_SIZE);
736 OUT_RING (chan, PAGE_SIZE);
737 OUT_RING (chan, line_count);
738 BEGIN_NVC0(chan, NvSubCopy, 0x0300, 1);
739 OUT_RING (chan, 0x00000110);
740
741 page_count -= line_count;
742 src_offset += (PAGE_SIZE * line_count);
743 dst_offset += (PAGE_SIZE * line_count);
744 }
745
746 return 0;
747}
748
749static int
Ben Skeggs183720b2010-12-09 15:17:10 +1000750nvc0_bo_move_m2mf(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
751 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
752{
Ben Skeggsd2f966662011-06-06 20:54:42 +1000753 struct nouveau_mem *node = old_mem->mm_node;
754 u64 src_offset = node->vma[0].offset;
755 u64 dst_offset = node->vma[1].offset;
Ben Skeggs183720b2010-12-09 15:17:10 +1000756 u32 page_count = new_mem->num_pages;
757 int ret;
758
Ben Skeggs183720b2010-12-09 15:17:10 +1000759 page_count = new_mem->num_pages;
760 while (page_count) {
761 int line_count = (page_count > 2047) ? 2047 : page_count;
762
763 ret = RING_SPACE(chan, 12);
764 if (ret)
765 return ret;
766
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000767 BEGIN_NVC0(chan, NvSubCopy, 0x0238, 2);
Ben Skeggs183720b2010-12-09 15:17:10 +1000768 OUT_RING (chan, upper_32_bits(dst_offset));
769 OUT_RING (chan, lower_32_bits(dst_offset));
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000770 BEGIN_NVC0(chan, NvSubCopy, 0x030c, 6);
Ben Skeggs183720b2010-12-09 15:17:10 +1000771 OUT_RING (chan, upper_32_bits(src_offset));
772 OUT_RING (chan, lower_32_bits(src_offset));
773 OUT_RING (chan, PAGE_SIZE); /* src_pitch */
774 OUT_RING (chan, PAGE_SIZE); /* dst_pitch */
775 OUT_RING (chan, PAGE_SIZE); /* line_length */
776 OUT_RING (chan, line_count);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000777 BEGIN_NVC0(chan, NvSubCopy, 0x0300, 1);
Ben Skeggs183720b2010-12-09 15:17:10 +1000778 OUT_RING (chan, 0x00100110);
779
780 page_count -= line_count;
781 src_offset += (PAGE_SIZE * line_count);
782 dst_offset += (PAGE_SIZE * line_count);
783 }
784
785 return 0;
786}
787
788static int
Ben Skeggsfdf53242012-05-04 15:15:12 +1000789nva3_bo_move_copy(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
790 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
791{
792 struct nouveau_mem *node = old_mem->mm_node;
793 u64 src_offset = node->vma[0].offset;
794 u64 dst_offset = node->vma[1].offset;
795 u32 page_count = new_mem->num_pages;
796 int ret;
797
798 page_count = new_mem->num_pages;
799 while (page_count) {
800 int line_count = (page_count > 8191) ? 8191 : page_count;
801
802 ret = RING_SPACE(chan, 11);
803 if (ret)
804 return ret;
805
806 BEGIN_NV04(chan, NvSubCopy, 0x030c, 8);
807 OUT_RING (chan, upper_32_bits(src_offset));
808 OUT_RING (chan, lower_32_bits(src_offset));
809 OUT_RING (chan, upper_32_bits(dst_offset));
810 OUT_RING (chan, lower_32_bits(dst_offset));
811 OUT_RING (chan, PAGE_SIZE);
812 OUT_RING (chan, PAGE_SIZE);
813 OUT_RING (chan, PAGE_SIZE);
814 OUT_RING (chan, line_count);
815 BEGIN_NV04(chan, NvSubCopy, 0x0300, 1);
816 OUT_RING (chan, 0x00000110);
817
818 page_count -= line_count;
819 src_offset += (PAGE_SIZE * line_count);
820 dst_offset += (PAGE_SIZE * line_count);
821 }
822
823 return 0;
824}
825
826static int
Ben Skeggs5490e5d2012-05-04 14:34:16 +1000827nv98_bo_move_exec(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
828 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
829{
830 struct nouveau_mem *node = old_mem->mm_node;
831 int ret = RING_SPACE(chan, 7);
832 if (ret == 0) {
833 BEGIN_NV04(chan, NvSubCopy, 0x0320, 6);
834 OUT_RING (chan, upper_32_bits(node->vma[0].offset));
835 OUT_RING (chan, lower_32_bits(node->vma[0].offset));
836 OUT_RING (chan, upper_32_bits(node->vma[1].offset));
837 OUT_RING (chan, lower_32_bits(node->vma[1].offset));
838 OUT_RING (chan, 0x00000000 /* COPY */);
839 OUT_RING (chan, new_mem->num_pages << PAGE_SHIFT);
840 }
841 return ret;
842}
843
844static int
Ben Skeggs4c193d22012-05-04 14:21:15 +1000845nv84_bo_move_exec(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
846 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
847{
848 struct nouveau_mem *node = old_mem->mm_node;
849 int ret = RING_SPACE(chan, 7);
850 if (ret == 0) {
851 BEGIN_NV04(chan, NvSubCopy, 0x0304, 6);
852 OUT_RING (chan, new_mem->num_pages << PAGE_SHIFT);
853 OUT_RING (chan, upper_32_bits(node->vma[0].offset));
854 OUT_RING (chan, lower_32_bits(node->vma[0].offset));
855 OUT_RING (chan, upper_32_bits(node->vma[1].offset));
856 OUT_RING (chan, lower_32_bits(node->vma[1].offset));
857 OUT_RING (chan, 0x00000000 /* MODE_COPY, QUERY_NONE */);
858 }
859 return ret;
860}
861
862static int
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000863nv50_bo_move_init(struct nouveau_channel *chan, u32 handle)
864{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000865 int ret = RING_SPACE(chan, 6);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000866 if (ret == 0) {
Ben Skeggsebb945a2012-07-20 08:17:34 +1000867 BEGIN_NV04(chan, NvSubCopy, 0x0000, 1);
868 OUT_RING (chan, handle);
869 BEGIN_NV04(chan, NvSubCopy, 0x0180, 3);
Ben Skeggsf45f55c2014-08-10 04:10:23 +1000870 OUT_RING (chan, chan->drm->ntfy.handle);
871 OUT_RING (chan, chan->vram.handle);
872 OUT_RING (chan, chan->vram.handle);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000873 }
874
875 return ret;
876}
877
878static int
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000879nv50_bo_move_m2mf(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
880 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
Ben Skeggs6ee73862009-12-11 19:24:15 +1000881{
Ben Skeggsd2f966662011-06-06 20:54:42 +1000882 struct nouveau_mem *node = old_mem->mm_node;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000883 u64 length = (new_mem->num_pages << PAGE_SHIFT);
Ben Skeggsd2f966662011-06-06 20:54:42 +1000884 u64 src_offset = node->vma[0].offset;
885 u64 dst_offset = node->vma[1].offset;
Maarten Lankhorstce8f7692013-11-12 13:34:08 +0100886 int src_tiled = !!node->memtype;
887 int dst_tiled = !!((struct nouveau_mem *)new_mem->mm_node)->memtype;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000888 int ret;
889
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000890 while (length) {
891 u32 amount, stride, height;
892
Maarten Lankhorstce8f7692013-11-12 13:34:08 +0100893 ret = RING_SPACE(chan, 18 + 6 * (src_tiled + dst_tiled));
894 if (ret)
895 return ret;
896
Ben Skeggs5220b3c2010-09-23 15:21:17 +1000897 amount = min(length, (u64)(4 * 1024 * 1024));
898 stride = 16 * 4;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000899 height = amount / stride;
900
Maarten Lankhorstce8f7692013-11-12 13:34:08 +0100901 if (src_tiled) {
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000902 BEGIN_NV04(chan, NvSubCopy, 0x0200, 7);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000903 OUT_RING (chan, 0);
Ben Skeggs5220b3c2010-09-23 15:21:17 +1000904 OUT_RING (chan, 0);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000905 OUT_RING (chan, stride);
906 OUT_RING (chan, height);
907 OUT_RING (chan, 1);
908 OUT_RING (chan, 0);
909 OUT_RING (chan, 0);
910 } else {
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000911 BEGIN_NV04(chan, NvSubCopy, 0x0200, 1);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000912 OUT_RING (chan, 1);
913 }
Maarten Lankhorstce8f7692013-11-12 13:34:08 +0100914 if (dst_tiled) {
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000915 BEGIN_NV04(chan, NvSubCopy, 0x021c, 7);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000916 OUT_RING (chan, 0);
Ben Skeggs5220b3c2010-09-23 15:21:17 +1000917 OUT_RING (chan, 0);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000918 OUT_RING (chan, stride);
919 OUT_RING (chan, height);
920 OUT_RING (chan, 1);
921 OUT_RING (chan, 0);
922 OUT_RING (chan, 0);
923 } else {
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000924 BEGIN_NV04(chan, NvSubCopy, 0x021c, 1);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000925 OUT_RING (chan, 1);
926 }
927
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000928 BEGIN_NV04(chan, NvSubCopy, 0x0238, 2);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000929 OUT_RING (chan, upper_32_bits(src_offset));
930 OUT_RING (chan, upper_32_bits(dst_offset));
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000931 BEGIN_NV04(chan, NvSubCopy, 0x030c, 8);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000932 OUT_RING (chan, lower_32_bits(src_offset));
933 OUT_RING (chan, lower_32_bits(dst_offset));
934 OUT_RING (chan, stride);
935 OUT_RING (chan, stride);
936 OUT_RING (chan, stride);
937 OUT_RING (chan, height);
938 OUT_RING (chan, 0x00000101);
939 OUT_RING (chan, 0x00000000);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000940 BEGIN_NV04(chan, NvSubCopy, NV_MEMORY_TO_MEMORY_FORMAT_NOP, 1);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000941 OUT_RING (chan, 0);
942
943 length -= amount;
944 src_offset += amount;
945 dst_offset += amount;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000946 }
947
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000948 return 0;
949}
950
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000951static int
952nv04_bo_move_init(struct nouveau_channel *chan, u32 handle)
953{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000954 int ret = RING_SPACE(chan, 4);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000955 if (ret == 0) {
Ben Skeggsebb945a2012-07-20 08:17:34 +1000956 BEGIN_NV04(chan, NvSubCopy, 0x0000, 1);
957 OUT_RING (chan, handle);
958 BEGIN_NV04(chan, NvSubCopy, 0x0180, 1);
Ben Skeggsf45f55c2014-08-10 04:10:23 +1000959 OUT_RING (chan, chan->drm->ntfy.handle);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000960 }
961
962 return ret;
963}
964
Ben Skeggsa6704782011-02-16 09:10:20 +1000965static inline uint32_t
966nouveau_bo_mem_ctxdma(struct ttm_buffer_object *bo,
967 struct nouveau_channel *chan, struct ttm_mem_reg *mem)
968{
969 if (mem->mem_type == TTM_PL_TT)
Ben Skeggsebb945a2012-07-20 08:17:34 +1000970 return NvDmaTT;
Ben Skeggsf45f55c2014-08-10 04:10:23 +1000971 return chan->vram.handle;
Ben Skeggsa6704782011-02-16 09:10:20 +1000972}
973
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000974static int
975nv04_bo_move_m2mf(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
976 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
977{
Ben Skeggsd961db72010-08-05 10:48:18 +1000978 u32 src_offset = old_mem->start << PAGE_SHIFT;
979 u32 dst_offset = new_mem->start << PAGE_SHIFT;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000980 u32 page_count = new_mem->num_pages;
981 int ret;
982
983 ret = RING_SPACE(chan, 3);
984 if (ret)
985 return ret;
986
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000987 BEGIN_NV04(chan, NvSubCopy, NV_MEMORY_TO_MEMORY_FORMAT_DMA_SOURCE, 2);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000988 OUT_RING (chan, nouveau_bo_mem_ctxdma(bo, chan, old_mem));
989 OUT_RING (chan, nouveau_bo_mem_ctxdma(bo, chan, new_mem));
990
Ben Skeggs6ee73862009-12-11 19:24:15 +1000991 page_count = new_mem->num_pages;
992 while (page_count) {
993 int line_count = (page_count > 2047) ? 2047 : page_count;
994
Ben Skeggs6ee73862009-12-11 19:24:15 +1000995 ret = RING_SPACE(chan, 11);
996 if (ret)
997 return ret;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000998
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000999 BEGIN_NV04(chan, NvSubCopy,
Ben Skeggs6ee73862009-12-11 19:24:15 +10001000 NV_MEMORY_TO_MEMORY_FORMAT_OFFSET_IN, 8);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001001 OUT_RING (chan, src_offset);
1002 OUT_RING (chan, dst_offset);
1003 OUT_RING (chan, PAGE_SIZE); /* src_pitch */
1004 OUT_RING (chan, PAGE_SIZE); /* dst_pitch */
1005 OUT_RING (chan, PAGE_SIZE); /* line_length */
1006 OUT_RING (chan, line_count);
1007 OUT_RING (chan, 0x00000101);
1008 OUT_RING (chan, 0x00000000);
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001009 BEGIN_NV04(chan, NvSubCopy, NV_MEMORY_TO_MEMORY_FORMAT_NOP, 1);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001010 OUT_RING (chan, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001011
1012 page_count -= line_count;
1013 src_offset += (PAGE_SIZE * line_count);
1014 dst_offset += (PAGE_SIZE * line_count);
1015 }
1016
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001017 return 0;
1018}
1019
1020static int
Ben Skeggs3c57d852013-11-22 10:35:25 +10001021nouveau_bo_move_prep(struct nouveau_drm *drm, struct ttm_buffer_object *bo,
1022 struct ttm_mem_reg *mem)
Ben Skeggsd2f966662011-06-06 20:54:42 +10001023{
Ben Skeggs3c57d852013-11-22 10:35:25 +10001024 struct nouveau_mem *old_node = bo->mem.mm_node;
1025 struct nouveau_mem *new_node = mem->mm_node;
1026 u64 size = (u64)mem->num_pages << PAGE_SHIFT;
Ben Skeggsd2f966662011-06-06 20:54:42 +10001027 int ret;
1028
Ben Skeggs3ee6f5b2014-08-10 04:10:20 +10001029 ret = nouveau_vm_get(drm->client.vm, size, old_node->page_shift,
Ben Skeggs3c57d852013-11-22 10:35:25 +10001030 NV_MEM_ACCESS_RW, &old_node->vma[0]);
Ben Skeggsd2f966662011-06-06 20:54:42 +10001031 if (ret)
1032 return ret;
1033
Ben Skeggs3ee6f5b2014-08-10 04:10:20 +10001034 ret = nouveau_vm_get(drm->client.vm, size, new_node->page_shift,
Ben Skeggs3c57d852013-11-22 10:35:25 +10001035 NV_MEM_ACCESS_RW, &old_node->vma[1]);
1036 if (ret) {
1037 nouveau_vm_put(&old_node->vma[0]);
1038 return ret;
1039 }
1040
1041 nouveau_vm_map(&old_node->vma[0], old_node);
1042 nouveau_vm_map(&old_node->vma[1], new_node);
Ben Skeggsd2f966662011-06-06 20:54:42 +10001043 return 0;
1044}
1045
1046static int
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001047nouveau_bo_move_m2mf(struct ttm_buffer_object *bo, int evict, bool intr,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001048 bool no_wait_gpu, struct ttm_mem_reg *new_mem)
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001049{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001050 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
Dave Jones1934a2a2013-09-17 17:26:34 -04001051 struct nouveau_channel *chan = drm->ttm.chan;
Ben Skeggs0ad72862014-08-10 04:10:22 +10001052 struct nouveau_cli *cli = (void *)nvif_client(&chan->device->base);
Ben Skeggs35b81412013-11-22 10:39:57 +10001053 struct nouveau_fence *fence;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001054 int ret;
1055
Ben Skeggsd2f966662011-06-06 20:54:42 +10001056 /* create temporary vmas for the transfer and attach them to the
1057 * old nouveau_mem node, these will get cleaned up after ttm has
1058 * destroyed the ttm_mem_reg
Ben Skeggs3425df42011-02-10 11:22:12 +10001059 */
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001060 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA) {
Ben Skeggs3c57d852013-11-22 10:35:25 +10001061 ret = nouveau_bo_move_prep(drm, bo, new_mem);
Ben Skeggsd2f966662011-06-06 20:54:42 +10001062 if (ret)
Ben Skeggs3c57d852013-11-22 10:35:25 +10001063 return ret;
Ben Skeggs3425df42011-02-10 11:22:12 +10001064 }
1065
Ben Skeggs0ad72862014-08-10 04:10:22 +10001066 mutex_lock_nested(&cli->mutex, SINGLE_DEPTH_NESTING);
Maarten Lankhorste3be4c22014-09-16 11:15:07 +02001067 ret = nouveau_fence_sync(nouveau_bo(bo), chan, true, intr);
Ben Skeggs6a6b73f2010-10-05 16:53:48 +10001068 if (ret == 0) {
Ben Skeggs35b81412013-11-22 10:39:57 +10001069 ret = drm->ttm.move(chan, bo, &bo->mem, new_mem);
1070 if (ret == 0) {
1071 ret = nouveau_fence_new(chan, false, &fence);
1072 if (ret == 0) {
Maarten Lankhorstf2c24b82014-04-02 17:14:48 +02001073 ret = ttm_bo_move_accel_cleanup(bo,
1074 &fence->base,
Ben Skeggs35b81412013-11-22 10:39:57 +10001075 evict,
1076 no_wait_gpu,
1077 new_mem);
1078 nouveau_fence_unref(&fence);
1079 }
1080 }
Ben Skeggs6a6b73f2010-10-05 16:53:48 +10001081 }
Ben Skeggs0ad72862014-08-10 04:10:22 +10001082 mutex_unlock(&cli->mutex);
Ben Skeggs6a6b73f2010-10-05 16:53:48 +10001083 return ret;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001084}
1085
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001086void
Ben Skeggs49981042012-08-06 19:38:25 +10001087nouveau_bo_move_init(struct nouveau_drm *drm)
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001088{
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001089 static const struct {
1090 const char *name;
Ben Skeggs1a460982012-05-04 15:17:28 +10001091 int engine;
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001092 u32 oclass;
1093 int (*exec)(struct nouveau_channel *,
1094 struct ttm_buffer_object *,
1095 struct ttm_mem_reg *, struct ttm_mem_reg *);
1096 int (*init)(struct nouveau_channel *, u32 handle);
1097 } _methods[] = {
Ben Skeggs00fc6f62013-07-09 14:20:15 +10001098 { "COPY", 4, 0xa0b5, nve0_bo_move_copy, nve0_bo_move_init },
Ben Skeggs49981042012-08-06 19:38:25 +10001099 { "GRCE", 0, 0xa0b5, nve0_bo_move_copy, nvc0_bo_move_init },
Ben Skeggs1a460982012-05-04 15:17:28 +10001100 { "COPY1", 5, 0x90b8, nvc0_bo_move_copy, nvc0_bo_move_init },
1101 { "COPY0", 4, 0x90b5, nvc0_bo_move_copy, nvc0_bo_move_init },
1102 { "COPY", 0, 0x85b5, nva3_bo_move_copy, nv50_bo_move_init },
1103 { "CRYPT", 0, 0x74c1, nv84_bo_move_exec, nv50_bo_move_init },
1104 { "M2MF", 0, 0x9039, nvc0_bo_move_m2mf, nvc0_bo_move_init },
1105 { "M2MF", 0, 0x5039, nv50_bo_move_m2mf, nv50_bo_move_init },
1106 { "M2MF", 0, 0x0039, nv04_bo_move_m2mf, nv04_bo_move_init },
Ben Skeggs5490e5d2012-05-04 14:34:16 +10001107 {},
Ben Skeggs1a460982012-05-04 15:17:28 +10001108 { "CRYPT", 0, 0x88b4, nv98_bo_move_exec, nv50_bo_move_init },
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001109 }, *mthd = _methods;
1110 const char *name = "CPU";
1111 int ret;
1112
1113 do {
Ben Skeggs49981042012-08-06 19:38:25 +10001114 struct nouveau_channel *chan;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001115
Ben Skeggs00fc6f62013-07-09 14:20:15 +10001116 if (mthd->engine)
Ben Skeggs49981042012-08-06 19:38:25 +10001117 chan = drm->cechan;
1118 else
1119 chan = drm->channel;
1120 if (chan == NULL)
1121 continue;
1122
Ben Skeggs0ad72862014-08-10 04:10:22 +10001123 ret = nvif_object_init(chan->object, NULL,
1124 mthd->oclass | (mthd->engine << 16),
1125 mthd->oclass, NULL, 0,
1126 &drm->ttm.copy);
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001127 if (ret == 0) {
Ben Skeggs0ad72862014-08-10 04:10:22 +10001128 ret = mthd->init(chan, drm->ttm.copy.handle);
Ben Skeggsebb945a2012-07-20 08:17:34 +10001129 if (ret) {
Ben Skeggs0ad72862014-08-10 04:10:22 +10001130 nvif_object_fini(&drm->ttm.copy);
Ben Skeggsebb945a2012-07-20 08:17:34 +10001131 continue;
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001132 }
Ben Skeggsebb945a2012-07-20 08:17:34 +10001133
1134 drm->ttm.move = mthd->exec;
Ben Skeggs1bb3f6a2013-07-08 10:40:35 +10001135 drm->ttm.chan = chan;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001136 name = mthd->name;
1137 break;
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001138 }
1139 } while ((++mthd)->exec);
1140
Ben Skeggsebb945a2012-07-20 08:17:34 +10001141 NV_INFO(drm, "MM: using %s for buffer copies\n", name);
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001142}
1143
Ben Skeggs6ee73862009-12-11 19:24:15 +10001144static int
1145nouveau_bo_move_flipd(struct ttm_buffer_object *bo, bool evict, bool intr,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001146 bool no_wait_gpu, struct ttm_mem_reg *new_mem)
Ben Skeggs6ee73862009-12-11 19:24:15 +10001147{
Christian Königf1217ed2014-08-27 13:16:04 +02001148 struct ttm_place placement_memtype = {
1149 .fpfn = 0,
1150 .lpfn = 0,
1151 .flags = TTM_PL_FLAG_TT | TTM_PL_MASK_CACHING
1152 };
Ben Skeggs6ee73862009-12-11 19:24:15 +10001153 struct ttm_placement placement;
1154 struct ttm_mem_reg tmp_mem;
1155 int ret;
1156
Ben Skeggs6ee73862009-12-11 19:24:15 +10001157 placement.num_placement = placement.num_busy_placement = 1;
Francisco Jerez77e2b5e2009-12-16 19:05:00 +01001158 placement.placement = placement.busy_placement = &placement_memtype;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001159
1160 tmp_mem = *new_mem;
1161 tmp_mem.mm_node = NULL;
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001162 ret = ttm_bo_mem_space(bo, &placement, &tmp_mem, intr, no_wait_gpu);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001163 if (ret)
1164 return ret;
1165
1166 ret = ttm_tt_bind(bo->ttm, &tmp_mem);
1167 if (ret)
1168 goto out;
1169
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001170 ret = nouveau_bo_move_m2mf(bo, true, intr, no_wait_gpu, &tmp_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001171 if (ret)
1172 goto out;
1173
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001174 ret = ttm_bo_move_ttm(bo, true, no_wait_gpu, new_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001175out:
Ben Skeggs42311ff2010-08-04 12:07:08 +10001176 ttm_bo_mem_put(bo, &tmp_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001177 return ret;
1178}
1179
1180static int
1181nouveau_bo_move_flips(struct ttm_buffer_object *bo, bool evict, bool intr,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001182 bool no_wait_gpu, struct ttm_mem_reg *new_mem)
Ben Skeggs6ee73862009-12-11 19:24:15 +10001183{
Christian Königf1217ed2014-08-27 13:16:04 +02001184 struct ttm_place placement_memtype = {
1185 .fpfn = 0,
1186 .lpfn = 0,
1187 .flags = TTM_PL_FLAG_TT | TTM_PL_MASK_CACHING
1188 };
Ben Skeggs6ee73862009-12-11 19:24:15 +10001189 struct ttm_placement placement;
1190 struct ttm_mem_reg tmp_mem;
1191 int ret;
1192
Ben Skeggs6ee73862009-12-11 19:24:15 +10001193 placement.num_placement = placement.num_busy_placement = 1;
Francisco Jerez77e2b5e2009-12-16 19:05:00 +01001194 placement.placement = placement.busy_placement = &placement_memtype;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001195
1196 tmp_mem = *new_mem;
1197 tmp_mem.mm_node = NULL;
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001198 ret = ttm_bo_mem_space(bo, &placement, &tmp_mem, intr, no_wait_gpu);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001199 if (ret)
1200 return ret;
1201
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001202 ret = ttm_bo_move_ttm(bo, true, no_wait_gpu, &tmp_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001203 if (ret)
1204 goto out;
1205
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001206 ret = nouveau_bo_move_m2mf(bo, true, intr, no_wait_gpu, new_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001207 if (ret)
1208 goto out;
1209
1210out:
Ben Skeggs42311ff2010-08-04 12:07:08 +10001211 ttm_bo_mem_put(bo, &tmp_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001212 return ret;
1213}
1214
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001215static void
1216nouveau_bo_move_ntfy(struct ttm_buffer_object *bo, struct ttm_mem_reg *new_mem)
1217{
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001218 struct nouveau_bo *nvbo = nouveau_bo(bo);
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001219 struct nouveau_vma *vma;
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001220
Ben Skeggs9f1feed2012-01-25 15:34:22 +10001221 /* ttm can now (stupidly) pass the driver bos it didn't create... */
1222 if (bo->destroy != nouveau_bo_del_ttm)
1223 return;
1224
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001225 list_for_each_entry(vma, &nvbo->vma_list, head) {
Ben Skeggs2e2cfbe2013-11-15 11:56:49 +10001226 if (new_mem && new_mem->mem_type != TTM_PL_SYSTEM &&
1227 (new_mem->mem_type == TTM_PL_VRAM ||
1228 nvbo->page_shift != vma->vm->vmm->lpg_shift)) {
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001229 nouveau_vm_map(vma, new_mem->mm_node);
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001230 } else {
1231 nouveau_vm_unmap(vma);
1232 }
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001233 }
1234}
1235
Ben Skeggs6ee73862009-12-11 19:24:15 +10001236static int
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001237nouveau_bo_vm_bind(struct ttm_buffer_object *bo, struct ttm_mem_reg *new_mem,
Ben Skeggsebb945a2012-07-20 08:17:34 +10001238 struct nouveau_drm_tile **new_tile)
Ben Skeggs6ee73862009-12-11 19:24:15 +10001239{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001240 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
1241 struct drm_device *dev = drm->dev;
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001242 struct nouveau_bo *nvbo = nouveau_bo(bo);
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001243 u64 offset = new_mem->start << PAGE_SHIFT;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001244
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001245 *new_tile = NULL;
1246 if (new_mem->mem_type != TTM_PL_VRAM)
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001247 return 0;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001248
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001249 if (drm->device.info.family >= NV_DEVICE_INFO_V0_CELSIUS) {
Ben Skeggsbc9e7b92012-07-19 17:54:21 +10001250 *new_tile = nv10_bo_set_tiling(dev, offset, new_mem->size,
Francisco Jereza5cf68b2010-10-24 16:14:41 +02001251 nvbo->tile_mode,
1252 nvbo->tile_flags);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001253 }
1254
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001255 return 0;
1256}
Ben Skeggs6ee73862009-12-11 19:24:15 +10001257
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001258static void
1259nouveau_bo_vm_cleanup(struct ttm_buffer_object *bo,
Ben Skeggsebb945a2012-07-20 08:17:34 +10001260 struct nouveau_drm_tile *new_tile,
1261 struct nouveau_drm_tile **old_tile)
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001262{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001263 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
1264 struct drm_device *dev = drm->dev;
Maarten Lankhorstf2c24b82014-04-02 17:14:48 +02001265 struct fence *fence = reservation_object_get_excl(bo->resv);
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001266
Maarten Lankhorstf2c24b82014-04-02 17:14:48 +02001267 nv10_bo_put_tile_region(dev, *old_tile, fence);
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001268 *old_tile = new_tile;
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001269}
1270
1271static int
1272nouveau_bo_move(struct ttm_buffer_object *bo, bool evict, bool intr,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001273 bool no_wait_gpu, struct ttm_mem_reg *new_mem)
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001274{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001275 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001276 struct nouveau_bo *nvbo = nouveau_bo(bo);
1277 struct ttm_mem_reg *old_mem = &bo->mem;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001278 struct nouveau_drm_tile *new_tile = NULL;
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001279 int ret = 0;
1280
Alexandre Courbot5be5a152014-10-27 18:11:52 +09001281 if (nvbo->pin_refcnt)
1282 NV_WARN(drm, "Moving pinned object %p!\n", nvbo);
1283
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001284 if (drm->device.info.family < NV_DEVICE_INFO_V0_TESLA) {
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001285 ret = nouveau_bo_vm_bind(bo, new_mem, &new_tile);
1286 if (ret)
1287 return ret;
1288 }
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001289
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001290 /* Fake bo copy. */
Ben Skeggs6ee73862009-12-11 19:24:15 +10001291 if (old_mem->mem_type == TTM_PL_SYSTEM && !bo->ttm) {
1292 BUG_ON(bo->mem.mm_node != NULL);
1293 bo->mem = *new_mem;
1294 new_mem->mm_node = NULL;
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001295 goto out;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001296 }
1297
Ben Skeggscef9e992013-11-22 10:52:54 +10001298 /* Hardware assisted copy. */
1299 if (drm->ttm.move) {
1300 if (new_mem->mem_type == TTM_PL_SYSTEM)
1301 ret = nouveau_bo_move_flipd(bo, evict, intr,
1302 no_wait_gpu, new_mem);
1303 else if (old_mem->mem_type == TTM_PL_SYSTEM)
1304 ret = nouveau_bo_move_flips(bo, evict, intr,
1305 no_wait_gpu, new_mem);
1306 else
1307 ret = nouveau_bo_move_m2mf(bo, evict, intr,
1308 no_wait_gpu, new_mem);
1309 if (!ret)
1310 goto out;
Ben Skeggsb8a6a802010-08-27 11:55:43 +10001311 }
1312
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001313 /* Fallback to software copy. */
Ben Skeggscef9e992013-11-22 10:52:54 +10001314 ret = ttm_bo_wait(bo, true, intr, no_wait_gpu);
Ben Skeggscef9e992013-11-22 10:52:54 +10001315 if (ret == 0)
1316 ret = ttm_bo_move_memcpy(bo, evict, no_wait_gpu, new_mem);
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001317
1318out:
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001319 if (drm->device.info.family < NV_DEVICE_INFO_V0_TESLA) {
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001320 if (ret)
1321 nouveau_bo_vm_cleanup(bo, NULL, &new_tile);
1322 else
1323 nouveau_bo_vm_cleanup(bo, new_tile, &nvbo->tile);
1324 }
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001325
1326 return ret;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001327}
1328
1329static int
1330nouveau_bo_verify_access(struct ttm_buffer_object *bo, struct file *filp)
1331{
David Herrmannacb46522013-08-25 18:28:59 +02001332 struct nouveau_bo *nvbo = nouveau_bo(bo);
1333
David Herrmann55fb74a2013-10-02 10:15:17 +02001334 return drm_vma_node_verify_access(&nvbo->gem.vma_node, filp);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001335}
1336
Jerome Glissef32f02f2010-04-09 14:39:25 +02001337static int
1338nouveau_ttm_io_mem_reserve(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem)
1339{
1340 struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];
Ben Skeggsebb945a2012-07-20 08:17:34 +10001341 struct nouveau_drm *drm = nouveau_bdev(bdev);
Maarten Lankhorsta5540902013-11-12 13:34:09 +01001342 struct nouveau_mem *node = mem->mm_node;
Ben Skeggsf869ef82010-11-15 11:53:16 +10001343 int ret;
Jerome Glissef32f02f2010-04-09 14:39:25 +02001344
1345 mem->bus.addr = NULL;
1346 mem->bus.offset = 0;
1347 mem->bus.size = mem->num_pages << PAGE_SHIFT;
1348 mem->bus.base = 0;
1349 mem->bus.is_iomem = false;
1350 if (!(man->flags & TTM_MEMTYPE_FLAG_MAPPABLE))
1351 return -EINVAL;
1352 switch (mem->mem_type) {
1353 case TTM_PL_SYSTEM:
1354 /* System memory */
1355 return 0;
1356 case TTM_PL_TT:
1357#if __OS_HAS_AGP
Ben Skeggsebb945a2012-07-20 08:17:34 +10001358 if (drm->agp.stat == ENABLED) {
Ben Skeggsd961db72010-08-05 10:48:18 +10001359 mem->bus.offset = mem->start << PAGE_SHIFT;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001360 mem->bus.base = drm->agp.base;
Ben Skeggs5c13cac2014-08-10 12:39:09 +10001361 mem->bus.is_iomem = !drm->dev->agp->cant_use_aperture;
Jerome Glissef32f02f2010-04-09 14:39:25 +02001362 }
1363#endif
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001364 if (drm->device.info.family < NV_DEVICE_INFO_V0_TESLA || !node->memtype)
Maarten Lankhorsta5540902013-11-12 13:34:09 +01001365 /* untiled */
1366 break;
1367 /* fallthrough, tiled memory */
Jerome Glissef32f02f2010-04-09 14:39:25 +02001368 case TTM_PL_VRAM:
Ben Skeggs3863c9b2012-07-14 19:09:17 +10001369 mem->bus.offset = mem->start << PAGE_SHIFT;
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001370 mem->bus.base = nv_device_resource_start(nvkm_device(&drm->device), 1);
Jerome Glissef32f02f2010-04-09 14:39:25 +02001371 mem->bus.is_iomem = true;
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001372 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA) {
1373 struct nouveau_bar *bar = nvkm_bar(&drm->device);
Ben Skeggs3863c9b2012-07-14 19:09:17 +10001374
Ben Skeggsebb945a2012-07-20 08:17:34 +10001375 ret = bar->umap(bar, node, NV_MEM_ACCESS_RW,
Ben Skeggs3863c9b2012-07-14 19:09:17 +10001376 &node->bar_vma);
1377 if (ret)
1378 return ret;
1379
1380 mem->bus.offset = node->bar_vma.offset;
1381 }
Jerome Glissef32f02f2010-04-09 14:39:25 +02001382 break;
1383 default:
1384 return -EINVAL;
1385 }
1386 return 0;
1387}
1388
1389static void
1390nouveau_ttm_io_mem_free(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem)
1391{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001392 struct nouveau_drm *drm = nouveau_bdev(bdev);
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001393 struct nouveau_bar *bar = nvkm_bar(&drm->device);
Ben Skeggsd5f42392011-02-10 12:22:52 +10001394 struct nouveau_mem *node = mem->mm_node;
Ben Skeggsf869ef82010-11-15 11:53:16 +10001395
Ben Skeggsd5f42392011-02-10 12:22:52 +10001396 if (!node->bar_vma.node)
Ben Skeggsf869ef82010-11-15 11:53:16 +10001397 return;
1398
Ben Skeggsebb945a2012-07-20 08:17:34 +10001399 bar->unmap(bar, &node->bar_vma);
Jerome Glissef32f02f2010-04-09 14:39:25 +02001400}
1401
1402static int
1403nouveau_ttm_fault_reserve_notify(struct ttm_buffer_object *bo)
1404{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001405 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
Ben Skeggse1429b42010-09-10 11:12:25 +10001406 struct nouveau_bo *nvbo = nouveau_bo(bo);
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001407 struct nvif_device *device = &drm->device;
1408 u32 mappable = nv_device_resource_len(nvkm_device(device), 1) >> PAGE_SHIFT;
Christian Königf1217ed2014-08-27 13:16:04 +02001409 int i, ret;
Ben Skeggse1429b42010-09-10 11:12:25 +10001410
1411 /* as long as the bo isn't in vram, and isn't tiled, we've got
1412 * nothing to do here.
1413 */
1414 if (bo->mem.mem_type != TTM_PL_VRAM) {
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001415 if (drm->device.info.family < NV_DEVICE_INFO_V0_TESLA ||
Francisco Jerezf13b3262010-10-10 06:01:08 +02001416 !nouveau_bo_tile_layout(nvbo))
Ben Skeggse1429b42010-09-10 11:12:25 +10001417 return 0;
Maarten Lankhorsta5540902013-11-12 13:34:09 +01001418
1419 if (bo->mem.mem_type == TTM_PL_SYSTEM) {
1420 nouveau_bo_placement_set(nvbo, TTM_PL_TT, 0);
1421
1422 ret = nouveau_bo_validate(nvbo, false, false);
1423 if (ret)
1424 return ret;
1425 }
1426 return 0;
Ben Skeggse1429b42010-09-10 11:12:25 +10001427 }
1428
1429 /* make sure bo is in mappable vram */
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001430 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA ||
Maarten Lankhorsta5540902013-11-12 13:34:09 +01001431 bo->mem.start + bo->mem.num_pages < mappable)
Ben Skeggse1429b42010-09-10 11:12:25 +10001432 return 0;
1433
Christian Königf1217ed2014-08-27 13:16:04 +02001434 for (i = 0; i < nvbo->placement.num_placement; ++i) {
1435 nvbo->placements[i].fpfn = 0;
1436 nvbo->placements[i].lpfn = mappable;
1437 }
Ben Skeggse1429b42010-09-10 11:12:25 +10001438
Christian Königf1217ed2014-08-27 13:16:04 +02001439 for (i = 0; i < nvbo->placement.num_busy_placement; ++i) {
1440 nvbo->busy_placements[i].fpfn = 0;
1441 nvbo->busy_placements[i].lpfn = mappable;
1442 }
1443
Dave Airliec2848152012-05-18 15:31:12 +01001444 nouveau_bo_placement_set(nvbo, TTM_PL_FLAG_VRAM, 0);
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001445 return nouveau_bo_validate(nvbo, false, false);
Jerome Glissef32f02f2010-04-09 14:39:25 +02001446}
1447
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001448static int
1449nouveau_ttm_tt_populate(struct ttm_tt *ttm)
1450{
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001451 struct ttm_dma_tt *ttm_dma = (void *)ttm;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001452 struct nouveau_drm *drm;
Alexandre Courbot420b9462014-02-17 15:17:26 +09001453 struct nouveau_device *device;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001454 struct drm_device *dev;
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001455 struct device *pdev;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001456 unsigned i;
1457 int r;
Dave Airlie22b33e82012-04-02 11:53:06 +01001458 bool slave = !!(ttm->page_flags & TTM_PAGE_FLAG_SG);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001459
1460 if (ttm->state != tt_unpopulated)
1461 return 0;
1462
Dave Airlie22b33e82012-04-02 11:53:06 +01001463 if (slave && ttm->sg) {
1464 /* make userspace faulting work */
1465 drm_prime_sg_to_page_addr_arrays(ttm->sg, ttm->pages,
1466 ttm_dma->dma_address, ttm->num_pages);
1467 ttm->state = tt_unbound;
1468 return 0;
1469 }
1470
Ben Skeggsebb945a2012-07-20 08:17:34 +10001471 drm = nouveau_bdev(ttm->bdev);
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001472 device = nvkm_device(&drm->device);
Ben Skeggsebb945a2012-07-20 08:17:34 +10001473 dev = drm->dev;
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001474 pdev = nv_device_base(device);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001475
Alexandre Courbotc3a0c772014-10-27 18:49:17 +09001476 /*
1477 * Objects matching this condition have been marked as force_coherent,
1478 * so use the DMA API for them.
1479 */
1480 if (!nv_device_is_cpu_coherent(device) &&
1481 ttm->caching_state == tt_uncached)
1482 return ttm_dma_populate(ttm_dma, dev->dev);
1483
Jerome Glissedea7e0a2012-01-03 17:37:37 -05001484#if __OS_HAS_AGP
Ben Skeggsebb945a2012-07-20 08:17:34 +10001485 if (drm->agp.stat == ENABLED) {
Jerome Glissedea7e0a2012-01-03 17:37:37 -05001486 return ttm_agp_tt_populate(ttm);
1487 }
1488#endif
1489
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001490#ifdef CONFIG_SWIOTLB
1491 if (swiotlb_nr_tbl()) {
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001492 return ttm_dma_populate((void *)ttm, dev->dev);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001493 }
1494#endif
1495
1496 r = ttm_pool_populate(ttm);
1497 if (r) {
1498 return r;
1499 }
1500
1501 for (i = 0; i < ttm->num_pages; i++) {
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001502 dma_addr_t addr;
1503
1504 addr = dma_map_page(pdev, ttm->pages[i], 0, PAGE_SIZE,
1505 DMA_BIDIRECTIONAL);
1506
1507 if (dma_mapping_error(pdev, addr)) {
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001508 while (--i) {
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001509 dma_unmap_page(pdev, ttm_dma->dma_address[i],
1510 PAGE_SIZE, DMA_BIDIRECTIONAL);
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001511 ttm_dma->dma_address[i] = 0;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001512 }
1513 ttm_pool_unpopulate(ttm);
1514 return -EFAULT;
1515 }
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001516
1517 ttm_dma->dma_address[i] = addr;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001518 }
1519 return 0;
1520}
1521
1522static void
1523nouveau_ttm_tt_unpopulate(struct ttm_tt *ttm)
1524{
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001525 struct ttm_dma_tt *ttm_dma = (void *)ttm;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001526 struct nouveau_drm *drm;
Alexandre Courbot420b9462014-02-17 15:17:26 +09001527 struct nouveau_device *device;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001528 struct drm_device *dev;
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001529 struct device *pdev;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001530 unsigned i;
Dave Airlie22b33e82012-04-02 11:53:06 +01001531 bool slave = !!(ttm->page_flags & TTM_PAGE_FLAG_SG);
1532
1533 if (slave)
1534 return;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001535
Ben Skeggsebb945a2012-07-20 08:17:34 +10001536 drm = nouveau_bdev(ttm->bdev);
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001537 device = nvkm_device(&drm->device);
Ben Skeggsebb945a2012-07-20 08:17:34 +10001538 dev = drm->dev;
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001539 pdev = nv_device_base(device);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001540
Alexandre Courbotc3a0c772014-10-27 18:49:17 +09001541 /*
1542 * Objects matching this condition have been marked as force_coherent,
1543 * so use the DMA API for them.
1544 */
1545 if (!nv_device_is_cpu_coherent(device) &&
1546 ttm->caching_state == tt_uncached)
1547 ttm_dma_unpopulate(ttm_dma, dev->dev);
1548
Jerome Glissedea7e0a2012-01-03 17:37:37 -05001549#if __OS_HAS_AGP
Ben Skeggsebb945a2012-07-20 08:17:34 +10001550 if (drm->agp.stat == ENABLED) {
Jerome Glissedea7e0a2012-01-03 17:37:37 -05001551 ttm_agp_tt_unpopulate(ttm);
1552 return;
1553 }
1554#endif
1555
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001556#ifdef CONFIG_SWIOTLB
1557 if (swiotlb_nr_tbl()) {
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001558 ttm_dma_unpopulate((void *)ttm, dev->dev);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001559 return;
1560 }
1561#endif
1562
1563 for (i = 0; i < ttm->num_pages; i++) {
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001564 if (ttm_dma->dma_address[i]) {
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001565 dma_unmap_page(pdev, ttm_dma->dma_address[i], PAGE_SIZE,
1566 DMA_BIDIRECTIONAL);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001567 }
1568 }
1569
1570 ttm_pool_unpopulate(ttm);
1571}
1572
Maarten Lankhorstdd7cfd62014-01-21 13:07:31 +01001573void
Maarten Lankhorst809e9442014-04-09 16:19:30 +02001574nouveau_bo_fence(struct nouveau_bo *nvbo, struct nouveau_fence *fence, bool exclusive)
Maarten Lankhorstdd7cfd62014-01-21 13:07:31 +01001575{
Maarten Lankhorst29ba89b2014-01-09 11:03:11 +01001576 struct reservation_object *resv = nvbo->bo.resv;
Maarten Lankhorstdd7cfd62014-01-21 13:07:31 +01001577
Maarten Lankhorst809e9442014-04-09 16:19:30 +02001578 if (exclusive)
1579 reservation_object_add_excl_fence(resv, &fence->base);
1580 else if (fence)
1581 reservation_object_add_shared_fence(resv, &fence->base);
Maarten Lankhorstdd7cfd62014-01-21 13:07:31 +01001582}
1583
Ben Skeggs6ee73862009-12-11 19:24:15 +10001584struct ttm_bo_driver nouveau_bo_driver = {
Jerome Glisse649bf3c2011-11-01 20:46:13 -04001585 .ttm_tt_create = &nouveau_ttm_tt_create,
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001586 .ttm_tt_populate = &nouveau_ttm_tt_populate,
1587 .ttm_tt_unpopulate = &nouveau_ttm_tt_unpopulate,
Ben Skeggs6ee73862009-12-11 19:24:15 +10001588 .invalidate_caches = nouveau_bo_invalidate_caches,
1589 .init_mem_type = nouveau_bo_init_mem_type,
1590 .evict_flags = nouveau_bo_evict_flags,
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001591 .move_notify = nouveau_bo_move_ntfy,
Ben Skeggs6ee73862009-12-11 19:24:15 +10001592 .move = nouveau_bo_move,
1593 .verify_access = nouveau_bo_verify_access,
Jerome Glissef32f02f2010-04-09 14:39:25 +02001594 .fault_reserve_notify = &nouveau_ttm_fault_reserve_notify,
1595 .io_mem_reserve = &nouveau_ttm_io_mem_reserve,
1596 .io_mem_free = &nouveau_ttm_io_mem_free,
Ben Skeggs6ee73862009-12-11 19:24:15 +10001597};
1598
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001599struct nouveau_vma *
1600nouveau_bo_vma_find(struct nouveau_bo *nvbo, struct nouveau_vm *vm)
1601{
1602 struct nouveau_vma *vma;
1603 list_for_each_entry(vma, &nvbo->vma_list, head) {
1604 if (vma->vm == vm)
1605 return vma;
1606 }
1607
1608 return NULL;
1609}
1610
1611int
1612nouveau_bo_vma_add(struct nouveau_bo *nvbo, struct nouveau_vm *vm,
1613 struct nouveau_vma *vma)
1614{
1615 const u32 size = nvbo->bo.mem.num_pages << PAGE_SHIFT;
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001616 int ret;
1617
1618 ret = nouveau_vm_get(vm, size, nvbo->page_shift,
1619 NV_MEM_ACCESS_RW, vma);
1620 if (ret)
1621 return ret;
1622
Ben Skeggs2e2cfbe2013-11-15 11:56:49 +10001623 if ( nvbo->bo.mem.mem_type != TTM_PL_SYSTEM &&
1624 (nvbo->bo.mem.mem_type == TTM_PL_VRAM ||
1625 nvbo->page_shift != vma->vm->vmm->lpg_shift))
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001626 nouveau_vm_map(vma, nvbo->bo.mem.mm_node);
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001627
1628 list_add_tail(&vma->head, &nvbo->vma_list);
Ben Skeggs2fd3db62011-06-07 15:25:12 +10001629 vma->refcount = 1;
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001630 return 0;
1631}
1632
1633void
1634nouveau_bo_vma_del(struct nouveau_bo *nvbo, struct nouveau_vma *vma)
1635{
1636 if (vma->node) {
Ben Skeggsc4c70442013-05-07 09:48:30 +10001637 if (nvbo->bo.mem.mem_type != TTM_PL_SYSTEM)
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001638 nouveau_vm_unmap(vma);
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001639 nouveau_vm_put(vma);
1640 list_del(&vma->head);
1641 }
1642}