blob: 77326e344dadaf07720afb30c827d964454e7520 [file] [log] [blame]
Ben Skeggs6ee73862009-12-11 19:24:15 +10001/*
2 * Copyright 2007 Dave Airlied
3 * All Rights Reserved.
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * VA LINUX SYSTEMS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
20 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
21 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
22 * OTHER DEALINGS IN THE SOFTWARE.
23 */
24/*
25 * Authors: Dave Airlied <airlied@linux.ie>
26 * Ben Skeggs <darktama@iinet.net.au>
27 * Jeremy Kolb <jkolb@brandeis.edu>
28 */
29
Ben Skeggsfdb751e2014-08-10 04:10:23 +100030#include <linux/dma-mapping.h>
Chris Metcalf3e2b7562013-02-01 13:44:33 -050031#include <linux/swiotlb.h>
Ben Skeggs6ee73862009-12-11 19:24:15 +100032
Ben Skeggsebb945a2012-07-20 08:17:34 +100033#include "nouveau_drm.h"
Ben Skeggs6ee73862009-12-11 19:24:15 +100034#include "nouveau_dma.h"
Ben Skeggsd375e7d52012-04-30 13:30:00 +100035#include "nouveau_fence.h"
Ben Skeggs6ee73862009-12-11 19:24:15 +100036
Ben Skeggsebb945a2012-07-20 08:17:34 +100037#include "nouveau_bo.h"
38#include "nouveau_ttm.h"
39#include "nouveau_gem.h"
Maarten Maathuisa5106042009-12-26 21:46:36 +010040
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100041/*
42 * NV10-NV40 tiling helpers
43 */
44
45static void
Ben Skeggsebb945a2012-07-20 08:17:34 +100046nv10_bo_update_tile_region(struct drm_device *dev, struct nouveau_drm_tile *reg,
47 u32 addr, u32 size, u32 pitch, u32 flags)
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100048{
Ben Skeggs77145f12012-07-31 16:16:21 +100049 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggsebb945a2012-07-20 08:17:34 +100050 int i = reg - drm->tile.reg;
Ben Skeggsbe83cd42015-01-14 15:36:34 +100051 struct nvkm_fb *pfb = nvxx_fb(&drm->device);
52 struct nvkm_fb_tile *tile = &pfb->tile.region[i];
53 struct nvkm_engine *engine;
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100054
Ben Skeggsebb945a2012-07-20 08:17:34 +100055 nouveau_fence_unref(&reg->fence);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100056
57 if (tile->pitch)
Ben Skeggsebb945a2012-07-20 08:17:34 +100058 pfb->tile.fini(pfb, i, tile);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100059
60 if (pitch)
Ben Skeggsebb945a2012-07-20 08:17:34 +100061 pfb->tile.init(pfb, i, addr, size, pitch, flags, tile);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100062
Ben Skeggsebb945a2012-07-20 08:17:34 +100063 pfb->tile.prog(pfb, i, tile);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100064
Ben Skeggsbe83cd42015-01-14 15:36:34 +100065 if ((engine = nvkm_engine(pfb, NVDEV_ENGINE_GR)))
Ben Skeggsebb945a2012-07-20 08:17:34 +100066 engine->tile_prog(engine, i);
Ben Skeggsbe83cd42015-01-14 15:36:34 +100067 if ((engine = nvkm_engine(pfb, NVDEV_ENGINE_MPEG)))
Ben Skeggsebb945a2012-07-20 08:17:34 +100068 engine->tile_prog(engine, i);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100069}
70
Ben Skeggsebb945a2012-07-20 08:17:34 +100071static struct nouveau_drm_tile *
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100072nv10_bo_get_tile_region(struct drm_device *dev, int i)
73{
Ben Skeggs77145f12012-07-31 16:16:21 +100074 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggsebb945a2012-07-20 08:17:34 +100075 struct nouveau_drm_tile *tile = &drm->tile.reg[i];
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100076
Ben Skeggsebb945a2012-07-20 08:17:34 +100077 spin_lock(&drm->tile.lock);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100078
79 if (!tile->used &&
80 (!tile->fence || nouveau_fence_done(tile->fence)))
81 tile->used = true;
82 else
83 tile = NULL;
84
Ben Skeggsebb945a2012-07-20 08:17:34 +100085 spin_unlock(&drm->tile.lock);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100086 return tile;
87}
88
89static void
Ben Skeggsebb945a2012-07-20 08:17:34 +100090nv10_bo_put_tile_region(struct drm_device *dev, struct nouveau_drm_tile *tile,
Maarten Lankhorstf2c24b82014-04-02 17:14:48 +020091 struct fence *fence)
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100092{
Ben Skeggs77145f12012-07-31 16:16:21 +100093 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100094
95 if (tile) {
Ben Skeggsebb945a2012-07-20 08:17:34 +100096 spin_lock(&drm->tile.lock);
Maarten Lankhorst809e9442014-04-09 16:19:30 +020097 tile->fence = (struct nouveau_fence *)fence_get(fence);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +100098 tile->used = false;
Ben Skeggsebb945a2012-07-20 08:17:34 +100099 spin_unlock(&drm->tile.lock);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000100 }
101}
102
Ben Skeggsebb945a2012-07-20 08:17:34 +1000103static struct nouveau_drm_tile *
104nv10_bo_set_tiling(struct drm_device *dev, u32 addr,
105 u32 size, u32 pitch, u32 flags)
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000106{
Ben Skeggs77145f12012-07-31 16:16:21 +1000107 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000108 struct nvkm_fb *pfb = nvxx_fb(&drm->device);
Ben Skeggsebb945a2012-07-20 08:17:34 +1000109 struct nouveau_drm_tile *tile, *found = NULL;
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000110 int i;
111
Ben Skeggsebb945a2012-07-20 08:17:34 +1000112 for (i = 0; i < pfb->tile.regions; i++) {
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000113 tile = nv10_bo_get_tile_region(dev, i);
114
115 if (pitch && !found) {
116 found = tile;
117 continue;
118
Ben Skeggsebb945a2012-07-20 08:17:34 +1000119 } else if (tile && pfb->tile.region[i].pitch) {
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000120 /* Kill an unused tile region. */
121 nv10_bo_update_tile_region(dev, tile, 0, 0, 0, 0);
122 }
123
124 nv10_bo_put_tile_region(dev, tile, NULL);
125 }
126
127 if (found)
128 nv10_bo_update_tile_region(dev, found, addr, size,
129 pitch, flags);
130 return found;
131}
132
Ben Skeggs6ee73862009-12-11 19:24:15 +1000133static void
134nouveau_bo_del_ttm(struct ttm_buffer_object *bo)
135{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000136 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
137 struct drm_device *dev = drm->dev;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000138 struct nouveau_bo *nvbo = nouveau_bo(bo);
139
David Herrmann55fb74a2013-10-02 10:15:17 +0200140 if (unlikely(nvbo->gem.filp))
Ben Skeggs6ee73862009-12-11 19:24:15 +1000141 DRM_ERROR("bo %p still attached to GEM object\n", bo);
Maarten Lankhorst4f385592013-07-07 10:37:35 +0200142 WARN_ON(nvbo->pin_refcnt > 0);
Ben Skeggsbc9e7b92012-07-19 17:54:21 +1000143 nv10_bo_put_tile_region(dev, nvbo->tile, NULL);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000144 kfree(nvbo);
145}
146
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100147static void
Ben Skeggsdb5c8e22011-02-10 13:41:01 +1000148nouveau_bo_fixup_align(struct nouveau_bo *nvbo, u32 flags,
Ben Skeggsf91bac52011-06-06 14:15:46 +1000149 int *align, int *size)
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100150{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000151 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000152 struct nvif_device *device = &drm->device;
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100153
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000154 if (device->info.family < NV_DEVICE_INFO_V0_TESLA) {
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000155 if (nvbo->tile_mode) {
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000156 if (device->info.chipset >= 0x40) {
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100157 *align = 65536;
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000158 *size = roundup(*size, 64 * nvbo->tile_mode);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100159
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000160 } else if (device->info.chipset >= 0x30) {
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100161 *align = 32768;
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000162 *size = roundup(*size, 64 * nvbo->tile_mode);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100163
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000164 } else if (device->info.chipset >= 0x20) {
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100165 *align = 16384;
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000166 *size = roundup(*size, 64 * nvbo->tile_mode);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100167
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000168 } else if (device->info.chipset >= 0x10) {
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100169 *align = 16384;
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000170 *size = roundup(*size, 32 * nvbo->tile_mode);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100171 }
172 }
Ben Skeggsbfd83ac2010-11-12 15:12:51 +1000173 } else {
Ben Skeggsf91bac52011-06-06 14:15:46 +1000174 *size = roundup(*size, (1 << nvbo->page_shift));
175 *align = max((1 << nvbo->page_shift), *align);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100176 }
177
Maarten Maathuis1c7059e2009-12-25 18:51:17 +0100178 *size = roundup(*size, PAGE_SIZE);
Francisco Jereza0af9ad2009-12-11 16:51:09 +0100179}
180
Ben Skeggs6ee73862009-12-11 19:24:15 +1000181int
Ben Skeggs7375c952011-06-07 14:21:29 +1000182nouveau_bo_new(struct drm_device *dev, int size, int align,
183 uint32_t flags, uint32_t tile_mode, uint32_t tile_flags,
Maarten Lankhorstbb6178b2014-01-09 11:03:15 +0100184 struct sg_table *sg, struct reservation_object *robj,
Ben Skeggs7375c952011-06-07 14:21:29 +1000185 struct nouveau_bo **pnvbo)
Ben Skeggs6ee73862009-12-11 19:24:15 +1000186{
Ben Skeggs77145f12012-07-31 16:16:21 +1000187 struct nouveau_drm *drm = nouveau_drm(dev);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000188 struct nouveau_bo *nvbo;
Jerome Glisse57de4ba2011-11-11 15:42:57 -0500189 size_t acc_size;
Ben Skeggsf91bac52011-06-06 14:15:46 +1000190 int ret;
Dave Airlie22b33e82012-04-02 11:53:06 +0100191 int type = ttm_bo_type_device;
Maarten Lankhorst35095f72013-07-27 10:17:12 +0200192 int lpg_shift = 12;
193 int max_size;
194
Ben Skeggs3ee6f5b2014-08-10 04:10:20 +1000195 if (drm->client.vm)
Ben Skeggs5ce3bf32015-01-14 09:57:36 +1000196 lpg_shift = drm->client.vm->mmu->lpg_shift;
Maarten Lankhorst35095f72013-07-27 10:17:12 +0200197 max_size = INT_MAX & ~((1 << lpg_shift) - 1);
Maarten Lankhorst0108bc82013-07-07 10:40:19 +0200198
199 if (size <= 0 || size > max_size) {
Ben Skeggsfa2bade2014-08-10 04:10:22 +1000200 NV_WARN(drm, "skipped size %x\n", (u32)size);
Maarten Lankhorst0108bc82013-07-07 10:40:19 +0200201 return -EINVAL;
202 }
Dave Airlie22b33e82012-04-02 11:53:06 +0100203
204 if (sg)
205 type = ttm_bo_type_sg;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000206
207 nvbo = kzalloc(sizeof(struct nouveau_bo), GFP_KERNEL);
208 if (!nvbo)
209 return -ENOMEM;
210 INIT_LIST_HEAD(&nvbo->head);
211 INIT_LIST_HEAD(&nvbo->entry);
Ben Skeggsfd2871a2011-06-06 14:07:04 +1000212 INIT_LIST_HEAD(&nvbo->vma_list);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000213 nvbo->tile_mode = tile_mode;
214 nvbo->tile_flags = tile_flags;
Ben Skeggsebb945a2012-07-20 08:17:34 +1000215 nvbo->bo.bdev = &drm->ttm.bdev;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000216
Ben Skeggs989aa5b2015-01-12 12:33:37 +1000217 if (!nv_device_is_cpu_coherent(nvxx_device(&drm->device)))
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900218 nvbo->force_coherent = flags & TTM_PL_FLAG_UNCACHED;
219
Ben Skeggsf91bac52011-06-06 14:15:46 +1000220 nvbo->page_shift = 12;
Ben Skeggs3ee6f5b2014-08-10 04:10:20 +1000221 if (drm->client.vm) {
Ben Skeggsf91bac52011-06-06 14:15:46 +1000222 if (!(flags & TTM_PL_FLAG_TT) && size > 256 * 1024)
Ben Skeggs5ce3bf32015-01-14 09:57:36 +1000223 nvbo->page_shift = drm->client.vm->mmu->lpg_shift;
Ben Skeggsf91bac52011-06-06 14:15:46 +1000224 }
225
226 nouveau_bo_fixup_align(nvbo, flags, &align, &size);
Ben Skeggsfd2871a2011-06-06 14:07:04 +1000227 nvbo->bo.mem.num_pages = size >> PAGE_SHIFT;
228 nouveau_bo_placement_set(nvbo, flags, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000229
Ben Skeggsebb945a2012-07-20 08:17:34 +1000230 acc_size = ttm_bo_dma_acc_size(&drm->ttm.bdev, size,
Jerome Glisse57de4ba2011-11-11 15:42:57 -0500231 sizeof(struct nouveau_bo));
232
Ben Skeggsebb945a2012-07-20 08:17:34 +1000233 ret = ttm_bo_init(&drm->ttm.bdev, &nvbo->bo, size,
Dave Airlie22b33e82012-04-02 11:53:06 +0100234 type, &nvbo->placement,
Marcin Slusarz0b91c4a2012-11-06 21:49:51 +0000235 align >> PAGE_SHIFT, false, NULL, acc_size, sg,
Maarten Lankhorstbb6178b2014-01-09 11:03:15 +0100236 robj, nouveau_bo_del_ttm);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000237 if (ret) {
238 /* ttm will call nouveau_bo_del_ttm if it fails.. */
239 return ret;
240 }
241
Ben Skeggs6ee73862009-12-11 19:24:15 +1000242 *pnvbo = nvbo;
243 return 0;
244}
245
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100246static void
Christian Königf1217ed2014-08-27 13:16:04 +0200247set_placement_list(struct ttm_place *pl, unsigned *n, uint32_t type, uint32_t flags)
Ben Skeggs6ee73862009-12-11 19:24:15 +1000248{
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100249 *n = 0;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000250
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100251 if (type & TTM_PL_FLAG_VRAM)
Christian Königf1217ed2014-08-27 13:16:04 +0200252 pl[(*n)++].flags = TTM_PL_FLAG_VRAM | flags;
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100253 if (type & TTM_PL_FLAG_TT)
Christian Königf1217ed2014-08-27 13:16:04 +0200254 pl[(*n)++].flags = TTM_PL_FLAG_TT | flags;
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100255 if (type & TTM_PL_FLAG_SYSTEM)
Christian Königf1217ed2014-08-27 13:16:04 +0200256 pl[(*n)++].flags = TTM_PL_FLAG_SYSTEM | flags;
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100257}
Ben Skeggs37cb3e082009-12-16 16:22:42 +1000258
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200259static void
260set_placement_range(struct nouveau_bo *nvbo, uint32_t type)
261{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000262 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggsf392ec42014-08-10 04:10:28 +1000263 u32 vram_pages = drm->device.info.ram_size >> PAGE_SHIFT;
Christian Königf1217ed2014-08-27 13:16:04 +0200264 unsigned i, fpfn, lpfn;
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200265
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000266 if (drm->device.info.family == NV_DEVICE_INFO_V0_CELSIUS &&
Francisco Jerez812f2192011-02-03 01:49:33 +0100267 nvbo->tile_mode && (type & TTM_PL_FLAG_VRAM) &&
Francisco Jerez4beb1162011-11-06 21:21:28 +0100268 nvbo->bo.mem.num_pages < vram_pages / 4) {
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200269 /*
270 * Make sure that the color and depth buffers are handled
271 * by independent memory controller units. Up to a 9x
272 * speed up when alpha-blending and depth-test are enabled
273 * at the same time.
274 */
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200275 if (nvbo->tile_flags & NOUVEAU_GEM_TILE_ZETA) {
Christian Königf1217ed2014-08-27 13:16:04 +0200276 fpfn = vram_pages / 2;
277 lpfn = ~0;
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200278 } else {
Christian Königf1217ed2014-08-27 13:16:04 +0200279 fpfn = 0;
280 lpfn = vram_pages / 2;
281 }
282 for (i = 0; i < nvbo->placement.num_placement; ++i) {
283 nvbo->placements[i].fpfn = fpfn;
284 nvbo->placements[i].lpfn = lpfn;
285 }
286 for (i = 0; i < nvbo->placement.num_busy_placement; ++i) {
287 nvbo->busy_placements[i].fpfn = fpfn;
288 nvbo->busy_placements[i].lpfn = lpfn;
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200289 }
290 }
291}
292
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100293void
294nouveau_bo_placement_set(struct nouveau_bo *nvbo, uint32_t type, uint32_t busy)
295{
296 struct ttm_placement *pl = &nvbo->placement;
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900297 uint32_t flags = (nvbo->force_coherent ? TTM_PL_FLAG_UNCACHED :
298 TTM_PL_MASK_CACHING) |
299 (nvbo->pin_refcnt ? TTM_PL_FLAG_NO_EVICT : 0);
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100300
301 pl->placement = nvbo->placements;
302 set_placement_list(nvbo->placements, &pl->num_placement,
303 type, flags);
304
305 pl->busy_placement = nvbo->busy_placements;
306 set_placement_list(nvbo->busy_placements, &pl->num_busy_placement,
307 type | busy, flags);
Francisco Jerez699ddfd2010-10-10 06:07:32 +0200308
309 set_placement_range(nvbo, type);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000310}
311
312int
Ben Skeggsad76b3f2014-11-10 11:24:27 +1000313nouveau_bo_pin(struct nouveau_bo *nvbo, uint32_t memtype, bool contig)
Ben Skeggs6ee73862009-12-11 19:24:15 +1000314{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000315 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000316 struct ttm_buffer_object *bo = &nvbo->bo;
Ben Skeggsad76b3f2014-11-10 11:24:27 +1000317 bool force = false, evict = false;
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100318 int ret;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000319
Thierry Redingee3939e2014-07-21 13:15:51 +0200320 ret = ttm_bo_reserve(bo, false, false, false, NULL);
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100321 if (ret)
Ben Skeggs50ab2e52014-11-10 11:12:17 +1000322 return ret;
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100323
Ben Skeggsad76b3f2014-11-10 11:24:27 +1000324 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA &&
325 memtype == TTM_PL_FLAG_VRAM && contig) {
326 if (nvbo->tile_flags & NOUVEAU_GEM_TILE_NONCONTIG) {
327 if (bo->mem.mem_type == TTM_PL_VRAM) {
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000328 struct nvkm_mem *mem = bo->mem.mm_node;
Ben Skeggsad76b3f2014-11-10 11:24:27 +1000329 if (!list_is_singular(&mem->regions))
330 evict = true;
331 }
332 nvbo->tile_flags &= ~NOUVEAU_GEM_TILE_NONCONTIG;
333 force = true;
334 }
335 }
336
337 if (nvbo->pin_refcnt) {
338 if (!(memtype & (1 << bo->mem.mem_type)) || evict) {
339 NV_ERROR(drm, "bo %p pinned elsewhere: "
340 "0x%08x vs 0x%08x\n", bo,
341 1 << bo->mem.mem_type, memtype);
342 ret = -EBUSY;
343 }
344 nvbo->pin_refcnt++;
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100345 goto out;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000346 }
347
Ben Skeggsad76b3f2014-11-10 11:24:27 +1000348 if (evict) {
349 nouveau_bo_placement_set(nvbo, TTM_PL_FLAG_TT, 0);
350 ret = nouveau_bo_validate(nvbo, false, false);
351 if (ret)
352 goto out;
353 }
Ben Skeggs6ee73862009-12-11 19:24:15 +1000354
Ben Skeggsad76b3f2014-11-10 11:24:27 +1000355 nvbo->pin_refcnt++;
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100356 nouveau_bo_placement_set(nvbo, memtype, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000357
Ben Skeggs50ab2e52014-11-10 11:12:17 +1000358 /* drop pin_refcnt temporarily, so we don't trip the assertion
359 * in nouveau_bo_move() that makes sure we're not trying to
360 * move a pinned buffer
361 */
362 nvbo->pin_refcnt--;
Maarten Lankhorst97a875c2012-11-28 11:25:44 +0000363 ret = nouveau_bo_validate(nvbo, false, false);
Ben Skeggs6aac6ce2014-11-06 14:34:31 +1000364 if (ret)
365 goto out;
Ben Skeggs50ab2e52014-11-10 11:12:17 +1000366 nvbo->pin_refcnt++;
Ben Skeggs6aac6ce2014-11-06 14:34:31 +1000367
368 switch (bo->mem.mem_type) {
369 case TTM_PL_VRAM:
370 drm->gem.vram_available -= bo->mem.size;
371 break;
372 case TTM_PL_TT:
373 drm->gem.gart_available -= bo->mem.size;
374 break;
375 default:
376 break;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000377 }
Alexandre Courbot5be5a152014-10-27 18:11:52 +0900378
Ben Skeggs6ee73862009-12-11 19:24:15 +1000379out:
Ben Skeggsad76b3f2014-11-10 11:24:27 +1000380 if (force && ret)
381 nvbo->tile_flags |= NOUVEAU_GEM_TILE_NONCONTIG;
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100382 ttm_bo_unreserve(bo);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000383 return ret;
384}
385
386int
387nouveau_bo_unpin(struct nouveau_bo *nvbo)
388{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000389 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000390 struct ttm_buffer_object *bo = &nvbo->bo;
Maarten Lankhorst4f385592013-07-07 10:37:35 +0200391 int ret, ref;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000392
Thierry Redingee3939e2014-07-21 13:15:51 +0200393 ret = ttm_bo_reserve(bo, false, false, false, NULL);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000394 if (ret)
395 return ret;
396
Maarten Lankhorst4f385592013-07-07 10:37:35 +0200397 ref = --nvbo->pin_refcnt;
398 WARN_ON_ONCE(ref < 0);
399 if (ref)
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100400 goto out;
401
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100402 nouveau_bo_placement_set(nvbo, bo->mem.placement, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000403
Maarten Lankhorst97a875c2012-11-28 11:25:44 +0000404 ret = nouveau_bo_validate(nvbo, false, false);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000405 if (ret == 0) {
406 switch (bo->mem.mem_type) {
407 case TTM_PL_VRAM:
Ben Skeggsebb945a2012-07-20 08:17:34 +1000408 drm->gem.vram_available += bo->mem.size;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000409 break;
410 case TTM_PL_TT:
Ben Skeggsebb945a2012-07-20 08:17:34 +1000411 drm->gem.gart_available += bo->mem.size;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000412 break;
413 default:
414 break;
415 }
416 }
417
Daniel Vetter0ae6d7b2012-12-11 21:52:30 +0100418out:
Ben Skeggs6ee73862009-12-11 19:24:15 +1000419 ttm_bo_unreserve(bo);
420 return ret;
421}
422
423int
424nouveau_bo_map(struct nouveau_bo *nvbo)
425{
426 int ret;
427
Thierry Redingee3939e2014-07-21 13:15:51 +0200428 ret = ttm_bo_reserve(&nvbo->bo, false, false, false, NULL);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000429 if (ret)
430 return ret;
431
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900432 /*
433 * TTM buffers allocated using the DMA API already have a mapping, let's
434 * use it instead.
435 */
436 if (!nvbo->force_coherent)
437 ret = ttm_bo_kmap(&nvbo->bo, 0, nvbo->bo.mem.num_pages,
438 &nvbo->kmap);
439
Ben Skeggs6ee73862009-12-11 19:24:15 +1000440 ttm_bo_unreserve(&nvbo->bo);
441 return ret;
442}
443
444void
445nouveau_bo_unmap(struct nouveau_bo *nvbo)
446{
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900447 if (!nvbo)
448 return;
449
450 /*
451 * TTM buffers allocated using the DMA API already had a coherent
452 * mapping which we used, no need to unmap.
453 */
454 if (!nvbo->force_coherent)
Ben Skeggs9d59e8a2010-08-27 13:04:41 +1000455 ttm_bo_kunmap(&nvbo->kmap);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000456}
457
Alexandre Courbotb22870b2014-10-27 18:49:19 +0900458void
459nouveau_bo_sync_for_device(struct nouveau_bo *nvbo)
460{
461 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000462 struct nvkm_device *device = nvxx_device(&drm->device);
Alexandre Courbotb22870b2014-10-27 18:49:19 +0900463 struct ttm_dma_tt *ttm_dma = (struct ttm_dma_tt *)nvbo->bo.ttm;
464 int i;
465
466 if (!ttm_dma)
467 return;
468
469 /* Don't waste time looping if the object is coherent */
470 if (nvbo->force_coherent)
471 return;
472
473 for (i = 0; i < ttm_dma->ttm.num_pages; i++)
474 dma_sync_single_for_device(nv_device_base(device),
475 ttm_dma->dma_address[i], PAGE_SIZE, DMA_TO_DEVICE);
476}
477
478void
479nouveau_bo_sync_for_cpu(struct nouveau_bo *nvbo)
480{
481 struct nouveau_drm *drm = nouveau_bdev(nvbo->bo.bdev);
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000482 struct nvkm_device *device = nvxx_device(&drm->device);
Alexandre Courbotb22870b2014-10-27 18:49:19 +0900483 struct ttm_dma_tt *ttm_dma = (struct ttm_dma_tt *)nvbo->bo.ttm;
484 int i;
485
486 if (!ttm_dma)
487 return;
488
489 /* Don't waste time looping if the object is coherent */
490 if (nvbo->force_coherent)
491 return;
492
493 for (i = 0; i < ttm_dma->ttm.num_pages; i++)
494 dma_sync_single_for_cpu(nv_device_base(device),
495 ttm_dma->dma_address[i], PAGE_SIZE, DMA_FROM_DEVICE);
496}
497
Ben Skeggs7a45d762010-11-22 08:50:27 +1000498int
499nouveau_bo_validate(struct nouveau_bo *nvbo, bool interruptible,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +0000500 bool no_wait_gpu)
Ben Skeggs7a45d762010-11-22 08:50:27 +1000501{
502 int ret;
503
Maarten Lankhorst97a875c2012-11-28 11:25:44 +0000504 ret = ttm_bo_validate(&nvbo->bo, &nvbo->placement,
505 interruptible, no_wait_gpu);
Ben Skeggs7a45d762010-11-22 08:50:27 +1000506 if (ret)
507 return ret;
508
Alexandre Courbotb22870b2014-10-27 18:49:19 +0900509 nouveau_bo_sync_for_device(nvbo);
510
Ben Skeggs7a45d762010-11-22 08:50:27 +1000511 return 0;
512}
513
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900514static inline void *
515_nouveau_bo_mem_index(struct nouveau_bo *nvbo, unsigned index, void *mem, u8 sz)
516{
517 struct ttm_dma_tt *dma_tt;
518 u8 *m = mem;
519
520 index *= sz;
521
522 if (m) {
523 /* kmap'd address, return the corresponding offset */
524 m += index;
525 } else {
526 /* DMA-API mapping, lookup the right address */
527 dma_tt = (struct ttm_dma_tt *)nvbo->bo.ttm;
528 m = dma_tt->cpu_address[index / PAGE_SIZE];
529 m += index % PAGE_SIZE;
530 }
531
532 return m;
533}
534#define nouveau_bo_mem_index(o, i, m) _nouveau_bo_mem_index(o, i, m, sizeof(*m))
535
Ben Skeggs6ee73862009-12-11 19:24:15 +1000536void
537nouveau_bo_wr16(struct nouveau_bo *nvbo, unsigned index, u16 val)
538{
539 bool is_iomem;
540 u16 *mem = ttm_kmap_obj_virtual(&nvbo->kmap, &is_iomem);
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900541
542 mem = nouveau_bo_mem_index(nvbo, index, mem);
543
Ben Skeggs6ee73862009-12-11 19:24:15 +1000544 if (is_iomem)
545 iowrite16_native(val, (void __force __iomem *)mem);
546 else
547 *mem = val;
548}
549
550u32
551nouveau_bo_rd32(struct nouveau_bo *nvbo, unsigned index)
552{
553 bool is_iomem;
554 u32 *mem = ttm_kmap_obj_virtual(&nvbo->kmap, &is_iomem);
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900555
556 mem = nouveau_bo_mem_index(nvbo, index, mem);
557
Ben Skeggs6ee73862009-12-11 19:24:15 +1000558 if (is_iomem)
559 return ioread32_native((void __force __iomem *)mem);
560 else
561 return *mem;
562}
563
564void
565nouveau_bo_wr32(struct nouveau_bo *nvbo, unsigned index, u32 val)
566{
567 bool is_iomem;
568 u32 *mem = ttm_kmap_obj_virtual(&nvbo->kmap, &is_iomem);
Alexandre Courbotc3a0c772014-10-27 18:49:17 +0900569
570 mem = nouveau_bo_mem_index(nvbo, index, mem);
571
Ben Skeggs6ee73862009-12-11 19:24:15 +1000572 if (is_iomem)
573 iowrite32_native(val, (void __force __iomem *)mem);
574 else
575 *mem = val;
576}
577
Jerome Glisse649bf3c2011-11-01 20:46:13 -0400578static struct ttm_tt *
Ben Skeggsebb945a2012-07-20 08:17:34 +1000579nouveau_ttm_tt_create(struct ttm_bo_device *bdev, unsigned long size,
580 uint32_t page_flags, struct page *dummy_read)
Ben Skeggs6ee73862009-12-11 19:24:15 +1000581{
Max Filippovdf1b4b92012-10-14 01:58:26 +0400582#if __OS_HAS_AGP
Ben Skeggsebb945a2012-07-20 08:17:34 +1000583 struct nouveau_drm *drm = nouveau_bdev(bdev);
584 struct drm_device *dev = drm->dev;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000585
Ben Skeggsebb945a2012-07-20 08:17:34 +1000586 if (drm->agp.stat == ENABLED) {
587 return ttm_agp_tt_create(bdev, dev->agp->bridge, size,
588 page_flags, dummy_read);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000589 }
Max Filippovdf1b4b92012-10-14 01:58:26 +0400590#endif
Ben Skeggs6ee73862009-12-11 19:24:15 +1000591
Ben Skeggsebb945a2012-07-20 08:17:34 +1000592 return nouveau_sgdma_create_ttm(bdev, size, page_flags, dummy_read);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000593}
594
595static int
596nouveau_bo_invalidate_caches(struct ttm_bo_device *bdev, uint32_t flags)
597{
598 /* We'll do this from user space. */
599 return 0;
600}
601
602static int
603nouveau_bo_init_mem_type(struct ttm_bo_device *bdev, uint32_t type,
604 struct ttm_mem_type_manager *man)
605{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000606 struct nouveau_drm *drm = nouveau_bdev(bdev);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000607
608 switch (type) {
609 case TTM_PL_SYSTEM:
610 man->flags = TTM_MEMTYPE_FLAG_MAPPABLE;
611 man->available_caching = TTM_PL_MASK_CACHING;
612 man->default_caching = TTM_PL_FLAG_CACHED;
613 break;
614 case TTM_PL_VRAM:
Alexandre Courbote2a4e782014-06-27 19:28:50 +0900615 man->flags = TTM_MEMTYPE_FLAG_FIXED |
616 TTM_MEMTYPE_FLAG_MAPPABLE;
617 man->available_caching = TTM_PL_FLAG_UNCACHED |
618 TTM_PL_FLAG_WC;
619 man->default_caching = TTM_PL_FLAG_WC;
620
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000621 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA) {
Alexandre Courbote2a4e782014-06-27 19:28:50 +0900622 /* Some BARs do not support being ioremapped WC */
Ben Skeggs989aa5b2015-01-12 12:33:37 +1000623 if (nvxx_bar(&drm->device)->iomap_uncached) {
Alexandre Courbote2a4e782014-06-27 19:28:50 +0900624 man->available_caching = TTM_PL_FLAG_UNCACHED;
625 man->default_caching = TTM_PL_FLAG_UNCACHED;
626 }
627
Ben Skeggs573a2a32010-08-25 15:26:04 +1000628 man->func = &nouveau_vram_manager;
Ben Skeggsf869ef82010-11-15 11:53:16 +1000629 man->io_reserve_fastpath = false;
630 man->use_io_reserve_lru = true;
631 } else {
Ben Skeggs573a2a32010-08-25 15:26:04 +1000632 man->func = &ttm_bo_manager_func;
Ben Skeggsf869ef82010-11-15 11:53:16 +1000633 }
Ben Skeggs6ee73862009-12-11 19:24:15 +1000634 break;
635 case TTM_PL_TT:
Ben Skeggs967e7bd2014-08-10 04:10:22 +1000636 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA)
Ben Skeggs26c0c9e2011-02-10 12:59:51 +1000637 man->func = &nouveau_gart_manager;
638 else
Ben Skeggsebb945a2012-07-20 08:17:34 +1000639 if (drm->agp.stat != ENABLED)
Ben Skeggs3863c9b2012-07-14 19:09:17 +1000640 man->func = &nv04_gart_manager;
641 else
Ben Skeggs26c0c9e2011-02-10 12:59:51 +1000642 man->func = &ttm_bo_manager_func;
Ben Skeggsebb945a2012-07-20 08:17:34 +1000643
644 if (drm->agp.stat == ENABLED) {
Jerome Glissef32f02f2010-04-09 14:39:25 +0200645 man->flags = TTM_MEMTYPE_FLAG_MAPPABLE;
Francisco Jereza3d487e2010-11-20 22:11:22 +0100646 man->available_caching = TTM_PL_FLAG_UNCACHED |
647 TTM_PL_FLAG_WC;
648 man->default_caching = TTM_PL_FLAG_WC;
Ben Skeggsebb945a2012-07-20 08:17:34 +1000649 } else {
Ben Skeggs6ee73862009-12-11 19:24:15 +1000650 man->flags = TTM_MEMTYPE_FLAG_MAPPABLE |
651 TTM_MEMTYPE_FLAG_CMA;
652 man->available_caching = TTM_PL_MASK_CACHING;
653 man->default_caching = TTM_PL_FLAG_CACHED;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000654 }
Ben Skeggsebb945a2012-07-20 08:17:34 +1000655
Ben Skeggs6ee73862009-12-11 19:24:15 +1000656 break;
657 default:
Ben Skeggs6ee73862009-12-11 19:24:15 +1000658 return -EINVAL;
659 }
660 return 0;
661}
662
663static void
664nouveau_bo_evict_flags(struct ttm_buffer_object *bo, struct ttm_placement *pl)
665{
666 struct nouveau_bo *nvbo = nouveau_bo(bo);
667
668 switch (bo->mem.mem_type) {
Francisco Jerez22fbd532009-12-11 18:40:17 +0100669 case TTM_PL_VRAM:
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100670 nouveau_bo_placement_set(nvbo, TTM_PL_FLAG_TT,
671 TTM_PL_FLAG_SYSTEM);
Francisco Jerez22fbd532009-12-11 18:40:17 +0100672 break;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000673 default:
Francisco Jerez78ad0f72010-03-18 13:07:47 +0100674 nouveau_bo_placement_set(nvbo, TTM_PL_FLAG_SYSTEM, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +1000675 break;
676 }
Francisco Jerez22fbd532009-12-11 18:40:17 +0100677
678 *pl = nvbo->placement;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000679}
680
681
Ben Skeggs6ee73862009-12-11 19:24:15 +1000682static int
Ben Skeggs49981042012-08-06 19:38:25 +1000683nve0_bo_move_init(struct nouveau_channel *chan, u32 handle)
684{
685 int ret = RING_SPACE(chan, 2);
686 if (ret == 0) {
687 BEGIN_NVC0(chan, NvSubCopy, 0x0000, 1);
Ben Skeggs00fc6f62013-07-09 14:20:15 +1000688 OUT_RING (chan, handle & 0x0000ffff);
Ben Skeggs49981042012-08-06 19:38:25 +1000689 FIRE_RING (chan);
690 }
691 return ret;
692}
693
694static int
Ben Skeggsc6b7e892012-03-20 14:36:04 +1000695nve0_bo_move_copy(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
696 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
697{
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000698 struct nvkm_mem *node = old_mem->mm_node;
Ben Skeggsc6b7e892012-03-20 14:36:04 +1000699 int ret = RING_SPACE(chan, 10);
700 if (ret == 0) {
Ben Skeggs6d597022012-04-01 21:09:13 +1000701 BEGIN_NVC0(chan, NvSubCopy, 0x0400, 8);
Ben Skeggsc6b7e892012-03-20 14:36:04 +1000702 OUT_RING (chan, upper_32_bits(node->vma[0].offset));
703 OUT_RING (chan, lower_32_bits(node->vma[0].offset));
704 OUT_RING (chan, upper_32_bits(node->vma[1].offset));
705 OUT_RING (chan, lower_32_bits(node->vma[1].offset));
706 OUT_RING (chan, PAGE_SIZE);
707 OUT_RING (chan, PAGE_SIZE);
708 OUT_RING (chan, PAGE_SIZE);
709 OUT_RING (chan, new_mem->num_pages);
Ben Skeggs6d597022012-04-01 21:09:13 +1000710 BEGIN_IMC0(chan, NvSubCopy, 0x0300, 0x0386);
Ben Skeggsc6b7e892012-03-20 14:36:04 +1000711 }
712 return ret;
713}
714
715static int
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000716nvc0_bo_move_init(struct nouveau_channel *chan, u32 handle)
717{
718 int ret = RING_SPACE(chan, 2);
719 if (ret == 0) {
720 BEGIN_NVC0(chan, NvSubCopy, 0x0000, 1);
721 OUT_RING (chan, handle);
722 }
723 return ret;
724}
725
726static int
Ben Skeggs1a460982012-05-04 15:17:28 +1000727nvc0_bo_move_copy(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
728 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
729{
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000730 struct nvkm_mem *node = old_mem->mm_node;
Ben Skeggs1a460982012-05-04 15:17:28 +1000731 u64 src_offset = node->vma[0].offset;
732 u64 dst_offset = node->vma[1].offset;
733 u32 page_count = new_mem->num_pages;
734 int ret;
735
736 page_count = new_mem->num_pages;
737 while (page_count) {
738 int line_count = (page_count > 8191) ? 8191 : page_count;
739
740 ret = RING_SPACE(chan, 11);
741 if (ret)
742 return ret;
743
744 BEGIN_NVC0(chan, NvSubCopy, 0x030c, 8);
745 OUT_RING (chan, upper_32_bits(src_offset));
746 OUT_RING (chan, lower_32_bits(src_offset));
747 OUT_RING (chan, upper_32_bits(dst_offset));
748 OUT_RING (chan, lower_32_bits(dst_offset));
749 OUT_RING (chan, PAGE_SIZE);
750 OUT_RING (chan, PAGE_SIZE);
751 OUT_RING (chan, PAGE_SIZE);
752 OUT_RING (chan, line_count);
753 BEGIN_NVC0(chan, NvSubCopy, 0x0300, 1);
754 OUT_RING (chan, 0x00000110);
755
756 page_count -= line_count;
757 src_offset += (PAGE_SIZE * line_count);
758 dst_offset += (PAGE_SIZE * line_count);
759 }
760
761 return 0;
762}
763
764static int
Ben Skeggs183720b2010-12-09 15:17:10 +1000765nvc0_bo_move_m2mf(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
766 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
767{
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000768 struct nvkm_mem *node = old_mem->mm_node;
Ben Skeggsd2f966662011-06-06 20:54:42 +1000769 u64 src_offset = node->vma[0].offset;
770 u64 dst_offset = node->vma[1].offset;
Ben Skeggs183720b2010-12-09 15:17:10 +1000771 u32 page_count = new_mem->num_pages;
772 int ret;
773
Ben Skeggs183720b2010-12-09 15:17:10 +1000774 page_count = new_mem->num_pages;
775 while (page_count) {
776 int line_count = (page_count > 2047) ? 2047 : page_count;
777
778 ret = RING_SPACE(chan, 12);
779 if (ret)
780 return ret;
781
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000782 BEGIN_NVC0(chan, NvSubCopy, 0x0238, 2);
Ben Skeggs183720b2010-12-09 15:17:10 +1000783 OUT_RING (chan, upper_32_bits(dst_offset));
784 OUT_RING (chan, lower_32_bits(dst_offset));
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000785 BEGIN_NVC0(chan, NvSubCopy, 0x030c, 6);
Ben Skeggs183720b2010-12-09 15:17:10 +1000786 OUT_RING (chan, upper_32_bits(src_offset));
787 OUT_RING (chan, lower_32_bits(src_offset));
788 OUT_RING (chan, PAGE_SIZE); /* src_pitch */
789 OUT_RING (chan, PAGE_SIZE); /* dst_pitch */
790 OUT_RING (chan, PAGE_SIZE); /* line_length */
791 OUT_RING (chan, line_count);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000792 BEGIN_NVC0(chan, NvSubCopy, 0x0300, 1);
Ben Skeggs183720b2010-12-09 15:17:10 +1000793 OUT_RING (chan, 0x00100110);
794
795 page_count -= line_count;
796 src_offset += (PAGE_SIZE * line_count);
797 dst_offset += (PAGE_SIZE * line_count);
798 }
799
800 return 0;
801}
802
803static int
Ben Skeggsfdf53242012-05-04 15:15:12 +1000804nva3_bo_move_copy(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
805 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
806{
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000807 struct nvkm_mem *node = old_mem->mm_node;
Ben Skeggsfdf53242012-05-04 15:15:12 +1000808 u64 src_offset = node->vma[0].offset;
809 u64 dst_offset = node->vma[1].offset;
810 u32 page_count = new_mem->num_pages;
811 int ret;
812
813 page_count = new_mem->num_pages;
814 while (page_count) {
815 int line_count = (page_count > 8191) ? 8191 : page_count;
816
817 ret = RING_SPACE(chan, 11);
818 if (ret)
819 return ret;
820
821 BEGIN_NV04(chan, NvSubCopy, 0x030c, 8);
822 OUT_RING (chan, upper_32_bits(src_offset));
823 OUT_RING (chan, lower_32_bits(src_offset));
824 OUT_RING (chan, upper_32_bits(dst_offset));
825 OUT_RING (chan, lower_32_bits(dst_offset));
826 OUT_RING (chan, PAGE_SIZE);
827 OUT_RING (chan, PAGE_SIZE);
828 OUT_RING (chan, PAGE_SIZE);
829 OUT_RING (chan, line_count);
830 BEGIN_NV04(chan, NvSubCopy, 0x0300, 1);
831 OUT_RING (chan, 0x00000110);
832
833 page_count -= line_count;
834 src_offset += (PAGE_SIZE * line_count);
835 dst_offset += (PAGE_SIZE * line_count);
836 }
837
838 return 0;
839}
840
841static int
Ben Skeggs5490e5d2012-05-04 14:34:16 +1000842nv98_bo_move_exec(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
843 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
844{
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000845 struct nvkm_mem *node = old_mem->mm_node;
Ben Skeggs5490e5d2012-05-04 14:34:16 +1000846 int ret = RING_SPACE(chan, 7);
847 if (ret == 0) {
848 BEGIN_NV04(chan, NvSubCopy, 0x0320, 6);
849 OUT_RING (chan, upper_32_bits(node->vma[0].offset));
850 OUT_RING (chan, lower_32_bits(node->vma[0].offset));
851 OUT_RING (chan, upper_32_bits(node->vma[1].offset));
852 OUT_RING (chan, lower_32_bits(node->vma[1].offset));
853 OUT_RING (chan, 0x00000000 /* COPY */);
854 OUT_RING (chan, new_mem->num_pages << PAGE_SHIFT);
855 }
856 return ret;
857}
858
859static int
Ben Skeggs4c193d22012-05-04 14:21:15 +1000860nv84_bo_move_exec(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
861 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
862{
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000863 struct nvkm_mem *node = old_mem->mm_node;
Ben Skeggs4c193d22012-05-04 14:21:15 +1000864 int ret = RING_SPACE(chan, 7);
865 if (ret == 0) {
866 BEGIN_NV04(chan, NvSubCopy, 0x0304, 6);
867 OUT_RING (chan, new_mem->num_pages << PAGE_SHIFT);
868 OUT_RING (chan, upper_32_bits(node->vma[0].offset));
869 OUT_RING (chan, lower_32_bits(node->vma[0].offset));
870 OUT_RING (chan, upper_32_bits(node->vma[1].offset));
871 OUT_RING (chan, lower_32_bits(node->vma[1].offset));
872 OUT_RING (chan, 0x00000000 /* MODE_COPY, QUERY_NONE */);
873 }
874 return ret;
875}
876
877static int
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000878nv50_bo_move_init(struct nouveau_channel *chan, u32 handle)
879{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000880 int ret = RING_SPACE(chan, 6);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000881 if (ret == 0) {
Ben Skeggsebb945a2012-07-20 08:17:34 +1000882 BEGIN_NV04(chan, NvSubCopy, 0x0000, 1);
883 OUT_RING (chan, handle);
884 BEGIN_NV04(chan, NvSubCopy, 0x0180, 3);
Ben Skeggsf45f55c2014-08-10 04:10:23 +1000885 OUT_RING (chan, chan->drm->ntfy.handle);
886 OUT_RING (chan, chan->vram.handle);
887 OUT_RING (chan, chan->vram.handle);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000888 }
889
890 return ret;
891}
892
893static int
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000894nv50_bo_move_m2mf(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
895 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
Ben Skeggs6ee73862009-12-11 19:24:15 +1000896{
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000897 struct nvkm_mem *node = old_mem->mm_node;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000898 u64 length = (new_mem->num_pages << PAGE_SHIFT);
Ben Skeggsd2f966662011-06-06 20:54:42 +1000899 u64 src_offset = node->vma[0].offset;
900 u64 dst_offset = node->vma[1].offset;
Maarten Lankhorstce8f7692013-11-12 13:34:08 +0100901 int src_tiled = !!node->memtype;
Ben Skeggsbe83cd42015-01-14 15:36:34 +1000902 int dst_tiled = !!((struct nvkm_mem *)new_mem->mm_node)->memtype;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000903 int ret;
904
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000905 while (length) {
906 u32 amount, stride, height;
907
Maarten Lankhorstce8f7692013-11-12 13:34:08 +0100908 ret = RING_SPACE(chan, 18 + 6 * (src_tiled + dst_tiled));
909 if (ret)
910 return ret;
911
Ben Skeggs5220b3c2010-09-23 15:21:17 +1000912 amount = min(length, (u64)(4 * 1024 * 1024));
913 stride = 16 * 4;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000914 height = amount / stride;
915
Maarten Lankhorstce8f7692013-11-12 13:34:08 +0100916 if (src_tiled) {
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000917 BEGIN_NV04(chan, NvSubCopy, 0x0200, 7);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000918 OUT_RING (chan, 0);
Ben Skeggs5220b3c2010-09-23 15:21:17 +1000919 OUT_RING (chan, 0);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000920 OUT_RING (chan, stride);
921 OUT_RING (chan, height);
922 OUT_RING (chan, 1);
923 OUT_RING (chan, 0);
924 OUT_RING (chan, 0);
925 } else {
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000926 BEGIN_NV04(chan, NvSubCopy, 0x0200, 1);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000927 OUT_RING (chan, 1);
928 }
Maarten Lankhorstce8f7692013-11-12 13:34:08 +0100929 if (dst_tiled) {
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000930 BEGIN_NV04(chan, NvSubCopy, 0x021c, 7);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000931 OUT_RING (chan, 0);
Ben Skeggs5220b3c2010-09-23 15:21:17 +1000932 OUT_RING (chan, 0);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000933 OUT_RING (chan, stride);
934 OUT_RING (chan, height);
935 OUT_RING (chan, 1);
936 OUT_RING (chan, 0);
937 OUT_RING (chan, 0);
938 } else {
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000939 BEGIN_NV04(chan, NvSubCopy, 0x021c, 1);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000940 OUT_RING (chan, 1);
941 }
942
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000943 BEGIN_NV04(chan, NvSubCopy, 0x0238, 2);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000944 OUT_RING (chan, upper_32_bits(src_offset));
945 OUT_RING (chan, upper_32_bits(dst_offset));
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000946 BEGIN_NV04(chan, NvSubCopy, 0x030c, 8);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000947 OUT_RING (chan, lower_32_bits(src_offset));
948 OUT_RING (chan, lower_32_bits(dst_offset));
949 OUT_RING (chan, stride);
950 OUT_RING (chan, stride);
951 OUT_RING (chan, stride);
952 OUT_RING (chan, height);
953 OUT_RING (chan, 0x00000101);
954 OUT_RING (chan, 0x00000000);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000955 BEGIN_NV04(chan, NvSubCopy, NV_MEMORY_TO_MEMORY_FORMAT_NOP, 1);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000956 OUT_RING (chan, 0);
957
958 length -= amount;
959 src_offset += amount;
960 dst_offset += amount;
Ben Skeggs6ee73862009-12-11 19:24:15 +1000961 }
962
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000963 return 0;
964}
965
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000966static int
967nv04_bo_move_init(struct nouveau_channel *chan, u32 handle)
968{
Ben Skeggsebb945a2012-07-20 08:17:34 +1000969 int ret = RING_SPACE(chan, 4);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000970 if (ret == 0) {
Ben Skeggsebb945a2012-07-20 08:17:34 +1000971 BEGIN_NV04(chan, NvSubCopy, 0x0000, 1);
972 OUT_RING (chan, handle);
973 BEGIN_NV04(chan, NvSubCopy, 0x0180, 1);
Ben Skeggsf45f55c2014-08-10 04:10:23 +1000974 OUT_RING (chan, chan->drm->ntfy.handle);
Ben Skeggsd1b167e2012-05-04 14:01:52 +1000975 }
976
977 return ret;
978}
979
Ben Skeggsa6704782011-02-16 09:10:20 +1000980static inline uint32_t
981nouveau_bo_mem_ctxdma(struct ttm_buffer_object *bo,
982 struct nouveau_channel *chan, struct ttm_mem_reg *mem)
983{
984 if (mem->mem_type == TTM_PL_TT)
Ben Skeggsebb945a2012-07-20 08:17:34 +1000985 return NvDmaTT;
Ben Skeggsf45f55c2014-08-10 04:10:23 +1000986 return chan->vram.handle;
Ben Skeggsa6704782011-02-16 09:10:20 +1000987}
988
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000989static int
990nv04_bo_move_m2mf(struct nouveau_channel *chan, struct ttm_buffer_object *bo,
991 struct ttm_mem_reg *old_mem, struct ttm_mem_reg *new_mem)
992{
Ben Skeggsd961db72010-08-05 10:48:18 +1000993 u32 src_offset = old_mem->start << PAGE_SHIFT;
994 u32 dst_offset = new_mem->start << PAGE_SHIFT;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +1000995 u32 page_count = new_mem->num_pages;
996 int ret;
997
998 ret = RING_SPACE(chan, 3);
999 if (ret)
1000 return ret;
1001
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001002 BEGIN_NV04(chan, NvSubCopy, NV_MEMORY_TO_MEMORY_FORMAT_DMA_SOURCE, 2);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001003 OUT_RING (chan, nouveau_bo_mem_ctxdma(bo, chan, old_mem));
1004 OUT_RING (chan, nouveau_bo_mem_ctxdma(bo, chan, new_mem));
1005
Ben Skeggs6ee73862009-12-11 19:24:15 +10001006 page_count = new_mem->num_pages;
1007 while (page_count) {
1008 int line_count = (page_count > 2047) ? 2047 : page_count;
1009
Ben Skeggs6ee73862009-12-11 19:24:15 +10001010 ret = RING_SPACE(chan, 11);
1011 if (ret)
1012 return ret;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001013
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001014 BEGIN_NV04(chan, NvSubCopy,
Ben Skeggs6ee73862009-12-11 19:24:15 +10001015 NV_MEMORY_TO_MEMORY_FORMAT_OFFSET_IN, 8);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001016 OUT_RING (chan, src_offset);
1017 OUT_RING (chan, dst_offset);
1018 OUT_RING (chan, PAGE_SIZE); /* src_pitch */
1019 OUT_RING (chan, PAGE_SIZE); /* dst_pitch */
1020 OUT_RING (chan, PAGE_SIZE); /* line_length */
1021 OUT_RING (chan, line_count);
1022 OUT_RING (chan, 0x00000101);
1023 OUT_RING (chan, 0x00000000);
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001024 BEGIN_NV04(chan, NvSubCopy, NV_MEMORY_TO_MEMORY_FORMAT_NOP, 1);
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001025 OUT_RING (chan, 0);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001026
1027 page_count -= line_count;
1028 src_offset += (PAGE_SIZE * line_count);
1029 dst_offset += (PAGE_SIZE * line_count);
1030 }
1031
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001032 return 0;
1033}
1034
1035static int
Ben Skeggs3c57d852013-11-22 10:35:25 +10001036nouveau_bo_move_prep(struct nouveau_drm *drm, struct ttm_buffer_object *bo,
1037 struct ttm_mem_reg *mem)
Ben Skeggsd2f966662011-06-06 20:54:42 +10001038{
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001039 struct nvkm_mem *old_node = bo->mem.mm_node;
1040 struct nvkm_mem *new_node = mem->mm_node;
Ben Skeggs3c57d852013-11-22 10:35:25 +10001041 u64 size = (u64)mem->num_pages << PAGE_SHIFT;
Ben Skeggsd2f966662011-06-06 20:54:42 +10001042 int ret;
1043
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001044 ret = nvkm_vm_get(drm->client.vm, size, old_node->page_shift,
1045 NV_MEM_ACCESS_RW, &old_node->vma[0]);
Ben Skeggsd2f966662011-06-06 20:54:42 +10001046 if (ret)
1047 return ret;
1048
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001049 ret = nvkm_vm_get(drm->client.vm, size, new_node->page_shift,
1050 NV_MEM_ACCESS_RW, &old_node->vma[1]);
Ben Skeggs3c57d852013-11-22 10:35:25 +10001051 if (ret) {
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001052 nvkm_vm_put(&old_node->vma[0]);
Ben Skeggs3c57d852013-11-22 10:35:25 +10001053 return ret;
1054 }
1055
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001056 nvkm_vm_map(&old_node->vma[0], old_node);
1057 nvkm_vm_map(&old_node->vma[1], new_node);
Ben Skeggsd2f966662011-06-06 20:54:42 +10001058 return 0;
1059}
1060
1061static int
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001062nouveau_bo_move_m2mf(struct ttm_buffer_object *bo, int evict, bool intr,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001063 bool no_wait_gpu, struct ttm_mem_reg *new_mem)
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001064{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001065 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
Dave Jones1934a2a2013-09-17 17:26:34 -04001066 struct nouveau_channel *chan = drm->ttm.chan;
Ben Skeggs0ad72862014-08-10 04:10:22 +10001067 struct nouveau_cli *cli = (void *)nvif_client(&chan->device->base);
Ben Skeggs35b81412013-11-22 10:39:57 +10001068 struct nouveau_fence *fence;
Ben Skeggsf1ab0cc2010-08-26 11:32:01 +10001069 int ret;
1070
Ben Skeggsd2f966662011-06-06 20:54:42 +10001071 /* create temporary vmas for the transfer and attach them to the
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001072 * old nvkm_mem node, these will get cleaned up after ttm has
Ben Skeggsd2f966662011-06-06 20:54:42 +10001073 * destroyed the ttm_mem_reg
Ben Skeggs3425df42011-02-10 11:22:12 +10001074 */
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001075 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA) {
Ben Skeggs3c57d852013-11-22 10:35:25 +10001076 ret = nouveau_bo_move_prep(drm, bo, new_mem);
Ben Skeggsd2f966662011-06-06 20:54:42 +10001077 if (ret)
Ben Skeggs3c57d852013-11-22 10:35:25 +10001078 return ret;
Ben Skeggs3425df42011-02-10 11:22:12 +10001079 }
1080
Ben Skeggs0ad72862014-08-10 04:10:22 +10001081 mutex_lock_nested(&cli->mutex, SINGLE_DEPTH_NESTING);
Maarten Lankhorste3be4c22014-09-16 11:15:07 +02001082 ret = nouveau_fence_sync(nouveau_bo(bo), chan, true, intr);
Ben Skeggs6a6b73f2010-10-05 16:53:48 +10001083 if (ret == 0) {
Ben Skeggs35b81412013-11-22 10:39:57 +10001084 ret = drm->ttm.move(chan, bo, &bo->mem, new_mem);
1085 if (ret == 0) {
1086 ret = nouveau_fence_new(chan, false, &fence);
1087 if (ret == 0) {
Maarten Lankhorstf2c24b82014-04-02 17:14:48 +02001088 ret = ttm_bo_move_accel_cleanup(bo,
1089 &fence->base,
Ben Skeggs35b81412013-11-22 10:39:57 +10001090 evict,
1091 no_wait_gpu,
1092 new_mem);
1093 nouveau_fence_unref(&fence);
1094 }
1095 }
Ben Skeggs6a6b73f2010-10-05 16:53:48 +10001096 }
Ben Skeggs0ad72862014-08-10 04:10:22 +10001097 mutex_unlock(&cli->mutex);
Ben Skeggs6a6b73f2010-10-05 16:53:48 +10001098 return ret;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001099}
1100
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001101void
Ben Skeggs49981042012-08-06 19:38:25 +10001102nouveau_bo_move_init(struct nouveau_drm *drm)
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001103{
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001104 static const struct {
1105 const char *name;
Ben Skeggs1a460982012-05-04 15:17:28 +10001106 int engine;
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001107 u32 oclass;
1108 int (*exec)(struct nouveau_channel *,
1109 struct ttm_buffer_object *,
1110 struct ttm_mem_reg *, struct ttm_mem_reg *);
1111 int (*init)(struct nouveau_channel *, u32 handle);
1112 } _methods[] = {
Ben Skeggs00fc6f62013-07-09 14:20:15 +10001113 { "COPY", 4, 0xa0b5, nve0_bo_move_copy, nve0_bo_move_init },
Ben Skeggs49981042012-08-06 19:38:25 +10001114 { "GRCE", 0, 0xa0b5, nve0_bo_move_copy, nvc0_bo_move_init },
Ben Skeggs1a460982012-05-04 15:17:28 +10001115 { "COPY1", 5, 0x90b8, nvc0_bo_move_copy, nvc0_bo_move_init },
1116 { "COPY0", 4, 0x90b5, nvc0_bo_move_copy, nvc0_bo_move_init },
1117 { "COPY", 0, 0x85b5, nva3_bo_move_copy, nv50_bo_move_init },
1118 { "CRYPT", 0, 0x74c1, nv84_bo_move_exec, nv50_bo_move_init },
1119 { "M2MF", 0, 0x9039, nvc0_bo_move_m2mf, nvc0_bo_move_init },
1120 { "M2MF", 0, 0x5039, nv50_bo_move_m2mf, nv50_bo_move_init },
1121 { "M2MF", 0, 0x0039, nv04_bo_move_m2mf, nv04_bo_move_init },
Ben Skeggs5490e5d2012-05-04 14:34:16 +10001122 {},
Ben Skeggs1a460982012-05-04 15:17:28 +10001123 { "CRYPT", 0, 0x88b4, nv98_bo_move_exec, nv50_bo_move_init },
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001124 }, *mthd = _methods;
1125 const char *name = "CPU";
1126 int ret;
1127
1128 do {
Ben Skeggs49981042012-08-06 19:38:25 +10001129 struct nouveau_channel *chan;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001130
Ben Skeggs00fc6f62013-07-09 14:20:15 +10001131 if (mthd->engine)
Ben Skeggs49981042012-08-06 19:38:25 +10001132 chan = drm->cechan;
1133 else
1134 chan = drm->channel;
1135 if (chan == NULL)
1136 continue;
1137
Ben Skeggs0ad72862014-08-10 04:10:22 +10001138 ret = nvif_object_init(chan->object, NULL,
1139 mthd->oclass | (mthd->engine << 16),
1140 mthd->oclass, NULL, 0,
1141 &drm->ttm.copy);
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001142 if (ret == 0) {
Ben Skeggs0ad72862014-08-10 04:10:22 +10001143 ret = mthd->init(chan, drm->ttm.copy.handle);
Ben Skeggsebb945a2012-07-20 08:17:34 +10001144 if (ret) {
Ben Skeggs0ad72862014-08-10 04:10:22 +10001145 nvif_object_fini(&drm->ttm.copy);
Ben Skeggsebb945a2012-07-20 08:17:34 +10001146 continue;
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001147 }
Ben Skeggsebb945a2012-07-20 08:17:34 +10001148
1149 drm->ttm.move = mthd->exec;
Ben Skeggs1bb3f6a2013-07-08 10:40:35 +10001150 drm->ttm.chan = chan;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001151 name = mthd->name;
1152 break;
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001153 }
1154 } while ((++mthd)->exec);
1155
Ben Skeggsebb945a2012-07-20 08:17:34 +10001156 NV_INFO(drm, "MM: using %s for buffer copies\n", name);
Ben Skeggsd1b167e2012-05-04 14:01:52 +10001157}
1158
Ben Skeggs6ee73862009-12-11 19:24:15 +10001159static int
1160nouveau_bo_move_flipd(struct ttm_buffer_object *bo, bool evict, bool intr,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001161 bool no_wait_gpu, struct ttm_mem_reg *new_mem)
Ben Skeggs6ee73862009-12-11 19:24:15 +10001162{
Christian Königf1217ed2014-08-27 13:16:04 +02001163 struct ttm_place placement_memtype = {
1164 .fpfn = 0,
1165 .lpfn = 0,
1166 .flags = TTM_PL_FLAG_TT | TTM_PL_MASK_CACHING
1167 };
Ben Skeggs6ee73862009-12-11 19:24:15 +10001168 struct ttm_placement placement;
1169 struct ttm_mem_reg tmp_mem;
1170 int ret;
1171
Ben Skeggs6ee73862009-12-11 19:24:15 +10001172 placement.num_placement = placement.num_busy_placement = 1;
Francisco Jerez77e2b5e2009-12-16 19:05:00 +01001173 placement.placement = placement.busy_placement = &placement_memtype;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001174
1175 tmp_mem = *new_mem;
1176 tmp_mem.mm_node = NULL;
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001177 ret = ttm_bo_mem_space(bo, &placement, &tmp_mem, intr, no_wait_gpu);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001178 if (ret)
1179 return ret;
1180
1181 ret = ttm_tt_bind(bo->ttm, &tmp_mem);
1182 if (ret)
1183 goto out;
1184
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001185 ret = nouveau_bo_move_m2mf(bo, true, intr, no_wait_gpu, &tmp_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001186 if (ret)
1187 goto out;
1188
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001189 ret = ttm_bo_move_ttm(bo, true, no_wait_gpu, new_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001190out:
Ben Skeggs42311ff2010-08-04 12:07:08 +10001191 ttm_bo_mem_put(bo, &tmp_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001192 return ret;
1193}
1194
1195static int
1196nouveau_bo_move_flips(struct ttm_buffer_object *bo, bool evict, bool intr,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001197 bool no_wait_gpu, struct ttm_mem_reg *new_mem)
Ben Skeggs6ee73862009-12-11 19:24:15 +10001198{
Christian Königf1217ed2014-08-27 13:16:04 +02001199 struct ttm_place placement_memtype = {
1200 .fpfn = 0,
1201 .lpfn = 0,
1202 .flags = TTM_PL_FLAG_TT | TTM_PL_MASK_CACHING
1203 };
Ben Skeggs6ee73862009-12-11 19:24:15 +10001204 struct ttm_placement placement;
1205 struct ttm_mem_reg tmp_mem;
1206 int ret;
1207
Ben Skeggs6ee73862009-12-11 19:24:15 +10001208 placement.num_placement = placement.num_busy_placement = 1;
Francisco Jerez77e2b5e2009-12-16 19:05:00 +01001209 placement.placement = placement.busy_placement = &placement_memtype;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001210
1211 tmp_mem = *new_mem;
1212 tmp_mem.mm_node = NULL;
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001213 ret = ttm_bo_mem_space(bo, &placement, &tmp_mem, intr, no_wait_gpu);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001214 if (ret)
1215 return ret;
1216
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001217 ret = ttm_bo_move_ttm(bo, true, no_wait_gpu, &tmp_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001218 if (ret)
1219 goto out;
1220
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001221 ret = nouveau_bo_move_m2mf(bo, true, intr, no_wait_gpu, new_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001222 if (ret)
1223 goto out;
1224
1225out:
Ben Skeggs42311ff2010-08-04 12:07:08 +10001226 ttm_bo_mem_put(bo, &tmp_mem);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001227 return ret;
1228}
1229
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001230static void
1231nouveau_bo_move_ntfy(struct ttm_buffer_object *bo, struct ttm_mem_reg *new_mem)
1232{
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001233 struct nouveau_bo *nvbo = nouveau_bo(bo);
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001234 struct nvkm_vma *vma;
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001235
Ben Skeggs9f1feed2012-01-25 15:34:22 +10001236 /* ttm can now (stupidly) pass the driver bos it didn't create... */
1237 if (bo->destroy != nouveau_bo_del_ttm)
1238 return;
1239
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001240 list_for_each_entry(vma, &nvbo->vma_list, head) {
Ben Skeggs2e2cfbe2013-11-15 11:56:49 +10001241 if (new_mem && new_mem->mem_type != TTM_PL_SYSTEM &&
1242 (new_mem->mem_type == TTM_PL_VRAM ||
Ben Skeggs5ce3bf32015-01-14 09:57:36 +10001243 nvbo->page_shift != vma->vm->mmu->lpg_shift)) {
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001244 nvkm_vm_map(vma, new_mem->mm_node);
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001245 } else {
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001246 nvkm_vm_unmap(vma);
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001247 }
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001248 }
1249}
1250
Ben Skeggs6ee73862009-12-11 19:24:15 +10001251static int
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001252nouveau_bo_vm_bind(struct ttm_buffer_object *bo, struct ttm_mem_reg *new_mem,
Ben Skeggsebb945a2012-07-20 08:17:34 +10001253 struct nouveau_drm_tile **new_tile)
Ben Skeggs6ee73862009-12-11 19:24:15 +10001254{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001255 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
1256 struct drm_device *dev = drm->dev;
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001257 struct nouveau_bo *nvbo = nouveau_bo(bo);
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001258 u64 offset = new_mem->start << PAGE_SHIFT;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001259
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001260 *new_tile = NULL;
1261 if (new_mem->mem_type != TTM_PL_VRAM)
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001262 return 0;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001263
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001264 if (drm->device.info.family >= NV_DEVICE_INFO_V0_CELSIUS) {
Ben Skeggsbc9e7b92012-07-19 17:54:21 +10001265 *new_tile = nv10_bo_set_tiling(dev, offset, new_mem->size,
Francisco Jereza5cf68b2010-10-24 16:14:41 +02001266 nvbo->tile_mode,
1267 nvbo->tile_flags);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001268 }
1269
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001270 return 0;
1271}
Ben Skeggs6ee73862009-12-11 19:24:15 +10001272
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001273static void
1274nouveau_bo_vm_cleanup(struct ttm_buffer_object *bo,
Ben Skeggsebb945a2012-07-20 08:17:34 +10001275 struct nouveau_drm_tile *new_tile,
1276 struct nouveau_drm_tile **old_tile)
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001277{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001278 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
1279 struct drm_device *dev = drm->dev;
Maarten Lankhorstf2c24b82014-04-02 17:14:48 +02001280 struct fence *fence = reservation_object_get_excl(bo->resv);
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001281
Maarten Lankhorstf2c24b82014-04-02 17:14:48 +02001282 nv10_bo_put_tile_region(dev, *old_tile, fence);
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001283 *old_tile = new_tile;
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001284}
1285
1286static int
1287nouveau_bo_move(struct ttm_buffer_object *bo, bool evict, bool intr,
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001288 bool no_wait_gpu, struct ttm_mem_reg *new_mem)
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001289{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001290 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001291 struct nouveau_bo *nvbo = nouveau_bo(bo);
1292 struct ttm_mem_reg *old_mem = &bo->mem;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001293 struct nouveau_drm_tile *new_tile = NULL;
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001294 int ret = 0;
1295
Alexandre Courbot5be5a152014-10-27 18:11:52 +09001296 if (nvbo->pin_refcnt)
1297 NV_WARN(drm, "Moving pinned object %p!\n", nvbo);
1298
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001299 if (drm->device.info.family < NV_DEVICE_INFO_V0_TESLA) {
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001300 ret = nouveau_bo_vm_bind(bo, new_mem, &new_tile);
1301 if (ret)
1302 return ret;
1303 }
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001304
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001305 /* Fake bo copy. */
Ben Skeggs6ee73862009-12-11 19:24:15 +10001306 if (old_mem->mem_type == TTM_PL_SYSTEM && !bo->ttm) {
1307 BUG_ON(bo->mem.mm_node != NULL);
1308 bo->mem = *new_mem;
1309 new_mem->mm_node = NULL;
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001310 goto out;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001311 }
1312
Ben Skeggscef9e992013-11-22 10:52:54 +10001313 /* Hardware assisted copy. */
1314 if (drm->ttm.move) {
1315 if (new_mem->mem_type == TTM_PL_SYSTEM)
1316 ret = nouveau_bo_move_flipd(bo, evict, intr,
1317 no_wait_gpu, new_mem);
1318 else if (old_mem->mem_type == TTM_PL_SYSTEM)
1319 ret = nouveau_bo_move_flips(bo, evict, intr,
1320 no_wait_gpu, new_mem);
1321 else
1322 ret = nouveau_bo_move_m2mf(bo, evict, intr,
1323 no_wait_gpu, new_mem);
1324 if (!ret)
1325 goto out;
Ben Skeggsb8a6a802010-08-27 11:55:43 +10001326 }
1327
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001328 /* Fallback to software copy. */
Ben Skeggscef9e992013-11-22 10:52:54 +10001329 ret = ttm_bo_wait(bo, true, intr, no_wait_gpu);
Ben Skeggscef9e992013-11-22 10:52:54 +10001330 if (ret == 0)
1331 ret = ttm_bo_move_memcpy(bo, evict, no_wait_gpu, new_mem);
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001332
1333out:
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001334 if (drm->device.info.family < NV_DEVICE_INFO_V0_TESLA) {
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001335 if (ret)
1336 nouveau_bo_vm_cleanup(bo, NULL, &new_tile);
1337 else
1338 nouveau_bo_vm_cleanup(bo, new_tile, &nvbo->tile);
1339 }
Francisco Jereza0af9ad2009-12-11 16:51:09 +01001340
1341 return ret;
Ben Skeggs6ee73862009-12-11 19:24:15 +10001342}
1343
1344static int
1345nouveau_bo_verify_access(struct ttm_buffer_object *bo, struct file *filp)
1346{
David Herrmannacb46522013-08-25 18:28:59 +02001347 struct nouveau_bo *nvbo = nouveau_bo(bo);
1348
David Herrmann55fb74a2013-10-02 10:15:17 +02001349 return drm_vma_node_verify_access(&nvbo->gem.vma_node, filp);
Ben Skeggs6ee73862009-12-11 19:24:15 +10001350}
1351
Jerome Glissef32f02f2010-04-09 14:39:25 +02001352static int
1353nouveau_ttm_io_mem_reserve(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem)
1354{
1355 struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];
Ben Skeggsebb945a2012-07-20 08:17:34 +10001356 struct nouveau_drm *drm = nouveau_bdev(bdev);
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001357 struct nvkm_mem *node = mem->mm_node;
Ben Skeggsf869ef82010-11-15 11:53:16 +10001358 int ret;
Jerome Glissef32f02f2010-04-09 14:39:25 +02001359
1360 mem->bus.addr = NULL;
1361 mem->bus.offset = 0;
1362 mem->bus.size = mem->num_pages << PAGE_SHIFT;
1363 mem->bus.base = 0;
1364 mem->bus.is_iomem = false;
1365 if (!(man->flags & TTM_MEMTYPE_FLAG_MAPPABLE))
1366 return -EINVAL;
1367 switch (mem->mem_type) {
1368 case TTM_PL_SYSTEM:
1369 /* System memory */
1370 return 0;
1371 case TTM_PL_TT:
1372#if __OS_HAS_AGP
Ben Skeggsebb945a2012-07-20 08:17:34 +10001373 if (drm->agp.stat == ENABLED) {
Ben Skeggsd961db72010-08-05 10:48:18 +10001374 mem->bus.offset = mem->start << PAGE_SHIFT;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001375 mem->bus.base = drm->agp.base;
Ben Skeggs5c13cac2014-08-10 12:39:09 +10001376 mem->bus.is_iomem = !drm->dev->agp->cant_use_aperture;
Jerome Glissef32f02f2010-04-09 14:39:25 +02001377 }
1378#endif
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001379 if (drm->device.info.family < NV_DEVICE_INFO_V0_TESLA || !node->memtype)
Maarten Lankhorsta5540902013-11-12 13:34:09 +01001380 /* untiled */
1381 break;
1382 /* fallthrough, tiled memory */
Jerome Glissef32f02f2010-04-09 14:39:25 +02001383 case TTM_PL_VRAM:
Ben Skeggs3863c9b2012-07-14 19:09:17 +10001384 mem->bus.offset = mem->start << PAGE_SHIFT;
Ben Skeggs989aa5b2015-01-12 12:33:37 +10001385 mem->bus.base = nv_device_resource_start(nvxx_device(&drm->device), 1);
Jerome Glissef32f02f2010-04-09 14:39:25 +02001386 mem->bus.is_iomem = true;
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001387 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA) {
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001388 struct nvkm_bar *bar = nvxx_bar(&drm->device);
Ben Skeggs3863c9b2012-07-14 19:09:17 +10001389
Ben Skeggsebb945a2012-07-20 08:17:34 +10001390 ret = bar->umap(bar, node, NV_MEM_ACCESS_RW,
Ben Skeggs3863c9b2012-07-14 19:09:17 +10001391 &node->bar_vma);
1392 if (ret)
1393 return ret;
1394
1395 mem->bus.offset = node->bar_vma.offset;
1396 }
Jerome Glissef32f02f2010-04-09 14:39:25 +02001397 break;
1398 default:
1399 return -EINVAL;
1400 }
1401 return 0;
1402}
1403
1404static void
1405nouveau_ttm_io_mem_free(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem)
1406{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001407 struct nouveau_drm *drm = nouveau_bdev(bdev);
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001408 struct nvkm_bar *bar = nvxx_bar(&drm->device);
1409 struct nvkm_mem *node = mem->mm_node;
Ben Skeggsf869ef82010-11-15 11:53:16 +10001410
Ben Skeggsd5f42392011-02-10 12:22:52 +10001411 if (!node->bar_vma.node)
Ben Skeggsf869ef82010-11-15 11:53:16 +10001412 return;
1413
Ben Skeggsebb945a2012-07-20 08:17:34 +10001414 bar->unmap(bar, &node->bar_vma);
Jerome Glissef32f02f2010-04-09 14:39:25 +02001415}
1416
1417static int
1418nouveau_ttm_fault_reserve_notify(struct ttm_buffer_object *bo)
1419{
Ben Skeggsebb945a2012-07-20 08:17:34 +10001420 struct nouveau_drm *drm = nouveau_bdev(bo->bdev);
Ben Skeggse1429b42010-09-10 11:12:25 +10001421 struct nouveau_bo *nvbo = nouveau_bo(bo);
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001422 struct nvif_device *device = &drm->device;
Ben Skeggs989aa5b2015-01-12 12:33:37 +10001423 u32 mappable = nv_device_resource_len(nvxx_device(device), 1) >> PAGE_SHIFT;
Christian Königf1217ed2014-08-27 13:16:04 +02001424 int i, ret;
Ben Skeggse1429b42010-09-10 11:12:25 +10001425
1426 /* as long as the bo isn't in vram, and isn't tiled, we've got
1427 * nothing to do here.
1428 */
1429 if (bo->mem.mem_type != TTM_PL_VRAM) {
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001430 if (drm->device.info.family < NV_DEVICE_INFO_V0_TESLA ||
Francisco Jerezf13b3262010-10-10 06:01:08 +02001431 !nouveau_bo_tile_layout(nvbo))
Ben Skeggse1429b42010-09-10 11:12:25 +10001432 return 0;
Maarten Lankhorsta5540902013-11-12 13:34:09 +01001433
1434 if (bo->mem.mem_type == TTM_PL_SYSTEM) {
1435 nouveau_bo_placement_set(nvbo, TTM_PL_TT, 0);
1436
1437 ret = nouveau_bo_validate(nvbo, false, false);
1438 if (ret)
1439 return ret;
1440 }
1441 return 0;
Ben Skeggse1429b42010-09-10 11:12:25 +10001442 }
1443
1444 /* make sure bo is in mappable vram */
Ben Skeggs967e7bd2014-08-10 04:10:22 +10001445 if (drm->device.info.family >= NV_DEVICE_INFO_V0_TESLA ||
Maarten Lankhorsta5540902013-11-12 13:34:09 +01001446 bo->mem.start + bo->mem.num_pages < mappable)
Ben Skeggse1429b42010-09-10 11:12:25 +10001447 return 0;
1448
Christian Königf1217ed2014-08-27 13:16:04 +02001449 for (i = 0; i < nvbo->placement.num_placement; ++i) {
1450 nvbo->placements[i].fpfn = 0;
1451 nvbo->placements[i].lpfn = mappable;
1452 }
Ben Skeggse1429b42010-09-10 11:12:25 +10001453
Christian Königf1217ed2014-08-27 13:16:04 +02001454 for (i = 0; i < nvbo->placement.num_busy_placement; ++i) {
1455 nvbo->busy_placements[i].fpfn = 0;
1456 nvbo->busy_placements[i].lpfn = mappable;
1457 }
1458
Dave Airliec2848152012-05-18 15:31:12 +01001459 nouveau_bo_placement_set(nvbo, TTM_PL_FLAG_VRAM, 0);
Maarten Lankhorst97a875c2012-11-28 11:25:44 +00001460 return nouveau_bo_validate(nvbo, false, false);
Jerome Glissef32f02f2010-04-09 14:39:25 +02001461}
1462
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001463static int
1464nouveau_ttm_tt_populate(struct ttm_tt *ttm)
1465{
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001466 struct ttm_dma_tt *ttm_dma = (void *)ttm;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001467 struct nouveau_drm *drm;
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001468 struct nvkm_device *device;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001469 struct drm_device *dev;
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001470 struct device *pdev;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001471 unsigned i;
1472 int r;
Dave Airlie22b33e82012-04-02 11:53:06 +01001473 bool slave = !!(ttm->page_flags & TTM_PAGE_FLAG_SG);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001474
1475 if (ttm->state != tt_unpopulated)
1476 return 0;
1477
Dave Airlie22b33e82012-04-02 11:53:06 +01001478 if (slave && ttm->sg) {
1479 /* make userspace faulting work */
1480 drm_prime_sg_to_page_addr_arrays(ttm->sg, ttm->pages,
1481 ttm_dma->dma_address, ttm->num_pages);
1482 ttm->state = tt_unbound;
1483 return 0;
1484 }
1485
Ben Skeggsebb945a2012-07-20 08:17:34 +10001486 drm = nouveau_bdev(ttm->bdev);
Ben Skeggs989aa5b2015-01-12 12:33:37 +10001487 device = nvxx_device(&drm->device);
Ben Skeggsebb945a2012-07-20 08:17:34 +10001488 dev = drm->dev;
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001489 pdev = nv_device_base(device);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001490
Alexandre Courbotc3a0c772014-10-27 18:49:17 +09001491 /*
1492 * Objects matching this condition have been marked as force_coherent,
1493 * so use the DMA API for them.
1494 */
1495 if (!nv_device_is_cpu_coherent(device) &&
1496 ttm->caching_state == tt_uncached)
1497 return ttm_dma_populate(ttm_dma, dev->dev);
1498
Jerome Glissedea7e0a2012-01-03 17:37:37 -05001499#if __OS_HAS_AGP
Ben Skeggsebb945a2012-07-20 08:17:34 +10001500 if (drm->agp.stat == ENABLED) {
Jerome Glissedea7e0a2012-01-03 17:37:37 -05001501 return ttm_agp_tt_populate(ttm);
1502 }
1503#endif
1504
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001505#ifdef CONFIG_SWIOTLB
1506 if (swiotlb_nr_tbl()) {
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001507 return ttm_dma_populate((void *)ttm, dev->dev);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001508 }
1509#endif
1510
1511 r = ttm_pool_populate(ttm);
1512 if (r) {
1513 return r;
1514 }
1515
1516 for (i = 0; i < ttm->num_pages; i++) {
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001517 dma_addr_t addr;
1518
1519 addr = dma_map_page(pdev, ttm->pages[i], 0, PAGE_SIZE,
1520 DMA_BIDIRECTIONAL);
1521
1522 if (dma_mapping_error(pdev, addr)) {
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001523 while (--i) {
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001524 dma_unmap_page(pdev, ttm_dma->dma_address[i],
1525 PAGE_SIZE, DMA_BIDIRECTIONAL);
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001526 ttm_dma->dma_address[i] = 0;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001527 }
1528 ttm_pool_unpopulate(ttm);
1529 return -EFAULT;
1530 }
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001531
1532 ttm_dma->dma_address[i] = addr;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001533 }
1534 return 0;
1535}
1536
1537static void
1538nouveau_ttm_tt_unpopulate(struct ttm_tt *ttm)
1539{
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001540 struct ttm_dma_tt *ttm_dma = (void *)ttm;
Ben Skeggsebb945a2012-07-20 08:17:34 +10001541 struct nouveau_drm *drm;
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001542 struct nvkm_device *device;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001543 struct drm_device *dev;
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001544 struct device *pdev;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001545 unsigned i;
Dave Airlie22b33e82012-04-02 11:53:06 +01001546 bool slave = !!(ttm->page_flags & TTM_PAGE_FLAG_SG);
1547
1548 if (slave)
1549 return;
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001550
Ben Skeggsebb945a2012-07-20 08:17:34 +10001551 drm = nouveau_bdev(ttm->bdev);
Ben Skeggs989aa5b2015-01-12 12:33:37 +10001552 device = nvxx_device(&drm->device);
Ben Skeggsebb945a2012-07-20 08:17:34 +10001553 dev = drm->dev;
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001554 pdev = nv_device_base(device);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001555
Alexandre Courbotc3a0c772014-10-27 18:49:17 +09001556 /*
1557 * Objects matching this condition have been marked as force_coherent,
1558 * so use the DMA API for them.
1559 */
1560 if (!nv_device_is_cpu_coherent(device) &&
Alexandre Courbotdcccdc12014-12-11 03:09:10 +09001561 ttm->caching_state == tt_uncached) {
Alexandre Courbotc3a0c772014-10-27 18:49:17 +09001562 ttm_dma_unpopulate(ttm_dma, dev->dev);
Alexandre Courbotdcccdc12014-12-11 03:09:10 +09001563 return;
1564 }
Alexandre Courbotc3a0c772014-10-27 18:49:17 +09001565
Jerome Glissedea7e0a2012-01-03 17:37:37 -05001566#if __OS_HAS_AGP
Ben Skeggsebb945a2012-07-20 08:17:34 +10001567 if (drm->agp.stat == ENABLED) {
Jerome Glissedea7e0a2012-01-03 17:37:37 -05001568 ttm_agp_tt_unpopulate(ttm);
1569 return;
1570 }
1571#endif
1572
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001573#ifdef CONFIG_SWIOTLB
1574 if (swiotlb_nr_tbl()) {
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001575 ttm_dma_unpopulate((void *)ttm, dev->dev);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001576 return;
1577 }
1578#endif
1579
1580 for (i = 0; i < ttm->num_pages; i++) {
Jerome Glisse8e7e7052011-11-09 17:15:26 -05001581 if (ttm_dma->dma_address[i]) {
Alexandre Courbotfd1496a2014-07-31 18:09:42 +09001582 dma_unmap_page(pdev, ttm_dma->dma_address[i], PAGE_SIZE,
1583 DMA_BIDIRECTIONAL);
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001584 }
1585 }
1586
1587 ttm_pool_unpopulate(ttm);
1588}
1589
Maarten Lankhorstdd7cfd62014-01-21 13:07:31 +01001590void
Maarten Lankhorst809e9442014-04-09 16:19:30 +02001591nouveau_bo_fence(struct nouveau_bo *nvbo, struct nouveau_fence *fence, bool exclusive)
Maarten Lankhorstdd7cfd62014-01-21 13:07:31 +01001592{
Maarten Lankhorst29ba89b2014-01-09 11:03:11 +01001593 struct reservation_object *resv = nvbo->bo.resv;
Maarten Lankhorstdd7cfd62014-01-21 13:07:31 +01001594
Maarten Lankhorst809e9442014-04-09 16:19:30 +02001595 if (exclusive)
1596 reservation_object_add_excl_fence(resv, &fence->base);
1597 else if (fence)
1598 reservation_object_add_shared_fence(resv, &fence->base);
Maarten Lankhorstdd7cfd62014-01-21 13:07:31 +01001599}
1600
Ben Skeggs6ee73862009-12-11 19:24:15 +10001601struct ttm_bo_driver nouveau_bo_driver = {
Jerome Glisse649bf3c2011-11-01 20:46:13 -04001602 .ttm_tt_create = &nouveau_ttm_tt_create,
Konrad Rzeszutek Wilk3230cfc2011-10-17 17:14:26 -04001603 .ttm_tt_populate = &nouveau_ttm_tt_populate,
1604 .ttm_tt_unpopulate = &nouveau_ttm_tt_unpopulate,
Ben Skeggs6ee73862009-12-11 19:24:15 +10001605 .invalidate_caches = nouveau_bo_invalidate_caches,
1606 .init_mem_type = nouveau_bo_init_mem_type,
1607 .evict_flags = nouveau_bo_evict_flags,
Ben Skeggsa4154bb2011-02-10 10:35:16 +10001608 .move_notify = nouveau_bo_move_ntfy,
Ben Skeggs6ee73862009-12-11 19:24:15 +10001609 .move = nouveau_bo_move,
1610 .verify_access = nouveau_bo_verify_access,
Jerome Glissef32f02f2010-04-09 14:39:25 +02001611 .fault_reserve_notify = &nouveau_ttm_fault_reserve_notify,
1612 .io_mem_reserve = &nouveau_ttm_io_mem_reserve,
1613 .io_mem_free = &nouveau_ttm_io_mem_free,
Ben Skeggs6ee73862009-12-11 19:24:15 +10001614};
1615
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001616struct nvkm_vma *
1617nouveau_bo_vma_find(struct nouveau_bo *nvbo, struct nvkm_vm *vm)
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001618{
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001619 struct nvkm_vma *vma;
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001620 list_for_each_entry(vma, &nvbo->vma_list, head) {
1621 if (vma->vm == vm)
1622 return vma;
1623 }
1624
1625 return NULL;
1626}
1627
1628int
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001629nouveau_bo_vma_add(struct nouveau_bo *nvbo, struct nvkm_vm *vm,
1630 struct nvkm_vma *vma)
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001631{
1632 const u32 size = nvbo->bo.mem.num_pages << PAGE_SHIFT;
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001633 int ret;
1634
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001635 ret = nvkm_vm_get(vm, size, nvbo->page_shift,
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001636 NV_MEM_ACCESS_RW, vma);
1637 if (ret)
1638 return ret;
1639
Ben Skeggs2e2cfbe2013-11-15 11:56:49 +10001640 if ( nvbo->bo.mem.mem_type != TTM_PL_SYSTEM &&
1641 (nvbo->bo.mem.mem_type == TTM_PL_VRAM ||
Ben Skeggs5ce3bf32015-01-14 09:57:36 +10001642 nvbo->page_shift != vma->vm->mmu->lpg_shift))
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001643 nvkm_vm_map(vma, nvbo->bo.mem.mm_node);
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001644
1645 list_add_tail(&vma->head, &nvbo->vma_list);
Ben Skeggs2fd3db62011-06-07 15:25:12 +10001646 vma->refcount = 1;
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001647 return 0;
1648}
1649
1650void
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001651nouveau_bo_vma_del(struct nouveau_bo *nvbo, struct nvkm_vma *vma)
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001652{
1653 if (vma->node) {
Ben Skeggsc4c70442013-05-07 09:48:30 +10001654 if (nvbo->bo.mem.mem_type != TTM_PL_SYSTEM)
Ben Skeggsbe83cd42015-01-14 15:36:34 +10001655 nvkm_vm_unmap(vma);
1656 nvkm_vm_put(vma);
Ben Skeggsfd2871a2011-06-06 14:07:04 +10001657 list_del(&vma->head);
1658 }
1659}