/*
 * Copyright(c) 2011-2016 Intel Corporation. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Zhi Wang <zhi.a.wang@intel.com>
 *
 * Contributors:
 *    Ping Gao <ping.a.gao@intel.com>
 *    Tina Zhang <tina.zhang@intel.com>
 *    Chanbin Du <changbin.du@intel.com>
 *    Min He <min.he@intel.com>
 *    Bing Niu <bing.niu@intel.com>
 *    Zhenyu Wang <zhenyuw@linux.intel.com>
 *
 */

#include <linux/kthread.h>

#include "i915_drv.h"
#include "gvt.h"

#define RING_CTX_OFF(x) \
	offsetof(struct execlist_ring_context, x)

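/*
 * Write the PDP root pointers into a ring context. The MMIO pairs are laid
 * out from pdp3 down to pdp0, hence the reversed index.
 */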
static void set_context_pdp_root_pointer(
		struct execlist_ring_context *ring_context,
		u32 pdp[8])
{
	struct execlist_mmio_pair *pdp_pair = &ring_context->pdp3_UDW;
	int i;

	for (i = 0; i < 8; i++)
		pdp_pair[i].val = pdp[7 - i];
}

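/*
 * Populate the shadow context from the guest: copy the guest context pages
 * and the shadowed ring context registers into the shadow context object,
 * and point the PDP root pointers at the shadow page tables.
 */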
static int populate_shadow_context(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_gvt *gvt = vgpu->gvt;
	int ring_id = workload->ring_id;
	struct i915_gem_context *shadow_ctx = vgpu->submission.shadow_ctx;
	struct drm_i915_gem_object *ctx_obj =
		shadow_ctx->engine[ring_id].state->obj;
	struct execlist_ring_context *shadow_ring_context;
	struct page *page;
	void *dst;
	unsigned long context_gpa, context_page_num;
	int i;

	gvt_dbg_sched("ring id %d workload lrca %x", ring_id,
			workload->ctx_desc.lrca);

	context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

	context_page_num = context_page_num >> PAGE_SHIFT;

	if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
		context_page_num = 19;

	i = 2;

	while (i < context_page_num) {
		context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
				(u32)((workload->ctx_desc.lrca + i) <<
				GTT_PAGE_SHIFT));
		if (context_gpa == INTEL_GVT_INVALID_ADDR) {
			gvt_vgpu_err("Invalid guest context descriptor\n");
			return -EFAULT;
		}

		page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
		dst = kmap(page);
		intel_gvt_hypervisor_read_gpa(vgpu, context_gpa, dst,
				GTT_PAGE_SIZE);
		kunmap(page);
		i++;
	}

	page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
	shadow_ring_context = kmap(page);

#define COPY_REG(name) \
	intel_gvt_hypervisor_read_gpa(vgpu, workload->ring_context_gpa \
		+ RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

	COPY_REG(ctx_ctrl);
	COPY_REG(ctx_timestamp);

	if (ring_id == RCS) {
		COPY_REG(bb_per_ctx_ptr);
		COPY_REG(rcs_indirect_ctx);
		COPY_REG(rcs_indirect_ctx_offset);
	}
#undef COPY_REG

	set_context_pdp_root_pointer(shadow_ring_context,
			workload->shadow_mm->shadow_page_table);

	intel_gvt_hypervisor_read_gpa(vgpu,
			workload->ring_context_gpa +
			sizeof(*shadow_ring_context),
			(void *)shadow_ring_context +
			sizeof(*shadow_ring_context),
			GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

	kunmap(page);
	return 0;
}

static inline bool is_gvt_request(struct drm_i915_gem_request *req)
{
	return i915_gem_context_force_single_submission(req->ctx);
}

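/*
 * Context status notifier. For host-owned requests, hand the engine MMIO
 * state back to the host on schedule-in. For GVT requests, switch the MMIO
 * state to the owning vGPU and track whether the shadow context is active
 * on the hardware.
 */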
static int shadow_context_status_change(struct notifier_block *nb,
		unsigned long action, void *data)
{
	struct drm_i915_gem_request *req = (struct drm_i915_gem_request *)data;
	struct intel_gvt *gvt = container_of(nb, struct intel_gvt,
				shadow_ctx_notifier_block[req->engine->id]);
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	enum intel_engine_id ring_id = req->engine->id;
	struct intel_vgpu_workload *workload;

	if (!is_gvt_request(req)) {
		spin_lock_bh(&scheduler->mmio_context_lock);
		if (action == INTEL_CONTEXT_SCHEDULE_IN &&
		    scheduler->engine_owner[ring_id]) {
			/* Switch ring from vGPU to host. */
			intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
					      NULL, ring_id);
			scheduler->engine_owner[ring_id] = NULL;
		}
		spin_unlock_bh(&scheduler->mmio_context_lock);

		return NOTIFY_OK;
	}

	workload = scheduler->current_workload[ring_id];
	if (unlikely(!workload))
		return NOTIFY_OK;

	switch (action) {
	case INTEL_CONTEXT_SCHEDULE_IN:
		spin_lock_bh(&scheduler->mmio_context_lock);
		if (workload->vgpu != scheduler->engine_owner[ring_id]) {
			/* Switch ring from host to vGPU or vGPU to vGPU. */
			intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
					      workload->vgpu, ring_id);
			scheduler->engine_owner[ring_id] = workload->vgpu;
		} else
			gvt_dbg_sched("skip ring %d mmio switch for vgpu%d\n",
				      ring_id, workload->vgpu->id);
		spin_unlock_bh(&scheduler->mmio_context_lock);
		atomic_set(&workload->shadow_ctx_active, 1);
		break;
	case INTEL_CONTEXT_SCHEDULE_OUT:
	case INTEL_CONTEXT_SCHEDULE_PREEMPTED:
		atomic_set(&workload->shadow_ctx_active, 0);
		break;
	default:
		WARN_ON(1);
		return NOTIFY_OK;
	}
	wake_up(&workload->shadow_ctx_status_wq);
	return NOTIFY_OK;
}

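/*
 * Refresh the low 12 bits of the cached context descriptor (the GEN8_CTX_*
 * flags held in desc_template) without touching the address bits.
 */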
static void shadow_context_descriptor_update(struct i915_gem_context *ctx,
		struct intel_engine_cs *engine)
{
	struct intel_context *ce = &ctx->engine[engine->id];
	u64 desc = 0;

	desc = ce->lrc_desc;

	/* Update bits 0-11 of the context descriptor which includes flags
	 * like GEN8_CTX_* cached in desc_template
	 */
	desc &= U64_MAX << 12;
	desc |= ctx->desc_template & ((1ULL << 12) - 1);

	ce->lrc_desc = desc;
}

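/*
 * Reserve space in the shadow context's ring buffer and copy the already
 * scanned guest ring buffer commands into it, so the request replays the
 * guest submission from the shadow ring.
 */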
static int copy_workload_to_ring_buffer(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	void *shadow_ring_buffer_va;
	u32 *cs;

	/* allocate shadow ring buffer */
	cs = intel_ring_begin(workload->req, workload->rb_len / sizeof(u32));
	if (IS_ERR(cs)) {
		gvt_vgpu_err("fail to alloc size =%ld shadow ring buffer\n",
			workload->rb_len);
		return PTR_ERR(cs);
	}

	shadow_ring_buffer_va = workload->shadow_ring_buffer_va;

	/* get shadow ring buffer va */
	workload->shadow_ring_buffer_va = cs;

	memcpy(cs, shadow_ring_buffer_va,
			workload->rb_len);

	cs += workload->rb_len / sizeof(u32);
	intel_ring_advance(workload->req, cs);

	return 0;
}

void release_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
	if (!wa_ctx->indirect_ctx.obj)
		return;

	i915_gem_object_unpin_map(wa_ctx->indirect_ctx.obj);
	i915_gem_object_put(wa_ctx->indirect_ctx.obj);
}

/**
 * intel_gvt_scan_and_shadow_workload - audit the workload by scanning and
 * shadowing it as well, including the ring buffer, wa_ctx and ctx.
 * @workload: an abstract entity for each execlist submission.
 *
 * This function is called before the workload is submitted to i915, to make
 * sure the content of the workload is valid.
 */
int intel_gvt_scan_and_shadow_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	int ring_id = workload->ring_id;
	struct intel_engine_cs *engine = dev_priv->engine[ring_id];
	struct drm_i915_gem_request *rq;
	struct intel_ring *ring;
	int ret;

	lockdep_assert_held(&dev_priv->drm.struct_mutex);

	if (workload->shadowed)
		return 0;

	shadow_ctx->desc_template &= ~(0x3 << GEN8_CTX_ADDRESSING_MODE_SHIFT);
	shadow_ctx->desc_template |= workload->ctx_desc.addressing_mode <<
				     GEN8_CTX_ADDRESSING_MODE_SHIFT;

	if (!test_and_set_bit(ring_id, s->shadow_ctx_desc_updated))
		shadow_context_descriptor_update(shadow_ctx,
					dev_priv->engine[ring_id]);

	ret = intel_gvt_scan_and_shadow_ringbuffer(workload);
	if (ret)
		goto err_scan;

	if ((workload->ring_id == RCS) &&
	    (workload->wa_ctx.indirect_ctx.size != 0)) {
		ret = intel_gvt_scan_and_shadow_wa_ctx(&workload->wa_ctx);
		if (ret)
			goto err_scan;
	}

	/* Pin the shadow context by GVT even though it will also be pinned
	 * when i915 allocates a request. GVT updates the guest context from
	 * the shadow context when the workload completes, and by that time
	 * i915 may already have unpinned the shadow context, making the
	 * shadow_ctx pages invalid. So GVT needs its own pin; after the
	 * guest context is updated, the shadow_ctx can be unpinned safely.
	 */
	ring = engine->context_pin(engine, shadow_ctx);
	if (IS_ERR(ring)) {
		ret = PTR_ERR(ring);
		gvt_vgpu_err("fail to pin shadow context\n");
		goto err_shadow;
	}

	ret = populate_shadow_context(workload);
	if (ret)
		goto err_unpin;

	rq = i915_gem_request_alloc(dev_priv->engine[ring_id], shadow_ctx);
	if (IS_ERR(rq)) {
		gvt_vgpu_err("fail to allocate gem request\n");
		ret = PTR_ERR(rq);
		goto err_unpin;
	}

	gvt_dbg_sched("ring id %d get i915 gem request %p\n", ring_id, rq);

	workload->req = i915_gem_request_get(rq);
	ret = copy_workload_to_ring_buffer(workload);
	if (ret)
		goto err_unpin;
	workload->shadowed = true;
	return 0;

err_unpin:
	engine->context_unpin(engine, shadow_ctx);
err_shadow:
	release_shadow_wa_ctx(&workload->wa_ctx);
err_scan:
	return ret;
}

static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload);

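/*
 * Pin each shadow batch buffer into the GGTT, relocate the batch buffer
 * start command to the shadow GGTT offset, flush any pending CPU writes and
 * add the VMA to the request's active list.
 */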
static int prepare_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
	struct intel_gvt *gvt = workload->vgpu->gvt;
	const int gmadr_bytes = gvt->device_info.gmadr_bytes_in_cmd;
	struct intel_vgpu_shadow_bb *bb;
	int ret;

	list_for_each_entry(bb, &workload->shadow_bb, list) {
		bb->vma = i915_gem_object_ggtt_pin(bb->obj, NULL, 0, 0, 0);
		if (IS_ERR(bb->vma)) {
			ret = PTR_ERR(bb->vma);
			goto err;
		}

		/* relocate shadow batch buffer */
		bb->bb_start_cmd_va[1] = i915_ggtt_offset(bb->vma);
		if (gmadr_bytes == 8)
			bb->bb_start_cmd_va[2] = 0;

		/* No one is going to touch shadow bb from now on. */
		if (bb->clflush & CLFLUSH_AFTER) {
			drm_clflush_virt_range(bb->va, bb->obj->base.size);
			bb->clflush &= ~CLFLUSH_AFTER;
		}

		ret = i915_gem_object_set_to_gtt_domain(bb->obj, false);
		if (ret)
			goto err;

		i915_gem_obj_finish_shmem_access(bb->obj);
		bb->accessing = false;

		i915_vma_move_to_active(bb->vma, workload->req, 0);
	}
	return 0;
err:
	release_shadow_batch_buffer(workload);
	return ret;
}

static int update_wa_ctx_2_shadow_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
	struct intel_vgpu_workload *workload = container_of(wa_ctx,
					struct intel_vgpu_workload,
					wa_ctx);
	int ring_id = workload->ring_id;
	struct intel_vgpu_submission *s = &workload->vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	struct drm_i915_gem_object *ctx_obj =
		shadow_ctx->engine[ring_id].state->obj;
	struct execlist_ring_context *shadow_ring_context;
	struct page *page;

	page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
	shadow_ring_context = kmap_atomic(page);

	shadow_ring_context->bb_per_ctx_ptr.val =
		(shadow_ring_context->bb_per_ctx_ptr.val &
		(~PER_CTX_ADDR_MASK)) | wa_ctx->per_ctx.shadow_gma;
	shadow_ring_context->rcs_indirect_ctx.val =
		(shadow_ring_context->rcs_indirect_ctx.val &
		(~INDIRECT_CTX_ADDR_MASK)) | wa_ctx->indirect_ctx.shadow_gma;

	kunmap_atomic(shadow_ring_context);
	return 0;
}

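/*
 * Pin the shadow indirect context into the GGTT and propagate the shadow
 * graphics memory addresses of the indirect and per-context batch buffers
 * into the shadow ring context.
 */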
static int prepare_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
	struct i915_vma *vma;
	unsigned char *per_ctx_va =
		(unsigned char *)wa_ctx->indirect_ctx.shadow_va +
		wa_ctx->indirect_ctx.size;

	if (wa_ctx->indirect_ctx.size == 0)
		return 0;

	vma = i915_gem_object_ggtt_pin(wa_ctx->indirect_ctx.obj, NULL,
				       0, CACHELINE_BYTES, 0);
	if (IS_ERR(vma))
		return PTR_ERR(vma);

	/* FIXME: we are not tracking our pinned VMA leaving it
	 * up to the core to fix up the stray pin_count upon
	 * free.
	 */

	wa_ctx->indirect_ctx.shadow_gma = i915_ggtt_offset(vma);

	wa_ctx->per_ctx.shadow_gma = *((unsigned int *)per_ctx_va + 1);
	memset(per_ctx_va, 0, CACHELINE_BYTES);

	update_wa_ctx_2_shadow_ctx(wa_ctx);
	return 0;
}

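/*
 * Tear down the shadow batch buffers of a workload: finish any pending
 * shmem access, unmap and unpin each shadow object and free the per-buffer
 * tracking structures.
 */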
static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	struct intel_vgpu_shadow_bb *bb, *pos;

	if (list_empty(&workload->shadow_bb))
		return;

	bb = list_first_entry(&workload->shadow_bb,
			struct intel_vgpu_shadow_bb, list);

	mutex_lock(&dev_priv->drm.struct_mutex);

	list_for_each_entry_safe(bb, pos, &workload->shadow_bb, list) {
		if (bb->obj) {
			if (bb->accessing)
				i915_gem_obj_finish_shmem_access(bb->obj);

			if (bb->va && !IS_ERR(bb->va))
				i915_gem_object_unpin_map(bb->obj);

			if (bb->vma && !IS_ERR(bb->vma)) {
				i915_vma_unpin(bb->vma);
				i915_vma_close(bb->vma);
			}
			__i915_gem_object_release_unless_active(bb->obj);
		}
		list_del(&bb->list);
		kfree(bb);
	}

	mutex_unlock(&dev_priv->drm.struct_mutex);
}

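/*
 * Prepare a workload for dispatch: pin the shadow page tables, sync
 * out-of-sync guest pages, flush post-shadowed entries, pin the shadow
 * batch buffers and the shadow wa_ctx, then call the submission-specific
 * prepare() callback if one is set.
 */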
static int prepare_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	int ret = 0;

	ret = intel_vgpu_pin_mm(workload->shadow_mm);
	if (ret) {
		gvt_vgpu_err("fail to vgpu pin mm\n");
		return ret;
	}

	ret = intel_vgpu_sync_oos_pages(workload->vgpu);
	if (ret) {
		gvt_vgpu_err("fail to vgpu sync oos pages\n");
		goto err_unpin_mm;
	}

	ret = intel_vgpu_flush_post_shadow(workload->vgpu);
	if (ret) {
		gvt_vgpu_err("fail to flush post shadow\n");
		goto err_unpin_mm;
	}

	ret = prepare_shadow_batch_buffer(workload);
	if (ret) {
		gvt_vgpu_err("fail to prepare_shadow_batch_buffer\n");
		goto err_unpin_mm;
	}

	ret = prepare_shadow_wa_ctx(&workload->wa_ctx);
	if (ret) {
		gvt_vgpu_err("fail to prepare_shadow_wa_ctx\n");
		goto err_shadow_batch;
	}

	if (workload->prepare) {
		ret = workload->prepare(workload);
		if (ret)
			goto err_shadow_wa_ctx;
	}

	return 0;
err_shadow_wa_ctx:
	release_shadow_wa_ctx(&workload->wa_ctx);
err_shadow_batch:
	release_shadow_batch_buffer(workload);
err_unpin_mm:
	intel_vgpu_unpin_mm(workload->shadow_mm);
	return ret;
}

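/*
 * Dispatch a workload to i915: scan and shadow it, prepare its resources
 * and submit the resulting request. Any error is stored in workload->status
 * so that completion handling can report it back to the guest.
 */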
static int dispatch_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	int ring_id = workload->ring_id;
	struct intel_engine_cs *engine = dev_priv->engine[ring_id];
	int ret = 0;

	gvt_dbg_sched("ring id %d prepare to dispatch workload %p\n",
		ring_id, workload);

	mutex_lock(&dev_priv->drm.struct_mutex);

	ret = intel_gvt_scan_and_shadow_workload(workload);
	if (ret)
		goto out;

	ret = prepare_workload(workload);
	if (ret) {
		engine->context_unpin(engine, shadow_ctx);
		goto out;
	}

out:
	if (ret)
		workload->status = ret;

	if (!IS_ERR_OR_NULL(workload->req)) {
		gvt_dbg_sched("ring id %d submit workload to i915 %p\n",
			ring_id, workload->req);
		i915_add_request(workload->req);
		workload->dispatched = true;
	}

	mutex_unlock(&dev_priv->drm.struct_mutex);
	return ret;
}

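/*
 * Pick the next workload for a ring. Bail out (return NULL) if there is no
 * current vGPU, a reschedule is pending or the queue is empty. If a current
 * workload is still set it is returned again for resubmission; otherwise
 * the head of the current vGPU's queue becomes the ring's current workload.
 */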
static struct intel_vgpu_workload *pick_next_workload(
		struct intel_gvt *gvt, int ring_id)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_vgpu_workload *workload = NULL;

	mutex_lock(&gvt->lock);

	/*
	 * no current vgpu / will be scheduled out / no workload
	 * bail out
	 */
	if (!scheduler->current_vgpu) {
		gvt_dbg_sched("ring id %d stop - no current vgpu\n", ring_id);
		goto out;
	}

	if (scheduler->need_reschedule) {
		gvt_dbg_sched("ring id %d stop - will reschedule\n", ring_id);
		goto out;
	}

	if (list_empty(workload_q_head(scheduler->current_vgpu, ring_id)))
		goto out;

	/*
	 * still have current workload, maybe the workload dispatcher
	 * failed to submit it for some reason; resubmit it.
	 */
	if (scheduler->current_workload[ring_id]) {
		workload = scheduler->current_workload[ring_id];
		gvt_dbg_sched("ring id %d still have current workload %p\n",
				ring_id, workload);
		goto out;
	}

	/*
	 * pick a workload as current workload
	 * once current workload is set, schedule policy routines
	 * will wait until the current workload is finished when trying to
	 * schedule out a vgpu.
	 */
	scheduler->current_workload[ring_id] = container_of(
			workload_q_head(scheduler->current_vgpu, ring_id)->next,
			struct intel_vgpu_workload, list);

	workload = scheduler->current_workload[ring_id];

	gvt_dbg_sched("ring id %d pick new workload %p\n", ring_id, workload);

	atomic_inc(&workload->vgpu->submission.running_workload_num);
out:
	mutex_unlock(&gvt->lock);
	return workload;
}

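/*
 * Write the shadow context back into the guest context after the workload
 * has completed: copy the context pages, the new ring head and the shadowed
 * ring context registers to guest memory.
 */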
static void update_guest_context(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_gvt *gvt = vgpu->gvt;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	int ring_id = workload->ring_id;
	struct drm_i915_gem_object *ctx_obj =
		shadow_ctx->engine[ring_id].state->obj;
	struct execlist_ring_context *shadow_ring_context;
	struct page *page;
	void *src;
	unsigned long context_gpa, context_page_num;
	int i;

	gvt_dbg_sched("ring id %d workload lrca %x\n", ring_id,
			workload->ctx_desc.lrca);

	context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

	context_page_num = context_page_num >> PAGE_SHIFT;

	if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
		context_page_num = 19;

	i = 2;

	while (i < context_page_num) {
		context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
				(u32)((workload->ctx_desc.lrca + i) <<
					GTT_PAGE_SHIFT));
		if (context_gpa == INTEL_GVT_INVALID_ADDR) {
			gvt_vgpu_err("invalid guest context descriptor\n");
			return;
		}

		page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
		src = kmap(page);
		intel_gvt_hypervisor_write_gpa(vgpu, context_gpa, src,
				GTT_PAGE_SIZE);
		kunmap(page);
		i++;
	}

	intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa +
		RING_CTX_OFF(ring_header.val), &workload->rb_tail, 4);

	page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
	shadow_ring_context = kmap(page);

#define COPY_REG(name) \
	intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa + \
		RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

	COPY_REG(ctx_ctrl);
	COPY_REG(ctx_timestamp);

#undef COPY_REG

	intel_gvt_hypervisor_write_gpa(vgpu,
			workload->ring_context_gpa +
			sizeof(*shadow_ring_context),
			(void *)shadow_ring_context +
			sizeof(*shadow_ring_context),
			GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

	kunmap(page);
}

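/*
 * Destroy all workloads still queued for the engines in engine_mask and
 * clear their shadow context descriptor update bits. Used when emulating a
 * vGPU hang and when resetting engines.
 */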
static void clean_workloads(struct intel_vgpu *vgpu, unsigned long engine_mask)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	struct intel_engine_cs *engine;
	struct intel_vgpu_workload *pos, *n;
	unsigned int tmp;

	/* free the unsubmitted workloads in the queues. */
	for_each_engine_masked(engine, dev_priv, engine_mask, tmp) {
		list_for_each_entry_safe(pos, n,
			&s->workload_q_head[engine->id], list) {
			list_del_init(&pos->list);
			intel_vgpu_destroy_workload(pos);
		}
		clear_bit(engine->id, s->shadow_ctx_desc_updated);
	}
}

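/*
 * Complete the current workload of a ring: wait until the shadow context is
 * off the hardware, propagate the request status, write the shadow context
 * back to the guest and release shadow resources. A failed workload is
 * turned into an emulated vGPU hang by dropping the remaining queued
 * workloads.
 */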
static void complete_current_workload(struct intel_gvt *gvt, int ring_id)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_vgpu_workload *workload =
		scheduler->current_workload[ring_id];
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	int event;

	mutex_lock(&gvt->lock);

	/* For a workload with a request, wait for the context switch to
	 * make sure the request is completed.
	 * For a workload without a request, complete it directly.
	 */
	if (workload->req) {
		struct drm_i915_private *dev_priv =
			workload->vgpu->gvt->dev_priv;
		struct intel_engine_cs *engine =
			dev_priv->engine[workload->ring_id];
		wait_event(workload->shadow_ctx_status_wq,
			   !atomic_read(&workload->shadow_ctx_active));

		/* If this request caused a GPU hang, req->fence.error will
		 * be set to -EIO. Propagate -EIO to the workload status so
		 * that a request which hung the GPU does not trigger a
		 * context switch interrupt to the guest.
		 */
		if (likely(workload->status == -EINPROGRESS)) {
			if (workload->req->fence.error == -EIO)
				workload->status = -EIO;
			else
				workload->status = 0;
		}

		i915_gem_request_put(fetch_and_zero(&workload->req));

		if (!workload->status && !(vgpu->resetting_eng &
					   ENGINE_MASK(ring_id))) {
			update_guest_context(workload);

			for_each_set_bit(event, workload->pending_events,
					 INTEL_GVT_EVENT_MAX)
				intel_vgpu_trigger_virtual_event(vgpu, event);
		}
		mutex_lock(&dev_priv->drm.struct_mutex);
		/* unpin shadow ctx as the shadow_ctx update is done */
		engine->context_unpin(engine, s->shadow_ctx);
		mutex_unlock(&dev_priv->drm.struct_mutex);
	}

	gvt_dbg_sched("ring id %d complete workload %p status %d\n",
			ring_id, workload, workload->status);

	scheduler->current_workload[ring_id] = NULL;

	list_del_init(&workload->list);

	if (!workload->status) {
		release_shadow_batch_buffer(workload);
		release_shadow_wa_ctx(&workload->wa_ctx);
	}

	if (workload->status || (vgpu->resetting_eng & ENGINE_MASK(ring_id))) {
		/* An unsuccessful workload->status means the GPU hung or
		 * something went wrong in i915/GVT, and GVT won't inject a
		 * context switch interrupt to the guest. To the guest this
		 * error is effectively a vGPU hang, so emulate one: if there
		 * are pending workloads already submitted by the guest,
		 * clean them up the way real hardware would.
		 *
		 * If we are in the middle of an engine reset, the pending
		 * workloads won't be submitted to the hardware and will be
		 * cleaned up later in the reset path, so cleaning them up
		 * here has no adverse impact.
		 */
		clean_workloads(vgpu, ENGINE_MASK(ring_id));
	}

	workload->complete(workload);

	atomic_dec(&s->running_workload_num);
	wake_up(&scheduler->workload_complete_wq);

	if (gvt->scheduler.need_reschedule)
		intel_gvt_request_service(gvt, INTEL_GVT_REQUEST_EVENT_SCHED);

	mutex_unlock(&gvt->lock);
}

struct workload_thread_param {
	struct intel_gvt *gvt;
	int ring_id;
};

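/*
 * Per-engine scheduler thread: wait until a workload is available, dispatch
 * it with runtime PM (and forcewake on SKL/KBL) held, wait for the request
 * to finish and then complete the workload. A dispatch error that marks the
 * vGPU unhealthy puts the vGPU into failsafe mode.
 */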
static int workload_thread(void *priv)
{
	struct workload_thread_param *p = (struct workload_thread_param *)priv;
	struct intel_gvt *gvt = p->gvt;
	int ring_id = p->ring_id;
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_vgpu_workload *workload = NULL;
	struct intel_vgpu *vgpu = NULL;
	int ret;
	bool need_force_wake = IS_SKYLAKE(gvt->dev_priv)
			|| IS_KABYLAKE(gvt->dev_priv);
	DEFINE_WAIT_FUNC(wait, woken_wake_function);

	kfree(p);

	gvt_dbg_core("workload thread for ring %d started\n", ring_id);

	while (!kthread_should_stop()) {
		add_wait_queue(&scheduler->waitq[ring_id], &wait);
		do {
			workload = pick_next_workload(gvt, ring_id);
			if (workload)
				break;
			wait_woken(&wait, TASK_INTERRUPTIBLE,
				   MAX_SCHEDULE_TIMEOUT);
		} while (!kthread_should_stop());
		remove_wait_queue(&scheduler->waitq[ring_id], &wait);

		if (!workload)
			break;

		gvt_dbg_sched("ring id %d next workload %p vgpu %d\n",
				workload->ring_id, workload,
				workload->vgpu->id);

		intel_runtime_pm_get(gvt->dev_priv);

		gvt_dbg_sched("ring id %d will dispatch workload %p\n",
				workload->ring_id, workload);

		if (need_force_wake)
			intel_uncore_forcewake_get(gvt->dev_priv,
					FORCEWAKE_ALL);

		mutex_lock(&gvt->lock);
		ret = dispatch_workload(workload);
		mutex_unlock(&gvt->lock);

		if (ret) {
			vgpu = workload->vgpu;
			gvt_vgpu_err("fail to dispatch workload, skip\n");
			goto complete;
		}

		gvt_dbg_sched("ring id %d wait workload %p\n",
				workload->ring_id, workload);
		i915_wait_request(workload->req, 0, MAX_SCHEDULE_TIMEOUT);

complete:
		gvt_dbg_sched("will complete workload %p, status: %d\n",
				workload, workload->status);

		complete_current_workload(gvt, ring_id);

		if (need_force_wake)
			intel_uncore_forcewake_put(gvt->dev_priv,
					FORCEWAKE_ALL);

		intel_runtime_pm_put(gvt->dev_priv);
		if (ret && (vgpu_is_vm_unhealthy(ret)))
			enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
	}
	return 0;
}

void intel_gvt_wait_vgpu_idle(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct intel_gvt *gvt = vgpu->gvt;
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;

	if (atomic_read(&s->running_workload_num)) {
		gvt_dbg_sched("wait vgpu idle\n");

		wait_event(scheduler->workload_complete_wq,
				!atomic_read(&s->running_workload_num));
	}
}

void intel_gvt_clean_workload_scheduler(struct intel_gvt *gvt)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_engine_cs *engine;
	enum intel_engine_id i;

	gvt_dbg_core("clean workload scheduler\n");

	for_each_engine(engine, gvt->dev_priv, i) {
		atomic_notifier_chain_unregister(
					&engine->context_status_notifier,
					&gvt->shadow_ctx_notifier_block[i]);
		kthread_stop(scheduler->thread[i]);
	}
}

int intel_gvt_init_workload_scheduler(struct intel_gvt *gvt)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct workload_thread_param *param = NULL;
	struct intel_engine_cs *engine;
	enum intel_engine_id i;
	int ret;

	gvt_dbg_core("init workload scheduler\n");

	init_waitqueue_head(&scheduler->workload_complete_wq);

	for_each_engine(engine, gvt->dev_priv, i) {
		init_waitqueue_head(&scheduler->waitq[i]);

		param = kzalloc(sizeof(*param), GFP_KERNEL);
		if (!param) {
			ret = -ENOMEM;
			goto err;
		}

		param->gvt = gvt;
		param->ring_id = i;

		scheduler->thread[i] = kthread_run(workload_thread, param,
			"gvt workload %d", i);
		if (IS_ERR(scheduler->thread[i])) {
			gvt_err("fail to create workload thread\n");
			ret = PTR_ERR(scheduler->thread[i]);
			goto err;
		}

		gvt->shadow_ctx_notifier_block[i].notifier_call =
					shadow_context_status_change;
		atomic_notifier_chain_register(&engine->context_status_notifier,
					&gvt->shadow_ctx_notifier_block[i]);
	}
	return 0;
err:
	intel_gvt_clean_workload_scheduler(gvt);
	kfree(param);
	param = NULL;
	return ret;
}

/**
 * intel_vgpu_clean_submission - free submission-related resource for vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being destroyed.
 *
 */
void intel_vgpu_clean_submission(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;

	intel_vgpu_select_submission_ops(vgpu, 0);
	i915_gem_context_put(s->shadow_ctx);
	kmem_cache_destroy(s->workloads);
}

/**
 * intel_vgpu_reset_submission - reset submission-related resource for vGPU
 * @vgpu: a vGPU
 * @engine_mask: engines expected to be reset
 *
 * This function is called when a vGPU is being reset.
 *
 */
void intel_vgpu_reset_submission(struct intel_vgpu *vgpu,
		unsigned long engine_mask)
{
	struct intel_vgpu_submission *s = &vgpu->submission;

	if (!s->active)
		return;

	clean_workloads(vgpu, engine_mask);
	s->ops->reset(vgpu, engine_mask);
}

/**
 * intel_vgpu_setup_submission - setup submission-related resource for vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being created.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_setup_submission(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	enum intel_engine_id i;
	struct intel_engine_cs *engine;
	int ret;

	s->shadow_ctx = i915_gem_context_create_gvt(
			&vgpu->gvt->dev_priv->drm);
	if (IS_ERR(s->shadow_ctx))
		return PTR_ERR(s->shadow_ctx);

	bitmap_zero(s->shadow_ctx_desc_updated, I915_NUM_ENGINES);

	s->workloads = kmem_cache_create("gvt-g_vgpu_workload",
			sizeof(struct intel_vgpu_workload), 0,
			SLAB_HWCACHE_ALIGN,
			NULL);

	if (!s->workloads) {
		ret = -ENOMEM;
		goto out_shadow_ctx;
	}

	for_each_engine(engine, vgpu->gvt->dev_priv, i)
		INIT_LIST_HEAD(&s->workload_q_head[i]);

	atomic_set(&s->running_workload_num, 0);
	bitmap_zero(s->tlb_handle_pending, I915_NUM_ENGINES);

	return 0;

out_shadow_ctx:
	i915_gem_context_put(s->shadow_ctx);
	return ret;
}

/**
 * intel_vgpu_select_submission_ops - select virtual submission interface
 * @vgpu: a vGPU
 * @interface: expected vGPU virtual submission interface
 *
 * This function is called when the guest configures the submission interface.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_select_submission_ops(struct intel_vgpu *vgpu,
				     unsigned int interface)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	const struct intel_vgpu_submission_ops *ops[] = {
		[INTEL_VGPU_EXECLIST_SUBMISSION] =
			&intel_vgpu_execlist_submission_ops,
	};
	int ret;

	if (WARN_ON(interface >= ARRAY_SIZE(ops)))
		return -EINVAL;

	if (s->active) {
		s->ops->clean(vgpu);
		s->active = false;
		gvt_dbg_core("vgpu%d: de-select ops [ %s ] \n",
				vgpu->id, s->ops->name);
	}

	if (interface == 0) {
		s->ops = NULL;
		s->virtual_submission_interface = 0;
		gvt_dbg_core("vgpu%d: no submission ops\n", vgpu->id);
		return 0;
	}

	ret = ops[interface]->init(vgpu);
	if (ret)
		return ret;

	s->ops = ops[interface];
	s->virtual_submission_interface = interface;
	s->active = true;

	gvt_dbg_core("vgpu%d: activate ops [ %s ]\n",
			vgpu->id, s->ops->name);

	return 0;
}

/**
 * intel_vgpu_destroy_workload - destroy a vGPU workload
 * @vgpu: a vGPU
 *
 * This function is called when destroying a vGPU workload.
 *
 */
void intel_vgpu_destroy_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu_submission *s = &workload->vgpu->submission;

	if (workload->shadow_mm)
		intel_gvt_mm_unreference(workload->shadow_mm);

	kmem_cache_free(s->workloads, workload);
}

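/*
 * Allocate a workload from the vGPU's workload slab and initialise its list
 * heads, wait queue and initial state (-EINPROGRESS, not yet shadowed).
 */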
static struct intel_vgpu_workload *
alloc_workload(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct intel_vgpu_workload *workload;

	workload = kmem_cache_zalloc(s->workloads, GFP_KERNEL);
	if (!workload)
		return ERR_PTR(-ENOMEM);

	INIT_LIST_HEAD(&workload->list);
	INIT_LIST_HEAD(&workload->shadow_bb);

	init_waitqueue_head(&workload->shadow_ctx_status_wq);
	atomic_set(&workload->shadow_ctx_active, 0);

	workload->status = -EINPROGRESS;
	workload->shadowed = false;
	workload->vgpu = vgpu;

	return workload;
}

#define RING_CTX_OFF(x) \
	offsetof(struct execlist_ring_context, x)

static void read_guest_pdps(struct intel_vgpu *vgpu,
		u64 ring_context_gpa, u32 pdp[8])
{
	u64 gpa;
	int i;

	gpa = ring_context_gpa + RING_CTX_OFF(pdp3_UDW.val);

	for (i = 0; i < 8; i++)
		intel_gvt_hypervisor_read_gpa(vgpu,
				gpa + i * 8, &pdp[7 - i], 4);
}

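/*
 * Resolve the shadow PPGTT mm for a workload from the guest PDPs in its
 * ring context: reuse a matching shadow mm if one exists, otherwise create
 * a new one. Only legacy 32-bit and 64-bit addressing modes are supported.
 */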
static int prepare_mm(struct intel_vgpu_workload *workload)
{
	struct execlist_ctx_descriptor_format *desc = &workload->ctx_desc;
	struct intel_vgpu_mm *mm;
	struct intel_vgpu *vgpu = workload->vgpu;
	int page_table_level;
	u32 pdp[8];

	if (desc->addressing_mode == 1) { /* legacy 32-bit */
		page_table_level = 3;
	} else if (desc->addressing_mode == 3) { /* legacy 64 bit */
		page_table_level = 4;
	} else {
		gvt_vgpu_err("Advanced Context mode(SVM) is not supported!\n");
		return -EINVAL;
	}

	read_guest_pdps(workload->vgpu, workload->ring_context_gpa, pdp);

	mm = intel_vgpu_find_ppgtt_mm(workload->vgpu, page_table_level, pdp);
	if (mm) {
		intel_gvt_mm_reference(mm);
	} else {

		mm = intel_vgpu_create_mm(workload->vgpu, INTEL_GVT_MM_PPGTT,
				pdp, page_table_level, 0);
		if (IS_ERR(mm)) {
			gvt_vgpu_err("fail to create mm object.\n");
			return PTR_ERR(mm);
		}
	}
	workload->shadow_mm = mm;
	return 0;
}

#define same_context(a, b) (((a)->context_id == (b)->context_id) && \
		((a)->lrca == (b)->lrca))

#define get_last_workload(q) \
	(list_empty(q) ? NULL : container_of(q->prev, \
	struct intel_vgpu_workload, list))
/**
 * intel_vgpu_create_workload - create a vGPU workload
 * @vgpu: a vGPU
 * @ring_id: ring index the workload is queued on
 * @desc: a guest context descriptor
 *
 * This function is called when creating a vGPU workload.
 *
 * Returns:
 * struct intel_vgpu_workload * on success, negative error code in
 * pointer if failed.
 *
 */
struct intel_vgpu_workload *
intel_vgpu_create_workload(struct intel_vgpu *vgpu, int ring_id,
			   struct execlist_ctx_descriptor_format *desc)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct list_head *q = workload_q_head(vgpu, ring_id);
	struct intel_vgpu_workload *last_workload = get_last_workload(q);
	struct intel_vgpu_workload *workload = NULL;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	u64 ring_context_gpa;
	u32 head, tail, start, ctl, ctx_ctl, per_ctx, indirect_ctx;
	int ret;

	ring_context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
			(u32)((desc->lrca + 1) << GTT_PAGE_SHIFT));
	if (ring_context_gpa == INTEL_GVT_INVALID_ADDR) {
		gvt_vgpu_err("invalid guest context LRCA: %x\n", desc->lrca);
		return ERR_PTR(-EINVAL);
	}

	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(ring_header.val), &head, 4);

	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(ring_tail.val), &tail, 4);

	head &= RB_HEAD_OFF_MASK;
	tail &= RB_TAIL_OFF_MASK;

	if (last_workload && same_context(&last_workload->ctx_desc, desc)) {
		gvt_dbg_el("ring id %d cur workload == last\n", ring_id);
		gvt_dbg_el("ctx head %x real head %lx\n", head,
				last_workload->rb_tail);
		/*
		 * cannot use guest context head pointer here,
		 * as it might not be updated at this time
		 */
		head = last_workload->rb_tail;
	}

	gvt_dbg_el("ring id %d begin a new workload\n", ring_id);

	/* record some ring buffer register values for scan and shadow */
	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(rb_start.val), &start, 4);
	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(rb_ctrl.val), &ctl, 4);
	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(ctx_ctrl.val), &ctx_ctl, 4);

	workload = alloc_workload(vgpu);
	if (IS_ERR(workload))
		return workload;

	workload->ring_id = ring_id;
	workload->ctx_desc = *desc;
	workload->ring_context_gpa = ring_context_gpa;
	workload->rb_head = head;
	workload->rb_tail = tail;
	workload->rb_start = start;
	workload->rb_ctl = ctl;

	if (ring_id == RCS) {
		intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(bb_per_ctx_ptr.val), &per_ctx, 4);
		intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(rcs_indirect_ctx.val), &indirect_ctx, 4);

		workload->wa_ctx.indirect_ctx.guest_gma =
			indirect_ctx & INDIRECT_CTX_ADDR_MASK;
		workload->wa_ctx.indirect_ctx.size =
			(indirect_ctx & INDIRECT_CTX_SIZE_MASK) *
			CACHELINE_BYTES;
		workload->wa_ctx.per_ctx.guest_gma =
			per_ctx & PER_CTX_ADDR_MASK;
		workload->wa_ctx.per_ctx.valid = per_ctx & 1;
	}

	gvt_dbg_el("workload %p ring id %d head %x tail %x start %x ctl %x\n",
			workload, ring_id, head, tail, start, ctl);

	ret = prepare_mm(workload);
	if (ret) {
		kmem_cache_free(s->workloads, workload);
		return ERR_PTR(ret);
	}

	/* Only scan and shadow the first workload in the queue
	 * as there is only one pre-allocated buf-obj for shadow.
	 */
	if (list_empty(workload_q_head(vgpu, ring_id))) {
		intel_runtime_pm_get(dev_priv);
		mutex_lock(&dev_priv->drm.struct_mutex);
		ret = intel_gvt_scan_and_shadow_workload(workload);
		mutex_unlock(&dev_priv->drm.struct_mutex);
		intel_runtime_pm_put(dev_priv);
	}

	if (ret && (vgpu_is_vm_unhealthy(ret))) {
		enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
		intel_vgpu_destroy_workload(workload);
		return ERR_PTR(ret);
	}

	return workload;
}