/*
 * Copyright(c) 2011-2016 Intel Corporation. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Zhi Wang <zhi.a.wang@intel.com>
 *
 * Contributors:
 *    Ping Gao <ping.a.gao@intel.com>
 *    Tina Zhang <tina.zhang@intel.com>
 *    Changbin Du <changbin.du@intel.com>
 *    Min He <min.he@intel.com>
 *    Bing Niu <bing.niu@intel.com>
 *    Zhenyu Wang <zhenyuw@linux.intel.com>
 *
 */

#include <linux/kthread.h>

#include "i915_drv.h"
#include "gvt.h"

#define RING_CTX_OFF(x) \
	offsetof(struct execlist_ring_context, x)

static void set_context_pdp_root_pointer(
		struct execlist_ring_context *ring_context,
		u32 pdp[8])
{
	struct execlist_mmio_pair *pdp_pair = &ring_context->pdp3_UDW;
	int i;

	for (i = 0; i < 8; i++)
		pdp_pair[i].val = pdp[7 - i];
}
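
/*
 * A worked example of the reversal above, assuming the conventional
 * execlist ring context layout in which the PDP register pairs sit
 * back to back starting at pdp3_UDW:
 *
 *   i = 0: pdp_pair[0] (pdp3_UDW) <- pdp[7]
 *   i = 1: pdp_pair[1] (pdp3_LDW) <- pdp[6]
 *   ...
 *   i = 7: pdp_pair[7] (pdp0_LDW) <- pdp[0]
 *
 * i.e. the caller hands in the page-directory pointers lowest dword
 * first, while the context image stores the upper dword of PDP3 first.
 */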

static int populate_shadow_context(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_gvt *gvt = vgpu->gvt;
	int ring_id = workload->ring_id;
	struct i915_gem_context *shadow_ctx = vgpu->submission.shadow_ctx;
	struct drm_i915_gem_object *ctx_obj =
		shadow_ctx->engine[ring_id].state->obj;
	struct execlist_ring_context *shadow_ring_context;
	struct page *page;
	void *dst;
	unsigned long context_gpa, context_page_num;
	int i;

	gvt_dbg_sched("ring id %d workload lrca %x", ring_id,
			workload->ctx_desc.lrca);

	context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

	context_page_num = context_page_num >> PAGE_SHIFT;

	if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
		context_page_num = 19;

	i = 2;

	while (i < context_page_num) {
		context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
				(u32)((workload->ctx_desc.lrca + i) <<
				I915_GTT_PAGE_SHIFT));
		if (context_gpa == INTEL_GVT_INVALID_ADDR) {
			gvt_vgpu_err("Invalid guest context descriptor\n");
			return -EFAULT;
		}

		page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
		dst = kmap(page);
		intel_gvt_hypervisor_read_gpa(vgpu, context_gpa, dst,
				I915_GTT_PAGE_SIZE);
		kunmap(page);
		i++;
	}

	page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
	shadow_ring_context = kmap(page);

#define COPY_REG(name) \
	intel_gvt_hypervisor_read_gpa(vgpu, workload->ring_context_gpa \
		+ RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

	COPY_REG(ctx_ctrl);
	COPY_REG(ctx_timestamp);

	if (ring_id == RCS) {
		COPY_REG(bb_per_ctx_ptr);
		COPY_REG(rcs_indirect_ctx);
		COPY_REG(rcs_indirect_ctx_offset);
	}
#undef COPY_REG

	set_context_pdp_root_pointer(shadow_ring_context,
			workload->shadow_mm->shadow_page_table);

	intel_gvt_hypervisor_read_gpa(vgpu,
			workload->ring_context_gpa +
			sizeof(*shadow_ring_context),
			(void *)shadow_ring_context +
			sizeof(*shadow_ring_context),
			I915_GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

	kunmap(page);
	return 0;
}

static inline bool is_gvt_request(struct drm_i915_gem_request *req)
{
	return i915_gem_context_force_single_submission(req->ctx);
}
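
/*
 * Note: the shadow contexts GVT creates (via i915_gem_context_create_gvt()
 * in intel_vgpu_setup_submission() below) are marked force-single-
 * submission, and that flag is what distinguishes a request submitted on
 * behalf of a guest from a regular host i915 request here.
 */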

static void save_ring_hw_state(struct intel_vgpu *vgpu, int ring_id)
{
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	u32 ring_base = dev_priv->engine[ring_id]->mmio_base;
	i915_reg_t reg;

	reg = RING_INSTDONE(ring_base);
	vgpu_vreg(vgpu, i915_mmio_reg_offset(reg)) = I915_READ_FW(reg);
	reg = RING_ACTHD(ring_base);
	vgpu_vreg(vgpu, i915_mmio_reg_offset(reg)) = I915_READ_FW(reg);
	reg = RING_ACTHD_UDW(ring_base);
	vgpu_vreg(vgpu, i915_mmio_reg_offset(reg)) = I915_READ_FW(reg);
}
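
/*
 * save_ring_hw_state() is invoked on the schedule-out and preemption
 * paths below so that the vGPU's virtual INSTDONE/ACTHD registers
 * reflect the hardware state the guest would expect to read back,
 * e.g. when diagnosing a hang.
 */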

static int shadow_context_status_change(struct notifier_block *nb,
		unsigned long action, void *data)
{
	struct drm_i915_gem_request *req = (struct drm_i915_gem_request *)data;
	struct intel_gvt *gvt = container_of(nb, struct intel_gvt,
				shadow_ctx_notifier_block[req->engine->id]);
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	enum intel_engine_id ring_id = req->engine->id;
	struct intel_vgpu_workload *workload;

	if (!is_gvt_request(req)) {
		spin_lock_bh(&scheduler->mmio_context_lock);
		if (action == INTEL_CONTEXT_SCHEDULE_IN &&
		    scheduler->engine_owner[ring_id]) {
			/* Switch ring from vGPU to host. */
			intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
					      NULL, ring_id);
			scheduler->engine_owner[ring_id] = NULL;
		}
		spin_unlock_bh(&scheduler->mmio_context_lock);

		return NOTIFY_OK;
	}

	workload = scheduler->current_workload[ring_id];
	if (unlikely(!workload))
		return NOTIFY_OK;

	switch (action) {
	case INTEL_CONTEXT_SCHEDULE_IN:
		spin_lock_bh(&scheduler->mmio_context_lock);
		if (workload->vgpu != scheduler->engine_owner[ring_id]) {
			/* Switch ring from host to vGPU or vGPU to vGPU. */
			intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
					      workload->vgpu, ring_id);
			scheduler->engine_owner[ring_id] = workload->vgpu;
		} else
			gvt_dbg_sched("skip ring %d mmio switch for vgpu%d\n",
				      ring_id, workload->vgpu->id);
		spin_unlock_bh(&scheduler->mmio_context_lock);
		atomic_set(&workload->shadow_ctx_active, 1);
		break;
	case INTEL_CONTEXT_SCHEDULE_OUT:
		save_ring_hw_state(workload->vgpu, ring_id);
		atomic_set(&workload->shadow_ctx_active, 0);
		break;
	case INTEL_CONTEXT_SCHEDULE_PREEMPTED:
		save_ring_hw_state(workload->vgpu, ring_id);
		break;
	default:
		WARN_ON(1);
		return NOTIFY_OK;
	}
	wake_up(&workload->shadow_ctx_status_wq);
	return NOTIFY_OK;
}
204
Kechen Lu9dfb8e52017-08-10 07:41:36 +0800205static void shadow_context_descriptor_update(struct i915_gem_context *ctx,
206 struct intel_engine_cs *engine)
207{
208 struct intel_context *ce = &ctx->engine[engine->id];
209 u64 desc = 0;
210
211 desc = ce->lrc_desc;
212
213 /* Update bits 0-11 of the context descriptor which includes flags
214 * like GEN8_CTX_* cached in desc_template
215 */
216 desc &= U64_MAX << 12;
217 desc |= ctx->desc_template & ((1ULL << 12) - 1);
218
219 ce->lrc_desc = desc;
220}
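
/*
 * The masking above works out as follows:
 *
 *   U64_MAX << 12    == 0xfffffffffffff000  (keep bits 63:12 of desc)
 *   (1ULL << 12) - 1 == 0x0000000000000fff  (take bits 11:0 of template)
 *
 * so e.g. desc = 0x123456789abcdef0 with desc_template = 0x321 yields
 * 0x123456789abcd321: only the low 12 flag bits are refreshed.
 */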

static int copy_workload_to_ring_buffer(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	void *shadow_ring_buffer_va;
	u32 *cs;

	/* allocate shadow ring buffer */
	cs = intel_ring_begin(workload->req, workload->rb_len / sizeof(u32));
	if (IS_ERR(cs)) {
		gvt_vgpu_err("fail to alloc size =%ld shadow ring buffer\n",
			workload->rb_len);
		return PTR_ERR(cs);
	}

	shadow_ring_buffer_va = workload->shadow_ring_buffer_va;

	/* get shadow ring buffer va */
	workload->shadow_ring_buffer_va = cs;

	memcpy(cs, shadow_ring_buffer_va,
			workload->rb_len);

	cs += workload->rb_len / sizeof(u32);
	intel_ring_advance(workload->req, cs);

	return 0;
}
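
/*
 * Note the pointer hand-off in copy_workload_to_ring_buffer(): on entry
 * workload->shadow_ring_buffer_va holds the scanned copy of the guest
 * ring buffer contents; after the memcpy() it points at the location
 * inside the i915 request's ring where those commands now live.
 */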
249
Chris Wilson7b302552017-11-20 13:29:58 +0000250static void release_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
fred gaoa3cfdca2017-08-18 15:41:07 +0800251{
252 if (!wa_ctx->indirect_ctx.obj)
253 return;
254
255 i915_gem_object_unpin_map(wa_ctx->indirect_ctx.obj);
256 i915_gem_object_put(wa_ctx->indirect_ctx.obj);
257}
258

/**
 * intel_gvt_scan_and_shadow_workload - audit the workload by scanning and
 * shadow it as well, including the ring buffer, wa_ctx and ctx.
 * @workload: an abstract entity for each execlist submission.
 *
 * This function is called before the workload is submitted to i915, to make
 * sure the content of the workload is valid.
 */
int intel_gvt_scan_and_shadow_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	int ring_id = workload->ring_id;
	struct intel_engine_cs *engine = dev_priv->engine[ring_id];
	struct intel_ring *ring;
	int ret;

	lockdep_assert_held(&dev_priv->drm.struct_mutex);

	if (workload->shadowed)
		return 0;

	shadow_ctx->desc_template &= ~(0x3 << GEN8_CTX_ADDRESSING_MODE_SHIFT);
	shadow_ctx->desc_template |= workload->ctx_desc.addressing_mode <<
				    GEN8_CTX_ADDRESSING_MODE_SHIFT;

	if (!test_and_set_bit(ring_id, s->shadow_ctx_desc_updated))
		shadow_context_descriptor_update(shadow_ctx,
					dev_priv->engine[ring_id]);

	ret = intel_gvt_scan_and_shadow_ringbuffer(workload);
	if (ret)
		goto err_scan;

	if ((workload->ring_id == RCS) &&
	    (workload->wa_ctx.indirect_ctx.size != 0)) {
		ret = intel_gvt_scan_and_shadow_wa_ctx(&workload->wa_ctx);
		if (ret)
			goto err_scan;
	}

	/* Pin the shadow context by GVT even though it will also be pinned
	 * when i915 allocates a request. That is because GVT will update the
	 * guest context from the shadow context when the workload is
	 * completed, and at that moment i915 may already have unpinned the
	 * shadow context, making the shadow_ctx pages invalid. So GVT needs
	 * to pin it by itself. After the guest context is updated, GVT can
	 * unpin the shadow_ctx safely.
	 */
	ring = engine->context_pin(engine, shadow_ctx);
	if (IS_ERR(ring)) {
		ret = PTR_ERR(ring);
		gvt_vgpu_err("fail to pin shadow context\n");
		goto err_shadow;
	}

	ret = populate_shadow_context(workload);
	if (ret)
		goto err_unpin;
	workload->shadowed = true;
	return 0;

err_unpin:
	engine->context_unpin(engine, shadow_ctx);
err_shadow:
	release_shadow_wa_ctx(&workload->wa_ctx);
err_scan:
	return ret;
}
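
/*
 * intel_gvt_scan_and_shadow_workload() has two callers in this file:
 * dispatch_workload(), right before submission, and
 * intel_vgpu_create_workload(), which shadows the first workload of an
 * empty queue eagerly. The workload->shadowed flag makes whichever call
 * comes second a no-op.
 */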

static int intel_gvt_generate_request(struct intel_vgpu_workload *workload)
{
	int ring_id = workload->ring_id;
	struct drm_i915_private *dev_priv = workload->vgpu->gvt->dev_priv;
	struct intel_engine_cs *engine = dev_priv->engine[ring_id];
	struct drm_i915_gem_request *rq;
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	int ret;

	rq = i915_gem_request_alloc(dev_priv->engine[ring_id], shadow_ctx);
	if (IS_ERR(rq)) {
		gvt_vgpu_err("fail to allocate gem request\n");
		ret = PTR_ERR(rq);
		goto err_unpin;
	}

	gvt_dbg_sched("ring id %d get i915 gem request %p\n", ring_id, rq);

	workload->req = i915_gem_request_get(rq);
	ret = copy_workload_to_ring_buffer(workload);
	if (ret)
		goto err_unpin;
	return 0;

err_unpin:
	engine->context_unpin(engine, shadow_ctx);
	release_shadow_wa_ctx(&workload->wa_ctx);
	return ret;
}

static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload);

static int prepare_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
	struct intel_gvt *gvt = workload->vgpu->gvt;
	const int gmadr_bytes = gvt->device_info.gmadr_bytes_in_cmd;
	struct intel_vgpu_shadow_bb *bb;
	int ret;

	list_for_each_entry(bb, &workload->shadow_bb, list) {
		bb->vma = i915_gem_object_ggtt_pin(bb->obj, NULL, 0, 0, 0);
		if (IS_ERR(bb->vma)) {
			ret = PTR_ERR(bb->vma);
			goto err;
		}

		/* relocate shadow batch buffer */
		bb->bb_start_cmd_va[1] = i915_ggtt_offset(bb->vma);
		if (gmadr_bytes == 8)
			bb->bb_start_cmd_va[2] = 0;

		/* No one is going to touch shadow bb from now on. */
		if (bb->clflush & CLFLUSH_AFTER) {
			drm_clflush_virt_range(bb->va, bb->obj->base.size);
			bb->clflush &= ~CLFLUSH_AFTER;
		}

		ret = i915_gem_object_set_to_gtt_domain(bb->obj, false);
		if (ret)
			goto err;

		i915_gem_obj_finish_shmem_access(bb->obj);
		bb->accessing = false;

		i915_vma_move_to_active(bb->vma, workload->req, 0);
	}
	return 0;
err:
	release_shadow_batch_buffer(workload);
	return ret;
}

static int update_wa_ctx_2_shadow_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
	struct intel_vgpu_workload *workload = container_of(wa_ctx,
					struct intel_vgpu_workload,
					wa_ctx);
	int ring_id = workload->ring_id;
	struct intel_vgpu_submission *s = &workload->vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	struct drm_i915_gem_object *ctx_obj =
		shadow_ctx->engine[ring_id].state->obj;
	struct execlist_ring_context *shadow_ring_context;
	struct page *page;

	page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
	shadow_ring_context = kmap_atomic(page);

	shadow_ring_context->bb_per_ctx_ptr.val =
		(shadow_ring_context->bb_per_ctx_ptr.val &
		(~PER_CTX_ADDR_MASK)) | wa_ctx->per_ctx.shadow_gma;
	shadow_ring_context->rcs_indirect_ctx.val =
		(shadow_ring_context->rcs_indirect_ctx.val &
		(~INDIRECT_CTX_ADDR_MASK)) | wa_ctx->indirect_ctx.shadow_gma;

	kunmap_atomic(shadow_ring_context);
	return 0;
}

static int prepare_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
	struct i915_vma *vma;
	unsigned char *per_ctx_va =
		(unsigned char *)wa_ctx->indirect_ctx.shadow_va +
		wa_ctx->indirect_ctx.size;

	if (wa_ctx->indirect_ctx.size == 0)
		return 0;

	vma = i915_gem_object_ggtt_pin(wa_ctx->indirect_ctx.obj, NULL,
				       0, CACHELINE_BYTES, 0);
	if (IS_ERR(vma))
		return PTR_ERR(vma);

	/* FIXME: we are not tracking our pinned VMA leaving it
	 * up to the core to fix up the stray pin_count upon
	 * free.
	 */

	wa_ctx->indirect_ctx.shadow_gma = i915_ggtt_offset(vma);

	wa_ctx->per_ctx.shadow_gma = *((unsigned int *)per_ctx_va + 1);
	memset(per_ctx_va, 0, CACHELINE_BYTES);

	update_wa_ctx_2_shadow_ctx(wa_ctx);
	return 0;
}

static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	struct intel_vgpu_shadow_bb *bb, *pos;

	if (list_empty(&workload->shadow_bb))
		return;

	bb = list_first_entry(&workload->shadow_bb,
			struct intel_vgpu_shadow_bb, list);

	mutex_lock(&dev_priv->drm.struct_mutex);

	list_for_each_entry_safe(bb, pos, &workload->shadow_bb, list) {
		if (bb->obj) {
			if (bb->accessing)
				i915_gem_obj_finish_shmem_access(bb->obj);

			if (bb->va && !IS_ERR(bb->va))
				i915_gem_object_unpin_map(bb->obj);

			if (bb->vma && !IS_ERR(bb->vma)) {
				i915_vma_unpin(bb->vma);
				i915_vma_close(bb->vma);
			}
			__i915_gem_object_release_unless_active(bb->obj);
		}
		list_del(&bb->list);
		kfree(bb);
	}

	mutex_unlock(&dev_priv->drm.struct_mutex);
}

static int prepare_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	int ret = 0;

	ret = intel_vgpu_pin_mm(workload->shadow_mm);
	if (ret) {
		gvt_vgpu_err("fail to vgpu pin mm\n");
		return ret;
	}

	ret = intel_vgpu_sync_oos_pages(workload->vgpu);
	if (ret) {
		gvt_vgpu_err("fail to vgpu sync oos pages\n");
		goto err_unpin_mm;
	}

	ret = intel_vgpu_flush_post_shadow(workload->vgpu);
	if (ret) {
		gvt_vgpu_err("fail to flush post shadow\n");
		goto err_unpin_mm;
	}

	ret = intel_gvt_generate_request(workload);
	if (ret) {
		gvt_vgpu_err("fail to generate request\n");
		goto err_unpin_mm;
	}

	ret = prepare_shadow_batch_buffer(workload);
	if (ret) {
		gvt_vgpu_err("fail to prepare_shadow_batch_buffer\n");
		goto err_unpin_mm;
	}

	ret = prepare_shadow_wa_ctx(&workload->wa_ctx);
	if (ret) {
		gvt_vgpu_err("fail to prepare_shadow_wa_ctx\n");
		goto err_shadow_batch;
	}

	if (workload->prepare) {
		ret = workload->prepare(workload);
		if (ret)
			goto err_shadow_wa_ctx;
	}

	return 0;
err_shadow_wa_ctx:
	release_shadow_wa_ctx(&workload->wa_ctx);
err_shadow_batch:
	release_shadow_batch_buffer(workload);
err_unpin_mm:
	intel_vgpu_unpin_mm(workload->shadow_mm);
	return ret;
}

static int dispatch_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	int ring_id = workload->ring_id;
	struct intel_engine_cs *engine = dev_priv->engine[ring_id];
	int ret = 0;

	gvt_dbg_sched("ring id %d prepare to dispatch workload %p\n",
		ring_id, workload);

	mutex_lock(&dev_priv->drm.struct_mutex);

	ret = intel_gvt_scan_and_shadow_workload(workload);
	if (ret)
		goto out;

	ret = prepare_workload(workload);
	if (ret) {
		engine->context_unpin(engine, shadow_ctx);
		goto out;
	}

out:
	if (ret)
		workload->status = ret;

	if (!IS_ERR_OR_NULL(workload->req)) {
		gvt_dbg_sched("ring id %d submit workload to i915 %p\n",
			ring_id, workload->req);
		i915_add_request(workload->req);
		workload->dispatched = true;
	}

	mutex_unlock(&dev_priv->drm.struct_mutex);
	return ret;
}

static struct intel_vgpu_workload *pick_next_workload(
		struct intel_gvt *gvt, int ring_id)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_vgpu_workload *workload = NULL;

	mutex_lock(&gvt->lock);

	/*
	 * no current vgpu / will be scheduled out / no workload
	 * bail out
	 */
	if (!scheduler->current_vgpu) {
		gvt_dbg_sched("ring id %d stop - no current vgpu\n", ring_id);
		goto out;
	}

	if (scheduler->need_reschedule) {
		gvt_dbg_sched("ring id %d stop - will reschedule\n", ring_id);
		goto out;
	}

	if (list_empty(workload_q_head(scheduler->current_vgpu, ring_id)))
		goto out;

	/*
	 * still have a current workload; maybe the workload dispatcher
	 * failed to submit it for some reason, so resubmit it.
	 */
	if (scheduler->current_workload[ring_id]) {
		workload = scheduler->current_workload[ring_id];
		gvt_dbg_sched("ring id %d still have current workload %p\n",
				ring_id, workload);
		goto out;
	}

	/*
	 * pick a workload as the current workload.
	 * once the current workload is set, the schedule policy routines
	 * will wait until the current workload is finished when trying to
	 * schedule out a vgpu.
	 */
	scheduler->current_workload[ring_id] = container_of(
			workload_q_head(scheduler->current_vgpu, ring_id)->next,
			struct intel_vgpu_workload, list);

	workload = scheduler->current_workload[ring_id];

	gvt_dbg_sched("ring id %d pick new workload %p\n", ring_id, workload);

	atomic_inc(&workload->vgpu->submission.running_workload_num);
out:
	mutex_unlock(&gvt->lock);
	return workload;
}

static void update_guest_context(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_gvt *gvt = vgpu->gvt;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	int ring_id = workload->ring_id;
	struct drm_i915_gem_object *ctx_obj =
		shadow_ctx->engine[ring_id].state->obj;
	struct execlist_ring_context *shadow_ring_context;
	struct page *page;
	void *src;
	unsigned long context_gpa, context_page_num;
	int i;

	gvt_dbg_sched("ring id %d workload lrca %x\n", ring_id,
			workload->ctx_desc.lrca);

	context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

	context_page_num = context_page_num >> PAGE_SHIFT;

	if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
		context_page_num = 19;

	i = 2;

	while (i < context_page_num) {
		context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
				(u32)((workload->ctx_desc.lrca + i) <<
					I915_GTT_PAGE_SHIFT));
		if (context_gpa == INTEL_GVT_INVALID_ADDR) {
			gvt_vgpu_err("invalid guest context descriptor\n");
			return;
		}

		page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
		src = kmap(page);
		intel_gvt_hypervisor_write_gpa(vgpu, context_gpa, src,
				I915_GTT_PAGE_SIZE);
		kunmap(page);
		i++;
	}

	intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa +
		RING_CTX_OFF(ring_header.val), &workload->rb_tail, 4);

	page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
	shadow_ring_context = kmap(page);

#define COPY_REG(name) \
	intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa + \
		RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

	COPY_REG(ctx_ctrl);
	COPY_REG(ctx_timestamp);

#undef COPY_REG

	intel_gvt_hypervisor_write_gpa(vgpu,
			workload->ring_context_gpa +
			sizeof(*shadow_ring_context),
			(void *)shadow_ring_context +
			sizeof(*shadow_ring_context),
			I915_GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

	kunmap(page);
}

static void clean_workloads(struct intel_vgpu *vgpu, unsigned long engine_mask)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	struct intel_engine_cs *engine;
	struct intel_vgpu_workload *pos, *n;
	unsigned int tmp;

	/* free the unsubmitted workloads in the queues. */
	for_each_engine_masked(engine, dev_priv, engine_mask, tmp) {
		list_for_each_entry_safe(pos, n,
			&s->workload_q_head[engine->id], list) {
			list_del_init(&pos->list);
			intel_vgpu_destroy_workload(pos);
		}
		clear_bit(engine->id, s->shadow_ctx_desc_updated);
	}
}

static void complete_current_workload(struct intel_gvt *gvt, int ring_id)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_vgpu_workload *workload =
		scheduler->current_workload[ring_id];
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	int event;

	mutex_lock(&gvt->lock);

	/* For a workload w/ a request, we need to wait for the context
	 * switch to make sure the request is completed.
	 * For a workload w/o a request, directly complete the workload.
	 */
	if (workload->req) {
		struct drm_i915_private *dev_priv =
			workload->vgpu->gvt->dev_priv;
		struct intel_engine_cs *engine =
			dev_priv->engine[workload->ring_id];
		wait_event(workload->shadow_ctx_status_wq,
			   !atomic_read(&workload->shadow_ctx_active));

		/* If this request caused a GPU hang, req->fence.error will
		 * be set to -EIO. Propagate -EIO into the workload status so
		 * that, when the request caused a GPU hang, we don't trigger
		 * a context switch interrupt to the guest.
		 */
		if (likely(workload->status == -EINPROGRESS)) {
			if (workload->req->fence.error == -EIO)
				workload->status = -EIO;
			else
				workload->status = 0;
		}

		i915_gem_request_put(fetch_and_zero(&workload->req));

		if (!workload->status && !(vgpu->resetting_eng &
					   ENGINE_MASK(ring_id))) {
			update_guest_context(workload);

			for_each_set_bit(event, workload->pending_events,
					 INTEL_GVT_EVENT_MAX)
				intel_vgpu_trigger_virtual_event(vgpu, event);
		}
		mutex_lock(&dev_priv->drm.struct_mutex);
		/* unpin shadow ctx as the shadow_ctx update is done */
		engine->context_unpin(engine, s->shadow_ctx);
		mutex_unlock(&dev_priv->drm.struct_mutex);
	}

	gvt_dbg_sched("ring id %d complete workload %p status %d\n",
			ring_id, workload, workload->status);

	scheduler->current_workload[ring_id] = NULL;

	list_del_init(&workload->list);

	if (!workload->status) {
		release_shadow_batch_buffer(workload);
		release_shadow_wa_ctx(&workload->wa_ctx);
	}

	if (workload->status || (vgpu->resetting_eng & ENGINE_MASK(ring_id))) {
		/* If workload->status is not successful, it means the HW GPU
		 * hit a hang or something went wrong with i915/GVT, and GVT
		 * won't inject a context switch interrupt to the guest. So
		 * this error is effectively a vGPU hang from the guest's
		 * point of view, and we should emulate a vGPU hang
		 * accordingly. If there are pending workloads already
		 * submitted from the guest, we should clean them up like the
		 * HW GPU would.
		 *
		 * If we are in the middle of an engine reset, the pending
		 * workloads won't be submitted to the HW GPU and will be
		 * cleaned up later during the resetting process, so doing
		 * the workload clean up here doesn't have any impact.
		 */
		clean_workloads(vgpu, ENGINE_MASK(ring_id));
	}

	workload->complete(workload);

	atomic_dec(&s->running_workload_num);
	wake_up(&scheduler->workload_complete_wq);

	if (gvt->scheduler.need_reschedule)
		intel_gvt_request_service(gvt, INTEL_GVT_REQUEST_EVENT_SCHED);

	mutex_unlock(&gvt->lock);
}

struct workload_thread_param {
	struct intel_gvt *gvt;
	int ring_id;
};

static int workload_thread(void *priv)
{
	struct workload_thread_param *p = (struct workload_thread_param *)priv;
	struct intel_gvt *gvt = p->gvt;
	int ring_id = p->ring_id;
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_vgpu_workload *workload = NULL;
	struct intel_vgpu *vgpu = NULL;
	int ret;
	bool need_force_wake = IS_SKYLAKE(gvt->dev_priv)
			|| IS_KABYLAKE(gvt->dev_priv);
	DEFINE_WAIT_FUNC(wait, woken_wake_function);

	kfree(p);

	gvt_dbg_core("workload thread for ring %d started\n", ring_id);

	while (!kthread_should_stop()) {
		add_wait_queue(&scheduler->waitq[ring_id], &wait);
		do {
			workload = pick_next_workload(gvt, ring_id);
			if (workload)
				break;
			wait_woken(&wait, TASK_INTERRUPTIBLE,
				   MAX_SCHEDULE_TIMEOUT);
		} while (!kthread_should_stop());
		remove_wait_queue(&scheduler->waitq[ring_id], &wait);

		if (!workload)
			break;

		gvt_dbg_sched("ring id %d next workload %p vgpu %d\n",
				workload->ring_id, workload,
				workload->vgpu->id);

		intel_runtime_pm_get(gvt->dev_priv);

		gvt_dbg_sched("ring id %d will dispatch workload %p\n",
				workload->ring_id, workload);

		if (need_force_wake)
			intel_uncore_forcewake_get(gvt->dev_priv,
					FORCEWAKE_ALL);

		mutex_lock(&gvt->lock);
		ret = dispatch_workload(workload);
		mutex_unlock(&gvt->lock);

		if (ret) {
			vgpu = workload->vgpu;
			gvt_vgpu_err("fail to dispatch workload, skip\n");
			goto complete;
		}

		gvt_dbg_sched("ring id %d wait workload %p\n",
				workload->ring_id, workload);
		i915_wait_request(workload->req, 0, MAX_SCHEDULE_TIMEOUT);

complete:
		gvt_dbg_sched("will complete workload %p, status: %d\n",
				workload, workload->status);

		complete_current_workload(gvt, ring_id);

		if (need_force_wake)
			intel_uncore_forcewake_put(gvt->dev_priv,
					FORCEWAKE_ALL);

		intel_runtime_pm_put(gvt->dev_priv);
		if (ret && (vgpu_is_vm_unhealthy(ret)))
			enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
	}
	return 0;
}

void intel_gvt_wait_vgpu_idle(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct intel_gvt *gvt = vgpu->gvt;
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;

	if (atomic_read(&s->running_workload_num)) {
		gvt_dbg_sched("wait vgpu idle\n");

		wait_event(scheduler->workload_complete_wq,
			   !atomic_read(&s->running_workload_num));
	}
}

void intel_gvt_clean_workload_scheduler(struct intel_gvt *gvt)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_engine_cs *engine;
	enum intel_engine_id i;

	gvt_dbg_core("clean workload scheduler\n");

	for_each_engine(engine, gvt->dev_priv, i) {
		atomic_notifier_chain_unregister(
					&engine->context_status_notifier,
					&gvt->shadow_ctx_notifier_block[i]);
		kthread_stop(scheduler->thread[i]);
	}
}

int intel_gvt_init_workload_scheduler(struct intel_gvt *gvt)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct workload_thread_param *param = NULL;
	struct intel_engine_cs *engine;
	enum intel_engine_id i;
	int ret;

	gvt_dbg_core("init workload scheduler\n");

	init_waitqueue_head(&scheduler->workload_complete_wq);

	for_each_engine(engine, gvt->dev_priv, i) {
		init_waitqueue_head(&scheduler->waitq[i]);

		param = kzalloc(sizeof(*param), GFP_KERNEL);
		if (!param) {
			ret = -ENOMEM;
			goto err;
		}

		param->gvt = gvt;
		param->ring_id = i;

		scheduler->thread[i] = kthread_run(workload_thread, param,
			"gvt workload %d", i);
		if (IS_ERR(scheduler->thread[i])) {
			gvt_err("fail to create workload thread\n");
			ret = PTR_ERR(scheduler->thread[i]);
			goto err;
		}

		gvt->shadow_ctx_notifier_block[i].notifier_call =
					shadow_context_status_change;
		atomic_notifier_chain_register(&engine->context_status_notifier,
					&gvt->shadow_ctx_notifier_block[i]);
	}
	return 0;
err:
	intel_gvt_clean_workload_scheduler(gvt);
	kfree(param);
	param = NULL;
	return ret;
}

/**
 * intel_vgpu_clean_submission - free submission-related resources for vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being destroyed.
 *
 */
void intel_vgpu_clean_submission(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;

	intel_vgpu_select_submission_ops(vgpu, 0);
	i915_gem_context_put(s->shadow_ctx);
	kmem_cache_destroy(s->workloads);
}

/**
 * intel_vgpu_reset_submission - reset submission-related resources for vGPU
 * @vgpu: a vGPU
 * @engine_mask: engines expected to be reset
 *
 * This function is called when a vGPU is being reset.
 *
 */
void intel_vgpu_reset_submission(struct intel_vgpu *vgpu,
		unsigned long engine_mask)
{
	struct intel_vgpu_submission *s = &vgpu->submission;

	if (!s->active)
		return;

	clean_workloads(vgpu, engine_mask);
	s->ops->reset(vgpu, engine_mask);
}

/**
 * intel_vgpu_setup_submission - setup submission-related resources for vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being created.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_setup_submission(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	enum intel_engine_id i;
	struct intel_engine_cs *engine;
	int ret;

	s->shadow_ctx = i915_gem_context_create_gvt(
			&vgpu->gvt->dev_priv->drm);
	if (IS_ERR(s->shadow_ctx))
		return PTR_ERR(s->shadow_ctx);

	bitmap_zero(s->shadow_ctx_desc_updated, I915_NUM_ENGINES);

	s->workloads = kmem_cache_create("gvt-g_vgpu_workload",
			sizeof(struct intel_vgpu_workload), 0,
			SLAB_HWCACHE_ALIGN,
			NULL);

	if (!s->workloads) {
		ret = -ENOMEM;
		goto out_shadow_ctx;
	}

	for_each_engine(engine, vgpu->gvt->dev_priv, i)
		INIT_LIST_HEAD(&s->workload_q_head[i]);

	atomic_set(&s->running_workload_num, 0);
	bitmap_zero(s->tlb_handle_pending, I915_NUM_ENGINES);

	return 0;

out_shadow_ctx:
	i915_gem_context_put(s->shadow_ctx);
	return ret;
}

/**
 * intel_vgpu_select_submission_ops - select virtual submission interface
 * @vgpu: a vGPU
 * @interface: expected vGPU virtual submission interface
 *
 * This function is called when the guest configures the submission interface.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_select_submission_ops(struct intel_vgpu *vgpu,
		unsigned int interface)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	const struct intel_vgpu_submission_ops *ops[] = {
		[INTEL_VGPU_EXECLIST_SUBMISSION] =
			&intel_vgpu_execlist_submission_ops,
	};
	int ret;

	if (WARN_ON(interface >= ARRAY_SIZE(ops)))
		return -EINVAL;

	if (s->active) {
		s->ops->clean(vgpu);
		s->active = false;
		gvt_dbg_core("vgpu%d: de-select ops [ %s ]\n",
				vgpu->id, s->ops->name);
	}

	if (interface == 0) {
		s->ops = NULL;
		s->virtual_submission_interface = 0;
		gvt_dbg_core("vgpu%d: no submission ops\n", vgpu->id);
		return 0;
	}

	ret = ops[interface]->init(vgpu);
	if (ret)
		return ret;

	s->ops = ops[interface];
	s->virtual_submission_interface = interface;
	s->active = true;

	gvt_dbg_core("vgpu%d: activate ops [ %s ]\n",
			vgpu->id, s->ops->name);

	return 0;
}

/**
 * intel_vgpu_destroy_workload - destroy a vGPU workload
 * @workload: the workload to destroy
 *
 * This function is called when destroying a vGPU workload.
 *
 */
void intel_vgpu_destroy_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu_submission *s = &workload->vgpu->submission;

	if (workload->shadow_mm)
		intel_gvt_mm_unreference(workload->shadow_mm);

	kmem_cache_free(s->workloads, workload);
}

static struct intel_vgpu_workload *
alloc_workload(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct intel_vgpu_workload *workload;

	workload = kmem_cache_zalloc(s->workloads, GFP_KERNEL);
	if (!workload)
		return ERR_PTR(-ENOMEM);

	INIT_LIST_HEAD(&workload->list);
	INIT_LIST_HEAD(&workload->shadow_bb);

	init_waitqueue_head(&workload->shadow_ctx_status_wq);
	atomic_set(&workload->shadow_ctx_active, 0);

	workload->status = -EINPROGRESS;
	workload->shadowed = false;
	workload->vgpu = vgpu;

	return workload;
}

#define RING_CTX_OFF(x) \
	offsetof(struct execlist_ring_context, x)

static void read_guest_pdps(struct intel_vgpu *vgpu,
		u64 ring_context_gpa, u32 pdp[8])
{
	u64 gpa;
	int i;

	gpa = ring_context_gpa + RING_CTX_OFF(pdp3_UDW.val);

	for (i = 0; i < 8; i++)
		intel_gvt_hypervisor_read_gpa(vgpu,
				gpa + i * 8, &pdp[7 - i], 4);
}
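
/*
 * read_guest_pdps() mirrors set_context_pdp_root_pointer(): the guest
 * ring context stores pdp3_UDW first, so the dword at gpa + 0 lands in
 * pdp[7] and the dword at gpa + 56 lands in pdp[0], recovering the
 * low-dword-first pdp[8] ordering used elsewhere in this file.
 */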

static int prepare_mm(struct intel_vgpu_workload *workload)
{
	struct execlist_ctx_descriptor_format *desc = &workload->ctx_desc;
	struct intel_vgpu_mm *mm;
	struct intel_vgpu *vgpu = workload->vgpu;
	int page_table_level;
	u32 pdp[8];

	if (desc->addressing_mode == 1) { /* legacy 32-bit */
		page_table_level = 3;
	} else if (desc->addressing_mode == 3) { /* legacy 64 bit */
		page_table_level = 4;
	} else {
		gvt_vgpu_err("Advanced Context mode(SVM) is not supported!\n");
		return -EINVAL;
	}

	read_guest_pdps(workload->vgpu, workload->ring_context_gpa, pdp);

	mm = intel_vgpu_find_ppgtt_mm(workload->vgpu, page_table_level, pdp);
	if (mm) {
		intel_gvt_mm_reference(mm);
	} else {
		mm = intel_vgpu_create_mm(workload->vgpu, INTEL_GVT_MM_PPGTT,
				pdp, page_table_level, 0);
		if (IS_ERR(mm)) {
			gvt_vgpu_err("fail to create mm object.\n");
			return PTR_ERR(mm);
		}
	}
	workload->shadow_mm = mm;
	return 0;
}

#define same_context(a, b) (((a)->context_id == (b)->context_id) && \
		((a)->lrca == (b)->lrca))

#define get_last_workload(q) \
	(list_empty(q) ? NULL : container_of(q->prev, \
	struct intel_vgpu_workload, list))
/**
 * intel_vgpu_create_workload - create a vGPU workload
 * @vgpu: a vGPU
 * @ring_id: the ring the workload is submitted on
 * @desc: a guest context descriptor
 *
 * This function is called when creating a vGPU workload.
 *
 * Returns:
 * struct intel_vgpu_workload * on success, negative error code in
 * pointer if failed.
 *
 */
struct intel_vgpu_workload *
intel_vgpu_create_workload(struct intel_vgpu *vgpu, int ring_id,
			   struct execlist_ctx_descriptor_format *desc)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct list_head *q = workload_q_head(vgpu, ring_id);
	struct intel_vgpu_workload *last_workload = get_last_workload(q);
	struct intel_vgpu_workload *workload = NULL;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	u64 ring_context_gpa;
	u32 head, tail, start, ctl, ctx_ctl, per_ctx, indirect_ctx;
	int ret;

	ring_context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
			(u32)((desc->lrca + 1) << I915_GTT_PAGE_SHIFT));
	if (ring_context_gpa == INTEL_GVT_INVALID_ADDR) {
		gvt_vgpu_err("invalid guest context LRCA: %x\n", desc->lrca);
		return ERR_PTR(-EINVAL);
	}

	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(ring_header.val), &head, 4);

	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(ring_tail.val), &tail, 4);

	head &= RB_HEAD_OFF_MASK;
	tail &= RB_TAIL_OFF_MASK;

	if (last_workload && same_context(&last_workload->ctx_desc, desc)) {
		gvt_dbg_el("ring id %d cur workload == last\n", ring_id);
		gvt_dbg_el("ctx head %x real head %lx\n", head,
				last_workload->rb_tail);
		/*
		 * cannot use guest context head pointer here,
		 * as it might not be updated at this time
		 */
		head = last_workload->rb_tail;
	}

	gvt_dbg_el("ring id %d begin a new workload\n", ring_id);

	/* record some ring buffer register values for scan and shadow */
	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(rb_start.val), &start, 4);
	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(rb_ctrl.val), &ctl, 4);
	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(ctx_ctrl.val), &ctx_ctl, 4);

	workload = alloc_workload(vgpu);
	if (IS_ERR(workload))
		return workload;

	workload->ring_id = ring_id;
	workload->ctx_desc = *desc;
	workload->ring_context_gpa = ring_context_gpa;
	workload->rb_head = head;
	workload->rb_tail = tail;
	workload->rb_start = start;
	workload->rb_ctl = ctl;

	if (ring_id == RCS) {
		intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(bb_per_ctx_ptr.val), &per_ctx, 4);
		intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(rcs_indirect_ctx.val), &indirect_ctx, 4);

		workload->wa_ctx.indirect_ctx.guest_gma =
			indirect_ctx & INDIRECT_CTX_ADDR_MASK;
		workload->wa_ctx.indirect_ctx.size =
			(indirect_ctx & INDIRECT_CTX_SIZE_MASK) *
			CACHELINE_BYTES;
		workload->wa_ctx.per_ctx.guest_gma =
			per_ctx & PER_CTX_ADDR_MASK;
		workload->wa_ctx.per_ctx.valid = per_ctx & 1;
	}

	gvt_dbg_el("workload %p ring id %d head %x tail %x start %x ctl %x\n",
			workload, ring_id, head, tail, start, ctl);

	ret = prepare_mm(workload);
	if (ret) {
		kmem_cache_free(s->workloads, workload);
		return ERR_PTR(ret);
	}

	/* Only scan and shadow the first workload in the queue
	 * as there is only one pre-allocated buf-obj for shadow.
	 */
	if (list_empty(workload_q_head(vgpu, ring_id))) {
		intel_runtime_pm_get(dev_priv);
		mutex_lock(&dev_priv->drm.struct_mutex);
		ret = intel_gvt_scan_and_shadow_workload(workload);
		mutex_unlock(&dev_priv->drm.struct_mutex);
		intel_runtime_pm_put(dev_priv);
	}

	if (ret && (vgpu_is_vm_unhealthy(ret))) {
		enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
		intel_vgpu_destroy_workload(workload);
		return ERR_PTR(ret);
	}

	return workload;
}

/**
 * intel_vgpu_queue_workload - queue a vGPU workload
 * @workload: the workload to queue in
 */
void intel_vgpu_queue_workload(struct intel_vgpu_workload *workload)
{
	list_add_tail(&workload->list,
		workload_q_head(workload->vgpu, workload->ring_id));
	intel_gvt_kick_schedule(workload->vgpu->gvt);
	wake_up(&workload->vgpu->gvt->scheduler.waitq[workload->ring_id]);
}
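
/*
 * A sketch of the workload life cycle as implemented in this file, for
 * the execlist submission path:
 *
 *   intel_vgpu_create_workload()      construct from the guest context
 *   intel_vgpu_queue_workload()       enqueue and kick the scheduler
 *   workload_thread()                 pick_next_workload()
 *     -> dispatch_workload()          scan/shadow, prepare, submit to i915
 *     -> complete_current_workload()  copy results back to the guest
 */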