/*
 * Copyright(c) 2011-2016 Intel Corporation. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Zhi Wang <zhi.a.wang@intel.com>
 *
 * Contributors:
 *    Ping Gao <ping.a.gao@intel.com>
 *    Tina Zhang <tina.zhang@intel.com>
 *    Changbin Du <changbin.du@intel.com>
 *    Min He <min.he@intel.com>
 *    Bing Niu <bing.niu@intel.com>
 *    Zhenyu Wang <zhenyuw@linux.intel.com>
 *
 */

#include <linux/kthread.h>

#include "i915_drv.h"
#include "gvt.h"

#define RING_CTX_OFF(x) \
        offsetof(struct execlist_ring_context, x)

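/* The PDP entries in the execlist ring context are laid out from
 * pdp3_UDW down to pdp0_LDW, so the guest-provided pdp[] array is
 * written back in reverse order below.
 */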
static void set_context_pdp_root_pointer(
                struct execlist_ring_context *ring_context,
                u32 pdp[8])
{
        struct execlist_mmio_pair *pdp_pair = &ring_context->pdp3_UDW;
        int i;

        for (i = 0; i < 8; i++)
                pdp_pair[i].val = pdp[7 - i];
}

static void update_shadow_pdps(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        int ring_id = workload->ring_id;
        struct i915_gem_context *shadow_ctx = vgpu->submission.shadow_ctx;
        struct drm_i915_gem_object *ctx_obj =
                shadow_ctx->engine[ring_id].state->obj;
        struct execlist_ring_context *shadow_ring_context;
        struct page *page;

        if (WARN_ON(!workload->shadow_mm))
                return;

        if (WARN_ON(!atomic_read(&workload->shadow_mm->pincount)))
                return;

        page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
        shadow_ring_context = kmap(page);
        set_context_pdp_root_pointer(shadow_ring_context,
                        (void *)workload->shadow_mm->ppgtt_mm.shadow_pdps);
        kunmap(page);
}

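/* Copy the guest's logical ring context into the shadow context: the
 * per-engine context pages are read from guest memory through the
 * hypervisor GPA interface, then a handful of registers and the rest
 * of the ring context page are copied individually.
 */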
static int populate_shadow_context(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_gvt *gvt = vgpu->gvt;
        int ring_id = workload->ring_id;
        struct i915_gem_context *shadow_ctx = vgpu->submission.shadow_ctx;
        struct drm_i915_gem_object *ctx_obj =
                shadow_ctx->engine[ring_id].state->obj;
        struct execlist_ring_context *shadow_ring_context;
        struct page *page;
        void *dst;
        unsigned long context_gpa, context_page_num;
        int i;

        gvt_dbg_sched("ring id %d workload lrca %x", ring_id,
                        workload->ctx_desc.lrca);

        context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

        context_page_num = context_page_num >> PAGE_SHIFT;

        if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
                context_page_num = 19;

        i = 2;

        while (i < context_page_num) {
                context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
                                (u32)((workload->ctx_desc.lrca + i) <<
                                I915_GTT_PAGE_SHIFT));
                if (context_gpa == INTEL_GVT_INVALID_ADDR) {
                        gvt_vgpu_err("Invalid guest context descriptor\n");
                        return -EFAULT;
                }

                page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
                dst = kmap(page);
                intel_gvt_hypervisor_read_gpa(vgpu, context_gpa, dst,
                                I915_GTT_PAGE_SIZE);
                kunmap(page);
                i++;
        }

        page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
        shadow_ring_context = kmap(page);

#define COPY_REG(name) \
        intel_gvt_hypervisor_read_gpa(vgpu, workload->ring_context_gpa \
                + RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

        COPY_REG(ctx_ctrl);
        COPY_REG(ctx_timestamp);

        if (ring_id == RCS) {
                COPY_REG(bb_per_ctx_ptr);
                COPY_REG(rcs_indirect_ctx);
                COPY_REG(rcs_indirect_ctx_offset);
        }
#undef COPY_REG

        intel_gvt_hypervisor_read_gpa(vgpu,
                        workload->ring_context_gpa +
                        sizeof(*shadow_ring_context),
                        (void *)shadow_ring_context +
                        sizeof(*shadow_ring_context),
                        I915_GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

        kunmap(page);
        return 0;
}

static inline bool is_gvt_request(struct i915_request *req)
{
        return i915_gem_context_force_single_submission(req->ctx);
}

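/* Snapshot hardware status registers (INSTDONE/ACTHD) into the vGPU's
 * virtual register file when a workload leaves the hardware, so the
 * guest reads back post-execution values instead of stale ones.
 */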
static void save_ring_hw_state(struct intel_vgpu *vgpu, int ring_id)
{
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        u32 ring_base = dev_priv->engine[ring_id]->mmio_base;
        i915_reg_t reg;

        reg = RING_INSTDONE(ring_base);
        vgpu_vreg(vgpu, i915_mmio_reg_offset(reg)) = I915_READ_FW(reg);
        reg = RING_ACTHD(ring_base);
        vgpu_vreg(vgpu, i915_mmio_reg_offset(reg)) = I915_READ_FW(reg);
        reg = RING_ACTHD_UDW(ring_base);
        vgpu_vreg(vgpu, i915_mmio_reg_offset(reg)) = I915_READ_FW(reg);
}

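/* Notifier called by i915 on context status changes. For non-GVT
 * requests it only switches engine MMIO state back to the host when a
 * host context is scheduled in over a vGPU owner; for GVT requests it
 * performs the vGPU MMIO context switch, saves ring HW state on
 * schedule-out/preemption, and tracks shadow_ctx_active so that
 * complete_current_workload() can wait for the switch to finish.
 */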
static int shadow_context_status_change(struct notifier_block *nb,
                unsigned long action, void *data)
{
        struct i915_request *req = data;
        struct intel_gvt *gvt = container_of(nb, struct intel_gvt,
                                shadow_ctx_notifier_block[req->engine->id]);
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        enum intel_engine_id ring_id = req->engine->id;
        struct intel_vgpu_workload *workload;
        unsigned long flags;

        if (!is_gvt_request(req)) {
                spin_lock_irqsave(&scheduler->mmio_context_lock, flags);
                if (action == INTEL_CONTEXT_SCHEDULE_IN &&
                    scheduler->engine_owner[ring_id]) {
                        /* Switch ring from vGPU to host. */
                        intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
                                              NULL, ring_id);
                        scheduler->engine_owner[ring_id] = NULL;
                }
                spin_unlock_irqrestore(&scheduler->mmio_context_lock, flags);

                return NOTIFY_OK;
        }

        workload = scheduler->current_workload[ring_id];
        if (unlikely(!workload))
                return NOTIFY_OK;

        switch (action) {
        case INTEL_CONTEXT_SCHEDULE_IN:
                spin_lock_irqsave(&scheduler->mmio_context_lock, flags);
                if (workload->vgpu != scheduler->engine_owner[ring_id]) {
                        /* Switch ring from host to vGPU or vGPU to vGPU. */
                        intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
                                              workload->vgpu, ring_id);
                        scheduler->engine_owner[ring_id] = workload->vgpu;
                } else
                        gvt_dbg_sched("skip ring %d mmio switch for vgpu%d\n",
                                      ring_id, workload->vgpu->id);
                spin_unlock_irqrestore(&scheduler->mmio_context_lock, flags);
                atomic_set(&workload->shadow_ctx_active, 1);
                break;
        case INTEL_CONTEXT_SCHEDULE_OUT:
                save_ring_hw_state(workload->vgpu, ring_id);
                atomic_set(&workload->shadow_ctx_active, 0);
                break;
        case INTEL_CONTEXT_SCHEDULE_PREEMPTED:
                save_ring_hw_state(workload->vgpu, ring_id);
                break;
        default:
                WARN_ON(1);
                return NOTIFY_OK;
        }
        wake_up(&workload->shadow_ctx_status_wq);
        return NOTIFY_OK;
}

static void shadow_context_descriptor_update(struct i915_gem_context *ctx,
                struct intel_engine_cs *engine)
{
        struct intel_context *ce = &ctx->engine[engine->id];
        u64 desc = 0;

        desc = ce->lrc_desc;

        /* Update bits 0-11 of the context descriptor which includes flags
         * like GEN8_CTX_* cached in desc_template
         */
        desc &= U64_MAX << 12;
        desc |= ctx->desc_template & ((1ULL << 12) - 1);

        ce->lrc_desc = desc;
}

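/* Copy the already-scanned guest ring buffer contents into space
 * reserved on the shadow (i915) ring via intel_ring_begin(), and
 * repoint workload->shadow_ring_buffer_va at the copy.
 */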
static int copy_workload_to_ring_buffer(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        void *shadow_ring_buffer_va;
        u32 *cs;
        struct i915_request *req = workload->req;

        if (IS_KABYLAKE(req->i915) &&
            is_inhibit_context(req->ctx, req->engine->id))
                intel_vgpu_restore_inhibit_context(vgpu, req);

        /* allocate shadow ring buffer */
        cs = intel_ring_begin(workload->req, workload->rb_len / sizeof(u32));
        if (IS_ERR(cs)) {
                gvt_vgpu_err("fail to alloc size =%ld shadow ring buffer\n",
                        workload->rb_len);
                return PTR_ERR(cs);
        }

        shadow_ring_buffer_va = workload->shadow_ring_buffer_va;

        /* get shadow ring buffer va */
        workload->shadow_ring_buffer_va = cs;

        memcpy(cs, shadow_ring_buffer_va,
                        workload->rb_len);

        cs += workload->rb_len / sizeof(u32);
        intel_ring_advance(workload->req, cs);

        return 0;
}

static void release_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
        if (!wa_ctx->indirect_ctx.obj)
                return;

        i915_gem_object_unpin_map(wa_ctx->indirect_ctx.obj);
        i915_gem_object_put(wa_ctx->indirect_ctx.obj);
}

/**
 * intel_gvt_scan_and_shadow_workload - audit the workload by scanning it and
 * shadowing it as well, including the ring buffer, wa_ctx and ctx.
 * @workload: an abstract entity for each execlist submission.
 *
 * This function is called before the workload is submitted to i915, to make
 * sure the content of the workload is valid.
 */
int intel_gvt_scan_and_shadow_workload(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        int ring_id = workload->ring_id;
        struct intel_engine_cs *engine = dev_priv->engine[ring_id];
        struct intel_ring *ring;
        int ret;

        lockdep_assert_held(&dev_priv->drm.struct_mutex);

        if (workload->shadowed)
                return 0;

        shadow_ctx->desc_template &= ~(0x3 << GEN8_CTX_ADDRESSING_MODE_SHIFT);
        shadow_ctx->desc_template |= workload->ctx_desc.addressing_mode <<
                                     GEN8_CTX_ADDRESSING_MODE_SHIFT;

        if (!test_and_set_bit(ring_id, s->shadow_ctx_desc_updated))
                shadow_context_descriptor_update(shadow_ctx,
                                        dev_priv->engine[ring_id]);

        ret = intel_gvt_scan_and_shadow_ringbuffer(workload);
        if (ret)
                goto err_scan;

        if ((workload->ring_id == RCS) &&
            (workload->wa_ctx.indirect_ctx.size != 0)) {
                ret = intel_gvt_scan_and_shadow_wa_ctx(&workload->wa_ctx);
                if (ret)
                        goto err_scan;
        }

        /* Pin the shadow context by GVT even though the shadow context will
         * be pinned when i915 allocates a request. That is because GVT will
         * update the guest context from the shadow context when a workload
         * is completed, and at that moment i915 may already have unpinned
         * the shadow context, making the shadow_ctx pages invalid. So GVT
         * needs to pin it by itself. After the guest context is updated,
         * GVT can unpin the shadow_ctx safely.
         */
        ring = engine->context_pin(engine, shadow_ctx);
        if (IS_ERR(ring)) {
                ret = PTR_ERR(ring);
                gvt_vgpu_err("fail to pin shadow context\n");
                goto err_shadow;
        }

        ret = populate_shadow_context(workload);
        if (ret)
                goto err_unpin;
        workload->shadowed = true;
        return 0;

err_unpin:
        engine->context_unpin(engine, shadow_ctx);
err_shadow:
        release_shadow_wa_ctx(&workload->wa_ctx);
err_scan:
        return ret;
}

static int intel_gvt_generate_request(struct intel_vgpu_workload *workload)
{
        int ring_id = workload->ring_id;
        struct drm_i915_private *dev_priv = workload->vgpu->gvt->dev_priv;
        struct intel_engine_cs *engine = dev_priv->engine[ring_id];
        struct i915_request *rq;
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        int ret;

        rq = i915_request_alloc(dev_priv->engine[ring_id], shadow_ctx);
        if (IS_ERR(rq)) {
                gvt_vgpu_err("fail to allocate gem request\n");
                ret = PTR_ERR(rq);
                goto err_unpin;
        }

        gvt_dbg_sched("ring id %d get i915 gem request %p\n", ring_id, rq);

        workload->req = i915_request_get(rq);
        ret = copy_workload_to_ring_buffer(workload);
        if (ret)
                goto err_unpin;
        return 0;

err_unpin:
        engine->context_unpin(engine, shadow_ctx);
        release_shadow_wa_ctx(&workload->wa_ctx);
        return ret;
}

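/* Pin every shadow batch buffer into the GGTT and patch the shadowed
 * MI_BATCH_BUFFER_START command (bb_start_cmd_va) to point at the
 * shadow copy instead of the guest's original batch buffer.
 */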
static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload);

static int prepare_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
        struct intel_gvt *gvt = workload->vgpu->gvt;
        const int gmadr_bytes = gvt->device_info.gmadr_bytes_in_cmd;
        struct intel_vgpu_shadow_bb *bb;
        int ret;

        list_for_each_entry(bb, &workload->shadow_bb, list) {
                bb->vma = i915_gem_object_ggtt_pin(bb->obj, NULL, 0, 0, 0);
                if (IS_ERR(bb->vma)) {
                        ret = PTR_ERR(bb->vma);
                        goto err;
                }

                /* relocate shadow batch buffer */
                bb->bb_start_cmd_va[1] = i915_ggtt_offset(bb->vma);
                if (gmadr_bytes == 8)
                        bb->bb_start_cmd_va[2] = 0;

                /* No one is going to touch shadow bb from now on. */
                if (bb->clflush & CLFLUSH_AFTER) {
                        drm_clflush_virt_range(bb->va, bb->obj->base.size);
                        bb->clflush &= ~CLFLUSH_AFTER;
                }

                ret = i915_gem_object_set_to_gtt_domain(bb->obj, false);
                if (ret)
                        goto err;

                i915_gem_obj_finish_shmem_access(bb->obj);
                bb->accessing = false;

                i915_vma_move_to_active(bb->vma, workload->req, 0);
        }
        return 0;
err:
        release_shadow_batch_buffer(workload);
        return ret;
}

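/* Patch the indirect-context and per-context workaround batch
 * pointers in the shadow ring context so they reference the shadowed
 * wa_ctx buffers rather than the guest graphics addresses.
 */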
static int update_wa_ctx_2_shadow_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
        struct intel_vgpu_workload *workload = container_of(wa_ctx,
                                        struct intel_vgpu_workload,
                                        wa_ctx);
        int ring_id = workload->ring_id;
        struct intel_vgpu_submission *s = &workload->vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        struct drm_i915_gem_object *ctx_obj =
                shadow_ctx->engine[ring_id].state->obj;
        struct execlist_ring_context *shadow_ring_context;
        struct page *page;

        page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
        shadow_ring_context = kmap_atomic(page);

        shadow_ring_context->bb_per_ctx_ptr.val =
                (shadow_ring_context->bb_per_ctx_ptr.val &
                (~PER_CTX_ADDR_MASK)) | wa_ctx->per_ctx.shadow_gma;
        shadow_ring_context->rcs_indirect_ctx.val =
                (shadow_ring_context->rcs_indirect_ctx.val &
                (~INDIRECT_CTX_ADDR_MASK)) | wa_ctx->indirect_ctx.shadow_gma;

        kunmap_atomic(shadow_ring_context);
        return 0;
}

static int prepare_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
        struct i915_vma *vma;
        unsigned char *per_ctx_va =
                (unsigned char *)wa_ctx->indirect_ctx.shadow_va +
                wa_ctx->indirect_ctx.size;

        if (wa_ctx->indirect_ctx.size == 0)
                return 0;

        vma = i915_gem_object_ggtt_pin(wa_ctx->indirect_ctx.obj, NULL,
                                       0, CACHELINE_BYTES, 0);
        if (IS_ERR(vma))
                return PTR_ERR(vma);

        /* FIXME: we are not tracking our pinned VMA leaving it
         * up to the core to fix up the stray pin_count upon
         * free.
         */

        wa_ctx->indirect_ctx.shadow_gma = i915_ggtt_offset(vma);

        wa_ctx->per_ctx.shadow_gma = *((unsigned int *)per_ctx_va + 1);
        memset(per_ctx_va, 0, CACHELINE_BYTES);

        update_wa_ctx_2_shadow_ctx(wa_ctx);
        return 0;
}

static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        struct intel_vgpu_shadow_bb *bb, *pos;

        if (list_empty(&workload->shadow_bb))
                return;

        bb = list_first_entry(&workload->shadow_bb,
                        struct intel_vgpu_shadow_bb, list);

        mutex_lock(&dev_priv->drm.struct_mutex);

        list_for_each_entry_safe(bb, pos, &workload->shadow_bb, list) {
                if (bb->obj) {
                        if (bb->accessing)
                                i915_gem_obj_finish_shmem_access(bb->obj);

                        if (bb->va && !IS_ERR(bb->va))
                                i915_gem_object_unpin_map(bb->obj);

                        if (bb->vma && !IS_ERR(bb->vma)) {
                                i915_vma_unpin(bb->vma);
                                i915_vma_close(bb->vma);
                        }
                        __i915_gem_object_release_unless_active(bb->obj);
                }
                list_del(&bb->list);
                kfree(bb);
        }

        mutex_unlock(&dev_priv->drm.struct_mutex);
}

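/* Prepare a scanned workload for dispatch: pin the shadow PPGTT,
 * refresh the PDP roots, synchronize out-of-sync guest pages, flush
 * post-shadow PPGTT updates, allocate the i915 request, then pin the
 * shadow batch buffers and wa_ctx. Errors unwind in reverse order.
 */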
static int prepare_workload(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        int ret = 0;

        ret = intel_vgpu_pin_mm(workload->shadow_mm);
        if (ret) {
                gvt_vgpu_err("fail to vgpu pin mm\n");
                return ret;
        }

        update_shadow_pdps(workload);

        ret = intel_vgpu_sync_oos_pages(workload->vgpu);
        if (ret) {
                gvt_vgpu_err("fail to vgpu sync oos pages\n");
                goto err_unpin_mm;
        }

        ret = intel_vgpu_flush_post_shadow(workload->vgpu);
        if (ret) {
                gvt_vgpu_err("fail to flush post shadow\n");
                goto err_unpin_mm;
        }

        ret = intel_gvt_generate_request(workload);
        if (ret) {
                gvt_vgpu_err("fail to generate request\n");
                goto err_unpin_mm;
        }

        ret = prepare_shadow_batch_buffer(workload);
        if (ret) {
                gvt_vgpu_err("fail to prepare_shadow_batch_buffer\n");
                goto err_unpin_mm;
        }

        ret = prepare_shadow_wa_ctx(&workload->wa_ctx);
        if (ret) {
                gvt_vgpu_err("fail to prepare_shadow_wa_ctx\n");
                goto err_shadow_batch;
        }

        if (workload->prepare) {
                ret = workload->prepare(workload);
                if (ret)
                        goto err_shadow_wa_ctx;
        }

        return 0;
err_shadow_wa_ctx:
        release_shadow_wa_ctx(&workload->wa_ctx);
err_shadow_batch:
        release_shadow_batch_buffer(workload);
err_unpin_mm:
        intel_vgpu_unpin_mm(workload->shadow_mm);
        return ret;
}

static int dispatch_workload(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        int ring_id = workload->ring_id;
        struct intel_engine_cs *engine = dev_priv->engine[ring_id];
        int ret = 0;

        gvt_dbg_sched("ring id %d prepare to dispatch workload %p\n",
                ring_id, workload);

        mutex_lock(&dev_priv->drm.struct_mutex);

        ret = intel_gvt_scan_and_shadow_workload(workload);
        if (ret)
                goto out;

        ret = prepare_workload(workload);
        if (ret) {
                engine->context_unpin(engine, shadow_ctx);
                goto out;
        }

out:
        if (ret)
                workload->status = ret;

        if (!IS_ERR_OR_NULL(workload->req)) {
                gvt_dbg_sched("ring id %d submit workload to i915 %p\n",
                        ring_id, workload->req);
                i915_request_add(workload->req);
                workload->dispatched = true;
        }

        mutex_unlock(&dev_priv->drm.struct_mutex);
        return ret;
}

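/* Called from the per-engine workload thread: returns the next
 * workload for this engine, or NULL if the scheduler has no current
 * vgpu, is about to reschedule, or the queue is empty.
 */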
static struct intel_vgpu_workload *pick_next_workload(
                struct intel_gvt *gvt, int ring_id)
{
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct intel_vgpu_workload *workload = NULL;

        mutex_lock(&gvt->lock);

        /*
         * no current vgpu / will be scheduled out / no workload
         * bail out
         */
        if (!scheduler->current_vgpu) {
                gvt_dbg_sched("ring id %d stop - no current vgpu\n", ring_id);
                goto out;
        }

        if (scheduler->need_reschedule) {
                gvt_dbg_sched("ring id %d stop - will reschedule\n", ring_id);
                goto out;
        }

        if (list_empty(workload_q_head(scheduler->current_vgpu, ring_id)))
                goto out;

        /*
         * still have current workload, maybe the workload dispatcher
         * failed to submit it for some reason, resubmit it.
         */
        if (scheduler->current_workload[ring_id]) {
                workload = scheduler->current_workload[ring_id];
                gvt_dbg_sched("ring id %d still have current workload %p\n",
                                ring_id, workload);
                goto out;
        }

        /*
         * pick a workload as current workload
         * once current workload is set, schedule policy routines
         * will wait until the current workload is finished when trying
         * to schedule out a vgpu.
         */
        scheduler->current_workload[ring_id] = container_of(
                        workload_q_head(scheduler->current_vgpu, ring_id)->next,
                        struct intel_vgpu_workload, list);

        workload = scheduler->current_workload[ring_id];

        gvt_dbg_sched("ring id %d pick new workload %p\n", ring_id, workload);

        atomic_inc(&workload->vgpu->submission.running_workload_num);
out:
        mutex_unlock(&gvt->lock);
        return workload;
}

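/* Mirror image of populate_shadow_context(): once a workload has
 * completed on hardware, write the shadow context pages and the
 * tracked ring-context registers back into guest memory so the guest
 * sees the results of execution.
 */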
static void update_guest_context(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_gvt *gvt = vgpu->gvt;
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        int ring_id = workload->ring_id;
        struct drm_i915_gem_object *ctx_obj =
                shadow_ctx->engine[ring_id].state->obj;
        struct execlist_ring_context *shadow_ring_context;
        struct page *page;
        void *src;
        unsigned long context_gpa, context_page_num;
        int i;

        gvt_dbg_sched("ring id %d workload lrca %x\n", ring_id,
                        workload->ctx_desc.lrca);

        context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

        context_page_num = context_page_num >> PAGE_SHIFT;

        if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
                context_page_num = 19;

        i = 2;

        while (i < context_page_num) {
                context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
                                (u32)((workload->ctx_desc.lrca + i) <<
                                        I915_GTT_PAGE_SHIFT));
                if (context_gpa == INTEL_GVT_INVALID_ADDR) {
                        gvt_vgpu_err("invalid guest context descriptor\n");
                        return;
                }

                page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
                src = kmap(page);
                intel_gvt_hypervisor_write_gpa(vgpu, context_gpa, src,
                                I915_GTT_PAGE_SIZE);
                kunmap(page);
                i++;
        }

        intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa +
                RING_CTX_OFF(ring_header.val), &workload->rb_tail, 4);

        page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
        shadow_ring_context = kmap(page);

#define COPY_REG(name) \
        intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa + \
                RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

        COPY_REG(ctx_ctrl);
        COPY_REG(ctx_timestamp);

#undef COPY_REG

        intel_gvt_hypervisor_write_gpa(vgpu,
                        workload->ring_context_gpa +
                        sizeof(*shadow_ring_context),
                        (void *)shadow_ring_context +
                        sizeof(*shadow_ring_context),
                        I915_GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

        kunmap(page);
}

static void clean_workloads(struct intel_vgpu *vgpu, unsigned long engine_mask)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        struct intel_engine_cs *engine;
        struct intel_vgpu_workload *pos, *n;
        unsigned int tmp;

        /* free the unsubmitted workloads in the queues. */
        for_each_engine_masked(engine, dev_priv, engine_mask, tmp) {
                list_for_each_entry_safe(pos, n,
                        &s->workload_q_head[engine->id], list) {
                        list_del_init(&pos->list);
                        intel_vgpu_destroy_workload(pos);
                }
                clear_bit(engine->id, s->shadow_ctx_desc_updated);
        }
}

static void complete_current_workload(struct intel_gvt *gvt, int ring_id)
{
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct intel_vgpu_workload *workload =
                scheduler->current_workload[ring_id];
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_vgpu_submission *s = &vgpu->submission;
        int event;

        mutex_lock(&gvt->lock);

        /* For a workload w/ a request, we need to wait for the context
         * switch to make sure the request is completed.
         * For a workload w/o a request, directly complete the workload.
         */
        if (workload->req) {
                struct drm_i915_private *dev_priv =
                        workload->vgpu->gvt->dev_priv;
                struct intel_engine_cs *engine =
                        dev_priv->engine[workload->ring_id];
                wait_event(workload->shadow_ctx_status_wq,
                           !atomic_read(&workload->shadow_ctx_active));

                /* If this request caused a GPU hang, req->fence.error will
                 * be set to -EIO. Use -EIO as the workload status so that
                 * no context switch interrupt is triggered to the guest
                 * when the request caused a GPU hang.
                 */
                if (likely(workload->status == -EINPROGRESS)) {
                        if (workload->req->fence.error == -EIO)
                                workload->status = -EIO;
                        else
                                workload->status = 0;
                }

                i915_request_put(fetch_and_zero(&workload->req));

                if (!workload->status && !(vgpu->resetting_eng &
                                           ENGINE_MASK(ring_id))) {
                        update_guest_context(workload);

                        for_each_set_bit(event, workload->pending_events,
                                         INTEL_GVT_EVENT_MAX)
                                intel_vgpu_trigger_virtual_event(vgpu, event);
                }
                mutex_lock(&dev_priv->drm.struct_mutex);
                /* unpin shadow ctx as the shadow_ctx update is done */
                engine->context_unpin(engine, s->shadow_ctx);
                mutex_unlock(&dev_priv->drm.struct_mutex);
        }

        gvt_dbg_sched("ring id %d complete workload %p status %d\n",
                        ring_id, workload, workload->status);

        scheduler->current_workload[ring_id] = NULL;

        list_del_init(&workload->list);

        if (!workload->status) {
                release_shadow_batch_buffer(workload);
                release_shadow_wa_ctx(&workload->wa_ctx);
        }

        if (workload->status || (vgpu->resetting_eng & ENGINE_MASK(ring_id))) {
                /* If workload->status is not successful, it means the HW GPU
                 * hit a hang or something went wrong with i915/GVT, and GVT
                 * won't inject a context switch interrupt to the guest. So
                 * this error is actually a vGPU hang from the guest's point
                 * of view, and accordingly we should emulate a vGPU hang. If
                 * there are pending workloads which were already submitted
                 * from the guest, we should clean them up like the HW GPU
                 * does.
                 *
                 * If it is in the middle of an engine reset, the pending
                 * workloads won't be submitted to the HW GPU and will be
                 * cleaned up during the resetting process later, so doing
                 * the workload clean up here doesn't have any impact.
                 **/
                clean_workloads(vgpu, ENGINE_MASK(ring_id));
        }

        workload->complete(workload);

        atomic_dec(&s->running_workload_num);
        wake_up(&scheduler->workload_complete_wq);

        if (gvt->scheduler.need_reschedule)
                intel_gvt_request_service(gvt, INTEL_GVT_REQUEST_EVENT_SCHED);

        mutex_unlock(&gvt->lock);
}

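/* Each engine has a dedicated kthread, created in
 * intel_gvt_init_workload_scheduler() below, that sleeps until a
 * workload is queued, dispatches it, waits for the i915 request to
 * complete and then completes the workload.
 */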
struct workload_thread_param {
        struct intel_gvt *gvt;
        int ring_id;
};

static int workload_thread(void *priv)
{
        struct workload_thread_param *p = (struct workload_thread_param *)priv;
        struct intel_gvt *gvt = p->gvt;
        int ring_id = p->ring_id;
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct intel_vgpu_workload *workload = NULL;
        struct intel_vgpu *vgpu = NULL;
        int ret;
        bool need_force_wake = IS_SKYLAKE(gvt->dev_priv)
                        || IS_KABYLAKE(gvt->dev_priv);
        DEFINE_WAIT_FUNC(wait, woken_wake_function);

        kfree(p);

        gvt_dbg_core("workload thread for ring %d started\n", ring_id);

        while (!kthread_should_stop()) {
                add_wait_queue(&scheduler->waitq[ring_id], &wait);
                do {
                        workload = pick_next_workload(gvt, ring_id);
                        if (workload)
                                break;
                        wait_woken(&wait, TASK_INTERRUPTIBLE,
                                   MAX_SCHEDULE_TIMEOUT);
                } while (!kthread_should_stop());
                remove_wait_queue(&scheduler->waitq[ring_id], &wait);

                if (!workload)
                        break;

                gvt_dbg_sched("ring id %d next workload %p vgpu %d\n",
                                workload->ring_id, workload,
                                workload->vgpu->id);

                intel_runtime_pm_get(gvt->dev_priv);

                gvt_dbg_sched("ring id %d will dispatch workload %p\n",
                                workload->ring_id, workload);

                if (need_force_wake)
                        intel_uncore_forcewake_get(gvt->dev_priv,
                                        FORCEWAKE_ALL);

                mutex_lock(&gvt->lock);
                ret = dispatch_workload(workload);
                mutex_unlock(&gvt->lock);

                if (ret) {
                        vgpu = workload->vgpu;
                        gvt_vgpu_err("fail to dispatch workload, skip\n");
                        goto complete;
                }

                gvt_dbg_sched("ring id %d wait workload %p\n",
                                workload->ring_id, workload);
                i915_request_wait(workload->req, 0, MAX_SCHEDULE_TIMEOUT);

complete:
                gvt_dbg_sched("will complete workload %p, status: %d\n",
                                workload, workload->status);

                complete_current_workload(gvt, ring_id);

                if (need_force_wake)
                        intel_uncore_forcewake_put(gvt->dev_priv,
                                        FORCEWAKE_ALL);

                intel_runtime_pm_put(gvt->dev_priv);
                if (ret && (vgpu_is_vm_unhealthy(ret)))
                        enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
        }
        return 0;
}

void intel_gvt_wait_vgpu_idle(struct intel_vgpu *vgpu)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct intel_gvt *gvt = vgpu->gvt;
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;

        if (atomic_read(&s->running_workload_num)) {
                gvt_dbg_sched("wait vgpu idle\n");

                wait_event(scheduler->workload_complete_wq,
                           !atomic_read(&s->running_workload_num));
        }
}

void intel_gvt_clean_workload_scheduler(struct intel_gvt *gvt)
{
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct intel_engine_cs *engine;
        enum intel_engine_id i;

        gvt_dbg_core("clean workload scheduler\n");

        for_each_engine(engine, gvt->dev_priv, i) {
                atomic_notifier_chain_unregister(
                                &engine->context_status_notifier,
                                &gvt->shadow_ctx_notifier_block[i]);
                kthread_stop(scheduler->thread[i]);
        }
}

int intel_gvt_init_workload_scheduler(struct intel_gvt *gvt)
{
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct workload_thread_param *param = NULL;
        struct intel_engine_cs *engine;
        enum intel_engine_id i;
        int ret;

        gvt_dbg_core("init workload scheduler\n");

        init_waitqueue_head(&scheduler->workload_complete_wq);

        for_each_engine(engine, gvt->dev_priv, i) {
                init_waitqueue_head(&scheduler->waitq[i]);

                param = kzalloc(sizeof(*param), GFP_KERNEL);
                if (!param) {
                        ret = -ENOMEM;
                        goto err;
                }

                param->gvt = gvt;
                param->ring_id = i;

                scheduler->thread[i] = kthread_run(workload_thread, param,
                        "gvt workload %d", i);
                if (IS_ERR(scheduler->thread[i])) {
                        gvt_err("fail to create workload thread\n");
                        ret = PTR_ERR(scheduler->thread[i]);
                        goto err;
                }

                gvt->shadow_ctx_notifier_block[i].notifier_call =
                                        shadow_context_status_change;
                atomic_notifier_chain_register(&engine->context_status_notifier,
                                        &gvt->shadow_ctx_notifier_block[i]);
        }
        return 0;
err:
        intel_gvt_clean_workload_scheduler(gvt);
        kfree(param);
        param = NULL;
        return ret;
}

/**
 * intel_vgpu_clean_submission - free submission-related resources for a vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being destroyed.
 *
 */
void intel_vgpu_clean_submission(struct intel_vgpu *vgpu)
{
        struct intel_vgpu_submission *s = &vgpu->submission;

        intel_vgpu_select_submission_ops(vgpu, ALL_ENGINES, 0);
        i915_gem_context_put(s->shadow_ctx);
        kmem_cache_destroy(s->workloads);
}

/**
 * intel_vgpu_reset_submission - reset submission-related resources for a vGPU
 * @vgpu: a vGPU
 * @engine_mask: engines expected to be reset
 *
 * This function is called when a vGPU is being reset.
 *
 */
void intel_vgpu_reset_submission(struct intel_vgpu *vgpu,
                unsigned long engine_mask)
{
        struct intel_vgpu_submission *s = &vgpu->submission;

        if (!s->active)
                return;

        clean_workloads(vgpu, engine_mask);
        s->ops->reset(vgpu, engine_mask);
}

/**
 * intel_vgpu_setup_submission - setup submission-related resources for a vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being created.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_setup_submission(struct intel_vgpu *vgpu)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        enum intel_engine_id i;
        struct intel_engine_cs *engine;
        int ret;

        s->shadow_ctx = i915_gem_context_create_gvt(
                        &vgpu->gvt->dev_priv->drm);
        if (IS_ERR(s->shadow_ctx))
                return PTR_ERR(s->shadow_ctx);

        if (HAS_LOGICAL_RING_PREEMPTION(vgpu->gvt->dev_priv))
                s->shadow_ctx->priority = INT_MAX;

        bitmap_zero(s->shadow_ctx_desc_updated, I915_NUM_ENGINES);

        s->workloads = kmem_cache_create("gvt-g_vgpu_workload",
                        sizeof(struct intel_vgpu_workload), 0,
                        SLAB_HWCACHE_ALIGN,
                        NULL);

        if (!s->workloads) {
                ret = -ENOMEM;
                goto out_shadow_ctx;
        }

        for_each_engine(engine, vgpu->gvt->dev_priv, i)
                INIT_LIST_HEAD(&s->workload_q_head[i]);

        atomic_set(&s->running_workload_num, 0);
        bitmap_zero(s->tlb_handle_pending, I915_NUM_ENGINES);

        return 0;

out_shadow_ctx:
        i915_gem_context_put(s->shadow_ctx);
        return ret;
}

/**
 * intel_vgpu_select_submission_ops - select virtual submission interface
 * @vgpu: a vGPU
 * @engine_mask: the engines the interface change applies to
 * @interface: expected vGPU virtual submission interface
 *
 * This function is called when a guest configures the submission interface.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_select_submission_ops(struct intel_vgpu *vgpu,
                                     unsigned long engine_mask,
                                     unsigned int interface)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        const struct intel_vgpu_submission_ops *ops[] = {
                [INTEL_VGPU_EXECLIST_SUBMISSION] =
                        &intel_vgpu_execlist_submission_ops,
        };
        int ret;

        if (WARN_ON(interface >= ARRAY_SIZE(ops)))
                return -EINVAL;

        if (WARN_ON(interface == 0 && engine_mask != ALL_ENGINES))
                return -EINVAL;

        if (s->active)
                s->ops->clean(vgpu, engine_mask);

        if (interface == 0) {
                s->ops = NULL;
                s->virtual_submission_interface = 0;
                s->active = false;
                gvt_dbg_core("vgpu%d: remove submission ops\n", vgpu->id);
                return 0;
        }

        ret = ops[interface]->init(vgpu, engine_mask);
        if (ret)
                return ret;

        s->ops = ops[interface];
        s->virtual_submission_interface = interface;
        s->active = true;

        gvt_dbg_core("vgpu%d: activate ops [ %s ]\n",
                        vgpu->id, s->ops->name);

        return 0;
}

/**
 * intel_vgpu_destroy_workload - destroy a vGPU workload
 * @workload: the vGPU workload to destroy
 *
 * This function is called when destroying a vGPU workload.
 *
 */
void intel_vgpu_destroy_workload(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu_submission *s = &workload->vgpu->submission;

        if (workload->shadow_mm)
                intel_vgpu_mm_put(workload->shadow_mm);

        kmem_cache_free(s->workloads, workload);
}

static struct intel_vgpu_workload *
alloc_workload(struct intel_vgpu *vgpu)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct intel_vgpu_workload *workload;

        workload = kmem_cache_zalloc(s->workloads, GFP_KERNEL);
        if (!workload)
                return ERR_PTR(-ENOMEM);

        INIT_LIST_HEAD(&workload->list);
        INIT_LIST_HEAD(&workload->shadow_bb);

        init_waitqueue_head(&workload->shadow_ctx_status_wq);
        atomic_set(&workload->shadow_ctx_active, 0);

        workload->status = -EINPROGRESS;
        workload->shadowed = false;
        workload->vgpu = vgpu;

        return workload;
}

#define RING_CTX_OFF(x) \
        offsetof(struct execlist_ring_context, x)

static void read_guest_pdps(struct intel_vgpu *vgpu,
                u64 ring_context_gpa, u32 pdp[8])
{
        u64 gpa;
        int i;

        gpa = ring_context_gpa + RING_CTX_OFF(pdp3_UDW.val);

        for (i = 0; i < 8; i++)
                intel_gvt_hypervisor_read_gpa(vgpu,
                                gpa + i * 8, &pdp[7 - i], 4);
}

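/* The addressing mode in the context descriptor selects the guest
 * PPGTT layout: mode 1 is the legacy 32-bit layout rooted in four L3
 * PDP entries, mode 3 is the legacy 64-bit layout rooted in a single
 * L4 (PML4) entry. Advanced (SVM) mode is rejected.
 */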
static int prepare_mm(struct intel_vgpu_workload *workload)
{
        struct execlist_ctx_descriptor_format *desc = &workload->ctx_desc;
        struct intel_vgpu_mm *mm;
        struct intel_vgpu *vgpu = workload->vgpu;
        intel_gvt_gtt_type_t root_entry_type;
        u64 pdps[GVT_RING_CTX_NR_PDPS];

        switch (desc->addressing_mode) {
        case 1: /* legacy 32-bit */
                root_entry_type = GTT_TYPE_PPGTT_ROOT_L3_ENTRY;
                break;
        case 3: /* legacy 64-bit */
                root_entry_type = GTT_TYPE_PPGTT_ROOT_L4_ENTRY;
                break;
        default:
                gvt_vgpu_err("Advanced Context mode(SVM) is not supported!\n");
                return -EINVAL;
        }

        read_guest_pdps(workload->vgpu, workload->ring_context_gpa, (void *)pdps);

        mm = intel_vgpu_get_ppgtt_mm(workload->vgpu, root_entry_type, pdps);
        if (IS_ERR(mm))
                return PTR_ERR(mm);

        workload->shadow_mm = mm;
        return 0;
}

#define same_context(a, b) (((a)->context_id == (b)->context_id) && \
                ((a)->lrca == (b)->lrca))

#define get_last_workload(q) \
        (list_empty(q) ? NULL : container_of(q->prev, \
        struct intel_vgpu_workload, list))
/**
 * intel_vgpu_create_workload - create a vGPU workload
 * @vgpu: a vGPU
 * @ring_id: the ring the workload is queued on
 * @desc: a guest context descriptor
 *
 * This function is called when creating a vGPU workload.
 *
 * Returns:
 * struct intel_vgpu_workload * on success, negative error code in
 * pointer if failed.
 *
 */
struct intel_vgpu_workload *
intel_vgpu_create_workload(struct intel_vgpu *vgpu, int ring_id,
                           struct execlist_ctx_descriptor_format *desc)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct list_head *q = workload_q_head(vgpu, ring_id);
        struct intel_vgpu_workload *last_workload = get_last_workload(q);
        struct intel_vgpu_workload *workload = NULL;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        u64 ring_context_gpa;
        u32 head, tail, start, ctl, ctx_ctl, per_ctx, indirect_ctx;
        int ret;

        ring_context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
                        (u32)((desc->lrca + 1) << I915_GTT_PAGE_SHIFT));
        if (ring_context_gpa == INTEL_GVT_INVALID_ADDR) {
                gvt_vgpu_err("invalid guest context LRCA: %x\n", desc->lrca);
                return ERR_PTR(-EINVAL);
        }

        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(ring_header.val), &head, 4);

        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(ring_tail.val), &tail, 4);

        head &= RB_HEAD_OFF_MASK;
        tail &= RB_TAIL_OFF_MASK;

        if (last_workload && same_context(&last_workload->ctx_desc, desc)) {
                gvt_dbg_el("ring id %d cur workload == last\n", ring_id);
                gvt_dbg_el("ctx head %x real head %lx\n", head,
                                last_workload->rb_tail);
                /*
                 * cannot use guest context head pointer here,
                 * as it might not be updated at this time
                 */
                head = last_workload->rb_tail;
        }

        gvt_dbg_el("ring id %d begin a new workload\n", ring_id);

        /* record some ring buffer register values for scan and shadow */
        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(rb_start.val), &start, 4);
        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(rb_ctrl.val), &ctl, 4);
        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(ctx_ctrl.val), &ctx_ctl, 4);

        workload = alloc_workload(vgpu);
        if (IS_ERR(workload))
                return workload;

        workload->ring_id = ring_id;
        workload->ctx_desc = *desc;
        workload->ring_context_gpa = ring_context_gpa;
        workload->rb_head = head;
        workload->rb_tail = tail;
        workload->rb_start = start;
        workload->rb_ctl = ctl;

        if (ring_id == RCS) {
                intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(bb_per_ctx_ptr.val), &per_ctx, 4);
                intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(rcs_indirect_ctx.val), &indirect_ctx, 4);

                workload->wa_ctx.indirect_ctx.guest_gma =
                        indirect_ctx & INDIRECT_CTX_ADDR_MASK;
                workload->wa_ctx.indirect_ctx.size =
                        (indirect_ctx & INDIRECT_CTX_SIZE_MASK) *
                        CACHELINE_BYTES;
                workload->wa_ctx.per_ctx.guest_gma =
                        per_ctx & PER_CTX_ADDR_MASK;
                workload->wa_ctx.per_ctx.valid = per_ctx & 1;
        }

        gvt_dbg_el("workload %p ring id %d head %x tail %x start %x ctl %x\n",
                        workload, ring_id, head, tail, start, ctl);

        ret = prepare_mm(workload);
        if (ret) {
                kmem_cache_free(s->workloads, workload);
                return ERR_PTR(ret);
        }

        /* Only scan and shadow the first workload in the queue
         * as there is only one pre-allocated buf-obj for shadow.
         */
        if (list_empty(workload_q_head(vgpu, ring_id))) {
                intel_runtime_pm_get(dev_priv);
                mutex_lock(&dev_priv->drm.struct_mutex);
                ret = intel_gvt_scan_and_shadow_workload(workload);
                mutex_unlock(&dev_priv->drm.struct_mutex);
                intel_runtime_pm_put(dev_priv);
        }

        if (ret && (vgpu_is_vm_unhealthy(ret))) {
                enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
                intel_vgpu_destroy_workload(workload);
                return ERR_PTR(ret);
        }

        return workload;
}

/**
 * intel_vgpu_queue_workload - queue a vGPU workload
 * @workload: the workload to queue in
 */
void intel_vgpu_queue_workload(struct intel_vgpu_workload *workload)
{
        list_add_tail(&workload->list,
                workload_q_head(workload->vgpu, workload->ring_id));
        intel_gvt_kick_schedule(workload->vgpu->gvt);
        wake_up(&workload->vgpu->gvt->scheduler.waitq[workload->ring_id]);
}