/*
 * Copyright(c) 2011-2016 Intel Corporation. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Zhi Wang <zhi.a.wang@intel.com>
 *
 * Contributors:
 *    Ping Gao <ping.a.gao@intel.com>
 *    Tina Zhang <tina.zhang@intel.com>
 *    Chanbin Du <changbin.du@intel.com>
 *    Min He <min.he@intel.com>
 *    Bing Niu <bing.niu@intel.com>
 *    Zhenyu Wang <zhenyuw@linux.intel.com>
 *
 */

#include <linux/kthread.h>

#include "i915_drv.h"
#include "gvt.h"

#define RING_CTX_OFF(x) \
	offsetof(struct execlist_ring_context, x)

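/*
 * Write the PDP root pointers into a ring context. The MMIO pairs are laid
 * out from pdp3 down to pdp0, hence the reversed index.
 */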
static void set_context_pdp_root_pointer(
		struct execlist_ring_context *ring_context,
		u32 pdp[8])
{
	struct execlist_mmio_pair *pdp_pair = &ring_context->pdp3_UDW;
	int i;

	for (i = 0; i < 8; i++)
		pdp_pair[i].val = pdp[7 - i];
}

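/*
 * Populate the shadow context from the guest: copy the guest context pages
 * and the shadowed ring context registers into the shadow context object,
 * and point the PDP root pointers at the shadow page tables.
 */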
static int populate_shadow_context(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_gvt *gvt = vgpu->gvt;
	int ring_id = workload->ring_id;
	struct i915_gem_context *shadow_ctx = vgpu->submission.shadow_ctx;
	struct drm_i915_gem_object *ctx_obj =
		shadow_ctx->engine[ring_id].state->obj;
	struct execlist_ring_context *shadow_ring_context;
	struct page *page;
	void *dst;
	unsigned long context_gpa, context_page_num;
	int i;

	gvt_dbg_sched("ring id %d workload lrca %x", ring_id,
			workload->ctx_desc.lrca);

	context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

	context_page_num = context_page_num >> PAGE_SHIFT;

	if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
		context_page_num = 19;

	i = 2;

	while (i < context_page_num) {
		context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
				(u32)((workload->ctx_desc.lrca + i) <<
				GTT_PAGE_SHIFT));
		if (context_gpa == INTEL_GVT_INVALID_ADDR) {
			gvt_vgpu_err("Invalid guest context descriptor\n");
			return -EFAULT;
		}

		page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
		dst = kmap(page);
		intel_gvt_hypervisor_read_gpa(vgpu, context_gpa, dst,
				GTT_PAGE_SIZE);
		kunmap(page);
		i++;
	}

	page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
	shadow_ring_context = kmap(page);

#define COPY_REG(name) \
	intel_gvt_hypervisor_read_gpa(vgpu, workload->ring_context_gpa \
		+ RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

	COPY_REG(ctx_ctrl);
	COPY_REG(ctx_timestamp);

	if (ring_id == RCS) {
		COPY_REG(bb_per_ctx_ptr);
		COPY_REG(rcs_indirect_ctx);
		COPY_REG(rcs_indirect_ctx_offset);
	}
#undef COPY_REG

	set_context_pdp_root_pointer(shadow_ring_context,
			workload->shadow_mm->shadow_page_table);

	intel_gvt_hypervisor_read_gpa(vgpu,
			workload->ring_context_gpa +
			sizeof(*shadow_ring_context),
			(void *)shadow_ring_context +
			sizeof(*shadow_ring_context),
			GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

	kunmap(page);
	return 0;
}

static inline bool is_gvt_request(struct drm_i915_gem_request *req)
{
	return i915_gem_context_force_single_submission(req->ctx);
}

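/*
 * Context status notifier. For host-owned requests, hand the engine MMIO
 * state back to the host on schedule-in. For GVT requests, switch the MMIO
 * state to the owning vGPU and track whether the shadow context is active
 * on the hardware.
 */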
static int shadow_context_status_change(struct notifier_block *nb,
		unsigned long action, void *data)
{
	struct drm_i915_gem_request *req = (struct drm_i915_gem_request *)data;
	struct intel_gvt *gvt = container_of(nb, struct intel_gvt,
				shadow_ctx_notifier_block[req->engine->id]);
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	enum intel_engine_id ring_id = req->engine->id;
	struct intel_vgpu_workload *workload;

	if (!is_gvt_request(req)) {
		spin_lock_bh(&scheduler->mmio_context_lock);
		if (action == INTEL_CONTEXT_SCHEDULE_IN &&
		    scheduler->engine_owner[ring_id]) {
			/* Switch ring from vGPU to host. */
			intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
					      NULL, ring_id);
			scheduler->engine_owner[ring_id] = NULL;
		}
		spin_unlock_bh(&scheduler->mmio_context_lock);

		return NOTIFY_OK;
	}

	workload = scheduler->current_workload[ring_id];
	if (unlikely(!workload))
		return NOTIFY_OK;

	switch (action) {
	case INTEL_CONTEXT_SCHEDULE_IN:
		spin_lock_bh(&scheduler->mmio_context_lock);
		if (workload->vgpu != scheduler->engine_owner[ring_id]) {
			/* Switch ring from host to vGPU or vGPU to vGPU. */
			intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
					      workload->vgpu, ring_id);
			scheduler->engine_owner[ring_id] = workload->vgpu;
		} else
			gvt_dbg_sched("skip ring %d mmio switch for vgpu%d\n",
				      ring_id, workload->vgpu->id);
		spin_unlock_bh(&scheduler->mmio_context_lock);
		atomic_set(&workload->shadow_ctx_active, 1);
		break;
	case INTEL_CONTEXT_SCHEDULE_OUT:
	case INTEL_CONTEXT_SCHEDULE_PREEMPTED:
		atomic_set(&workload->shadow_ctx_active, 0);
		break;
	default:
		WARN_ON(1);
		return NOTIFY_OK;
	}
	wake_up(&workload->shadow_ctx_status_wq);
	return NOTIFY_OK;
}

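/*
 * Refresh the low 12 bits of the cached context descriptor (the GEN8_CTX_*
 * flags held in desc_template) without touching the address bits.
 */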
static void shadow_context_descriptor_update(struct i915_gem_context *ctx,
		struct intel_engine_cs *engine)
{
	struct intel_context *ce = &ctx->engine[engine->id];
	u64 desc = 0;

	desc = ce->lrc_desc;

	/* Update bits 0-11 of the context descriptor which includes flags
	 * like GEN8_CTX_* cached in desc_template
	 */
	desc &= U64_MAX << 12;
	desc |= ctx->desc_template & ((1ULL << 12) - 1);

	ce->lrc_desc = desc;
}

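/*
 * Reserve space in the shadow context's ring buffer and copy the already
 * scanned guest ring buffer commands into it, so the request replays the
 * guest submission from the shadow ring.
 */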
static int copy_workload_to_ring_buffer(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	void *shadow_ring_buffer_va;
	u32 *cs;

	/* allocate shadow ring buffer */
	cs = intel_ring_begin(workload->req, workload->rb_len / sizeof(u32));
	if (IS_ERR(cs)) {
		gvt_vgpu_err("fail to alloc size =%ld shadow ring buffer\n",
			workload->rb_len);
		return PTR_ERR(cs);
	}

	shadow_ring_buffer_va = workload->shadow_ring_buffer_va;

	/* get shadow ring buffer va */
	workload->shadow_ring_buffer_va = cs;

	memcpy(cs, shadow_ring_buffer_va,
			workload->rb_len);

	cs += workload->rb_len / sizeof(u32);
	intel_ring_advance(workload->req, cs);

	return 0;
}

void release_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
	if (!wa_ctx->indirect_ctx.obj)
		return;

	i915_gem_object_unpin_map(wa_ctx->indirect_ctx.obj);
	i915_gem_object_put(wa_ctx->indirect_ctx.obj);
}

/**
 * intel_gvt_scan_and_shadow_workload - audit the workload by scanning and
 * shadowing it as well, including the ring buffer, wa_ctx and ctx.
 * @workload: an abstract entity for each execlist submission.
 *
 * This function is called before the workload is submitted to i915, to make
 * sure the content of the workload is valid.
 */
int intel_gvt_scan_and_shadow_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	int ring_id = workload->ring_id;
	struct intel_engine_cs *engine = dev_priv->engine[ring_id];
	struct drm_i915_gem_request *rq;
	struct intel_ring *ring;
	int ret;

	lockdep_assert_held(&dev_priv->drm.struct_mutex);

	if (workload->shadowed)
		return 0;

	shadow_ctx->desc_template &= ~(0x3 << GEN8_CTX_ADDRESSING_MODE_SHIFT);
	shadow_ctx->desc_template |= workload->ctx_desc.addressing_mode <<
				     GEN8_CTX_ADDRESSING_MODE_SHIFT;

	if (!test_and_set_bit(ring_id, s->shadow_ctx_desc_updated))
		shadow_context_descriptor_update(shadow_ctx,
					dev_priv->engine[ring_id]);

	ret = intel_gvt_scan_and_shadow_ringbuffer(workload);
	if (ret)
		goto err_scan;

	if ((workload->ring_id == RCS) &&
	    (workload->wa_ctx.indirect_ctx.size != 0)) {
		ret = intel_gvt_scan_and_shadow_wa_ctx(&workload->wa_ctx);
		if (ret)
			goto err_scan;
	}

	/* Pin the shadow context by GVT even though it will also be pinned
	 * when i915 allocates a request. GVT updates the guest context from
	 * the shadow context when the workload completes, and by that time
	 * i915 may already have unpinned the shadow context, making the
	 * shadow_ctx pages invalid. So GVT needs its own pin; after the
	 * guest context is updated, the shadow_ctx can be unpinned safely.
	 */
	ring = engine->context_pin(engine, shadow_ctx);
	if (IS_ERR(ring)) {
		ret = PTR_ERR(ring);
		gvt_vgpu_err("fail to pin shadow context\n");
		goto err_shadow;
	}

	ret = populate_shadow_context(workload);
	if (ret)
		goto err_unpin;

	rq = i915_gem_request_alloc(dev_priv->engine[ring_id], shadow_ctx);
	if (IS_ERR(rq)) {
		gvt_vgpu_err("fail to allocate gem request\n");
		ret = PTR_ERR(rq);
		goto err_unpin;
	}

	gvt_dbg_sched("ring id %d get i915 gem request %p\n", ring_id, rq);

	workload->req = i915_gem_request_get(rq);
	ret = copy_workload_to_ring_buffer(workload);
	if (ret)
		goto err_unpin;
	workload->shadowed = true;
	return 0;

err_unpin:
	engine->context_unpin(engine, shadow_ctx);
err_shadow:
	release_shadow_wa_ctx(&workload->wa_ctx);
err_scan:
	return ret;
}

static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload);

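/*
 * Pin each shadow batch buffer into the GGTT, relocate the batch buffer
 * start command to the shadow GGTT offset, flush any pending CPU writes and
 * add the VMA to the request's active list.
 */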
static int prepare_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
	struct intel_gvt *gvt = workload->vgpu->gvt;
	const int gmadr_bytes = gvt->device_info.gmadr_bytes_in_cmd;
	struct intel_vgpu_shadow_bb *bb;
	int ret;

	list_for_each_entry(bb, &workload->shadow_bb, list) {
		bb->vma = i915_gem_object_ggtt_pin(bb->obj, NULL, 0, 0, 0);
		if (IS_ERR(bb->vma)) {
			ret = PTR_ERR(bb->vma);
			goto err;
		}

		/* relocate shadow batch buffer */
		bb->bb_start_cmd_va[1] = i915_ggtt_offset(bb->vma);
		if (gmadr_bytes == 8)
			bb->bb_start_cmd_va[2] = 0;

		/* No one is going to touch shadow bb from now on. */
		if (bb->clflush & CLFLUSH_AFTER) {
			drm_clflush_virt_range(bb->va, bb->obj->base.size);
			bb->clflush &= ~CLFLUSH_AFTER;
		}

		ret = i915_gem_object_set_to_gtt_domain(bb->obj, false);
		if (ret)
			goto err;

		i915_gem_obj_finish_shmem_access(bb->obj);
		bb->accessing = false;

		i915_vma_move_to_active(bb->vma, workload->req, 0);
	}
	return 0;
err:
	release_shadow_batch_buffer(workload);
	return ret;
}

static int update_wa_ctx_2_shadow_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
	struct intel_vgpu_workload *workload = container_of(wa_ctx,
					struct intel_vgpu_workload,
					wa_ctx);
	int ring_id = workload->ring_id;
	struct intel_vgpu_submission *s = &workload->vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	struct drm_i915_gem_object *ctx_obj =
		shadow_ctx->engine[ring_id].state->obj;
	struct execlist_ring_context *shadow_ring_context;
	struct page *page;

	page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
	shadow_ring_context = kmap_atomic(page);

	shadow_ring_context->bb_per_ctx_ptr.val =
		(shadow_ring_context->bb_per_ctx_ptr.val &
		(~PER_CTX_ADDR_MASK)) | wa_ctx->per_ctx.shadow_gma;
	shadow_ring_context->rcs_indirect_ctx.val =
		(shadow_ring_context->rcs_indirect_ctx.val &
		(~INDIRECT_CTX_ADDR_MASK)) | wa_ctx->indirect_ctx.shadow_gma;

	kunmap_atomic(shadow_ring_context);
	return 0;
}

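/*
 * Pin the shadow indirect context into the GGTT and propagate the shadow
 * graphics memory addresses of the indirect and per-context batch buffers
 * into the shadow ring context.
 */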
static int prepare_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
	struct i915_vma *vma;
	unsigned char *per_ctx_va =
		(unsigned char *)wa_ctx->indirect_ctx.shadow_va +
		wa_ctx->indirect_ctx.size;

	if (wa_ctx->indirect_ctx.size == 0)
		return 0;

	vma = i915_gem_object_ggtt_pin(wa_ctx->indirect_ctx.obj, NULL,
				       0, CACHELINE_BYTES, 0);
	if (IS_ERR(vma))
		return PTR_ERR(vma);

	/* FIXME: we are not tracking our pinned VMA leaving it
	 * up to the core to fix up the stray pin_count upon
	 * free.
	 */

	wa_ctx->indirect_ctx.shadow_gma = i915_ggtt_offset(vma);

	wa_ctx->per_ctx.shadow_gma = *((unsigned int *)per_ctx_va + 1);
	memset(per_ctx_va, 0, CACHELINE_BYTES);

	update_wa_ctx_2_shadow_ctx(wa_ctx);
	return 0;
}

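/*
 * Tear down the shadow batch buffers of a workload: finish any pending
 * shmem access, unmap and unpin each shadow object and free the per-buffer
 * tracking structures.
 */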
static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	struct intel_vgpu_shadow_bb *bb, *pos;

	if (list_empty(&workload->shadow_bb))
		return;

	bb = list_first_entry(&workload->shadow_bb,
			struct intel_vgpu_shadow_bb, list);

	mutex_lock(&dev_priv->drm.struct_mutex);

	list_for_each_entry_safe(bb, pos, &workload->shadow_bb, list) {
		if (bb->obj) {
			if (bb->accessing)
				i915_gem_obj_finish_shmem_access(bb->obj);

			if (bb->va && !IS_ERR(bb->va))
				i915_gem_object_unpin_map(bb->obj);

			if (bb->vma && !IS_ERR(bb->vma)) {
				i915_vma_unpin(bb->vma);
				i915_vma_close(bb->vma);
			}
			__i915_gem_object_release_unless_active(bb->obj);
		}
		list_del(&bb->list);
		kfree(bb);
	}

	mutex_unlock(&dev_priv->drm.struct_mutex);
}

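/*
 * Prepare a workload for dispatch: pin the shadow page tables, sync
 * out-of-sync guest pages, flush post-shadowed entries, pin the shadow
 * batch buffers and the shadow wa_ctx, then call the submission-specific
 * prepare() callback if one is set.
 */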
static int prepare_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	int ret = 0;

	ret = intel_vgpu_pin_mm(workload->shadow_mm);
	if (ret) {
		gvt_vgpu_err("fail to vgpu pin mm\n");
		return ret;
	}

	ret = intel_vgpu_sync_oos_pages(workload->vgpu);
	if (ret) {
		gvt_vgpu_err("fail to vgpu sync oos pages\n");
		goto err_unpin_mm;
	}

	ret = intel_vgpu_flush_post_shadow(workload->vgpu);
	if (ret) {
		gvt_vgpu_err("fail to flush post shadow\n");
		goto err_unpin_mm;
	}

	ret = prepare_shadow_batch_buffer(workload);
	if (ret) {
		gvt_vgpu_err("fail to prepare_shadow_batch_buffer\n");
		goto err_unpin_mm;
	}

	ret = prepare_shadow_wa_ctx(&workload->wa_ctx);
	if (ret) {
		gvt_vgpu_err("fail to prepare_shadow_wa_ctx\n");
		goto err_shadow_batch;
	}

	if (workload->prepare) {
		ret = workload->prepare(workload);
		if (ret)
			goto err_shadow_wa_ctx;
	}

	return 0;
err_shadow_wa_ctx:
	release_shadow_wa_ctx(&workload->wa_ctx);
err_shadow_batch:
	release_shadow_batch_buffer(workload);
err_unpin_mm:
	intel_vgpu_unpin_mm(workload->shadow_mm);
	return ret;
}

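/*
 * Dispatch a workload to i915: scan and shadow it, prepare its resources
 * and submit the resulting request. Any error is stored in workload->status
 * so that completion handling can report it back to the guest.
 */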
static int dispatch_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	int ring_id = workload->ring_id;
	struct intel_engine_cs *engine = dev_priv->engine[ring_id];
	int ret = 0;

	gvt_dbg_sched("ring id %d prepare to dispatch workload %p\n",
		ring_id, workload);

	mutex_lock(&dev_priv->drm.struct_mutex);

	ret = intel_gvt_scan_and_shadow_workload(workload);
	if (ret)
		goto out;

	ret = prepare_workload(workload);
	if (ret) {
		engine->context_unpin(engine, shadow_ctx);
		goto out;
	}

out:
	if (ret)
		workload->status = ret;

	if (!IS_ERR_OR_NULL(workload->req)) {
		gvt_dbg_sched("ring id %d submit workload to i915 %p\n",
			ring_id, workload->req);
		i915_add_request(workload->req);
		workload->dispatched = true;
	}

	mutex_unlock(&dev_priv->drm.struct_mutex);
	return ret;
}

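/*
 * Pick the next workload for a ring. Bail out (return NULL) if there is no
 * current vGPU, a reschedule is pending or the queue is empty. If a current
 * workload is still set it is returned again for resubmission; otherwise
 * the head of the current vGPU's queue becomes the ring's current workload.
 */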
static struct intel_vgpu_workload *pick_next_workload(
		struct intel_gvt *gvt, int ring_id)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_vgpu_workload *workload = NULL;

	mutex_lock(&gvt->lock);

	/*
	 * no current vgpu / will be scheduled out / no workload
	 * bail out
	 */
	if (!scheduler->current_vgpu) {
		gvt_dbg_sched("ring id %d stop - no current vgpu\n", ring_id);
		goto out;
	}

	if (scheduler->need_reschedule) {
		gvt_dbg_sched("ring id %d stop - will reschedule\n", ring_id);
		goto out;
	}

	if (list_empty(workload_q_head(scheduler->current_vgpu, ring_id)))
		goto out;

	/*
	 * still have current workload, maybe the workload dispatcher
	 * failed to submit it for some reason; resubmit it.
	 */
	if (scheduler->current_workload[ring_id]) {
		workload = scheduler->current_workload[ring_id];
		gvt_dbg_sched("ring id %d still have current workload %p\n",
				ring_id, workload);
		goto out;
	}

	/*
	 * pick a workload as current workload
	 * once current workload is set, schedule policy routines
	 * will wait until the current workload is finished when trying to
	 * schedule out a vgpu.
	 */
	scheduler->current_workload[ring_id] = container_of(
			workload_q_head(scheduler->current_vgpu, ring_id)->next,
			struct intel_vgpu_workload, list);

	workload = scheduler->current_workload[ring_id];

	gvt_dbg_sched("ring id %d pick new workload %p\n", ring_id, workload);

	atomic_inc(&workload->vgpu->submission.running_workload_num);
out:
	mutex_unlock(&gvt->lock);
	return workload;
}

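/*
 * Write the shadow context back into the guest context after the workload
 * has completed: copy the context pages, the new ring head and the shadowed
 * ring context registers to guest memory.
 */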
static void update_guest_context(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_gvt *gvt = vgpu->gvt;
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct i915_gem_context *shadow_ctx = s->shadow_ctx;
	int ring_id = workload->ring_id;
	struct drm_i915_gem_object *ctx_obj =
		shadow_ctx->engine[ring_id].state->obj;
	struct execlist_ring_context *shadow_ring_context;
	struct page *page;
	void *src;
	unsigned long context_gpa, context_page_num;
	int i;

	gvt_dbg_sched("ring id %d workload lrca %x\n", ring_id,
			workload->ctx_desc.lrca);

	context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

	context_page_num = context_page_num >> PAGE_SHIFT;

	if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
		context_page_num = 19;

	i = 2;

	while (i < context_page_num) {
		context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
				(u32)((workload->ctx_desc.lrca + i) <<
					GTT_PAGE_SHIFT));
		if (context_gpa == INTEL_GVT_INVALID_ADDR) {
			gvt_vgpu_err("invalid guest context descriptor\n");
			return;
		}

		page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
		src = kmap(page);
		intel_gvt_hypervisor_write_gpa(vgpu, context_gpa, src,
				GTT_PAGE_SIZE);
		kunmap(page);
		i++;
	}

	intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa +
		RING_CTX_OFF(ring_header.val), &workload->rb_tail, 4);

	page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
	shadow_ring_context = kmap(page);

#define COPY_REG(name) \
	intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa + \
		RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

	COPY_REG(ctx_ctrl);
	COPY_REG(ctx_timestamp);

#undef COPY_REG

	intel_gvt_hypervisor_write_gpa(vgpu,
			workload->ring_context_gpa +
			sizeof(*shadow_ring_context),
			(void *)shadow_ring_context +
			sizeof(*shadow_ring_context),
			GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

	kunmap(page);
}

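/*
 * Destroy all workloads still queued for the engines in engine_mask and
 * clear their shadow context descriptor update bits. Used when emulating a
 * vGPU hang and when resetting engines.
 */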
static void clean_workloads(struct intel_vgpu *vgpu, unsigned long engine_mask)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	struct intel_engine_cs *engine;
	struct intel_vgpu_workload *pos, *n;
	unsigned int tmp;

	/* free the unsubmitted workloads in the queues. */
	for_each_engine_masked(engine, dev_priv, engine_mask, tmp) {
		list_for_each_entry_safe(pos, n,
			&s->workload_q_head[engine->id], list) {
			list_del_init(&pos->list);
			intel_vgpu_destroy_workload(pos);
		}
		clear_bit(engine->id, s->shadow_ctx_desc_updated);
	}
}

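/*
 * Complete the current workload of a ring: wait until the shadow context is
 * off the hardware, propagate the request status, write the shadow context
 * back to the guest and release shadow resources. A failed workload is
 * turned into an emulated vGPU hang by dropping the remaining queued
 * workloads.
 */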
static void complete_current_workload(struct intel_gvt *gvt, int ring_id)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_vgpu_workload *workload =
		scheduler->current_workload[ring_id];
	struct intel_vgpu *vgpu = workload->vgpu;
	struct intel_vgpu_submission *s = &vgpu->submission;
	int event;

	mutex_lock(&gvt->lock);

	/* For a workload with a request, wait for the context switch to
	 * make sure the request is completed.
	 * For a workload without a request, complete it directly.
	 */
	if (workload->req) {
		struct drm_i915_private *dev_priv =
			workload->vgpu->gvt->dev_priv;
		struct intel_engine_cs *engine =
			dev_priv->engine[workload->ring_id];
		wait_event(workload->shadow_ctx_status_wq,
			   !atomic_read(&workload->shadow_ctx_active));

		/* If this request caused a GPU hang, req->fence.error will
		 * be set to -EIO. Propagate -EIO to the workload status so
		 * that a request which hung the GPU does not trigger a
		 * context switch interrupt to the guest.
		 */
		if (likely(workload->status == -EINPROGRESS)) {
			if (workload->req->fence.error == -EIO)
				workload->status = -EIO;
			else
				workload->status = 0;
		}

		i915_gem_request_put(fetch_and_zero(&workload->req));

		if (!workload->status && !(vgpu->resetting_eng &
					   ENGINE_MASK(ring_id))) {
			update_guest_context(workload);

			for_each_set_bit(event, workload->pending_events,
					 INTEL_GVT_EVENT_MAX)
				intel_vgpu_trigger_virtual_event(vgpu, event);
		}
		mutex_lock(&dev_priv->drm.struct_mutex);
		/* unpin shadow ctx as the shadow_ctx update is done */
		engine->context_unpin(engine, s->shadow_ctx);
		mutex_unlock(&dev_priv->drm.struct_mutex);
	}

	gvt_dbg_sched("ring id %d complete workload %p status %d\n",
			ring_id, workload, workload->status);

	scheduler->current_workload[ring_id] = NULL;

	list_del_init(&workload->list);

	if (!workload->status) {
		release_shadow_batch_buffer(workload);
		release_shadow_wa_ctx(&workload->wa_ctx);
	}

	if (workload->status || (vgpu->resetting_eng & ENGINE_MASK(ring_id))) {
		/* An unsuccessful workload->status means the GPU hung or
		 * something went wrong in i915/GVT, and GVT won't inject a
		 * context switch interrupt to the guest. To the guest this
		 * error is effectively a vGPU hang, so emulate one: if there
		 * are pending workloads already submitted by the guest,
		 * clean them up the way real hardware would.
		 *
		 * If we are in the middle of an engine reset, the pending
		 * workloads won't be submitted to the hardware and will be
		 * cleaned up later in the reset path, so cleaning them up
		 * here has no adverse impact.
		 */
		clean_workloads(vgpu, ENGINE_MASK(ring_id));
	}

	workload->complete(workload);

	atomic_dec(&s->running_workload_num);
	wake_up(&scheduler->workload_complete_wq);

	if (gvt->scheduler.need_reschedule)
		intel_gvt_request_service(gvt, INTEL_GVT_REQUEST_EVENT_SCHED);

	mutex_unlock(&gvt->lock);
}

struct workload_thread_param {
	struct intel_gvt *gvt;
	int ring_id;
};

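/*
 * Per-engine scheduler thread: wait until a workload is available, dispatch
 * it with runtime PM (and forcewake on SKL/KBL) held, wait for the request
 * to finish and then complete the workload. A dispatch error that marks the
 * vGPU unhealthy puts the vGPU into failsafe mode.
 */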
static int workload_thread(void *priv)
{
	struct workload_thread_param *p = (struct workload_thread_param *)priv;
	struct intel_gvt *gvt = p->gvt;
	int ring_id = p->ring_id;
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_vgpu_workload *workload = NULL;
	struct intel_vgpu *vgpu = NULL;
	int ret;
	bool need_force_wake = IS_SKYLAKE(gvt->dev_priv)
			|| IS_KABYLAKE(gvt->dev_priv);
	DEFINE_WAIT_FUNC(wait, woken_wake_function);

	kfree(p);

	gvt_dbg_core("workload thread for ring %d started\n", ring_id);

	while (!kthread_should_stop()) {
		add_wait_queue(&scheduler->waitq[ring_id], &wait);
		do {
			workload = pick_next_workload(gvt, ring_id);
			if (workload)
				break;
			wait_woken(&wait, TASK_INTERRUPTIBLE,
				   MAX_SCHEDULE_TIMEOUT);
		} while (!kthread_should_stop());
		remove_wait_queue(&scheduler->waitq[ring_id], &wait);

		if (!workload)
			break;

		gvt_dbg_sched("ring id %d next workload %p vgpu %d\n",
				workload->ring_id, workload,
				workload->vgpu->id);

		intel_runtime_pm_get(gvt->dev_priv);

		gvt_dbg_sched("ring id %d will dispatch workload %p\n",
				workload->ring_id, workload);

		if (need_force_wake)
			intel_uncore_forcewake_get(gvt->dev_priv,
					FORCEWAKE_ALL);

		mutex_lock(&gvt->lock);
		ret = dispatch_workload(workload);
		mutex_unlock(&gvt->lock);

		if (ret) {
			vgpu = workload->vgpu;
			gvt_vgpu_err("fail to dispatch workload, skip\n");
			goto complete;
		}

		gvt_dbg_sched("ring id %d wait workload %p\n",
				workload->ring_id, workload);
		i915_wait_request(workload->req, 0, MAX_SCHEDULE_TIMEOUT);

complete:
		gvt_dbg_sched("will complete workload %p, status: %d\n",
				workload, workload->status);

		complete_current_workload(gvt, ring_id);

		if (need_force_wake)
			intel_uncore_forcewake_put(gvt->dev_priv,
					FORCEWAKE_ALL);

		intel_runtime_pm_put(gvt->dev_priv);
		if (ret && (vgpu_is_vm_unhealthy(ret)))
			enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
	}
	return 0;
}

void intel_gvt_wait_vgpu_idle(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct intel_gvt *gvt = vgpu->gvt;
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;

	if (atomic_read(&s->running_workload_num)) {
		gvt_dbg_sched("wait vgpu idle\n");

		wait_event(scheduler->workload_complete_wq,
				!atomic_read(&s->running_workload_num));
	}
}

void intel_gvt_clean_workload_scheduler(struct intel_gvt *gvt)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct intel_engine_cs *engine;
	enum intel_engine_id i;

	gvt_dbg_core("clean workload scheduler\n");

	for_each_engine(engine, gvt->dev_priv, i) {
		atomic_notifier_chain_unregister(
					&engine->context_status_notifier,
					&gvt->shadow_ctx_notifier_block[i]);
		kthread_stop(scheduler->thread[i]);
	}
}

int intel_gvt_init_workload_scheduler(struct intel_gvt *gvt)
{
	struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
	struct workload_thread_param *param = NULL;
	struct intel_engine_cs *engine;
	enum intel_engine_id i;
	int ret;

	gvt_dbg_core("init workload scheduler\n");

	init_waitqueue_head(&scheduler->workload_complete_wq);

	for_each_engine(engine, gvt->dev_priv, i) {
		init_waitqueue_head(&scheduler->waitq[i]);

		param = kzalloc(sizeof(*param), GFP_KERNEL);
		if (!param) {
			ret = -ENOMEM;
			goto err;
		}

		param->gvt = gvt;
		param->ring_id = i;

		scheduler->thread[i] = kthread_run(workload_thread, param,
			"gvt workload %d", i);
		if (IS_ERR(scheduler->thread[i])) {
			gvt_err("fail to create workload thread\n");
			ret = PTR_ERR(scheduler->thread[i]);
			goto err;
		}

		gvt->shadow_ctx_notifier_block[i].notifier_call =
					shadow_context_status_change;
		atomic_notifier_chain_register(&engine->context_status_notifier,
					&gvt->shadow_ctx_notifier_block[i]);
	}
	return 0;
err:
	intel_gvt_clean_workload_scheduler(gvt);
	kfree(param);
	param = NULL;
	return ret;
}

/**
 * intel_vgpu_clean_submission - free submission-related resource for vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being destroyed.
 *
 */
void intel_vgpu_clean_submission(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;

	intel_vgpu_select_submission_ops(vgpu, 0);
	i915_gem_context_put(s->shadow_ctx);
	kmem_cache_destroy(s->workloads);
}

/**
 * intel_vgpu_reset_submission - reset submission-related resource for vGPU
 * @vgpu: a vGPU
 * @engine_mask: engines expected to be reset
 *
 * This function is called when a vGPU is being reset.
 *
 */
void intel_vgpu_reset_submission(struct intel_vgpu *vgpu,
		unsigned long engine_mask)
{
	struct intel_vgpu_submission *s = &vgpu->submission;

	if (!s->active)
		return;

	clean_workloads(vgpu, engine_mask);
	s->ops->reset(vgpu, engine_mask);
}

/**
 * intel_vgpu_setup_submission - setup submission-related resource for vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being created.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_setup_submission(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	enum intel_engine_id i;
	struct intel_engine_cs *engine;
	int ret;

	s->shadow_ctx = i915_gem_context_create_gvt(
			&vgpu->gvt->dev_priv->drm);
	if (IS_ERR(s->shadow_ctx))
		return PTR_ERR(s->shadow_ctx);

	bitmap_zero(s->shadow_ctx_desc_updated, I915_NUM_ENGINES);

	s->workloads = kmem_cache_create("gvt-g_vgpu_workload",
			sizeof(struct intel_vgpu_workload), 0,
			SLAB_HWCACHE_ALIGN,
			NULL);

	if (!s->workloads) {
		ret = -ENOMEM;
		goto out_shadow_ctx;
	}

	for_each_engine(engine, vgpu->gvt->dev_priv, i)
		INIT_LIST_HEAD(&s->workload_q_head[i]);

	atomic_set(&s->running_workload_num, 0);
	bitmap_zero(s->tlb_handle_pending, I915_NUM_ENGINES);

	return 0;

out_shadow_ctx:
	i915_gem_context_put(s->shadow_ctx);
	return ret;
}

/**
 * intel_vgpu_select_submission_ops - select virtual submission interface
 * @vgpu: a vGPU
 * @interface: expected vGPU virtual submission interface
 *
 * This function is called when the guest configures the submission interface.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_select_submission_ops(struct intel_vgpu *vgpu,
				     unsigned int interface)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	const struct intel_vgpu_submission_ops *ops[] = {
		[INTEL_VGPU_EXECLIST_SUBMISSION] =
			&intel_vgpu_execlist_submission_ops,
	};
	int ret;

	if (WARN_ON(interface >= ARRAY_SIZE(ops)))
		return -EINVAL;

	if (s->active) {
		s->ops->clean(vgpu);
		s->active = false;
		gvt_dbg_core("vgpu%d: de-select ops [ %s ] \n",
				vgpu->id, s->ops->name);
	}

	if (interface == 0) {
		s->ops = NULL;
		s->virtual_submission_interface = 0;
		gvt_dbg_core("vgpu%d: no submission ops\n", vgpu->id);
		return 0;
	}

	ret = ops[interface]->init(vgpu);
	if (ret)
		return ret;

	s->ops = ops[interface];
	s->virtual_submission_interface = interface;
	s->active = true;

	gvt_dbg_core("vgpu%d: activate ops [ %s ]\n",
			vgpu->id, s->ops->name);

	return 0;
}

/**
 * intel_vgpu_destroy_workload - destroy a vGPU workload
 * @vgpu: a vGPU
 *
 * This function is called when destroying a vGPU workload.
 *
 */
void intel_vgpu_destroy_workload(struct intel_vgpu_workload *workload)
{
	struct intel_vgpu_submission *s = &workload->vgpu->submission;

	if (workload->shadow_mm)
		intel_gvt_mm_unreference(workload->shadow_mm);

	kmem_cache_free(s->workloads, workload);
}

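/*
 * Allocate a workload from the vGPU's workload slab and initialise its list
 * heads, wait queue and initial state (-EINPROGRESS, not yet shadowed).
 */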
static struct intel_vgpu_workload *
alloc_workload(struct intel_vgpu *vgpu)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct intel_vgpu_workload *workload;

	workload = kmem_cache_zalloc(s->workloads, GFP_KERNEL);
	if (!workload)
		return ERR_PTR(-ENOMEM);

	INIT_LIST_HEAD(&workload->list);
	INIT_LIST_HEAD(&workload->shadow_bb);

	init_waitqueue_head(&workload->shadow_ctx_status_wq);
	atomic_set(&workload->shadow_ctx_active, 0);

	workload->status = -EINPROGRESS;
	workload->shadowed = false;
	workload->vgpu = vgpu;

	return workload;
}

#define RING_CTX_OFF(x) \
	offsetof(struct execlist_ring_context, x)

static void read_guest_pdps(struct intel_vgpu *vgpu,
		u64 ring_context_gpa, u32 pdp[8])
{
	u64 gpa;
	int i;

	gpa = ring_context_gpa + RING_CTX_OFF(pdp3_UDW.val);

	for (i = 0; i < 8; i++)
		intel_gvt_hypervisor_read_gpa(vgpu,
				gpa + i * 8, &pdp[7 - i], 4);
}

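/*
 * Resolve the shadow PPGTT mm for a workload from the guest PDPs in its
 * ring context: reuse a matching shadow mm if one exists, otherwise create
 * a new one. Only legacy 32-bit and 64-bit addressing modes are supported.
 */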
static int prepare_mm(struct intel_vgpu_workload *workload)
{
	struct execlist_ctx_descriptor_format *desc = &workload->ctx_desc;
	struct intel_vgpu_mm *mm;
	struct intel_vgpu *vgpu = workload->vgpu;
	int page_table_level;
	u32 pdp[8];

	if (desc->addressing_mode == 1) { /* legacy 32-bit */
		page_table_level = 3;
	} else if (desc->addressing_mode == 3) { /* legacy 64 bit */
		page_table_level = 4;
	} else {
		gvt_vgpu_err("Advanced Context mode(SVM) is not supported!\n");
		return -EINVAL;
	}

	read_guest_pdps(workload->vgpu, workload->ring_context_gpa, pdp);

	mm = intel_vgpu_find_ppgtt_mm(workload->vgpu, page_table_level, pdp);
	if (mm) {
		intel_gvt_mm_reference(mm);
	} else {

		mm = intel_vgpu_create_mm(workload->vgpu, INTEL_GVT_MM_PPGTT,
				pdp, page_table_level, 0);
		if (IS_ERR(mm)) {
			gvt_vgpu_err("fail to create mm object.\n");
			return PTR_ERR(mm);
		}
	}
	workload->shadow_mm = mm;
	return 0;
}

#define same_context(a, b) (((a)->context_id == (b)->context_id) && \
		((a)->lrca == (b)->lrca))

#define get_last_workload(q) \
	(list_empty(q) ? NULL : container_of(q->prev, \
	struct intel_vgpu_workload, list))
/**
 * intel_vgpu_create_workload - create a vGPU workload
 * @vgpu: a vGPU
 * @ring_id: ring index the workload is queued on
 * @desc: a guest context descriptor
 *
 * This function is called when creating a vGPU workload.
 *
 * Returns:
 * struct intel_vgpu_workload * on success, negative error code in
 * pointer if failed.
 *
 */
struct intel_vgpu_workload *
intel_vgpu_create_workload(struct intel_vgpu *vgpu, int ring_id,
			   struct execlist_ctx_descriptor_format *desc)
{
	struct intel_vgpu_submission *s = &vgpu->submission;
	struct list_head *q = workload_q_head(vgpu, ring_id);
	struct intel_vgpu_workload *last_workload = get_last_workload(q);
	struct intel_vgpu_workload *workload = NULL;
	struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
	u64 ring_context_gpa;
	u32 head, tail, start, ctl, ctx_ctl, per_ctx, indirect_ctx;
	int ret;

	ring_context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
			(u32)((desc->lrca + 1) << GTT_PAGE_SHIFT));
	if (ring_context_gpa == INTEL_GVT_INVALID_ADDR) {
		gvt_vgpu_err("invalid guest context LRCA: %x\n", desc->lrca);
		return ERR_PTR(-EINVAL);
	}

	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(ring_header.val), &head, 4);

	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(ring_tail.val), &tail, 4);

	head &= RB_HEAD_OFF_MASK;
	tail &= RB_TAIL_OFF_MASK;

	if (last_workload && same_context(&last_workload->ctx_desc, desc)) {
		gvt_dbg_el("ring id %d cur workload == last\n", ring_id);
		gvt_dbg_el("ctx head %x real head %lx\n", head,
				last_workload->rb_tail);
		/*
		 * cannot use guest context head pointer here,
		 * as it might not be updated at this time
		 */
		head = last_workload->rb_tail;
	}

	gvt_dbg_el("ring id %d begin a new workload\n", ring_id);

	/* record some ring buffer register values for scan and shadow */
	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(rb_start.val), &start, 4);
	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(rb_ctrl.val), &ctl, 4);
	intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(ctx_ctrl.val), &ctx_ctl, 4);

	workload = alloc_workload(vgpu);
	if (IS_ERR(workload))
		return workload;

	workload->ring_id = ring_id;
	workload->ctx_desc = *desc;
	workload->ring_context_gpa = ring_context_gpa;
	workload->rb_head = head;
	workload->rb_tail = tail;
	workload->rb_start = start;
	workload->rb_ctl = ctl;

	if (ring_id == RCS) {
		intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(bb_per_ctx_ptr.val), &per_ctx, 4);
		intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
			RING_CTX_OFF(rcs_indirect_ctx.val), &indirect_ctx, 4);

		workload->wa_ctx.indirect_ctx.guest_gma =
			indirect_ctx & INDIRECT_CTX_ADDR_MASK;
		workload->wa_ctx.indirect_ctx.size =
			(indirect_ctx & INDIRECT_CTX_SIZE_MASK) *
			CACHELINE_BYTES;
		workload->wa_ctx.per_ctx.guest_gma =
			per_ctx & PER_CTX_ADDR_MASK;
		workload->wa_ctx.per_ctx.valid = per_ctx & 1;
	}

	gvt_dbg_el("workload %p ring id %d head %x tail %x start %x ctl %x\n",
			workload, ring_id, head, tail, start, ctl);

	ret = prepare_mm(workload);
	if (ret) {
		kmem_cache_free(s->workloads, workload);
		return ERR_PTR(ret);
	}

	/* Only scan and shadow the first workload in the queue
	 * as there is only one pre-allocated buf-obj for shadow.
	 */
	if (list_empty(workload_q_head(vgpu, ring_id))) {
		intel_runtime_pm_get(dev_priv);
		mutex_lock(&dev_priv->drm.struct_mutex);
		ret = intel_gvt_scan_and_shadow_workload(workload);
		mutex_unlock(&dev_priv->drm.struct_mutex);
		intel_runtime_pm_put(dev_priv);
	}

	if (ret && (vgpu_is_vm_unhealthy(ret))) {
		enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
		intel_vgpu_destroy_workload(workload);
		return ERR_PTR(ret);
	}

	return workload;
}