/*
 * Copyright(c) 2011-2016 Intel Corporation. All rights reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Zhi Wang <zhi.a.wang@intel.com>
 *
 * Contributors:
 *    Ping Gao <ping.a.gao@intel.com>
 *    Tina Zhang <tina.zhang@intel.com>
 *    Changbin Du <changbin.du@intel.com>
 *    Min He <min.he@intel.com>
 *    Bing Niu <bing.niu@intel.com>
 *    Zhenyu Wang <zhenyuw@linux.intel.com>
 *
 */

#include <linux/kthread.h>

#include "i915_drv.h"
#include "gvt.h"

#define RING_CTX_OFF(x) \
        offsetof(struct execlist_ring_context, x)

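/* The PDP entries in the execlist ring context are laid out from
 * pdp3_UDW down to pdp0_LDW, so the guest-provided pdp[] array is
 * written back in reverse order below.
 */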
static void set_context_pdp_root_pointer(
                struct execlist_ring_context *ring_context,
                u32 pdp[8])
{
        struct execlist_mmio_pair *pdp_pair = &ring_context->pdp3_UDW;
        int i;

        for (i = 0; i < 8; i++)
                pdp_pair[i].val = pdp[7 - i];
}

static void update_shadow_pdps(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        int ring_id = workload->ring_id;
        struct i915_gem_context *shadow_ctx = vgpu->submission.shadow_ctx;
        struct drm_i915_gem_object *ctx_obj =
                shadow_ctx->engine[ring_id].state->obj;
        struct execlist_ring_context *shadow_ring_context;
        struct page *page;

        if (WARN_ON(!workload->shadow_mm))
                return;

        if (WARN_ON(!atomic_read(&workload->shadow_mm->pincount)))
                return;

        page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
        shadow_ring_context = kmap(page);
        set_context_pdp_root_pointer(shadow_ring_context,
                        (void *)workload->shadow_mm->ppgtt_mm.shadow_pdps);
        kunmap(page);
}

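/* Copy the guest's logical ring context into the shadow context: the
 * per-engine context pages are read from guest memory through the
 * hypervisor GPA interface, then a handful of registers and the rest
 * of the ring context page are copied individually.
 */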
static int populate_shadow_context(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_gvt *gvt = vgpu->gvt;
        int ring_id = workload->ring_id;
        struct i915_gem_context *shadow_ctx = vgpu->submission.shadow_ctx;
        struct drm_i915_gem_object *ctx_obj =
                shadow_ctx->engine[ring_id].state->obj;
        struct execlist_ring_context *shadow_ring_context;
        struct page *page;
        void *dst;
        unsigned long context_gpa, context_page_num;
        int i;

        gvt_dbg_sched("ring id %d workload lrca %x", ring_id,
                        workload->ctx_desc.lrca);

        context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

        context_page_num = context_page_num >> PAGE_SHIFT;

        if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
                context_page_num = 19;

        i = 2;

        while (i < context_page_num) {
                context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
                                (u32)((workload->ctx_desc.lrca + i) <<
                                I915_GTT_PAGE_SHIFT));
                if (context_gpa == INTEL_GVT_INVALID_ADDR) {
                        gvt_vgpu_err("Invalid guest context descriptor\n");
                        return -EFAULT;
                }

                page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
                dst = kmap(page);
                intel_gvt_hypervisor_read_gpa(vgpu, context_gpa, dst,
                                I915_GTT_PAGE_SIZE);
                kunmap(page);
                i++;
        }

        page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
        shadow_ring_context = kmap(page);

#define COPY_REG(name) \
        intel_gvt_hypervisor_read_gpa(vgpu, workload->ring_context_gpa \
                + RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

        COPY_REG(ctx_ctrl);
        COPY_REG(ctx_timestamp);

        if (ring_id == RCS) {
                COPY_REG(bb_per_ctx_ptr);
                COPY_REG(rcs_indirect_ctx);
                COPY_REG(rcs_indirect_ctx_offset);
        }
#undef COPY_REG

        intel_gvt_hypervisor_read_gpa(vgpu,
                        workload->ring_context_gpa +
                        sizeof(*shadow_ring_context),
                        (void *)shadow_ring_context +
                        sizeof(*shadow_ring_context),
                        I915_GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

        kunmap(page);
        return 0;
}

static inline bool is_gvt_request(struct i915_request *req)
{
        return i915_gem_context_force_single_submission(req->ctx);
}

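/* Snapshot hardware status registers (INSTDONE/ACTHD) into the vGPU's
 * virtual register file when a workload leaves the hardware, so the
 * guest reads back post-execution values instead of stale ones.
 */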
static void save_ring_hw_state(struct intel_vgpu *vgpu, int ring_id)
{
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        u32 ring_base = dev_priv->engine[ring_id]->mmio_base;
        i915_reg_t reg;

        reg = RING_INSTDONE(ring_base);
        vgpu_vreg(vgpu, i915_mmio_reg_offset(reg)) = I915_READ_FW(reg);
        reg = RING_ACTHD(ring_base);
        vgpu_vreg(vgpu, i915_mmio_reg_offset(reg)) = I915_READ_FW(reg);
        reg = RING_ACTHD_UDW(ring_base);
        vgpu_vreg(vgpu, i915_mmio_reg_offset(reg)) = I915_READ_FW(reg);
}

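/* Notifier called by i915 on context status changes. For non-GVT
 * requests it only switches engine MMIO state back to the host when a
 * host context is scheduled in over a vGPU owner; for GVT requests it
 * performs the vGPU MMIO context switch, saves ring HW state on
 * schedule-out/preemption, and tracks shadow_ctx_active so that
 * complete_current_workload() can wait for the switch to finish.
 */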
static int shadow_context_status_change(struct notifier_block *nb,
                unsigned long action, void *data)
{
        struct i915_request *req = data;
        struct intel_gvt *gvt = container_of(nb, struct intel_gvt,
                                shadow_ctx_notifier_block[req->engine->id]);
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        enum intel_engine_id ring_id = req->engine->id;
        struct intel_vgpu_workload *workload;
        unsigned long flags;

        if (!is_gvt_request(req)) {
                spin_lock_irqsave(&scheduler->mmio_context_lock, flags);
                if (action == INTEL_CONTEXT_SCHEDULE_IN &&
                    scheduler->engine_owner[ring_id]) {
                        /* Switch ring from vGPU to host. */
                        intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
                                              NULL, ring_id);
                        scheduler->engine_owner[ring_id] = NULL;
                }
                spin_unlock_irqrestore(&scheduler->mmio_context_lock, flags);

                return NOTIFY_OK;
        }

        workload = scheduler->current_workload[ring_id];
        if (unlikely(!workload))
                return NOTIFY_OK;

        switch (action) {
        case INTEL_CONTEXT_SCHEDULE_IN:
                spin_lock_irqsave(&scheduler->mmio_context_lock, flags);
                if (workload->vgpu != scheduler->engine_owner[ring_id]) {
                        /* Switch ring from host to vGPU or vGPU to vGPU. */
                        intel_gvt_switch_mmio(scheduler->engine_owner[ring_id],
                                              workload->vgpu, ring_id);
                        scheduler->engine_owner[ring_id] = workload->vgpu;
                } else
                        gvt_dbg_sched("skip ring %d mmio switch for vgpu%d\n",
                                      ring_id, workload->vgpu->id);
                spin_unlock_irqrestore(&scheduler->mmio_context_lock, flags);
                atomic_set(&workload->shadow_ctx_active, 1);
                break;
        case INTEL_CONTEXT_SCHEDULE_OUT:
                save_ring_hw_state(workload->vgpu, ring_id);
                atomic_set(&workload->shadow_ctx_active, 0);
                break;
        case INTEL_CONTEXT_SCHEDULE_PREEMPTED:
                save_ring_hw_state(workload->vgpu, ring_id);
                break;
        default:
                WARN_ON(1);
                return NOTIFY_OK;
        }
        wake_up(&workload->shadow_ctx_status_wq);
        return NOTIFY_OK;
}

static void shadow_context_descriptor_update(struct i915_gem_context *ctx,
                struct intel_engine_cs *engine)
{
        struct intel_context *ce = &ctx->engine[engine->id];
        u64 desc = 0;

        desc = ce->lrc_desc;

        /* Update bits 0-11 of the context descriptor which includes flags
         * like GEN8_CTX_* cached in desc_template
         */
        desc &= U64_MAX << 12;
        desc |= ctx->desc_template & ((1ULL << 12) - 1);

        ce->lrc_desc = desc;
}

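/* Copy the already-scanned guest ring buffer contents into space
 * reserved on the shadow (i915) ring via intel_ring_begin(), and
 * repoint workload->shadow_ring_buffer_va at the copy.
 */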
static int copy_workload_to_ring_buffer(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        void *shadow_ring_buffer_va;
        u32 *cs;
        struct i915_request *req = workload->req;

        if (IS_KABYLAKE(req->i915) &&
            is_inhibit_context(req->ctx, req->engine->id))
                intel_vgpu_restore_inhibit_context(vgpu, req);

        /* allocate shadow ring buffer */
        cs = intel_ring_begin(workload->req, workload->rb_len / sizeof(u32));
        if (IS_ERR(cs)) {
                gvt_vgpu_err("fail to alloc size =%ld shadow ring buffer\n",
                        workload->rb_len);
                return PTR_ERR(cs);
        }

        shadow_ring_buffer_va = workload->shadow_ring_buffer_va;

        /* get shadow ring buffer va */
        workload->shadow_ring_buffer_va = cs;

        memcpy(cs, shadow_ring_buffer_va,
                        workload->rb_len);

        cs += workload->rb_len / sizeof(u32);
        intel_ring_advance(workload->req, cs);

        return 0;
}

static void release_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
        if (!wa_ctx->indirect_ctx.obj)
                return;

        i915_gem_object_unpin_map(wa_ctx->indirect_ctx.obj);
        i915_gem_object_put(wa_ctx->indirect_ctx.obj);
}

/**
 * intel_gvt_scan_and_shadow_workload - audit the workload by scanning it and
 * shadowing it as well, including the ring buffer, wa_ctx and ctx.
 * @workload: an abstract entity for each execlist submission.
 *
 * This function is called before the workload is submitted to i915, to make
 * sure the content of the workload is valid.
 */
int intel_gvt_scan_and_shadow_workload(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        int ring_id = workload->ring_id;
        struct intel_engine_cs *engine = dev_priv->engine[ring_id];
        struct intel_ring *ring;
        int ret;

        lockdep_assert_held(&dev_priv->drm.struct_mutex);

        if (workload->shadowed)
                return 0;

        shadow_ctx->desc_template &= ~(0x3 << GEN8_CTX_ADDRESSING_MODE_SHIFT);
        shadow_ctx->desc_template |= workload->ctx_desc.addressing_mode <<
                                     GEN8_CTX_ADDRESSING_MODE_SHIFT;

        if (!test_and_set_bit(ring_id, s->shadow_ctx_desc_updated))
                shadow_context_descriptor_update(shadow_ctx,
                                        dev_priv->engine[ring_id]);

        ret = intel_gvt_scan_and_shadow_ringbuffer(workload);
        if (ret)
                goto err_scan;

        if ((workload->ring_id == RCS) &&
            (workload->wa_ctx.indirect_ctx.size != 0)) {
                ret = intel_gvt_scan_and_shadow_wa_ctx(&workload->wa_ctx);
                if (ret)
                        goto err_scan;
        }

        /* Pin the shadow context by GVT even though the shadow context will
         * be pinned when i915 allocates a request. That is because GVT will
         * update the guest context from the shadow context when a workload
         * is completed, and at that moment i915 may already have unpinned
         * the shadow context, making the shadow_ctx pages invalid. So GVT
         * needs to pin it by itself. After the guest context is updated,
         * GVT can unpin the shadow_ctx safely.
         */
        ring = engine->context_pin(engine, shadow_ctx);
        if (IS_ERR(ring)) {
                ret = PTR_ERR(ring);
                gvt_vgpu_err("fail to pin shadow context\n");
                goto err_shadow;
        }

        ret = populate_shadow_context(workload);
        if (ret)
                goto err_unpin;
        workload->shadowed = true;
        return 0;

err_unpin:
        engine->context_unpin(engine, shadow_ctx);
err_shadow:
        release_shadow_wa_ctx(&workload->wa_ctx);
err_scan:
        return ret;
}

static int intel_gvt_generate_request(struct intel_vgpu_workload *workload)
{
        int ring_id = workload->ring_id;
        struct drm_i915_private *dev_priv = workload->vgpu->gvt->dev_priv;
        struct intel_engine_cs *engine = dev_priv->engine[ring_id];
        struct i915_request *rq;
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        int ret;

        rq = i915_request_alloc(dev_priv->engine[ring_id], shadow_ctx);
        if (IS_ERR(rq)) {
                gvt_vgpu_err("fail to allocate gem request\n");
                ret = PTR_ERR(rq);
                goto err_unpin;
        }

        gvt_dbg_sched("ring id %d get i915 gem request %p\n", ring_id, rq);

        workload->req = i915_request_get(rq);
        ret = copy_workload_to_ring_buffer(workload);
        if (ret)
                goto err_unpin;
        return 0;

err_unpin:
        engine->context_unpin(engine, shadow_ctx);
        release_shadow_wa_ctx(&workload->wa_ctx);
        return ret;
}

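/* Pin every shadow batch buffer into the GGTT and patch the shadowed
 * MI_BATCH_BUFFER_START command (bb_start_cmd_va) to point at the
 * shadow copy instead of the guest's original batch buffer.
 */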
static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload);

static int prepare_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
        struct intel_gvt *gvt = workload->vgpu->gvt;
        const int gmadr_bytes = gvt->device_info.gmadr_bytes_in_cmd;
        struct intel_vgpu_shadow_bb *bb;
        int ret;

        list_for_each_entry(bb, &workload->shadow_bb, list) {
                bb->vma = i915_gem_object_ggtt_pin(bb->obj, NULL, 0, 0, 0);
                if (IS_ERR(bb->vma)) {
                        ret = PTR_ERR(bb->vma);
                        goto err;
                }

                /* relocate shadow batch buffer */
                bb->bb_start_cmd_va[1] = i915_ggtt_offset(bb->vma);
                if (gmadr_bytes == 8)
                        bb->bb_start_cmd_va[2] = 0;

                /* No one is going to touch shadow bb from now on. */
                if (bb->clflush & CLFLUSH_AFTER) {
                        drm_clflush_virt_range(bb->va, bb->obj->base.size);
                        bb->clflush &= ~CLFLUSH_AFTER;
                }

                ret = i915_gem_object_set_to_gtt_domain(bb->obj, false);
                if (ret)
                        goto err;

                i915_gem_obj_finish_shmem_access(bb->obj);
                bb->accessing = false;

                i915_vma_move_to_active(bb->vma, workload->req, 0);
        }
        return 0;
err:
        release_shadow_batch_buffer(workload);
        return ret;
}

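/* Patch the indirect-context and per-context workaround batch
 * pointers in the shadow ring context so they reference the shadowed
 * wa_ctx buffers rather than the guest graphics addresses.
 */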
static int update_wa_ctx_2_shadow_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
        struct intel_vgpu_workload *workload = container_of(wa_ctx,
                                        struct intel_vgpu_workload,
                                        wa_ctx);
        int ring_id = workload->ring_id;
        struct intel_vgpu_submission *s = &workload->vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        struct drm_i915_gem_object *ctx_obj =
                shadow_ctx->engine[ring_id].state->obj;
        struct execlist_ring_context *shadow_ring_context;
        struct page *page;

        page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
        shadow_ring_context = kmap_atomic(page);

        shadow_ring_context->bb_per_ctx_ptr.val =
                (shadow_ring_context->bb_per_ctx_ptr.val &
                (~PER_CTX_ADDR_MASK)) | wa_ctx->per_ctx.shadow_gma;
        shadow_ring_context->rcs_indirect_ctx.val =
                (shadow_ring_context->rcs_indirect_ctx.val &
                (~INDIRECT_CTX_ADDR_MASK)) | wa_ctx->indirect_ctx.shadow_gma;

        kunmap_atomic(shadow_ring_context);
        return 0;
}

static int prepare_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
{
        struct i915_vma *vma;
        unsigned char *per_ctx_va =
                (unsigned char *)wa_ctx->indirect_ctx.shadow_va +
                wa_ctx->indirect_ctx.size;

        if (wa_ctx->indirect_ctx.size == 0)
                return 0;

        vma = i915_gem_object_ggtt_pin(wa_ctx->indirect_ctx.obj, NULL,
                                       0, CACHELINE_BYTES, 0);
        if (IS_ERR(vma))
                return PTR_ERR(vma);

        /* FIXME: we are not tracking our pinned VMA leaving it
         * up to the core to fix up the stray pin_count upon
         * free.
         */

        wa_ctx->indirect_ctx.shadow_gma = i915_ggtt_offset(vma);

        wa_ctx->per_ctx.shadow_gma = *((unsigned int *)per_ctx_va + 1);
        memset(per_ctx_va, 0, CACHELINE_BYTES);

        update_wa_ctx_2_shadow_ctx(wa_ctx);
        return 0;
}

static void release_shadow_batch_buffer(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        struct intel_vgpu_shadow_bb *bb, *pos;

        if (list_empty(&workload->shadow_bb))
                return;

        bb = list_first_entry(&workload->shadow_bb,
                        struct intel_vgpu_shadow_bb, list);

        mutex_lock(&dev_priv->drm.struct_mutex);

        list_for_each_entry_safe(bb, pos, &workload->shadow_bb, list) {
                if (bb->obj) {
                        if (bb->accessing)
                                i915_gem_obj_finish_shmem_access(bb->obj);

                        if (bb->va && !IS_ERR(bb->va))
                                i915_gem_object_unpin_map(bb->obj);

                        if (bb->vma && !IS_ERR(bb->vma)) {
                                i915_vma_unpin(bb->vma);
                                i915_vma_close(bb->vma);
                        }
                        __i915_gem_object_release_unless_active(bb->obj);
                }
                list_del(&bb->list);
                kfree(bb);
        }

        mutex_unlock(&dev_priv->drm.struct_mutex);
}

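/* Prepare a scanned workload for dispatch: pin the shadow PPGTT,
 * refresh the PDP roots, synchronize out-of-sync guest pages, flush
 * post-shadow PPGTT updates, allocate the i915 request, then pin the
 * shadow batch buffers and wa_ctx. Errors unwind in reverse order.
 */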
static int prepare_workload(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        int ret = 0;

        ret = intel_vgpu_pin_mm(workload->shadow_mm);
        if (ret) {
                gvt_vgpu_err("fail to vgpu pin mm\n");
                return ret;
        }

        update_shadow_pdps(workload);

        ret = intel_vgpu_sync_oos_pages(workload->vgpu);
        if (ret) {
                gvt_vgpu_err("fail to vgpu sync oos pages\n");
                goto err_unpin_mm;
        }

        ret = intel_vgpu_flush_post_shadow(workload->vgpu);
        if (ret) {
                gvt_vgpu_err("fail to flush post shadow\n");
                goto err_unpin_mm;
        }

        ret = intel_gvt_generate_request(workload);
        if (ret) {
                gvt_vgpu_err("fail to generate request\n");
                goto err_unpin_mm;
        }

        ret = prepare_shadow_batch_buffer(workload);
        if (ret) {
                gvt_vgpu_err("fail to prepare_shadow_batch_buffer\n");
                goto err_unpin_mm;
        }

        ret = prepare_shadow_wa_ctx(&workload->wa_ctx);
        if (ret) {
                gvt_vgpu_err("fail to prepare_shadow_wa_ctx\n");
                goto err_shadow_batch;
        }

        if (workload->prepare) {
                ret = workload->prepare(workload);
                if (ret)
                        goto err_shadow_wa_ctx;
        }

        return 0;
err_shadow_wa_ctx:
        release_shadow_wa_ctx(&workload->wa_ctx);
err_shadow_batch:
        release_shadow_batch_buffer(workload);
err_unpin_mm:
        intel_vgpu_unpin_mm(workload->shadow_mm);
        return ret;
}

static int dispatch_workload(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        int ring_id = workload->ring_id;
        struct intel_engine_cs *engine = dev_priv->engine[ring_id];
        int ret = 0;

        gvt_dbg_sched("ring id %d prepare to dispatch workload %p\n",
                ring_id, workload);

        mutex_lock(&dev_priv->drm.struct_mutex);

        ret = intel_gvt_scan_and_shadow_workload(workload);
        if (ret)
                goto out;

        ret = prepare_workload(workload);
        if (ret) {
                engine->context_unpin(engine, shadow_ctx);
                goto out;
        }

out:
        if (ret)
                workload->status = ret;

        if (!IS_ERR_OR_NULL(workload->req)) {
                gvt_dbg_sched("ring id %d submit workload to i915 %p\n",
                        ring_id, workload->req);
                i915_request_add(workload->req);
                workload->dispatched = true;
        }

        mutex_unlock(&dev_priv->drm.struct_mutex);
        return ret;
}

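/* Called from the per-engine workload thread: returns the next
 * workload for this engine, or NULL if the scheduler has no current
 * vgpu, is about to reschedule, or the queue is empty.
 */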
static struct intel_vgpu_workload *pick_next_workload(
                struct intel_gvt *gvt, int ring_id)
{
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct intel_vgpu_workload *workload = NULL;

        mutex_lock(&gvt->lock);

        /*
         * no current vgpu / will be scheduled out / no workload
         * bail out
         */
        if (!scheduler->current_vgpu) {
                gvt_dbg_sched("ring id %d stop - no current vgpu\n", ring_id);
                goto out;
        }

        if (scheduler->need_reschedule) {
                gvt_dbg_sched("ring id %d stop - will reschedule\n", ring_id);
                goto out;
        }

        if (list_empty(workload_q_head(scheduler->current_vgpu, ring_id)))
                goto out;

        /*
         * still have current workload, maybe the workload dispatcher
         * failed to submit it for some reason, resubmit it.
         */
        if (scheduler->current_workload[ring_id]) {
                workload = scheduler->current_workload[ring_id];
                gvt_dbg_sched("ring id %d still have current workload %p\n",
                                ring_id, workload);
                goto out;
        }

        /*
         * pick a workload as current workload
         * once current workload is set, schedule policy routines
         * will wait until the current workload is finished when trying
         * to schedule out a vgpu.
         */
        scheduler->current_workload[ring_id] = container_of(
                        workload_q_head(scheduler->current_vgpu, ring_id)->next,
                        struct intel_vgpu_workload, list);

        workload = scheduler->current_workload[ring_id];

        gvt_dbg_sched("ring id %d pick new workload %p\n", ring_id, workload);

        atomic_inc(&workload->vgpu->submission.running_workload_num);
out:
        mutex_unlock(&gvt->lock);
        return workload;
}

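/* Mirror image of populate_shadow_context(): once a workload has
 * completed on hardware, write the shadow context pages and the
 * tracked ring-context registers back into guest memory so the guest
 * sees the results of execution.
 */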
static void update_guest_context(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_gvt *gvt = vgpu->gvt;
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct i915_gem_context *shadow_ctx = s->shadow_ctx;
        int ring_id = workload->ring_id;
        struct drm_i915_gem_object *ctx_obj =
                shadow_ctx->engine[ring_id].state->obj;
        struct execlist_ring_context *shadow_ring_context;
        struct page *page;
        void *src;
        unsigned long context_gpa, context_page_num;
        int i;

        gvt_dbg_sched("ring id %d workload lrca %x\n", ring_id,
                        workload->ctx_desc.lrca);

        context_page_num = gvt->dev_priv->engine[ring_id]->context_size;

        context_page_num = context_page_num >> PAGE_SHIFT;

        if (IS_BROADWELL(gvt->dev_priv) && ring_id == RCS)
                context_page_num = 19;

        i = 2;

        while (i < context_page_num) {
                context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
                                (u32)((workload->ctx_desc.lrca + i) <<
                                        I915_GTT_PAGE_SHIFT));
                if (context_gpa == INTEL_GVT_INVALID_ADDR) {
                        gvt_vgpu_err("invalid guest context descriptor\n");
                        return;
                }

                page = i915_gem_object_get_page(ctx_obj, LRC_HEADER_PAGES + i);
                src = kmap(page);
                intel_gvt_hypervisor_write_gpa(vgpu, context_gpa, src,
                                I915_GTT_PAGE_SIZE);
                kunmap(page);
                i++;
        }

        intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa +
                RING_CTX_OFF(ring_header.val), &workload->rb_tail, 4);

        page = i915_gem_object_get_page(ctx_obj, LRC_STATE_PN);
        shadow_ring_context = kmap(page);

#define COPY_REG(name) \
        intel_gvt_hypervisor_write_gpa(vgpu, workload->ring_context_gpa + \
                RING_CTX_OFF(name.val), &shadow_ring_context->name.val, 4)

        COPY_REG(ctx_ctrl);
        COPY_REG(ctx_timestamp);

#undef COPY_REG

        intel_gvt_hypervisor_write_gpa(vgpu,
                        workload->ring_context_gpa +
                        sizeof(*shadow_ring_context),
                        (void *)shadow_ring_context +
                        sizeof(*shadow_ring_context),
                        I915_GTT_PAGE_SIZE - sizeof(*shadow_ring_context));

        kunmap(page);
}

static void clean_workloads(struct intel_vgpu *vgpu, unsigned long engine_mask)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        struct intel_engine_cs *engine;
        struct intel_vgpu_workload *pos, *n;
        unsigned int tmp;

        /* free the unsubmitted workloads in the queues. */
        for_each_engine_masked(engine, dev_priv, engine_mask, tmp) {
                list_for_each_entry_safe(pos, n,
                        &s->workload_q_head[engine->id], list) {
                        list_del_init(&pos->list);
                        intel_vgpu_destroy_workload(pos);
                }
                clear_bit(engine->id, s->shadow_ctx_desc_updated);
        }
}

static void complete_current_workload(struct intel_gvt *gvt, int ring_id)
{
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct intel_vgpu_workload *workload =
                scheduler->current_workload[ring_id];
        struct intel_vgpu *vgpu = workload->vgpu;
        struct intel_vgpu_submission *s = &vgpu->submission;
        int event;

        mutex_lock(&gvt->lock);

        /* For a workload w/ a request, we need to wait for the context
         * switch to make sure the request is completed.
         * For a workload w/o a request, directly complete the workload.
         */
        if (workload->req) {
                struct drm_i915_private *dev_priv =
                        workload->vgpu->gvt->dev_priv;
                struct intel_engine_cs *engine =
                        dev_priv->engine[workload->ring_id];
                wait_event(workload->shadow_ctx_status_wq,
                           !atomic_read(&workload->shadow_ctx_active));

                /* If this request caused a GPU hang, req->fence.error will
                 * be set to -EIO. Use -EIO as the workload status so that
                 * no context switch interrupt is triggered to the guest
                 * when the request caused a GPU hang.
                 */
                if (likely(workload->status == -EINPROGRESS)) {
                        if (workload->req->fence.error == -EIO)
                                workload->status = -EIO;
                        else
                                workload->status = 0;
                }

                i915_request_put(fetch_and_zero(&workload->req));

                if (!workload->status && !(vgpu->resetting_eng &
                                           ENGINE_MASK(ring_id))) {
                        update_guest_context(workload);

                        for_each_set_bit(event, workload->pending_events,
                                         INTEL_GVT_EVENT_MAX)
                                intel_vgpu_trigger_virtual_event(vgpu, event);
                }
                mutex_lock(&dev_priv->drm.struct_mutex);
                /* unpin shadow ctx as the shadow_ctx update is done */
                engine->context_unpin(engine, s->shadow_ctx);
                mutex_unlock(&dev_priv->drm.struct_mutex);
        }

        gvt_dbg_sched("ring id %d complete workload %p status %d\n",
                        ring_id, workload, workload->status);

        scheduler->current_workload[ring_id] = NULL;

        list_del_init(&workload->list);

        if (!workload->status) {
                release_shadow_batch_buffer(workload);
                release_shadow_wa_ctx(&workload->wa_ctx);
        }

        if (workload->status || (vgpu->resetting_eng & ENGINE_MASK(ring_id))) {
                /* If workload->status is not successful, it means the HW GPU
                 * hit a hang or something went wrong with i915/GVT, and GVT
                 * won't inject a context switch interrupt to the guest. So
                 * this error is actually a vGPU hang from the guest's point
                 * of view, and accordingly we should emulate a vGPU hang. If
                 * there are pending workloads which were already submitted
                 * from the guest, we should clean them up like the HW GPU
                 * does.
                 *
                 * If it is in the middle of an engine reset, the pending
                 * workloads won't be submitted to the HW GPU and will be
                 * cleaned up during the resetting process later, so doing
                 * the workload clean up here doesn't have any impact.
                 **/
                clean_workloads(vgpu, ENGINE_MASK(ring_id));
        }

        workload->complete(workload);

        atomic_dec(&s->running_workload_num);
        wake_up(&scheduler->workload_complete_wq);

        if (gvt->scheduler.need_reschedule)
                intel_gvt_request_service(gvt, INTEL_GVT_REQUEST_EVENT_SCHED);

        mutex_unlock(&gvt->lock);
}

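/* Each engine has a dedicated kthread, created in
 * intel_gvt_init_workload_scheduler() below, that sleeps until a
 * workload is queued, dispatches it, waits for the i915 request to
 * complete and then completes the workload.
 */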
struct workload_thread_param {
        struct intel_gvt *gvt;
        int ring_id;
};

static int workload_thread(void *priv)
{
        struct workload_thread_param *p = (struct workload_thread_param *)priv;
        struct intel_gvt *gvt = p->gvt;
        int ring_id = p->ring_id;
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct intel_vgpu_workload *workload = NULL;
        struct intel_vgpu *vgpu = NULL;
        int ret;
        bool need_force_wake = IS_SKYLAKE(gvt->dev_priv)
                        || IS_KABYLAKE(gvt->dev_priv);
        DEFINE_WAIT_FUNC(wait, woken_wake_function);

        kfree(p);

        gvt_dbg_core("workload thread for ring %d started\n", ring_id);

        while (!kthread_should_stop()) {
                add_wait_queue(&scheduler->waitq[ring_id], &wait);
                do {
                        workload = pick_next_workload(gvt, ring_id);
                        if (workload)
                                break;
                        wait_woken(&wait, TASK_INTERRUPTIBLE,
                                   MAX_SCHEDULE_TIMEOUT);
                } while (!kthread_should_stop());
                remove_wait_queue(&scheduler->waitq[ring_id], &wait);

                if (!workload)
                        break;

                gvt_dbg_sched("ring id %d next workload %p vgpu %d\n",
                                workload->ring_id, workload,
                                workload->vgpu->id);

                intel_runtime_pm_get(gvt->dev_priv);

                gvt_dbg_sched("ring id %d will dispatch workload %p\n",
                                workload->ring_id, workload);

                if (need_force_wake)
                        intel_uncore_forcewake_get(gvt->dev_priv,
                                        FORCEWAKE_ALL);

                mutex_lock(&gvt->lock);
                ret = dispatch_workload(workload);
                mutex_unlock(&gvt->lock);

                if (ret) {
                        vgpu = workload->vgpu;
                        gvt_vgpu_err("fail to dispatch workload, skip\n");
                        goto complete;
                }

                gvt_dbg_sched("ring id %d wait workload %p\n",
                                workload->ring_id, workload);
                i915_request_wait(workload->req, 0, MAX_SCHEDULE_TIMEOUT);

complete:
                gvt_dbg_sched("will complete workload %p, status: %d\n",
                                workload, workload->status);

                complete_current_workload(gvt, ring_id);

                if (need_force_wake)
                        intel_uncore_forcewake_put(gvt->dev_priv,
                                        FORCEWAKE_ALL);

                intel_runtime_pm_put(gvt->dev_priv);
                if (ret && (vgpu_is_vm_unhealthy(ret)))
                        enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
        }
        return 0;
}

void intel_gvt_wait_vgpu_idle(struct intel_vgpu *vgpu)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct intel_gvt *gvt = vgpu->gvt;
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;

        if (atomic_read(&s->running_workload_num)) {
                gvt_dbg_sched("wait vgpu idle\n");

                wait_event(scheduler->workload_complete_wq,
                           !atomic_read(&s->running_workload_num));
        }
}

void intel_gvt_clean_workload_scheduler(struct intel_gvt *gvt)
{
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct intel_engine_cs *engine;
        enum intel_engine_id i;

        gvt_dbg_core("clean workload scheduler\n");

        for_each_engine(engine, gvt->dev_priv, i) {
                atomic_notifier_chain_unregister(
                                &engine->context_status_notifier,
                                &gvt->shadow_ctx_notifier_block[i]);
                kthread_stop(scheduler->thread[i]);
        }
}

int intel_gvt_init_workload_scheduler(struct intel_gvt *gvt)
{
        struct intel_gvt_workload_scheduler *scheduler = &gvt->scheduler;
        struct workload_thread_param *param = NULL;
        struct intel_engine_cs *engine;
        enum intel_engine_id i;
        int ret;

        gvt_dbg_core("init workload scheduler\n");

        init_waitqueue_head(&scheduler->workload_complete_wq);

        for_each_engine(engine, gvt->dev_priv, i) {
                init_waitqueue_head(&scheduler->waitq[i]);

                param = kzalloc(sizeof(*param), GFP_KERNEL);
                if (!param) {
                        ret = -ENOMEM;
                        goto err;
                }

                param->gvt = gvt;
                param->ring_id = i;

                scheduler->thread[i] = kthread_run(workload_thread, param,
                        "gvt workload %d", i);
                if (IS_ERR(scheduler->thread[i])) {
                        gvt_err("fail to create workload thread\n");
                        ret = PTR_ERR(scheduler->thread[i]);
                        goto err;
                }

                gvt->shadow_ctx_notifier_block[i].notifier_call =
                                        shadow_context_status_change;
                atomic_notifier_chain_register(&engine->context_status_notifier,
                                        &gvt->shadow_ctx_notifier_block[i]);
        }
        return 0;
err:
        intel_gvt_clean_workload_scheduler(gvt);
        kfree(param);
        param = NULL;
        return ret;
}

/**
 * intel_vgpu_clean_submission - free submission-related resources for a vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being destroyed.
 *
 */
void intel_vgpu_clean_submission(struct intel_vgpu *vgpu)
{
        struct intel_vgpu_submission *s = &vgpu->submission;

        intel_vgpu_select_submission_ops(vgpu, ALL_ENGINES, 0);
        i915_gem_context_put(s->shadow_ctx);
        kmem_cache_destroy(s->workloads);
}

/**
 * intel_vgpu_reset_submission - reset submission-related resources for a vGPU
 * @vgpu: a vGPU
 * @engine_mask: engines expected to be reset
 *
 * This function is called when a vGPU is being reset.
 *
 */
void intel_vgpu_reset_submission(struct intel_vgpu *vgpu,
                unsigned long engine_mask)
{
        struct intel_vgpu_submission *s = &vgpu->submission;

        if (!s->active)
                return;

        clean_workloads(vgpu, engine_mask);
        s->ops->reset(vgpu, engine_mask);
}

/**
 * intel_vgpu_setup_submission - setup submission-related resources for a vGPU
 * @vgpu: a vGPU
 *
 * This function is called when a vGPU is being created.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_setup_submission(struct intel_vgpu *vgpu)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        enum intel_engine_id i;
        struct intel_engine_cs *engine;
        int ret;

        s->shadow_ctx = i915_gem_context_create_gvt(
                        &vgpu->gvt->dev_priv->drm);
        if (IS_ERR(s->shadow_ctx))
                return PTR_ERR(s->shadow_ctx);

        if (HAS_LOGICAL_RING_PREEMPTION(vgpu->gvt->dev_priv))
                s->shadow_ctx->priority = INT_MAX;

        bitmap_zero(s->shadow_ctx_desc_updated, I915_NUM_ENGINES);

        s->workloads = kmem_cache_create("gvt-g_vgpu_workload",
                        sizeof(struct intel_vgpu_workload), 0,
                        SLAB_HWCACHE_ALIGN,
                        NULL);

        if (!s->workloads) {
                ret = -ENOMEM;
                goto out_shadow_ctx;
        }

        for_each_engine(engine, vgpu->gvt->dev_priv, i)
                INIT_LIST_HEAD(&s->workload_q_head[i]);

        atomic_set(&s->running_workload_num, 0);
        bitmap_zero(s->tlb_handle_pending, I915_NUM_ENGINES);

        return 0;

out_shadow_ctx:
        i915_gem_context_put(s->shadow_ctx);
        return ret;
}

/**
 * intel_vgpu_select_submission_ops - select virtual submission interface
 * @vgpu: a vGPU
 * @engine_mask: the engines the interface change applies to
 * @interface: expected vGPU virtual submission interface
 *
 * This function is called when a guest configures the submission interface.
 *
 * Returns:
 * Zero on success, negative error code if failed.
 *
 */
int intel_vgpu_select_submission_ops(struct intel_vgpu *vgpu,
                                     unsigned long engine_mask,
                                     unsigned int interface)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        const struct intel_vgpu_submission_ops *ops[] = {
                [INTEL_VGPU_EXECLIST_SUBMISSION] =
                        &intel_vgpu_execlist_submission_ops,
        };
        int ret;

        if (WARN_ON(interface >= ARRAY_SIZE(ops)))
                return -EINVAL;

        if (WARN_ON(interface == 0 && engine_mask != ALL_ENGINES))
                return -EINVAL;

        if (s->active)
                s->ops->clean(vgpu, engine_mask);

        if (interface == 0) {
                s->ops = NULL;
                s->virtual_submission_interface = 0;
                s->active = false;
                gvt_dbg_core("vgpu%d: remove submission ops\n", vgpu->id);
                return 0;
        }

        ret = ops[interface]->init(vgpu, engine_mask);
        if (ret)
                return ret;

        s->ops = ops[interface];
        s->virtual_submission_interface = interface;
        s->active = true;

        gvt_dbg_core("vgpu%d: activate ops [ %s ]\n",
                        vgpu->id, s->ops->name);

        return 0;
}

/**
 * intel_vgpu_destroy_workload - destroy a vGPU workload
 * @workload: the vGPU workload to destroy
 *
 * This function is called when destroying a vGPU workload.
 *
 */
void intel_vgpu_destroy_workload(struct intel_vgpu_workload *workload)
{
        struct intel_vgpu_submission *s = &workload->vgpu->submission;

        if (workload->shadow_mm)
                intel_vgpu_mm_put(workload->shadow_mm);

        kmem_cache_free(s->workloads, workload);
}

static struct intel_vgpu_workload *
alloc_workload(struct intel_vgpu *vgpu)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct intel_vgpu_workload *workload;

        workload = kmem_cache_zalloc(s->workloads, GFP_KERNEL);
        if (!workload)
                return ERR_PTR(-ENOMEM);

        INIT_LIST_HEAD(&workload->list);
        INIT_LIST_HEAD(&workload->shadow_bb);

        init_waitqueue_head(&workload->shadow_ctx_status_wq);
        atomic_set(&workload->shadow_ctx_active, 0);

        workload->status = -EINPROGRESS;
        workload->shadowed = false;
        workload->vgpu = vgpu;

        return workload;
}

#define RING_CTX_OFF(x) \
        offsetof(struct execlist_ring_context, x)

static void read_guest_pdps(struct intel_vgpu *vgpu,
                u64 ring_context_gpa, u32 pdp[8])
{
        u64 gpa;
        int i;

        gpa = ring_context_gpa + RING_CTX_OFF(pdp3_UDW.val);

        for (i = 0; i < 8; i++)
                intel_gvt_hypervisor_read_gpa(vgpu,
                                gpa + i * 8, &pdp[7 - i], 4);
}

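/* The addressing mode in the context descriptor selects the guest
 * PPGTT layout: mode 1 is the legacy 32-bit layout rooted in four L3
 * PDP entries, mode 3 is the legacy 64-bit layout rooted in a single
 * L4 (PML4) entry. Advanced (SVM) mode is rejected.
 */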
static int prepare_mm(struct intel_vgpu_workload *workload)
{
        struct execlist_ctx_descriptor_format *desc = &workload->ctx_desc;
        struct intel_vgpu_mm *mm;
        struct intel_vgpu *vgpu = workload->vgpu;
        intel_gvt_gtt_type_t root_entry_type;
        u64 pdps[GVT_RING_CTX_NR_PDPS];

        switch (desc->addressing_mode) {
        case 1: /* legacy 32-bit */
                root_entry_type = GTT_TYPE_PPGTT_ROOT_L3_ENTRY;
                break;
        case 3: /* legacy 64-bit */
                root_entry_type = GTT_TYPE_PPGTT_ROOT_L4_ENTRY;
                break;
        default:
                gvt_vgpu_err("Advanced Context mode(SVM) is not supported!\n");
                return -EINVAL;
        }

        read_guest_pdps(workload->vgpu, workload->ring_context_gpa, (void *)pdps);

        mm = intel_vgpu_get_ppgtt_mm(workload->vgpu, root_entry_type, pdps);
        if (IS_ERR(mm))
                return PTR_ERR(mm);

        workload->shadow_mm = mm;
        return 0;
}

#define same_context(a, b) (((a)->context_id == (b)->context_id) && \
                ((a)->lrca == (b)->lrca))

#define get_last_workload(q) \
        (list_empty(q) ? NULL : container_of(q->prev, \
        struct intel_vgpu_workload, list))
/**
 * intel_vgpu_create_workload - create a vGPU workload
 * @vgpu: a vGPU
 * @ring_id: the ring the workload is queued on
 * @desc: a guest context descriptor
 *
 * This function is called when creating a vGPU workload.
 *
 * Returns:
 * struct intel_vgpu_workload * on success, negative error code in
 * pointer if failed.
 *
 */
struct intel_vgpu_workload *
intel_vgpu_create_workload(struct intel_vgpu *vgpu, int ring_id,
                           struct execlist_ctx_descriptor_format *desc)
{
        struct intel_vgpu_submission *s = &vgpu->submission;
        struct list_head *q = workload_q_head(vgpu, ring_id);
        struct intel_vgpu_workload *last_workload = get_last_workload(q);
        struct intel_vgpu_workload *workload = NULL;
        struct drm_i915_private *dev_priv = vgpu->gvt->dev_priv;
        u64 ring_context_gpa;
        u32 head, tail, start, ctl, ctx_ctl, per_ctx, indirect_ctx;
        int ret;

        ring_context_gpa = intel_vgpu_gma_to_gpa(vgpu->gtt.ggtt_mm,
                        (u32)((desc->lrca + 1) << I915_GTT_PAGE_SHIFT));
        if (ring_context_gpa == INTEL_GVT_INVALID_ADDR) {
                gvt_vgpu_err("invalid guest context LRCA: %x\n", desc->lrca);
                return ERR_PTR(-EINVAL);
        }

        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(ring_header.val), &head, 4);

        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(ring_tail.val), &tail, 4);

        head &= RB_HEAD_OFF_MASK;
        tail &= RB_TAIL_OFF_MASK;

        if (last_workload && same_context(&last_workload->ctx_desc, desc)) {
                gvt_dbg_el("ring id %d cur workload == last\n", ring_id);
                gvt_dbg_el("ctx head %x real head %lx\n", head,
                                last_workload->rb_tail);
                /*
                 * cannot use guest context head pointer here,
                 * as it might not be updated at this time
                 */
                head = last_workload->rb_tail;
        }

        gvt_dbg_el("ring id %d begin a new workload\n", ring_id);

        /* record some ring buffer register values for scan and shadow */
        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(rb_start.val), &start, 4);
        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(rb_ctrl.val), &ctl, 4);
        intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(ctx_ctrl.val), &ctx_ctl, 4);

        workload = alloc_workload(vgpu);
        if (IS_ERR(workload))
                return workload;

        workload->ring_id = ring_id;
        workload->ctx_desc = *desc;
        workload->ring_context_gpa = ring_context_gpa;
        workload->rb_head = head;
        workload->rb_tail = tail;
        workload->rb_start = start;
        workload->rb_ctl = ctl;

        if (ring_id == RCS) {
                intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(bb_per_ctx_ptr.val), &per_ctx, 4);
                intel_gvt_hypervisor_read_gpa(vgpu, ring_context_gpa +
                        RING_CTX_OFF(rcs_indirect_ctx.val), &indirect_ctx, 4);

                workload->wa_ctx.indirect_ctx.guest_gma =
                        indirect_ctx & INDIRECT_CTX_ADDR_MASK;
                workload->wa_ctx.indirect_ctx.size =
                        (indirect_ctx & INDIRECT_CTX_SIZE_MASK) *
                        CACHELINE_BYTES;
                workload->wa_ctx.per_ctx.guest_gma =
                        per_ctx & PER_CTX_ADDR_MASK;
                workload->wa_ctx.per_ctx.valid = per_ctx & 1;
        }

        gvt_dbg_el("workload %p ring id %d head %x tail %x start %x ctl %x\n",
                        workload, ring_id, head, tail, start, ctl);

        ret = prepare_mm(workload);
        if (ret) {
                kmem_cache_free(s->workloads, workload);
                return ERR_PTR(ret);
        }

        /* Only scan and shadow the first workload in the queue
         * as there is only one pre-allocated buf-obj for shadow.
         */
        if (list_empty(workload_q_head(vgpu, ring_id))) {
                intel_runtime_pm_get(dev_priv);
                mutex_lock(&dev_priv->drm.struct_mutex);
                ret = intel_gvt_scan_and_shadow_workload(workload);
                mutex_unlock(&dev_priv->drm.struct_mutex);
                intel_runtime_pm_put(dev_priv);
        }

        if (ret && (vgpu_is_vm_unhealthy(ret))) {
                enter_failsafe_mode(vgpu, GVT_FAILSAFE_GUEST_ERR);
                intel_vgpu_destroy_workload(workload);
                return ERR_PTR(ret);
        }

        return workload;
}

/**
 * intel_vgpu_queue_workload - queue a vGPU workload
 * @workload: the workload to queue in
 */
void intel_vgpu_queue_workload(struct intel_vgpu_workload *workload)
{
        list_add_tail(&workload->list,
                workload_q_head(workload->vgpu, workload->ring_id));
        intel_gvt_kick_schedule(workload->vgpu->gvt);
        wake_up(&workload->vgpu->gvt->scheduler.waitq[workload->ring_id]);
}