Blame - drivers/gpu/drm/i915/i915_gem.c - kernel/msm-5.4

blob: c3d6507063299a114b126d50075280f101fc2334 [file] [log] [blame]

Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1	/*
Daniel Vetter	be6a037	2015-03-18 10:46:04 +0100	[diff] [blame]	2	* Copyright © 2008-2015 Intel Corporation
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3	*
				4	* Permission is hereby granted, free of charge, to any person obtaining a
				5	* copy of this software and associated documentation files (the "Software"),
				6	* to deal in the Software without restriction, including without limitation
				7	* the rights to use, copy, modify, merge, publish, distribute, sublicense,
				8	* and/or sell copies of the Software, and to permit persons to whom the
				9	* Software is furnished to do so, subject to the following conditions:
				10	*
				11	* The above copyright notice and this permission notice (including the next
				12	* paragraph) shall be included in all copies or substantial portions of the
				13	* Software.
				14	*
				15	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				16	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				17	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
				18	* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				19	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
				20	* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
				21	* IN THE SOFTWARE.
				22	*
				23	* Authors:
				24	* Eric Anholt <eric@anholt.net>
				25	*
				26	*/
				27
David Howells	760285e	2012-10-02 18:01:07 +0100	[diff] [blame]	28	#include <drm/drmP.h>
David Herrmann	0de2397	2013-07-24 21:07:52 +0200	[diff] [blame]	29	#include <drm/drm_vma_manager.h>
David Howells	760285e	2012-10-02 18:01:07 +0100	[diff] [blame]	30	#include <drm/i915_drm.h>
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	31	#include "i915_drv.h"
Chris Wilson	57822dc	2017-02-22 11:40:48 +0000	[diff] [blame]	32	#include "i915_gem_clflush.h"
Yu Zhang	eb82289	2015-02-10 19:05:49 +0800	[diff] [blame]	33	#include "i915_vgpu.h"
Chris Wilson	1c5d22f	2009-08-25 11:15:50 +0100	[diff] [blame]	34	#include "i915_trace.h"
Jesse Barnes	652c393	2009-08-17 13:31:43 -0700	[diff] [blame]	35	#include "intel_drv.h"
Chris Wilson	5d723d7	2016-08-04 16:32:35 +0100	[diff] [blame]	36	#include "intel_frontbuffer.h"
Peter Antoine	0ccdacf	2016-04-13 15:03:25 +0100	[diff] [blame]	37	#include "intel_mocs.h"
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	38	#include "i915_gemfs.h"
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	39	#include <linux/dma-fence-array.h>
Chris Wilson	fe3288b	2017-02-12 17:20:01 +0000	[diff] [blame]	40	#include <linux/kthread.h>
Chris Wilson	c13d87e	2016-07-20 09:21:15 +0100	[diff] [blame]	41	#include <linux/reservation.h>
Hugh Dickins	5949eac	2011-06-27 16:18:18 -0700	[diff] [blame]	42	#include <linux/shmem_fs.h>
Tejun Heo	5a0e3ad	2010-03-24 17:04:11 +0900	[diff] [blame]	43	#include <linux/slab.h>
Chris Wilson	20e4933	2016-11-22 14:41:21 +0000	[diff] [blame]	44	#include <linux/stop_machine.h>
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	45	#include <linux/swap.h>
Jesse Barnes	79e5394	2008-11-07 14:24:08 -0800	[diff] [blame]	46	#include <linux/pci.h>
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	47	#include <linux/dma-buf.h>
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	48
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	49	static void i915_gem_flush_free_objects(struct drm_i915_private *i915);
Chris Wilson	6105080	2012-04-17 15:31:31 +0100	[diff] [blame]	50
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	51	static bool cpu_write_needs_clflush(struct drm_i915_gem_object *obj)
				52	{
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	53	if (obj->cache_dirty)
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	54	return false;
				55
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	56	if (!(obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_WRITE))
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	57	return true;
				58
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	59	return obj->pin_global; /* currently in use by HW, keep flushed */
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	60	}
				61
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	62	static int
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	63	insert_mappable_node(struct i915_ggtt *ggtt,
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	64	struct drm_mm_node *node, u32 size)
				65	{
				66	memset(node, 0, sizeof(*node));
Chris Wilson	4e64e55	2017-02-02 21:04:38 +0000	[diff] [blame]	67	return drm_mm_insert_node_in_range(&ggtt->base.mm, node,
				68	size, 0, I915_COLOR_UNEVICTABLE,
				69	0, ggtt->mappable_end,
				70	DRM_MM_INSERT_LOW);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	71	}
				72
				73	static void
				74	remove_mappable_node(struct drm_mm_node *node)
				75	{
				76	drm_mm_remove_node(node);
				77	}
				78
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	79	/* some bookkeeping */
				80	static void i915_gem_info_add_obj(struct drm_i915_private *dev_priv,
Chris Wilson	3ef7f22	2016-10-18 13:02:48 +0100	[diff] [blame]	81	u64 size)
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	82	{
Daniel Vetter	c20e835	2013-07-24 22:40:23 +0200	[diff] [blame]	83	spin_lock(&dev_priv->mm.object_stat_lock);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	84	dev_priv->mm.object_count++;
				85	dev_priv->mm.object_memory += size;
Daniel Vetter	c20e835	2013-07-24 22:40:23 +0200	[diff] [blame]	86	spin_unlock(&dev_priv->mm.object_stat_lock);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	87	}
				88
				89	static void i915_gem_info_remove_obj(struct drm_i915_private *dev_priv,
Chris Wilson	3ef7f22	2016-10-18 13:02:48 +0100	[diff] [blame]	90	u64 size)
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	91	{
Daniel Vetter	c20e835	2013-07-24 22:40:23 +0200	[diff] [blame]	92	spin_lock(&dev_priv->mm.object_stat_lock);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	93	dev_priv->mm.object_count--;
				94	dev_priv->mm.object_memory -= size;
Daniel Vetter	c20e835	2013-07-24 22:40:23 +0200	[diff] [blame]	95	spin_unlock(&dev_priv->mm.object_stat_lock);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	96	}
				97
Chris Wilson	21dd373	2011-01-26 15:55:56 +0000	[diff] [blame]	98	static int
Daniel Vetter	33196de	2012-11-14 17:14:05 +0100	[diff] [blame]	99	i915_gem_wait_for_error(struct i915_gpu_error *error)
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	100	{
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	101	int ret;
				102
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	103	might_sleep();
				104
Daniel Vetter	0a6759c	2012-07-04 22:18:41 +0200	[diff] [blame]	105	/*
				106	* Only wait 10 seconds for the gpu reset to complete to avoid hanging
				107	* userspace. If it takes that long something really bad is going on and
				108	* we should simply try to bail out and fail as gracefully as possible.
				109	*/
Daniel Vetter	1f83fee	2012-11-15 17:17:22 +0100	[diff] [blame]	110	ret = wait_event_interruptible_timeout(error->reset_queue,
Chris Wilson	8c185ec	2017-03-16 17:13:02 +0000	[diff] [blame]	111	!i915_reset_backoff(error),
Chris Wilson	b52992c	2016-10-28 13:58:24 +0100	[diff] [blame]	112	I915_RESET_TIMEOUT);
Daniel Vetter	0a6759c	2012-07-04 22:18:41 +0200	[diff] [blame]	113	if (ret == 0) {
				114	DRM_ERROR("Timed out waiting for the gpu reset to complete\n");
				115	return -EIO;
				116	} else if (ret < 0) {
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	117	return ret;
Chris Wilson	d98c52c	2016-04-13 17:35:05 +0100	[diff] [blame]	118	} else {
				119	return 0;
Daniel Vetter	0a6759c	2012-07-04 22:18:41 +0200	[diff] [blame]	120	}
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	121	}
				122
Chris Wilson	54cf91d	2010-11-25 18:00:26 +0000	[diff] [blame]	123	int i915_mutex_lock_interruptible(struct drm_device *dev)
Chris Wilson	76c1dec	2010-09-25 11:22:51 +0100	[diff] [blame]	124	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	125	struct drm_i915_private *dev_priv = to_i915(dev);
Chris Wilson	76c1dec	2010-09-25 11:22:51 +0100	[diff] [blame]	126	int ret;
				127
Daniel Vetter	33196de	2012-11-14 17:14:05 +0100	[diff] [blame]	128	ret = i915_gem_wait_for_error(&dev_priv->gpu_error);
Chris Wilson	76c1dec	2010-09-25 11:22:51 +0100	[diff] [blame]	129	if (ret)
				130	return ret;
				131
				132	ret = mutex_lock_interruptible(&dev->struct_mutex);
				133	if (ret)
				134	return ret;
				135
Chris Wilson	76c1dec	2010-09-25 11:22:51 +0100	[diff] [blame]	136	return 0;
				137	}
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	138
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	139	int
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	140	i915_gem_get_aperture_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	141	struct drm_file *file)
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	142	{
Joonas Lahtinen	72e96d6	2016-03-30 16:57:10 +0300	[diff] [blame]	143	struct drm_i915_private *dev_priv = to_i915(dev);
Joonas Lahtinen	62106b4	2016-03-18 10:42:57 +0200	[diff] [blame]	144	struct i915_ggtt *ggtt = &dev_priv->ggtt;
Joonas Lahtinen	72e96d6	2016-03-30 16:57:10 +0300	[diff] [blame]	145	struct drm_i915_gem_get_aperture *args = data;
Tvrtko Ursulin	ca1543b	2015-07-01 11:51:10 +0100	[diff] [blame]	146	struct i915_vma *vma;
Weinan Li	ff8f797	2017-05-31 10:35:52 +0800	[diff] [blame]	147	u64 pinned;
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	148
Weinan Li	ff8f797	2017-05-31 10:35:52 +0800	[diff] [blame]	149	pinned = ggtt->base.reserved;
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	150	mutex_lock(&dev->struct_mutex);
Chris Wilson	1c7f4bc	2016-02-26 11:03:19 +0000	[diff] [blame]	151	list_for_each_entry(vma, &ggtt->base.active_list, vm_link)
Chris Wilson	20dfbde	2016-08-04 16:32:30 +0100	[diff] [blame]	152	if (i915_vma_is_pinned(vma))
Tvrtko Ursulin	ca1543b	2015-07-01 11:51:10 +0100	[diff] [blame]	153	pinned += vma->node.size;
Chris Wilson	1c7f4bc	2016-02-26 11:03:19 +0000	[diff] [blame]	154	list_for_each_entry(vma, &ggtt->base.inactive_list, vm_link)
Chris Wilson	20dfbde	2016-08-04 16:32:30 +0100	[diff] [blame]	155	if (i915_vma_is_pinned(vma))
Tvrtko Ursulin	ca1543b	2015-07-01 11:51:10 +0100	[diff] [blame]	156	pinned += vma->node.size;
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	157	mutex_unlock(&dev->struct_mutex);
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	158
Joonas Lahtinen	72e96d6	2016-03-30 16:57:10 +0300	[diff] [blame]	159	args->aper_size = ggtt->base.total;
Akshay Joshi	0206e35	2011-08-16 15:34:10 -0400	[diff] [blame]	160	args->aper_available_size = args->aper_size - pinned;
Chris Wilson	6299f99	2010-11-24 12:23:44 +0000	[diff] [blame]	161
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	162	return 0;
				163	}
				164
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	165	static int i915_gem_object_get_pages_phys(struct drm_i915_gem_object *obj)
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	166	{
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	167	struct address_space *mapping = obj->base.filp->f_mapping;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	168	drm_dma_handle_t *phys;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	169	struct sg_table *st;
				170	struct scatterlist *sg;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	171	char *vaddr;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	172	int i;
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	173	int err;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	174
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	175	if (WARN_ON(i915_gem_object_needs_bit17_swizzle(obj)))
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	176	return -EINVAL;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	177
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	178	/* Always aligning to the object size, allows a single allocation
				179	* to handle all possible callers, and given typical object sizes,
				180	* the alignment of the buddy allocation will naturally match.
				181	*/
				182	phys = drm_pci_alloc(obj->base.dev,
Ville Syrjälä	750fae2	2017-09-07 17:32:03 +0300	[diff] [blame]	183	roundup_pow_of_two(obj->base.size),
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	184	roundup_pow_of_two(obj->base.size));
				185	if (!phys)
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	186	return -ENOMEM;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	187
				188	vaddr = phys->vaddr;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	189	for (i = 0; i < obj->base.size / PAGE_SIZE; i++) {
				190	struct page *page;
				191	char *src;
				192
				193	page = shmem_read_mapping_page(mapping, i);
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	194	if (IS_ERR(page)) {
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	195	err = PTR_ERR(page);
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	196	goto err_phys;
				197	}
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	198
				199	src = kmap_atomic(page);
				200	memcpy(vaddr, src, PAGE_SIZE);
				201	drm_clflush_virt_range(vaddr, PAGE_SIZE);
				202	kunmap_atomic(src);
				203
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	204	put_page(page);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	205	vaddr += PAGE_SIZE;
				206	}
				207
Chris Wilson	c033666	2016-05-06 15:40:21 +0100	[diff] [blame]	208	i915_gem_chipset_flush(to_i915(obj->base.dev));
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	209
				210	st = kmalloc(sizeof(*st), GFP_KERNEL);
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	211	if (!st) {
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	212	err = -ENOMEM;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	213	goto err_phys;
				214	}
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	215
				216	if (sg_alloc_table(st, 1, GFP_KERNEL)) {
				217	kfree(st);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	218	err = -ENOMEM;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	219	goto err_phys;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	220	}
				221
				222	sg = st->sgl;
				223	sg->offset = 0;
				224	sg->length = obj->base.size;
				225
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	226	sg_dma_address(sg) = phys->busaddr;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	227	sg_dma_len(sg) = obj->base.size;
				228
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	229	obj->phys_handle = phys;
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	230
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	231	__i915_gem_object_set_pages(obj, st, sg->length);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	232
				233	return 0;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	234
				235	err_phys:
				236	drm_pci_free(obj->base.dev, phys);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	237
				238	return err;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	239	}
				240
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	241	static void __start_cpu_write(struct drm_i915_gem_object *obj)
				242	{
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	243	obj->read_domains = I915_GEM_DOMAIN_CPU;
				244	obj->write_domain = I915_GEM_DOMAIN_CPU;
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	245	if (cpu_write_needs_clflush(obj))
				246	obj->cache_dirty = true;
				247	}
				248
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	249	static void
Chris Wilson	2b3c831	2016-11-11 14:58:09 +0000	[diff] [blame]	250	__i915_gem_object_release_shmem(struct drm_i915_gem_object *obj,
Chris Wilson	e5facdf	2016-12-23 14:57:57 +0000	[diff] [blame]	251	struct sg_table *pages,
				252	bool needs_clflush)
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	253	{
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	254	GEM_BUG_ON(obj->mm.madv == __I915_MADV_PURGED);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	255
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	256	if (obj->mm.madv == I915_MADV_DONTNEED)
				257	obj->mm.dirty = false;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	258
Chris Wilson	e5facdf	2016-12-23 14:57:57 +0000	[diff] [blame]	259	if (needs_clflush &&
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	260	(obj->read_domains & I915_GEM_DOMAIN_CPU) == 0 &&
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	261	!(obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_READ))
Chris Wilson	2b3c831	2016-11-11 14:58:09 +0000	[diff] [blame]	262	drm_clflush_sg(pages);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	263
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	264	__start_cpu_write(obj);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	265	}
				266
				267	static void
				268	i915_gem_object_put_pages_phys(struct drm_i915_gem_object *obj,
				269	struct sg_table *pages)
				270	{
Chris Wilson	e5facdf	2016-12-23 14:57:57 +0000	[diff] [blame]	271	__i915_gem_object_release_shmem(obj, pages, false);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	272
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	273	if (obj->mm.dirty) {
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	274	struct address_space *mapping = obj->base.filp->f_mapping;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	275	char *vaddr = obj->phys_handle->vaddr;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	276	int i;
				277
				278	for (i = 0; i < obj->base.size / PAGE_SIZE; i++) {
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	279	struct page *page;
				280	char *dst;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	281
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	282	page = shmem_read_mapping_page(mapping, i);
				283	if (IS_ERR(page))
				284	continue;
				285
				286	dst = kmap_atomic(page);
				287	drm_clflush_virt_range(vaddr, PAGE_SIZE);
				288	memcpy(dst, vaddr, PAGE_SIZE);
				289	kunmap_atomic(dst);
				290
				291	set_page_dirty(page);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	292	if (obj->mm.madv == I915_MADV_WILLNEED)
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	293	mark_page_accessed(page);
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	294	put_page(page);
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	295	vaddr += PAGE_SIZE;
				296	}
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	297	obj->mm.dirty = false;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	298	}
				299
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	300	sg_free_table(pages);
				301	kfree(pages);
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	302
				303	drm_pci_free(obj->base.dev, obj->phys_handle);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	304	}
				305
				306	static void
				307	i915_gem_object_release_phys(struct drm_i915_gem_object *obj)
				308	{
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	309	i915_gem_object_unpin_pages(obj);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	310	}
				311
				312	static const struct drm_i915_gem_object_ops i915_gem_phys_ops = {
				313	.get_pages = i915_gem_object_get_pages_phys,
				314	.put_pages = i915_gem_object_put_pages_phys,
				315	.release = i915_gem_object_release_phys,
				316	};
				317
Chris Wilson	581ab1f	2017-02-15 16:39:00 +0000	[diff] [blame]	318	static const struct drm_i915_gem_object_ops i915_gem_object_ops;
				319
Chris Wilson	35a9611	2016-08-14 18:44:40 +0100	[diff] [blame]	320	int i915_gem_object_unbind(struct drm_i915_gem_object *obj)
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	321	{
				322	struct i915_vma *vma;
				323	LIST_HEAD(still_in_list);
Chris Wilson	02bef8f	2016-08-14 18:44:41 +0100	[diff] [blame]	324	int ret;
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	325
Chris Wilson	02bef8f	2016-08-14 18:44:41 +0100	[diff] [blame]	326	lockdep_assert_held(&obj->base.dev->struct_mutex);
				327
				328	/* Closed vma are removed from the obj->vma_list - but they may
				329	* still have an active binding on the object. To remove those we
				330	* must wait for all rendering to complete to the object (as unbinding
				331	* must anyway), and retire the requests.
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	332	*/
Chris Wilson	5888fc9	2017-12-04 13:25:13 +0000	[diff] [blame]	333	ret = i915_gem_object_set_to_cpu_domain(obj, false);
Chris Wilson	02bef8f	2016-08-14 18:44:41 +0100	[diff] [blame]	334	if (ret)
				335	return ret;
				336
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	337	while ((vma = list_first_entry_or_null(&obj->vma_list,
				338	struct i915_vma,
				339	obj_link))) {
				340	list_move_tail(&vma->obj_link, &still_in_list);
				341	ret = i915_vma_unbind(vma);
				342	if (ret)
				343	break;
				344	}
				345	list_splice(&still_in_list, &obj->vma_list);
				346
				347	return ret;
				348	}
				349
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	350	static long
				351	i915_gem_object_wait_fence(struct dma_fence *fence,
				352	unsigned int flags,
				353	long timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	354	struct intel_rps_client *rps_client)
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	355	{
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	356	struct i915_request *rq;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	357
				358	BUILD_BUG_ON(I915_WAIT_INTERRUPTIBLE != 0x1);
				359
				360	if (test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &fence->flags))
				361	return timeout;
				362
				363	if (!dma_fence_is_i915(fence))
				364	return dma_fence_wait_timeout(fence,
				365	flags & I915_WAIT_INTERRUPTIBLE,
				366	timeout);
				367
				368	rq = to_request(fence);
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	369	if (i915_request_completed(rq))
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	370	goto out;
				371
Chris Wilson	e9af4ea	2018-01-18 13:16:09 +0000	[diff] [blame]	372	/*
				373	* This client is about to stall waiting for the GPU. In many cases
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	374	* this is undesirable and limits the throughput of the system, as
				375	* many clients cannot continue processing user input/output whilst
				376	* blocked. RPS autotuning may take tens of milliseconds to respond
				377	* to the GPU load and thus incurs additional latency for the client.
				378	* We can circumvent that by promoting the GPU frequency to maximum
				379	* before we wait. This makes the GPU throttle up much more quickly
				380	* (good for benchmarks and user experience, e.g. window animations),
				381	* but at a cost of spending more power processing the workload
				382	* (bad for battery). Not all clients even want their results
				383	* immediately and for them we should just let the GPU select its own
				384	* frequency to maximise efficiency. To prevent a single client from
				385	* forcing the clocks too high for the whole system, we only allow
				386	* each client to waitboost once in a busy period.
				387	*/
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	388	if (rps_client && !i915_request_started(rq)) {
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	389	if (INTEL_GEN(rq->i915) >= 6)
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	390	gen6_rps_boost(rq, rps_client);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	391	}
				392
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	393	timeout = i915_request_wait(rq, flags, timeout);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	394
				395	out:
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	396	if (flags & I915_WAIT_LOCKED && i915_request_completed(rq))
				397	i915_request_retire_upto(rq);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	398
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	399	return timeout;
				400	}
				401
				402	static long
				403	i915_gem_object_wait_reservation(struct reservation_object *resv,
				404	unsigned int flags,
				405	long timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	406	struct intel_rps_client *rps_client)
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	407	{
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	408	unsigned int seq = __read_seqcount_begin(&resv->seq);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	409	struct dma_fence *excl;
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	410	bool prune_fences = false;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	411
				412	if (flags & I915_WAIT_ALL) {
				413	struct dma_fence **shared;
				414	unsigned int count, i;
				415	int ret;
				416
				417	ret = reservation_object_get_fences_rcu(resv,
				418	&excl, &count, &shared);
				419	if (ret)
				420	return ret;
				421
				422	for (i = 0; i < count; i++) {
				423	timeout = i915_gem_object_wait_fence(shared[i],
				424	flags, timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	425	rps_client);
Chris Wilson	d892e93	2017-02-12 21:53:43 +0000	[diff] [blame]	426	if (timeout < 0)
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	427	break;
				428
				429	dma_fence_put(shared[i]);
				430	}
				431
				432	for (; i < count; i++)
				433	dma_fence_put(shared[i]);
				434	kfree(shared);
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	435
Chris Wilson	fa73055	2018-03-07 17:13:03 +0000	[diff] [blame]	436	/*
				437	* If both shared fences and an exclusive fence exist,
				438	* then by construction the shared fences must be later
				439	* than the exclusive fence. If we successfully wait for
				440	* all the shared fences, we know that the exclusive fence
				441	* must all be signaled. If all the shared fences are
				442	* signaled, we can prune the array and recover the
				443	* floating references on the fences/requests.
				444	*/
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	445	prune_fences = count && timeout >= 0;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	446	} else {
				447	excl = reservation_object_get_excl_rcu(resv);
				448	}
				449
Chris Wilson	fa73055	2018-03-07 17:13:03 +0000	[diff] [blame]	450	if (excl && timeout >= 0)
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	451	timeout = i915_gem_object_wait_fence(excl, flags, timeout,
				452	rps_client);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	453
				454	dma_fence_put(excl);
				455
Chris Wilson	fa73055	2018-03-07 17:13:03 +0000	[diff] [blame]	456	/*
				457	* Opportunistically prune the fences iff we know they have all been
Chris Wilson	03d1cac	2017-03-08 13:26:28 +0000	[diff] [blame]	458	* signaled and that the reservation object has not been changed (i.e.
				459	* no new fences have been added).
				460	*/
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	461	if (prune_fences && !__read_seqcount_retry(&resv->seq, seq)) {
Chris Wilson	03d1cac	2017-03-08 13:26:28 +0000	[diff] [blame]	462	if (reservation_object_trylock(resv)) {
				463	if (!__read_seqcount_retry(&resv->seq, seq))
				464	reservation_object_add_excl_fence(resv, NULL);
				465	reservation_object_unlock(resv);
				466	}
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	467	}
				468
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	469	return timeout;
				470	}
				471
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	472	static void __fence_set_priority(struct dma_fence *fence, int prio)
				473	{
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	474	struct i915_request *rq;
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	475	struct intel_engine_cs *engine;
				476
Chris Wilson	c218ee0	2018-01-06 10:56:18 +0000	[diff] [blame]	477	if (dma_fence_is_signaled(fence) \|\| !dma_fence_is_i915(fence))
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	478	return;
				479
				480	rq = to_request(fence);
				481	engine = rq->engine;
				482	if (!engine->schedule)
				483	return;
				484
				485	engine->schedule(rq, prio);
				486	}
				487
				488	static void fence_set_priority(struct dma_fence *fence, int prio)
				489	{
				490	/* Recurse once into a fence-array */
				491	if (dma_fence_is_array(fence)) {
				492	struct dma_fence_array *array = to_dma_fence_array(fence);
				493	int i;
				494
				495	for (i = 0; i < array->num_fences; i++)
				496	__fence_set_priority(array->fences[i], prio);
				497	} else {
				498	__fence_set_priority(fence, prio);
				499	}
				500	}
				501
				502	int
				503	i915_gem_object_wait_priority(struct drm_i915_gem_object *obj,
				504	unsigned int flags,
				505	int prio)
				506	{
				507	struct dma_fence *excl;
				508
				509	if (flags & I915_WAIT_ALL) {
				510	struct dma_fence **shared;
				511	unsigned int count, i;
				512	int ret;
				513
				514	ret = reservation_object_get_fences_rcu(obj->resv,
				515	&excl, &count, &shared);
				516	if (ret)
				517	return ret;
				518
				519	for (i = 0; i < count; i++) {
				520	fence_set_priority(shared[i], prio);
				521	dma_fence_put(shared[i]);
				522	}
				523
				524	kfree(shared);
				525	} else {
				526	excl = reservation_object_get_excl_rcu(obj->resv);
				527	}
				528
				529	if (excl) {
				530	fence_set_priority(excl, prio);
				531	dma_fence_put(excl);
				532	}
				533	return 0;
				534	}
				535
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	536	/**
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	537	* Waits for rendering to the object to be completed
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	538	* @obj: i915 gem object
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	539	* @flags: how to wait (under a lock, for all rendering or just for writes etc)
				540	* @timeout: how long to wait
Chris Wilson	a0a8b1c	2017-11-09 14:06:44 +0000	[diff] [blame]	541	* @rps_client: client (user process) to charge for any waitboosting
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	542	*/
				543	int
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	544	i915_gem_object_wait(struct drm_i915_gem_object *obj,
				545	unsigned int flags,
				546	long timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	547	struct intel_rps_client *rps_client)
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	548	{
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	549	might_sleep();
				550	#if IS_ENABLED(CONFIG_LOCKDEP)
				551	GEM_BUG_ON(debug_locks &&
				552	!!lockdep_is_held(&obj->base.dev->struct_mutex) !=
				553	!!(flags & I915_WAIT_LOCKED));
				554	#endif
				555	GEM_BUG_ON(timeout < 0);
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	556
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	557	timeout = i915_gem_object_wait_reservation(obj->resv,
				558	flags, timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	559	rps_client);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	560	return timeout < 0 ? timeout : 0;
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	561	}
				562
				563	static struct intel_rps_client to_rps_client(struct drm_file file)
				564	{
				565	struct drm_i915_file_private *fpriv = file->driver_priv;
				566
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	567	return &fpriv->rps_client;
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	568	}
				569
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	570	static int
				571	i915_gem_phys_pwrite(struct drm_i915_gem_object *obj,
				572	struct drm_i915_gem_pwrite *args,
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	573	struct drm_file *file)
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	574	{
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	575	void *vaddr = obj->phys_handle->vaddr + args->offset;
Gustavo Padovan	3ed605b	2016-04-26 12:32:27 -0300	[diff] [blame]	576	char __user *user_data = u64_to_user_ptr(args->data_ptr);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	577
				578	/* We manually control the domain here and pretend that it
				579	* remains coherent i.e. in the GTT domain, like shmem_pwrite.
				580	*/
Rodrigo Vivi	77a0d1c	2015-06-18 11:43:24 -0700	[diff] [blame]	581	intel_fb_obj_invalidate(obj, ORIGIN_CPU);
Chris Wilson	10466d2	2017-01-06 15:22:38 +0000	[diff] [blame]	582	if (copy_from_user(vaddr, user_data, args->size))
				583	return -EFAULT;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	584
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	585	drm_clflush_virt_range(vaddr, args->size);
Chris Wilson	10466d2	2017-01-06 15:22:38 +0000	[diff] [blame]	586	i915_gem_chipset_flush(to_i915(obj->base.dev));
Paulo Zanoni	063e4e6	2015-02-13 17:23:45 -0200	[diff] [blame]	587
Chris Wilson	d59b21e	2017-02-22 11:40:49 +0000	[diff] [blame]	588	intel_fb_obj_flush(obj, ORIGIN_CPU);
Chris Wilson	10466d2	2017-01-06 15:22:38 +0000	[diff] [blame]	589	return 0;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	590	}
				591
Tvrtko Ursulin	187685c	2016-12-01 14:16:36 +0000	[diff] [blame]	592	void i915_gem_object_alloc(struct drm_i915_private dev_priv)
Chris Wilson	42dcedd	2012-11-15 11:32:30 +0000	[diff] [blame]	593	{
Chris Wilson	efab6d8	2015-04-07 16:20:57 +0100	[diff] [blame]	594	return kmem_cache_zalloc(dev_priv->objects, GFP_KERNEL);
Chris Wilson	42dcedd	2012-11-15 11:32:30 +0000	[diff] [blame]	595	}
				596
				597	void i915_gem_object_free(struct drm_i915_gem_object *obj)
				598	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	599	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
Chris Wilson	efab6d8	2015-04-07 16:20:57 +0100	[diff] [blame]	600	kmem_cache_free(dev_priv->objects, obj);
Chris Wilson	42dcedd	2012-11-15 11:32:30 +0000	[diff] [blame]	601	}
				602
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	603	static int
				604	i915_gem_create(struct drm_file *file,
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	605	struct drm_i915_private *dev_priv,
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	606	uint64_t size,
				607	uint32_t *handle_p)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	608	{
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	609	struct drm_i915_gem_object *obj;
Pekka Paalanen	a1a2d1d	2009-08-23 12:40:55 +0300	[diff] [blame]	610	int ret;
				611	u32 handle;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	612
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	613	size = roundup(size, PAGE_SIZE);
Chris Wilson	8ffc024	2011-09-14 14:14:28 +0200	[diff] [blame]	614	if (size == 0)
				615	return -EINVAL;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	616
				617	/* Allocate the new object */
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	618	obj = i915_gem_object_create(dev_priv, size);
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	619	if (IS_ERR(obj))
				620	return PTR_ERR(obj);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	621
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	622	ret = drm_gem_handle_create(file, &obj->base, &handle);
Chris Wilson	202f2fe	2010-10-14 13:20:40 +0100	[diff] [blame]	623	/* drop reference from allocate - handle holds it now */
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	624	i915_gem_object_put(obj);
Daniel Vetter	d861e33	2013-07-24 23:25:03 +0200	[diff] [blame]	625	if (ret)
				626	return ret;
Chris Wilson	202f2fe	2010-10-14 13:20:40 +0100	[diff] [blame]	627
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	628	*handle_p = handle;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	629	return 0;
				630	}
				631
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	632	int
				633	i915_gem_dumb_create(struct drm_file *file,
				634	struct drm_device *dev,
				635	struct drm_mode_create_dumb *args)
				636	{
				637	/* have to work out size/pitch and return them */
Paulo Zanoni	de45eaf	2013-10-18 18:48:24 -0300	[diff] [blame]	638	args->pitch = ALIGN(args->width * DIV_ROUND_UP(args->bpp, 8), 64);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	639	args->size = args->pitch * args->height;
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	640	return i915_gem_create(file, to_i915(dev),
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	641	args->size, &args->handle);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	642	}
				643
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	644	static bool gpu_write_needs_clflush(struct drm_i915_gem_object *obj)
				645	{
				646	return !(obj->cache_level == I915_CACHE_NONE \|\|
				647	obj->cache_level == I915_CACHE_WT);
				648	}
				649
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	650	/**
				651	* Creates a new mm object and returns a handle to it.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	652	* @dev: drm device pointer
				653	* @data: ioctl data blob
				654	* @file: drm file pointer
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	655	*/
				656	int
				657	i915_gem_create_ioctl(struct drm_device dev, void data,
				658	struct drm_file *file)
				659	{
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	660	struct drm_i915_private *dev_priv = to_i915(dev);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	661	struct drm_i915_gem_create *args = data;
Daniel Vetter	63ed2cb	2012-04-23 16:50:50 +0200	[diff] [blame]	662
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	663	i915_gem_flush_free_objects(dev_priv);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	664
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	665	return i915_gem_create(file, dev_priv,
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	666	args->size, &args->handle);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	667	}
				668
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	669	static inline enum fb_op_origin
				670	fb_write_origin(struct drm_i915_gem_object *obj, unsigned int domain)
				671	{
				672	return (domain == I915_GEM_DOMAIN_GTT ?
				673	obj->frontbuffer_ggtt_origin : ORIGIN_CPU);
				674	}
				675
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	676	void i915_gem_flush_ggtt_writes(struct drm_i915_private *dev_priv)
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	677	{
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	678	/*
				679	* No actual flushing is required for the GTT write domain for reads
				680	* from the GTT domain. Writes to it "immediately" go to main memory
				681	* as far as we know, so there's no chipset flush. It also doesn't
				682	* land in the GPU render cache.
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	683	*
				684	* However, we do have to enforce the order so that all writes through
				685	* the GTT land before any writes to the device, such as updates to
				686	* the GATT itself.
				687	*
				688	* We also have to wait a bit for the writes to land from the GTT.
				689	* An uncached read (i.e. mmio) seems to be ideal for the round-trip
				690	* timing. This issue has only been observed when switching quickly
				691	* between GTT writes and CPU reads from inside the kernel on recent hw,
				692	* and it appears to only affect discrete GTT blocks (i.e. on LLC
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	693	* system agents we cannot reproduce this behaviour, until Cannonlake
				694	* that was!).
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	695	*/
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	696
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	697	wmb();
				698
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	699	intel_runtime_pm_get(dev_priv);
				700	spin_lock_irq(&dev_priv->uncore.lock);
				701
				702	POSTING_READ_FW(RING_HEAD(RENDER_RING_BASE));
				703
				704	spin_unlock_irq(&dev_priv->uncore.lock);
				705	intel_runtime_pm_put(dev_priv);
				706	}
				707
				708	static void
				709	flush_write_domain(struct drm_i915_gem_object *obj, unsigned int flush_domains)
				710	{
				711	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
				712	struct i915_vma *vma;
				713
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	714	if (!(obj->write_domain & flush_domains))
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	715	return;
				716
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	717	switch (obj->write_domain) {
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	718	case I915_GEM_DOMAIN_GTT:
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	719	i915_gem_flush_ggtt_writes(dev_priv);
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	720
				721	intel_fb_obj_flush(obj,
				722	fb_write_origin(obj, I915_GEM_DOMAIN_GTT));
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	723
Chris Wilson	e2189dd	2017-12-07 21:14:07 +0000	[diff] [blame]	724	for_each_ggtt_vma(vma, obj) {
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	725	if (vma->iomap)
				726	continue;
				727
				728	i915_vma_unset_ggtt_write(vma);
				729	}
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	730	break;
				731
				732	case I915_GEM_DOMAIN_CPU:
				733	i915_gem_clflush_object(obj, I915_CLFLUSH_SYNC);
				734	break;
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	735
				736	case I915_GEM_DOMAIN_RENDER:
				737	if (gpu_write_needs_clflush(obj))
				738	obj->cache_dirty = true;
				739	break;
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	740	}
				741
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	742	obj->write_domain = 0;
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	743	}
				744
Daniel Vetter	8c59967	2011-12-14 13:57:31 +0100	[diff] [blame]	745	static inline int
Daniel Vetter	8461d22	2011-12-14 13:57:32 +0100	[diff] [blame]	746	__copy_to_user_swizzled(char __user *cpu_vaddr,
				747	const char *gpu_vaddr, int gpu_offset,
				748	int length)
				749	{
				750	int ret, cpu_offset = 0;
				751
				752	while (length > 0) {
				753	int cacheline_end = ALIGN(gpu_offset + 1, 64);
				754	int this_length = min(cacheline_end - gpu_offset, length);
				755	int swizzled_gpu_offset = gpu_offset ^ 64;
				756
				757	ret = __copy_to_user(cpu_vaddr + cpu_offset,
				758	gpu_vaddr + swizzled_gpu_offset,
				759	this_length);
				760	if (ret)
				761	return ret + length;
				762
				763	cpu_offset += this_length;
				764	gpu_offset += this_length;
				765	length -= this_length;
				766	}
				767
				768	return 0;
				769	}
				770
				771	static inline int
Ben Widawsky	4f0c7cf	2012-04-16 14:07:47 -0700	[diff] [blame]	772	__copy_from_user_swizzled(char *gpu_vaddr, int gpu_offset,
				773	const char __user *cpu_vaddr,
Daniel Vetter	8c59967	2011-12-14 13:57:31 +0100	[diff] [blame]	774	int length)
				775	{
				776	int ret, cpu_offset = 0;
				777
				778	while (length > 0) {
				779	int cacheline_end = ALIGN(gpu_offset + 1, 64);
				780	int this_length = min(cacheline_end - gpu_offset, length);
				781	int swizzled_gpu_offset = gpu_offset ^ 64;
				782
				783	ret = __copy_from_user(gpu_vaddr + swizzled_gpu_offset,
				784	cpu_vaddr + cpu_offset,
				785	this_length);
				786	if (ret)
				787	return ret + length;
				788
				789	cpu_offset += this_length;
				790	gpu_offset += this_length;
				791	length -= this_length;
				792	}
				793
				794	return 0;
				795	}
				796
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	797	/*
				798	* Pins the specified object's pages and synchronizes the object with
				799	* GPU accesses. Sets needs_clflush to non-zero if the caller should
				800	* flush the object from the CPU cache.
				801	*/
				802	int i915_gem_obj_prepare_shmem_read(struct drm_i915_gem_object *obj,
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	803	unsigned int *needs_clflush)
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	804	{
				805	int ret;
				806
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	807	lockdep_assert_held(&obj->base.dev->struct_mutex);
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	808
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	809	*needs_clflush = 0;
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	810	if (!i915_gem_object_has_struct_page(obj))
				811	return -ENODEV;
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	812
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	813	ret = i915_gem_object_wait(obj,
				814	I915_WAIT_INTERRUPTIBLE \|
				815	I915_WAIT_LOCKED,
				816	MAX_SCHEDULE_TIMEOUT,
				817	NULL);
Chris Wilson	c13d87e	2016-07-20 09:21:15 +0100	[diff] [blame]	818	if (ret)
				819	return ret;
				820
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	821	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	822	if (ret)
				823	return ret;
				824
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	825	if (obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_READ \|\|
				826	!static_cpu_has(X86_FEATURE_CLFLUSH)) {
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	827	ret = i915_gem_object_set_to_cpu_domain(obj, false);
				828	if (ret)
				829	goto err_unpin;
				830	else
				831	goto out;
				832	}
				833
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	834	flush_write_domain(obj, ~I915_GEM_DOMAIN_CPU);
Chris Wilson	a314d5c	2016-08-18 17:16:48 +0100	[diff] [blame]	835
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	836	/* If we're not in the cpu read domain, set ourself into the gtt
				837	* read domain and manually flush cachelines (if required). This
				838	* optimizes for the case when the gpu will dirty the data
				839	* anyway again before the next pread happens.
				840	*/
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	841	if (!obj->cache_dirty &&
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	842	!(obj->read_domains & I915_GEM_DOMAIN_CPU))
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	843	*needs_clflush = CLFLUSH_BEFORE;
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	844
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	845	out:
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	846	/* return with the pages pinned */
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	847	return 0;
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	848
				849	err_unpin:
				850	i915_gem_object_unpin_pages(obj);
				851	return ret;
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	852	}
				853
				854	int i915_gem_obj_prepare_shmem_write(struct drm_i915_gem_object *obj,
				855	unsigned int *needs_clflush)
				856	{
				857	int ret;
				858
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	859	lockdep_assert_held(&obj->base.dev->struct_mutex);
				860
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	861	*needs_clflush = 0;
				862	if (!i915_gem_object_has_struct_page(obj))
				863	return -ENODEV;
				864
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	865	ret = i915_gem_object_wait(obj,
				866	I915_WAIT_INTERRUPTIBLE \|
				867	I915_WAIT_LOCKED \|
				868	I915_WAIT_ALL,
				869	MAX_SCHEDULE_TIMEOUT,
				870	NULL);
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	871	if (ret)
				872	return ret;
				873
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	874	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	875	if (ret)
				876	return ret;
				877
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	878	if (obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_WRITE \|\|
				879	!static_cpu_has(X86_FEATURE_CLFLUSH)) {
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	880	ret = i915_gem_object_set_to_cpu_domain(obj, true);
				881	if (ret)
				882	goto err_unpin;
				883	else
				884	goto out;
				885	}
				886
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	887	flush_write_domain(obj, ~I915_GEM_DOMAIN_CPU);
Chris Wilson	a314d5c	2016-08-18 17:16:48 +0100	[diff] [blame]	888
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	889	/* If we're not in the cpu write domain, set ourself into the
				890	* gtt write domain and manually flush cachelines (as required).
				891	* This optimizes for the case when the gpu will use the data
				892	* right away and we therefore have to clflush anyway.
				893	*/
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	894	if (!obj->cache_dirty) {
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	895	*needs_clflush \|= CLFLUSH_AFTER;
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	896
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	897	/*
				898	* Same trick applies to invalidate partially written
				899	* cachelines read before writing.
				900	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	901	if (!(obj->read_domains & I915_GEM_DOMAIN_CPU))
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	902	*needs_clflush \|= CLFLUSH_BEFORE;
				903	}
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	904
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	905	out:
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	906	intel_fb_obj_invalidate(obj, ORIGIN_CPU);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	907	obj->mm.dirty = true;
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	908	/* return with the pages pinned */
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	909	return 0;
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	910
				911	err_unpin:
				912	i915_gem_object_unpin_pages(obj);
				913	return ret;
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	914	}
				915
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	916	static void
				917	shmem_clflush_swizzled_range(char *addr, unsigned long length,
				918	bool swizzled)
				919	{
Daniel Vetter	e7e58eb	2012-03-25 19:47:43 +0200	[diff] [blame]	920	if (unlikely(swizzled)) {
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	921	unsigned long start = (unsigned long) addr;
				922	unsigned long end = (unsigned long) addr + length;
				923
				924	/* For swizzling simply ensure that we always flush both
				925	* channels. Lame, but simple and it works. Swizzled
				926	* pwrite/pread is far from a hotpath - current userspace
				927	* doesn't use it at all. */
				928	start = round_down(start, 128);
				929	end = round_up(end, 128);
				930
				931	drm_clflush_virt_range((void *)start, end - start);
				932	} else {
				933	drm_clflush_virt_range(addr, length);
				934	}
				935
				936	}
				937
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	938	/* Only difference to the fast-path function is that this can handle bit17
				939	* and uses non-atomic copy and kmap functions. */
				940	static int
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	941	shmem_pread_slow(struct page *page, int offset, int length,
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	942	char __user *user_data,
				943	bool page_do_bit17_swizzling, bool needs_clflush)
				944	{
				945	char *vaddr;
				946	int ret;
				947
				948	vaddr = kmap(page);
				949	if (needs_clflush)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	950	shmem_clflush_swizzled_range(vaddr + offset, length,
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	951	page_do_bit17_swizzling);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	952
				953	if (page_do_bit17_swizzling)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	954	ret = __copy_to_user_swizzled(user_data, vaddr, offset, length);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	955	else
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	956	ret = __copy_to_user(user_data, vaddr + offset, length);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	957	kunmap(page);
				958
Chris Wilson	f60d7f0	2012-09-04 21:02:56 +0100	[diff] [blame]	959	return ret ? - EFAULT : 0;
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	960	}
				961
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	962	static int
				963	shmem_pread(struct page page, int offset, int length, char __user user_data,
				964	bool page_do_bit17_swizzling, bool needs_clflush)
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	965	{
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	966	int ret;
				967
				968	ret = -ENODEV;
				969	if (!page_do_bit17_swizzling) {
				970	char *vaddr = kmap_atomic(page);
				971
				972	if (needs_clflush)
				973	drm_clflush_virt_range(vaddr + offset, length);
				974	ret = __copy_to_user_inatomic(user_data, vaddr + offset, length);
				975	kunmap_atomic(vaddr);
				976	}
				977	if (ret == 0)
				978	return 0;
				979
				980	return shmem_pread_slow(page, offset, length, user_data,
				981	page_do_bit17_swizzling, needs_clflush);
				982	}
				983
				984	static int
				985	i915_gem_shmem_pread(struct drm_i915_gem_object *obj,
				986	struct drm_i915_gem_pread *args)
				987	{
				988	char __user *user_data;
				989	u64 remain;
				990	unsigned int obj_do_bit17_swizzling;
				991	unsigned int needs_clflush;
				992	unsigned int idx, offset;
				993	int ret;
				994
				995	obj_do_bit17_swizzling = 0;
				996	if (i915_gem_object_needs_bit17_swizzle(obj))
				997	obj_do_bit17_swizzling = BIT(17);
				998
				999	ret = mutex_lock_interruptible(&obj->base.dev->struct_mutex);
				1000	if (ret)
				1001	return ret;
				1002
				1003	ret = i915_gem_obj_prepare_shmem_read(obj, &needs_clflush);
				1004	mutex_unlock(&obj->base.dev->struct_mutex);
				1005	if (ret)
				1006	return ret;
				1007
				1008	remain = args->size;
				1009	user_data = u64_to_user_ptr(args->data_ptr);
				1010	offset = offset_in_page(args->offset);
				1011	for (idx = args->offset >> PAGE_SHIFT; remain; idx++) {
				1012	struct page *page = i915_gem_object_get_page(obj, idx);
				1013	int length;
				1014
				1015	length = remain;
				1016	if (offset + length > PAGE_SIZE)
				1017	length = PAGE_SIZE - offset;
				1018
				1019	ret = shmem_pread(page, offset, length, user_data,
				1020	page_to_phys(page) & obj_do_bit17_swizzling,
				1021	needs_clflush);
				1022	if (ret)
				1023	break;
				1024
				1025	remain -= length;
				1026	user_data += length;
				1027	offset = 0;
				1028	}
				1029
				1030	i915_gem_obj_finish_shmem_access(obj);
				1031	return ret;
				1032	}
				1033
				1034	static inline bool
				1035	gtt_user_read(struct io_mapping *mapping,
				1036	loff_t base, int offset,
				1037	char __user *user_data, int length)
				1038	{
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1039	void __iomem *vaddr;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1040	unsigned long unwritten;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1041
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1042	/* We can use the cpu mem copy function because this is X86. */
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1043	vaddr = io_mapping_map_atomic_wc(mapping, base);
				1044	unwritten = __copy_to_user_inatomic(user_data,
				1045	(void __force *)vaddr + offset,
				1046	length);
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1047	io_mapping_unmap_atomic(vaddr);
				1048	if (unwritten) {
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1049	vaddr = io_mapping_map_wc(mapping, base, PAGE_SIZE);
				1050	unwritten = copy_to_user(user_data,
				1051	(void __force *)vaddr + offset,
				1052	length);
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1053	io_mapping_unmap(vaddr);
				1054	}
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1055	return unwritten;
				1056	}
				1057
				1058	static int
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1059	i915_gem_gtt_pread(struct drm_i915_gem_object *obj,
				1060	const struct drm_i915_gem_pread *args)
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1061	{
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1062	struct drm_i915_private *i915 = to_i915(obj->base.dev);
				1063	struct i915_ggtt *ggtt = &i915->ggtt;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1064	struct drm_mm_node node;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1065	struct i915_vma *vma;
				1066	void __user *user_data;
				1067	u64 remain, offset;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1068	int ret;
				1069
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1070	ret = mutex_lock_interruptible(&i915->drm.struct_mutex);
				1071	if (ret)
				1072	return ret;
				1073
				1074	intel_runtime_pm_get(i915);
				1075	vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0,
Chris Wilson	a3259ca	2017-10-09 09:44:00 +0100	[diff] [blame]	1076	PIN_MAPPABLE \|
				1077	PIN_NONFAULT \|
				1078	PIN_NONBLOCK);
Chris Wilson	1803458	2016-08-18 17:16:45 +0100	[diff] [blame]	1079	if (!IS_ERR(vma)) {
				1080	node.start = i915_ggtt_offset(vma);
				1081	node.allocated = false;
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	1082	ret = i915_vma_put_fence(vma);
Chris Wilson	1803458	2016-08-18 17:16:45 +0100	[diff] [blame]	1083	if (ret) {
				1084	i915_vma_unpin(vma);
				1085	vma = ERR_PTR(ret);
				1086	}
				1087	}
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1088	if (IS_ERR(vma)) {
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1089	ret = insert_mappable_node(ggtt, &node, PAGE_SIZE);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1090	if (ret)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1091	goto out_unlock;
				1092	GEM_BUG_ON(!node.allocated);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1093	}
				1094
				1095	ret = i915_gem_object_set_to_gtt_domain(obj, false);
				1096	if (ret)
				1097	goto out_unpin;
				1098
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1099	mutex_unlock(&i915->drm.struct_mutex);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1100
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1101	user_data = u64_to_user_ptr(args->data_ptr);
				1102	remain = args->size;
				1103	offset = args->offset;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1104
				1105	while (remain > 0) {
				1106	/* Operation in this page
				1107	*
				1108	* page_base = page offset within aperture
				1109	* page_offset = offset within page
				1110	* page_length = bytes to copy for this page
				1111	*/
				1112	u32 page_base = node.start;
				1113	unsigned page_offset = offset_in_page(offset);
				1114	unsigned page_length = PAGE_SIZE - page_offset;
				1115	page_length = remain < page_length ? remain : page_length;
				1116	if (node.allocated) {
				1117	wmb();
				1118	ggtt->base.insert_page(&ggtt->base,
				1119	i915_gem_object_get_dma_address(obj, offset >> PAGE_SHIFT),
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1120	node.start, I915_CACHE_NONE, 0);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1121	wmb();
				1122	} else {
				1123	page_base += offset & PAGE_MASK;
				1124	}
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1125
Matthew Auld	73ebd50	2017-12-11 15:18:20 +0000	[diff] [blame]	1126	if (gtt_user_read(&ggtt->iomap, page_base, page_offset,
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1127	user_data, page_length)) {
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1128	ret = -EFAULT;
				1129	break;
				1130	}
				1131
				1132	remain -= page_length;
				1133	user_data += page_length;
				1134	offset += page_length;
				1135	}
				1136
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1137	mutex_lock(&i915->drm.struct_mutex);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1138	out_unpin:
				1139	if (node.allocated) {
				1140	wmb();
				1141	ggtt->base.clear_range(&ggtt->base,
Michał Winiarski	4fb84d9	2016-10-13 14:02:40 +0200	[diff] [blame]	1142	node.start, node.size);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1143	remove_mappable_node(&node);
				1144	} else {
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1145	i915_vma_unpin(vma);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1146	}
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1147	out_unlock:
				1148	intel_runtime_pm_put(i915);
				1149	mutex_unlock(&i915->drm.struct_mutex);
Chris Wilson	f60d7f0	2012-09-04 21:02:56 +0100	[diff] [blame]	1150
Eric Anholt	eb01459	2009-03-10 11:44:52 -0700	[diff] [blame]	1151	return ret;
				1152	}
				1153
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1154	/**
				1155	* Reads data from the object referenced by handle.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1156	* @dev: drm device pointer
				1157	* @data: ioctl data blob
				1158	* @file: drm file pointer
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1159	*
				1160	* On error, the contents of *data are undefined.
				1161	*/
				1162	int
				1163	i915_gem_pread_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1164	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1165	{
				1166	struct drm_i915_gem_pread *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1167	struct drm_i915_gem_object *obj;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1168	int ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1169
Chris Wilson	51311d0	2010-11-17 09:10:42 +0000	[diff] [blame]	1170	if (args->size == 0)
				1171	return 0;
				1172
				1173	if (!access_ok(VERIFY_WRITE,
Gustavo Padovan	3ed605b	2016-04-26 12:32:27 -0300	[diff] [blame]	1174	u64_to_user_ptr(args->data_ptr),
Chris Wilson	51311d0	2010-11-17 09:10:42 +0000	[diff] [blame]	1175	args->size))
				1176	return -EFAULT;
				1177
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1178	obj = i915_gem_object_lookup(file, args->handle);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1179	if (!obj)
				1180	return -ENOENT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1181
Chris Wilson	7dcd249	2010-09-26 20:21:44 +0100	[diff] [blame]	1182	/* Bounds check source. */
Matthew Auld	966d5bf	2016-12-13 20:32:22 +0000	[diff] [blame]	1183	if (range_overflows_t(u64, args->offset, args->size, obj->base.size)) {
Chris Wilson	ce9d419	2010-09-26 20:50:05 +0100	[diff] [blame]	1184	ret = -EINVAL;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1185	goto out;
Chris Wilson	ce9d419	2010-09-26 20:50:05 +0100	[diff] [blame]	1186	}
				1187
Chris Wilson	db53a30	2011-02-03 11:57:46 +0000	[diff] [blame]	1188	trace_i915_gem_object_pread(obj, args->offset, args->size);
				1189
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	1190	ret = i915_gem_object_wait(obj,
				1191	I915_WAIT_INTERRUPTIBLE,
				1192	MAX_SCHEDULE_TIMEOUT,
				1193	to_rps_client(file));
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1194	if (ret)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1195	goto out;
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1196
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1197	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1198	if (ret)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1199	goto out;
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1200
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1201	ret = i915_gem_shmem_pread(obj, args);
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	1202	if (ret == -EFAULT \|\| ret == -ENODEV)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1203	ret = i915_gem_gtt_pread(obj, args);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1204
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1205	i915_gem_object_unpin_pages(obj);
				1206	out:
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1207	i915_gem_object_put(obj);
Eric Anholt	eb01459	2009-03-10 11:44:52 -0700	[diff] [blame]	1208	return ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1209	}
				1210
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1211	/* This is the fast write path which cannot handle
				1212	* page faults in the source data
Linus Torvalds	9b7530cc	2008-10-20 14:16:43 -0700	[diff] [blame]	1213	*/
Linus Torvalds	9b7530cc	2008-10-20 14:16:43 -0700	[diff] [blame]	1214
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1215	static inline bool
				1216	ggtt_write(struct io_mapping *mapping,
				1217	loff_t base, int offset,
				1218	char __user *user_data, int length)
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1219	{
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1220	void __iomem *vaddr;
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1221	unsigned long unwritten;
				1222
Ben Widawsky	4f0c7cf	2012-04-16 14:07:47 -0700	[diff] [blame]	1223	/* We can use the cpu mem copy function because this is X86. */
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1224	vaddr = io_mapping_map_atomic_wc(mapping, base);
				1225	unwritten = __copy_from_user_inatomic_nocache((void __force *)vaddr + offset,
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1226	user_data, length);
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1227	io_mapping_unmap_atomic(vaddr);
				1228	if (unwritten) {
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1229	vaddr = io_mapping_map_wc(mapping, base, PAGE_SIZE);
				1230	unwritten = copy_from_user((void __force *)vaddr + offset,
				1231	user_data, length);
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1232	io_mapping_unmap(vaddr);
				1233	}
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1234
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1235	return unwritten;
				1236	}
				1237
Eric Anholt	3de09aa	2009-03-09 09:42:23 -0700	[diff] [blame]	1238	/**
				1239	* This is the fast pwrite path, where we copy the data directly from the
				1240	* user into the GTT, uncached.
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1241	* @obj: i915 GEM object
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1242	* @args: pwrite arguments structure
Eric Anholt	3de09aa	2009-03-09 09:42:23 -0700	[diff] [blame]	1243	*/
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1244	static int
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1245	i915_gem_gtt_pwrite_fast(struct drm_i915_gem_object *obj,
				1246	const struct drm_i915_gem_pwrite *args)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1247	{
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1248	struct drm_i915_private *i915 = to_i915(obj->base.dev);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1249	struct i915_ggtt *ggtt = &i915->ggtt;
				1250	struct drm_mm_node node;
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1251	struct i915_vma *vma;
				1252	u64 remain, offset;
				1253	void __user *user_data;
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1254	int ret;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1255
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1256	ret = mutex_lock_interruptible(&i915->drm.struct_mutex);
				1257	if (ret)
				1258	return ret;
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1259
Chris Wilson	8bd8181	2017-10-19 07:37:33 +0100	[diff] [blame]	1260	if (i915_gem_object_has_struct_page(obj)) {
				1261	/*
				1262	* Avoid waking the device up if we can fallback, as
				1263	* waking/resuming is very slow (worst-case 10-100 ms
				1264	* depending on PCI sleeps and our own resume time).
				1265	* This easily dwarfs any performance advantage from
				1266	* using the cache bypass of indirect GGTT access.
				1267	*/
				1268	if (!intel_runtime_pm_get_if_in_use(i915)) {
				1269	ret = -EFAULT;
				1270	goto out_unlock;
				1271	}
				1272	} else {
				1273	/* No backing pages, no fallback, we must force GGTT access */
				1274	intel_runtime_pm_get(i915);
				1275	}
				1276
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1277	vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0,
Chris Wilson	a3259ca	2017-10-09 09:44:00 +0100	[diff] [blame]	1278	PIN_MAPPABLE \|
				1279	PIN_NONFAULT \|
				1280	PIN_NONBLOCK);
Chris Wilson	1803458	2016-08-18 17:16:45 +0100	[diff] [blame]	1281	if (!IS_ERR(vma)) {
				1282	node.start = i915_ggtt_offset(vma);
				1283	node.allocated = false;
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	1284	ret = i915_vma_put_fence(vma);
Chris Wilson	1803458	2016-08-18 17:16:45 +0100	[diff] [blame]	1285	if (ret) {
				1286	i915_vma_unpin(vma);
				1287	vma = ERR_PTR(ret);
				1288	}
				1289	}
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1290	if (IS_ERR(vma)) {
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1291	ret = insert_mappable_node(ggtt, &node, PAGE_SIZE);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1292	if (ret)
Chris Wilson	8bd8181	2017-10-19 07:37:33 +0100	[diff] [blame]	1293	goto out_rpm;
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1294	GEM_BUG_ON(!node.allocated);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1295	}
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1296
				1297	ret = i915_gem_object_set_to_gtt_domain(obj, true);
				1298	if (ret)
				1299	goto out_unpin;
				1300
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1301	mutex_unlock(&i915->drm.struct_mutex);
				1302
Chris Wilson	b19482d	2016-08-18 17:16:43 +0100	[diff] [blame]	1303	intel_fb_obj_invalidate(obj, ORIGIN_CPU);
Paulo Zanoni	063e4e6	2015-02-13 17:23:45 -0200	[diff] [blame]	1304
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1305	user_data = u64_to_user_ptr(args->data_ptr);
				1306	offset = args->offset;
				1307	remain = args->size;
				1308	while (remain) {
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1309	/* Operation in this page
				1310	*
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1311	* page_base = page offset within aperture
				1312	* page_offset = offset within page
				1313	* page_length = bytes to copy for this page
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1314	*/
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1315	u32 page_base = node.start;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1316	unsigned int page_offset = offset_in_page(offset);
				1317	unsigned int page_length = PAGE_SIZE - page_offset;
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1318	page_length = remain < page_length ? remain : page_length;
				1319	if (node.allocated) {
				1320	wmb(); /* flush the write before we modify the GGTT */
				1321	ggtt->base.insert_page(&ggtt->base,
				1322	i915_gem_object_get_dma_address(obj, offset >> PAGE_SHIFT),
				1323	node.start, I915_CACHE_NONE, 0);
				1324	wmb(); /* flush modifications to the GGTT (insert_page) */
				1325	} else {
				1326	page_base += offset & PAGE_MASK;
				1327	}
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1328	/* If we get a fault while copying data, then (presumably) our
Eric Anholt	3de09aa	2009-03-09 09:42:23 -0700	[diff] [blame]	1329	* source page isn't available. Return the error and we'll
				1330	* retry in the slow path.
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1331	* If the object is non-shmem backed, we retry again with the
				1332	* path that handles page fault.
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1333	*/
Matthew Auld	73ebd50	2017-12-11 15:18:20 +0000	[diff] [blame]	1334	if (ggtt_write(&ggtt->iomap, page_base, page_offset,
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1335	user_data, page_length)) {
				1336	ret = -EFAULT;
				1337	break;
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1338	}
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1339
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1340	remain -= page_length;
				1341	user_data += page_length;
				1342	offset += page_length;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1343	}
Chris Wilson	d59b21e	2017-02-22 11:40:49 +0000	[diff] [blame]	1344	intel_fb_obj_flush(obj, ORIGIN_CPU);
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1345
				1346	mutex_lock(&i915->drm.struct_mutex);
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1347	out_unpin:
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1348	if (node.allocated) {
				1349	wmb();
				1350	ggtt->base.clear_range(&ggtt->base,
Michał Winiarski	4fb84d9	2016-10-13 14:02:40 +0200	[diff] [blame]	1351	node.start, node.size);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1352	remove_mappable_node(&node);
				1353	} else {
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1354	i915_vma_unpin(vma);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1355	}
Chris Wilson	8bd8181	2017-10-19 07:37:33 +0100	[diff] [blame]	1356	out_rpm:
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	1357	intel_runtime_pm_put(i915);
Chris Wilson	8bd8181	2017-10-19 07:37:33 +0100	[diff] [blame]	1358	out_unlock:
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1359	mutex_unlock(&i915->drm.struct_mutex);
Eric Anholt	3de09aa	2009-03-09 09:42:23 -0700	[diff] [blame]	1360	return ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1361	}
				1362
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1363	static int
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1364	shmem_pwrite_slow(struct page *page, int offset, int length,
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1365	char __user *user_data,
				1366	bool page_do_bit17_swizzling,
				1367	bool needs_clflush_before,
				1368	bool needs_clflush_after)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1369	{
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1370	char *vaddr;
				1371	int ret;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1372
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1373	vaddr = kmap(page);
Daniel Vetter	e7e58eb	2012-03-25 19:47:43 +0200	[diff] [blame]	1374	if (unlikely(needs_clflush_before \|\| page_do_bit17_swizzling))
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1375	shmem_clflush_swizzled_range(vaddr + offset, length,
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	1376	page_do_bit17_swizzling);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1377	if (page_do_bit17_swizzling)
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1378	ret = __copy_from_user_swizzled(vaddr, offset, user_data,
				1379	length);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1380	else
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1381	ret = __copy_from_user(vaddr + offset, user_data, length);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1382	if (needs_clflush_after)
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1383	shmem_clflush_swizzled_range(vaddr + offset, length,
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	1384	page_do_bit17_swizzling);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1385	kunmap(page);
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	1386
Chris Wilson	755d221	2012-09-04 21:02:55 +0100	[diff] [blame]	1387	return ret ? -EFAULT : 0;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1388	}
				1389
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1390	/* Per-page copy function for the shmem pwrite fastpath.
				1391	* Flushes invalid cachelines before writing to the target if
				1392	* needs_clflush_before is set and flushes out any written cachelines after
				1393	* writing if needs_clflush is set.
				1394	*/
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1395	static int
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1396	shmem_pwrite(struct page page, int offset, int len, char __user user_data,
				1397	bool page_do_bit17_swizzling,
				1398	bool needs_clflush_before,
				1399	bool needs_clflush_after)
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1400	{
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1401	int ret;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1402
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1403	ret = -ENODEV;
				1404	if (!page_do_bit17_swizzling) {
				1405	char *vaddr = kmap_atomic(page);
				1406
				1407	if (needs_clflush_before)
				1408	drm_clflush_virt_range(vaddr + offset, len);
				1409	ret = __copy_from_user_inatomic(vaddr + offset, user_data, len);
				1410	if (needs_clflush_after)
				1411	drm_clflush_virt_range(vaddr + offset, len);
				1412
				1413	kunmap_atomic(vaddr);
				1414	}
				1415	if (ret == 0)
				1416	return ret;
				1417
				1418	return shmem_pwrite_slow(page, offset, len, user_data,
				1419	page_do_bit17_swizzling,
				1420	needs_clflush_before,
				1421	needs_clflush_after);
				1422	}
				1423
				1424	static int
				1425	i915_gem_shmem_pwrite(struct drm_i915_gem_object *obj,
				1426	const struct drm_i915_gem_pwrite *args)
				1427	{
				1428	struct drm_i915_private *i915 = to_i915(obj->base.dev);
				1429	void __user *user_data;
				1430	u64 remain;
				1431	unsigned int obj_do_bit17_swizzling;
				1432	unsigned int partial_cacheline_write;
				1433	unsigned int needs_clflush;
				1434	unsigned int offset, idx;
				1435	int ret;
				1436
				1437	ret = mutex_lock_interruptible(&i915->drm.struct_mutex);
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1438	if (ret)
				1439	return ret;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1440
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1441	ret = i915_gem_obj_prepare_shmem_write(obj, &needs_clflush);
				1442	mutex_unlock(&i915->drm.struct_mutex);
				1443	if (ret)
				1444	return ret;
				1445
				1446	obj_do_bit17_swizzling = 0;
				1447	if (i915_gem_object_needs_bit17_swizzle(obj))
				1448	obj_do_bit17_swizzling = BIT(17);
				1449
				1450	/* If we don't overwrite a cacheline completely we need to be
				1451	* careful to have up-to-date data by first clflushing. Don't
				1452	* overcomplicate things and flush the entire patch.
				1453	*/
				1454	partial_cacheline_write = 0;
				1455	if (needs_clflush & CLFLUSH_BEFORE)
				1456	partial_cacheline_write = boot_cpu_data.x86_clflush_size - 1;
				1457
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1458	user_data = u64_to_user_ptr(args->data_ptr);
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1459	remain = args->size;
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1460	offset = offset_in_page(args->offset);
				1461	for (idx = args->offset >> PAGE_SHIFT; remain; idx++) {
				1462	struct page *page = i915_gem_object_get_page(obj, idx);
				1463	int length;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1464
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1465	length = remain;
				1466	if (offset + length > PAGE_SIZE)
				1467	length = PAGE_SIZE - offset;
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	1468
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1469	ret = shmem_pwrite(page, offset, length, user_data,
				1470	page_to_phys(page) & obj_do_bit17_swizzling,
				1471	(offset \| length) & partial_cacheline_write,
				1472	needs_clflush & CLFLUSH_AFTER);
				1473	if (ret)
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	1474	break;
				1475
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1476	remain -= length;
				1477	user_data += length;
				1478	offset = 0;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1479	}
				1480
Chris Wilson	d59b21e	2017-02-22 11:40:49 +0000	[diff] [blame]	1481	intel_fb_obj_flush(obj, ORIGIN_CPU);
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1482	i915_gem_obj_finish_shmem_access(obj);
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1483	return ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1484	}
				1485
				1486	/**
				1487	* Writes data to the object referenced by handle.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1488	* @dev: drm device
				1489	* @data: ioctl data blob
				1490	* @file: drm file
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1491	*
				1492	* On error, the contents of the buffer that were to be modified are undefined.
				1493	*/
				1494	int
				1495	i915_gem_pwrite_ioctl(struct drm_device dev, void data,
Chris Wilson	fbd5a26	2010-10-14 15:03:58 +0100	[diff] [blame]	1496	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1497	{
				1498	struct drm_i915_gem_pwrite *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1499	struct drm_i915_gem_object *obj;
Chris Wilson	51311d0	2010-11-17 09:10:42 +0000	[diff] [blame]	1500	int ret;
				1501
				1502	if (args->size == 0)
				1503	return 0;
				1504
				1505	if (!access_ok(VERIFY_READ,
Gustavo Padovan	3ed605b	2016-04-26 12:32:27 -0300	[diff] [blame]	1506	u64_to_user_ptr(args->data_ptr),
Chris Wilson	51311d0	2010-11-17 09:10:42 +0000	[diff] [blame]	1507	args->size))
				1508	return -EFAULT;
				1509
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1510	obj = i915_gem_object_lookup(file, args->handle);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1511	if (!obj)
				1512	return -ENOENT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1513
Chris Wilson	7dcd249	2010-09-26 20:21:44 +0100	[diff] [blame]	1514	/* Bounds check destination. */
Matthew Auld	966d5bf	2016-12-13 20:32:22 +0000	[diff] [blame]	1515	if (range_overflows_t(u64, args->offset, args->size, obj->base.size)) {
Chris Wilson	ce9d419	2010-09-26 20:50:05 +0100	[diff] [blame]	1516	ret = -EINVAL;
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1517	goto err;
Chris Wilson	ce9d419	2010-09-26 20:50:05 +0100	[diff] [blame]	1518	}
				1519
Chris Wilson	db53a30	2011-02-03 11:57:46 +0000	[diff] [blame]	1520	trace_i915_gem_object_pwrite(obj, args->offset, args->size);
				1521
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	1522	ret = -ENODEV;
				1523	if (obj->ops->pwrite)
				1524	ret = obj->ops->pwrite(obj, args);
				1525	if (ret != -ENODEV)
				1526	goto err;
				1527
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	1528	ret = i915_gem_object_wait(obj,
				1529	I915_WAIT_INTERRUPTIBLE \|
				1530	I915_WAIT_ALL,
				1531	MAX_SCHEDULE_TIMEOUT,
				1532	to_rps_client(file));
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1533	if (ret)
				1534	goto err;
				1535
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1536	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1537	if (ret)
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1538	goto err;
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1539
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1540	ret = -EFAULT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1541	/* We can only do the GTT pwrite on untiled buffers, as otherwise
				1542	* it would end up going through the fenced access, and we'll get
				1543	* different detiling behavior between reading and writing.
				1544	* pread/pwrite currently are reading and writing from the CPU
				1545	* perspective, requiring manual detiling by the client.
				1546	*/
Chris Wilson	6eae005	2016-06-20 15:05:52 +0100	[diff] [blame]	1547	if (!i915_gem_object_has_struct_page(obj) \|\|
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	1548	cpu_write_needs_clflush(obj))
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1549	/* Note that the gtt paths might fail with non-page-backed user
				1550	* pointers (e.g. gtt mappings when moving data between
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	1551	* textures). Fallback to the shmem path in that case.
				1552	*/
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1553	ret = i915_gem_gtt_pwrite_fast(obj, args);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1554
Chris Wilson	d1054ee	2016-07-16 18:42:36 +0100	[diff] [blame]	1555	if (ret == -EFAULT \|\| ret == -ENOSPC) {
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	1556	if (obj->phys_handle)
				1557	ret = i915_gem_phys_pwrite(obj, args, file);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1558	else
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1559	ret = i915_gem_shmem_pwrite(obj, args);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	1560	}
Daniel Vetter	5c0480f	2011-12-14 13:57:30 +0100	[diff] [blame]	1561
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1562	i915_gem_object_unpin_pages(obj);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1563	err:
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1564	i915_gem_object_put(obj);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1565	return ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1566	}
				1567
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1568	static void i915_gem_object_bump_inactive_ggtt(struct drm_i915_gem_object *obj)
				1569	{
				1570	struct drm_i915_private *i915;
				1571	struct list_head *list;
				1572	struct i915_vma *vma;
				1573
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	1574	GEM_BUG_ON(!i915_gem_object_has_pinned_pages(obj));
				1575
Chris Wilson	e2189dd	2017-12-07 21:14:07 +0000	[diff] [blame]	1576	for_each_ggtt_vma(vma, obj) {
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1577	if (i915_vma_is_active(vma))
				1578	continue;
				1579
				1580	if (!drm_mm_node_allocated(&vma->node))
				1581	continue;
				1582
				1583	list_move_tail(&vma->vm_link, &vma->vm->inactive_list);
				1584	}
				1585
				1586	i915 = to_i915(obj->base.dev);
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	1587	spin_lock(&i915->mm.obj_lock);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1588	list = obj->bind_count ? &i915->mm.bound_list : &i915->mm.unbound_list;
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	1589	list_move_tail(&obj->mm.link, list);
				1590	spin_unlock(&i915->mm.obj_lock);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1591	}
				1592
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1593	/**
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1594	* Called when user space prepares to use an object with the CPU, either
				1595	* through the mmap ioctl's mapping or a GTT mapping.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1596	* @dev: drm device
				1597	* @data: ioctl data blob
				1598	* @file: drm file
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1599	*/
				1600	int
				1601	i915_gem_set_domain_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1602	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1603	{
				1604	struct drm_i915_gem_set_domain *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1605	struct drm_i915_gem_object *obj;
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1606	uint32_t read_domains = args->read_domains;
				1607	uint32_t write_domain = args->write_domain;
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1608	int err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1609
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1610	/* Only handle setting domains to types used by the CPU. */
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1611	if ((write_domain \| read_domains) & I915_GEM_GPU_DOMAINS)
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1612	return -EINVAL;
				1613
				1614	/* Having something in the write domain implies it's in the read
				1615	* domain, and only that read domain. Enforce that in the request.
				1616	*/
				1617	if (write_domain != 0 && read_domains != write_domain)
				1618	return -EINVAL;
				1619
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1620	obj = i915_gem_object_lookup(file, args->handle);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1621	if (!obj)
				1622	return -ENOENT;
Jesse Barnes	652c393	2009-08-17 13:31:43 -0700	[diff] [blame]	1623
Chris Wilson	3236f57	2012-08-24 09:35:09 +0100	[diff] [blame]	1624	/* Try to flush the object off the GPU without holding the lock.
				1625	* We will repeat the flush holding the lock in the normal manner
				1626	* to catch cases where we are gazumped.
				1627	*/
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1628	err = i915_gem_object_wait(obj,
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	1629	I915_WAIT_INTERRUPTIBLE \|
				1630	(write_domain ? I915_WAIT_ALL : 0),
				1631	MAX_SCHEDULE_TIMEOUT,
				1632	to_rps_client(file));
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1633	if (err)
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1634	goto out;
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1635
Tina Zhang	a03f395	2017-11-14 10:25:13 +0000	[diff] [blame]	1636	/*
				1637	* Proxy objects do not control access to the backing storage, ergo
				1638	* they cannot be used as a means to manipulate the cache domain
				1639	* tracking for that backing storage. The proxy object is always
				1640	* considered to be outside of any cache domain.
				1641	*/
				1642	if (i915_gem_object_is_proxy(obj)) {
				1643	err = -ENXIO;
				1644	goto out;
				1645	}
				1646
				1647	/*
				1648	* Flush and acquire obj->pages so that we are coherent through
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1649	* direct access in memory with previous cached writes through
				1650	* shmemfs and that our cache domain tracking remains valid.
				1651	* For example, if the obj->filp was moved to swap without us
				1652	* being notified and releasing the pages, we would mistakenly
				1653	* continue to assume that the obj remained out of the CPU cached
				1654	* domain.
				1655	*/
				1656	err = i915_gem_object_pin_pages(obj);
				1657	if (err)
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1658	goto out;
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1659
				1660	err = i915_mutex_lock_interruptible(dev);
				1661	if (err)
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1662	goto out_unpin;
Chris Wilson	3236f57	2012-08-24 09:35:09 +0100	[diff] [blame]	1663
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	1664	if (read_domains & I915_GEM_DOMAIN_WC)
				1665	err = i915_gem_object_set_to_wc_domain(obj, write_domain);
				1666	else if (read_domains & I915_GEM_DOMAIN_GTT)
				1667	err = i915_gem_object_set_to_gtt_domain(obj, write_domain);
Chris Wilson	43566de	2015-01-02 16:29:29 +0530	[diff] [blame]	1668	else
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	1669	err = i915_gem_object_set_to_cpu_domain(obj, write_domain);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1670
				1671	/* And bump the LRU for this access */
				1672	i915_gem_object_bump_inactive_ggtt(obj);
				1673
				1674	mutex_unlock(&dev->struct_mutex);
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1675
Daniel Vetter	031b698	2015-06-26 19:35:16 +0200	[diff] [blame]	1676	if (write_domain != 0)
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	1677	intel_fb_obj_invalidate(obj,
				1678	fb_write_origin(obj, write_domain));
Daniel Vetter	031b698	2015-06-26 19:35:16 +0200	[diff] [blame]	1679
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1680	out_unpin:
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1681	i915_gem_object_unpin_pages(obj);
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1682	out:
				1683	i915_gem_object_put(obj);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1684	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1685	}
				1686
				1687	/**
				1688	* Called when user space has done writes to this buffer
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1689	* @dev: drm device
				1690	* @data: ioctl data blob
				1691	* @file: drm file
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1692	*/
				1693	int
				1694	i915_gem_sw_finish_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1695	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1696	{
				1697	struct drm_i915_gem_sw_finish *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1698	struct drm_i915_gem_object *obj;
Chris Wilson	1d7cfea	2010-10-17 09:45:41 +0100	[diff] [blame]	1699
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1700	obj = i915_gem_object_lookup(file, args->handle);
Chris Wilson	c21724c	2016-08-05 10:14:19 +0100	[diff] [blame]	1701	if (!obj)
				1702	return -ENOENT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1703
Tina Zhang	a03f395	2017-11-14 10:25:13 +0000	[diff] [blame]	1704	/*
				1705	* Proxy objects are barred from CPU access, so there is no
				1706	* need to ban sw_finish as it is a nop.
				1707	*/
				1708
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1709	/* Pinned buffers may be scanout, so flush the cache */
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	1710	i915_gem_object_flush_if_display(obj);
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1711	i915_gem_object_put(obj);
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	1712
				1713	return 0;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1714	}
				1715
				1716	/**
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1717	* i915_gem_mmap_ioctl - Maps the contents of an object, returning the address
				1718	* it is mapped to.
				1719	* @dev: drm device
				1720	* @data: ioctl data blob
				1721	* @file: drm file
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1722	*
				1723	* While the mapping holds a reference on the contents of the object, it doesn't
				1724	* imply a ref on the object itself.
Daniel Vetter	3436738	2014-10-16 12:28:18 +0200	[diff] [blame]	1725	*
				1726	* IMPORTANT:
				1727	*
				1728	* DRM driver writers who look a this function as an example for how to do GEM
				1729	* mmap support, please don't implement mmap support like here. The modern way
				1730	* to implement DRM mmap support is with an mmap offset ioctl (like
				1731	* i915_gem_mmap_gtt) and then using the mmap syscall on the DRM fd directly.
				1732	* That way debug tooling like valgrind will understand what's going on, hiding
				1733	* the mmap call in a driver private ioctl will break that. The i915 driver only
				1734	* does cpu mmaps this way because we didn't know better.
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1735	*/
				1736	int
				1737	i915_gem_mmap_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1738	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1739	{
				1740	struct drm_i915_gem_mmap *args = data;
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1741	struct drm_i915_gem_object *obj;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1742	unsigned long addr;
				1743
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1744	if (args->flags & ~(I915_MMAP_WC))
				1745	return -EINVAL;
				1746
Borislav Petkov	568a58e	2016-03-29 17:42:01 +0200	[diff] [blame]	1747	if (args->flags & I915_MMAP_WC && !boot_cpu_has(X86_FEATURE_PAT))
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1748	return -ENODEV;
				1749
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1750	obj = i915_gem_object_lookup(file, args->handle);
				1751	if (!obj)
Chris Wilson	bf79cb9	2010-08-04 14:19:46 +0100	[diff] [blame]	1752	return -ENOENT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1753
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	1754	/* prime objects have no backing filp to GEM mmap
				1755	* pages from.
				1756	*/
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1757	if (!obj->base.filp) {
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1758	i915_gem_object_put(obj);
Tina Zhang	274b246	2017-11-14 10:25:12 +0000	[diff] [blame]	1759	return -ENXIO;
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	1760	}
				1761
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1762	addr = vm_mmap(obj->base.filp, 0, args->size,
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1763	PROT_READ \| PROT_WRITE, MAP_SHARED,
				1764	args->offset);
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1765	if (args->flags & I915_MMAP_WC) {
				1766	struct mm_struct *mm = current->mm;
				1767	struct vm_area_struct *vma;
				1768
Michal Hocko	80a89a5	2016-05-23 16:26:11 -0700	[diff] [blame]	1769	if (down_write_killable(&mm->mmap_sem)) {
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1770	i915_gem_object_put(obj);
Michal Hocko	80a89a5	2016-05-23 16:26:11 -0700	[diff] [blame]	1771	return -EINTR;
				1772	}
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1773	vma = find_vma(mm, addr);
				1774	if (vma)
				1775	vma->vm_page_prot =
				1776	pgprot_writecombine(vm_get_page_prot(vma->vm_flags));
				1777	else
				1778	addr = -ENOMEM;
				1779	up_write(&mm->mmap_sem);
Chris Wilson	aeecc96	2016-06-17 14:46:39 -0300	[diff] [blame]	1780
				1781	/* This may race, but that's ok, it only gets set */
Chris Wilson	5034924	2016-08-18 17:17:04 +0100	[diff] [blame]	1782	WRITE_ONCE(obj->frontbuffer_ggtt_origin, ORIGIN_CPU);
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1783	}
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1784	i915_gem_object_put(obj);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1785	if (IS_ERR((void *)addr))
				1786	return addr;
				1787
				1788	args->addr_ptr = (uint64_t) addr;
				1789
				1790	return 0;
				1791	}
				1792
Chris Wilson	03af84f	2016-08-18 17:17:01 +0100	[diff] [blame]	1793	static unsigned int tile_row_pages(struct drm_i915_gem_object *obj)
				1794	{
Chris Wilson	6649a0b	2017-01-09 16:16:08 +0000	[diff] [blame]	1795	return i915_gem_object_get_tile_row_size(obj) >> PAGE_SHIFT;
Chris Wilson	03af84f	2016-08-18 17:17:01 +0100	[diff] [blame]	1796	}
				1797
/**
 * i915_gem_mmap_gtt_version - report the current feature set for GTT mmaps
 *
 * A history of the GTT mmap interface:
 *
 * 0 - Everything had to fit into the GTT. Both parties of a memcpy had to
 *     be aligned and suitable for fencing, and still fit into the available
 *     mappable space left by the pinned display objects. A classic problem
 *     we called the page-fault-of-doom where we would ping-pong between
 *     two objects that could not fit inside the GTT and so the memcpy
 *     would page one object in at the expense of the other between every
 *     single byte.
 *
 * 1 - Objects can be any size, and have any compatible fencing (X, Y, or none
 *     as set via i915_gem_set_tiling() [DRM_I915_GEM_SET_TILING]). If the
 *     object is too large for the available space (or simply too large
 *     for the mappable aperture!), a view is created instead and faulted
 *     into userspace. (This view is aligned and sized appropriately for
 *     fenced access.)
 *
 * 2 - Recognise WC as a separate cache domain so that we can flush the
 *     delayed writes via GTT before performing direct access via WC.
 *
 * Restrictions:
 *
 *  * snoopable objects cannot be accessed via the GTT. It can cause machine
 *    hangs on some architectures, corruption on others. An attempt to service
 *    a GTT page fault from a snoopable object will generate a SIGBUS.
 *
 *  * the object must be able to fit into RAM (physical memory, though not
 *    limited to the mappable aperture).
 *
 *
 * Caveats:
 *
 *  * a new GTT page fault will synchronize rendering from the GPU and flush
 *    all data to system memory. Subsequent access will not be synchronized.
 *
 *  * all mappings are revoked on runtime device suspend.
 *
 *  * there are only 8, 16 or 32 fence registers to share between all users
 *    (older machines require fence register for display and blitter access
 *    as well). Contention of the fence registers will cause the previous users
 *    to be unmapped and any new access will generate new page faults.
 *
 *  * running out of memory while servicing a fault may generate a SIGBUS,
 *    rather than the expected SIGSEGV.
 *
 * Return: the number of the most recent entry in the history above.
 */
int i915_gem_mmap_gtt_version(void)
{
	/* Latest revision listed in the interface history. */
	const int version = 2;

	return version;
}
				1850
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1851	static inline struct i915_ggtt_view
				1852	compute_partial_view(struct drm_i915_gem_object *obj,
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1853	pgoff_t page_offset,
				1854	unsigned int chunk)
				1855	{
				1856	struct i915_ggtt_view view;
				1857
				1858	if (i915_gem_object_is_tiled(obj))
				1859	chunk = roundup(chunk, tile_row_pages(obj));
				1860
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1861	view.type = I915_GGTT_VIEW_PARTIAL;
Chris Wilson	8bab1193	2017-01-14 00:28:25 +0000	[diff] [blame]	1862	view.partial.offset = rounddown(page_offset, chunk);
				1863	view.partial.size =
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1864	min_t(unsigned int, chunk,
Chris Wilson	8bab1193	2017-01-14 00:28:25 +0000	[diff] [blame]	1865	(obj->base.size >> PAGE_SHIFT) - view.partial.offset);
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1866
				1867	/* If the partial covers the entire object, just create a normal VMA. */
				1868	if (chunk >= obj->base.size >> PAGE_SHIFT)
				1869	view.type = I915_GGTT_VIEW_NORMAL;
				1870
				1871	return view;
				1872	}
				1873
Chris Wilson	4cc6907	2016-08-25 19:05:19 +0100	[diff] [blame]	1874	/**
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1875	* i915_gem_fault - fault a page into the GTT
Geliang Tang	d9072a3	2015-09-15 05:58:44 -0700	[diff] [blame]	1876	* @vmf: fault info
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1877	*
				1878	* The fault handler is set up by drm_gem_mmap() when a object is GTT mapped
				1879	* from userspace. The fault handler takes care of binding the object to
				1880	* the GTT (if needed), allocating and programming a fence register (again,
				1881	* only if needed based on whether the old reg is still valid or the object
				1882	* is tiled) and inserting a new PTE into the faulting process.
				1883	*
				1884	* Note that the faulting process may involve evicting existing objects
				1885	* from the GTT and/or fence registers to make room. So performance may
				1886	* suffer if the GTT working set is large or there are few fence registers
				1887	* left.
Chris Wilson	4cc6907	2016-08-25 19:05:19 +0100	[diff] [blame]	1888	*
				1889	* The current feature set supported by i915_gem_fault() and thus GTT mmaps
				1890	* is exposed via I915_PARAM_MMAP_GTT_VERSION (see i915_gem_mmap_gtt_version).
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1891	*/
Dave Jiang	11bac80	2017-02-24 14:56:41 -0800	[diff] [blame]	1892	int i915_gem_fault(struct vm_fault *vmf)
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1893	{
Chris Wilson	03af84f	2016-08-18 17:17:01 +0100	[diff] [blame]	1894	#define MIN_CHUNK_PAGES ((1 << 20) >> PAGE_SHIFT) /* 1 MiB */
Dave Jiang	11bac80	2017-02-24 14:56:41 -0800	[diff] [blame]	1895	struct vm_area_struct *area = vmf->vma;
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1896	struct drm_i915_gem_object *obj = to_intel_bo(area->vm_private_data);
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1897	struct drm_device *dev = obj->base.dev;
Joonas Lahtinen	72e96d6	2016-03-30 16:57:10 +0300	[diff] [blame]	1898	struct drm_i915_private *dev_priv = to_i915(dev);
				1899	struct i915_ggtt *ggtt = &dev_priv->ggtt;
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1900	bool write = !!(vmf->flags & FAULT_FLAG_WRITE);
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1901	struct i915_vma *vma;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1902	pgoff_t page_offset;
Chris Wilson	8211887	2016-08-18 17:17:05 +0100	[diff] [blame]	1903	unsigned int flags;
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1904	int ret;
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	1905
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1906	/* We don't use vmf->pgoff since that has the fake offset */
Jan Kara	1a29d85	2016-12-14 15:07:01 -0800	[diff] [blame]	1907	page_offset = (vmf->address - area->vm_start) >> PAGE_SHIFT;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1908
Chris Wilson	db53a30	2011-02-03 11:57:46 +0000	[diff] [blame]	1909	trace_i915_gem_object_fault(obj, page_offset, true, write);
				1910
Chris Wilson	6e4930f	2014-02-07 18:37:06 -0200	[diff] [blame]	1911	/* Try to flush the object off the GPU first without holding the lock.
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1912	* Upon acquiring the lock, we will perform our sanity checks and then
Chris Wilson	6e4930f	2014-02-07 18:37:06 -0200	[diff] [blame]	1913	* repeat the flush holding the lock in the normal manner to catch cases
				1914	* where we are gazumped.
				1915	*/
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	1916	ret = i915_gem_object_wait(obj,
				1917	I915_WAIT_INTERRUPTIBLE,
				1918	MAX_SCHEDULE_TIMEOUT,
				1919	NULL);
Chris Wilson	6e4930f	2014-02-07 18:37:06 -0200	[diff] [blame]	1920	if (ret)
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1921	goto err;
				1922
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1923	ret = i915_gem_object_pin_pages(obj);
				1924	if (ret)
				1925	goto err;
				1926
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1927	intel_runtime_pm_get(dev_priv);
				1928
				1929	ret = i915_mutex_lock_interruptible(dev);
				1930	if (ret)
				1931	goto err_rpm;
Chris Wilson	6e4930f	2014-02-07 18:37:06 -0200	[diff] [blame]	1932
Chris Wilson	eb119bd	2012-12-16 12:43:36 +0000	[diff] [blame]	1933	/* Access to snoopable pages through the GTT is incoherent. */
Tvrtko Ursulin	0031fb9	2016-11-04 14:42:44 +0000	[diff] [blame]	1934	if (obj->cache_level != I915_CACHE_NONE && !HAS_LLC(dev_priv)) {
Chris Wilson	ddeff6e	2014-05-28 16:16:41 +0100	[diff] [blame]	1935	ret = -EFAULT;
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1936	goto err_unlock;
Chris Wilson	eb119bd	2012-12-16 12:43:36 +0000	[diff] [blame]	1937	}
				1938
Chris Wilson	8211887	2016-08-18 17:17:05 +0100	[diff] [blame]	1939	/* If the object is smaller than a couple of partial vma, it is
				1940	* not worth only creating a single partial vma - we may as well
				1941	* clear enough space for the full object.
				1942	*/
				1943	flags = PIN_MAPPABLE;
				1944	if (obj->base.size > 2 * MIN_CHUNK_PAGES << PAGE_SHIFT)
				1945	flags \|= PIN_NONBLOCK \| PIN_NONFAULT;
				1946
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	1947	/* Now pin it into the GTT as needed */
Chris Wilson	8211887	2016-08-18 17:17:05 +0100	[diff] [blame]	1948	vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0, flags);
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	1949	if (IS_ERR(vma)) {
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	1950	/* Use a partial view if it is bigger than available space */
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1951	struct i915_ggtt_view view =
Chris Wilson	8201c1f	2017-01-10 09:56:33 +0000	[diff] [blame]	1952	compute_partial_view(obj, page_offset, MIN_CHUNK_PAGES);
Chris Wilson	aa136d9	2016-08-18 17:17:03 +0100	[diff] [blame]	1953
Chris Wilson	5034924	2016-08-18 17:17:04 +0100	[diff] [blame]	1954	/* Userspace is now writing through an untracked VMA, abandon
				1955	* all hope that the hardware is able to track future writes.
				1956	*/
				1957	obj->frontbuffer_ggtt_origin = ORIGIN_CPU;
				1958
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	1959	vma = i915_gem_object_ggtt_pin(obj, &view, 0, 0, PIN_MAPPABLE);
				1960	}
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1961	if (IS_ERR(vma)) {
				1962	ret = PTR_ERR(vma);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1963	goto err_unlock;
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1964	}
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1965
Chris Wilson	c983930	2012-11-20 10:45:17 +0000	[diff] [blame]	1966	ret = i915_gem_object_set_to_gtt_domain(obj, write);
				1967	if (ret)
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1968	goto err_unpin;
Chris Wilson	c983930	2012-11-20 10:45:17 +0000	[diff] [blame]	1969
Chris Wilson	3bd4073	2017-10-09 09:43:56 +0100	[diff] [blame]	1970	ret = i915_vma_pin_fence(vma);
Chris Wilson	c983930	2012-11-20 10:45:17 +0000	[diff] [blame]	1971	if (ret)
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1972	goto err_unpin;
Chris Wilson	7d1c480	2010-08-07 21:45:03 +0100	[diff] [blame]	1973
Chris Wilson	b90b91d	2014-06-10 12:14:40 +0100	[diff] [blame]	1974	/* Finally, remap it using the new GTT offset */
Chris Wilson	c58305a	2016-08-19 16:54:28 +0100	[diff] [blame]	1975	ret = remap_io_mapping(area,
Chris Wilson	8bab1193	2017-01-14 00:28:25 +0000	[diff] [blame]	1976	area->vm_start + (vma->ggtt_view.partial.offset << PAGE_SHIFT),
Matthew Auld	73ebd50	2017-12-11 15:18:20 +0000	[diff] [blame]	1977	(ggtt->gmadr.start + vma->node.start) >> PAGE_SHIFT,
Chris Wilson	c58305a	2016-08-19 16:54:28 +0100	[diff] [blame]	1978	min_t(u64, vma->size, area->vm_end - area->vm_start),
Matthew Auld	73ebd50	2017-12-11 15:18:20 +0000	[diff] [blame]	1979	&ggtt->iomap);
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	1980	if (ret)
				1981	goto err_fence;
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	1982
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	1983	/* Mark as being mmapped into userspace for later revocation */
				1984	assert_rpm_wakelock_held(dev_priv);
				1985	if (!i915_vma_set_userfault(vma) && !obj->userfault_count++)
				1986	list_add(&obj->userfault_link, &dev_priv->mm.userfault_list);
				1987	GEM_BUG_ON(!obj->userfault_count);
				1988
Chris Wilson	7125397	2017-12-06 12:49:14 +0000	[diff] [blame]	1989	i915_vma_set_ggtt_write(vma);
				1990
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	1991	err_fence:
Chris Wilson	3bd4073	2017-10-09 09:43:56 +0100	[diff] [blame]	1992	i915_vma_unpin_fence(vma);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1993	err_unpin:
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1994	__i915_vma_unpin(vma);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1995	err_unlock:
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1996	mutex_unlock(&dev->struct_mutex);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1997	err_rpm:
				1998	intel_runtime_pm_put(dev_priv);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1999	i915_gem_object_unpin_pages(obj);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2000	err:
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2001	switch (ret) {
Chris Wilson	d9bc7e9	2011-02-07 13:09:31 +0000	[diff] [blame]	2002	case -EIO:
Daniel Vetter	2232f03	2014-09-04 09:36:18 +0200	[diff] [blame]	2003	/*
				2004	* We eat errors when the gpu is terminally wedged to avoid
				2005	* userspace unduly crashing (gl has no provisions for mmaps to
				2006	* fail). But any other -EIO isn't ours (e.g. swap in failure)
				2007	* and so needs to be reported.
				2008	*/
				2009	if (!i915_terminally_wedged(&dev_priv->gpu_error)) {
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	2010	ret = VM_FAULT_SIGBUS;
				2011	break;
				2012	}
Chris Wilson	045e769	2010-11-07 09:18:22 +0000	[diff] [blame]	2013	case -EAGAIN:
Daniel Vetter	571c608	2013-09-12 17:57:28 +0200	[diff] [blame]	2014	/*
				2015	* EAGAIN means the gpu is hung and we'll wait for the error
				2016	* handler to reset everything when re-faulting in
				2017	* i915_mutex_lock_interruptible.
Chris Wilson	d9bc7e9	2011-02-07 13:09:31 +0000	[diff] [blame]	2018	*/
Chris Wilson	c715089	2009-09-23 00:43:56 +0100	[diff] [blame]	2019	case 0:
				2020	case -ERESTARTSYS:
Chris Wilson	bed636a	2011-02-11 20:31:19 +0000	[diff] [blame]	2021	case -EINTR:
Dmitry Rogozhkin	e79e0fe	2012-10-03 17:15:26 +0300	[diff] [blame]	2022	case -EBUSY:
				2023	/*
				2024	* EBUSY is ok: this just means that another thread
				2025	* already did the job.
				2026	*/
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	2027	ret = VM_FAULT_NOPAGE;
				2028	break;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2029	case -ENOMEM:
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	2030	ret = VM_FAULT_OOM;
				2031	break;
Daniel Vetter	a7c2e1a	2012-10-17 11:17:16 +0200	[diff] [blame]	2032	case -ENOSPC:
Chris Wilson	45d6781	2014-01-31 11:34:57 +0000	[diff] [blame]	2033	case -EFAULT:
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	2034	ret = VM_FAULT_SIGBUS;
				2035	break;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2036	default:
Daniel Vetter	a7c2e1a	2012-10-17 11:17:16 +0200	[diff] [blame]	2037	WARN_ONCE(ret, "unhandled error in i915_gem_fault: %i\n", ret);
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	2038	ret = VM_FAULT_SIGBUS;
				2039	break;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2040	}
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	2041	return ret;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2042	}
				2043
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2044	static void __i915_gem_object_release_mmap(struct drm_i915_gem_object *obj)
				2045	{
				2046	struct i915_vma *vma;
				2047
				2048	GEM_BUG_ON(!obj->userfault_count);
				2049
				2050	obj->userfault_count = 0;
				2051	list_del(&obj->userfault_link);
				2052	drm_vma_node_unmap(&obj->base.vma_node,
				2053	obj->base.dev->anon_inode->i_mapping);
				2054
Chris Wilson	e2189dd	2017-12-07 21:14:07 +0000	[diff] [blame]	2055	for_each_ggtt_vma(vma, obj)
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2056	i915_vma_unset_userfault(vma);
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2057	}
				2058
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2059	/**
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2060	* i915_gem_release_mmap - remove physical page mappings
				2061	* @obj: obj in question
				2062	*
André Goddard Rosa	af901ca	2009-11-14 13:09:05 -0200	[diff] [blame]	2063	* Preserve the reservation of the mmapping with the DRM core code, but
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2064	* relinquish ownership of the pages back to the system.
				2065	*
				2066	* It is vital that we remove the page mapping if we have mapped a tiled
				2067	* object through the GTT and then lose the fence register due to
				2068	* resource pressure. Similarly if the object has been moved out of the
				2069	* aperture, than pages mapped into userspace must be revoked. Removing the
				2070	* mapping will then trigger a page fault on the next user access, allowing
				2071	* fixup by i915_gem_fault().
				2072	*/
Eric Anholt	d05ca30	2009-07-10 13:02:26 -0700	[diff] [blame]	2073	void
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	2074	i915_gem_release_mmap(struct drm_i915_gem_object *obj)
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2075	{
Chris Wilson	275f039	2016-10-24 13:42:14 +0100	[diff] [blame]	2076	struct drm_i915_private *i915 = to_i915(obj->base.dev);
Chris Wilson	275f039	2016-10-24 13:42:14 +0100	[diff] [blame]	2077
Chris Wilson	349f2cc	2016-04-13 17:35:12 +0100	[diff] [blame]	2078	/* Serialisation between user GTT access and our code depends upon
				2079	* revoking the CPU's PTE whilst the mutex is held. The next user
				2080	* pagefault then has to wait until we release the mutex.
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	2081	*
				2082	* Note that RPM complicates somewhat by adding an additional
				2083	* requirement that operations to the GGTT be made holding the RPM
				2084	* wakeref.
Chris Wilson	349f2cc	2016-04-13 17:35:12 +0100	[diff] [blame]	2085	*/
Chris Wilson	275f039	2016-10-24 13:42:14 +0100	[diff] [blame]	2086	lockdep_assert_held(&i915->drm.struct_mutex);
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	2087	intel_runtime_pm_get(i915);
Chris Wilson	349f2cc	2016-04-13 17:35:12 +0100	[diff] [blame]	2088
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2089	if (!obj->userfault_count)
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	2090	goto out;
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2091
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2092	__i915_gem_object_release_mmap(obj);
Chris Wilson	349f2cc	2016-04-13 17:35:12 +0100	[diff] [blame]	2093
				2094	/* Ensure that the CPU's PTE are revoked and there are not outstanding
				2095	* memory transactions from userspace before we return. The TLB
				2096	* flushing implied above by changing the PTE above should be
				2097	* sufficient, an extra barrier here just provides us with a bit
				2098	* of paranoid documentation about our requirement to serialise
				2099	* memory writes before touching registers / GSM.
				2100	*/
				2101	wmb();
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	2102
				2103	out:
				2104	intel_runtime_pm_put(i915);
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2105	}
				2106
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2107	void i915_gem_runtime_suspend(struct drm_i915_private *dev_priv)
Chris Wilson	eedd10f	2014-06-16 08:57:44 +0100	[diff] [blame]	2108	{
Chris Wilson	3594a3e	2016-10-24 13:42:16 +0100	[diff] [blame]	2109	struct drm_i915_gem_object obj, on;
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2110	int i;
Chris Wilson	eedd10f	2014-06-16 08:57:44 +0100	[diff] [blame]	2111
Chris Wilson	3594a3e	2016-10-24 13:42:16 +0100	[diff] [blame]	2112	/*
				2113	* Only called during RPM suspend. All users of the userfault_list
				2114	* must be holding an RPM wakeref to ensure that this can not
				2115	* run concurrently with themselves (and use the struct_mutex for
				2116	* protection between themselves).
				2117	*/
				2118
				2119	list_for_each_entry_safe(obj, on,
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2120	&dev_priv->mm.userfault_list, userfault_link)
				2121	__i915_gem_object_release_mmap(obj);
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2122
				2123	/* The fence will be lost when the device powers down. If any were
				2124	* in use by hardware (i.e. they are pinned), we should not be powering
				2125	* down! All other fences will be reacquired by the user upon waking.
				2126	*/
				2127	for (i = 0; i < dev_priv->num_fence_regs; i++) {
				2128	struct drm_i915_fence_reg *reg = &dev_priv->fence_regs[i];
				2129
Chris Wilson	e0ec3ec	2017-02-03 12:57:17 +0000	[diff] [blame]	2130	/* Ideally we want to assert that the fence register is not
				2131	* live at this point (i.e. that no piece of code will be
				2132	* trying to write through fence + GTT, as that both violates
				2133	* our tracking of activity and associated locking/barriers,
				2134	* but also is illegal given that the hw is powered down).
				2135	*
				2136	* Previously we used reg->pin_count as a "liveness" indicator.
				2137	* That is not sufficient, and we need a more fine-grained
				2138	* tool if we want to have a sanity check here.
				2139	*/
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2140
				2141	if (!reg->vma)
				2142	continue;
				2143
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2144	GEM_BUG_ON(i915_vma_has_userfault(reg->vma));
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2145	reg->dirty = true;
				2146	}
Chris Wilson	eedd10f	2014-06-16 08:57:44 +0100	[diff] [blame]	2147	}
				2148
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2149	static int i915_gem_object_create_mmap_offset(struct drm_i915_gem_object *obj)
				2150	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	2151	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2152	int err;
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2153
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2154	err = drm_gem_create_mmap_offset(&obj->base);
Chris Wilson	b42a13d	2017-01-06 15:22:40 +0000	[diff] [blame]	2155	if (likely(!err))
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2156	return 0;
Daniel Vetter	da494d7	2012-12-20 15:11:16 +0100	[diff] [blame]	2157
Chris Wilson	b42a13d	2017-01-06 15:22:40 +0000	[diff] [blame]	2158	/* Attempt to reap some mmap space from dead objects */
				2159	do {
				2160	err = i915_gem_wait_for_idle(dev_priv, I915_WAIT_INTERRUPTIBLE);
				2161	if (err)
				2162	break;
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2163
Chris Wilson	b42a13d	2017-01-06 15:22:40 +0000	[diff] [blame]	2164	i915_gem_drain_freed_objects(dev_priv);
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2165	err = drm_gem_create_mmap_offset(&obj->base);
Chris Wilson	b42a13d	2017-01-06 15:22:40 +0000	[diff] [blame]	2166	if (!err)
				2167	break;
				2168
				2169	} while (flush_delayed_work(&dev_priv->gt.retire_work));
Daniel Vetter	da494d7	2012-12-20 15:11:16 +0100	[diff] [blame]	2170
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2171	return err;
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2172	}
				2173
				2174	static void i915_gem_object_free_mmap_offset(struct drm_i915_gem_object *obj)
				2175	{
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2176	drm_gem_free_mmap_offset(&obj->base);
				2177	}
				2178
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	2179	int
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	2180	i915_gem_mmap_gtt(struct drm_file *file,
				2181	struct drm_device *dev,
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	2182	uint32_t handle,
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	2183	uint64_t *offset)
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2184	{
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	2185	struct drm_i915_gem_object *obj;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2186	int ret;
				2187
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	2188	obj = i915_gem_object_lookup(file, handle);
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2189	if (!obj)
				2190	return -ENOENT;
Chris Wilson	ab18282	2009-09-22 18:46:17 +0100	[diff] [blame]	2191
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2192	ret = i915_gem_object_create_mmap_offset(obj);
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2193	if (ret == 0)
				2194	*offset = drm_vma_node_offset_addr(&obj->base.vma_node);
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2195
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	2196	i915_gem_object_put(obj);
Chris Wilson	1d7cfea	2010-10-17 09:45:41 +0100	[diff] [blame]	2197	return ret;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2198	}
				2199
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	2200	/**
				2201	* i915_gem_mmap_gtt_ioctl - prepare an object for GTT mmap'ing
				2202	* @dev: DRM device
				2203	* @data: GTT mapping ioctl data
				2204	* @file: GEM object info
				2205	*
				2206	* Simply returns the fake offset to userspace so it can mmap it.
				2207	* The mmap call will end up in drm_gem_mmap(), which will set things
				2208	* up so we can get faults in the handler above.
				2209	*
				2210	* The fault handler will take care of binding the object into the GTT
				2211	* (since it may have been evicted to make room for something), allocating
				2212	* a fence register, and mapping the appropriate aperture address into
				2213	* userspace.
				2214	*/
				2215	int
				2216	i915_gem_mmap_gtt_ioctl(struct drm_device dev, void data,
				2217	struct drm_file *file)
				2218	{
				2219	struct drm_i915_gem_mmap_gtt *args = data;
				2220
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	2221	return i915_gem_mmap_gtt(file, dev, args->handle, &args->offset);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	2222	}
				2223
Daniel Vetter	225067e	2012-08-20 10:23:20 +0200	[diff] [blame]	2224	/* Immediately discard the backing storage */
				2225	static void
				2226	i915_gem_object_truncate(struct drm_i915_gem_object *obj)
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2227	{
Chris Wilson	4d6294bf	2012-08-11 15:41:05 +0100	[diff] [blame]	2228	i915_gem_object_free_mmap_offset(obj);
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	2229
Chris Wilson	4d6294bf	2012-08-11 15:41:05 +0100	[diff] [blame]	2230	if (obj->base.filp == NULL)
				2231	return;
				2232
Daniel Vetter	225067e	2012-08-20 10:23:20 +0200	[diff] [blame]	2233	/* Our goal here is to return as much of the memory as
				2234	* is possible back to the system as we are called from OOM.
				2235	* To do this we must instruct the shmfs to drop all of its
				2236	* backing pages, now.
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2237	*/
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2238	shmem_truncate_range(file_inode(obj->base.filp), 0, (loff_t)-1);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2239	obj->mm.madv = __I915_MADV_PURGED;
Chris Wilson	4e5462e	2017-03-07 13:20:31 +0000	[diff] [blame]	2240	obj->mm.pages = ERR_PTR(-EFAULT);
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2241	}
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2242
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2243	/* Try to discard unwanted pages */
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2244	void __i915_gem_object_invalidate(struct drm_i915_gem_object *obj)
Daniel Vetter	225067e	2012-08-20 10:23:20 +0200	[diff] [blame]	2245	{
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2246	struct address_space *mapping;
				2247
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2248	lockdep_assert_held(&obj->mm.lock);
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2249	GEM_BUG_ON(i915_gem_object_has_pages(obj));
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2250
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2251	switch (obj->mm.madv) {
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2252	case I915_MADV_DONTNEED:
				2253	i915_gem_object_truncate(obj);
				2254	case __I915_MADV_PURGED:
				2255	return;
				2256	}
				2257
				2258	if (obj->base.filp == NULL)
				2259	return;
				2260
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	2261	mapping = obj->base.filp->f_mapping,
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2262	invalidate_mapping_pages(mapping, 0, (loff_t)-1);
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2263	}
				2264
Chris Wilson	5cdf588	2010-09-27 15:51:07 +0100	[diff] [blame]	2265	static void
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2266	i915_gem_object_put_pages_gtt(struct drm_i915_gem_object *obj,
				2267	struct sg_table *pages)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2268	{
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2269	struct sgt_iter sgt_iter;
				2270	struct page *page;
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	2271
Chris Wilson	e5facdf	2016-12-23 14:57:57 +0000	[diff] [blame]	2272	__i915_gem_object_release_shmem(obj, pages, true);
Eric Anholt	856fa19	2009-03-19 14:10:50 -0700	[diff] [blame]	2273
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2274	i915_gem_gtt_finish_pages(obj, pages);
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2275
Daniel Vetter	6dacfd2	2011-09-12 21:30:02 +0200	[diff] [blame]	2276	if (i915_gem_object_needs_bit17_swizzle(obj))
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2277	i915_gem_object_save_bit_17_swizzle(obj, pages);
Eric Anholt	280b713	2009-03-12 16:56:27 -0700	[diff] [blame]	2278
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2279	for_each_sgt_page(page, sgt_iter, pages) {
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2280	if (obj->mm.dirty)
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2281	set_page_dirty(page);
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	2282
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2283	if (obj->mm.madv == I915_MADV_WILLNEED)
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2284	mark_page_accessed(page);
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	2285
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	2286	put_page(page);
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	2287	}
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2288	obj->mm.dirty = false;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2289
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2290	sg_free_table(pages);
				2291	kfree(pages);
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2292	}
				2293
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	2294	static void __i915_gem_object_reset_page_iter(struct drm_i915_gem_object *obj)
				2295	{
				2296	struct radix_tree_iter iter;
Ville Syrjälä	c23aa71	2017-09-01 20:12:51 +0300	[diff] [blame]	2297	void __rcu **slot;
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	2298
Chris Wilson	bea6e98	2017-10-26 14:00:31 +0100	[diff] [blame]	2299	rcu_read_lock();
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2300	radix_tree_for_each_slot(slot, &obj->mm.get_page.radix, &iter, 0)
				2301	radix_tree_delete(&obj->mm.get_page.radix, iter.index);
Chris Wilson	bea6e98	2017-10-26 14:00:31 +0100	[diff] [blame]	2302	rcu_read_unlock();
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	2303	}
				2304
Chris Wilson	548625e	2016-11-01 12:11:34 +0000	[diff] [blame]	2305	void __i915_gem_object_put_pages(struct drm_i915_gem_object *obj,
				2306	enum i915_mm_subclass subclass)
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2307	{
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	2308	struct drm_i915_private *i915 = to_i915(obj->base.dev);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2309	struct sg_table *pages;
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2310
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2311	if (i915_gem_object_has_pinned_pages(obj))
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2312	return;
Chris Wilson	a557017	2012-09-04 21:02:54 +0100	[diff] [blame]	2313
Chris Wilson	15717de	2016-08-04 07:52:26 +0100	[diff] [blame]	2314	GEM_BUG_ON(obj->bind_count);
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2315	if (!i915_gem_object_has_pages(obj))
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2316	return;
				2317
				2318	/* May be called by shrinker from within get_pages() (on another bo) */
Chris Wilson	548625e	2016-11-01 12:11:34 +0000	[diff] [blame]	2319	mutex_lock_nested(&obj->mm.lock, subclass);
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2320	if (unlikely(atomic_read(&obj->mm.pages_pin_count)))
				2321	goto unlock;
Ben Widawsky	3e12302	2013-07-31 17:00:04 -0700	[diff] [blame]	2322
Chris Wilson	a2165e3	2012-12-03 11:49:00 +0000	[diff] [blame]	2323	/* ->put_pages might need to allocate memory for the bit17 swizzle
				2324	* array, hence protect them from being reaped by removing them from gtt
				2325	* lists early. */
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2326	pages = fetch_and_zero(&obj->mm.pages);
				2327	GEM_BUG_ON(!pages);
Chris Wilson	a2165e3	2012-12-03 11:49:00 +0000	[diff] [blame]	2328
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	2329	spin_lock(&i915->mm.obj_lock);
				2330	list_del(&obj->mm.link);
				2331	spin_unlock(&i915->mm.obj_lock);
				2332
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2333	if (obj->mm.mapping) {
Chris Wilson	4b30cb2	2016-08-18 17:16:42 +0100	[diff] [blame]	2334	void *ptr;
				2335
Chris Wilson	0ce8178	2017-05-17 13:09:59 +0100	[diff] [blame]	2336	ptr = page_mask_bits(obj->mm.mapping);
Chris Wilson	4b30cb2	2016-08-18 17:16:42 +0100	[diff] [blame]	2337	if (is_vmalloc_addr(ptr))
				2338	vunmap(ptr);
Chris Wilson	fb8621d	2016-04-08 12:11:14 +0100	[diff] [blame]	2339	else
Chris Wilson	4b30cb2	2016-08-18 17:16:42 +0100	[diff] [blame]	2340	kunmap(kmap_to_page(ptr));
				2341
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2342	obj->mm.mapping = NULL;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2343	}
				2344
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	2345	__i915_gem_object_reset_page_iter(obj);
				2346
Chris Wilson	4e5462e	2017-03-07 13:20:31 +0000	[diff] [blame]	2347	if (!IS_ERR(pages))
				2348	obj->ops->put_pages(obj, pages);
				2349
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2350	obj->mm.page_sizes.phys = obj->mm.page_sizes.sg = 0;
				2351
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2352	unlock:
				2353	mutex_unlock(&obj->mm.lock);
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2354	}
				2355
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	2356	static bool i915_sg_trim(struct sg_table *orig_st)
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2357	{
				2358	struct sg_table new_st;
				2359	struct scatterlist sg, new_sg;
				2360	unsigned int i;
				2361
				2362	if (orig_st->nents == orig_st->orig_nents)
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	2363	return false;
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2364
Chris Wilson	8bfc478f	2016-12-23 14:57:58 +0000	[diff] [blame]	2365	if (sg_alloc_table(&new_st, orig_st->nents, GFP_KERNEL \| __GFP_NOWARN))
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	2366	return false;
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2367
				2368	new_sg = new_st.sgl;
				2369	for_each_sg(orig_st->sgl, sg, orig_st->nents, i) {
				2370	sg_set_page(new_sg, sg_page(sg), sg->length, 0);
				2371	/* called before being DMA mapped, no need to copy sg->dma_* */
				2372	new_sg = sg_next(new_sg);
				2373	}
Chris Wilson	c2dc6cc	2016-12-19 12:43:46 +0000	[diff] [blame]	2374	GEM_BUG_ON(new_sg); /* Should walk exactly nents and hit the end */
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2375
				2376	sg_free_table(orig_st);
				2377
				2378	*orig_st = new_st;
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	2379	return true;
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2380	}
				2381
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2382	static int i915_gem_object_get_pages_gtt(struct drm_i915_gem_object *obj)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2383	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	2384	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
Chris Wilson	d766ef5	2016-12-19 12:43:45 +0000	[diff] [blame]	2385	const unsigned long page_count = obj->base.size / PAGE_SIZE;
				2386	unsigned long i;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2387	struct address_space *mapping;
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2388	struct sg_table *st;
				2389	struct scatterlist *sg;
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2390	struct sgt_iter sgt_iter;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2391	struct page *page;
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2392	unsigned long last_pfn = 0; /* suppress gcc warning */
Tvrtko Ursulin	5602452	2017-08-03 10:14:17 +0100	[diff] [blame]	2393	unsigned int max_segment = i915_sg_segment_size();
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2394	unsigned int sg_page_sizes;
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2395	gfp_t noreclaim;
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2396	int ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2397
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2398	/* Assert that the object is not currently in any GPU domain. As it
				2399	* wasn't in the GTT, there shouldn't be any way it could have been in
				2400	* a GPU cache
				2401	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	2402	GEM_BUG_ON(obj->read_domains & I915_GEM_GPU_DOMAINS);
				2403	GEM_BUG_ON(obj->write_domain & I915_GEM_GPU_DOMAINS);
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2404
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2405	st = kmalloc(sizeof(*st), GFP_KERNEL);
				2406	if (st == NULL)
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2407	return -ENOMEM;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2408
Chris Wilson	d766ef5	2016-12-19 12:43:45 +0000	[diff] [blame]	2409	rebuild_st:
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2410	if (sg_alloc_table(st, page_count, GFP_KERNEL)) {
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2411	kfree(st);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2412	return -ENOMEM;
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2413	}
				2414
				2415	/* Get the list of pages out of our struct file. They'll be pinned
				2416	* at this point until we release them.
				2417	*
				2418	* Fail silently without starting the shrinker
				2419	*/
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	2420	mapping = obj->base.filp->f_mapping;
Chris Wilson	0f6ab55	2017-06-09 12:03:48 +0100	[diff] [blame]	2421	noreclaim = mapping_gfp_constraint(mapping, ~__GFP_RECLAIM);
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2422	noreclaim \|= __GFP_NORETRY \| __GFP_NOWARN;
				2423
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2424	sg = st->sgl;
				2425	st->nents = 0;
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2426	sg_page_sizes = 0;
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2427	for (i = 0; i < page_count; i++) {
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2428	const unsigned int shrink[] = {
				2429	I915_SHRINK_BOUND \| I915_SHRINK_UNBOUND \| I915_SHRINK_PURGEABLE,
				2430	0,
				2431	}, *s = shrink;
				2432	gfp_t gfp = noreclaim;
				2433
				2434	do {
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2435	page = shmem_read_mapping_page_gfp(mapping, i, gfp);
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2436	if (likely(!IS_ERR(page)))
				2437	break;
				2438
				2439	if (!*s) {
				2440	ret = PTR_ERR(page);
				2441	goto err_sg;
				2442	}
				2443
Chris Wilson	912d572	2017-09-06 16:19:30 -0700	[diff] [blame]	2444	i915_gem_shrink(dev_priv, 2 * page_count, NULL, *s++);
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2445	cond_resched();
Chris Wilson	24f8e00	2017-03-22 11:05:21 +0000	[diff] [blame]	2446
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2447	/* We've tried hard to allocate the memory by reaping
				2448	* our own buffer, now let the real VM do its job and
				2449	* go down in flames if truly OOM.
Chris Wilson	24f8e00	2017-03-22 11:05:21 +0000	[diff] [blame]	2450	*
				2451	* However, since graphics tend to be disposable,
				2452	* defer the oom here by reporting the ENOMEM back
				2453	* to userspace.
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2454	*/
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2455	if (!*s) {
				2456	/* reclaim and warn, but no oom */
				2457	gfp = mapping_gfp_mask(mapping);
Chris Wilson	eaf4180	2017-06-09 12:03:47 +0100	[diff] [blame]	2458
				2459	/* Our bo are always dirty and so we require
				2460	* kswapd to reclaim our pages (direct reclaim
				2461	* does not effectively begin pageout of our
				2462	* buffers on its own). However, direct reclaim
				2463	* only waits for kswapd when under allocation
				2464	* congestion. So as a result __GFP_RECLAIM is
				2465	* unreliable and fails to actually reclaim our
				2466	* dirty pages -- unless you try over and over
				2467	* again with !__GFP_NORETRY. However, we still
				2468	* want to fail this allocation rather than
				2469	* trigger the out-of-memory killer and for
Michal Hocko	dbb3295	2017-07-12 14:36:55 -0700	[diff] [blame]	2470	* this we want __GFP_RETRY_MAYFAIL.
Chris Wilson	eaf4180	2017-06-09 12:03:47 +0100	[diff] [blame]	2471	*/
Michal Hocko	dbb3295	2017-07-12 14:36:55 -0700	[diff] [blame]	2472	gfp \|= __GFP_RETRY_MAYFAIL;
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2473	}
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2474	} while (1);
				2475
Chris Wilson	871dfbd	2016-10-11 09:20:21 +0100	[diff] [blame]	2476	if (!i \|\|
				2477	sg->length >= max_segment \|\|
				2478	page_to_pfn(page) != last_pfn + 1) {
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2479	if (i) {
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2480	sg_page_sizes \|= sg->length;
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2481	sg = sg_next(sg);
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2482	}
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2483	st->nents++;
				2484	sg_set_page(sg, page, PAGE_SIZE, 0);
				2485	} else {
				2486	sg->length += PAGE_SIZE;
				2487	}
				2488	last_pfn = page_to_pfn(page);
Daniel Vetter	3bbbe70	2013-10-07 17:15:45 -0300	[diff] [blame]	2489
				2490	/* Check that the i965g/gm workaround works. */
				2491	WARN_ON((gfp & __GFP_DMA32) && (last_pfn >= 0x00100000UL));
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2492	}
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2493	if (sg) { /* loop terminated early; short sg table */
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2494	sg_page_sizes \|= sg->length;
Konrad Rzeszutek Wilk	426729d	2013-06-24 11:47:48 -0400	[diff] [blame]	2495	sg_mark_end(sg);
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2496	}
Chris Wilson	74ce6b6	2012-10-19 15:51:06 +0100	[diff] [blame]	2497
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2498	/* Trim unused sg entries to avoid wasting memory. */
				2499	i915_sg_trim(st);
				2500
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2501	ret = i915_gem_gtt_prepare_pages(obj, st);
Chris Wilson	d766ef5	2016-12-19 12:43:45 +0000	[diff] [blame]	2502	if (ret) {
				2503	/* DMA remapping failed? One possible cause is that
				2504	* it could not reserve enough large entries, asking
				2505	* for PAGE_SIZE chunks instead may be helpful.
				2506	*/
				2507	if (max_segment > PAGE_SIZE) {
				2508	for_each_sgt_page(page, sgt_iter, st)
				2509	put_page(page);
				2510	sg_free_table(st);
				2511
				2512	max_segment = PAGE_SIZE;
				2513	goto rebuild_st;
				2514	} else {
				2515	dev_warn(&dev_priv->drm.pdev->dev,
				2516	"Failed to DMA remap %lu pages\n",
				2517	page_count);
				2518	goto err_pages;
				2519	}
				2520	}
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2521
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2522	if (i915_gem_object_needs_bit17_swizzle(obj))
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2523	i915_gem_object_do_bit_17_swizzle(obj, st);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2524
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2525	__i915_gem_object_set_pages(obj, st, sg_page_sizes);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2526
				2527	return 0;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2528
Chris Wilson	b17993b	2016-11-14 11:29:30 +0000	[diff] [blame]	2529	err_sg:
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2530	sg_mark_end(sg);
Chris Wilson	b17993b	2016-11-14 11:29:30 +0000	[diff] [blame]	2531	err_pages:
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2532	for_each_sgt_page(page, sgt_iter, st)
				2533	put_page(page);
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2534	sg_free_table(st);
				2535	kfree(st);
Chris Wilson	0820baf	2014-03-25 13:23:03 +0000	[diff] [blame]	2536
				2537	/* shmemfs first checks if there is enough memory to allocate the page
				2538	* and reports ENOSPC should there be insufficient, along with the usual
				2539	* ENOMEM for a genuine allocation failure.
				2540	*
				2541	* We use ENOSPC in our driver to mean that we have run out of aperture
				2542	* space and so want to translate the error from shmemfs back to our
				2543	* usual understanding of ENOMEM.
				2544	*/
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2545	if (ret == -ENOSPC)
				2546	ret = -ENOMEM;
				2547
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2548	return ret;
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2549	}
				2550
				2551	void __i915_gem_object_set_pages(struct drm_i915_gem_object *obj,
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2552	struct sg_table *pages,
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2553	unsigned int sg_page_sizes)
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2554	{
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2555	struct drm_i915_private *i915 = to_i915(obj->base.dev);
				2556	unsigned long supported = INTEL_INFO(i915)->page_sizes;
				2557	int i;
				2558
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2559	lockdep_assert_held(&obj->mm.lock);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2560
				2561	obj->mm.get_page.sg_pos = pages->sgl;
				2562	obj->mm.get_page.sg_idx = 0;
				2563
				2564	obj->mm.pages = pages;
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2565
				2566	if (i915_gem_object_is_tiled(obj) &&
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	2567	i915->quirks & QUIRK_PIN_SWIZZLED_PAGES) {
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2568	GEM_BUG_ON(obj->mm.quirked);
				2569	__i915_gem_object_pin_pages(obj);
				2570	obj->mm.quirked = true;
				2571	}
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2572
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2573	GEM_BUG_ON(!sg_page_sizes);
				2574	obj->mm.page_sizes.phys = sg_page_sizes;
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2575
				2576	/*
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2577	* Calculate the supported page-sizes which fit into the given
				2578	* sg_page_sizes. This will give us the page-sizes which we may be able
				2579	* to use opportunistically when later inserting into the GTT. For
				2580	* example if phys=2G, then in theory we should be able to use 1G, 2M,
				2581	* 64K or 4K pages, although in practice this will depend on a number of
				2582	* other factors.
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2583	*/
				2584	obj->mm.page_sizes.sg = 0;
				2585	for_each_set_bit(i, &supported, ilog2(I915_GTT_MAX_PAGE_SIZE) + 1) {
				2586	if (obj->mm.page_sizes.phys & ~0u << i)
				2587	obj->mm.page_sizes.sg \|= BIT(i);
				2588	}
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2589	GEM_BUG_ON(!HAS_PAGE_SIZES(i915, obj->mm.page_sizes.sg));
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	2590
				2591	spin_lock(&i915->mm.obj_lock);
				2592	list_add(&obj->mm.link, &i915->mm.unbound_list);
				2593	spin_unlock(&i915->mm.obj_lock);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2594	}
				2595
				2596	static int ____i915_gem_object_get_pages(struct drm_i915_gem_object *obj)
				2597	{
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2598	int err;
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2599
				2600	if (unlikely(obj->mm.madv != I915_MADV_WILLNEED)) {
				2601	DRM_DEBUG("Attempting to obtain a purgeable object\n");
				2602	return -EFAULT;
				2603	}
				2604
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2605	err = obj->ops->get_pages(obj);
Matthew Auld	b65a9b9	2017-12-18 10:38:55 +0000	[diff] [blame]	2606	GEM_BUG_ON(!err && !i915_gem_object_has_pages(obj));
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2607
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2608	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2609	}
				2610
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2611	/* Ensure that the associated pages are gathered from the backing storage
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2612	* and pinned into our object. i915_gem_object_pin_pages() may be called
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2613	* multiple times before they are released by a single call to
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2614	* i915_gem_object_unpin_pages() - once the pages are no longer referenced
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2615	* either as a result of memory pressure (reaping pages under the shrinker)
				2616	* or as the object is itself released.
				2617	*/
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2618	int __i915_gem_object_get_pages(struct drm_i915_gem_object *obj)
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2619	{
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2620	int err;
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2621
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2622	err = mutex_lock_interruptible(&obj->mm.lock);
				2623	if (err)
				2624	return err;
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	2625
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2626	if (unlikely(!i915_gem_object_has_pages(obj))) {
Chris Wilson	88c880b	2017-09-06 14:52:20 +0100	[diff] [blame]	2627	GEM_BUG_ON(i915_gem_object_has_pinned_pages(obj));
				2628
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2629	err = ____i915_gem_object_get_pages(obj);
				2630	if (err)
				2631	goto unlock;
				2632
				2633	smp_mb__before_atomic();
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2634	}
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2635	atomic_inc(&obj->mm.pages_pin_count);
Chris Wilson	43e28f0	2013-01-08 10:53:09 +0000	[diff] [blame]	2636
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2637	unlock:
				2638	mutex_unlock(&obj->mm.lock);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2639	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2640	}
				2641
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2642	/* The 'mapping' part of i915_gem_object_pin_map() below */
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2643	static void i915_gem_object_map(const struct drm_i915_gem_object obj,
				2644	enum i915_map_type type)
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2645	{
				2646	unsigned long n_pages = obj->base.size >> PAGE_SHIFT;
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2647	struct sg_table *sgt = obj->mm.pages;
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2648	struct sgt_iter sgt_iter;
				2649	struct page *page;
Dave Gordon	b338fa4	2016-05-20 11:54:05 +0100	[diff] [blame]	2650	struct page *stack_pages[32];
				2651	struct page **pages = stack_pages;
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2652	unsigned long i = 0;
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2653	pgprot_t pgprot;
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2654	void *addr;
				2655
				2656	/* A single page can always be kmapped */
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2657	if (n_pages == 1 && type == I915_MAP_WB)
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2658	return kmap(sg_page(sgt->sgl));
				2659
Dave Gordon	b338fa4	2016-05-20 11:54:05 +0100	[diff] [blame]	2660	if (n_pages > ARRAY_SIZE(stack_pages)) {
				2661	/* Too big for stack -- allocate temporary array instead */
Michal Hocko	0ee931c	2017-09-13 16:28:29 -0700	[diff] [blame]	2662	pages = kvmalloc_array(n_pages, sizeof(*pages), GFP_KERNEL);
Dave Gordon	b338fa4	2016-05-20 11:54:05 +0100	[diff] [blame]	2663	if (!pages)
				2664	return NULL;
				2665	}
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2666
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2667	for_each_sgt_page(page, sgt_iter, sgt)
				2668	pages[i++] = page;
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2669
				2670	/* Check that we have the expected number of pages */
				2671	GEM_BUG_ON(i != n_pages);
				2672
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2673	switch (type) {
Chris Wilson	a575c67	2017-08-28 11:46:31 +0100	[diff] [blame]	2674	default:
				2675	MISSING_CASE(type);
				2676	/* fallthrough to use PAGE_KERNEL anyway */
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2677	case I915_MAP_WB:
				2678	pgprot = PAGE_KERNEL;
				2679	break;
				2680	case I915_MAP_WC:
				2681	pgprot = pgprot_writecombine(PAGE_KERNEL_IO);
				2682	break;
				2683	}
				2684	addr = vmap(pages, n_pages, 0, pgprot);
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2685
Dave Gordon	b338fa4	2016-05-20 11:54:05 +0100	[diff] [blame]	2686	if (pages != stack_pages)
Michal Hocko	2098105	2017-05-17 14:23:12 +0200	[diff] [blame]	2687	kvfree(pages);
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2688
				2689	return addr;
				2690	}
				2691
				2692	/* get, pin, and map the pages of the object into kernel space */
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2693	void i915_gem_object_pin_map(struct drm_i915_gem_object obj,
				2694	enum i915_map_type type)
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2695	{
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2696	enum i915_map_type has_type;
				2697	bool pinned;
				2698	void *ptr;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2699	int ret;
				2700
Tina Zhang	a03f395	2017-11-14 10:25:13 +0000	[diff] [blame]	2701	if (unlikely(!i915_gem_object_has_struct_page(obj)))
				2702	return ERR_PTR(-ENXIO);
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2703
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2704	ret = mutex_lock_interruptible(&obj->mm.lock);
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2705	if (ret)
				2706	return ERR_PTR(ret);
				2707
Chris Wilson	a575c67	2017-08-28 11:46:31 +0100	[diff] [blame]	2708	pinned = !(type & I915_MAP_OVERRIDE);
				2709	type &= ~I915_MAP_OVERRIDE;
				2710
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2711	if (!atomic_inc_not_zero(&obj->mm.pages_pin_count)) {
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2712	if (unlikely(!i915_gem_object_has_pages(obj))) {
Chris Wilson	88c880b	2017-09-06 14:52:20 +0100	[diff] [blame]	2713	GEM_BUG_ON(i915_gem_object_has_pinned_pages(obj));
				2714
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2715	ret = ____i915_gem_object_get_pages(obj);
				2716	if (ret)
				2717	goto err_unlock;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2718
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2719	smp_mb__before_atomic();
				2720	}
				2721	atomic_inc(&obj->mm.pages_pin_count);
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2722	pinned = false;
				2723	}
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2724	GEM_BUG_ON(!i915_gem_object_has_pages(obj));
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2725
Chris Wilson	0ce8178	2017-05-17 13:09:59 +0100	[diff] [blame]	2726	ptr = page_unpack_bits(obj->mm.mapping, &has_type);
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2727	if (ptr && has_type != type) {
				2728	if (pinned) {
				2729	ret = -EBUSY;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2730	goto err_unpin;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2731	}
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2732
				2733	if (is_vmalloc_addr(ptr))
				2734	vunmap(ptr);
				2735	else
				2736	kunmap(kmap_to_page(ptr));
				2737
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2738	ptr = obj->mm.mapping = NULL;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2739	}
				2740
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2741	if (!ptr) {
				2742	ptr = i915_gem_object_map(obj, type);
				2743	if (!ptr) {
				2744	ret = -ENOMEM;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2745	goto err_unpin;
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2746	}
				2747
Chris Wilson	0ce8178	2017-05-17 13:09:59 +0100	[diff] [blame]	2748	obj->mm.mapping = page_pack_bits(ptr, type);
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2749	}
				2750
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2751	out_unlock:
				2752	mutex_unlock(&obj->mm.lock);
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2753	return ptr;
				2754
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2755	err_unpin:
				2756	atomic_dec(&obj->mm.pages_pin_count);
				2757	err_unlock:
				2758	ptr = ERR_PTR(ret);
				2759	goto out_unlock;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2760	}
				2761
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	2762	static int
				2763	i915_gem_object_pwrite_gtt(struct drm_i915_gem_object *obj,
				2764	const struct drm_i915_gem_pwrite *arg)
				2765	{
				2766	struct address_space *mapping = obj->base.filp->f_mapping;
				2767	char __user *user_data = u64_to_user_ptr(arg->data_ptr);
				2768	u64 remain, offset;
				2769	unsigned int pg;
				2770
				2771	/* Before we instantiate/pin the backing store for our use, we
				2772	* can prepopulate the shmemfs filp efficiently using a write into
				2773	* the pagecache. We avoid the penalty of instantiating all the
				2774	* pages, important if the user is just writing to a few and never
				2775	* uses the object on the GPU, and using a direct write into shmemfs
				2776	* allows it to avoid the cost of retrieving a page (either swapin
				2777	* or clearing-before-use) before it is overwritten.
				2778	*/
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2779	if (i915_gem_object_has_pages(obj))
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	2780	return -ENODEV;
				2781
Chris Wilson	a6d65e4	2017-10-16 21:27:32 +0100	[diff] [blame]	2782	if (obj->mm.madv != I915_MADV_WILLNEED)
				2783	return -EFAULT;
				2784
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	2785	/* Before the pages are instantiated the object is treated as being
				2786	* in the CPU domain. The pages will be clflushed as required before
				2787	* use, and we can freely write into the pages directly. If userspace
				2788	* races pwrite with any other operation; corruption will ensue -
				2789	* that is userspace's prerogative!
				2790	*/
				2791
				2792	remain = arg->size;
				2793	offset = arg->offset;
				2794	pg = offset_in_page(offset);
				2795
				2796	do {
				2797	unsigned int len, unwritten;
				2798	struct page *page;
				2799	void data, vaddr;
				2800	int err;
				2801
				2802	len = PAGE_SIZE - pg;
				2803	if (len > remain)
				2804	len = remain;
				2805
				2806	err = pagecache_write_begin(obj->base.filp, mapping,
				2807	offset, len, 0,
				2808	&page, &data);
				2809	if (err < 0)
				2810	return err;
				2811
				2812	vaddr = kmap(page);
				2813	unwritten = copy_from_user(vaddr + pg, user_data, len);
				2814	kunmap(page);
				2815
				2816	err = pagecache_write_end(obj->base.filp, mapping,
				2817	offset, len, len - unwritten,
				2818	page, data);
				2819	if (err < 0)
				2820	return err;
				2821
				2822	if (unwritten)
				2823	return -EFAULT;
				2824
				2825	remain -= len;
				2826	user_data += len;
				2827	offset += len;
				2828	pg = 0;
				2829	} while (remain);
				2830
				2831	return 0;
				2832	}
				2833
Mika Kuoppala	e5e1fc4	2016-11-16 17:20:31 +0200	[diff] [blame]	2834	static void i915_gem_context_mark_guilty(struct i915_gem_context *ctx)
Mika Kuoppala	aa60c66	2013-06-12 15:13:20 +0300	[diff] [blame]	2835	{
Chris Wilson	77b25a9	2017-07-21 13:32:30 +0100	[diff] [blame]	2836	bool banned;
Mika Kuoppala	b083a08	2016-11-18 15:10:47 +0200	[diff] [blame]	2837
Chris Wilson	77b25a9	2017-07-21 13:32:30 +0100	[diff] [blame]	2838	atomic_inc(&ctx->guilty_count);
				2839
Chris Wilson	24eae08	2018-02-05 09:22:01 +0000	[diff] [blame]	2840	banned = false;
				2841	if (i915_gem_context_is_bannable(ctx)) {
				2842	unsigned int score;
				2843
				2844	score = atomic_add_return(CONTEXT_SCORE_GUILTY,
				2845	&ctx->ban_score);
				2846	banned = score >= CONTEXT_SCORE_BAN_THRESHOLD;
				2847
				2848	DRM_DEBUG_DRIVER("context %s marked guilty (score %d) banned? %s\n",
				2849	ctx->name, score, yesno(banned));
				2850	}
Chris Wilson	77b25a9	2017-07-21 13:32:30 +0100	[diff] [blame]	2851	if (!banned)
Mika Kuoppala	b083a08	2016-11-18 15:10:47 +0200	[diff] [blame]	2852	return;
				2853
Chris Wilson	77b25a9	2017-07-21 13:32:30 +0100	[diff] [blame]	2854	i915_gem_context_set_banned(ctx);
				2855	if (!IS_ERR_OR_NULL(ctx->file_priv)) {
				2856	atomic_inc(&ctx->file_priv->context_bans);
				2857	DRM_DEBUG_DRIVER("client %s has had %d context banned\n",
				2858	ctx->name, atomic_read(&ctx->file_priv->context_bans));
				2859	}
Mika Kuoppala	e5e1fc4	2016-11-16 17:20:31 +0200	[diff] [blame]	2860	}
				2861
				2862	static void i915_gem_context_mark_innocent(struct i915_gem_context *ctx)
				2863	{
Chris Wilson	77b25a9	2017-07-21 13:32:30 +0100	[diff] [blame]	2864	atomic_inc(&ctx->active_count);
Mika Kuoppala	aa60c66	2013-06-12 15:13:20 +0300	[diff] [blame]	2865	}
				2866
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	2867	struct i915_request *
Tvrtko Ursulin	0bc40be	2016-03-16 11:00:37 +0000	[diff] [blame]	2868	i915_gem_find_active_request(struct intel_engine_cs *engine)
Chris Wilson	9375e44	2010-09-19 12:21:28 +0100	[diff] [blame]	2869	{
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	2870	struct i915_request request, active = NULL;
Chris Wilson	754c9fd	2017-02-23 07:44:14 +0000	[diff] [blame]	2871	unsigned long flags;
Mika Kuoppala	aa60c66	2013-06-12 15:13:20 +0300	[diff] [blame]	2872
Chris Wilson	f69a02c	2016-07-01 17:23:16 +0100	[diff] [blame]	2873	/* We are called by the error capture and reset at a random
				2874	* point in time. In particular, note that neither is crucially
				2875	* ordered with an interrupt. After a hang, the GPU is dead and we
				2876	* assume that no more writes can happen (we waited long enough for
				2877	* all writes that were in transaction to be flushed) - adding an
				2878	* extra delay for a recent interrupt is pointless. Hence, we do
				2879	* not need an engine->irq_seqno_barrier() before the seqno reads.
				2880	*/
Chris Wilson	754c9fd	2017-02-23 07:44:14 +0000	[diff] [blame]	2881	spin_lock_irqsave(&engine->timeline->lock, flags);
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	2882	list_for_each_entry(request, &engine->timeline->requests, link) {
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	2883	if (__i915_request_completed(request, request->global_seqno))
Chris Wilson	4db080f	2013-12-04 11:37:09 +0000	[diff] [blame]	2884	continue;
Mika Kuoppala	aa60c66	2013-06-12 15:13:20 +0300	[diff] [blame]	2885
Mika Kuoppala	36193ac	2017-01-17 17:59:02 +0200	[diff] [blame]	2886	GEM_BUG_ON(request->engine != engine);
Chris Wilson	c00122f3	2017-02-12 17:19:58 +0000	[diff] [blame]	2887	GEM_BUG_ON(test_bit(DMA_FENCE_FLAG_SIGNALED_BIT,
				2888	&request->fence.flags));
Mika Kuoppala	b6b0fac	2014-01-30 19:04:43 +0200	[diff] [blame]	2889
Chris Wilson	754c9fd	2017-02-23 07:44:14 +0000	[diff] [blame]	2890	active = request;
				2891	break;
				2892	}
				2893	spin_unlock_irqrestore(&engine->timeline->lock, flags);
				2894
				2895	return active;
Mika Kuoppala	b6b0fac	2014-01-30 19:04:43 +0200	[diff] [blame]	2896	}
				2897
Mika Kuoppala	bf2f043	2017-01-17 17:59:04 +0200	[diff] [blame]	2898	static bool engine_stalled(struct intel_engine_cs *engine)
				2899	{
				2900	if (!engine->hangcheck.stalled)
				2901	return false;
				2902
				2903	/* Check for possible seqno movement after hang declaration */
				2904	if (engine->hangcheck.seqno != intel_engine_get_seqno(engine)) {
				2905	DRM_DEBUG_DRIVER("%s pardoned\n", engine->name);
				2906	return false;
				2907	}
				2908
				2909	return true;
				2910	}
				2911
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2912	/*
				2913	* Ensure irq handler finishes, and not run again.
				2914	* Also return the active request so that we only search for it once.
				2915	*/
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	2916	struct i915_request *
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2917	i915_gem_reset_prepare_engine(struct intel_engine_cs *engine)
				2918	{
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	2919	struct i915_request *request = NULL;
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2920
Chris Wilson	1749d90	2017-10-09 12:02:59 +0100	[diff] [blame]	2921	/*
				2922	* During the reset sequence, we must prevent the engine from
				2923	* entering RC6. As the context state is undefined until we restart
				2924	* the engine, if it does enter RC6 during the reset, the state
				2925	* written to the powercontext is undefined and so we may lose
				2926	* GPU state upon resume, i.e. fail to restart after a reset.
				2927	*/
				2928	intel_uncore_forcewake_get(engine->i915, FORCEWAKE_ALL);
				2929
				2930	/*
				2931	* Prevent the signaler thread from updating the request
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2932	* state (by calling dma_fence_signal) as we are processing
				2933	* the reset. The write from the GPU of the seqno is
				2934	* asynchronous and the signaler thread may see a different
				2935	* value to us and declare the request complete, even though
				2936	* the reset routine have picked that request as the active
				2937	* (incomplete) request. This conflict is not handled
				2938	* gracefully!
				2939	*/
				2940	kthread_park(engine->breadcrumbs.signaler);
				2941
Chris Wilson	1749d90	2017-10-09 12:02:59 +0100	[diff] [blame]	2942	/*
				2943	* Prevent request submission to the hardware until we have
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2944	* completed the reset in i915_gem_reset_finish(). If a request
				2945	* is completed by one engine, it may then queue a request
Sagar Arun Kamble	c6dce8f	2017-11-16 19:02:37 +0530	[diff] [blame]	2946	* to a second via its execlists->tasklet just as we are
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2947	* calling engine->init_hw() and also writing the ELSP.
Sagar Arun Kamble	c6dce8f	2017-11-16 19:02:37 +0530	[diff] [blame]	2948	* Turning off the execlists->tasklet until the reset is over
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2949	* prevents the race.
				2950	*/
Sagar Arun Kamble	c6dce8f	2017-11-16 19:02:37 +0530	[diff] [blame]	2951	tasklet_kill(&engine->execlists.tasklet);
				2952	tasklet_disable(&engine->execlists.tasklet);
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2953
Michał Winiarski	c41937f	2017-10-26 15:35:58 +0200	[diff] [blame]	2954	/*
				2955	* We're using worker to queue preemption requests from the tasklet in
				2956	* GuC submission mode.
				2957	* Even though tasklet was disabled, we may still have a worker queued.
				2958	* Let's make sure that all workers scheduled before disabling the
				2959	* tasklet are completed before continuing with the reset.
				2960	*/
				2961	if (engine->i915->guc.preempt_wq)
				2962	flush_workqueue(engine->i915->guc.preempt_wq);
				2963
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2964	if (engine->irq_seqno_barrier)
				2965	engine->irq_seqno_barrier(engine);
				2966
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	2967	request = i915_gem_find_active_request(engine);
				2968	if (request && request->fence.error == -EIO)
				2969	request = ERR_PTR(-EIO); /* Previous reset failed! */
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2970
				2971	return request;
				2972	}
				2973
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	2974	int i915_gem_reset_prepare(struct drm_i915_private *dev_priv)
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	2975	{
				2976	struct intel_engine_cs *engine;
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	2977	struct i915_request *request;
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	2978	enum intel_engine_id id;
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	2979	int err = 0;
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	2980
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	2981	for_each_engine(engine, dev_priv, id) {
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	2982	request = i915_gem_reset_prepare_engine(engine);
				2983	if (IS_ERR(request)) {
				2984	err = PTR_ERR(request);
				2985	continue;
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	2986	}
Michel Thierry	c64992e	2017-06-20 10:57:44 +0100	[diff] [blame]	2987
				2988	engine->hangcheck.active_request = request;
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	2989	}
				2990
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	2991	i915_gem_revoke_fences(dev_priv);
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	2992
				2993	return err;
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	2994	}
				2995
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	2996	static void skip_request(struct i915_request *request)
Mika Kuoppala	b6b0fac	2014-01-30 19:04:43 +0200	[diff] [blame]	2997	{
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	2998	void *vaddr = request->ring->vaddr;
				2999	u32 head;
Mika Kuoppala	b6b0fac	2014-01-30 19:04:43 +0200	[diff] [blame]	3000
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3001	/* As this request likely depends on state from the lost
				3002	* context, clear out all the user operations leaving the
				3003	* breadcrumb at the end (so we get the fence notifications).
				3004	*/
				3005	head = request->head;
				3006	if (request->postfix < head) {
				3007	memset(vaddr + head, 0, request->ring->size - head);
				3008	head = 0;
				3009	}
				3010	memset(vaddr + head, 0, request->postfix - head);
Chris Wilson	c0d5f32	2017-01-10 17:22:43 +0000	[diff] [blame]	3011
				3012	dma_fence_set_error(&request->fence, -EIO);
Chris Wilson	4db080f	2013-12-04 11:37:09 +0000	[diff] [blame]	3013	}
				3014
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3015	static void engine_skip_context(struct i915_request *request)
Mika Kuoppala	36193ac	2017-01-17 17:59:02 +0200	[diff] [blame]	3016	{
				3017	struct intel_engine_cs *engine = request->engine;
				3018	struct i915_gem_context *hung_ctx = request->ctx;
				3019	struct intel_timeline *timeline;
				3020	unsigned long flags;
				3021
				3022	timeline = i915_gem_context_lookup_timeline(hung_ctx, engine);
				3023
				3024	spin_lock_irqsave(&engine->timeline->lock, flags);
				3025	spin_lock(&timeline->lock);
				3026
				3027	list_for_each_entry_continue(request, &engine->timeline->requests, link)
				3028	if (request->ctx == hung_ctx)
				3029	skip_request(request);
				3030
				3031	list_for_each_entry(request, &timeline->requests, link)
				3032	skip_request(request);
				3033
				3034	spin_unlock(&timeline->lock);
				3035	spin_unlock_irqrestore(&engine->timeline->lock, flags);
				3036	}
				3037
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3038	/* Returns the request if it was guilty of the hang */
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3039	static struct i915_request *
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3040	i915_gem_reset_request(struct intel_engine_cs *engine,
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3041	struct i915_request *request)
Mika Kuoppala	61da536	2017-01-17 17:59:05 +0200	[diff] [blame]	3042	{
Mika Kuoppala	71895a0	2017-01-17 17:59:07 +0200	[diff] [blame]	3043	/* The guilty request will get skipped on a hung engine.
				3044	*
				3045	* Users of client default contexts do not rely on logical
				3046	* state preserved between batches so it is safe to execute
				3047	* queued requests following the hang. Non default contexts
				3048	* rely on preserved state, so skipping a batch loses the
				3049	* evolution of the state and it needs to be considered corrupted.
				3050	* Executing more queued batches on top of corrupted state is
				3051	* risky. But we take the risk by trying to advance through
				3052	* the queued requests in order to make the client behaviour
				3053	* more predictable around resets, by not throwing away random
				3054	* amount of batches it has prepared for execution. Sophisticated
				3055	* clients can use gem_reset_stats_ioctl and dma fence status
				3056	* (exported via sync_file info ioctl on explicit fences) to observe
				3057	* when it loses the context state and should rebuild accordingly.
				3058	*
				3059	* The context ban, and ultimately the client ban, mechanism are safety
				3060	* valves if client submission ends up resulting in nothing more than
				3061	* subsequent hangs.
				3062	*/
				3063
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3064	if (engine_stalled(engine)) {
Mika Kuoppala	61da536	2017-01-17 17:59:05 +0200	[diff] [blame]	3065	i915_gem_context_mark_guilty(request->ctx);
				3066	skip_request(request);
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3067
				3068	/* If this context is now banned, skip all pending requests. */
				3069	if (i915_gem_context_is_banned(request->ctx))
				3070	engine_skip_context(request);
Mika Kuoppala	61da536	2017-01-17 17:59:05 +0200	[diff] [blame]	3071	} else {
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3072	/*
				3073	* Since this is not the hung engine, it may have advanced
				3074	* since the hang declaration. Double check by refinding
				3075	* the active request at the time of the reset.
				3076	*/
				3077	request = i915_gem_find_active_request(engine);
				3078	if (request) {
				3079	i915_gem_context_mark_innocent(request->ctx);
				3080	dma_fence_set_error(&request->fence, -EAGAIN);
				3081
				3082	/* Rewind the engine to replay the incomplete rq */
				3083	spin_lock_irq(&engine->timeline->lock);
				3084	request = list_prev_entry(request, link);
				3085	if (&request->link == &engine->timeline->requests)
				3086	request = NULL;
				3087	spin_unlock_irq(&engine->timeline->lock);
				3088	}
Mika Kuoppala	61da536	2017-01-17 17:59:05 +0200	[diff] [blame]	3089	}
				3090
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3091	return request;
Mika Kuoppala	61da536	2017-01-17 17:59:05 +0200	[diff] [blame]	3092	}
				3093
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3094	void i915_gem_reset_engine(struct intel_engine_cs *engine,
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3095	struct i915_request *request)
Chris Wilson	4db080f	2013-12-04 11:37:09 +0000	[diff] [blame]	3096	{
Chris Wilson	fcb1de5	2017-12-19 09:01:10 +0000	[diff] [blame]	3097	/*
				3098	* Make sure this write is visible before we re-enable the interrupt
				3099	* handlers on another CPU, as tasklet_enable() resolves to just
				3100	* a compiler barrier which is insufficient for our purpose here.
				3101	*/
				3102	smp_store_mb(engine->irq_posted, 0);
Chris Wilson	ed454f2	2017-07-21 13:32:29 +0100	[diff] [blame]	3103
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3104	if (request)
				3105	request = i915_gem_reset_request(engine, request);
				3106
				3107	if (request) {
Chris Wilson	c0dcb20	2017-02-07 15:24:37 +0000	[diff] [blame]	3108	DRM_DEBUG_DRIVER("resetting %s to restart from tail of request 0x%x\n",
				3109	engine->name, request->global_seqno);
Chris Wilson	c0dcb20	2017-02-07 15:24:37 +0000	[diff] [blame]	3110	}
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3111
				3112	/* Setup the CS to resume from the breadcrumb of the hung request */
				3113	engine->reset_hw(engine, request);
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3114	}
				3115
Chris Wilson	d802709	2017-02-08 14:30:32 +0000	[diff] [blame]	3116	void i915_gem_reset(struct drm_i915_private *dev_priv)
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3117	{
				3118	struct intel_engine_cs *engine;
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	3119	enum intel_engine_id id;
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3120
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	3121	lockdep_assert_held(&dev_priv->drm.struct_mutex);
				3122
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3123	i915_retire_requests(dev_priv);
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3124
Chris Wilson	2ae5573	2017-02-12 17:20:02 +0000	[diff] [blame]	3125	for_each_engine(engine, dev_priv, id) {
				3126	struct i915_gem_context *ctx;
				3127
Michel Thierry	c64992e	2017-06-20 10:57:44 +0100	[diff] [blame]	3128	i915_gem_reset_engine(engine, engine->hangcheck.active_request);
Chris Wilson	2ae5573	2017-02-12 17:20:02 +0000	[diff] [blame]	3129	ctx = fetch_and_zero(&engine->last_retired_context);
				3130	if (ctx)
				3131	engine->context_unpin(engine, ctx);
Chris Wilson	7b6da81	2017-12-16 00:03:34 +0000	[diff] [blame]	3132
				3133	/*
				3134	* Ostensibily, we always want a context loaded for powersaving,
				3135	* so if the engine is idle after the reset, send a request
				3136	* to load our scratch kernel_context.
				3137	*
				3138	* More mysteriously, if we leave the engine idle after a reset,
				3139	* the next userspace batch may hang, with what appears to be
				3140	* an incoherent read by the CS (presumably stale TLB). An
				3141	* empty request appears sufficient to paper over the glitch.
				3142	*/
Chris Wilson	01b8fdc	2018-02-05 15:24:31 +0000	[diff] [blame]	3143	if (intel_engine_is_idle(engine)) {
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3144	struct i915_request *rq;
Chris Wilson	7b6da81	2017-12-16 00:03:34 +0000	[diff] [blame]	3145
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3146	rq = i915_request_alloc(engine,
				3147	dev_priv->kernel_context);
Chris Wilson	7b6da81	2017-12-16 00:03:34 +0000	[diff] [blame]	3148	if (!IS_ERR(rq))
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3149	__i915_request_add(rq, false);
Chris Wilson	7b6da81	2017-12-16 00:03:34 +0000	[diff] [blame]	3150	}
Chris Wilson	2ae5573	2017-02-12 17:20:02 +0000	[diff] [blame]	3151	}
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3152
Tvrtko Ursulin	4362f4f	2016-11-16 08:55:33 +0000	[diff] [blame]	3153	i915_gem_restore_fences(dev_priv);
Chris Wilson	f2a91d1	2016-09-21 14:51:06 +0100	[diff] [blame]	3154
				3155	if (dev_priv->gt.awake) {
				3156	intel_sanitize_gt_powersave(dev_priv);
				3157	intel_enable_gt_powersave(dev_priv);
				3158	if (INTEL_GEN(dev_priv) >= 6)
				3159	gen6_rps_busy(dev_priv);
				3160	}
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3161	}
				3162
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3163	void i915_gem_reset_finish_engine(struct intel_engine_cs *engine)
				3164	{
Sagar Arun Kamble	c6dce8f	2017-11-16 19:02:37 +0530	[diff] [blame]	3165	tasklet_enable(&engine->execlists.tasklet);
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3166	kthread_unpark(engine->breadcrumbs.signaler);
Chris Wilson	1749d90	2017-10-09 12:02:59 +0100	[diff] [blame]	3167
				3168	intel_uncore_forcewake_put(engine->i915, FORCEWAKE_ALL);
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3169	}
				3170
Chris Wilson	d802709	2017-02-08 14:30:32 +0000	[diff] [blame]	3171	void i915_gem_reset_finish(struct drm_i915_private *dev_priv)
				3172	{
Chris Wilson	1f7b847	2017-02-08 14:30:33 +0000	[diff] [blame]	3173	struct intel_engine_cs *engine;
				3174	enum intel_engine_id id;
				3175
Chris Wilson	d802709	2017-02-08 14:30:32 +0000	[diff] [blame]	3176	lockdep_assert_held(&dev_priv->drm.struct_mutex);
Chris Wilson	1f7b847	2017-02-08 14:30:33 +0000	[diff] [blame]	3177
Chris Wilson	fe3288b	2017-02-12 17:20:01 +0000	[diff] [blame]	3178	for_each_engine(engine, dev_priv, id) {
Michel Thierry	c64992e	2017-06-20 10:57:44 +0100	[diff] [blame]	3179	engine->hangcheck.active_request = NULL;
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3180	i915_gem_reset_finish_engine(engine);
Chris Wilson	fe3288b	2017-02-12 17:20:01 +0000	[diff] [blame]	3181	}
Chris Wilson	d802709	2017-02-08 14:30:32 +0000	[diff] [blame]	3182	}
				3183
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3184	static void nop_submit_request(struct i915_request *request)
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3185	{
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3186	dma_fence_set_error(&request->fence, -EIO);
				3187
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3188	i915_request_submit(request);
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3189	}
				3190
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3191	static void nop_complete_submit_request(struct i915_request *request)
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3192	{
Chris Wilson	8d55082	2017-10-06 12:56:17 +0100	[diff] [blame]	3193	unsigned long flags;
				3194
Chris Wilson	3cd9442	2017-01-10 17:22:45 +0000	[diff] [blame]	3195	dma_fence_set_error(&request->fence, -EIO);
Chris Wilson	8d55082	2017-10-06 12:56:17 +0100	[diff] [blame]	3196
				3197	spin_lock_irqsave(&request->engine->timeline->lock, flags);
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3198	__i915_request_submit(request);
Chris Wilson	3dcf93f	2016-11-22 14:41:20 +0000	[diff] [blame]	3199	intel_engine_init_global_seqno(request->engine, request->global_seqno);
Chris Wilson	8d55082	2017-10-06 12:56:17 +0100	[diff] [blame]	3200	spin_unlock_irqrestore(&request->engine->timeline->lock, flags);
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3201	}
				3202
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3203	void i915_gem_set_wedged(struct drm_i915_private *i915)
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3204	{
Tvrtko Ursulin	e2f8039	2016-03-16 11:00:36 +0000	[diff] [blame]	3205	struct intel_engine_cs *engine;
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	3206	enum intel_engine_id id;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3207
Chris Wilson	559e040	2018-02-05 09:21:59 +0000	[diff] [blame]	3208	if (drm_debug & DRM_UT_DRIVER) {
				3209	struct drm_printer p = drm_debug_printer(__func__);
				3210
				3211	for_each_engine(engine, i915, id)
				3212	intel_engine_dump(engine, &p, "%s\n", engine->name);
				3213	}
				3214
Chris Wilson	0d73e7a	2018-02-07 15:13:50 +0000	[diff] [blame]	3215	set_bit(I915_WEDGED, &i915->gpu_error.flags);
				3216	smp_mb__after_atomic();
				3217
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3218	/*
				3219	* First, stop submission to hw, but do not yet complete requests by
				3220	* rolling the global seqno forward (since this would complete requests
				3221	* for which we haven't set the fence error to EIO yet).
				3222	*/
Chris Wilson	963ddd6	2018-03-02 11:33:24 +0000	[diff] [blame]	3223	for_each_engine(engine, i915, id) {
				3224	i915_gem_reset_prepare_engine(engine);
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3225	engine->submit_request = nop_submit_request;
Chris Wilson	963ddd6	2018-03-02 11:33:24 +0000	[diff] [blame]	3226	}
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3227
				3228	/*
				3229	* Make sure no one is running the old callback before we proceed with
				3230	* cancelling requests and resetting the completion tracking. Otherwise
				3231	* we might submit a request to the hardware which never completes.
				3232	*/
				3233	synchronize_rcu();
				3234
				3235	for_each_engine(engine, i915, id) {
				3236	/* Mark all executing requests as skipped */
				3237	engine->cancel_requests(engine);
				3238
				3239	/*
				3240	* Only once we've force-cancelled all in-flight requests can we
				3241	* start to complete all requests.
				3242	*/
				3243	engine->submit_request = nop_complete_submit_request;
Chris Wilson	3fed180	2018-02-07 21:05:43 +0000	[diff] [blame]	3244	engine->schedule = NULL;
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3245	}
				3246
Chris Wilson	3fed180	2018-02-07 21:05:43 +0000	[diff] [blame]	3247	i915->caps.scheduler = 0;
				3248
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3249	/*
				3250	* Make sure no request can slip through without getting completed by
				3251	* either this call here to intel_engine_init_global_seqno, or the one
				3252	* in nop_complete_submit_request.
				3253	*/
				3254	synchronize_rcu();
				3255
				3256	for_each_engine(engine, i915, id) {
				3257	unsigned long flags;
				3258
Chris Wilson	0d73e7a	2018-02-07 15:13:50 +0000	[diff] [blame]	3259	/*
				3260	* Mark all pending requests as complete so that any concurrent
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3261	* (lockless) lookup doesn't try and wait upon the request as we
				3262	* reset it.
				3263	*/
				3264	spin_lock_irqsave(&engine->timeline->lock, flags);
				3265	intel_engine_init_global_seqno(engine,
				3266	intel_engine_last_submit(engine));
				3267	spin_unlock_irqrestore(&engine->timeline->lock, flags);
Chris Wilson	963ddd6	2018-03-02 11:33:24 +0000	[diff] [blame]	3268
				3269	i915_gem_reset_finish_engine(engine);
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3270	}
Chris Wilson	20e4933	2016-11-22 14:41:21 +0000	[diff] [blame]	3271
Chris Wilson	3d7adbb	2017-07-21 13:32:27 +0100	[diff] [blame]	3272	wake_up_all(&i915->gpu_error.reset_queue);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3273	}
				3274
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3275	bool i915_gem_unset_wedged(struct drm_i915_private *i915)
				3276	{
				3277	struct i915_gem_timeline *tl;
				3278	int i;
				3279
				3280	lockdep_assert_held(&i915->drm.struct_mutex);
				3281	if (!test_bit(I915_WEDGED, &i915->gpu_error.flags))
				3282	return true;
				3283
Chris Wilson	2d4ecac	2018-03-07 13:42:21 +0000	[diff] [blame^]	3284	/*
				3285	* Before unwedging, make sure that all pending operations
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3286	* are flushed and errored out - we may have requests waiting upon
				3287	* third party fences. We marked all inflight requests as EIO, and
				3288	* every execbuf since returned EIO, for consistency we want all
				3289	* the currently pending requests to also be marked as EIO, which
				3290	* is done inside our nop_submit_request - and so we must wait.
				3291	*
				3292	* No more can be submitted until we reset the wedged bit.
				3293	*/
				3294	list_for_each_entry(tl, &i915->gt.timelines, link) {
				3295	for (i = 0; i < ARRAY_SIZE(tl->engine); i++) {
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3296	struct i915_request *rq;
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3297
				3298	rq = i915_gem_active_peek(&tl->engine[i].last_request,
				3299	&i915->drm.struct_mutex);
				3300	if (!rq)
				3301	continue;
				3302
Chris Wilson	2d4ecac	2018-03-07 13:42:21 +0000	[diff] [blame^]	3303	/*
				3304	* We can't use our normal waiter as we want to
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3305	* avoid recursively trying to handle the current
				3306	* reset. The basic dma_fence_default_wait() installs
				3307	* a callback for dma_fence_signal(), which is
				3308	* triggered by our nop handler (indirectly, the
				3309	* callback enables the signaler thread which is
				3310	* woken by the nop_submit_request() advancing the seqno
				3311	* and when the seqno passes the fence, the signaler
				3312	* then signals the fence waking us up).
				3313	*/
				3314	if (dma_fence_default_wait(&rq->fence, true,
				3315	MAX_SCHEDULE_TIMEOUT) < 0)
				3316	return false;
				3317	}
				3318	}
Chris Wilson	2d4ecac	2018-03-07 13:42:21 +0000	[diff] [blame^]	3319	i915_retire_requests(i915);
				3320	GEM_BUG_ON(i915->gt.active_requests);
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3321
Chris Wilson	2d4ecac	2018-03-07 13:42:21 +0000	[diff] [blame^]	3322	/*
				3323	* Undo nop_submit_request. We prevent all new i915 requests from
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3324	* being queued (by disallowing execbuf whilst wedged) so having
				3325	* waited for all active requests above, we know the system is idle
				3326	* and do not have to worry about a thread being inside
				3327	* engine->submit_request() as we swap over. So unlike installing
				3328	* the nop_submit_request on reset, we can do this from normal
				3329	* context and do not require stop_machine().
				3330	*/
				3331	intel_engines_reset_default_submission(i915);
Chris Wilson	36703e7	2017-06-22 11:56:25 +0100	[diff] [blame]	3332	i915_gem_contexts_lost(i915);
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3333
				3334	smp_mb__before_atomic(); /* complete takeover before enabling execbuf */
				3335	clear_bit(I915_WEDGED, &i915->gpu_error.flags);
				3336
				3337	return true;
				3338	}
				3339
Daniel Vetter	75ef9da	2010-08-21 00:25:16 +0200	[diff] [blame]	3340	static void
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3341	i915_gem_retire_work_handler(struct work_struct *work)
				3342	{
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3343	struct drm_i915_private *dev_priv =
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3344	container_of(work, typeof(*dev_priv), gt.retire_work.work);
Chris Wilson	91c8a32	2016-07-05 10:40:23 +0100	[diff] [blame]	3345	struct drm_device *dev = &dev_priv->drm;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3346
Chris Wilson	891b48c	2010-09-29 12:26:37 +0100	[diff] [blame]	3347	/* Come back later if the device is busy... */
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3348	if (mutex_trylock(&dev->struct_mutex)) {
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3349	i915_retire_requests(dev_priv);
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3350	mutex_unlock(&dev->struct_mutex);
				3351	}
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3352
Chris Wilson	8892304	2018-01-29 14:41:04 +0000	[diff] [blame]	3353	/*
				3354	* Keep the retire handler running until we are finally idle.
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3355	* We do not need to do this test under locking as in the worst-case
				3356	* we queue the retire worker once too often.
				3357	*/
Chris Wilson	8892304	2018-01-29 14:41:04 +0000	[diff] [blame]	3358	if (READ_ONCE(dev_priv->gt.awake))
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3359	queue_delayed_work(dev_priv->wq,
				3360	&dev_priv->gt.retire_work,
Chris Wilson	bcb4508	2012-10-05 17:02:57 +0100	[diff] [blame]	3361	round_jiffies_up_relative(HZ));
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3362	}
Chris Wilson	891b48c	2010-09-29 12:26:37 +0100	[diff] [blame]	3363
Chris Wilson	84a1074	2018-01-24 11:36:08 +0000	[diff] [blame]	3364	static void shrink_caches(struct drm_i915_private *i915)
				3365	{
				3366	/*
				3367	* kmem_cache_shrink() discards empty slabs and reorders partially
				3368	* filled slabs to prioritise allocating from the mostly full slabs,
				3369	* with the aim of reducing fragmentation.
				3370	*/
				3371	kmem_cache_shrink(i915->priorities);
				3372	kmem_cache_shrink(i915->dependencies);
				3373	kmem_cache_shrink(i915->requests);
				3374	kmem_cache_shrink(i915->luts);
				3375	kmem_cache_shrink(i915->vmas);
				3376	kmem_cache_shrink(i915->objects);
				3377	}
				3378
				3379	struct sleep_rcu_work {
				3380	union {
				3381	struct rcu_head rcu;
				3382	struct work_struct work;
				3383	};
				3384	struct drm_i915_private *i915;
				3385	unsigned int epoch;
				3386	};
				3387
				3388	static inline bool
				3389	same_epoch(struct drm_i915_private *i915, unsigned int epoch)
				3390	{
				3391	/*
				3392	* There is a small chance that the epoch wrapped since we started
				3393	* sleeping. If we assume that epoch is at least a u32, then it will
				3394	* take at least 2^32 * 100ms for it to wrap, or about 326 years.
				3395	*/
				3396	return epoch == READ_ONCE(i915->gt.epoch);
				3397	}
				3398
				3399	static void __sleep_work(struct work_struct *work)
				3400	{
				3401	struct sleep_rcu_work s = container_of(work, typeof(s), work);
				3402	struct drm_i915_private *i915 = s->i915;
				3403	unsigned int epoch = s->epoch;
				3404
				3405	kfree(s);
				3406	if (same_epoch(i915, epoch))
				3407	shrink_caches(i915);
				3408	}
				3409
				3410	static void __sleep_rcu(struct rcu_head *rcu)
				3411	{
				3412	struct sleep_rcu_work s = container_of(rcu, typeof(s), rcu);
				3413	struct drm_i915_private *i915 = s->i915;
				3414
				3415	if (same_epoch(i915, s->epoch)) {
				3416	INIT_WORK(&s->work, __sleep_work);
				3417	queue_work(i915->wq, &s->work);
				3418	} else {
				3419	kfree(s);
				3420	}
				3421	}
				3422
Chris Wilson	5427f20	2017-10-23 22:32:34 +0100	[diff] [blame]	3423	static inline bool
				3424	new_requests_since_last_retire(const struct drm_i915_private *i915)
				3425	{
				3426	return (READ_ONCE(i915->gt.active_requests) \|\|
				3427	work_pending(&i915->gt.idle_work.work));
				3428	}
				3429
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3430	static void
				3431	i915_gem_idle_work_handler(struct work_struct *work)
				3432	{
				3433	struct drm_i915_private *dev_priv =
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3434	container_of(work, typeof(*dev_priv), gt.idle_work.work);
Chris Wilson	84a1074	2018-01-24 11:36:08 +0000	[diff] [blame]	3435	unsigned int epoch = I915_EPOCH_INVALID;
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3436	bool rearm_hangcheck;
				3437
				3438	if (!READ_ONCE(dev_priv->gt.awake))
				3439	return;
				3440
Imre Deak	0cb5670	2016-11-07 11:20:04 +0200	[diff] [blame]	3441	/*
				3442	* Wait for last execlists context complete, but bail out in case a
Chris Wilson	ffed7bd	2018-03-01 10:33:38 +0000	[diff] [blame]	3443	* new request is submitted. As we don't trust the hardware, we
				3444	* continue on if the wait times out. This is necessary to allow
				3445	* the machine to suspend even if the hardware dies, and we will
				3446	* try to recover in resume (after depriving the hardware of power,
				3447	* it may be in a better mmod).
Imre Deak	0cb5670	2016-11-07 11:20:04 +0200	[diff] [blame]	3448	*/
Chris Wilson	ffed7bd	2018-03-01 10:33:38 +0000	[diff] [blame]	3449	__wait_for(if (new_requests_since_last_retire(dev_priv)) return,
				3450	intel_engines_are_idle(dev_priv),
				3451	I915_IDLE_ENGINES_TIMEOUT * 1000,
				3452	10, 500);
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3453
				3454	rearm_hangcheck =
				3455	cancel_delayed_work_sync(&dev_priv->gpu_error.hangcheck_work);
				3456
Chris Wilson	5427f20	2017-10-23 22:32:34 +0100	[diff] [blame]	3457	if (!mutex_trylock(&dev_priv->drm.struct_mutex)) {
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3458	/* Currently busy, come back later */
				3459	mod_delayed_work(dev_priv->wq,
				3460	&dev_priv->gt.idle_work,
				3461	msecs_to_jiffies(50));
				3462	goto out_rearm;
				3463	}
				3464
Imre Deak	93c97dc	2016-11-07 11:20:03 +0200	[diff] [blame]	3465	/*
				3466	* New request retired after this work handler started, extend active
				3467	* period until next instance of the work.
				3468	*/
Chris Wilson	5427f20	2017-10-23 22:32:34 +0100	[diff] [blame]	3469	if (new_requests_since_last_retire(dev_priv))
Imre Deak	93c97dc	2016-11-07 11:20:03 +0200	[diff] [blame]	3470	goto out_unlock;
				3471
Chris Wilson	5427f20	2017-10-23 22:32:34 +0100	[diff] [blame]	3472	/*
Chris Wilson	ff320d6	2017-10-23 22:32:35 +0100	[diff] [blame]	3473	* Be paranoid and flush a concurrent interrupt to make sure
				3474	* we don't reactivate any irq tasklets after parking.
				3475	*
				3476	* FIXME: Note that even though we have waited for execlists to be idle,
				3477	* there may still be an in-flight interrupt even though the CSB
				3478	* is now empty. synchronize_irq() makes sure that a residual interrupt
				3479	* is completed before we continue, but it doesn't prevent the HW from
				3480	* raising a spurious interrupt later. To complete the shield we should
				3481	* coordinate disabling the CS irq with flushing the interrupts.
				3482	*/
				3483	synchronize_irq(dev_priv->drm.irq);
				3484
Chris Wilson	aba5e27	2017-10-25 15:39:41 +0100	[diff] [blame]	3485	intel_engines_park(dev_priv);
Chris Wilson	d02a1d8	2017-11-27 12:30:54 +0000	[diff] [blame]	3486	i915_gem_timelines_park(dev_priv);
				3487
Tvrtko Ursulin	feff0dc	2017-11-21 18:18:46 +0000	[diff] [blame]	3488	i915_pmu_gt_parked(dev_priv);
Zou Nan hai	d1b851f	2010-05-21 09:08:57 +0800	[diff] [blame]	3489
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3490	GEM_BUG_ON(!dev_priv->gt.awake);
				3491	dev_priv->gt.awake = false;
Chris Wilson	84a1074	2018-01-24 11:36:08 +0000	[diff] [blame]	3492	epoch = dev_priv->gt.epoch;
				3493	GEM_BUG_ON(epoch == I915_EPOCH_INVALID);
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3494	rearm_hangcheck = false;
Daniel Vetter	30ecad7	2015-12-09 09:29:36 +0100	[diff] [blame]	3495
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3496	if (INTEL_GEN(dev_priv) >= 6)
				3497	gen6_rps_idle(dev_priv);
Tvrtko Ursulin	b687637	2017-12-05 13:28:54 +0000	[diff] [blame]	3498
				3499	intel_display_power_put(dev_priv, POWER_DOMAIN_GT_IRQ);
				3500
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3501	intel_runtime_pm_put(dev_priv);
				3502	out_unlock:
Chris Wilson	5427f20	2017-10-23 22:32:34 +0100	[diff] [blame]	3503	mutex_unlock(&dev_priv->drm.struct_mutex);
Chris Wilson	35c9418	2015-04-07 16:20:37 +0100	[diff] [blame]	3504
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3505	out_rearm:
				3506	if (rearm_hangcheck) {
				3507	GEM_BUG_ON(!dev_priv->gt.awake);
				3508	i915_queue_hangcheck(dev_priv);
Chris Wilson	35c9418	2015-04-07 16:20:37 +0100	[diff] [blame]	3509	}
Chris Wilson	84a1074	2018-01-24 11:36:08 +0000	[diff] [blame]	3510
				3511	/*
				3512	* When we are idle, it is an opportune time to reap our caches.
				3513	* However, we have many objects that utilise RCU and the ordered
				3514	* i915->wq that this work is executing on. To try and flush any
				3515	* pending frees now we are idle, we first wait for an RCU grace
				3516	* period, and then queue a task (that will run last on the wq) to
				3517	* shrink and re-optimize the caches.
				3518	*/
				3519	if (same_epoch(dev_priv, epoch)) {
				3520	struct sleep_rcu_work s = kmalloc(sizeof(s), GFP_KERNEL);
				3521	if (s) {
				3522	s->i915 = dev_priv;
				3523	s->epoch = epoch;
				3524	call_rcu(&s->rcu, __sleep_rcu);
				3525	}
				3526	}
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3527	}
				3528
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3529	void i915_gem_close_object(struct drm_gem_object gem, struct drm_file file)
				3530	{
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3531	struct drm_i915_private *i915 = to_i915(gem->dev);
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3532	struct drm_i915_gem_object *obj = to_intel_bo(gem);
				3533	struct drm_i915_file_private *fpriv = file->driver_priv;
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3534	struct i915_lut_handle lut, ln;
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3535
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3536	mutex_lock(&i915->drm.struct_mutex);
				3537
				3538	list_for_each_entry_safe(lut, ln, &obj->lut_list, obj_link) {
				3539	struct i915_gem_context *ctx = lut->ctx;
				3540	struct i915_vma *vma;
				3541
Chris Wilson	432295d	2017-08-22 12:05:15 +0100	[diff] [blame]	3542	GEM_BUG_ON(ctx->file_priv == ERR_PTR(-EBADF));
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3543	if (ctx->file_priv != fpriv)
				3544	continue;
				3545
				3546	vma = radix_tree_delete(&ctx->handles_vma, lut->handle);
Chris Wilson	3ffff01	2017-08-22 12:05:17 +0100	[diff] [blame]	3547	GEM_BUG_ON(vma->obj != obj);
				3548
				3549	/* We allow the process to have multiple handles to the same
				3550	* vma, in the same fd namespace, by virtue of flink/open.
				3551	*/
				3552	GEM_BUG_ON(!vma->open_count);
				3553	if (!--vma->open_count && !i915_vma_is_ggtt(vma))
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3554	i915_vma_close(vma);
Chris Wilson	f8a7fde	2016-10-28 13:58:29 +0100	[diff] [blame]	3555
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3556	list_del(&lut->obj_link);
				3557	list_del(&lut->ctx_link);
Chris Wilson	4ff4b44	2017-06-16 15:05:16 +0100	[diff] [blame]	3558
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3559	kmem_cache_free(i915->luts, lut);
				3560	__i915_gem_object_release_unless_active(obj);
Chris Wilson	f8a7fde	2016-10-28 13:58:29 +0100	[diff] [blame]	3561	}
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3562
				3563	mutex_unlock(&i915->drm.struct_mutex);
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3564	}
				3565
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3566	static unsigned long to_wait_timeout(s64 timeout_ns)
				3567	{
				3568	if (timeout_ns < 0)
				3569	return MAX_SCHEDULE_TIMEOUT;
				3570
				3571	if (timeout_ns == 0)
				3572	return 0;
				3573
				3574	return nsecs_to_jiffies_timeout(timeout_ns);
				3575	}
				3576
Ben Widawsky	5816d64	2012-04-11 11:18:19 -0700	[diff] [blame]	3577	/**
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3578	* i915_gem_wait_ioctl - implements DRM_IOCTL_I915_GEM_WAIT
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	3579	* @dev: drm device pointer
				3580	* @data: ioctl data blob
				3581	* @file: drm file pointer
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3582	*
				3583	* Returns 0 if successful, else an error is returned with the remaining time in
				3584	* the timeout parameter.
				3585	* -ETIME: object is still busy after timeout
				3586	* -ERESTARTSYS: signal interrupted the wait
				3587	* -ENONENT: object doesn't exist
				3588	* Also possible, but rare:
Chris Wilson	b805014	2017-08-11 11:57:31 +0100	[diff] [blame]	3589	* -EAGAIN: incomplete, restart syscall
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3590	* -ENOMEM: damn
				3591	* -ENODEV: Internal IRQ fail
				3592	* -E?: The add request failed
				3593	*
				3594	* The wait ioctl with a timeout of 0 reimplements the busy ioctl. With any
				3595	* non-zero timeout parameter the wait ioctl will wait for the given number of
				3596	* nanoseconds on an object becoming unbusy. Since the wait itself does so
				3597	* without holding struct_mutex the object may become re-busied before this
				3598	* function completes. A similar but shorter * race condition exists in the busy
				3599	* ioctl
				3600	*/
				3601	int
				3602	i915_gem_wait_ioctl(struct drm_device dev, void data, struct drm_file *file)
				3603	{
				3604	struct drm_i915_gem_wait *args = data;
				3605	struct drm_i915_gem_object *obj;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3606	ktime_t start;
				3607	long ret;
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3608
Daniel Vetter	11b5d51	2014-09-29 15:31:26 +0200	[diff] [blame]	3609	if (args->flags != 0)
				3610	return -EINVAL;
				3611
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	3612	obj = i915_gem_object_lookup(file, args->bo_handle);
Chris Wilson	033d549	2016-08-05 10:14:17 +0100	[diff] [blame]	3613	if (!obj)
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3614	return -ENOENT;
Chris Wilson	033d549	2016-08-05 10:14:17 +0100	[diff] [blame]	3615
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3616	start = ktime_get();
				3617
				3618	ret = i915_gem_object_wait(obj,
				3619	I915_WAIT_INTERRUPTIBLE \| I915_WAIT_ALL,
				3620	to_wait_timeout(args->timeout_ns),
				3621	to_rps_client(file));
				3622
				3623	if (args->timeout_ns > 0) {
				3624	args->timeout_ns -= ktime_to_ns(ktime_sub(ktime_get(), start));
				3625	if (args->timeout_ns < 0)
				3626	args->timeout_ns = 0;
Chris Wilson	c1d2061	2017-02-16 12:54:41 +0000	[diff] [blame]	3627
				3628	/*
				3629	* Apparently ktime isn't accurate enough and occasionally has a
				3630	* bit of mismatch in the jiffies<->nsecs<->ktime loop. So patch
				3631	* things up to make the test happy. We allow up to 1 jiffy.
				3632	*
				3633	* This is a regression from the timespec->ktime conversion.
				3634	*/
				3635	if (ret == -ETIME && !nsecs_to_jiffies(args->timeout_ns))
				3636	args->timeout_ns = 0;
Chris Wilson	b805014	2017-08-11 11:57:31 +0100	[diff] [blame]	3637
				3638	/* Asked to wait beyond the jiffie/scheduler precision? */
				3639	if (ret == -ETIME && args->timeout_ns)
				3640	ret = -EAGAIN;
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3641	}
				3642
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	3643	i915_gem_object_put(obj);
John Harrison	ff86588	2014-11-24 18:49:28 +0000	[diff] [blame]	3644	return ret;
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3645	}
				3646
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	3647	static int wait_for_timeline(struct i915_gem_timeline *tl, unsigned int flags)
Daniel Vetter	4df2faf	2010-02-19 11:52:00 +0100	[diff] [blame]	3648	{
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	3649	int ret, i;
				3650
				3651	for (i = 0; i < ARRAY_SIZE(tl->engine); i++) {
				3652	ret = i915_gem_active_wait(&tl->engine[i].last_request, flags);
				3653	if (ret)
				3654	return ret;
				3655	}
				3656
				3657	return 0;
				3658	}
				3659
Chris Wilson	25112b6	2017-03-30 15:50:39 +0100	[diff] [blame]	3660	static int wait_for_engines(struct drm_i915_private *i915)
				3661	{
Chris Wilson	ee42c00	2017-12-11 19:41:34 +0000	[diff] [blame]	3662	if (wait_for(intel_engines_are_idle(i915), I915_IDLE_ENGINES_TIMEOUT)) {
Chris Wilson	59e4b19	2017-12-11 19:41:35 +0000	[diff] [blame]	3663	dev_err(i915->drm.dev,
				3664	"Failed to idle engines, declaring wedged!\n");
				3665	if (drm_debug & DRM_UT_DRIVER) {
				3666	struct drm_printer p = drm_debug_printer(__func__);
				3667	struct intel_engine_cs *engine;
				3668	enum intel_engine_id id;
				3669
				3670	for_each_engine(engine, i915, id)
				3671	intel_engine_dump(engine, &p,
Chris Wilson	9e519bc	2018-02-05 10:06:18 +0000	[diff] [blame]	3672	"%s\n", engine->name);
Chris Wilson	59e4b19	2017-12-11 19:41:35 +0000	[diff] [blame]	3673	}
				3674
Chris Wilson	cad9946	2017-08-26 12:09:33 +0100	[diff] [blame]	3675	i915_gem_set_wedged(i915);
				3676	return -EIO;
Chris Wilson	25112b6	2017-03-30 15:50:39 +0100	[diff] [blame]	3677	}
				3678
				3679	return 0;
				3680	}
				3681
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	3682	int i915_gem_wait_for_idle(struct drm_i915_private *i915, unsigned int flags)
				3683	{
Dave Gordon	b4ac5af	2016-03-24 11:20:38 +0000	[diff] [blame]	3684	int ret;
Daniel Vetter	4df2faf	2010-02-19 11:52:00 +0100	[diff] [blame]	3685
Chris Wilson	863e9fd	2017-05-30 13:13:32 +0100	[diff] [blame]	3686	/* If the device is asleep, we have no requests outstanding */
				3687	if (!READ_ONCE(i915->gt.awake))
				3688	return 0;
				3689
Chris Wilson	9caa34a	2016-11-11 14:58:08 +0000	[diff] [blame]	3690	if (flags & I915_WAIT_LOCKED) {
				3691	struct i915_gem_timeline *tl;
				3692
				3693	lockdep_assert_held(&i915->drm.struct_mutex);
				3694
				3695	list_for_each_entry(tl, &i915->gt.timelines, link) {
				3696	ret = wait_for_timeline(tl, flags);
				3697	if (ret)
				3698	return ret;
				3699	}
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3700	i915_retire_requests(i915);
Chris Wilson	25112b6	2017-03-30 15:50:39 +0100	[diff] [blame]	3701
				3702	ret = wait_for_engines(i915);
Chris Wilson	9caa34a	2016-11-11 14:58:08 +0000	[diff] [blame]	3703	} else {
				3704	ret = wait_for_timeline(&i915->gt.global_timeline, flags);
Chris Wilson	1ec14ad	2010-12-04 11:30:53 +0000	[diff] [blame]	3705	}
Zou Nan hai	d1b851f	2010-05-21 09:08:57 +0800	[diff] [blame]	3706
Chris Wilson	25112b6	2017-03-30 15:50:39 +0100	[diff] [blame]	3707	return ret;
Daniel Vetter	4df2faf	2010-02-19 11:52:00 +0100	[diff] [blame]	3708	}
				3709
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	3710	static void __i915_gem_object_flush_for_display(struct drm_i915_gem_object *obj)
				3711	{
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	3712	/*
				3713	* We manually flush the CPU domain so that we can override and
				3714	* force the flush for the display, and perform it asyncrhonously.
				3715	*/
				3716	flush_write_domain(obj, ~I915_GEM_DOMAIN_CPU);
				3717	if (obj->cache_dirty)
				3718	i915_gem_clflush_object(obj, I915_CLFLUSH_FORCE);
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3719	obj->write_domain = 0;
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	3720	}
				3721
				3722	void i915_gem_object_flush_if_display(struct drm_i915_gem_object *obj)
				3723	{
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	3724	if (!READ_ONCE(obj->pin_global))
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	3725	return;
				3726
				3727	mutex_lock(&obj->base.dev->struct_mutex);
				3728	__i915_gem_object_flush_for_display(obj);
				3729	mutex_unlock(&obj->base.dev->struct_mutex);
				3730	}
				3731
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3732	/**
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3733	* Moves a single object to the WC read, and possibly write domain.
				3734	* @obj: object to act on
				3735	* @write: ask for write access or read only
				3736	*
				3737	* This function returns when the move is complete, including waiting on
				3738	* flushes to occur.
				3739	*/
				3740	int
				3741	i915_gem_object_set_to_wc_domain(struct drm_i915_gem_object *obj, bool write)
				3742	{
				3743	int ret;
				3744
				3745	lockdep_assert_held(&obj->base.dev->struct_mutex);
				3746
				3747	ret = i915_gem_object_wait(obj,
				3748	I915_WAIT_INTERRUPTIBLE \|
				3749	I915_WAIT_LOCKED \|
				3750	(write ? I915_WAIT_ALL : 0),
				3751	MAX_SCHEDULE_TIMEOUT,
				3752	NULL);
				3753	if (ret)
				3754	return ret;
				3755
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3756	if (obj->write_domain == I915_GEM_DOMAIN_WC)
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3757	return 0;
				3758
				3759	/* Flush and acquire obj->pages so that we are coherent through
				3760	* direct access in memory with previous cached writes through
				3761	* shmemfs and that our cache domain tracking remains valid.
				3762	* For example, if the obj->filp was moved to swap without us
				3763	* being notified and releasing the pages, we would mistakenly
				3764	* continue to assume that the obj remained out of the CPU cached
				3765	* domain.
				3766	*/
				3767	ret = i915_gem_object_pin_pages(obj);
				3768	if (ret)
				3769	return ret;
				3770
				3771	flush_write_domain(obj, ~I915_GEM_DOMAIN_WC);
				3772
				3773	/* Serialise direct access to this object with the barriers for
				3774	* coherent writes from the GPU, by effectively invalidating the
				3775	* WC domain upon first access.
				3776	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3777	if ((obj->read_domains & I915_GEM_DOMAIN_WC) == 0)
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3778	mb();
				3779
				3780	/* It should now be out of any other write domains, and we can update
				3781	* the domain values for our changes.
				3782	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3783	GEM_BUG_ON((obj->write_domain & ~I915_GEM_DOMAIN_WC) != 0);
				3784	obj->read_domains \|= I915_GEM_DOMAIN_WC;
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3785	if (write) {
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3786	obj->read_domains = I915_GEM_DOMAIN_WC;
				3787	obj->write_domain = I915_GEM_DOMAIN_WC;
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3788	obj->mm.dirty = true;
				3789	}
				3790
				3791	i915_gem_object_unpin_pages(obj);
				3792	return 0;
				3793	}
				3794
				3795	/**
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3796	* Moves a single object to the GTT read, and possibly write domain.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	3797	* @obj: object to act on
				3798	* @write: ask for write access or read only
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3799	*
				3800	* This function returns when the move is complete, including waiting on
				3801	* flushes to occur.
				3802	*/
Jesse Barnes	79e5394	2008-11-07 14:24:08 -0800	[diff] [blame]	3803	int
Chris Wilson	2021746	2010-11-23 15:26:33 +0000	[diff] [blame]	3804	i915_gem_object_set_to_gtt_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3805	{
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	3806	int ret;
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3807
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3808	lockdep_assert_held(&obj->base.dev->struct_mutex);
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	3809
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3810	ret = i915_gem_object_wait(obj,
				3811	I915_WAIT_INTERRUPTIBLE \|
				3812	I915_WAIT_LOCKED \|
				3813	(write ? I915_WAIT_ALL : 0),
				3814	MAX_SCHEDULE_TIMEOUT,
				3815	NULL);
Chris Wilson	8824178	2011-01-07 17:09:48 +0000	[diff] [blame]	3816	if (ret)
				3817	return ret;
				3818
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3819	if (obj->write_domain == I915_GEM_DOMAIN_GTT)
Chris Wilson	c13d87e	2016-07-20 09:21:15 +0100	[diff] [blame]	3820	return 0;
				3821
Chris Wilson	43566de	2015-01-02 16:29:29 +0530	[diff] [blame]	3822	/* Flush and acquire obj->pages so that we are coherent through
				3823	* direct access in memory with previous cached writes through
				3824	* shmemfs and that our cache domain tracking remains valid.
				3825	* For example, if the obj->filp was moved to swap without us
				3826	* being notified and releasing the pages, we would mistakenly
				3827	* continue to assume that the obj remained out of the CPU cached
				3828	* domain.
				3829	*/
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	3830	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	43566de	2015-01-02 16:29:29 +0530	[diff] [blame]	3831	if (ret)
				3832	return ret;
				3833
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	3834	flush_write_domain(obj, ~I915_GEM_DOMAIN_GTT);
Chris Wilson	1c5d22f	2009-08-25 11:15:50 +0100	[diff] [blame]	3835
Chris Wilson	d0a5778	2012-10-09 19:24:37 +0100	[diff] [blame]	3836	/* Serialise direct access to this object with the barriers for
				3837	* coherent writes from the GPU, by effectively invalidating the
				3838	* GTT domain upon first access.
				3839	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3840	if ((obj->read_domains & I915_GEM_DOMAIN_GTT) == 0)
Chris Wilson	d0a5778	2012-10-09 19:24:37 +0100	[diff] [blame]	3841	mb();
				3842
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3843	/* It should now be out of any other write domains, and we can update
				3844	* the domain values for our changes.
				3845	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3846	GEM_BUG_ON((obj->write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
				3847	obj->read_domains \|= I915_GEM_DOMAIN_GTT;
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	3848	if (write) {
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3849	obj->read_domains = I915_GEM_DOMAIN_GTT;
				3850	obj->write_domain = I915_GEM_DOMAIN_GTT;
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	3851	obj->mm.dirty = true;
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	3852	}
				3853
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	3854	i915_gem_object_unpin_pages(obj);
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	3855	return 0;
				3856	}
				3857
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3858	/**
				3859	* Changes the cache-level of an object across all VMA.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	3860	* @obj: object to act on
				3861	* @cache_level: new cache level to set for the object
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3862	*
				3863	* After this function returns, the object will be in the new cache-level
				3864	* across all GTT and the contents of the backing storage will be coherent,
				3865	* with respect to the new cache-level. In order to keep the backing storage
				3866	* coherent for all users, we only allow a single cache level to be set
				3867	* globally on the object and prevent it from being changed whilst the
				3868	* hardware is reading from the object. That is if the object is currently
				3869	* on the scanout it will be set to uncached (or equivalent display
				3870	* cache coherency) and all non-MOCS GPU access will also be uncached so
				3871	* that all direct access to the scanout remains coherent.
				3872	*/
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	3873	int i915_gem_object_set_cache_level(struct drm_i915_gem_object *obj,
				3874	enum i915_cache_level cache_level)
				3875	{
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	3876	struct i915_vma *vma;
Chris Wilson	a6a7cc4	2016-11-18 21:17:46 +0000	[diff] [blame]	3877	int ret;
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	3878
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	3879	lockdep_assert_held(&obj->base.dev->struct_mutex);
				3880
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	3881	if (obj->cache_level == cache_level)
Chris Wilson	a6a7cc4	2016-11-18 21:17:46 +0000	[diff] [blame]	3882	return 0;
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	3883
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3884	/* Inspect the list of currently bound VMA and unbind any that would
				3885	* be invalid given the new cache-level. This is principally to
				3886	* catch the issue of the CS prefetch crossing page boundaries and
				3887	* reading an invalid PTE on older architectures.
				3888	*/
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	3889	restart:
				3890	list_for_each_entry(vma, &obj->vma_list, obj_link) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3891	if (!drm_mm_node_allocated(&vma->node))
				3892	continue;
				3893
Chris Wilson	20dfbde	2016-08-04 16:32:30 +0100	[diff] [blame]	3894	if (i915_vma_is_pinned(vma)) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3895	DRM_DEBUG("can not change the cache level of pinned objects\n");
				3896	return -EBUSY;
				3897	}
				3898
Chris Wilson	010e3e6	2017-12-06 12:49:13 +0000	[diff] [blame]	3899	if (!i915_vma_is_closed(vma) &&
				3900	i915_gem_valid_gtt_space(vma, cache_level))
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	3901	continue;
				3902
				3903	ret = i915_vma_unbind(vma);
				3904	if (ret)
				3905	return ret;
				3906
				3907	/* As unbinding may affect other elements in the
				3908	* obj->vma_list (due to side-effects from retiring
				3909	* an active vma), play safe and restart the iterator.
				3910	*/
				3911	goto restart;
Chris Wilson	42d6ab4	2012-07-26 11:49:32 +0100	[diff] [blame]	3912	}
				3913
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3914	/* We can reuse the existing drm_mm nodes but need to change the
				3915	* cache-level on the PTE. We could simply unbind them all and
				3916	* rebind with the correct cache-level on next use. However since
				3917	* we already have a valid slot, dma mapping, pages etc, we may as
				3918	* rewrite the PTE in the belief that doing so tramples upon less
				3919	* state and so involves less work.
				3920	*/
Chris Wilson	15717de	2016-08-04 07:52:26 +0100	[diff] [blame]	3921	if (obj->bind_count) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3922	/* Before we change the PTE, the GPU must not be accessing it.
				3923	* If we wait upon the object, we know that all the bound
				3924	* VMA are no longer active.
				3925	*/
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3926	ret = i915_gem_object_wait(obj,
				3927	I915_WAIT_INTERRUPTIBLE \|
				3928	I915_WAIT_LOCKED \|
				3929	I915_WAIT_ALL,
				3930	MAX_SCHEDULE_TIMEOUT,
				3931	NULL);
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	3932	if (ret)
				3933	return ret;
				3934
Tvrtko Ursulin	0031fb9	2016-11-04 14:42:44 +0000	[diff] [blame]	3935	if (!HAS_LLC(to_i915(obj->base.dev)) &&
				3936	cache_level != I915_CACHE_NONE) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3937	/* Access to snoopable pages through the GTT is
				3938	* incoherent and on some machines causes a hard
				3939	* lockup. Relinquish the CPU mmaping to force
				3940	* userspace to refault in the pages and we can
				3941	* then double check if the GTT mapping is still
				3942	* valid for that pointer access.
				3943	*/
				3944	i915_gem_release_mmap(obj);
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	3945
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3946	/* As we no longer need a fence for GTT access,
				3947	* we can relinquish it now (and so prevent having
				3948	* to steal a fence from someone else on the next
				3949	* fence request). Note GPU activity would have
				3950	* dropped the fence as all snoopable access is
				3951	* supposed to be linear.
				3952	*/
Chris Wilson	e2189dd	2017-12-07 21:14:07 +0000	[diff] [blame]	3953	for_each_ggtt_vma(vma, obj) {
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	3954	ret = i915_vma_put_fence(vma);
				3955	if (ret)
				3956	return ret;
				3957	}
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3958	} else {
				3959	/* We either have incoherent backing store and
				3960	* so no GTT access or the architecture is fully
				3961	* coherent. In such cases, existing GTT mmaps
				3962	* ignore the cache bit in the PTE and we can
				3963	* rewrite it without confusing the GPU or having
				3964	* to force userspace to fault back in its mmaps.
				3965	*/
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	3966	}
				3967
Chris Wilson	1c7f4bc	2016-02-26 11:03:19 +0000	[diff] [blame]	3968	list_for_each_entry(vma, &obj->vma_list, obj_link) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	3969	if (!drm_mm_node_allocated(&vma->node))
				3970	continue;
				3971
				3972	ret = i915_vma_bind(vma, cache_level, PIN_UPDATE);
				3973	if (ret)
				3974	return ret;
				3975	}
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	3976	}
				3977
Chris Wilson	1c7f4bc	2016-02-26 11:03:19 +0000	[diff] [blame]	3978	list_for_each_entry(vma, &obj->vma_list, obj_link)
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	3979	vma->node.color = cache_level;
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	3980	i915_gem_object_set_cache_coherency(obj, cache_level);
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	3981	obj->cache_dirty = true; /* Always invalidate stale cachelines */
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	3982
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	3983	return 0;
				3984	}
				3985
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	3986	int i915_gem_get_caching_ioctl(struct drm_device dev, void data,
				3987	struct drm_file *file)
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	3988	{
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	3989	struct drm_i915_gem_caching *args = data;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	3990	struct drm_i915_gem_object *obj;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	3991	int err = 0;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	3992
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	3993	rcu_read_lock();
				3994	obj = i915_gem_object_lookup_rcu(file, args->handle);
				3995	if (!obj) {
				3996	err = -ENOENT;
				3997	goto out;
				3998	}
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	3999
Chris Wilson	651d794	2013-08-08 14:41:10 +0100	[diff] [blame]	4000	switch (obj->cache_level) {
				4001	case I915_CACHE_LLC:
				4002	case I915_CACHE_L3_LLC:
				4003	args->caching = I915_CACHING_CACHED;
				4004	break;
				4005
Chris Wilson	4257d3b	2013-08-08 14:41:11 +0100	[diff] [blame]	4006	case I915_CACHE_WT:
				4007	args->caching = I915_CACHING_DISPLAY;
				4008	break;
				4009
Chris Wilson	651d794	2013-08-08 14:41:10 +0100	[diff] [blame]	4010	default:
				4011	args->caching = I915_CACHING_NONE;
				4012	break;
				4013	}
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4014	out:
				4015	rcu_read_unlock();
				4016	return err;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4017	}
				4018
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4019	int i915_gem_set_caching_ioctl(struct drm_device dev, void data,
				4020	struct drm_file *file)
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4021	{
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	4022	struct drm_i915_private *i915 = to_i915(dev);
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4023	struct drm_i915_gem_caching *args = data;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4024	struct drm_i915_gem_object *obj;
				4025	enum i915_cache_level level;
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4026	int ret = 0;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4027
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4028	switch (args->caching) {
				4029	case I915_CACHING_NONE:
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4030	level = I915_CACHE_NONE;
				4031	break;
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4032	case I915_CACHING_CACHED:
Imre Deak	e5756c1	2015-08-14 18:43:30 +0300	[diff] [blame]	4033	/*
				4034	* Due to a HW issue on BXT A stepping, GPU stores via a
				4035	* snooped mapping may leave stale data in a corresponding CPU
				4036	* cacheline, whereas normally such cachelines would get
				4037	* invalidated.
				4038	*/
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	4039	if (!HAS_LLC(i915) && !HAS_SNOOP(i915))
Imre Deak	e5756c1	2015-08-14 18:43:30 +0300	[diff] [blame]	4040	return -ENODEV;
				4041
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4042	level = I915_CACHE_LLC;
				4043	break;
Chris Wilson	4257d3b	2013-08-08 14:41:11 +0100	[diff] [blame]	4044	case I915_CACHING_DISPLAY:
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	4045	level = HAS_WT(i915) ? I915_CACHE_WT : I915_CACHE_NONE;
Chris Wilson	4257d3b	2013-08-08 14:41:11 +0100	[diff] [blame]	4046	break;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4047	default:
				4048	return -EINVAL;
				4049	}
				4050
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4051	obj = i915_gem_object_lookup(file, args->handle);
				4052	if (!obj)
				4053	return -ENOENT;
				4054
Tina Zhang	a03f395	2017-11-14 10:25:13 +0000	[diff] [blame]	4055	/*
				4056	* The caching mode of proxy object is handled by its generator, and
				4057	* not allowed to be changed by userspace.
				4058	*/
				4059	if (i915_gem_object_is_proxy(obj)) {
				4060	ret = -ENXIO;
				4061	goto out;
				4062	}
				4063
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4064	if (obj->cache_level == level)
				4065	goto out;
				4066
				4067	ret = i915_gem_object_wait(obj,
				4068	I915_WAIT_INTERRUPTIBLE,
				4069	MAX_SCHEDULE_TIMEOUT,
				4070	to_rps_client(file));
				4071	if (ret)
				4072	goto out;
				4073
Ben Widawsky	3bc2913	2012-09-26 16:15:20 -0700	[diff] [blame]	4074	ret = i915_mutex_lock_interruptible(dev);
				4075	if (ret)
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4076	goto out;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4077
				4078	ret = i915_gem_object_set_cache_level(obj, level);
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4079	mutex_unlock(&dev->struct_mutex);
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4080
				4081	out:
				4082	i915_gem_object_put(obj);
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4083	return ret;
				4084	}
				4085
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4086	/*
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4087	* Prepare buffer for display plane (scanout, cursors, etc).
				4088	* Can be called from an uninterruptible phase (modesetting) and allows
				4089	* any flushes to be pipelined (for pageflips).
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4090	*/
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4091	struct i915_vma *
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4092	i915_gem_object_pin_to_display_plane(struct drm_i915_gem_object *obj,
				4093	u32 alignment,
Chris Wilson	5935485	2018-02-20 13:42:06 +0000	[diff] [blame]	4094	const struct i915_ggtt_view *view,
				4095	unsigned int flags)
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4096	{
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4097	struct i915_vma *vma;
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4098	int ret;
				4099
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	4100	lockdep_assert_held(&obj->base.dev->struct_mutex);
				4101
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4102	/* Mark the global pin early so that we account for the
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4103	* display coherency whilst setting up the cache domains.
				4104	*/
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4105	obj->pin_global++;
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4106
Eric Anholt	a7ef064	2011-03-29 16:59:54 -0700	[diff] [blame]	4107	/* The display engine is not coherent with the LLC cache on gen6. As
				4108	* a result, we make sure that the pinning that is about to occur is
				4109	* done with uncached PTEs. This is lowest common denominator for all
				4110	* chipsets.
				4111	*
				4112	* However for gen6+, we could do better by using the GFDT bit instead
				4113	* of uncaching, which would allow us to flush all the LLC-cached data
				4114	* with that bit in the PTE to main memory with just one PIPE_CONTROL.
				4115	*/
Chris Wilson	651d794	2013-08-08 14:41:10 +0100	[diff] [blame]	4116	ret = i915_gem_object_set_cache_level(obj,
Tvrtko Ursulin	8652744	2016-10-13 11:03:00 +0100	[diff] [blame]	4117	HAS_WT(to_i915(obj->base.dev)) ?
				4118	I915_CACHE_WT : I915_CACHE_NONE);
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4119	if (ret) {
				4120	vma = ERR_PTR(ret);
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4121	goto err_unpin_global;
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4122	}
Eric Anholt	a7ef064	2011-03-29 16:59:54 -0700	[diff] [blame]	4123
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4124	/* As the user may map the buffer once pinned in the display plane
				4125	* (e.g. libkms for the bootup splash), we have to ensure that we
Chris Wilson	2efb813	2016-08-18 17:17:06 +0100	[diff] [blame]	4126	* always use map_and_fenceable for all scanout buffers. However,
				4127	* it may simply be too big to fit into mappable, in which case
				4128	* put it anyway and hope that userspace can cope (but always first
				4129	* try to preserve the existing ABI).
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4130	*/
Chris Wilson	2efb813	2016-08-18 17:17:06 +0100	[diff] [blame]	4131	vma = ERR_PTR(-ENOSPC);
Chris Wilson	5935485	2018-02-20 13:42:06 +0000	[diff] [blame]	4132	if ((flags & PIN_MAPPABLE) == 0 &&
				4133	(!view \|\| view->type == I915_GGTT_VIEW_NORMAL))
Chris Wilson	2efb813	2016-08-18 17:17:06 +0100	[diff] [blame]	4134	vma = i915_gem_object_ggtt_pin(obj, view, 0, alignment,
Chris Wilson	5935485	2018-02-20 13:42:06 +0000	[diff] [blame]	4135	flags \|
				4136	PIN_MAPPABLE \|
				4137	PIN_NONBLOCK);
				4138	if (IS_ERR(vma))
Chris Wilson	767a222	2016-11-07 11:01:28 +0000	[diff] [blame]	4139	vma = i915_gem_object_ggtt_pin(obj, view, 0, alignment, flags);
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4140	if (IS_ERR(vma))
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4141	goto err_unpin_global;
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4142
Chris Wilson	d8923dc	2016-08-18 17:17:07 +0100	[diff] [blame]	4143	vma->display_alignment = max_t(u64, vma->display_alignment, alignment);
				4144
Chris Wilson	a6a7cc4	2016-11-18 21:17:46 +0000	[diff] [blame]	4145	/* Treat this as an end-of-frame, like intel_user_framebuffer_dirty() */
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	4146	__i915_gem_object_flush_for_display(obj);
Chris Wilson	d59b21e	2017-02-22 11:40:49 +0000	[diff] [blame]	4147	intel_fb_obj_flush(obj, ORIGIN_DIRTYFB);
Chris Wilson	b118c1e	2010-05-27 13:18:14 +0100	[diff] [blame]	4148
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4149	/* It should now be out of any other write domains, and we can update
				4150	* the domain values for our changes.
				4151	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4152	obj->read_domains \|= I915_GEM_DOMAIN_GTT;
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4153
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4154	return vma;
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4155
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4156	err_unpin_global:
				4157	obj->pin_global--;
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4158	return vma;
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4159	}
				4160
				4161	void
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4162	i915_gem_object_unpin_from_display_plane(struct i915_vma *vma)
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4163	{
Chris Wilson	49d7391	2016-11-29 09:50:08 +0000	[diff] [blame]	4164	lockdep_assert_held(&vma->vm->i915->drm.struct_mutex);
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	4165
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4166	if (WARN_ON(vma->obj->pin_global == 0))
Tvrtko Ursulin	8a0c39b	2015-04-13 11:50:09 +0100	[diff] [blame]	4167	return;
				4168
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4169	if (--vma->obj->pin_global == 0)
Chris Wilson	f51455d	2017-01-10 14:47:34 +0000	[diff] [blame]	4170	vma->display_alignment = I915_GTT_MIN_ALIGNMENT;
Tvrtko Ursulin	e661733	2015-03-23 11:10:33 +0000	[diff] [blame]	4171
Chris Wilson	383d582	2016-08-18 17:17:08 +0100	[diff] [blame]	4172	/* Bump the LRU to try and avoid premature eviction whilst flipping */
Chris Wilson	befedbb	2017-01-19 19:26:55 +0000	[diff] [blame]	4173	i915_gem_object_bump_inactive_ggtt(vma->obj);
Chris Wilson	383d582	2016-08-18 17:17:08 +0100	[diff] [blame]	4174
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4175	i915_vma_unpin(vma);
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4176	}
				4177
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4178	/**
				4179	* Moves a single object to the CPU read, and possibly write domain.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	4180	* @obj: object to act on
				4181	* @write: requesting write or read-only access
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4182	*
				4183	* This function returns when the move is complete, including waiting on
				4184	* flushes to occur.
				4185	*/
Chris Wilson	dabdfe0	2012-03-26 10:10:27 +0200	[diff] [blame]	4186	int
Chris Wilson	919926a	2010-11-12 13:42:53 +0000	[diff] [blame]	4187	i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4188	{
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4189	int ret;
				4190
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4191	lockdep_assert_held(&obj->base.dev->struct_mutex);
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	4192
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4193	ret = i915_gem_object_wait(obj,
				4194	I915_WAIT_INTERRUPTIBLE \|
				4195	I915_WAIT_LOCKED \|
				4196	(write ? I915_WAIT_ALL : 0),
				4197	MAX_SCHEDULE_TIMEOUT,
				4198	NULL);
Chris Wilson	8824178	2011-01-07 17:09:48 +0000	[diff] [blame]	4199	if (ret)
				4200	return ret;
				4201
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	4202	flush_write_domain(obj, ~I915_GEM_DOMAIN_CPU);
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4203
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4204	/* Flush the CPU cache if it's still invalid. */
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4205	if ((obj->read_domains & I915_GEM_DOMAIN_CPU) == 0) {
Chris Wilson	57822dc	2017-02-22 11:40:48 +0000	[diff] [blame]	4206	i915_gem_clflush_object(obj, I915_CLFLUSH_SYNC);
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4207	obj->read_domains \|= I915_GEM_DOMAIN_CPU;
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4208	}
				4209
				4210	/* It should now be out of any other write domains, and we can update
				4211	* the domain values for our changes.
				4212	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4213	GEM_BUG_ON(obj->write_domain & ~I915_GEM_DOMAIN_CPU);
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4214
				4215	/* If we're writing through the CPU, then the GPU read domains will
				4216	* need to be invalidated at next use.
				4217	*/
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	4218	if (write)
				4219	__start_cpu_write(obj);
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	4220
				4221	return 0;
				4222	}
				4223
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4224	/* Throttle our rendering by waiting until the ring has completed our requests
				4225	* emitted over 20 msec ago.
				4226	*
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	4227	* Note that if we were to use the current jiffies each time around the loop,
				4228	* we wouldn't escape the function with any frames outstanding if the time to
				4229	* render a frame was over 20ms.
				4230	*
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4231	* This should get us reasonable parallelism between CPU and GPU but also
				4232	* relatively low latency when blocking on a particular request to finish.
				4233	*/
				4234	static int
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	4235	i915_gem_ring_throttle(struct drm_device dev, struct drm_file file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4236	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	4237	struct drm_i915_private *dev_priv = to_i915(dev);
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	4238	struct drm_i915_file_private *file_priv = file->driver_priv;
Chris Wilson	d0bc54f	2015-05-21 21:01:48 +0100	[diff] [blame]	4239	unsigned long recent_enough = jiffies - DRM_I915_THROTTLE_JIFFIES;
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4240	struct i915_request request, target = NULL;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4241	long ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4242
Chris Wilson	f4457ae	2016-04-13 17:35:08 +0100	[diff] [blame]	4243	/* ABI: return -EIO if already wedged */
				4244	if (i915_terminally_wedged(&dev_priv->gpu_error))
				4245	return -EIO;
Chris Wilson	e110e8d	2011-01-26 15:39:14 +0000	[diff] [blame]	4246
Chris Wilson	1c25595	2010-09-26 11:03:27 +0100	[diff] [blame]	4247	spin_lock(&file_priv->mm.lock);
Chris Wilson	c8659ef	2017-03-02 12:25:25 +0000	[diff] [blame]	4248	list_for_each_entry(request, &file_priv->mm.request_list, client_link) {
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	4249	if (time_after_eq(request->emitted_jiffies, recent_enough))
				4250	break;
				4251
Chris Wilson	c8659ef	2017-03-02 12:25:25 +0000	[diff] [blame]	4252	if (target) {
				4253	list_del(&target->client_link);
				4254	target->file_priv = NULL;
				4255	}
John Harrison	fcfa423c	2015-05-29 17:44:12 +0100	[diff] [blame]	4256
John Harrison	54fb241	2014-11-24 18:49:27 +0000	[diff] [blame]	4257	target = request;
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	4258	}
John Harrison	ff86588	2014-11-24 18:49:28 +0000	[diff] [blame]	4259	if (target)
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4260	i915_request_get(target);
Chris Wilson	1c25595	2010-09-26 11:03:27 +0100	[diff] [blame]	4261	spin_unlock(&file_priv->mm.lock);
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	4262
John Harrison	54fb241	2014-11-24 18:49:27 +0000	[diff] [blame]	4263	if (target == NULL)
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	4264	return 0;
				4265
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4266	ret = i915_request_wait(target,
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4267	I915_WAIT_INTERRUPTIBLE,
				4268	MAX_SCHEDULE_TIMEOUT);
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4269	i915_request_put(target);
John Harrison	ff86588	2014-11-24 18:49:28 +0000	[diff] [blame]	4270
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4271	return ret < 0 ? ret : 0;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4272	}
				4273
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4274	struct i915_vma *
Joonas Lahtinen	ec7adb6	2015-03-16 14:11:13 +0200	[diff] [blame]	4275	i915_gem_object_ggtt_pin(struct drm_i915_gem_object *obj,
				4276	const struct i915_ggtt_view *view,
Chris Wilson	91b2db6	2016-08-04 16:32:23 +0100	[diff] [blame]	4277	u64 size,
Chris Wilson	2ffffd0	2016-08-04 16:32:22 +0100	[diff] [blame]	4278	u64 alignment,
				4279	u64 flags)
Joonas Lahtinen	ec7adb6	2015-03-16 14:11:13 +0200	[diff] [blame]	4280	{
Chris Wilson	ad16d2e	2016-10-13 09:55:04 +0100	[diff] [blame]	4281	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
				4282	struct i915_address_space *vm = &dev_priv->ggtt.base;
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4283	struct i915_vma *vma;
				4284	int ret;
Joonas Lahtinen	72e96d6	2016-03-30 16:57:10 +0300	[diff] [blame]	4285
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	4286	lockdep_assert_held(&obj->base.dev->struct_mutex);
				4287
Chris Wilson	ac87a6fd	2018-02-20 13:42:05 +0000	[diff] [blame]	4288	if (flags & PIN_MAPPABLE &&
				4289	(!view \|\| view->type == I915_GGTT_VIEW_NORMAL)) {
Chris Wilson	43ae70d	2017-10-09 09:44:01 +0100	[diff] [blame]	4290	/* If the required space is larger than the available
				4291	* aperture, we will not able to find a slot for the
				4292	* object and unbinding the object now will be in
				4293	* vain. Worse, doing so may cause us to ping-pong
				4294	* the object in and out of the Global GTT and
				4295	* waste a lot of cycles under the mutex.
				4296	*/
				4297	if (obj->base.size > dev_priv->ggtt.mappable_end)
				4298	return ERR_PTR(-E2BIG);
				4299
				4300	/* If NONBLOCK is set the caller is optimistically
				4301	* trying to cache the full object within the mappable
				4302	* aperture, and must have a fallback in place for
				4303	* situations where we cannot bind the object. We
				4304	* can be a little more lax here and use the fallback
				4305	* more often to avoid costly migrations of ourselves
				4306	* and other objects within the aperture.
				4307	*
				4308	* Half-the-aperture is used as a simple heuristic.
				4309	* More interesting would to do search for a free
				4310	* block prior to making the commitment to unbind.
				4311	* That caters for the self-harm case, and with a
				4312	* little more heuristics (e.g. NOFAULT, NOEVICT)
				4313	* we could try to minimise harm to others.
				4314	*/
				4315	if (flags & PIN_NONBLOCK &&
				4316	obj->base.size > dev_priv->ggtt.mappable_end / 2)
				4317	return ERR_PTR(-ENOSPC);
				4318	}
				4319
Chris Wilson	718659a	2017-01-16 15:21:28 +0000	[diff] [blame]	4320	vma = i915_vma_instance(obj, vm, view);
Chris Wilson	e0216b7	2017-01-19 19:26:57 +0000	[diff] [blame]	4321	if (unlikely(IS_ERR(vma)))
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4322	return vma;
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4323
				4324	if (i915_vma_misplaced(vma, size, alignment, flags)) {
Chris Wilson	43ae70d	2017-10-09 09:44:01 +0100	[diff] [blame]	4325	if (flags & PIN_NONBLOCK) {
				4326	if (i915_vma_is_pinned(vma) \|\| i915_vma_is_active(vma))
				4327	return ERR_PTR(-ENOSPC);
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4328
Chris Wilson	43ae70d	2017-10-09 09:44:01 +0100	[diff] [blame]	4329	if (flags & PIN_MAPPABLE &&
Chris Wilson	944397f	2017-01-09 16:16:11 +0000	[diff] [blame]	4330	vma->fence_size > dev_priv->ggtt.mappable_end / 2)
Chris Wilson	ad16d2e	2016-10-13 09:55:04 +0100	[diff] [blame]	4331	return ERR_PTR(-ENOSPC);
				4332	}
				4333
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4334	WARN(i915_vma_is_pinned(vma),
				4335	"bo is already pinned in ggtt with incorrect alignment:"
Chris Wilson	05a20d0	2016-08-18 17:16:55 +0100	[diff] [blame]	4336	" offset=%08x, req.alignment=%llx,"
				4337	" req.map_and_fenceable=%d, vma->map_and_fenceable=%d\n",
				4338	i915_ggtt_offset(vma), alignment,
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4339	!!(flags & PIN_MAPPABLE),
Chris Wilson	05a20d0	2016-08-18 17:16:55 +0100	[diff] [blame]	4340	i915_vma_is_map_and_fenceable(vma));
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4341	ret = i915_vma_unbind(vma);
				4342	if (ret)
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4343	return ERR_PTR(ret);
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4344	}
				4345
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4346	ret = i915_vma_pin(vma, size, alignment, flags \| PIN_GLOBAL);
				4347	if (ret)
				4348	return ERR_PTR(ret);
Joonas Lahtinen	ec7adb6	2015-03-16 14:11:13 +0200	[diff] [blame]	4349
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4350	return vma;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4351	}
				4352
Chris Wilson	edf6b76	2016-08-09 09:23:33 +0100	[diff] [blame]	4353	static __always_inline unsigned int __busy_read_flag(unsigned int id)
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4354	{
				4355	/* Note that we could alias engines in the execbuf API, but
				4356	* that would be very unwise as it prevents userspace from
				4357	* fine control over engine selection. Ahem.
				4358	*
				4359	* This should be something like EXEC_MAX_ENGINE instead of
				4360	* I915_NUM_ENGINES.
				4361	*/
				4362	BUILD_BUG_ON(I915_NUM_ENGINES > 16);
				4363	return 0x10000 << id;
				4364	}
				4365
				4366	static __always_inline unsigned int __busy_write_id(unsigned int id)
				4367	{
Chris Wilson	70cb472	2016-08-09 18:08:25 +0100	[diff] [blame]	4368	/* The uABI guarantees an active writer is also amongst the read
				4369	* engines. This would be true if we accessed the activity tracking
				4370	* under the lock, but as we perform the lookup of the object and
				4371	* its activity locklessly we can not guarantee that the last_write
				4372	* being active implies that we have set the same engine flag from
				4373	* last_read - hence we always set both read and write busy for
				4374	* last_write.
				4375	*/
				4376	return id \| __busy_read_flag(id);
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4377	}
				4378
Chris Wilson	edf6b76	2016-08-09 09:23:33 +0100	[diff] [blame]	4379	static __always_inline unsigned int
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4380	__busy_set_if_active(const struct dma_fence *fence,
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4381	unsigned int (*flag)(unsigned int id))
				4382	{
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4383	struct i915_request *rq;
Chris Wilson	1255501	2016-08-16 09:50:40 +0100	[diff] [blame]	4384
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4385	/* We have to check the current hw status of the fence as the uABI
				4386	* guarantees forward progress. We could rely on the idle worker
				4387	* to eventually flush us, but to minimise latency just ask the
				4388	* hardware.
				4389	*
				4390	* Note we only report on the status of native fences.
				4391	*/
				4392	if (!dma_fence_is_i915(fence))
Chris Wilson	1255501	2016-08-16 09:50:40 +0100	[diff] [blame]	4393	return 0;
				4394
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4395	/* opencode to_request() in order to avoid const warnings */
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4396	rq = container_of(fence, struct i915_request, fence);
				4397	if (i915_request_completed(rq))
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4398	return 0;
				4399
Chris Wilson	1d39f28	2017-04-11 13:43:06 +0100	[diff] [blame]	4400	return flag(rq->engine->uabi_id);
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4401	}
				4402
Chris Wilson	edf6b76	2016-08-09 09:23:33 +0100	[diff] [blame]	4403	static __always_inline unsigned int
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4404	busy_check_reader(const struct dma_fence *fence)
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4405	{
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4406	return __busy_set_if_active(fence, __busy_read_flag);
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4407	}
				4408
Chris Wilson	edf6b76	2016-08-09 09:23:33 +0100	[diff] [blame]	4409	static __always_inline unsigned int
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4410	busy_check_writer(const struct dma_fence *fence)
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4411	{
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4412	if (!fence)
				4413	return 0;
				4414
				4415	return __busy_set_if_active(fence, __busy_write_id);
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4416	}
				4417
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4418	int
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4419	i915_gem_busy_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	4420	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4421	{
				4422	struct drm_i915_gem_busy *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	4423	struct drm_i915_gem_object *obj;
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4424	struct reservation_object_list *list;
				4425	unsigned int seq;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4426	int err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4427
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4428	err = -ENOENT;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4429	rcu_read_lock();
				4430	obj = i915_gem_object_lookup_rcu(file, args->handle);
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4431	if (!obj)
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4432	goto out;
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4433
				4434	/* A discrepancy here is that we do not report the status of
				4435	* non-i915 fences, i.e. even though we may report the object as idle,
				4436	* a call to set-domain may still stall waiting for foreign rendering.
				4437	* This also means that wait-ioctl may report an object as busy,
				4438	* where busy-ioctl considers it idle.
				4439	*
				4440	* We trade the ability to warn of foreign fences to report on which
				4441	* i915 engines are active for the object.
				4442	*
				4443	* Alternatively, we can trade that extra information on read/write
				4444	* activity with
				4445	* args->busy =
				4446	* !reservation_object_test_signaled_rcu(obj->resv, true);
				4447	* to report the overall busyness. This is what the wait-ioctl does.
				4448	*
				4449	*/
				4450	retry:
				4451	seq = raw_read_seqcount(&obj->resv->seq);
				4452
				4453	/* Translate the exclusive fence to the READ and WRITE engine */
				4454	args->busy = busy_check_writer(rcu_dereference(obj->resv->fence_excl));
				4455
				4456	/* Translate shared fences to READ set of engines */
				4457	list = rcu_dereference(obj->resv->fence);
				4458	if (list) {
				4459	unsigned int shared_count = list->shared_count, i;
				4460
				4461	for (i = 0; i < shared_count; ++i) {
				4462	struct dma_fence *fence =
				4463	rcu_dereference(list->shared[i]);
				4464
				4465	args->busy \|= busy_check_reader(fence);
				4466	}
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4467	}
Zou Nan hai	d1b851f	2010-05-21 09:08:57 +0800	[diff] [blame]	4468
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4469	if (args->busy && read_seqcount_retry(&obj->resv->seq, seq))
				4470	goto retry;
Chris Wilson	426960b	2016-01-15 16:51:46 +0000	[diff] [blame]	4471
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4472	err = 0;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4473	out:
				4474	rcu_read_unlock();
				4475	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4476	}
				4477
				4478	int
				4479	i915_gem_throttle_ioctl(struct drm_device dev, void data,
				4480	struct drm_file *file_priv)
				4481	{
Akshay Joshi	0206e35	2011-08-16 15:34:10 -0400	[diff] [blame]	4482	return i915_gem_ring_throttle(dev, file_priv);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4483	}
				4484
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4485	int
				4486	i915_gem_madvise_ioctl(struct drm_device dev, void data,
				4487	struct drm_file *file_priv)
				4488	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	4489	struct drm_i915_private *dev_priv = to_i915(dev);
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4490	struct drm_i915_gem_madvise *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	4491	struct drm_i915_gem_object *obj;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4492	int err;
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4493
				4494	switch (args->madv) {
				4495	case I915_MADV_DONTNEED:
				4496	case I915_MADV_WILLNEED:
				4497	break;
				4498	default:
				4499	return -EINVAL;
				4500	}
				4501
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	4502	obj = i915_gem_object_lookup(file_priv, args->handle);
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4503	if (!obj)
				4504	return -ENOENT;
				4505
				4506	err = mutex_lock_interruptible(&obj->mm.lock);
				4507	if (err)
				4508	goto out;
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4509
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	4510	if (i915_gem_object_has_pages(obj) &&
Chris Wilson	3e510a8	2016-08-05 10:14:23 +0100	[diff] [blame]	4511	i915_gem_object_is_tiled(obj) &&
Daniel Vetter	656bfa3	2014-11-20 09:26:30 +0100	[diff] [blame]	4512	dev_priv->quirks & QUIRK_PIN_SWIZZLED_PAGES) {
Chris Wilson	bc0629a	2016-11-01 10:03:17 +0000	[diff] [blame]	4513	if (obj->mm.madv == I915_MADV_WILLNEED) {
				4514	GEM_BUG_ON(!obj->mm.quirked);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4515	__i915_gem_object_unpin_pages(obj);
Chris Wilson	bc0629a	2016-11-01 10:03:17 +0000	[diff] [blame]	4516	obj->mm.quirked = false;
				4517	}
				4518	if (args->madv == I915_MADV_WILLNEED) {
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	4519	GEM_BUG_ON(obj->mm.quirked);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4520	__i915_gem_object_pin_pages(obj);
Chris Wilson	bc0629a	2016-11-01 10:03:17 +0000	[diff] [blame]	4521	obj->mm.quirked = true;
				4522	}
Daniel Vetter	656bfa3	2014-11-20 09:26:30 +0100	[diff] [blame]	4523	}
				4524
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4525	if (obj->mm.madv != __I915_MADV_PURGED)
				4526	obj->mm.madv = args->madv;
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4527
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	4528	/* if the object is no longer attached, discard its backing storage */
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	4529	if (obj->mm.madv == I915_MADV_DONTNEED &&
				4530	!i915_gem_object_has_pages(obj))
Chris Wilson	2d7ef39	2009-09-20 23:13:10 +0100	[diff] [blame]	4531	i915_gem_object_truncate(obj);
				4532
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4533	args->retained = obj->mm.madv != __I915_MADV_PURGED;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4534	mutex_unlock(&obj->mm.lock);
Chris Wilson	bb6baf7	2009-09-22 14:24:13 +0100	[diff] [blame]	4535
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4536	out:
Chris Wilson	f8c417c	2016-07-20 13:31:53 +0100	[diff] [blame]	4537	i915_gem_object_put(obj);
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4538	return err;
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4539	}
				4540
Chris Wilson	5b8c8ae	2016-11-16 19:07:04 +0000	[diff] [blame]	4541	static void
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4542	frontbuffer_retire(struct i915_gem_active active, struct i915_request request)
Chris Wilson	5b8c8ae	2016-11-16 19:07:04 +0000	[diff] [blame]	4543	{
				4544	struct drm_i915_gem_object *obj =
				4545	container_of(active, typeof(*obj), frontbuffer_write);
				4546
Chris Wilson	d59b21e	2017-02-22 11:40:49 +0000	[diff] [blame]	4547	intel_fb_obj_flush(obj, ORIGIN_CS);
Chris Wilson	5b8c8ae	2016-11-16 19:07:04 +0000	[diff] [blame]	4548	}
				4549
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4550	void i915_gem_object_init(struct drm_i915_gem_object *obj,
				4551	const struct drm_i915_gem_object_ops *ops)
Chris Wilson	0327d6b	2012-08-11 15:41:06 +0100	[diff] [blame]	4552	{
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4553	mutex_init(&obj->mm.lock);
				4554
Ben Widawsky	2f63315	2013-07-17 12:19:03 -0700	[diff] [blame]	4555	INIT_LIST_HEAD(&obj->vma_list);
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	4556	INIT_LIST_HEAD(&obj->lut_list);
Chris Wilson	8d9d574	2015-04-07 16:20:38 +0100	[diff] [blame]	4557	INIT_LIST_HEAD(&obj->batch_pool_link);
Chris Wilson	0327d6b	2012-08-11 15:41:06 +0100	[diff] [blame]	4558
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4559	obj->ops = ops;
				4560
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4561	reservation_object_init(&obj->__builtin_resv);
				4562	obj->resv = &obj->__builtin_resv;
				4563
Chris Wilson	5034924	2016-08-18 17:17:04 +0100	[diff] [blame]	4564	obj->frontbuffer_ggtt_origin = ORIGIN_GTT;
Chris Wilson	5b8c8ae	2016-11-16 19:07:04 +0000	[diff] [blame]	4565	init_request_active(&obj->frontbuffer_write, frontbuffer_retire);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4566
				4567	obj->mm.madv = I915_MADV_WILLNEED;
				4568	INIT_RADIX_TREE(&obj->mm.get_page.radix, GFP_KERNEL \| __GFP_NOWARN);
				4569	mutex_init(&obj->mm.get_page.lock);
Chris Wilson	0327d6b	2012-08-11 15:41:06 +0100	[diff] [blame]	4570
Dave Gordon	f19ec8c	2016-07-04 11:34:37 +0100	[diff] [blame]	4571	i915_gem_info_add_obj(to_i915(obj->base.dev), obj->base.size);
Chris Wilson	0327d6b	2012-08-11 15:41:06 +0100	[diff] [blame]	4572	}
				4573
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4574	static const struct drm_i915_gem_object_ops i915_gem_object_ops = {
Tvrtko Ursulin	3599a91	2016-11-01 14:44:10 +0000	[diff] [blame]	4575	.flags = I915_GEM_OBJECT_HAS_STRUCT_PAGE \|
				4576	I915_GEM_OBJECT_IS_SHRINKABLE,
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	4577
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4578	.get_pages = i915_gem_object_get_pages_gtt,
				4579	.put_pages = i915_gem_object_put_pages_gtt,
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	4580
				4581	.pwrite = i915_gem_object_pwrite_gtt,
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4582	};
				4583
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	4584	static int i915_gem_object_create_shmem(struct drm_device *dev,
				4585	struct drm_gem_object *obj,
				4586	size_t size)
				4587	{
				4588	struct drm_i915_private *i915 = to_i915(dev);
				4589	unsigned long flags = VM_NORESERVE;
				4590	struct file *filp;
				4591
				4592	drm_gem_private_object_init(dev, obj, size);
				4593
				4594	if (i915->mm.gemfs)
				4595	filp = shmem_file_setup_with_mnt(i915->mm.gemfs, "i915", size,
				4596	flags);
				4597	else
				4598	filp = shmem_file_setup("i915", size, flags);
				4599
				4600	if (IS_ERR(filp))
				4601	return PTR_ERR(filp);
				4602
				4603	obj->filp = filp;
				4604
				4605	return 0;
				4606	}
				4607
Chris Wilson	b4bcbe2	2016-10-18 13:02:49 +0100	[diff] [blame]	4608	struct drm_i915_gem_object *
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	4609	i915_gem_object_create(struct drm_i915_private *dev_priv, u64 size)
Daniel Vetter	ac52bc5	2010-04-09 19:05:06 +0000	[diff] [blame]	4610	{
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4611	struct drm_i915_gem_object *obj;
Hugh Dickins	5949eac	2011-06-27 16:18:18 -0700	[diff] [blame]	4612	struct address_space *mapping;
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	4613	unsigned int cache_level;
Daniel Vetter	1a240d4	2012-11-29 22:18:51 +0100	[diff] [blame]	4614	gfp_t mask;
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4615	int ret;
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4616
Chris Wilson	b4bcbe2	2016-10-18 13:02:49 +0100	[diff] [blame]	4617	/* There is a prevalence of the assumption that we fit the object's
				4618	* page count inside a 32bit _signed_ variable. Let's document this and
				4619	* catch if we ever need to fix it. In the meantime, if you do spot
				4620	* such a local variable, please consider fixing!
				4621	*/
Tvrtko Ursulin	7a3ee5d	2017-03-30 17:31:30 +0100	[diff] [blame]	4622	if (size >> PAGE_SHIFT > INT_MAX)
Chris Wilson	b4bcbe2	2016-10-18 13:02:49 +0100	[diff] [blame]	4623	return ERR_PTR(-E2BIG);
				4624
				4625	if (overflows_type(size, obj->base.size))
				4626	return ERR_PTR(-E2BIG);
				4627
Tvrtko Ursulin	187685c	2016-12-01 14:16:36 +0000	[diff] [blame]	4628	obj = i915_gem_object_alloc(dev_priv);
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4629	if (obj == NULL)
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4630	return ERR_PTR(-ENOMEM);
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4631
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	4632	ret = i915_gem_object_create_shmem(&dev_priv->drm, &obj->base, size);
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4633	if (ret)
				4634	goto fail;
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4635
Chris Wilson	bed1ea9	2012-05-24 20:48:12 +0100	[diff] [blame]	4636	mask = GFP_HIGHUSER \| __GFP_RECLAIMABLE;
Jani Nikula	c0f8683	2016-12-07 12:13:04 +0200	[diff] [blame]	4637	if (IS_I965GM(dev_priv) \|\| IS_I965G(dev_priv)) {
Chris Wilson	bed1ea9	2012-05-24 20:48:12 +0100	[diff] [blame]	4638	/* 965gm cannot relocate objects above 4GiB. */
				4639	mask &= ~__GFP_HIGHMEM;
				4640	mask \|= __GFP_DMA32;
				4641	}
				4642
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	4643	mapping = obj->base.filp->f_mapping;
Chris Wilson	bed1ea9	2012-05-24 20:48:12 +0100	[diff] [blame]	4644	mapping_set_gfp_mask(mapping, mask);
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	4645	GEM_BUG_ON(!(mapping_gfp_mask(mapping) & __GFP_RECLAIM));
Hugh Dickins	5949eac	2011-06-27 16:18:18 -0700	[diff] [blame]	4646
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4647	i915_gem_object_init(obj, &i915_gem_object_ops);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	4648
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4649	obj->write_domain = I915_GEM_DOMAIN_CPU;
				4650	obj->read_domains = I915_GEM_DOMAIN_CPU;
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4651
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	4652	if (HAS_LLC(dev_priv))
Eugeni Dodonov	3d29b84	2012-01-17 14:43:53 -0200	[diff] [blame]	4653	/* On some devices, we can have the GPU use the LLC (the CPU
Eric Anholt	a187111	2011-03-29 16:59:55 -0700	[diff] [blame]	4654	* cache) for about a 10% performance improvement
				4655	* compared to uncached. Graphics requests other than
				4656	* display scanout are coherent with the CPU in
				4657	* accessing this cache. This means in this mode we
				4658	* don't need to clflush on the CPU side, and on the
				4659	* GPU side we only need to flush internal caches to
				4660	* get data visible to the CPU.
				4661	*
				4662	* However, we maintain the display planes as UC, and so
				4663	* need to rebind when first used as such.
				4664	*/
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	4665	cache_level = I915_CACHE_LLC;
				4666	else
				4667	cache_level = I915_CACHE_NONE;
Eric Anholt	a187111	2011-03-29 16:59:55 -0700	[diff] [blame]	4668
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	4669	i915_gem_object_set_cache_coherency(obj, cache_level);
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	4670
Daniel Vetter	d861e33	2013-07-24 23:25:03 +0200	[diff] [blame]	4671	trace_i915_gem_object_create(obj);
				4672
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	4673	return obj;
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4674
				4675	fail:
				4676	i915_gem_object_free(obj);
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4677	return ERR_PTR(ret);
Daniel Vetter	ac52bc5	2010-04-09 19:05:06 +0000	[diff] [blame]	4678	}
				4679
Chris Wilson	340fbd8	2014-05-22 09:16:52 +0100	[diff] [blame]	4680	static bool discard_backing_storage(struct drm_i915_gem_object *obj)
				4681	{
				4682	/* If we are the last user of the backing storage (be it shmemfs
				4683	* pages or stolen etc), we know that the pages are going to be
				4684	* immediately released. In this case, we can then skip copying
				4685	* back the contents from the GPU.
				4686	*/
				4687
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4688	if (obj->mm.madv != I915_MADV_WILLNEED)
Chris Wilson	340fbd8	2014-05-22 09:16:52 +0100	[diff] [blame]	4689	return false;
				4690
				4691	if (obj->base.filp == NULL)
				4692	return true;
				4693
				4694	/* At first glance, this looks racy, but then again so would be
				4695	* userspace racing mmap against close. However, the first external
				4696	* reference to the filp can only be obtained through the
				4697	* i915_gem_mmap_ioctl() which safeguards us against the user
				4698	* acquiring such a reference whilst we are in the middle of
				4699	* freeing the object.
				4700	*/
				4701	return atomic_long_read(&obj->base.filp->f_count) == 1;
				4702	}
				4703
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4704	static void __i915_gem_free_objects(struct drm_i915_private *i915,
				4705	struct llist_node *freed)
Chris Wilson	be72615	2010-07-23 23:18:50 +0100	[diff] [blame]	4706	{
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4707	struct drm_i915_gem_object obj, on;
Chris Wilson	be72615	2010-07-23 23:18:50 +0100	[diff] [blame]	4708
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4709	intel_runtime_pm_get(i915);
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4710	llist_for_each_entry_safe(obj, on, freed, freed) {
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4711	struct i915_vma vma, vn;
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	4712
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4713	trace_i915_gem_object_destroy(obj);
				4714
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4715	mutex_lock(&i915->drm.struct_mutex);
				4716
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4717	GEM_BUG_ON(i915_gem_object_is_active(obj));
				4718	list_for_each_entry_safe(vma, vn,
				4719	&obj->vma_list, obj_link) {
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4720	GEM_BUG_ON(i915_vma_is_active(vma));
				4721	vma->flags &= ~I915_VMA_PIN_MASK;
				4722	i915_vma_close(vma);
				4723	}
Chris Wilson	db6c2b4	2016-11-01 11:54:00 +0000	[diff] [blame]	4724	GEM_BUG_ON(!list_empty(&obj->vma_list));
				4725	GEM_BUG_ON(!RB_EMPTY_ROOT(&obj->vma_tree));
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4726
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	4727	/* This serializes freeing with the shrinker. Since the free
				4728	* is delayed, first by RCU then by the workqueue, we want the
				4729	* shrinker to be able to free pages of unreferenced objects,
				4730	* or else we may oom whilst there are plenty of deferred
				4731	* freed objects.
				4732	*/
				4733	if (i915_gem_object_has_pages(obj)) {
				4734	spin_lock(&i915->mm.obj_lock);
				4735	list_del_init(&obj->mm.link);
				4736	spin_unlock(&i915->mm.obj_lock);
				4737	}
				4738
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4739	mutex_unlock(&i915->drm.struct_mutex);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4740
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4741	GEM_BUG_ON(obj->bind_count);
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	4742	GEM_BUG_ON(obj->userfault_count);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4743	GEM_BUG_ON(atomic_read(&obj->frontbuffer_bits));
Chris Wilson	67b4804	2017-08-22 12:05:16 +0100	[diff] [blame]	4744	GEM_BUG_ON(!list_empty(&obj->lut_list));
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4745
				4746	if (obj->ops->release)
				4747	obj->ops->release(obj);
				4748
				4749	if (WARN_ON(i915_gem_object_has_pinned_pages(obj)))
				4750	atomic_set(&obj->mm.pages_pin_count, 0);
Chris Wilson	548625e	2016-11-01 12:11:34 +0000	[diff] [blame]	4751	__i915_gem_object_put_pages(obj, I915_MM_NORMAL);
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	4752	GEM_BUG_ON(i915_gem_object_has_pages(obj));
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4753
				4754	if (obj->base.import_attach)
				4755	drm_prime_gem_destroy(&obj->base, NULL);
				4756
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4757	reservation_object_fini(&obj->__builtin_resv);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4758	drm_gem_object_release(&obj->base);
				4759	i915_gem_info_remove_obj(i915, obj->base.size);
				4760
				4761	kfree(obj->bit_17);
				4762	i915_gem_object_free(obj);
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4763
Chris Wilson	c9c7047	2018-02-19 22:06:31 +0000	[diff] [blame]	4764	GEM_BUG_ON(!atomic_read(&i915->mm.free_count));
				4765	atomic_dec(&i915->mm.free_count);
				4766
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4767	if (on)
				4768	cond_resched();
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4769	}
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4770	intel_runtime_pm_put(i915);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4771	}
				4772
				4773	static void i915_gem_flush_free_objects(struct drm_i915_private *i915)
				4774	{
				4775	struct llist_node *freed;
				4776
Chris Wilson	87701b4	2017-10-13 21:26:20 +0100	[diff] [blame]	4777	/* Free the oldest, most stale object to keep the free_list short */
				4778	freed = NULL;
				4779	if (!llist_empty(&i915->mm.free_list)) { /* quick test for hotpath */
				4780	/* Only one consumer of llist_del_first() allowed */
				4781	spin_lock(&i915->mm.free_lock);
				4782	freed = llist_del_first(&i915->mm.free_list);
				4783	spin_unlock(&i915->mm.free_lock);
				4784	}
				4785	if (unlikely(freed)) {
				4786	freed->next = NULL;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4787	__i915_gem_free_objects(i915, freed);
Chris Wilson	87701b4	2017-10-13 21:26:20 +0100	[diff] [blame]	4788	}
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4789	}
				4790
				4791	static void __i915_gem_free_work(struct work_struct *work)
				4792	{
				4793	struct drm_i915_private *i915 =
				4794	container_of(work, struct drm_i915_private, mm.free_work);
				4795	struct llist_node *freed;
Chris Wilson	26e12f8	2011-03-20 11:20:19 +0000	[diff] [blame]	4796
Chris Wilson	2ef1e72	2018-01-15 20:57:59 +0000	[diff] [blame]	4797	/*
				4798	* All file-owned VMA should have been released by this point through
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	4799	* i915_gem_close_object(), or earlier by i915_gem_context_close().
				4800	* However, the object may also be bound into the global GTT (e.g.
				4801	* older GPUs without per-process support, or for direct access through
				4802	* the GTT either for the user or for scanout). Those VMA still need to
				4803	* unbound now.
				4804	*/
Chris Wilson	1488fc0	2012-04-24 15:47:31 +0100	[diff] [blame]	4805
Chris Wilson	f991c49	2017-11-06 11:15:08 +0000	[diff] [blame]	4806	spin_lock(&i915->mm.free_lock);
Chris Wilson	5ad08be	2017-04-07 11:25:51 +0100	[diff] [blame]	4807	while ((freed = llist_del_all(&i915->mm.free_list))) {
Chris Wilson	f991c49	2017-11-06 11:15:08 +0000	[diff] [blame]	4808	spin_unlock(&i915->mm.free_lock);
				4809
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4810	__i915_gem_free_objects(i915, freed);
Chris Wilson	5ad08be	2017-04-07 11:25:51 +0100	[diff] [blame]	4811	if (need_resched())
Chris Wilson	f991c49	2017-11-06 11:15:08 +0000	[diff] [blame]	4812	return;
				4813
				4814	spin_lock(&i915->mm.free_lock);
Chris Wilson	5ad08be	2017-04-07 11:25:51 +0100	[diff] [blame]	4815	}
Chris Wilson	f991c49	2017-11-06 11:15:08 +0000	[diff] [blame]	4816	spin_unlock(&i915->mm.free_lock);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4817	}
				4818
				4819	static void __i915_gem_free_object_rcu(struct rcu_head *head)
				4820	{
				4821	struct drm_i915_gem_object *obj =
				4822	container_of(head, typeof(*obj), rcu);
				4823	struct drm_i915_private *i915 = to_i915(obj->base.dev);
				4824
Chris Wilson	2ef1e72	2018-01-15 20:57:59 +0000	[diff] [blame]	4825	/*
				4826	* Since we require blocking on struct_mutex to unbind the freed
				4827	* object from the GPU before releasing resources back to the
				4828	* system, we can not do that directly from the RCU callback (which may
				4829	* be a softirq context), but must instead then defer that work onto a
				4830	* kthread. We use the RCU callback rather than move the freed object
				4831	* directly onto the work queue so that we can mix between using the
				4832	* worker and performing frees directly from subsequent allocations for
				4833	* crude but effective memory throttling.
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4834	*/
				4835	if (llist_add(&obj->freed, &i915->mm.free_list))
Chris Wilson	beacbd1	2018-01-15 12:28:45 +0000	[diff] [blame]	4836	queue_work(i915->wq, &i915->mm.free_work);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4837	}
				4838
				4839	void i915_gem_free_object(struct drm_gem_object *gem_obj)
				4840	{
				4841	struct drm_i915_gem_object *obj = to_intel_bo(gem_obj);
				4842
Chris Wilson	bc0629a	2016-11-01 10:03:17 +0000	[diff] [blame]	4843	if (obj->mm.quirked)
				4844	__i915_gem_object_unpin_pages(obj);
				4845
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4846	if (discard_backing_storage(obj))
				4847	obj->mm.madv = I915_MADV_DONTNEED;
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	4848
Chris Wilson	2ef1e72	2018-01-15 20:57:59 +0000	[diff] [blame]	4849	/*
				4850	* Before we free the object, make sure any pure RCU-only
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4851	* read-side critical sections are complete, e.g.
				4852	* i915_gem_busy_ioctl(). For the corresponding synchronized
				4853	* lookup see i915_gem_object_lookup_rcu().
				4854	*/
Chris Wilson	c9c7047	2018-02-19 22:06:31 +0000	[diff] [blame]	4855	atomic_inc(&to_i915(obj->base.dev)->mm.free_count);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4856	call_rcu(&obj->rcu, __i915_gem_free_object_rcu);
Chris Wilson	be72615	2010-07-23 23:18:50 +0100	[diff] [blame]	4857	}
				4858
Chris Wilson	f8a7fde	2016-10-28 13:58:29 +0100	[diff] [blame]	4859	void __i915_gem_object_release_unless_active(struct drm_i915_gem_object *obj)
				4860	{
				4861	lockdep_assert_held(&obj->base.dev->struct_mutex);
				4862
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	4863	if (!i915_gem_object_has_active_reference(obj) &&
				4864	i915_gem_object_is_active(obj))
Chris Wilson	f8a7fde	2016-10-28 13:58:29 +0100	[diff] [blame]	4865	i915_gem_object_set_active_reference(obj);
				4866	else
				4867	i915_gem_object_put(obj);
				4868	}
				4869
Chris Wilson	ae6c457	2017-11-10 14:26:28 +0000	[diff] [blame]	4870	static void assert_kernel_context_is_current(struct drm_i915_private *i915)
Chris Wilson	3033aca	2016-10-28 13:58:47 +0100	[diff] [blame]	4871	{
Chris Wilson	ae6c457	2017-11-10 14:26:28 +0000	[diff] [blame]	4872	struct i915_gem_context *kernel_context = i915->kernel_context;
Chris Wilson	3033aca	2016-10-28 13:58:47 +0100	[diff] [blame]	4873	struct intel_engine_cs *engine;
				4874	enum intel_engine_id id;
				4875
Chris Wilson	ae6c457	2017-11-10 14:26:28 +0000	[diff] [blame]	4876	for_each_engine(engine, i915, id) {
				4877	GEM_BUG_ON(__i915_gem_active_peek(&engine->timeline->last_request));
				4878	GEM_BUG_ON(engine->last_retired_context != kernel_context);
				4879	}
Chris Wilson	3033aca	2016-10-28 13:58:47 +0100	[diff] [blame]	4880	}
				4881
Chris Wilson	2414551	2017-01-24 11:01:35 +0000	[diff] [blame]	4882	void i915_gem_sanitize(struct drm_i915_private *i915)
				4883	{
Chris Wilson	f36325f	2017-08-26 12:09:34 +0100	[diff] [blame]	4884	if (i915_terminally_wedged(&i915->gpu_error)) {
				4885	mutex_lock(&i915->drm.struct_mutex);
				4886	i915_gem_unset_wedged(i915);
				4887	mutex_unlock(&i915->drm.struct_mutex);
				4888	}
				4889
Chris Wilson	2414551	2017-01-24 11:01:35 +0000	[diff] [blame]	4890	/*
				4891	* If we inherit context state from the BIOS or earlier occupants
				4892	* of the GPU, the GPU may be in an inconsistent state when we
				4893	* try to take over. The only way to remove the earlier state
				4894	* is by resetting. However, resetting on earlier gen is tricky as
				4895	* it may impact the display and we are uncertain about the stability
Joonas Lahtinen	ea117b8	2017-04-28 10:53:38 +0300	[diff] [blame]	4896	* of the reset, so this could be applied to even earlier gen.
Chris Wilson	2414551	2017-01-24 11:01:35 +0000	[diff] [blame]	4897	*/
Daniele Ceraolo Spurio	ce1599a	2018-02-07 13:24:40 -0800	[diff] [blame]	4898	if (INTEL_GEN(i915) >= 5 && intel_has_gpu_reset(i915))
				4899	WARN_ON(intel_gpu_reset(i915, ALL_ENGINES));
Chris Wilson	2414551	2017-01-24 11:01:35 +0000	[diff] [blame]	4900	}
				4901
Tvrtko Ursulin	bf9e842	2016-12-01 14:16:38 +0000	[diff] [blame]	4902	int i915_gem_suspend(struct drm_i915_private *dev_priv)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4903	{
Tvrtko Ursulin	bf9e842	2016-12-01 14:16:38 +0000	[diff] [blame]	4904	struct drm_device *dev = &dev_priv->drm;
Chris Wilson	dcff85c	2016-08-05 10:14:11 +0100	[diff] [blame]	4905	int ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4906
Chris Wilson	c998e8a	2017-03-02 08:30:29 +0000	[diff] [blame]	4907	intel_runtime_pm_get(dev_priv);
Chris Wilson	54b4f68	2016-07-21 21:16:19 +0100	[diff] [blame]	4908	intel_suspend_gt_powersave(dev_priv);
				4909
Chris Wilson	45c5f20	2013-10-16 11:50:01 +0100	[diff] [blame]	4910	mutex_lock(&dev->struct_mutex);
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	4911
				4912	/* We have to flush all the executing contexts to main memory so
				4913	* that they can be saved in the hibernation image. To ensure the last
				4914	* context image is coherent, we have to switch away from it. That
				4915	* leaves the dev_priv->kernel_context still active when
				4916	* we actually suspend, and its image in memory may not match the GPU
				4917	* state. Fortunately, the kernel_context is disposable and we do
				4918	* not rely on its state.
				4919	*/
Chris Wilson	ecf73eb	2017-11-30 10:29:51 +0000	[diff] [blame]	4920	if (!i915_terminally_wedged(&dev_priv->gpu_error)) {
				4921	ret = i915_gem_switch_to_kernel_context(dev_priv);
				4922	if (ret)
				4923	goto err_unlock;
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	4924
Chris Wilson	ecf73eb	2017-11-30 10:29:51 +0000	[diff] [blame]	4925	ret = i915_gem_wait_for_idle(dev_priv,
				4926	I915_WAIT_INTERRUPTIBLE \|
				4927	I915_WAIT_LOCKED);
				4928	if (ret && ret != -EIO)
				4929	goto err_unlock;
Chris Wilson	f740334	2013-09-13 23:57:04 +0100	[diff] [blame]	4930
Chris Wilson	ecf73eb	2017-11-30 10:29:51 +0000	[diff] [blame]	4931	assert_kernel_context_is_current(dev_priv);
				4932	}
Chris Wilson	829a0af	2017-06-20 12:05:45 +0100	[diff] [blame]	4933	i915_gem_contexts_lost(dev_priv);
Chris Wilson	45c5f20	2013-10-16 11:50:01 +0100	[diff] [blame]	4934	mutex_unlock(&dev->struct_mutex);
				4935
Michal Wajdeczko	7cfca4a	2018-03-02 11:15:49 +0000	[diff] [blame]	4936	intel_uc_suspend(dev_priv);
Sagar Arun Kamble	63987bf	2017-04-05 15:51:50 +0530	[diff] [blame]	4937
Chris Wilson	737b150	2015-01-26 18:03:03 +0200	[diff] [blame]	4938	cancel_delayed_work_sync(&dev_priv->gpu_error.hangcheck_work);
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	4939	cancel_delayed_work_sync(&dev_priv->gt.retire_work);
Chris Wilson	bdeb978	2016-12-23 14:57:56 +0000	[diff] [blame]	4940
				4941	/* As the idle_work is rearming if it detects a race, play safe and
				4942	* repeat the flush until it is definitely idle.
				4943	*/
Chris Wilson	7c26240	2017-10-06 11:40:38 +0100	[diff] [blame]	4944	drain_delayed_work(&dev_priv->gt.idle_work);
Chris Wilson	bdeb978	2016-12-23 14:57:56 +0000	[diff] [blame]	4945
Chris Wilson	bdcf120	2014-11-25 11:56:33 +0000	[diff] [blame]	4946	/* Assert that we sucessfully flushed all the work and
				4947	* reset the GPU back to its idle, low power state.
				4948	*/
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	4949	WARN_ON(dev_priv->gt.awake);
Chris Wilson	fc692bd	2017-08-26 12:09:35 +0100	[diff] [blame]	4950	if (WARN_ON(!intel_engines_are_idle(dev_priv)))
				4951	i915_gem_set_wedged(dev_priv); /* no hope, discard everything */
Chris Wilson	bdcf120	2014-11-25 11:56:33 +0000	[diff] [blame]	4952
Imre Deak	1c777c5	2016-10-12 17:46:37 +0300	[diff] [blame]	4953	/*
				4954	* Neither the BIOS, ourselves or any other kernel
				4955	* expects the system to be in execlists mode on startup,
				4956	* so we need to reset the GPU back to legacy mode. And the only
				4957	* known way to disable logical contexts is through a GPU reset.
				4958	*
				4959	* So in order to leave the system in a known default configuration,
				4960	* always reset the GPU upon unload and suspend. Afterwards we then
				4961	* clean up the GEM state tracking, flushing off the requests and
				4962	* leaving the system in a known idle state.
				4963	*
				4964	* Note that is of the upmost importance that the GPU is idle and
				4965	* all stray writes are flushed before we dismantle the backing
				4966	* storage for the pinned objects.
				4967	*
				4968	* However, since we are uncertain that resetting the GPU on older
				4969	* machines is a good idea, we don't - just in case it leaves the
				4970	* machine in an unusable condition.
				4971	*/
Chris Wilson	2414551	2017-01-24 11:01:35 +0000	[diff] [blame]	4972	i915_gem_sanitize(dev_priv);
Chris Wilson	cad9946	2017-08-26 12:09:33 +0100	[diff] [blame]	4973
				4974	intel_runtime_pm_put(dev_priv);
				4975	return 0;
Imre Deak	1c777c5	2016-10-12 17:46:37 +0300	[diff] [blame]	4976
Chris Wilson	c998e8a	2017-03-02 08:30:29 +0000	[diff] [blame]	4977	err_unlock:
Chris Wilson	45c5f20	2013-10-16 11:50:01 +0100	[diff] [blame]	4978	mutex_unlock(&dev->struct_mutex);
Chris Wilson	c998e8a	2017-03-02 08:30:29 +0000	[diff] [blame]	4979	intel_runtime_pm_put(dev_priv);
Chris Wilson	45c5f20	2013-10-16 11:50:01 +0100	[diff] [blame]	4980	return ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4981	}
				4982
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	4983	void i915_gem_resume(struct drm_i915_private *i915)
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	4984	{
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	4985	WARN_ON(i915->gt.awake);
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	4986
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	4987	mutex_lock(&i915->drm.struct_mutex);
				4988	intel_uncore_forcewake_get(i915, FORCEWAKE_ALL);
Imre Deak	31ab49a	2016-11-07 11:20:05 +0200	[diff] [blame]	4989
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	4990	i915_gem_restore_gtt_mappings(i915);
				4991	i915_gem_restore_fences(i915);
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	4992
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	4993	/*
				4994	* As we didn't flush the kernel context before suspend, we cannot
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	4995	* guarantee that the context image is complete. So let's just reset
				4996	* it and start again.
				4997	*/
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	4998	i915->gt.resume(i915);
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	4999
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5000	if (i915_gem_init_hw(i915))
				5001	goto err_wedged;
				5002
Michal Wajdeczko	7cfca4a	2018-03-02 11:15:49 +0000	[diff] [blame]	5003	intel_uc_resume(i915);
Chris Wilson	7469c62	2017-11-14 13:03:00 +0000	[diff] [blame]	5004
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5005	/* Always reload a context for powersaving. */
				5006	if (i915_gem_switch_to_kernel_context(i915))
				5007	goto err_wedged;
				5008
				5009	out_unlock:
				5010	intel_uncore_forcewake_put(i915, FORCEWAKE_ALL);
				5011	mutex_unlock(&i915->drm.struct_mutex);
				5012	return;
				5013
				5014	err_wedged:
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5015	if (!i915_terminally_wedged(&i915->gpu_error)) {
				5016	DRM_ERROR("failed to re-initialize GPU, declaring wedged!\n");
				5017	i915_gem_set_wedged(i915);
				5018	}
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5019	goto out_unlock;
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5020	}
				5021
Tvrtko Ursulin	c6be607	2016-11-16 08:55:31 +0000	[diff] [blame]	5022	void i915_gem_init_swizzling(struct drm_i915_private *dev_priv)
Daniel Vetter	f691e2f	2012-02-02 09:58:12 +0100	[diff] [blame]	5023	{
Tvrtko Ursulin	c6be607	2016-11-16 08:55:31 +0000	[diff] [blame]	5024	if (INTEL_GEN(dev_priv) < 5 \|\|
Daniel Vetter	f691e2f	2012-02-02 09:58:12 +0100	[diff] [blame]	5025	dev_priv->mm.bit_6_swizzle_x == I915_BIT_6_SWIZZLE_NONE)
				5026	return;
				5027
				5028	I915_WRITE(DISP_ARB_CTL, I915_READ(DISP_ARB_CTL) \|
				5029	DISP_TILE_SURFACE_SWIZZLING);
				5030
Tvrtko Ursulin	5db9401	2016-10-13 11:03:10 +0100	[diff] [blame]	5031	if (IS_GEN5(dev_priv))
Daniel Vetter	11782b0	2012-01-31 16:47:55 +0100	[diff] [blame]	5032	return;
				5033
Daniel Vetter	f691e2f	2012-02-02 09:58:12 +0100	[diff] [blame]	5034	I915_WRITE(TILECTL, I915_READ(TILECTL) \| TILECTL_SWZCTL);
Tvrtko Ursulin	5db9401	2016-10-13 11:03:10 +0100	[diff] [blame]	5035	if (IS_GEN6(dev_priv))
Daniel Vetter	6b26c86	2012-04-24 14:04:12 +0200	[diff] [blame]	5036	I915_WRITE(ARB_MODE, _MASKED_BIT_ENABLE(ARB_MODE_SWIZZLE_SNB));
Tvrtko Ursulin	5db9401	2016-10-13 11:03:10 +0100	[diff] [blame]	5037	else if (IS_GEN7(dev_priv))
Daniel Vetter	6b26c86	2012-04-24 14:04:12 +0200	[diff] [blame]	5038	I915_WRITE(ARB_MODE, _MASKED_BIT_ENABLE(ARB_MODE_SWIZZLE_IVB));
Tvrtko Ursulin	5db9401	2016-10-13 11:03:10 +0100	[diff] [blame]	5039	else if (IS_GEN8(dev_priv))
Ben Widawsky	31a5336	2013-11-02 21:07:04 -0700	[diff] [blame]	5040	I915_WRITE(GAMTARBMODE, _MASKED_BIT_ENABLE(ARB_MODE_SWIZZLE_BDW));
Ben Widawsky	8782e26	2012-12-18 10:31:23 -0800	[diff] [blame]	5041	else
				5042	BUG();
Daniel Vetter	f691e2f	2012-02-02 09:58:12 +0100	[diff] [blame]	5043	}
Daniel Vetter	e21af88	2012-02-09 20:53:27 +0100	[diff] [blame]	5044
/*
 * Zero the CTL, HEAD, TAIL and START registers of the ring whose register
 * block is located at @base.
 */
static void init_unused_ring(struct drm_i915_private *dev_priv, u32 base)
{
	I915_WRITE(RING_CTL(base), 0);
	I915_WRITE(RING_HEAD(base), 0);
	I915_WRITE(RING_TAIL(base), 0);
	I915_WRITE(RING_START(base), 0);
}
				5052
Tvrtko Ursulin	50a0bc9	2016-10-13 11:02:58 +0100	[diff] [blame]	5053	static void init_unused_rings(struct drm_i915_private *dev_priv)
Ville Syrjälä	81e7f20	2014-08-15 01:21:55 +0300	[diff] [blame]	5054	{
Tvrtko Ursulin	50a0bc9	2016-10-13 11:02:58 +0100	[diff] [blame]	5055	if (IS_I830(dev_priv)) {
				5056	init_unused_ring(dev_priv, PRB1_BASE);
				5057	init_unused_ring(dev_priv, SRB0_BASE);
				5058	init_unused_ring(dev_priv, SRB1_BASE);
				5059	init_unused_ring(dev_priv, SRB2_BASE);
				5060	init_unused_ring(dev_priv, SRB3_BASE);
				5061	} else if (IS_GEN2(dev_priv)) {
				5062	init_unused_ring(dev_priv, SRB0_BASE);
				5063	init_unused_ring(dev_priv, SRB1_BASE);
				5064	} else if (IS_GEN3(dev_priv)) {
				5065	init_unused_ring(dev_priv, PRB1_BASE);
				5066	init_unused_ring(dev_priv, PRB2_BASE);
Ville Syrjälä	81e7f20	2014-08-15 01:21:55 +0300	[diff] [blame]	5067	}
				5068	}
				5069
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5070	static int __i915_gem_restart_engines(void *data)
Ben Widawsky	4fc7c97	2013-02-08 11:49:24 -0800	[diff] [blame]	5071	{
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5072	struct drm_i915_private *i915 = data;
Tvrtko Ursulin	e2f8039	2016-03-16 11:00:36 +0000	[diff] [blame]	5073	struct intel_engine_cs *engine;
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	5074	enum intel_engine_id id;
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5075	int err;
				5076
				5077	for_each_engine(engine, i915, id) {
				5078	err = engine->init_hw(engine);
Chris Wilson	8177e11	2018-02-07 11:15:45 +0000	[diff] [blame]	5079	if (err) {
				5080	DRM_ERROR("Failed to restart %s (%d)\n",
				5081	engine->name, err);
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5082	return err;
Chris Wilson	8177e11	2018-02-07 11:15:45 +0000	[diff] [blame]	5083	}
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5084	}
				5085
				5086	return 0;
				5087	}
				5088
/*
 * i915_gem_init_hw - (re)initialise the GPU hardware for GEM
 * @dev_priv: i915 device
 *
 * Runs with all forcewake domains held. Applies a handful of
 * platform-specific register tweaks, programs swizzling, idles the unused
 * rings, then enables PPGTT, the uC and the MOCS L3CC table before
 * restarting every engine.
 *
 * Returns 0 on success, -EIO if the GPU is already terminally wedged, or
 * the error reported by the PPGTT, uC or engine initialisation step.
 */
int i915_gem_init_hw(struct drm_i915_private *dev_priv)
{
	int ret;

	dev_priv->gt.last_init_time = ktime_get();

	/* Double layer security blanket, see i915_gem_init() */
	intel_uncore_forcewake_get(dev_priv, FORCEWAKE_ALL);

	if (HAS_EDRAM(dev_priv) && INTEL_GEN(dev_priv) < 9)
		I915_WRITE(HSW_IDICR, I915_READ(HSW_IDICR) | IDIHASHMSK(0xf));

	if (IS_HASWELL(dev_priv))
		I915_WRITE(MI_PREDICATE_RESULT_2, IS_HSW_GT3(dev_priv) ?
			   LOWER_SLICE_ENABLED : LOWER_SLICE_DISABLED);

	/* With a NOP PCH, clear the PCH wait/handshake bits in the reset path. */
	if (HAS_PCH_NOP(dev_priv)) {
		if (IS_IVYBRIDGE(dev_priv)) {
			u32 temp = I915_READ(GEN7_MSG_CTL);
			temp &= ~(WAIT_FOR_PCH_FLR_ACK | WAIT_FOR_PCH_RESET_ACK);
			I915_WRITE(GEN7_MSG_CTL, temp);
		} else if (INTEL_GEN(dev_priv) >= 7) {
			u32 temp = I915_READ(HSW_NDE_RSTWRN_OPT);
			temp &= ~RESET_PCH_HANDSHAKE_ENABLE;
			I915_WRITE(HSW_NDE_RSTWRN_OPT, temp);
		}
	}

	i915_gem_init_swizzling(dev_priv);

	/*
	 * At least 830 can leave some of the unused rings
	 * "active" (ie. head != tail) after resume which
	 * will prevent c3 entry. Makes sure all unused rings
	 * are totally idle.
	 */
	init_unused_rings(dev_priv);

	BUG_ON(!dev_priv->kernel_context);
	/* A wedged GPU gets the register setup above but no engine restart. */
	if (i915_terminally_wedged(&dev_priv->gpu_error)) {
		ret = -EIO;
		goto out;
	}

	ret = i915_ppgtt_init_hw(dev_priv);
	if (ret) {
		DRM_ERROR("Enabling PPGTT failed (%d)\n", ret);
		goto out;
	}

	/* We can't enable contexts until all firmware is loaded */
	ret = intel_uc_init_hw(dev_priv);
	if (ret) {
		DRM_ERROR("Enabling uc failed (%d)\n", ret);
		goto out;
	}

	intel_mocs_init_l3cc_table(dev_priv);

	/* Only when the HW is re-initialised, can we replay the requests */
	ret = __i915_gem_restart_engines(dev_priv);
out:
	/* Success and failure both drop the forcewake taken on entry. */
	intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL);
	return ret;
}
				5154
/*
 * __intel_engines_record_defaults - capture the default context image
 * @i915: i915 device
 *
 * Creates a temporary kernel context, submits one request per engine on it
 * (running the engine's ->init_context() hook when present), switches back
 * to the kernel context and waits for idle. For every engine whose
 * temporary context has a state vma, that vma is unbound, its object moved
 * to the CPU domain, and a reference to the object is stored in
 * engine->default_state.
 *
 * The temporary context is closed and released on every exit path.
 *
 * Returns 0 on success or a negative error code.
 */
static int __intel_engines_record_defaults(struct drm_i915_private *i915)
{
	struct i915_gem_context *ctx;
	struct intel_engine_cs *engine;
	enum intel_engine_id id;
	int err;

	/*
	 * As we reset the gpu during very early sanitisation, the current
	 * register state on the GPU should reflect its defaults values.
	 * We load a context onto the hw (with restore-inhibit), then switch
	 * over to a second context to save that default register state. We
	 * can then prime every new context with that state so they all start
	 * from the same default HW values.
	 */

	ctx = i915_gem_context_create_kernel(i915, 0);
	if (IS_ERR(ctx))
		return PTR_ERR(ctx);

	for_each_engine(engine, i915, id) {
		struct i915_request *rq;

		rq = i915_request_alloc(engine, ctx);
		if (IS_ERR(rq)) {
			err = PTR_ERR(rq);
			goto out_ctx;
		}

		err = 0;
		if (engine->init_context)
			err = engine->init_context(rq);

		/* The request is added even if init_context() failed. */
		__i915_request_add(rq, true);
		if (err)
			goto err_active;
	}

	err = i915_gem_switch_to_kernel_context(i915);
	if (err)
		goto err_active;

	err = i915_gem_wait_for_idle(i915, I915_WAIT_LOCKED);
	if (err)
		goto err_active;

	assert_kernel_context_is_current(i915);

	for_each_engine(engine, i915, id) {
		struct i915_vma *state;

		state = ctx->engine[id].state;
		if (!state)
			continue;

		/*
		 * As we will hold a reference to the logical state, it will
		 * not be torn down with the context, and importantly the
		 * object will hold onto its vma (making it possible for a
		 * stray GTT write to corrupt our defaults). Unmap the vma
		 * from the GTT to prevent such accidents and reclaim the
		 * space.
		 */
		err = i915_vma_unbind(state);
		if (err)
			goto err_active;

		err = i915_gem_object_set_to_cpu_domain(state->obj, false);
		if (err)
			goto err_active;

		engine->default_state = i915_gem_object_get(state->obj);
	}

	if (IS_ENABLED(CONFIG_DRM_I915_DEBUG_GEM)) {
		unsigned int found = intel_engines_has_context_isolation(i915);

		/*
		 * Make sure that classes with multiple engine instances all
		 * share the same basic configuration.
		 */
		for_each_engine(engine, i915, id) {
			unsigned int bit = BIT(engine->uabi_class);
			unsigned int expected = engine->default_state ? bit : 0;

			if ((found & bit) != expected) {
				DRM_ERROR("mismatching default context state for class %d on engine %s\n",
					  engine->uabi_class, engine->name);
			}
		}
	}

out_ctx:
	/* Common exit: err holds 0 or the first failure seen. */
	i915_gem_context_set_closed(ctx);
	i915_gem_context_put(ctx);
	return err;

err_active:
	/*
	 * If we have to abandon now, we expect the engines to be idle
	 * and ready to be torn-down. First try to flush any remaining
	 * request, ensure we are pointing at the kernel context and
	 * then remove it.
	 */
	if (WARN_ON(i915_gem_switch_to_kernel_context(i915)))
		goto out_ctx;

	if (WARN_ON(i915_gem_wait_for_idle(i915, I915_WAIT_LOCKED)))
		goto out_ctx;

	i915_gem_contexts_lost(i915);
	goto out_ctx;
}
				5268
Tvrtko Ursulin	bf9e842	2016-12-01 14:16:38 +0000	[diff] [blame]	5269	int i915_gem_init(struct drm_i915_private *dev_priv)
Chris Wilson	1070a42	2012-04-24 15:47:41 +0100	[diff] [blame]	5270	{
Chris Wilson	1070a42	2012-04-24 15:47:41 +0100	[diff] [blame]	5271	int ret;
				5272
Matthew Auld	da9fe3f3	2017-10-06 23:18:31 +0100	[diff] [blame]	5273	/*
				5274	* We need to fallback to 4K pages since gvt gtt handling doesn't
				5275	* support huge page entries - we will need to check either hypervisor
				5276	* mm can support huge guest page or just do emulation in gvt.
				5277	*/
				5278	if (intel_vgpu_active(dev_priv))
				5279	mkwrite_device_info(dev_priv)->page_sizes =
				5280	I915_GTT_PAGE_SIZE_4K;
				5281
Chris Wilson	9431282	2017-05-03 10:39:18 +0100	[diff] [blame]	5282	dev_priv->mm.unordered_timeline = dma_fence_context_alloc(1);
Chris Wilson	57822dc	2017-02-22 11:40:48 +0000	[diff] [blame]	5283
Chris Wilson	fb5c551	2017-11-20 20:55:00 +0000	[diff] [blame]	5284	if (HAS_LOGICAL_RING_CONTEXTS(dev_priv)) {
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	5285	dev_priv->gt.resume = intel_lr_context_resume;
Tvrtko Ursulin	117897f	2016-03-16 11:00:40 +0000	[diff] [blame]	5286	dev_priv->gt.cleanup_engine = intel_logical_ring_cleanup;
Chris Wilson	fb5c551	2017-11-20 20:55:00 +0000	[diff] [blame]	5287	} else {
				5288	dev_priv->gt.resume = intel_legacy_submission_resume;
				5289	dev_priv->gt.cleanup_engine = intel_engine_cleanup;
Oscar Mateo	a83014d	2014-07-24 17:04:21 +0100	[diff] [blame]	5290	}
				5291
Chris Wilson	ee48700	2017-11-22 17:26:21 +0000	[diff] [blame]	5292	ret = i915_gem_init_userptr(dev_priv);
				5293	if (ret)
				5294	return ret;
				5295
Sagar Arun Kamble	70deead	2018-01-24 21:16:58 +0530	[diff] [blame]	5296	ret = intel_uc_init_misc(dev_priv);
Michał Winiarski	3176ff4	2017-12-13 23:13:47 +0100	[diff] [blame]	5297	if (ret)
				5298	return ret;
				5299
Chris Wilson	5e4f518	2015-02-13 14:35:59 +0000	[diff] [blame]	5300	/* This is just a security blanket to placate dragons.
				5301	* On some systems, we very sporadically observe that the first TLBs
				5302	* used by the CS may be stale, despite us poking the TLB reset. If
				5303	* we hold the forcewake during initialisation these problems
				5304	* just magically go away.
				5305	*/
Chris Wilson	ee48700	2017-11-22 17:26:21 +0000	[diff] [blame]	5306	mutex_lock(&dev_priv->drm.struct_mutex);
Chris Wilson	5e4f518	2015-02-13 14:35:59 +0000	[diff] [blame]	5307	intel_uncore_forcewake_get(dev_priv, FORCEWAKE_ALL);
				5308
Chris Wilson	f6b9d5c	2016-08-04 07:52:23 +0100	[diff] [blame]	5309	ret = i915_gem_init_ggtt(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5310	if (ret) {
				5311	GEM_BUG_ON(ret == -EIO);
				5312	goto err_unlock;
				5313	}
Jesse Barnes	d62b489	2013-03-08 10:45:53 -0800	[diff] [blame]	5314
Chris Wilson	829a0af	2017-06-20 12:05:45 +0100	[diff] [blame]	5315	ret = i915_gem_contexts_init(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5316	if (ret) {
				5317	GEM_BUG_ON(ret == -EIO);
				5318	goto err_ggtt;
				5319	}
Ben Widawsky	2fa48d8	2013-12-06 14:11:04 -0800	[diff] [blame]	5320
Tvrtko Ursulin	bf9e842	2016-12-01 14:16:38 +0000	[diff] [blame]	5321	ret = intel_engines_init(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5322	if (ret) {
				5323	GEM_BUG_ON(ret == -EIO);
				5324	goto err_context;
				5325	}
Daniel Vetter	53ca26c	2012-04-26 23:28:03 +0200	[diff] [blame]	5326
Chris Wilson	f58d13d	2017-11-10 14:26:29 +0000	[diff] [blame]	5327	intel_init_gt_powersave(dev_priv);
				5328
Michał Winiarski	61b5c15	2017-12-13 23:13:48 +0100	[diff] [blame]	5329	ret = intel_uc_init(dev_priv);
Chris Wilson	cc6a818	2017-11-10 14:26:30 +0000	[diff] [blame]	5330	if (ret)
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5331	goto err_pm;
Chris Wilson	cc6a818	2017-11-10 14:26:30 +0000	[diff] [blame]	5332
Michał Winiarski	61b5c15	2017-12-13 23:13:48 +0100	[diff] [blame]	5333	ret = i915_gem_init_hw(dev_priv);
				5334	if (ret)
				5335	goto err_uc_init;
				5336
Chris Wilson	cc6a818	2017-11-10 14:26:30 +0000	[diff] [blame]	5337	/*
				5338	* Despite its name intel_init_clock_gating applies both display
				5339	* clock gating workarounds; GT mmio workarounds and the occasional
				5340	* GT power context workaround. Worse, sometimes it includes a context
				5341	* register workaround which we need to apply before we record the
				5342	* default HW state for all contexts.
				5343	*
				5344	* FIXME: break up the workarounds and apply them at the right time!
				5345	*/
				5346	intel_init_clock_gating(dev_priv);
				5347
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5348	ret = __intel_engines_record_defaults(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5349	if (ret)
				5350	goto err_init_hw;
				5351
				5352	if (i915_inject_load_failure()) {
				5353	ret = -ENODEV;
				5354	goto err_init_hw;
				5355	}
				5356
				5357	if (i915_inject_load_failure()) {
				5358	ret = -EIO;
				5359	goto err_init_hw;
				5360	}
				5361
				5362	intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL);
				5363	mutex_unlock(&dev_priv->drm.struct_mutex);
				5364
				5365	return 0;
				5366
				5367	/*
				5368	* Unwinding is complicated by that we want to handle -EIO to mean
				5369	* disable GPU submission but keep KMS alive. We want to mark the
				5370	* HW as irrevisibly wedged, but keep enough state around that the
				5371	* driver doesn't explode during runtime.
				5372	*/
				5373	err_init_hw:
				5374	i915_gem_wait_for_idle(dev_priv, I915_WAIT_LOCKED);
				5375	i915_gem_contexts_lost(dev_priv);
				5376	intel_uc_fini_hw(dev_priv);
Michał Winiarski	61b5c15	2017-12-13 23:13:48 +0100	[diff] [blame]	5377	err_uc_init:
				5378	intel_uc_fini(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5379	err_pm:
				5380	if (ret != -EIO) {
				5381	intel_cleanup_gt_powersave(dev_priv);
				5382	i915_gem_cleanup_engines(dev_priv);
				5383	}
				5384	err_context:
				5385	if (ret != -EIO)
				5386	i915_gem_contexts_fini(dev_priv);
				5387	err_ggtt:
				5388	err_unlock:
				5389	intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL);
				5390	mutex_unlock(&dev_priv->drm.struct_mutex);
				5391
Sagar Arun Kamble	70deead	2018-01-24 21:16:58 +0530	[diff] [blame]	5392	intel_uc_fini_misc(dev_priv);
Sagar Arun Kamble	da943b5	2018-01-10 18:24:16 +0530	[diff] [blame]	5393
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5394	if (ret != -EIO)
				5395	i915_gem_cleanup_userptr(dev_priv);
				5396
Chris Wilson	6099032	2014-04-09 09:19:42 +0100	[diff] [blame]	5397	if (ret == -EIO) {
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5398	/*
				5399	* Allow engine initialisation to fail by marking the GPU as
Chris Wilson	6099032	2014-04-09 09:19:42 +0100	[diff] [blame]	5400	* wedged. But we only want to do this where the GPU is angry,
				5401	* for all other failure, such as an allocation failure, bail.
				5402	*/
Chris Wilson	6f74b36	2017-10-15 15:37:25 +0100	[diff] [blame]	5403	if (!i915_terminally_wedged(&dev_priv->gpu_error)) {
				5404	DRM_ERROR("Failed to initialize GPU, declaring it wedged\n");
				5405	i915_gem_set_wedged(dev_priv);
				5406	}
Chris Wilson	6099032	2014-04-09 09:19:42 +0100	[diff] [blame]	5407	ret = 0;
Chris Wilson	1070a42	2012-04-24 15:47:41 +0100	[diff] [blame]	5408	}
				5409
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5410	i915_gem_drain_freed_objects(dev_priv);
Chris Wilson	6099032	2014-04-09 09:19:42 +0100	[diff] [blame]	5411	return ret;
Chris Wilson	1070a42	2012-04-24 15:47:41 +0100	[diff] [blame]	5412	}
				5413
/*
 * i915_gem_init_mmio - GEM setup step for the MMIO init phase
 * @i915: i915 device
 *
 * Currently this only sanitizes the GPU via i915_gem_sanitize().
 */
void i915_gem_init_mmio(struct drm_i915_private *i915)
{
	i915_gem_sanitize(i915);
}
				5418
Zou Nan hai	8187a2b	2010-05-21 09:08:55 +0800	[diff] [blame]	5419	void
Tvrtko Ursulin	cb15d9f	2016-12-01 14:16:39 +0000	[diff] [blame]	5420	i915_gem_cleanup_engines(struct drm_i915_private *dev_priv)
Zou Nan hai	8187a2b	2010-05-21 09:08:55 +0800	[diff] [blame]	5421	{
Tvrtko Ursulin	e2f8039	2016-03-16 11:00:36 +0000	[diff] [blame]	5422	struct intel_engine_cs *engine;
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	5423	enum intel_engine_id id;
Zou Nan hai	8187a2b	2010-05-21 09:08:55 +0800	[diff] [blame]	5424
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	5425	for_each_engine(engine, dev_priv, id)
Tvrtko Ursulin	117897f	2016-03-16 11:00:40 +0000	[diff] [blame]	5426	dev_priv->gt.cleanup_engine(engine);
Zou Nan hai	8187a2b	2010-05-21 09:08:55 +0800	[diff] [blame]	5427	}
				5428
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5429	void
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5430	i915_gem_load_init_fences(struct drm_i915_private *dev_priv)
				5431	{
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	5432	int i;
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5433
Tvrtko Ursulin	c56b89f	2018-02-09 21:58:46 +0000	[diff] [blame]	5434	if (INTEL_GEN(dev_priv) >= 7 && !IS_VALLEYVIEW(dev_priv) &&
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5435	!IS_CHERRYVIEW(dev_priv))
				5436	dev_priv->num_fence_regs = 32;
Tvrtko Ursulin	c56b89f	2018-02-09 21:58:46 +0000	[diff] [blame]	5437	else if (INTEL_GEN(dev_priv) >= 4 \|\|
Jani Nikula	73f67aa	2016-12-07 22:48:09 +0200	[diff] [blame]	5438	IS_I945G(dev_priv) \|\| IS_I945GM(dev_priv) \|\|
				5439	IS_G33(dev_priv) \|\| IS_PINEVIEW(dev_priv))
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5440	dev_priv->num_fence_regs = 16;
				5441	else
				5442	dev_priv->num_fence_regs = 8;
				5443
Chris Wilson	c033666	2016-05-06 15:40:21 +0100	[diff] [blame]	5444	if (intel_vgpu_active(dev_priv))
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5445	dev_priv->num_fence_regs =
				5446	I915_READ(vgtif_reg(avail_rs.fence_num));
				5447
				5448	/* Initialize fence registers to zero */
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	5449	for (i = 0; i < dev_priv->num_fence_regs; i++) {
				5450	struct drm_i915_fence_reg *fence = &dev_priv->fence_regs[i];
				5451
				5452	fence->i915 = dev_priv;
				5453	fence->id = i;
				5454	list_add_tail(&fence->link, &dev_priv->mm.fence_list);
				5455	}
Tvrtko Ursulin	4362f4f	2016-11-16 08:55:33 +0000	[diff] [blame]	5456	i915_gem_restore_fences(dev_priv);
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5457
Tvrtko Ursulin	4362f4f	2016-11-16 08:55:33 +0000	[diff] [blame]	5458	i915_gem_detect_bit_6_swizzle(dev_priv);
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5459	}
				5460
Chris Wilson	9c52d1c	2017-11-10 23:24:47 +0000	[diff] [blame]	5461	static void i915_gem_init__mm(struct drm_i915_private *i915)
				5462	{
				5463	spin_lock_init(&i915->mm.object_stat_lock);
				5464	spin_lock_init(&i915->mm.obj_lock);
				5465	spin_lock_init(&i915->mm.free_lock);
				5466
				5467	init_llist_head(&i915->mm.free_list);
				5468
				5469	INIT_LIST_HEAD(&i915->mm.unbound_list);
				5470	INIT_LIST_HEAD(&i915->mm.bound_list);
				5471	INIT_LIST_HEAD(&i915->mm.fence_list);
				5472	INIT_LIST_HEAD(&i915->mm.userfault_list);
				5473
				5474	INIT_WORK(&i915->mm.free_work, __i915_gem_free_work);
				5475	}
				5476
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5477	int
Tvrtko Ursulin	cb15d9f	2016-12-01 14:16:39 +0000	[diff] [blame]	5478	i915_gem_load_init(struct drm_i915_private *dev_priv)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5479	{
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5480	int err = -ENOMEM;
Chris Wilson	42dcedd	2012-11-15 11:32:30 +0000	[diff] [blame]	5481
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5482	dev_priv->objects = KMEM_CACHE(drm_i915_gem_object, SLAB_HWCACHE_ALIGN);
				5483	if (!dev_priv->objects)
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5484	goto err_out;
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5485
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5486	dev_priv->vmas = KMEM_CACHE(i915_vma, SLAB_HWCACHE_ALIGN);
				5487	if (!dev_priv->vmas)
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5488	goto err_objects;
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5489
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	5490	dev_priv->luts = KMEM_CACHE(i915_lut_handle, 0);
				5491	if (!dev_priv->luts)
				5492	goto err_vmas;
				5493
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	5494	dev_priv->requests = KMEM_CACHE(i915_request,
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5495	SLAB_HWCACHE_ALIGN \|
				5496	SLAB_RECLAIM_ACCOUNT \|
Paul E. McKenney	5f0d5a3	2017-01-18 02:53:44 -0800	[diff] [blame]	5497	SLAB_TYPESAFE_BY_RCU);
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5498	if (!dev_priv->requests)
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	5499	goto err_luts;
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5500
Chris Wilson	52e5420	2016-11-14 20:41:02 +0000	[diff] [blame]	5501	dev_priv->dependencies = KMEM_CACHE(i915_dependency,
				5502	SLAB_HWCACHE_ALIGN \|
				5503	SLAB_RECLAIM_ACCOUNT);
				5504	if (!dev_priv->dependencies)
				5505	goto err_requests;
				5506
Chris Wilson	c5cf9a9	2017-05-17 13:10:04 +0100	[diff] [blame]	5507	dev_priv->priorities = KMEM_CACHE(i915_priolist, SLAB_HWCACHE_ALIGN);
				5508	if (!dev_priv->priorities)
				5509	goto err_dependencies;
				5510
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5511	mutex_lock(&dev_priv->drm.struct_mutex);
				5512	INIT_LIST_HEAD(&dev_priv->gt.timelines);
Chris Wilson	bb89485	2016-11-14 20:40:57 +0000	[diff] [blame]	5513	err = i915_gem_timeline_init__global(dev_priv);
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5514	mutex_unlock(&dev_priv->drm.struct_mutex);
				5515	if (err)
Chris Wilson	c5cf9a9	2017-05-17 13:10:04 +0100	[diff] [blame]	5516	goto err_priorities;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5517
Chris Wilson	9c52d1c	2017-11-10 23:24:47 +0000	[diff] [blame]	5518	i915_gem_init__mm(dev_priv);
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	5519
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	5520	INIT_DELAYED_WORK(&dev_priv->gt.retire_work,
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5521	i915_gem_retire_work_handler);
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	5522	INIT_DELAYED_WORK(&dev_priv->gt.idle_work,
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5523	i915_gem_idle_work_handler);
Chris Wilson	1f15b76	2016-07-01 17:23:14 +0100	[diff] [blame]	5524	init_waitqueue_head(&dev_priv->gpu_error.wait_queue);
Daniel Vetter	1f83fee	2012-11-15 17:17:22 +0100	[diff] [blame]	5525	init_waitqueue_head(&dev_priv->gpu_error.reset_queue);
Chris Wilson	3116971	2009-09-14 16:50:28 +0100	[diff] [blame]	5526
Joonas Lahtinen	6f63340	2016-09-01 14:58:21 +0300	[diff] [blame]	5527	atomic_set(&dev_priv->mm.bsd_engine_dispatch_index, 0);
				5528
Chris Wilson	b5add95	2016-08-04 16:32:36 +0100	[diff] [blame]	5529	spin_lock_init(&dev_priv->fb_tracking.lock);
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5530
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	5531	err = i915_gemfs_init(dev_priv);
				5532	if (err)
				5533	DRM_NOTE("Unable to create a private tmpfs mount, hugepage support will be disabled(%d).\n", err);
				5534
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5535	return 0;
				5536
Chris Wilson	c5cf9a9	2017-05-17 13:10:04 +0100	[diff] [blame]	5537	err_priorities:
				5538	kmem_cache_destroy(dev_priv->priorities);
Chris Wilson	52e5420	2016-11-14 20:41:02 +0000	[diff] [blame]	5539	err_dependencies:
				5540	kmem_cache_destroy(dev_priv->dependencies);
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5541	err_requests:
				5542	kmem_cache_destroy(dev_priv->requests);
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	5543	err_luts:
				5544	kmem_cache_destroy(dev_priv->luts);
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5545	err_vmas:
				5546	kmem_cache_destroy(dev_priv->vmas);
				5547	err_objects:
				5548	kmem_cache_destroy(dev_priv->objects);
				5549	err_out:
				5550	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5551	}
Dave Airlie	71acb5e	2008-12-30 20:31:46 +1000	[diff] [blame]	5552
Tvrtko Ursulin	cb15d9f	2016-12-01 14:16:39 +0000	[diff] [blame]	5553	void i915_gem_load_cleanup(struct drm_i915_private *dev_priv)
Imre Deak	d64aa09	2016-01-19 15:26:29 +0200	[diff] [blame]	5554	{
Chris Wilson	c4d4c1c	2017-02-10 16:35:23 +0000	[diff] [blame]	5555	i915_gem_drain_freed_objects(dev_priv);
Chris Wilson	c9c7047	2018-02-19 22:06:31 +0000	[diff] [blame]	5556	GEM_BUG_ON(!llist_empty(&dev_priv->mm.free_list));
				5557	GEM_BUG_ON(atomic_read(&dev_priv->mm.free_count));
Chris Wilson	c4d4c1c	2017-02-10 16:35:23 +0000	[diff] [blame]	5558	WARN_ON(dev_priv->mm.object_count);
Chris Wilson	7d5d59e	2016-11-01 08:48:41 +0000	[diff] [blame]	5559
Matthew Auld	ea84aa7	2016-11-17 21:04:11 +0000	[diff] [blame]	5560	mutex_lock(&dev_priv->drm.struct_mutex);
				5561	i915_gem_timeline_fini(&dev_priv->gt.global_timeline);
				5562	WARN_ON(!list_empty(&dev_priv->gt.timelines));
				5563	mutex_unlock(&dev_priv->drm.struct_mutex);
				5564
Chris Wilson	c5cf9a9	2017-05-17 13:10:04 +0100	[diff] [blame]	5565	kmem_cache_destroy(dev_priv->priorities);
Chris Wilson	52e5420	2016-11-14 20:41:02 +0000	[diff] [blame]	5566	kmem_cache_destroy(dev_priv->dependencies);
Imre Deak	d64aa09	2016-01-19 15:26:29 +0200	[diff] [blame]	5567	kmem_cache_destroy(dev_priv->requests);
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	5568	kmem_cache_destroy(dev_priv->luts);
Imre Deak	d64aa09	2016-01-19 15:26:29 +0200	[diff] [blame]	5569	kmem_cache_destroy(dev_priv->vmas);
				5570	kmem_cache_destroy(dev_priv->objects);
Chris Wilson	0eafec6	2016-08-04 16:32:41 +0100	[diff] [blame]	5571
				5572	/* And ensure that our DESTROY_BY_RCU slabs are truly destroyed */
				5573	rcu_barrier();
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	5574
				5575	i915_gemfs_fini(dev_priv);
Imre Deak	d64aa09	2016-01-19 15:26:29 +0200	[diff] [blame]	5576	}
				5577
/*
 * i915_gem_freeze - shrink GEM before freezing
 *
 * Purgeable objects are discarded here; userspace is expected to recover
 * them as required after resuming.
 *
 * Always returns 0.
 */
int i915_gem_freeze(struct drm_i915_private *dev_priv)
{
	i915_gem_shrink_all(dev_priv);

	return 0;
}
				5587
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5588	int i915_gem_freeze_late(struct drm_i915_private *dev_priv)
				5589	{
				5590	struct drm_i915_gem_object *obj;
Chris Wilson	7aab2d5	2016-09-09 20:02:18 +0100	[diff] [blame]	5591	struct list_head *phases[] = {
				5592	&dev_priv->mm.unbound_list,
				5593	&dev_priv->mm.bound_list,
				5594	NULL
				5595	}, **p;
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5596
				5597	/* Called just before we write the hibernation image.
				5598	*
				5599	* We need to update the domain tracking to reflect that the CPU
				5600	* will be accessing all the pages to create and restore from the
				5601	* hibernation, and so upon restoration those pages will be in the
				5602	* CPU domain.
				5603	*
				5604	* To make sure the hibernation image contains the latest state,
				5605	* we update that state just before writing out the image.
Chris Wilson	7aab2d5	2016-09-09 20:02:18 +0100	[diff] [blame]	5606	*
				5607	* To try and reduce the hibernation image, we manually shrink
Chris Wilson	d0aa301	2017-04-07 11:25:49 +0100	[diff] [blame]	5608	* the objects as well, see i915_gem_freeze()
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5609	*/
				5610
Chris Wilson	912d572	2017-09-06 16:19:30 -0700	[diff] [blame]	5611	i915_gem_shrink(dev_priv, -1UL, NULL, I915_SHRINK_UNBOUND);
Chris Wilson	17b93c4	2017-04-07 11:25:50 +0100	[diff] [blame]	5612	i915_gem_drain_freed_objects(dev_priv);
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5613
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	5614	spin_lock(&dev_priv->mm.obj_lock);
Chris Wilson	7aab2d5	2016-09-09 20:02:18 +0100	[diff] [blame]	5615	for (p = phases; *p; p++) {
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	5616	list_for_each_entry(obj, *p, mm.link)
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	5617	__start_cpu_write(obj);
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5618	}
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	5619	spin_unlock(&dev_priv->mm.obj_lock);
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5620
				5621	return 0;
				5622	}
				5623
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	5624	void i915_gem_release(struct drm_device dev, struct drm_file file)
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	5625	{
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	5626	struct drm_i915_file_private *file_priv = file->driver_priv;
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	5627	struct i915_request *request;
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	5628
				5629	/* Clean up our request list when the client is going away, so that
				5630	* later retire_requests won't dereference our soon-to-be-gone
				5631	* file_priv.
				5632	*/
Chris Wilson	1c25595	2010-09-26 11:03:27 +0100	[diff] [blame]	5633	spin_lock(&file_priv->mm.lock);
Chris Wilson	c8659ef	2017-03-02 12:25:25 +0000	[diff] [blame]	5634	list_for_each_entry(request, &file_priv->mm.request_list, client_link)
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	5635	request->file_priv = NULL;
Chris Wilson	1c25595	2010-09-26 11:03:27 +0100	[diff] [blame]	5636	spin_unlock(&file_priv->mm.lock);
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5637	}
				5638
Chris Wilson	829a0af	2017-06-20 12:05:45 +0100	[diff] [blame]	5639	int i915_gem_open(struct drm_i915_private i915, struct drm_file file)
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5640	{
				5641	struct drm_i915_file_private *file_priv;
Ben Widawsky	e422b88	2013-12-06 14:10:58 -0800	[diff] [blame]	5642	int ret;
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5643
Chris Wilson	c4c29d7	2016-11-09 10:45:07 +0000	[diff] [blame]	5644	DRM_DEBUG("\n");
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5645
				5646	file_priv = kzalloc(sizeof(*file_priv), GFP_KERNEL);
				5647	if (!file_priv)
				5648	return -ENOMEM;
				5649
				5650	file->driver_priv = file_priv;
Chris Wilson	829a0af	2017-06-20 12:05:45 +0100	[diff] [blame]	5651	file_priv->dev_priv = i915;
Chris Wilson	ab0e7ff	2014-02-25 17:11:24 +0200	[diff] [blame]	5652	file_priv->file = file;
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5653
				5654	spin_lock_init(&file_priv->mm.lock);
				5655	INIT_LIST_HEAD(&file_priv->mm.request_list);
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5656
Chris Wilson	c80ff16	2016-07-27 09:07:27 +0100	[diff] [blame]	5657	file_priv->bsd_engine = -1;
Tvrtko Ursulin	de1add3	2016-01-15 15:12:50 +0000	[diff] [blame]	5658
Chris Wilson	829a0af	2017-06-20 12:05:45 +0100	[diff] [blame]	5659	ret = i915_gem_context_open(i915, file);
Ben Widawsky	e422b88	2013-12-06 14:10:58 -0800	[diff] [blame]	5660	if (ret)
				5661	kfree(file_priv);
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5662
Ben Widawsky	e422b88	2013-12-06 14:10:58 -0800	[diff] [blame]	5663	return ret;
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5664	}
				5665
Daniel Vetter	b680c37	2014-09-19 18:27:27 +0200	[diff] [blame]	5666	/**
				5667	* i915_gem_track_fb - update frontbuffer tracking
Geliang Tang	d9072a3	2015-09-15 05:58:44 -0700	[diff] [blame]	5668	* @old: current GEM buffer for the frontbuffer slots
				5669	* @new: new GEM buffer for the frontbuffer slots
				5670	* @frontbuffer_bits: bitmask of frontbuffer slots
Daniel Vetter	b680c37	2014-09-19 18:27:27 +0200	[diff] [blame]	5671	*
				5672	* This updates the frontbuffer tracking bits @frontbuffer_bits by clearing them
				5673	* from @old and setting them in @new. Both @old and @new can be NULL.
				5674	*/
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	5675	void i915_gem_track_fb(struct drm_i915_gem_object *old,
				5676	struct drm_i915_gem_object *new,
				5677	unsigned frontbuffer_bits)
				5678	{
Chris Wilson	faf5bf0	2016-08-04 16:32:37 +0100	[diff] [blame]	5679	/* Control of individual bits within the mask are guarded by
				5680	* the owning plane->mutex, i.e. we can never see concurrent
				5681	* manipulation of individual bits. But since the bitfield as a whole
				5682	* is updated using RMW, we need to use atomics in order to update
				5683	* the bits.
				5684	*/
				5685	BUILD_BUG_ON(INTEL_FRONTBUFFER_BITS_PER_PIPE * I915_MAX_PIPES >
				5686	sizeof(atomic_t) * BITS_PER_BYTE);
				5687
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	5688	if (old) {
Chris Wilson	faf5bf0	2016-08-04 16:32:37 +0100	[diff] [blame]	5689	WARN_ON(!(atomic_read(&old->frontbuffer_bits) & frontbuffer_bits));
				5690	atomic_andnot(frontbuffer_bits, &old->frontbuffer_bits);
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	5691	}
				5692
				5693	if (new) {
Chris Wilson	faf5bf0	2016-08-04 16:32:37 +0100	[diff] [blame]	5694	WARN_ON(atomic_read(&new->frontbuffer_bits) & frontbuffer_bits);
				5695	atomic_or(frontbuffer_bits, &new->frontbuffer_bits);
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	5696	}
				5697	}
				5698
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5699	/* Allocate a new GEM object and fill it with the supplied data */
				5700	struct drm_i915_gem_object *
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	5701	i915_gem_object_create_from_data(struct drm_i915_private *dev_priv,
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5702	const void *data, size_t size)
				5703	{
				5704	struct drm_i915_gem_object *obj;
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	5705	struct file *file;
				5706	size_t offset;
				5707	int err;
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5708
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	5709	obj = i915_gem_object_create(dev_priv, round_up(size, PAGE_SIZE));
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	5710	if (IS_ERR(obj))
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5711	return obj;
				5712
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	5713	GEM_BUG_ON(obj->write_domain != I915_GEM_DOMAIN_CPU);
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5714
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	5715	file = obj->base.filp;
				5716	offset = 0;
				5717	do {
				5718	unsigned int len = min_t(typeof(size), size, PAGE_SIZE);
				5719	struct page *page;
				5720	void pgdata, vaddr;
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5721
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	5722	err = pagecache_write_begin(file, file->f_mapping,
				5723	offset, len, 0,
				5724	&page, &pgdata);
				5725	if (err < 0)
				5726	goto fail;
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5727
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	5728	vaddr = kmap(page);
				5729	memcpy(vaddr, data, len);
				5730	kunmap(page);
				5731
				5732	err = pagecache_write_end(file, file->f_mapping,
				5733	offset, len, len,
				5734	page, pgdata);
				5735	if (err < 0)
				5736	goto fail;
				5737
				5738	size -= len;
				5739	data += len;
				5740	offset += len;
				5741	} while (size);
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5742
				5743	return obj;
				5744
				5745	fail:
Chris Wilson	f8c417c	2016-07-20 13:31:53 +0100	[diff] [blame]	5746	i915_gem_object_put(obj);
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	5747	return ERR_PTR(err);
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5748	}
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	5749
				5750	struct scatterlist *
				5751	i915_gem_object_get_sg(struct drm_i915_gem_object *obj,
				5752	unsigned int n,
				5753	unsigned int *offset)
				5754	{
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	5755	struct i915_gem_object_page_iter *iter = &obj->mm.get_page;
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	5756	struct scatterlist *sg;
				5757	unsigned int idx, count;
				5758
				5759	might_sleep();
				5760	GEM_BUG_ON(n >= obj->base.size >> PAGE_SHIFT);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	5761	GEM_BUG_ON(!i915_gem_object_has_pinned_pages(obj));
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	5762
				5763	/* As we iterate forward through the sg, we record each entry in a
				5764	* radixtree for quick repeated (backwards) lookups. If we have seen
				5765	* this index previously, we will have an entry for it.
				5766	*
				5767	* Initial lookup is O(N), but this is amortized to O(1) for
				5768	* sequential page access (where each new request is consecutive
				5769	* to the previous one). Repeated lookups are O(lg(obj->base.size)),
				5770	* i.e. O(1) with a large constant!
				5771	*/
				5772	if (n < READ_ONCE(iter->sg_idx))
				5773	goto lookup;
				5774
				5775	mutex_lock(&iter->lock);
				5776
				5777	/* We prefer to reuse the last sg so that repeated lookup of this
				5778	* (or the subsequent) sg are fast - comparing against the last
				5779	* sg is faster than going through the radixtree.
				5780	*/
				5781
				5782	sg = iter->sg_pos;
				5783	idx = iter->sg_idx;
				5784	count = __sg_page_count(sg);
				5785
				5786	while (idx + count <= n) {
				5787	unsigned long exception, i;
				5788	int ret;
				5789
				5790	/* If we cannot allocate and insert this entry, or the
				5791	* individual pages from this range, cancel updating the
				5792	* sg_idx so that on this lookup we are forced to linearly
				5793	* scan onwards, but on future lookups we will try the
				5794	* insertion again (in which case we need to be careful of
				5795	* the error return reporting that we have already inserted
				5796	* this index).
				5797	*/
				5798	ret = radix_tree_insert(&iter->radix, idx, sg);
				5799	if (ret && ret != -EEXIST)
				5800	goto scan;
				5801
				5802	exception =
				5803	RADIX_TREE_EXCEPTIONAL_ENTRY \|
				5804	idx << RADIX_TREE_EXCEPTIONAL_SHIFT;
				5805	for (i = 1; i < count; i++) {
				5806	ret = radix_tree_insert(&iter->radix, idx + i,
				5807	(void *)exception);
				5808	if (ret && ret != -EEXIST)
				5809	goto scan;
				5810	}
				5811
				5812	idx += count;
				5813	sg = ____sg_next(sg);
				5814	count = __sg_page_count(sg);
				5815	}
				5816
				5817	scan:
				5818	iter->sg_pos = sg;
				5819	iter->sg_idx = idx;
				5820
				5821	mutex_unlock(&iter->lock);
				5822
				5823	if (unlikely(n < idx)) /* insertion completed by another thread */
				5824	goto lookup;
				5825
				5826	/* In case we failed to insert the entry into the radixtree, we need
				5827	* to look beyond the current sg.
				5828	*/
				5829	while (idx + count <= n) {
				5830	idx += count;
				5831	sg = ____sg_next(sg);
				5832	count = __sg_page_count(sg);
				5833	}
				5834
				5835	*offset = n - idx;
				5836	return sg;
				5837
				5838	lookup:
				5839	rcu_read_lock();
				5840
				5841	sg = radix_tree_lookup(&iter->radix, n);
				5842	GEM_BUG_ON(!sg);
				5843
				5844	/* If this index is in the middle of multi-page sg entry,
				5845	* the radixtree will contain an exceptional entry that points
				5846	* to the start of that range. We will return the pointer to
				5847	* the base page and the offset of this page within the
				5848	* sg entry's range.
				5849	*/
				5850	*offset = 0;
				5851	if (unlikely(radix_tree_exception(sg))) {
				5852	unsigned long base =
				5853	(unsigned long)sg >> RADIX_TREE_EXCEPTIONAL_SHIFT;
				5854
				5855	sg = radix_tree_lookup(&iter->radix, base);
				5856	GEM_BUG_ON(!sg);
				5857
				5858	*offset = n - base;
				5859	}
				5860
				5861	rcu_read_unlock();
				5862
				5863	return sg;
				5864	}
				5865
				5866	struct page *
				5867	i915_gem_object_get_page(struct drm_i915_gem_object *obj, unsigned int n)
				5868	{
				5869	struct scatterlist *sg;
				5870	unsigned int offset;
				5871
				5872	GEM_BUG_ON(!i915_gem_object_has_struct_page(obj));
				5873
				5874	sg = i915_gem_object_get_sg(obj, n, &offset);
				5875	return nth_page(sg_page(sg), offset);
				5876	}
				5877
				5878	/* Like i915_gem_object_get_page(), but mark the returned page dirty */
				5879	struct page *
				5880	i915_gem_object_get_dirty_page(struct drm_i915_gem_object *obj,
				5881	unsigned int n)
				5882	{
				5883	struct page *page;
				5884
				5885	page = i915_gem_object_get_page(obj, n);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	5886	if (!obj->mm.dirty)
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	5887	set_page_dirty(page);
				5888
				5889	return page;
				5890	}
				5891
				5892	dma_addr_t
				5893	i915_gem_object_get_dma_address(struct drm_i915_gem_object *obj,
				5894	unsigned long n)
				5895	{
				5896	struct scatterlist *sg;
				5897	unsigned int offset;
				5898
				5899	sg = i915_gem_object_get_sg(obj, n, &offset);
				5900	return sg_dma_address(sg) + (offset << PAGE_SHIFT);
				5901	}
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	5902
Chris Wilson	8eeb790	2017-07-26 19:16:01 +0100	[diff] [blame]	5903	int i915_gem_object_attach_phys(struct drm_i915_gem_object *obj, int align)
				5904	{
				5905	struct sg_table *pages;
				5906	int err;
				5907
				5908	if (align > obj->base.size)
				5909	return -EINVAL;
				5910
				5911	if (obj->ops == &i915_gem_phys_ops)
				5912	return 0;
				5913
				5914	if (obj->ops != &i915_gem_object_ops)
				5915	return -EINVAL;
				5916
				5917	err = i915_gem_object_unbind(obj);
				5918	if (err)
				5919	return err;
				5920
				5921	mutex_lock(&obj->mm.lock);
				5922
				5923	if (obj->mm.madv != I915_MADV_WILLNEED) {
				5924	err = -EFAULT;
				5925	goto err_unlock;
				5926	}
				5927
				5928	if (obj->mm.quirked) {
				5929	err = -EFAULT;
				5930	goto err_unlock;
				5931	}
				5932
				5933	if (obj->mm.mapping) {
				5934	err = -EBUSY;
				5935	goto err_unlock;
				5936	}
				5937
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	5938	pages = fetch_and_zero(&obj->mm.pages);
				5939	if (pages) {
				5940	struct drm_i915_private *i915 = to_i915(obj->base.dev);
				5941
				5942	__i915_gem_object_reset_page_iter(obj);
				5943
				5944	spin_lock(&i915->mm.obj_lock);
				5945	list_del(&obj->mm.link);
				5946	spin_unlock(&i915->mm.obj_lock);
				5947	}
				5948
Chris Wilson	8eeb790	2017-07-26 19:16:01 +0100	[diff] [blame]	5949	obj->ops = &i915_gem_phys_ops;
				5950
Chris Wilson	8fb6a5d	2017-07-26 19:16:02 +0100	[diff] [blame]	5951	err = ____i915_gem_object_get_pages(obj);
Chris Wilson	8eeb790	2017-07-26 19:16:01 +0100	[diff] [blame]	5952	if (err)
				5953	goto err_xfer;
				5954
				5955	/* Perma-pin (until release) the physical set of pages */
				5956	__i915_gem_object_pin_pages(obj);
				5957
				5958	if (!IS_ERR_OR_NULL(pages))
				5959	i915_gem_object_ops.put_pages(obj, pages);
				5960	mutex_unlock(&obj->mm.lock);
				5961	return 0;
				5962
				5963	err_xfer:
				5964	obj->ops = &i915_gem_object_ops;
				5965	obj->mm.pages = pages;
				5966	err_unlock:
				5967	mutex_unlock(&obj->mm.lock);
				5968	return err;
				5969	}
				5970
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	5971	#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
				5972	#include "selftests/scatterlist.c"
Chris Wilson	66d9cb5	2017-02-13 17:15:17 +0000	[diff] [blame]	5973	#include "selftests/mock_gem_device.c"
Chris Wilson	4465398	2017-02-13 17:15:20 +0000	[diff] [blame]	5974	#include "selftests/huge_gem_object.c"
Matthew Auld	4049866	2017-10-06 23:18:29 +0100	[diff] [blame]	5975	#include "selftests/huge_pages.c"
Chris Wilson	8335fd6	2017-02-13 17:15:28 +0000	[diff] [blame]	5976	#include "selftests/i915_gem_object.c"
Chris Wilson	1705945	2017-02-13 17:15:32 +0000	[diff] [blame]	5977	#include "selftests/i915_gem_coherency.c"
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	5978	#endif