Blame - drivers/gpu/drm/i915/i915_gem.c - SHIFTPHONES/kernel/common

blob: 7d45e71100bce7d3cba037dff76d08276da2ee68 [file] [log] [blame]

Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1	/*
Daniel Vetter	be6a037	2015-03-18 10:46:04 +0100	[diff] [blame]	2	* Copyright © 2008-2015 Intel Corporation
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3	*
				4	* Permission is hereby granted, free of charge, to any person obtaining a
				5	* copy of this software and associated documentation files (the "Software"),
				6	* to deal in the Software without restriction, including without limitation
				7	* the rights to use, copy, modify, merge, publish, distribute, sublicense,
				8	* and/or sell copies of the Software, and to permit persons to whom the
				9	* Software is furnished to do so, subject to the following conditions:
				10	*
				11	* The above copyright notice and this permission notice (including the next
				12	* paragraph) shall be included in all copies or substantial portions of the
				13	* Software.
				14	*
				15	* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
				16	* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
				17	* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
				18	* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
				19	* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
				20	* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
				21	* IN THE SOFTWARE.
				22	*
				23	* Authors:
				24	* Eric Anholt <eric@anholt.net>
				25	*
				26	*/
				27
David Howells	760285e	2012-10-02 18:01:07 +0100	[diff] [blame]	28	#include <drm/drmP.h>
David Herrmann	0de2397	2013-07-24 21:07:52 +0200	[diff] [blame]	29	#include <drm/drm_vma_manager.h>
David Howells	760285e	2012-10-02 18:01:07 +0100	[diff] [blame]	30	#include <drm/i915_drm.h>
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	31	#include "i915_drv.h"
Chris Wilson	57822dc	2017-02-22 11:40:48 +0000	[diff] [blame]	32	#include "i915_gem_clflush.h"
Yu Zhang	eb82289	2015-02-10 19:05:49 +0800	[diff] [blame]	33	#include "i915_vgpu.h"
Chris Wilson	1c5d22f	2009-08-25 11:15:50 +0100	[diff] [blame]	34	#include "i915_trace.h"
Jesse Barnes	652c393	2009-08-17 13:31:43 -0700	[diff] [blame]	35	#include "intel_drv.h"
Chris Wilson	5d723d7	2016-08-04 16:32:35 +0100	[diff] [blame]	36	#include "intel_frontbuffer.h"
Peter Antoine	0ccdacf	2016-04-13 15:03:25 +0100	[diff] [blame]	37	#include "intel_mocs.h"
Oscar Mateo	59b449d	2018-04-10 09:12:47 -0700	[diff] [blame]	38	#include "intel_workarounds.h"
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	39	#include "i915_gemfs.h"
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	40	#include <linux/dma-fence-array.h>
Chris Wilson	fe3288b	2017-02-12 17:20:01 +0000	[diff] [blame]	41	#include <linux/kthread.h>
Chris Wilson	c13d87e	2016-07-20 09:21:15 +0100	[diff] [blame]	42	#include <linux/reservation.h>
Hugh Dickins	5949eac	2011-06-27 16:18:18 -0700	[diff] [blame]	43	#include <linux/shmem_fs.h>
Tejun Heo	5a0e3ad	2010-03-24 17:04:11 +0900	[diff] [blame]	44	#include <linux/slab.h>
Chris Wilson	20e4933	2016-11-22 14:41:21 +0000	[diff] [blame]	45	#include <linux/stop_machine.h>
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	46	#include <linux/swap.h>
Jesse Barnes	79e5394	2008-11-07 14:24:08 -0800	[diff] [blame]	47	#include <linux/pci.h>
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	48	#include <linux/dma-buf.h>
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	49
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	50	static void i915_gem_flush_free_objects(struct drm_i915_private *i915);
Chris Wilson	6105080	2012-04-17 15:31:31 +0100	[diff] [blame]	51
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	52	static bool cpu_write_needs_clflush(struct drm_i915_gem_object *obj)
				53	{
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	54	if (obj->cache_dirty)
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	55	return false;
				56
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	57	if (!(obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_WRITE))
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	58	return true;
				59
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	60	return obj->pin_global; /* currently in use by HW, keep flushed */
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	61	}
				62
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	63	static int
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	64	insert_mappable_node(struct i915_ggtt *ggtt,
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	65	struct drm_mm_node *node, u32 size)
				66	{
				67	memset(node, 0, sizeof(*node));
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	68	return drm_mm_insert_node_in_range(&ggtt->vm.mm, node,
Chris Wilson	4e64e55	2017-02-02 21:04:38 +0000	[diff] [blame]	69	size, 0, I915_COLOR_UNEVICTABLE,
				70	0, ggtt->mappable_end,
				71	DRM_MM_INSERT_LOW);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	72	}
				73
				74	static void
				75	remove_mappable_node(struct drm_mm_node *node)
				76	{
				77	drm_mm_remove_node(node);
				78	}
				79
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	80	/* some bookkeeping */
				81	static void i915_gem_info_add_obj(struct drm_i915_private *dev_priv,
Chris Wilson	3ef7f22	2016-10-18 13:02:48 +0100	[diff] [blame]	82	u64 size)
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	83	{
Daniel Vetter	c20e835	2013-07-24 22:40:23 +0200	[diff] [blame]	84	spin_lock(&dev_priv->mm.object_stat_lock);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	85	dev_priv->mm.object_count++;
				86	dev_priv->mm.object_memory += size;
Daniel Vetter	c20e835	2013-07-24 22:40:23 +0200	[diff] [blame]	87	spin_unlock(&dev_priv->mm.object_stat_lock);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	88	}
				89
				90	static void i915_gem_info_remove_obj(struct drm_i915_private *dev_priv,
Chris Wilson	3ef7f22	2016-10-18 13:02:48 +0100	[diff] [blame]	91	u64 size)
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	92	{
Daniel Vetter	c20e835	2013-07-24 22:40:23 +0200	[diff] [blame]	93	spin_lock(&dev_priv->mm.object_stat_lock);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	94	dev_priv->mm.object_count--;
				95	dev_priv->mm.object_memory -= size;
Daniel Vetter	c20e835	2013-07-24 22:40:23 +0200	[diff] [blame]	96	spin_unlock(&dev_priv->mm.object_stat_lock);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	97	}
				98
Chris Wilson	21dd373	2011-01-26 15:55:56 +0000	[diff] [blame]	99	static int
Daniel Vetter	33196de	2012-11-14 17:14:05 +0100	[diff] [blame]	100	i915_gem_wait_for_error(struct i915_gpu_error *error)
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	101	{
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	102	int ret;
				103
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	104	might_sleep();
				105
Daniel Vetter	0a6759c	2012-07-04 22:18:41 +0200	[diff] [blame]	106	/*
				107	* Only wait 10 seconds for the gpu reset to complete to avoid hanging
				108	* userspace. If it takes that long something really bad is going on and
				109	* we should simply try to bail out and fail as gracefully as possible.
				110	*/
Daniel Vetter	1f83fee	2012-11-15 17:17:22 +0100	[diff] [blame]	111	ret = wait_event_interruptible_timeout(error->reset_queue,
Chris Wilson	8c185ec	2017-03-16 17:13:02 +0000	[diff] [blame]	112	!i915_reset_backoff(error),
Chris Wilson	b52992c	2016-10-28 13:58:24 +0100	[diff] [blame]	113	I915_RESET_TIMEOUT);
Daniel Vetter	0a6759c	2012-07-04 22:18:41 +0200	[diff] [blame]	114	if (ret == 0) {
				115	DRM_ERROR("Timed out waiting for the gpu reset to complete\n");
				116	return -EIO;
				117	} else if (ret < 0) {
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	118	return ret;
Chris Wilson	d98c52c	2016-04-13 17:35:05 +0100	[diff] [blame]	119	} else {
				120	return 0;
Daniel Vetter	0a6759c	2012-07-04 22:18:41 +0200	[diff] [blame]	121	}
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	122	}
				123
Chris Wilson	54cf91d	2010-11-25 18:00:26 +0000	[diff] [blame]	124	int i915_mutex_lock_interruptible(struct drm_device *dev)
Chris Wilson	76c1dec	2010-09-25 11:22:51 +0100	[diff] [blame]	125	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	126	struct drm_i915_private *dev_priv = to_i915(dev);
Chris Wilson	76c1dec	2010-09-25 11:22:51 +0100	[diff] [blame]	127	int ret;
				128
Daniel Vetter	33196de	2012-11-14 17:14:05 +0100	[diff] [blame]	129	ret = i915_gem_wait_for_error(&dev_priv->gpu_error);
Chris Wilson	76c1dec	2010-09-25 11:22:51 +0100	[diff] [blame]	130	if (ret)
				131	return ret;
				132
				133	ret = mutex_lock_interruptible(&dev->struct_mutex);
				134	if (ret)
				135	return ret;
				136
Chris Wilson	76c1dec	2010-09-25 11:22:51 +0100	[diff] [blame]	137	return 0;
				138	}
Chris Wilson	30dbf0c	2010-09-25 10:19:17 +0100	[diff] [blame]	139
Chris Wilson	e4d2006	2018-04-06 16:51:44 +0100	[diff] [blame]	140	static u32 __i915_gem_park(struct drm_i915_private *i915)
				141	{
Chris Wilson	4dfacb0	2018-05-31 09:22:43 +0100	[diff] [blame]	142	GEM_TRACE("\n");
				143
Chris Wilson	e4d2006	2018-04-06 16:51:44 +0100	[diff] [blame]	144	lockdep_assert_held(&i915->drm.struct_mutex);
				145	GEM_BUG_ON(i915->gt.active_requests);
Chris Wilson	643b450	2018-04-30 14:15:03 +0100	[diff] [blame]	146	GEM_BUG_ON(!list_empty(&i915->gt.active_rings));
Chris Wilson	e4d2006	2018-04-06 16:51:44 +0100	[diff] [blame]	147
				148	if (!i915->gt.awake)
				149	return I915_EPOCH_INVALID;
				150
				151	GEM_BUG_ON(i915->gt.epoch == I915_EPOCH_INVALID);
				152
				153	/*
				154	* Be paranoid and flush a concurrent interrupt to make sure
				155	* we don't reactivate any irq tasklets after parking.
				156	*
				157	* FIXME: Note that even though we have waited for execlists to be idle,
				158	* there may still be an in-flight interrupt even though the CSB
				159	* is now empty. synchronize_irq() makes sure that a residual interrupt
				160	* is completed before we continue, but it doesn't prevent the HW from
				161	* raising a spurious interrupt later. To complete the shield we should
				162	* coordinate disabling the CS irq with flushing the interrupts.
				163	*/
				164	synchronize_irq(i915->drm.irq);
				165
				166	intel_engines_park(i915);
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	167	i915_timelines_park(i915);
Chris Wilson	e4d2006	2018-04-06 16:51:44 +0100	[diff] [blame]	168
				169	i915_pmu_gt_parked(i915);
Chris Wilson	3365e22	2018-05-03 20:51:14 +0100	[diff] [blame]	170	i915_vma_parked(i915);
Chris Wilson	e4d2006	2018-04-06 16:51:44 +0100	[diff] [blame]	171
				172	i915->gt.awake = false;
				173
				174	if (INTEL_GEN(i915) >= 6)
				175	gen6_rps_idle(i915);
				176
				177	intel_display_power_put(i915, POWER_DOMAIN_GT_IRQ);
				178
				179	intel_runtime_pm_put(i915);
				180
				181	return i915->gt.epoch;
				182	}
				183
				184	void i915_gem_park(struct drm_i915_private *i915)
				185	{
Chris Wilson	4dfacb0	2018-05-31 09:22:43 +0100	[diff] [blame]	186	GEM_TRACE("\n");
				187
Chris Wilson	e4d2006	2018-04-06 16:51:44 +0100	[diff] [blame]	188	lockdep_assert_held(&i915->drm.struct_mutex);
				189	GEM_BUG_ON(i915->gt.active_requests);
				190
				191	if (!i915->gt.awake)
				192	return;
				193
				194	/* Defer the actual call to __i915_gem_park() to prevent ping-pongs */
				195	mod_delayed_work(i915->wq, &i915->gt.idle_work, msecs_to_jiffies(100));
				196	}
				197
				198	void i915_gem_unpark(struct drm_i915_private *i915)
				199	{
Chris Wilson	4dfacb0	2018-05-31 09:22:43 +0100	[diff] [blame]	200	GEM_TRACE("\n");
				201
Chris Wilson	e4d2006	2018-04-06 16:51:44 +0100	[diff] [blame]	202	lockdep_assert_held(&i915->drm.struct_mutex);
				203	GEM_BUG_ON(!i915->gt.active_requests);
				204
				205	if (i915->gt.awake)
				206	return;
				207
				208	intel_runtime_pm_get_noresume(i915);
				209
				210	/*
				211	* It seems that the DMC likes to transition between the DC states a lot
				212	* when there are no connected displays (no active power domains) during
				213	* command submission.
				214	*
				215	* This activity has negative impact on the performance of the chip with
				216	* huge latencies observed in the interrupt handler and elsewhere.
				217	*
				218	* Work around it by grabbing a GT IRQ power domain whilst there is any
				219	* GT activity, preventing any DC state transitions.
				220	*/
				221	intel_display_power_get(i915, POWER_DOMAIN_GT_IRQ);
				222
				223	i915->gt.awake = true;
				224	if (unlikely(++i915->gt.epoch == 0)) /* keep 0 as invalid */
				225	i915->gt.epoch = 1;
				226
				227	intel_enable_gt_powersave(i915);
				228	i915_update_gfx_val(i915);
				229	if (INTEL_GEN(i915) >= 6)
				230	gen6_rps_busy(i915);
				231	i915_pmu_gt_unparked(i915);
				232
				233	intel_engines_unpark(i915);
				234
				235	i915_queue_hangcheck(i915);
				236
				237	queue_delayed_work(i915->wq,
				238	&i915->gt.retire_work,
				239	round_jiffies_up_relative(HZ));
				240	}
				241
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	242	int
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	243	i915_gem_get_aperture_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	244	struct drm_file *file)
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	245	{
Joonas Lahtinen	72e96d6	2016-03-30 16:57:10 +0300	[diff] [blame]	246	struct drm_i915_private *dev_priv = to_i915(dev);
Joonas Lahtinen	62106b4	2016-03-18 10:42:57 +0200	[diff] [blame]	247	struct i915_ggtt *ggtt = &dev_priv->ggtt;
Joonas Lahtinen	72e96d6	2016-03-30 16:57:10 +0300	[diff] [blame]	248	struct drm_i915_gem_get_aperture *args = data;
Tvrtko Ursulin	ca1543b	2015-07-01 11:51:10 +0100	[diff] [blame]	249	struct i915_vma *vma;
Weinan Li	ff8f797	2017-05-31 10:35:52 +0800	[diff] [blame]	250	u64 pinned;
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	251
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	252	pinned = ggtt->vm.reserved;
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	253	mutex_lock(&dev->struct_mutex);
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	254	list_for_each_entry(vma, &ggtt->vm.active_list, vm_link)
Chris Wilson	20dfbde	2016-08-04 16:32:30 +0100	[diff] [blame]	255	if (i915_vma_is_pinned(vma))
Tvrtko Ursulin	ca1543b	2015-07-01 11:51:10 +0100	[diff] [blame]	256	pinned += vma->node.size;
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	257	list_for_each_entry(vma, &ggtt->vm.inactive_list, vm_link)
Chris Wilson	20dfbde	2016-08-04 16:32:30 +0100	[diff] [blame]	258	if (i915_vma_is_pinned(vma))
Tvrtko Ursulin	ca1543b	2015-07-01 11:51:10 +0100	[diff] [blame]	259	pinned += vma->node.size;
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	260	mutex_unlock(&dev->struct_mutex);
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	261
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	262	args->aper_size = ggtt->vm.total;
Akshay Joshi	0206e35	2011-08-16 15:34:10 -0400	[diff] [blame]	263	args->aper_available_size = args->aper_size - pinned;
Chris Wilson	6299f99	2010-11-24 12:23:44 +0000	[diff] [blame]	264
Eric Anholt	5a125c3	2008-10-22 21:40:13 -0700	[diff] [blame]	265	return 0;
				266	}
				267
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	268	static int i915_gem_object_get_pages_phys(struct drm_i915_gem_object *obj)
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	269	{
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	270	struct address_space *mapping = obj->base.filp->f_mapping;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	271	drm_dma_handle_t *phys;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	272	struct sg_table *st;
				273	struct scatterlist *sg;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	274	char *vaddr;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	275	int i;
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	276	int err;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	277
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	278	if (WARN_ON(i915_gem_object_needs_bit17_swizzle(obj)))
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	279	return -EINVAL;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	280
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	281	/* Always aligning to the object size, allows a single allocation
				282	* to handle all possible callers, and given typical object sizes,
				283	* the alignment of the buddy allocation will naturally match.
				284	*/
				285	phys = drm_pci_alloc(obj->base.dev,
Ville Syrjälä	750fae2	2017-09-07 17:32:03 +0300	[diff] [blame]	286	roundup_pow_of_two(obj->base.size),
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	287	roundup_pow_of_two(obj->base.size));
				288	if (!phys)
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	289	return -ENOMEM;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	290
				291	vaddr = phys->vaddr;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	292	for (i = 0; i < obj->base.size / PAGE_SIZE; i++) {
				293	struct page *page;
				294	char *src;
				295
				296	page = shmem_read_mapping_page(mapping, i);
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	297	if (IS_ERR(page)) {
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	298	err = PTR_ERR(page);
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	299	goto err_phys;
				300	}
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	301
				302	src = kmap_atomic(page);
				303	memcpy(vaddr, src, PAGE_SIZE);
				304	drm_clflush_virt_range(vaddr, PAGE_SIZE);
				305	kunmap_atomic(src);
				306
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	307	put_page(page);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	308	vaddr += PAGE_SIZE;
				309	}
				310
Chris Wilson	c033666	2016-05-06 15:40:21 +0100	[diff] [blame]	311	i915_gem_chipset_flush(to_i915(obj->base.dev));
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	312
				313	st = kmalloc(sizeof(*st), GFP_KERNEL);
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	314	if (!st) {
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	315	err = -ENOMEM;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	316	goto err_phys;
				317	}
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	318
				319	if (sg_alloc_table(st, 1, GFP_KERNEL)) {
				320	kfree(st);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	321	err = -ENOMEM;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	322	goto err_phys;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	323	}
				324
				325	sg = st->sgl;
				326	sg->offset = 0;
				327	sg->length = obj->base.size;
				328
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	329	sg_dma_address(sg) = phys->busaddr;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	330	sg_dma_len(sg) = obj->base.size;
				331
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	332	obj->phys_handle = phys;
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	333
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	334	__i915_gem_object_set_pages(obj, st, sg->length);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	335
				336	return 0;
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	337
				338	err_phys:
				339	drm_pci_free(obj->base.dev, phys);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	340
				341	return err;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	342	}
				343
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	344	static void __start_cpu_write(struct drm_i915_gem_object *obj)
				345	{
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	346	obj->read_domains = I915_GEM_DOMAIN_CPU;
				347	obj->write_domain = I915_GEM_DOMAIN_CPU;
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	348	if (cpu_write_needs_clflush(obj))
				349	obj->cache_dirty = true;
				350	}
				351
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	352	static void
Chris Wilson	2b3c831	2016-11-11 14:58:09 +0000	[diff] [blame]	353	__i915_gem_object_release_shmem(struct drm_i915_gem_object *obj,
Chris Wilson	e5facdf	2016-12-23 14:57:57 +0000	[diff] [blame]	354	struct sg_table *pages,
				355	bool needs_clflush)
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	356	{
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	357	GEM_BUG_ON(obj->mm.madv == __I915_MADV_PURGED);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	358
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	359	if (obj->mm.madv == I915_MADV_DONTNEED)
				360	obj->mm.dirty = false;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	361
Chris Wilson	e5facdf	2016-12-23 14:57:57 +0000	[diff] [blame]	362	if (needs_clflush &&
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	363	(obj->read_domains & I915_GEM_DOMAIN_CPU) == 0 &&
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	364	!(obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_READ))
Chris Wilson	2b3c831	2016-11-11 14:58:09 +0000	[diff] [blame]	365	drm_clflush_sg(pages);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	366
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	367	__start_cpu_write(obj);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	368	}
				369
				370	static void
				371	i915_gem_object_put_pages_phys(struct drm_i915_gem_object *obj,
				372	struct sg_table *pages)
				373	{
Chris Wilson	e5facdf	2016-12-23 14:57:57 +0000	[diff] [blame]	374	__i915_gem_object_release_shmem(obj, pages, false);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	375
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	376	if (obj->mm.dirty) {
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	377	struct address_space *mapping = obj->base.filp->f_mapping;
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	378	char *vaddr = obj->phys_handle->vaddr;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	379	int i;
				380
				381	for (i = 0; i < obj->base.size / PAGE_SIZE; i++) {
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	382	struct page *page;
				383	char *dst;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	384
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	385	page = shmem_read_mapping_page(mapping, i);
				386	if (IS_ERR(page))
				387	continue;
				388
				389	dst = kmap_atomic(page);
				390	drm_clflush_virt_range(vaddr, PAGE_SIZE);
				391	memcpy(dst, vaddr, PAGE_SIZE);
				392	kunmap_atomic(dst);
				393
				394	set_page_dirty(page);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	395	if (obj->mm.madv == I915_MADV_WILLNEED)
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	396	mark_page_accessed(page);
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	397	put_page(page);
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	398	vaddr += PAGE_SIZE;
				399	}
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	400	obj->mm.dirty = false;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	401	}
				402
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	403	sg_free_table(pages);
				404	kfree(pages);
Chris Wilson	dbb4351	2016-12-07 13:34:11 +0000	[diff] [blame]	405
				406	drm_pci_free(obj->base.dev, obj->phys_handle);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	407	}
				408
				409	static void
				410	i915_gem_object_release_phys(struct drm_i915_gem_object *obj)
				411	{
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	412	i915_gem_object_unpin_pages(obj);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	413	}
				414
				415	static const struct drm_i915_gem_object_ops i915_gem_phys_ops = {
				416	.get_pages = i915_gem_object_get_pages_phys,
				417	.put_pages = i915_gem_object_put_pages_phys,
				418	.release = i915_gem_object_release_phys,
				419	};
				420
Chris Wilson	581ab1f	2017-02-15 16:39:00 +0000	[diff] [blame]	421	static const struct drm_i915_gem_object_ops i915_gem_object_ops;
				422
Chris Wilson	35a9611	2016-08-14 18:44:40 +0100	[diff] [blame]	423	int i915_gem_object_unbind(struct drm_i915_gem_object *obj)
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	424	{
				425	struct i915_vma *vma;
				426	LIST_HEAD(still_in_list);
Chris Wilson	02bef8f	2016-08-14 18:44:41 +0100	[diff] [blame]	427	int ret;
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	428
Chris Wilson	02bef8f	2016-08-14 18:44:41 +0100	[diff] [blame]	429	lockdep_assert_held(&obj->base.dev->struct_mutex);
				430
				431	/* Closed vma are removed from the obj->vma_list - but they may
				432	* still have an active binding on the object. To remove those we
				433	* must wait for all rendering to complete to the object (as unbinding
				434	* must anyway), and retire the requests.
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	435	*/
Chris Wilson	5888fc9	2017-12-04 13:25:13 +0000	[diff] [blame]	436	ret = i915_gem_object_set_to_cpu_domain(obj, false);
Chris Wilson	02bef8f	2016-08-14 18:44:41 +0100	[diff] [blame]	437	if (ret)
				438	return ret;
				439
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	440	while ((vma = list_first_entry_or_null(&obj->vma_list,
				441	struct i915_vma,
				442	obj_link))) {
				443	list_move_tail(&vma->obj_link, &still_in_list);
				444	ret = i915_vma_unbind(vma);
				445	if (ret)
				446	break;
				447	}
				448	list_splice(&still_in_list, &obj->vma_list);
				449
				450	return ret;
				451	}
				452
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	453	static long
				454	i915_gem_object_wait_fence(struct dma_fence *fence,
				455	unsigned int flags,
				456	long timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	457	struct intel_rps_client *rps_client)
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	458	{
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	459	struct i915_request *rq;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	460
				461	BUILD_BUG_ON(I915_WAIT_INTERRUPTIBLE != 0x1);
				462
				463	if (test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &fence->flags))
				464	return timeout;
				465
				466	if (!dma_fence_is_i915(fence))
				467	return dma_fence_wait_timeout(fence,
				468	flags & I915_WAIT_INTERRUPTIBLE,
				469	timeout);
				470
				471	rq = to_request(fence);
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	472	if (i915_request_completed(rq))
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	473	goto out;
				474
Chris Wilson	e9af4ea	2018-01-18 13:16:09 +0000	[diff] [blame]	475	/*
				476	* This client is about to stall waiting for the GPU. In many cases
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	477	* this is undesirable and limits the throughput of the system, as
				478	* many clients cannot continue processing user input/output whilst
				479	* blocked. RPS autotuning may take tens of milliseconds to respond
				480	* to the GPU load and thus incurs additional latency for the client.
				481	* We can circumvent that by promoting the GPU frequency to maximum
				482	* before we wait. This makes the GPU throttle up much more quickly
				483	* (good for benchmarks and user experience, e.g. window animations),
				484	* but at a cost of spending more power processing the workload
				485	* (bad for battery). Not all clients even want their results
				486	* immediately and for them we should just let the GPU select its own
				487	* frequency to maximise efficiency. To prevent a single client from
				488	* forcing the clocks too high for the whole system, we only allow
				489	* each client to waitboost once in a busy period.
				490	*/
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	491	if (rps_client && !i915_request_started(rq)) {
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	492	if (INTEL_GEN(rq->i915) >= 6)
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	493	gen6_rps_boost(rq, rps_client);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	494	}
				495
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	496	timeout = i915_request_wait(rq, flags, timeout);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	497
				498	out:
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	499	if (flags & I915_WAIT_LOCKED && i915_request_completed(rq))
				500	i915_request_retire_upto(rq);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	501
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	502	return timeout;
				503	}
				504
				505	static long
				506	i915_gem_object_wait_reservation(struct reservation_object *resv,
				507	unsigned int flags,
				508	long timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	509	struct intel_rps_client *rps_client)
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	510	{
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	511	unsigned int seq = __read_seqcount_begin(&resv->seq);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	512	struct dma_fence *excl;
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	513	bool prune_fences = false;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	514
				515	if (flags & I915_WAIT_ALL) {
				516	struct dma_fence **shared;
				517	unsigned int count, i;
				518	int ret;
				519
				520	ret = reservation_object_get_fences_rcu(resv,
				521	&excl, &count, &shared);
				522	if (ret)
				523	return ret;
				524
				525	for (i = 0; i < count; i++) {
				526	timeout = i915_gem_object_wait_fence(shared[i],
				527	flags, timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	528	rps_client);
Chris Wilson	d892e93	2017-02-12 21:53:43 +0000	[diff] [blame]	529	if (timeout < 0)
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	530	break;
				531
				532	dma_fence_put(shared[i]);
				533	}
				534
				535	for (; i < count; i++)
				536	dma_fence_put(shared[i]);
				537	kfree(shared);
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	538
Chris Wilson	fa73055	2018-03-07 17:13:03 +0000	[diff] [blame]	539	/*
				540	* If both shared fences and an exclusive fence exist,
				541	* then by construction the shared fences must be later
				542	* than the exclusive fence. If we successfully wait for
				543	* all the shared fences, we know that the exclusive fence
				544	* must all be signaled. If all the shared fences are
				545	* signaled, we can prune the array and recover the
				546	* floating references on the fences/requests.
				547	*/
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	548	prune_fences = count && timeout >= 0;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	549	} else {
				550	excl = reservation_object_get_excl_rcu(resv);
				551	}
				552
Chris Wilson	fa73055	2018-03-07 17:13:03 +0000	[diff] [blame]	553	if (excl && timeout >= 0)
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	554	timeout = i915_gem_object_wait_fence(excl, flags, timeout,
				555	rps_client);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	556
				557	dma_fence_put(excl);
				558
Chris Wilson	fa73055	2018-03-07 17:13:03 +0000	[diff] [blame]	559	/*
				560	* Opportunistically prune the fences iff we know they have all been
Chris Wilson	03d1cac	2017-03-08 13:26:28 +0000	[diff] [blame]	561	* signaled and that the reservation object has not been changed (i.e.
				562	* no new fences have been added).
				563	*/
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	564	if (prune_fences && !__read_seqcount_retry(&resv->seq, seq)) {
Chris Wilson	03d1cac	2017-03-08 13:26:28 +0000	[diff] [blame]	565	if (reservation_object_trylock(resv)) {
				566	if (!__read_seqcount_retry(&resv->seq, seq))
				567	reservation_object_add_excl_fence(resv, NULL);
				568	reservation_object_unlock(resv);
				569	}
Chris Wilson	e54ca97	2017-02-17 15:13:04 +0000	[diff] [blame]	570	}
				571
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	572	return timeout;
				573	}
				574
Chris Wilson	b7268c5	2018-04-18 19:40:52 +0100	[diff] [blame]	575	static void __fence_set_priority(struct dma_fence *fence,
				576	const struct i915_sched_attr *attr)
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	577	{
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	578	struct i915_request *rq;
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	579	struct intel_engine_cs *engine;
				580
Chris Wilson	c218ee0	2018-01-06 10:56:18 +0000	[diff] [blame]	581	if (dma_fence_is_signaled(fence) \|\| !dma_fence_is_i915(fence))
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	582	return;
				583
				584	rq = to_request(fence);
				585	engine = rq->engine;
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	586
Chris Wilson	4f6d8fc	2018-05-07 14:57:25 +0100	[diff] [blame]	587	local_bh_disable();
				588	rcu_read_lock(); /* RCU serialisation for set-wedged protection */
Chris Wilson	47650db	2018-03-07 13:42:25 +0000	[diff] [blame]	589	if (engine->schedule)
Chris Wilson	b7268c5	2018-04-18 19:40:52 +0100	[diff] [blame]	590	engine->schedule(rq, attr);
Chris Wilson	47650db	2018-03-07 13:42:25 +0000	[diff] [blame]	591	rcu_read_unlock();
Chris Wilson	4f6d8fc	2018-05-07 14:57:25 +0100	[diff] [blame]	592	local_bh_enable(); /* kick the tasklets if queues were reprioritised */
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	593	}
				594
Chris Wilson	b7268c5	2018-04-18 19:40:52 +0100	[diff] [blame]	595	static void fence_set_priority(struct dma_fence *fence,
				596	const struct i915_sched_attr *attr)
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	597	{
				598	/* Recurse once into a fence-array */
				599	if (dma_fence_is_array(fence)) {
				600	struct dma_fence_array *array = to_dma_fence_array(fence);
				601	int i;
				602
				603	for (i = 0; i < array->num_fences; i++)
Chris Wilson	b7268c5	2018-04-18 19:40:52 +0100	[diff] [blame]	604	__fence_set_priority(array->fences[i], attr);
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	605	} else {
Chris Wilson	b7268c5	2018-04-18 19:40:52 +0100	[diff] [blame]	606	__fence_set_priority(fence, attr);
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	607	}
				608	}
				609
				610	int
				611	i915_gem_object_wait_priority(struct drm_i915_gem_object *obj,
				612	unsigned int flags,
Chris Wilson	b7268c5	2018-04-18 19:40:52 +0100	[diff] [blame]	613	const struct i915_sched_attr *attr)
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	614	{
				615	struct dma_fence *excl;
				616
				617	if (flags & I915_WAIT_ALL) {
				618	struct dma_fence **shared;
				619	unsigned int count, i;
				620	int ret;
				621
				622	ret = reservation_object_get_fences_rcu(obj->resv,
				623	&excl, &count, &shared);
				624	if (ret)
				625	return ret;
				626
				627	for (i = 0; i < count; i++) {
Chris Wilson	b7268c5	2018-04-18 19:40:52 +0100	[diff] [blame]	628	fence_set_priority(shared[i], attr);
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	629	dma_fence_put(shared[i]);
				630	}
				631
				632	kfree(shared);
				633	} else {
				634	excl = reservation_object_get_excl_rcu(obj->resv);
				635	}
				636
				637	if (excl) {
Chris Wilson	b7268c5	2018-04-18 19:40:52 +0100	[diff] [blame]	638	fence_set_priority(excl, attr);
Chris Wilson	6b5e90f	2016-11-14 20:41:05 +0000	[diff] [blame]	639	dma_fence_put(excl);
				640	}
				641	return 0;
				642	}
				643
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	644	/**
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	645	* Waits for rendering to the object to be completed
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	646	* @obj: i915 gem object
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	647	* @flags: how to wait (under a lock, for all rendering or just for writes etc)
				648	* @timeout: how long to wait
Chris Wilson	a0a8b1c	2017-11-09 14:06:44 +0000	[diff] [blame]	649	* @rps_client: client (user process) to charge for any waitboosting
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	650	*/
				651	int
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	652	i915_gem_object_wait(struct drm_i915_gem_object *obj,
				653	unsigned int flags,
				654	long timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	655	struct intel_rps_client *rps_client)
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	656	{
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	657	might_sleep();
				658	#if IS_ENABLED(CONFIG_LOCKDEP)
				659	GEM_BUG_ON(debug_locks &&
				660	!!lockdep_is_held(&obj->base.dev->struct_mutex) !=
				661	!!(flags & I915_WAIT_LOCKED));
				662	#endif
				663	GEM_BUG_ON(timeout < 0);
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	664
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	665	timeout = i915_gem_object_wait_reservation(obj->resv,
				666	flags, timeout,
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	667	rps_client);
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	668	return timeout < 0 ? timeout : 0;
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	669	}
				670
				671	static struct intel_rps_client to_rps_client(struct drm_file file)
				672	{
				673	struct drm_i915_file_private *fpriv = file->driver_priv;
				674
Sagar Arun Kamble	562d9ba	2017-10-10 22:30:06 +0100	[diff] [blame]	675	return &fpriv->rps_client;
Chris Wilson	00e60f2	2016-08-04 16:32:40 +0100	[diff] [blame]	676	}
				677
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	678	static int
				679	i915_gem_phys_pwrite(struct drm_i915_gem_object *obj,
				680	struct drm_i915_gem_pwrite *args,
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	681	struct drm_file *file)
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	682	{
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	683	void *vaddr = obj->phys_handle->vaddr + args->offset;
Gustavo Padovan	3ed605b	2016-04-26 12:32:27 -0300	[diff] [blame]	684	char __user *user_data = u64_to_user_ptr(args->data_ptr);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	685
				686	/* We manually control the domain here and pretend that it
				687	* remains coherent i.e. in the GTT domain, like shmem_pwrite.
				688	*/
Rodrigo Vivi	77a0d1c	2015-06-18 11:43:24 -0700	[diff] [blame]	689	intel_fb_obj_invalidate(obj, ORIGIN_CPU);
Chris Wilson	10466d2	2017-01-06 15:22:38 +0000	[diff] [blame]	690	if (copy_from_user(vaddr, user_data, args->size))
				691	return -EFAULT;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	692
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	693	drm_clflush_virt_range(vaddr, args->size);
Chris Wilson	10466d2	2017-01-06 15:22:38 +0000	[diff] [blame]	694	i915_gem_chipset_flush(to_i915(obj->base.dev));
Paulo Zanoni	063e4e6	2015-02-13 17:23:45 -0200	[diff] [blame]	695
Chris Wilson	d59b21e	2017-02-22 11:40:49 +0000	[diff] [blame]	696	intel_fb_obj_flush(obj, ORIGIN_CPU);
Chris Wilson	10466d2	2017-01-06 15:22:38 +0000	[diff] [blame]	697	return 0;
Chris Wilson	0073115	2014-05-21 12:42:56 +0100	[diff] [blame]	698	}
				699
Tvrtko Ursulin	187685c	2016-12-01 14:16:36 +0000	[diff] [blame]	700	void i915_gem_object_alloc(struct drm_i915_private dev_priv)
Chris Wilson	42dcedd	2012-11-15 11:32:30 +0000	[diff] [blame]	701	{
Chris Wilson	efab6d8	2015-04-07 16:20:57 +0100	[diff] [blame]	702	return kmem_cache_zalloc(dev_priv->objects, GFP_KERNEL);
Chris Wilson	42dcedd	2012-11-15 11:32:30 +0000	[diff] [blame]	703	}
				704
				705	void i915_gem_object_free(struct drm_i915_gem_object *obj)
				706	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	707	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
Chris Wilson	efab6d8	2015-04-07 16:20:57 +0100	[diff] [blame]	708	kmem_cache_free(dev_priv->objects, obj);
Chris Wilson	42dcedd	2012-11-15 11:32:30 +0000	[diff] [blame]	709	}
				710
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	711	static int
				712	i915_gem_create(struct drm_file *file,
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	713	struct drm_i915_private *dev_priv,
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	714	uint64_t size,
				715	uint32_t *handle_p)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	716	{
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	717	struct drm_i915_gem_object *obj;
Pekka Paalanen	a1a2d1d	2009-08-23 12:40:55 +0300	[diff] [blame]	718	int ret;
				719	u32 handle;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	720
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	721	size = roundup(size, PAGE_SIZE);
Chris Wilson	8ffc024	2011-09-14 14:14:28 +0200	[diff] [blame]	722	if (size == 0)
				723	return -EINVAL;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	724
				725	/* Allocate the new object */
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	726	obj = i915_gem_object_create(dev_priv, size);
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	727	if (IS_ERR(obj))
				728	return PTR_ERR(obj);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	729
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	730	ret = drm_gem_handle_create(file, &obj->base, &handle);
Chris Wilson	202f2fe	2010-10-14 13:20:40 +0100	[diff] [blame]	731	/* drop reference from allocate - handle holds it now */
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	732	i915_gem_object_put(obj);
Daniel Vetter	d861e33	2013-07-24 23:25:03 +0200	[diff] [blame]	733	if (ret)
				734	return ret;
Chris Wilson	202f2fe	2010-10-14 13:20:40 +0100	[diff] [blame]	735
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	736	*handle_p = handle;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	737	return 0;
				738	}
				739
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	740	int
				741	i915_gem_dumb_create(struct drm_file *file,
				742	struct drm_device *dev,
				743	struct drm_mode_create_dumb *args)
				744	{
				745	/* have to work out size/pitch and return them */
Paulo Zanoni	de45eaf	2013-10-18 18:48:24 -0300	[diff] [blame]	746	args->pitch = ALIGN(args->width * DIV_ROUND_UP(args->bpp, 8), 64);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	747	args->size = args->pitch * args->height;
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	748	return i915_gem_create(file, to_i915(dev),
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	749	args->size, &args->handle);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	750	}
				751
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	752	static bool gpu_write_needs_clflush(struct drm_i915_gem_object *obj)
				753	{
				754	return !(obj->cache_level == I915_CACHE_NONE \|\|
				755	obj->cache_level == I915_CACHE_WT);
				756	}
				757
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	758	/**
				759	* Creates a new mm object and returns a handle to it.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	760	* @dev: drm device pointer
				761	* @data: ioctl data blob
				762	* @file: drm file pointer
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	763	*/
				764	int
				765	i915_gem_create_ioctl(struct drm_device dev, void data,
				766	struct drm_file *file)
				767	{
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	768	struct drm_i915_private *dev_priv = to_i915(dev);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	769	struct drm_i915_gem_create *args = data;
Daniel Vetter	63ed2cb	2012-04-23 16:50:50 +0200	[diff] [blame]	770
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	771	i915_gem_flush_free_objects(dev_priv);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	772
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	773	return i915_gem_create(file, dev_priv,
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	774	args->size, &args->handle);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	775	}
				776
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	777	static inline enum fb_op_origin
				778	fb_write_origin(struct drm_i915_gem_object *obj, unsigned int domain)
				779	{
				780	return (domain == I915_GEM_DOMAIN_GTT ?
				781	obj->frontbuffer_ggtt_origin : ORIGIN_CPU);
				782	}
				783
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	784	void i915_gem_flush_ggtt_writes(struct drm_i915_private *dev_priv)
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	785	{
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	786	/*
				787	* No actual flushing is required for the GTT write domain for reads
				788	* from the GTT domain. Writes to it "immediately" go to main memory
				789	* as far as we know, so there's no chipset flush. It also doesn't
				790	* land in the GPU render cache.
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	791	*
				792	* However, we do have to enforce the order so that all writes through
				793	* the GTT land before any writes to the device, such as updates to
				794	* the GATT itself.
				795	*
				796	* We also have to wait a bit for the writes to land from the GTT.
				797	* An uncached read (i.e. mmio) seems to be ideal for the round-trip
				798	* timing. This issue has only been observed when switching quickly
				799	* between GTT writes and CPU reads from inside the kernel on recent hw,
				800	* and it appears to only affect discrete GTT blocks (i.e. on LLC
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	801	* system agents we cannot reproduce this behaviour, until Cannonlake
				802	* that was!).
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	803	*/
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	804
Chris Wilson	900ccf3	2018-07-20 11:19:10 +0100	[diff] [blame]	805	wmb();
				806
				807	if (INTEL_INFO(dev_priv)->has_coherent_ggtt)
				808	return;
				809
Chris Wilson	a8bd3b8	2018-07-17 10:26:55 +0100	[diff] [blame]	810	i915_gem_chipset_flush(dev_priv);
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	811
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	812	intel_runtime_pm_get(dev_priv);
				813	spin_lock_irq(&dev_priv->uncore.lock);
				814
				815	POSTING_READ_FW(RING_HEAD(RENDER_RING_BASE));
				816
				817	spin_unlock_irq(&dev_priv->uncore.lock);
				818	intel_runtime_pm_put(dev_priv);
				819	}
				820
				821	static void
				822	flush_write_domain(struct drm_i915_gem_object *obj, unsigned int flush_domains)
				823	{
				824	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
				825	struct i915_vma *vma;
				826
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	827	if (!(obj->write_domain & flush_domains))
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	828	return;
				829
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	830	switch (obj->write_domain) {
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	831	case I915_GEM_DOMAIN_GTT:
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	832	i915_gem_flush_ggtt_writes(dev_priv);
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	833
				834	intel_fb_obj_flush(obj,
				835	fb_write_origin(obj, I915_GEM_DOMAIN_GTT));
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	836
Chris Wilson	e2189dd	2017-12-07 21:14:07 +0000	[diff] [blame]	837	for_each_ggtt_vma(vma, obj) {
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	838	if (vma->iomap)
				839	continue;
				840
				841	i915_vma_unset_ggtt_write(vma);
				842	}
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	843	break;
				844
Chris Wilson	add00e6	2018-07-06 12:54:02 +0100	[diff] [blame]	845	case I915_GEM_DOMAIN_WC:
				846	wmb();
				847	break;
				848
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	849	case I915_GEM_DOMAIN_CPU:
				850	i915_gem_clflush_object(obj, I915_CLFLUSH_SYNC);
				851	break;
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	852
				853	case I915_GEM_DOMAIN_RENDER:
				854	if (gpu_write_needs_clflush(obj))
				855	obj->cache_dirty = true;
				856	break;
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	857	}
				858
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	859	obj->write_domain = 0;
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	860	}
				861
Daniel Vetter	8c59967	2011-12-14 13:57:31 +0100	[diff] [blame]	862	static inline int
Daniel Vetter	8461d22	2011-12-14 13:57:32 +0100	[diff] [blame]	863	__copy_to_user_swizzled(char __user *cpu_vaddr,
				864	const char *gpu_vaddr, int gpu_offset,
				865	int length)
				866	{
				867	int ret, cpu_offset = 0;
				868
				869	while (length > 0) {
				870	int cacheline_end = ALIGN(gpu_offset + 1, 64);
				871	int this_length = min(cacheline_end - gpu_offset, length);
				872	int swizzled_gpu_offset = gpu_offset ^ 64;
				873
				874	ret = __copy_to_user(cpu_vaddr + cpu_offset,
				875	gpu_vaddr + swizzled_gpu_offset,
				876	this_length);
				877	if (ret)
				878	return ret + length;
				879
				880	cpu_offset += this_length;
				881	gpu_offset += this_length;
				882	length -= this_length;
				883	}
				884
				885	return 0;
				886	}
				887
				888	static inline int
Ben Widawsky	4f0c7cf	2012-04-16 14:07:47 -0700	[diff] [blame]	889	__copy_from_user_swizzled(char *gpu_vaddr, int gpu_offset,
				890	const char __user *cpu_vaddr,
Daniel Vetter	8c59967	2011-12-14 13:57:31 +0100	[diff] [blame]	891	int length)
				892	{
				893	int ret, cpu_offset = 0;
				894
				895	while (length > 0) {
				896	int cacheline_end = ALIGN(gpu_offset + 1, 64);
				897	int this_length = min(cacheline_end - gpu_offset, length);
				898	int swizzled_gpu_offset = gpu_offset ^ 64;
				899
				900	ret = __copy_from_user(gpu_vaddr + swizzled_gpu_offset,
				901	cpu_vaddr + cpu_offset,
				902	this_length);
				903	if (ret)
				904	return ret + length;
				905
				906	cpu_offset += this_length;
				907	gpu_offset += this_length;
				908	length -= this_length;
				909	}
				910
				911	return 0;
				912	}
				913
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	914	/*
				915	* Pins the specified object's pages and synchronizes the object with
				916	* GPU accesses. Sets needs_clflush to non-zero if the caller should
				917	* flush the object from the CPU cache.
				918	*/
				919	int i915_gem_obj_prepare_shmem_read(struct drm_i915_gem_object *obj,
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	920	unsigned int *needs_clflush)
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	921	{
				922	int ret;
				923
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	924	lockdep_assert_held(&obj->base.dev->struct_mutex);
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	925
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	926	*needs_clflush = 0;
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	927	if (!i915_gem_object_has_struct_page(obj))
				928	return -ENODEV;
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	929
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	930	ret = i915_gem_object_wait(obj,
				931	I915_WAIT_INTERRUPTIBLE \|
				932	I915_WAIT_LOCKED,
				933	MAX_SCHEDULE_TIMEOUT,
				934	NULL);
Chris Wilson	c13d87e	2016-07-20 09:21:15 +0100	[diff] [blame]	935	if (ret)
				936	return ret;
				937
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	938	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	939	if (ret)
				940	return ret;
				941
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	942	if (obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_READ \|\|
				943	!static_cpu_has(X86_FEATURE_CLFLUSH)) {
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	944	ret = i915_gem_object_set_to_cpu_domain(obj, false);
				945	if (ret)
				946	goto err_unpin;
				947	else
				948	goto out;
				949	}
				950
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	951	flush_write_domain(obj, ~I915_GEM_DOMAIN_CPU);
Chris Wilson	a314d5c	2016-08-18 17:16:48 +0100	[diff] [blame]	952
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	953	/* If we're not in the cpu read domain, set ourself into the gtt
				954	* read domain and manually flush cachelines (if required). This
				955	* optimizes for the case when the gpu will dirty the data
				956	* anyway again before the next pread happens.
				957	*/
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	958	if (!obj->cache_dirty &&
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	959	!(obj->read_domains & I915_GEM_DOMAIN_CPU))
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	960	*needs_clflush = CLFLUSH_BEFORE;
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	961
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	962	out:
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	963	/* return with the pages pinned */
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	964	return 0;
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	965
				966	err_unpin:
				967	i915_gem_object_unpin_pages(obj);
				968	return ret;
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	969	}
				970
				971	int i915_gem_obj_prepare_shmem_write(struct drm_i915_gem_object *obj,
				972	unsigned int *needs_clflush)
				973	{
				974	int ret;
				975
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	976	lockdep_assert_held(&obj->base.dev->struct_mutex);
				977
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	978	*needs_clflush = 0;
				979	if (!i915_gem_object_has_struct_page(obj))
				980	return -ENODEV;
				981
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	982	ret = i915_gem_object_wait(obj,
				983	I915_WAIT_INTERRUPTIBLE \|
				984	I915_WAIT_LOCKED \|
				985	I915_WAIT_ALL,
				986	MAX_SCHEDULE_TIMEOUT,
				987	NULL);
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	988	if (ret)
				989	return ret;
				990
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	991	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	992	if (ret)
				993	return ret;
				994
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	995	if (obj->cache_coherent & I915_BO_CACHE_COHERENT_FOR_WRITE \|\|
				996	!static_cpu_has(X86_FEATURE_CLFLUSH)) {
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	997	ret = i915_gem_object_set_to_cpu_domain(obj, true);
				998	if (ret)
				999	goto err_unpin;
				1000	else
				1001	goto out;
				1002	}
				1003
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	1004	flush_write_domain(obj, ~I915_GEM_DOMAIN_CPU);
Chris Wilson	a314d5c	2016-08-18 17:16:48 +0100	[diff] [blame]	1005
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1006	/* If we're not in the cpu write domain, set ourself into the
				1007	* gtt write domain and manually flush cachelines (as required).
				1008	* This optimizes for the case when the gpu will use the data
				1009	* right away and we therefore have to clflush anyway.
				1010	*/
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	1011	if (!obj->cache_dirty) {
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	1012	*needs_clflush \|= CLFLUSH_AFTER;
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1013
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	1014	/*
				1015	* Same trick applies to invalidate partially written
				1016	* cachelines read before writing.
				1017	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	1018	if (!(obj->read_domains & I915_GEM_DOMAIN_CPU))
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	1019	*needs_clflush \|= CLFLUSH_BEFORE;
				1020	}
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1021
Chris Wilson	7f5f95d	2017-03-10 00:09:42 +0000	[diff] [blame]	1022	out:
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1023	intel_fb_obj_invalidate(obj, ORIGIN_CPU);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	1024	obj->mm.dirty = true;
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	1025	/* return with the pages pinned */
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1026	return 0;
Chris Wilson	9764951	2016-08-18 17:16:50 +0100	[diff] [blame]	1027
				1028	err_unpin:
				1029	i915_gem_object_unpin_pages(obj);
				1030	return ret;
Brad Volkin	4c914c0	2014-02-18 10:15:45 -0800	[diff] [blame]	1031	}
				1032
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	1033	static void
				1034	shmem_clflush_swizzled_range(char *addr, unsigned long length,
				1035	bool swizzled)
				1036	{
Daniel Vetter	e7e58eb	2012-03-25 19:47:43 +0200	[diff] [blame]	1037	if (unlikely(swizzled)) {
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	1038	unsigned long start = (unsigned long) addr;
				1039	unsigned long end = (unsigned long) addr + length;
				1040
				1041	/* For swizzling simply ensure that we always flush both
				1042	* channels. Lame, but simple and it works. Swizzled
				1043	* pwrite/pread is far from a hotpath - current userspace
				1044	* doesn't use it at all. */
				1045	start = round_down(start, 128);
				1046	end = round_up(end, 128);
				1047
				1048	drm_clflush_virt_range((void *)start, end - start);
				1049	} else {
				1050	drm_clflush_virt_range(addr, length);
				1051	}
				1052
				1053	}
				1054
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1055	/* Only difference to the fast-path function is that this can handle bit17
				1056	* and uses non-atomic copy and kmap functions. */
				1057	static int
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1058	shmem_pread_slow(struct page *page, int offset, int length,
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1059	char __user *user_data,
				1060	bool page_do_bit17_swizzling, bool needs_clflush)
				1061	{
				1062	char *vaddr;
				1063	int ret;
				1064
				1065	vaddr = kmap(page);
				1066	if (needs_clflush)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1067	shmem_clflush_swizzled_range(vaddr + offset, length,
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	1068	page_do_bit17_swizzling);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1069
				1070	if (page_do_bit17_swizzling)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1071	ret = __copy_to_user_swizzled(user_data, vaddr, offset, length);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1072	else
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1073	ret = __copy_to_user(user_data, vaddr + offset, length);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1074	kunmap(page);
				1075
Chris Wilson	f60d7f0	2012-09-04 21:02:56 +0100	[diff] [blame]	1076	return ret ? - EFAULT : 0;
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1077	}
				1078
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1079	static int
				1080	shmem_pread(struct page page, int offset, int length, char __user user_data,
				1081	bool page_do_bit17_swizzling, bool needs_clflush)
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1082	{
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1083	int ret;
				1084
				1085	ret = -ENODEV;
				1086	if (!page_do_bit17_swizzling) {
				1087	char *vaddr = kmap_atomic(page);
				1088
				1089	if (needs_clflush)
				1090	drm_clflush_virt_range(vaddr + offset, length);
				1091	ret = __copy_to_user_inatomic(user_data, vaddr + offset, length);
				1092	kunmap_atomic(vaddr);
				1093	}
				1094	if (ret == 0)
				1095	return 0;
				1096
				1097	return shmem_pread_slow(page, offset, length, user_data,
				1098	page_do_bit17_swizzling, needs_clflush);
				1099	}
				1100
				1101	static int
				1102	i915_gem_shmem_pread(struct drm_i915_gem_object *obj,
				1103	struct drm_i915_gem_pread *args)
				1104	{
				1105	char __user *user_data;
				1106	u64 remain;
				1107	unsigned int obj_do_bit17_swizzling;
				1108	unsigned int needs_clflush;
				1109	unsigned int idx, offset;
				1110	int ret;
				1111
				1112	obj_do_bit17_swizzling = 0;
				1113	if (i915_gem_object_needs_bit17_swizzle(obj))
				1114	obj_do_bit17_swizzling = BIT(17);
				1115
				1116	ret = mutex_lock_interruptible(&obj->base.dev->struct_mutex);
				1117	if (ret)
				1118	return ret;
				1119
				1120	ret = i915_gem_obj_prepare_shmem_read(obj, &needs_clflush);
				1121	mutex_unlock(&obj->base.dev->struct_mutex);
				1122	if (ret)
				1123	return ret;
				1124
				1125	remain = args->size;
				1126	user_data = u64_to_user_ptr(args->data_ptr);
				1127	offset = offset_in_page(args->offset);
				1128	for (idx = args->offset >> PAGE_SHIFT; remain; idx++) {
				1129	struct page *page = i915_gem_object_get_page(obj, idx);
				1130	int length;
				1131
				1132	length = remain;
				1133	if (offset + length > PAGE_SIZE)
				1134	length = PAGE_SIZE - offset;
				1135
				1136	ret = shmem_pread(page, offset, length, user_data,
				1137	page_to_phys(page) & obj_do_bit17_swizzling,
				1138	needs_clflush);
				1139	if (ret)
				1140	break;
				1141
				1142	remain -= length;
				1143	user_data += length;
				1144	offset = 0;
				1145	}
				1146
				1147	i915_gem_obj_finish_shmem_access(obj);
				1148	return ret;
				1149	}
				1150
				1151	static inline bool
				1152	gtt_user_read(struct io_mapping *mapping,
				1153	loff_t base, int offset,
				1154	char __user *user_data, int length)
				1155	{
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1156	void __iomem *vaddr;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1157	unsigned long unwritten;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1158
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1159	/* We can use the cpu mem copy function because this is X86. */
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1160	vaddr = io_mapping_map_atomic_wc(mapping, base);
				1161	unwritten = __copy_to_user_inatomic(user_data,
				1162	(void __force *)vaddr + offset,
				1163	length);
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1164	io_mapping_unmap_atomic(vaddr);
				1165	if (unwritten) {
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1166	vaddr = io_mapping_map_wc(mapping, base, PAGE_SIZE);
				1167	unwritten = copy_to_user(user_data,
				1168	(void __force *)vaddr + offset,
				1169	length);
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1170	io_mapping_unmap(vaddr);
				1171	}
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1172	return unwritten;
				1173	}
				1174
				1175	static int
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1176	i915_gem_gtt_pread(struct drm_i915_gem_object *obj,
				1177	const struct drm_i915_gem_pread *args)
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1178	{
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1179	struct drm_i915_private *i915 = to_i915(obj->base.dev);
				1180	struct i915_ggtt *ggtt = &i915->ggtt;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1181	struct drm_mm_node node;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1182	struct i915_vma *vma;
				1183	void __user *user_data;
				1184	u64 remain, offset;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1185	int ret;
				1186
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1187	ret = mutex_lock_interruptible(&i915->drm.struct_mutex);
				1188	if (ret)
				1189	return ret;
				1190
				1191	intel_runtime_pm_get(i915);
				1192	vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0,
Chris Wilson	a3259ca	2017-10-09 09:44:00 +0100	[diff] [blame]	1193	PIN_MAPPABLE \|
				1194	PIN_NONFAULT \|
				1195	PIN_NONBLOCK);
Chris Wilson	1803458	2016-08-18 17:16:45 +0100	[diff] [blame]	1196	if (!IS_ERR(vma)) {
				1197	node.start = i915_ggtt_offset(vma);
				1198	node.allocated = false;
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	1199	ret = i915_vma_put_fence(vma);
Chris Wilson	1803458	2016-08-18 17:16:45 +0100	[diff] [blame]	1200	if (ret) {
				1201	i915_vma_unpin(vma);
				1202	vma = ERR_PTR(ret);
				1203	}
				1204	}
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1205	if (IS_ERR(vma)) {
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1206	ret = insert_mappable_node(ggtt, &node, PAGE_SIZE);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1207	if (ret)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1208	goto out_unlock;
				1209	GEM_BUG_ON(!node.allocated);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1210	}
				1211
				1212	ret = i915_gem_object_set_to_gtt_domain(obj, false);
				1213	if (ret)
				1214	goto out_unpin;
				1215
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1216	mutex_unlock(&i915->drm.struct_mutex);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1217
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1218	user_data = u64_to_user_ptr(args->data_ptr);
				1219	remain = args->size;
				1220	offset = args->offset;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1221
				1222	while (remain > 0) {
				1223	/* Operation in this page
				1224	*
				1225	* page_base = page offset within aperture
				1226	* page_offset = offset within page
				1227	* page_length = bytes to copy for this page
				1228	*/
				1229	u32 page_base = node.start;
				1230	unsigned page_offset = offset_in_page(offset);
				1231	unsigned page_length = PAGE_SIZE - page_offset;
				1232	page_length = remain < page_length ? remain : page_length;
				1233	if (node.allocated) {
				1234	wmb();
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	1235	ggtt->vm.insert_page(&ggtt->vm,
				1236	i915_gem_object_get_dma_address(obj, offset >> PAGE_SHIFT),
				1237	node.start, I915_CACHE_NONE, 0);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1238	wmb();
				1239	} else {
				1240	page_base += offset & PAGE_MASK;
				1241	}
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1242
Matthew Auld	73ebd50	2017-12-11 15:18:20 +0000	[diff] [blame]	1243	if (gtt_user_read(&ggtt->iomap, page_base, page_offset,
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1244	user_data, page_length)) {
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1245	ret = -EFAULT;
				1246	break;
				1247	}
				1248
				1249	remain -= page_length;
				1250	user_data += page_length;
				1251	offset += page_length;
				1252	}
				1253
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1254	mutex_lock(&i915->drm.struct_mutex);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1255	out_unpin:
				1256	if (node.allocated) {
				1257	wmb();
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	1258	ggtt->vm.clear_range(&ggtt->vm, node.start, node.size);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1259	remove_mappable_node(&node);
				1260	} else {
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1261	i915_vma_unpin(vma);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1262	}
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1263	out_unlock:
				1264	intel_runtime_pm_put(i915);
				1265	mutex_unlock(&i915->drm.struct_mutex);
Chris Wilson	f60d7f0	2012-09-04 21:02:56 +0100	[diff] [blame]	1266
Eric Anholt	eb01459	2009-03-10 11:44:52 -0700	[diff] [blame]	1267	return ret;
				1268	}
				1269
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1270	/**
				1271	* Reads data from the object referenced by handle.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1272	* @dev: drm device pointer
				1273	* @data: ioctl data blob
				1274	* @file: drm file pointer
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1275	*
				1276	* On error, the contents of *data are undefined.
				1277	*/
				1278	int
				1279	i915_gem_pread_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1280	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1281	{
				1282	struct drm_i915_gem_pread *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1283	struct drm_i915_gem_object *obj;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1284	int ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1285
Chris Wilson	51311d0	2010-11-17 09:10:42 +0000	[diff] [blame]	1286	if (args->size == 0)
				1287	return 0;
				1288
				1289	if (!access_ok(VERIFY_WRITE,
Gustavo Padovan	3ed605b	2016-04-26 12:32:27 -0300	[diff] [blame]	1290	u64_to_user_ptr(args->data_ptr),
Chris Wilson	51311d0	2010-11-17 09:10:42 +0000	[diff] [blame]	1291	args->size))
				1292	return -EFAULT;
				1293
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1294	obj = i915_gem_object_lookup(file, args->handle);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1295	if (!obj)
				1296	return -ENOENT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1297
Chris Wilson	7dcd249	2010-09-26 20:21:44 +0100	[diff] [blame]	1298	/* Bounds check source. */
Matthew Auld	966d5bf	2016-12-13 20:32:22 +0000	[diff] [blame]	1299	if (range_overflows_t(u64, args->offset, args->size, obj->base.size)) {
Chris Wilson	ce9d419	2010-09-26 20:50:05 +0100	[diff] [blame]	1300	ret = -EINVAL;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1301	goto out;
Chris Wilson	ce9d419	2010-09-26 20:50:05 +0100	[diff] [blame]	1302	}
				1303
Chris Wilson	db53a30	2011-02-03 11:57:46 +0000	[diff] [blame]	1304	trace_i915_gem_object_pread(obj, args->offset, args->size);
				1305
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	1306	ret = i915_gem_object_wait(obj,
				1307	I915_WAIT_INTERRUPTIBLE,
				1308	MAX_SCHEDULE_TIMEOUT,
				1309	to_rps_client(file));
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1310	if (ret)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1311	goto out;
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1312
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1313	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1314	if (ret)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1315	goto out;
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1316
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1317	ret = i915_gem_shmem_pread(obj, args);
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	1318	if (ret == -EFAULT \|\| ret == -ENODEV)
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1319	ret = i915_gem_gtt_pread(obj, args);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1320
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1321	i915_gem_object_unpin_pages(obj);
				1322	out:
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1323	i915_gem_object_put(obj);
Eric Anholt	eb01459	2009-03-10 11:44:52 -0700	[diff] [blame]	1324	return ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1325	}
				1326
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1327	/* This is the fast write path which cannot handle
				1328	* page faults in the source data
Linus Torvalds	9b7530cc	2008-10-20 14:16:43 -0700	[diff] [blame]	1329	*/
Linus Torvalds	9b7530cc	2008-10-20 14:16:43 -0700	[diff] [blame]	1330
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1331	static inline bool
				1332	ggtt_write(struct io_mapping *mapping,
				1333	loff_t base, int offset,
				1334	char __user *user_data, int length)
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1335	{
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1336	void __iomem *vaddr;
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1337	unsigned long unwritten;
				1338
Ben Widawsky	4f0c7cf	2012-04-16 14:07:47 -0700	[diff] [blame]	1339	/* We can use the cpu mem copy function because this is X86. */
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1340	vaddr = io_mapping_map_atomic_wc(mapping, base);
				1341	unwritten = __copy_from_user_inatomic_nocache((void __force *)vaddr + offset,
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1342	user_data, length);
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1343	io_mapping_unmap_atomic(vaddr);
				1344	if (unwritten) {
Ville Syrjälä	afe722b	2017-09-01 20:12:52 +0300	[diff] [blame]	1345	vaddr = io_mapping_map_wc(mapping, base, PAGE_SIZE);
				1346	unwritten = copy_from_user((void __force *)vaddr + offset,
				1347	user_data, length);
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1348	io_mapping_unmap(vaddr);
				1349	}
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1350
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1351	return unwritten;
				1352	}
				1353
Eric Anholt	3de09aa	2009-03-09 09:42:23 -0700	[diff] [blame]	1354	/**
				1355	* This is the fast pwrite path, where we copy the data directly from the
				1356	* user into the GTT, uncached.
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1357	* @obj: i915 GEM object
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1358	* @args: pwrite arguments structure
Eric Anholt	3de09aa	2009-03-09 09:42:23 -0700	[diff] [blame]	1359	*/
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1360	static int
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1361	i915_gem_gtt_pwrite_fast(struct drm_i915_gem_object *obj,
				1362	const struct drm_i915_gem_pwrite *args)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1363	{
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1364	struct drm_i915_private *i915 = to_i915(obj->base.dev);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1365	struct i915_ggtt *ggtt = &i915->ggtt;
				1366	struct drm_mm_node node;
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1367	struct i915_vma *vma;
				1368	u64 remain, offset;
				1369	void __user *user_data;
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1370	int ret;
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1371
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1372	ret = mutex_lock_interruptible(&i915->drm.struct_mutex);
				1373	if (ret)
				1374	return ret;
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1375
Chris Wilson	8bd81815	2017-10-19 07:37:33 +0100	[diff] [blame]	1376	if (i915_gem_object_has_struct_page(obj)) {
				1377	/*
				1378	* Avoid waking the device up if we can fallback, as
				1379	* waking/resuming is very slow (worst-case 10-100 ms
				1380	* depending on PCI sleeps and our own resume time).
				1381	* This easily dwarfs any performance advantage from
				1382	* using the cache bypass of indirect GGTT access.
				1383	*/
				1384	if (!intel_runtime_pm_get_if_in_use(i915)) {
				1385	ret = -EFAULT;
				1386	goto out_unlock;
				1387	}
				1388	} else {
				1389	/* No backing pages, no fallback, we must force GGTT access */
				1390	intel_runtime_pm_get(i915);
				1391	}
				1392
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1393	vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0,
Chris Wilson	a3259ca	2017-10-09 09:44:00 +0100	[diff] [blame]	1394	PIN_MAPPABLE \|
				1395	PIN_NONFAULT \|
				1396	PIN_NONBLOCK);
Chris Wilson	1803458	2016-08-18 17:16:45 +0100	[diff] [blame]	1397	if (!IS_ERR(vma)) {
				1398	node.start = i915_ggtt_offset(vma);
				1399	node.allocated = false;
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	1400	ret = i915_vma_put_fence(vma);
Chris Wilson	1803458	2016-08-18 17:16:45 +0100	[diff] [blame]	1401	if (ret) {
				1402	i915_vma_unpin(vma);
				1403	vma = ERR_PTR(ret);
				1404	}
				1405	}
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1406	if (IS_ERR(vma)) {
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1407	ret = insert_mappable_node(ggtt, &node, PAGE_SIZE);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1408	if (ret)
Chris Wilson	8bd81815	2017-10-19 07:37:33 +0100	[diff] [blame]	1409	goto out_rpm;
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1410	GEM_BUG_ON(!node.allocated);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1411	}
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1412
				1413	ret = i915_gem_object_set_to_gtt_domain(obj, true);
				1414	if (ret)
				1415	goto out_unpin;
				1416
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1417	mutex_unlock(&i915->drm.struct_mutex);
				1418
Chris Wilson	b19482d	2016-08-18 17:16:43 +0100	[diff] [blame]	1419	intel_fb_obj_invalidate(obj, ORIGIN_CPU);
Paulo Zanoni	063e4e6	2015-02-13 17:23:45 -0200	[diff] [blame]	1420
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1421	user_data = u64_to_user_ptr(args->data_ptr);
				1422	offset = args->offset;
				1423	remain = args->size;
				1424	while (remain) {
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1425	/* Operation in this page
				1426	*
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1427	* page_base = page offset within aperture
				1428	* page_offset = offset within page
				1429	* page_length = bytes to copy for this page
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1430	*/
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1431	u32 page_base = node.start;
Chris Wilson	bb6dc8d	2016-10-28 13:58:39 +0100	[diff] [blame]	1432	unsigned int page_offset = offset_in_page(offset);
				1433	unsigned int page_length = PAGE_SIZE - page_offset;
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1434	page_length = remain < page_length ? remain : page_length;
				1435	if (node.allocated) {
				1436	wmb(); /* flush the write before we modify the GGTT */
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	1437	ggtt->vm.insert_page(&ggtt->vm,
				1438	i915_gem_object_get_dma_address(obj, offset >> PAGE_SHIFT),
				1439	node.start, I915_CACHE_NONE, 0);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1440	wmb(); /* flush modifications to the GGTT (insert_page) */
				1441	} else {
				1442	page_base += offset & PAGE_MASK;
				1443	}
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1444	/* If we get a fault while copying data, then (presumably) our
Eric Anholt	3de09aa	2009-03-09 09:42:23 -0700	[diff] [blame]	1445	* source page isn't available. Return the error and we'll
				1446	* retry in the slow path.
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1447	* If the object is non-shmem backed, we retry again with the
				1448	* path that handles page fault.
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1449	*/
Matthew Auld	73ebd50	2017-12-11 15:18:20 +0000	[diff] [blame]	1450	if (ggtt_write(&ggtt->iomap, page_base, page_offset,
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1451	user_data, page_length)) {
				1452	ret = -EFAULT;
				1453	break;
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1454	}
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1455
Keith Packard	0839ccb	2008-10-30 19:38:48 -0700	[diff] [blame]	1456	remain -= page_length;
				1457	user_data += page_length;
				1458	offset += page_length;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1459	}
Chris Wilson	d59b21e	2017-02-22 11:40:49 +0000	[diff] [blame]	1460	intel_fb_obj_flush(obj, ORIGIN_CPU);
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1461
				1462	mutex_lock(&i915->drm.struct_mutex);
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1463	out_unpin:
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1464	if (node.allocated) {
				1465	wmb();
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	1466	ggtt->vm.clear_range(&ggtt->vm, node.start, node.size);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1467	remove_mappable_node(&node);
				1468	} else {
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	1469	i915_vma_unpin(vma);
Ankitprasad Sharma	4f1959e	2016-06-10 14:23:01 +0530	[diff] [blame]	1470	}
Chris Wilson	8bd81815	2017-10-19 07:37:33 +0100	[diff] [blame]	1471	out_rpm:
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	1472	intel_runtime_pm_put(i915);
Chris Wilson	8bd81815	2017-10-19 07:37:33 +0100	[diff] [blame]	1473	out_unlock:
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1474	mutex_unlock(&i915->drm.struct_mutex);
Eric Anholt	3de09aa	2009-03-09 09:42:23 -0700	[diff] [blame]	1475	return ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1476	}
				1477
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1478	static int
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1479	shmem_pwrite_slow(struct page *page, int offset, int length,
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1480	char __user *user_data,
				1481	bool page_do_bit17_swizzling,
				1482	bool needs_clflush_before,
				1483	bool needs_clflush_after)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1484	{
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1485	char *vaddr;
				1486	int ret;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1487
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1488	vaddr = kmap(page);
Daniel Vetter	e7e58eb	2012-03-25 19:47:43 +0200	[diff] [blame]	1489	if (unlikely(needs_clflush_before \|\| page_do_bit17_swizzling))
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1490	shmem_clflush_swizzled_range(vaddr + offset, length,
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	1491	page_do_bit17_swizzling);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1492	if (page_do_bit17_swizzling)
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1493	ret = __copy_from_user_swizzled(vaddr, offset, user_data,
				1494	length);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1495	else
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1496	ret = __copy_from_user(vaddr + offset, user_data, length);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1497	if (needs_clflush_after)
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1498	shmem_clflush_swizzled_range(vaddr + offset, length,
Daniel Vetter	23c18c7	2012-03-25 19:47:42 +0200	[diff] [blame]	1499	page_do_bit17_swizzling);
Daniel Vetter	d174bd6	2012-03-25 19:47:40 +0200	[diff] [blame]	1500	kunmap(page);
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	1501
Chris Wilson	755d221	2012-09-04 21:02:55 +0100	[diff] [blame]	1502	return ret ? -EFAULT : 0;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1503	}
				1504
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1505	/* Per-page copy function for the shmem pwrite fastpath.
				1506	* Flushes invalid cachelines before writing to the target if
				1507	* needs_clflush_before is set and flushes out any written cachelines after
				1508	* writing if needs_clflush is set.
				1509	*/
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1510	static int
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1511	shmem_pwrite(struct page page, int offset, int len, char __user user_data,
				1512	bool page_do_bit17_swizzling,
				1513	bool needs_clflush_before,
				1514	bool needs_clflush_after)
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1515	{
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1516	int ret;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1517
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1518	ret = -ENODEV;
				1519	if (!page_do_bit17_swizzling) {
				1520	char *vaddr = kmap_atomic(page);
				1521
				1522	if (needs_clflush_before)
				1523	drm_clflush_virt_range(vaddr + offset, len);
				1524	ret = __copy_from_user_inatomic(vaddr + offset, user_data, len);
				1525	if (needs_clflush_after)
				1526	drm_clflush_virt_range(vaddr + offset, len);
				1527
				1528	kunmap_atomic(vaddr);
				1529	}
				1530	if (ret == 0)
				1531	return ret;
				1532
				1533	return shmem_pwrite_slow(page, offset, len, user_data,
				1534	page_do_bit17_swizzling,
				1535	needs_clflush_before,
				1536	needs_clflush_after);
				1537	}
				1538
				1539	static int
				1540	i915_gem_shmem_pwrite(struct drm_i915_gem_object *obj,
				1541	const struct drm_i915_gem_pwrite *args)
				1542	{
				1543	struct drm_i915_private *i915 = to_i915(obj->base.dev);
				1544	void __user *user_data;
				1545	u64 remain;
				1546	unsigned int obj_do_bit17_swizzling;
				1547	unsigned int partial_cacheline_write;
				1548	unsigned int needs_clflush;
				1549	unsigned int offset, idx;
				1550	int ret;
				1551
				1552	ret = mutex_lock_interruptible(&i915->drm.struct_mutex);
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1553	if (ret)
				1554	return ret;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1555
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1556	ret = i915_gem_obj_prepare_shmem_write(obj, &needs_clflush);
				1557	mutex_unlock(&i915->drm.struct_mutex);
				1558	if (ret)
				1559	return ret;
				1560
				1561	obj_do_bit17_swizzling = 0;
				1562	if (i915_gem_object_needs_bit17_swizzle(obj))
				1563	obj_do_bit17_swizzling = BIT(17);
				1564
				1565	/* If we don't overwrite a cacheline completely we need to be
				1566	* careful to have up-to-date data by first clflushing. Don't
				1567	* overcomplicate things and flush the entire patch.
				1568	*/
				1569	partial_cacheline_write = 0;
				1570	if (needs_clflush & CLFLUSH_BEFORE)
				1571	partial_cacheline_write = boot_cpu_data.x86_clflush_size - 1;
				1572
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1573	user_data = u64_to_user_ptr(args->data_ptr);
Chris Wilson	43394c7	2016-08-18 17:16:47 +0100	[diff] [blame]	1574	remain = args->size;
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1575	offset = offset_in_page(args->offset);
				1576	for (idx = args->offset >> PAGE_SHIFT; remain; idx++) {
				1577	struct page *page = i915_gem_object_get_page(obj, idx);
				1578	int length;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1579
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1580	length = remain;
				1581	if (offset + length > PAGE_SIZE)
				1582	length = PAGE_SIZE - offset;
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	1583
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1584	ret = shmem_pwrite(page, offset, length, user_data,
				1585	page_to_phys(page) & obj_do_bit17_swizzling,
				1586	(offset \| length) & partial_cacheline_write,
				1587	needs_clflush & CLFLUSH_AFTER);
				1588	if (ret)
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	1589	break;
				1590
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1591	remain -= length;
				1592	user_data += length;
				1593	offset = 0;
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1594	}
				1595
Chris Wilson	d59b21e	2017-02-22 11:40:49 +0000	[diff] [blame]	1596	intel_fb_obj_flush(obj, ORIGIN_CPU);
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1597	i915_gem_obj_finish_shmem_access(obj);
Eric Anholt	40123c1	2009-03-09 13:42:30 -0700	[diff] [blame]	1598	return ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1599	}
				1600
				1601	/**
				1602	* Writes data to the object referenced by handle.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1603	* @dev: drm device
				1604	* @data: ioctl data blob
				1605	* @file: drm file
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1606	*
				1607	* On error, the contents of the buffer that were to be modified are undefined.
				1608	*/
				1609	int
				1610	i915_gem_pwrite_ioctl(struct drm_device dev, void data,
Chris Wilson	fbd5a26	2010-10-14 15:03:58 +0100	[diff] [blame]	1611	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1612	{
				1613	struct drm_i915_gem_pwrite *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1614	struct drm_i915_gem_object *obj;
Chris Wilson	51311d0	2010-11-17 09:10:42 +0000	[diff] [blame]	1615	int ret;
				1616
				1617	if (args->size == 0)
				1618	return 0;
				1619
				1620	if (!access_ok(VERIFY_READ,
Gustavo Padovan	3ed605b	2016-04-26 12:32:27 -0300	[diff] [blame]	1621	u64_to_user_ptr(args->data_ptr),
Chris Wilson	51311d0	2010-11-17 09:10:42 +0000	[diff] [blame]	1622	args->size))
				1623	return -EFAULT;
				1624
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1625	obj = i915_gem_object_lookup(file, args->handle);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1626	if (!obj)
				1627	return -ENOENT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1628
Chris Wilson	7dcd249	2010-09-26 20:21:44 +0100	[diff] [blame]	1629	/* Bounds check destination. */
Matthew Auld	966d5bf	2016-12-13 20:32:22 +0000	[diff] [blame]	1630	if (range_overflows_t(u64, args->offset, args->size, obj->base.size)) {
Chris Wilson	ce9d419	2010-09-26 20:50:05 +0100	[diff] [blame]	1631	ret = -EINVAL;
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1632	goto err;
Chris Wilson	ce9d419	2010-09-26 20:50:05 +0100	[diff] [blame]	1633	}
				1634
Chris Wilson	f8c1cce	2018-07-12 19:53:14 +0100	[diff] [blame]	1635	/* Writes not allowed into this read-only object */
				1636	if (i915_gem_object_is_readonly(obj)) {
				1637	ret = -EINVAL;
				1638	goto err;
				1639	}
				1640
Chris Wilson	db53a30	2011-02-03 11:57:46 +0000	[diff] [blame]	1641	trace_i915_gem_object_pwrite(obj, args->offset, args->size);
				1642
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	1643	ret = -ENODEV;
				1644	if (obj->ops->pwrite)
				1645	ret = obj->ops->pwrite(obj, args);
				1646	if (ret != -ENODEV)
				1647	goto err;
				1648
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	1649	ret = i915_gem_object_wait(obj,
				1650	I915_WAIT_INTERRUPTIBLE \|
				1651	I915_WAIT_ALL,
				1652	MAX_SCHEDULE_TIMEOUT,
				1653	to_rps_client(file));
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1654	if (ret)
				1655	goto err;
				1656
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1657	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1658	if (ret)
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1659	goto err;
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1660
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1661	ret = -EFAULT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1662	/* We can only do the GTT pwrite on untiled buffers, as otherwise
				1663	* it would end up going through the fenced access, and we'll get
				1664	* different detiling behavior between reading and writing.
				1665	* pread/pwrite currently are reading and writing from the CPU
				1666	* perspective, requiring manual detiling by the client.
				1667	*/
Chris Wilson	6eae005	2016-06-20 15:05:52 +0100	[diff] [blame]	1668	if (!i915_gem_object_has_struct_page(obj) \|\|
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	1669	cpu_write_needs_clflush(obj))
Daniel Vetter	935aaa6	2012-03-25 19:47:35 +0200	[diff] [blame]	1670	/* Note that the gtt paths might fail with non-page-backed user
				1671	* pointers (e.g. gtt mappings when moving data between
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	1672	* textures). Fallback to the shmem path in that case.
				1673	*/
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1674	ret = i915_gem_gtt_pwrite_fast(obj, args);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1675
Chris Wilson	d1054ee	2016-07-16 18:42:36 +0100	[diff] [blame]	1676	if (ret == -EFAULT \|\| ret == -ENOSPC) {
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	1677	if (obj->phys_handle)
				1678	ret = i915_gem_phys_pwrite(obj, args, file);
Ankitprasad Sharma	b50a537	2016-06-10 14:23:03 +0530	[diff] [blame]	1679	else
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1680	ret = i915_gem_shmem_pwrite(obj, args);
Chris Wilson	6a2c423	2014-11-04 04:51:40 -0800	[diff] [blame]	1681	}
Daniel Vetter	5c0480f	2011-12-14 13:57:30 +0100	[diff] [blame]	1682
Chris Wilson	fe11562	2016-10-28 13:58:40 +0100	[diff] [blame]	1683	i915_gem_object_unpin_pages(obj);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1684	err:
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1685	i915_gem_object_put(obj);
Chris Wilson	258a5ed	2016-08-05 10:14:16 +0100	[diff] [blame]	1686	return ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1687	}
				1688
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1689	static void i915_gem_object_bump_inactive_ggtt(struct drm_i915_gem_object *obj)
				1690	{
				1691	struct drm_i915_private *i915;
				1692	struct list_head *list;
				1693	struct i915_vma *vma;
				1694
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	1695	GEM_BUG_ON(!i915_gem_object_has_pinned_pages(obj));
				1696
Chris Wilson	e2189dd	2017-12-07 21:14:07 +0000	[diff] [blame]	1697	for_each_ggtt_vma(vma, obj) {
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1698	if (i915_vma_is_active(vma))
				1699	continue;
				1700
				1701	if (!drm_mm_node_allocated(&vma->node))
				1702	continue;
				1703
				1704	list_move_tail(&vma->vm_link, &vma->vm->inactive_list);
				1705	}
				1706
				1707	i915 = to_i915(obj->base.dev);
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	1708	spin_lock(&i915->mm.obj_lock);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1709	list = obj->bind_count ? &i915->mm.bound_list : &i915->mm.unbound_list;
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	1710	list_move_tail(&obj->mm.link, list);
				1711	spin_unlock(&i915->mm.obj_lock);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1712	}
				1713
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1714	/**
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1715	* Called when user space prepares to use an object with the CPU, either
				1716	* through the mmap ioctl's mapping or a GTT mapping.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1717	* @dev: drm device
				1718	* @data: ioctl data blob
				1719	* @file: drm file
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1720	*/
				1721	int
				1722	i915_gem_set_domain_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1723	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1724	{
				1725	struct drm_i915_gem_set_domain *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1726	struct drm_i915_gem_object *obj;
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1727	uint32_t read_domains = args->read_domains;
				1728	uint32_t write_domain = args->write_domain;
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1729	int err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1730
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1731	/* Only handle setting domains to types used by the CPU. */
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1732	if ((write_domain \| read_domains) & I915_GEM_GPU_DOMAINS)
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1733	return -EINVAL;
				1734
				1735	/* Having something in the write domain implies it's in the read
				1736	* domain, and only that read domain. Enforce that in the request.
				1737	*/
				1738	if (write_domain != 0 && read_domains != write_domain)
				1739	return -EINVAL;
				1740
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1741	obj = i915_gem_object_lookup(file, args->handle);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1742	if (!obj)
				1743	return -ENOENT;
Jesse Barnes	652c393	2009-08-17 13:31:43 -0700	[diff] [blame]	1744
Chris Wilson	3236f57	2012-08-24 09:35:09 +0100	[diff] [blame]	1745	/* Try to flush the object off the GPU without holding the lock.
				1746	* We will repeat the flush holding the lock in the normal manner
				1747	* to catch cases where we are gazumped.
				1748	*/
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1749	err = i915_gem_object_wait(obj,
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	1750	I915_WAIT_INTERRUPTIBLE \|
Chris Wilson	e9eaf82	2018-10-01 15:47:55 +0100	[diff] [blame^]	1751	I915_WAIT_PRIORITY \|
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	1752	(write_domain ? I915_WAIT_ALL : 0),
				1753	MAX_SCHEDULE_TIMEOUT,
				1754	to_rps_client(file));
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1755	if (err)
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1756	goto out;
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	1757
Tina Zhang	a03f395	2017-11-14 10:25:13 +0000	[diff] [blame]	1758	/*
				1759	* Proxy objects do not control access to the backing storage, ergo
				1760	* they cannot be used as a means to manipulate the cache domain
				1761	* tracking for that backing storage. The proxy object is always
				1762	* considered to be outside of any cache domain.
				1763	*/
				1764	if (i915_gem_object_is_proxy(obj)) {
				1765	err = -ENXIO;
				1766	goto out;
				1767	}
				1768
				1769	/*
				1770	* Flush and acquire obj->pages so that we are coherent through
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1771	* direct access in memory with previous cached writes through
				1772	* shmemfs and that our cache domain tracking remains valid.
				1773	* For example, if the obj->filp was moved to swap without us
				1774	* being notified and releasing the pages, we would mistakenly
				1775	* continue to assume that the obj remained out of the CPU cached
				1776	* domain.
				1777	*/
				1778	err = i915_gem_object_pin_pages(obj);
				1779	if (err)
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1780	goto out;
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1781
				1782	err = i915_mutex_lock_interruptible(dev);
				1783	if (err)
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1784	goto out_unpin;
Chris Wilson	3236f57	2012-08-24 09:35:09 +0100	[diff] [blame]	1785
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	1786	if (read_domains & I915_GEM_DOMAIN_WC)
				1787	err = i915_gem_object_set_to_wc_domain(obj, write_domain);
				1788	else if (read_domains & I915_GEM_DOMAIN_GTT)
				1789	err = i915_gem_object_set_to_gtt_domain(obj, write_domain);
Chris Wilson	43566de	2015-01-02 16:29:29 +0530	[diff] [blame]	1790	else
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	1791	err = i915_gem_object_set_to_cpu_domain(obj, write_domain);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1792
				1793	/* And bump the LRU for this access */
				1794	i915_gem_object_bump_inactive_ggtt(obj);
				1795
				1796	mutex_unlock(&dev->struct_mutex);
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	1797
Daniel Vetter	031b698	2015-06-26 19:35:16 +0200	[diff] [blame]	1798	if (write_domain != 0)
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	1799	intel_fb_obj_invalidate(obj,
				1800	fb_write_origin(obj, write_domain));
Daniel Vetter	031b698	2015-06-26 19:35:16 +0200	[diff] [blame]	1801
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1802	out_unpin:
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1803	i915_gem_object_unpin_pages(obj);
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1804	out:
				1805	i915_gem_object_put(obj);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	1806	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1807	}
				1808
				1809	/**
				1810	* Called when user space has done writes to this buffer
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1811	* @dev: drm device
				1812	* @data: ioctl data blob
				1813	* @file: drm file
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1814	*/
				1815	int
				1816	i915_gem_sw_finish_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1817	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1818	{
				1819	struct drm_i915_gem_sw_finish *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1820	struct drm_i915_gem_object *obj;
Chris Wilson	1d7cfea	2010-10-17 09:45:41 +0100	[diff] [blame]	1821
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1822	obj = i915_gem_object_lookup(file, args->handle);
Chris Wilson	c21724c	2016-08-05 10:14:19 +0100	[diff] [blame]	1823	if (!obj)
				1824	return -ENOENT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1825
Tina Zhang	a03f395	2017-11-14 10:25:13 +0000	[diff] [blame]	1826	/*
				1827	* Proxy objects are barred from CPU access, so there is no
				1828	* need to ban sw_finish as it is a nop.
				1829	*/
				1830
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1831	/* Pinned buffers may be scanout, so flush the cache */
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	1832	i915_gem_object_flush_if_display(obj);
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1833	i915_gem_object_put(obj);
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	1834
				1835	return 0;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1836	}
				1837
				1838	/**
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	1839	* i915_gem_mmap_ioctl - Maps the contents of an object, returning the address
				1840	* it is mapped to.
				1841	* @dev: drm device
				1842	* @data: ioctl data blob
				1843	* @file: drm file
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1844	*
				1845	* While the mapping holds a reference on the contents of the object, it doesn't
				1846	* imply a ref on the object itself.
Daniel Vetter	3436738	2014-10-16 12:28:18 +0200	[diff] [blame]	1847	*
				1848	* IMPORTANT:
				1849	*
				1850	* DRM driver writers who look a this function as an example for how to do GEM
				1851	* mmap support, please don't implement mmap support like here. The modern way
				1852	* to implement DRM mmap support is with an mmap offset ioctl (like
				1853	* i915_gem_mmap_gtt) and then using the mmap syscall on the DRM fd directly.
				1854	* That way debug tooling like valgrind will understand what's going on, hiding
				1855	* the mmap call in a driver private ioctl will break that. The i915 driver only
				1856	* does cpu mmaps this way because we didn't know better.
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1857	*/
				1858	int
				1859	i915_gem_mmap_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	1860	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1861	{
				1862	struct drm_i915_gem_mmap *args = data;
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1863	struct drm_i915_gem_object *obj;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1864	unsigned long addr;
				1865
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1866	if (args->flags & ~(I915_MMAP_WC))
				1867	return -EINVAL;
				1868
Borislav Petkov	568a58e	2016-03-29 17:42:01 +0200	[diff] [blame]	1869	if (args->flags & I915_MMAP_WC && !boot_cpu_has(X86_FEATURE_PAT))
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1870	return -ENODEV;
				1871
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1872	obj = i915_gem_object_lookup(file, args->handle);
				1873	if (!obj)
Chris Wilson	bf79cb9	2010-08-04 14:19:46 +0100	[diff] [blame]	1874	return -ENOENT;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1875
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	1876	/* prime objects have no backing filp to GEM mmap
				1877	* pages from.
				1878	*/
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1879	if (!obj->base.filp) {
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1880	i915_gem_object_put(obj);
Tina Zhang	274b246	2017-11-14 10:25:12 +0000	[diff] [blame]	1881	return -ENXIO;
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	1882	}
				1883
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	1884	addr = vm_mmap(obj->base.filp, 0, args->size,
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1885	PROT_READ \| PROT_WRITE, MAP_SHARED,
				1886	args->offset);
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1887	if (args->flags & I915_MMAP_WC) {
				1888	struct mm_struct *mm = current->mm;
				1889	struct vm_area_struct *vma;
				1890
Michal Hocko	80a89a5	2016-05-23 16:26:11 -0700	[diff] [blame]	1891	if (down_write_killable(&mm->mmap_sem)) {
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1892	i915_gem_object_put(obj);
Michal Hocko	80a89a5	2016-05-23 16:26:11 -0700	[diff] [blame]	1893	return -EINTR;
				1894	}
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1895	vma = find_vma(mm, addr);
				1896	if (vma)
				1897	vma->vm_page_prot =
				1898	pgprot_writecombine(vm_get_page_prot(vma->vm_flags));
				1899	else
				1900	addr = -ENOMEM;
				1901	up_write(&mm->mmap_sem);
Chris Wilson	aeecc96	2016-06-17 14:46:39 -0300	[diff] [blame]	1902
				1903	/* This may race, but that's ok, it only gets set */
Chris Wilson	5034924	2016-08-18 17:17:04 +0100	[diff] [blame]	1904	WRITE_ONCE(obj->frontbuffer_ggtt_origin, ORIGIN_CPU);
Akash Goel	1816f92	2015-01-02 16:29:30 +0530	[diff] [blame]	1905	}
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	1906	i915_gem_object_put(obj);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	1907	if (IS_ERR((void *)addr))
				1908	return addr;
				1909
				1910	args->addr_ptr = (uint64_t) addr;
				1911
				1912	return 0;
				1913	}
				1914
Chris Wilson	d899ace	2018-07-25 16:54:47 +0100	[diff] [blame]	1915	static unsigned int tile_row_pages(const struct drm_i915_gem_object *obj)
Chris Wilson	03af84f	2016-08-18 17:17:01 +0100	[diff] [blame]	1916	{
Chris Wilson	6649a0b	2017-01-09 16:16:08 +0000	[diff] [blame]	1917	return i915_gem_object_get_tile_row_size(obj) >> PAGE_SHIFT;
Chris Wilson	03af84f	2016-08-18 17:17:01 +0100	[diff] [blame]	1918	}
				1919
/**
 * i915_gem_mmap_gtt_version - report the current feature set for GTT mmaps
 *
 * A history of the GTT mmap interface:
 *
 * 0 - Everything had to fit into the GTT. Both parties of a memcpy had to
 *     be aligned and suitable for fencing, and still fit into the available
 *     mappable space left by the pinned display objects. A classic problem
 *     we called the page-fault-of-doom where we would ping-pong between
 *     two objects that could not fit inside the GTT and so the memcpy
 *     would page one object in at the expense of the other between every
 *     single byte.
 *
 * 1 - Objects can be any size, and have any compatible fencing (X Y, or none
 *     as set via i915_gem_set_tiling() [DRM_I915_GEM_SET_TILING]). If the
 *     object is too large for the available space (or simply too large
 *     for the mappable aperture!), a view is created instead and faulted
 *     into userspace. (This view is aligned and sized appropriately for
 *     fenced access.)
 *
 * 2 - Recognise WC as a separate cache domain so that we can flush the
 *     delayed writes via GTT before performing direct access via WC.
 *
 * Restrictions:
 *
 *  * snoopable objects cannot be accessed via the GTT. It can cause machine
 *    hangs on some architectures, corruption on others. An attempt to service
 *    a GTT page fault from a snoopable object will generate a SIGBUS.
 *
 *  * the object must be able to fit into RAM (physical memory, though not
 *    limited to the mappable aperture).
 *
 *
 * Caveats:
 *
 *  * a new GTT page fault will synchronize rendering from the GPU and flush
 *    all data to system memory. Subsequent access will not be synchronized.
 *
 *  * all mappings are revoked on runtime device suspend.
 *
 *  * there are only 8, 16 or 32 fence registers to share between all users
 *    (older machines require fence register for display and blitter access
 *    as well). Contention of the fence registers will cause the previous users
 *    to be unmapped and any new access will generate new page faults.
 *
 *  * running out of memory while servicing a fault may generate a SIGBUS,
 *    rather than the expected SIGSEGV.
 *
 * Return: the version number of the GTT mmap interface, currently 2.
 */
int i915_gem_mmap_gtt_version(void)
{
	/* Matches the newest entry in the interface history above. */
	const int version = 2;

	return version;
}
				1972
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1973	static inline struct i915_ggtt_view
Chris Wilson	d899ace	2018-07-25 16:54:47 +0100	[diff] [blame]	1974	compute_partial_view(const struct drm_i915_gem_object *obj,
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1975	pgoff_t page_offset,
				1976	unsigned int chunk)
				1977	{
				1978	struct i915_ggtt_view view;
				1979
				1980	if (i915_gem_object_is_tiled(obj))
				1981	chunk = roundup(chunk, tile_row_pages(obj));
				1982
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1983	view.type = I915_GGTT_VIEW_PARTIAL;
Chris Wilson	8bab1193	2017-01-14 00:28:25 +0000	[diff] [blame]	1984	view.partial.offset = rounddown(page_offset, chunk);
				1985	view.partial.size =
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1986	min_t(unsigned int, chunk,
Chris Wilson	8bab1193	2017-01-14 00:28:25 +0000	[diff] [blame]	1987	(obj->base.size >> PAGE_SHIFT) - view.partial.offset);
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	1988
				1989	/* If the partial covers the entire object, just create a normal VMA. */
				1990	if (chunk >= obj->base.size >> PAGE_SHIFT)
				1991	view.type = I915_GGTT_VIEW_NORMAL;
				1992
				1993	return view;
				1994	}
				1995
Chris Wilson	4cc6907	2016-08-25 19:05:19 +0100	[diff] [blame]	1996	/**
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1997	* i915_gem_fault - fault a page into the GTT
Geliang Tang	d9072a3	2015-09-15 05:58:44 -0700	[diff] [blame]	1998	* @vmf: fault info
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	1999	*
				2000	* The fault handler is set up by drm_gem_mmap() when a object is GTT mapped
				2001	* from userspace. The fault handler takes care of binding the object to
				2002	* the GTT (if needed), allocating and programming a fence register (again,
				2003	* only if needed based on whether the old reg is still valid or the object
				2004	* is tiled) and inserting a new PTE into the faulting process.
				2005	*
				2006	* Note that the faulting process may involve evicting existing objects
				2007	* from the GTT and/or fence registers to make room. So performance may
				2008	* suffer if the GTT working set is large or there are few fence registers
				2009	* left.
Chris Wilson	4cc6907	2016-08-25 19:05:19 +0100	[diff] [blame]	2010	*
				2011	* The current feature set supported by i915_gem_fault() and thus GTT mmaps
				2012	* is exposed via I915_PARAM_MMAP_GTT_VERSION (see i915_gem_mmap_gtt_version).
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2013	*/
Chris Wilson	5213701	2018-06-06 22:45:20 +0100	[diff] [blame]	2014	vm_fault_t i915_gem_fault(struct vm_fault *vmf)
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2015	{
Chris Wilson	420980c	2018-06-05 14:57:46 +0100	[diff] [blame]	2016	#define MIN_CHUNK_PAGES (SZ_1M >> PAGE_SHIFT)
Dave Jiang	11bac80	2017-02-24 14:56:41 -0800	[diff] [blame]	2017	struct vm_area_struct *area = vmf->vma;
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	2018	struct drm_i915_gem_object *obj = to_intel_bo(area->vm_private_data);
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	2019	struct drm_device *dev = obj->base.dev;
Joonas Lahtinen	72e96d6	2016-03-30 16:57:10 +0300	[diff] [blame]	2020	struct drm_i915_private *dev_priv = to_i915(dev);
				2021	struct i915_ggtt *ggtt = &dev_priv->ggtt;
Chris Wilson	aae7c06	2018-09-03 09:33:34 +0100	[diff] [blame]	2022	bool write = area->vm_flags & VM_WRITE;
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	2023	struct i915_vma *vma;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2024	pgoff_t page_offset;
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2025	int ret;
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	2026
Chris Wilson	3e977ac	2018-07-12 19:53:13 +0100	[diff] [blame]	2027	/* Sanity check that we allow writing into this object */
				2028	if (i915_gem_object_is_readonly(obj) && write)
				2029	return VM_FAULT_SIGBUS;
				2030
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2031	/* We don't use vmf->pgoff since that has the fake offset */
Jan Kara	1a29d85	2016-12-14 15:07:01 -0800	[diff] [blame]	2032	page_offset = (vmf->address - area->vm_start) >> PAGE_SHIFT;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2033
Chris Wilson	db53a30	2011-02-03 11:57:46 +0000	[diff] [blame]	2034	trace_i915_gem_object_fault(obj, page_offset, true, write);
				2035
Chris Wilson	6e4930f	2014-02-07 18:37:06 -0200	[diff] [blame]	2036	/* Try to flush the object off the GPU first without holding the lock.
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2037	* Upon acquiring the lock, we will perform our sanity checks and then
Chris Wilson	6e4930f	2014-02-07 18:37:06 -0200	[diff] [blame]	2038	* repeat the flush holding the lock in the normal manner to catch cases
				2039	* where we are gazumped.
				2040	*/
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	2041	ret = i915_gem_object_wait(obj,
				2042	I915_WAIT_INTERRUPTIBLE,
				2043	MAX_SCHEDULE_TIMEOUT,
				2044	NULL);
Chris Wilson	6e4930f	2014-02-07 18:37:06 -0200	[diff] [blame]	2045	if (ret)
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2046	goto err;
				2047
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	2048	ret = i915_gem_object_pin_pages(obj);
				2049	if (ret)
				2050	goto err;
				2051
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2052	intel_runtime_pm_get(dev_priv);
				2053
				2054	ret = i915_mutex_lock_interruptible(dev);
				2055	if (ret)
				2056	goto err_rpm;
Chris Wilson	6e4930f	2014-02-07 18:37:06 -0200	[diff] [blame]	2057
Chris Wilson	eb119bd	2012-12-16 12:43:36 +0000	[diff] [blame]	2058	/* Access to snoopable pages through the GTT is incoherent. */
Tvrtko Ursulin	0031fb9	2016-11-04 14:42:44 +0000	[diff] [blame]	2059	if (obj->cache_level != I915_CACHE_NONE && !HAS_LLC(dev_priv)) {
Chris Wilson	ddeff6e	2014-05-28 16:16:41 +0100	[diff] [blame]	2060	ret = -EFAULT;
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2061	goto err_unlock;
Chris Wilson	eb119bd	2012-12-16 12:43:36 +0000	[diff] [blame]	2062	}
				2063
Chris Wilson	8211887	2016-08-18 17:17:05 +0100	[diff] [blame]	2064
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	2065	/* Now pin it into the GTT as needed */
Chris Wilson	7e7367d	2018-06-30 10:05:09 +0100	[diff] [blame]	2066	vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0,
				2067	PIN_MAPPABLE \|
				2068	PIN_NONBLOCK \|
				2069	PIN_NONFAULT);
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	2070	if (IS_ERR(vma)) {
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	2071	/* Use a partial view if it is bigger than available space */
Chris Wilson	2d4281b	2017-01-10 09:56:32 +0000	[diff] [blame]	2072	struct i915_ggtt_view view =
Chris Wilson	8201c1f	2017-01-10 09:56:33 +0000	[diff] [blame]	2073	compute_partial_view(obj, page_offset, MIN_CHUNK_PAGES);
Chris Wilson	7e7367d	2018-06-30 10:05:09 +0100	[diff] [blame]	2074	unsigned int flags;
Chris Wilson	aa136d9	2016-08-18 17:17:03 +0100	[diff] [blame]	2075
Chris Wilson	7e7367d	2018-06-30 10:05:09 +0100	[diff] [blame]	2076	flags = PIN_MAPPABLE;
				2077	if (view.type == I915_GGTT_VIEW_NORMAL)
				2078	flags \|= PIN_NONBLOCK; /* avoid warnings for pinned */
				2079
				2080	/*
				2081	* Userspace is now writing through an untracked VMA, abandon
Chris Wilson	5034924	2016-08-18 17:17:04 +0100	[diff] [blame]	2082	* all hope that the hardware is able to track future writes.
				2083	*/
				2084	obj->frontbuffer_ggtt_origin = ORIGIN_CPU;
				2085
Chris Wilson	7e7367d	2018-06-30 10:05:09 +0100	[diff] [blame]	2086	vma = i915_gem_object_ggtt_pin(obj, &view, 0, 0, flags);
				2087	if (IS_ERR(vma) && !view.type) {
				2088	flags = PIN_MAPPABLE;
				2089	view.type = I915_GGTT_VIEW_PARTIAL;
				2090	vma = i915_gem_object_ggtt_pin(obj, &view, 0, 0, flags);
				2091	}
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	2092	}
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	2093	if (IS_ERR(vma)) {
				2094	ret = PTR_ERR(vma);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2095	goto err_unlock;
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	2096	}
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2097
Chris Wilson	c983930	2012-11-20 10:45:17 +0000	[diff] [blame]	2098	ret = i915_gem_object_set_to_gtt_domain(obj, write);
				2099	if (ret)
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2100	goto err_unpin;
Chris Wilson	c983930	2012-11-20 10:45:17 +0000	[diff] [blame]	2101
Chris Wilson	3bd4073	2017-10-09 09:43:56 +0100	[diff] [blame]	2102	ret = i915_vma_pin_fence(vma);
Chris Wilson	c983930	2012-11-20 10:45:17 +0000	[diff] [blame]	2103	if (ret)
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2104	goto err_unpin;
Chris Wilson	7d1c480	2010-08-07 21:45:03 +0100	[diff] [blame]	2105
Chris Wilson	b90b91d	2014-06-10 12:14:40 +0100	[diff] [blame]	2106	/* Finally, remap it using the new GTT offset */
Chris Wilson	c58305a	2016-08-19 16:54:28 +0100	[diff] [blame]	2107	ret = remap_io_mapping(area,
Chris Wilson	8bab1193	2017-01-14 00:28:25 +0000	[diff] [blame]	2108	area->vm_start + (vma->ggtt_view.partial.offset << PAGE_SHIFT),
Matthew Auld	73ebd50	2017-12-11 15:18:20 +0000	[diff] [blame]	2109	(ggtt->gmadr.start + vma->node.start) >> PAGE_SHIFT,
Chris Wilson	c58305a	2016-08-19 16:54:28 +0100	[diff] [blame]	2110	min_t(u64, vma->size, area->vm_end - area->vm_start),
Matthew Auld	73ebd50	2017-12-11 15:18:20 +0000	[diff] [blame]	2111	&ggtt->iomap);
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2112	if (ret)
				2113	goto err_fence;
Chris Wilson	a61007a	2016-08-18 17:17:02 +0100	[diff] [blame]	2114
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2115	/* Mark as being mmapped into userspace for later revocation */
				2116	assert_rpm_wakelock_held(dev_priv);
				2117	if (!i915_vma_set_userfault(vma) && !obj->userfault_count++)
				2118	list_add(&obj->userfault_link, &dev_priv->mm.userfault_list);
				2119	GEM_BUG_ON(!obj->userfault_count);
				2120
Chris Wilson	7125397b	2017-12-06 12:49:14 +0000	[diff] [blame]	2121	i915_vma_set_ggtt_write(vma);
				2122
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2123	err_fence:
Chris Wilson	3bd4073	2017-10-09 09:43:56 +0100	[diff] [blame]	2124	i915_vma_unpin_fence(vma);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2125	err_unpin:
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	2126	__i915_vma_unpin(vma);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2127	err_unlock:
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2128	mutex_unlock(&dev->struct_mutex);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2129	err_rpm:
				2130	intel_runtime_pm_put(dev_priv);
Chris Wilson	40e62d5	2016-10-28 13:58:41 +0100	[diff] [blame]	2131	i915_gem_object_unpin_pages(obj);
Chris Wilson	b8f9096	2016-08-05 10:14:07 +0100	[diff] [blame]	2132	err:
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2133	switch (ret) {
Chris Wilson	d9bc7e9	2011-02-07 13:09:31 +0000	[diff] [blame]	2134	case -EIO:
Daniel Vetter	2232f03	2014-09-04 09:36:18 +0200	[diff] [blame]	2135	/*
				2136	* We eat errors when the gpu is terminally wedged to avoid
				2137	* userspace unduly crashing (gl has no provisions for mmaps to
				2138	* fail). But any other -EIO isn't ours (e.g. swap in failure)
				2139	* and so needs to be reported.
				2140	*/
Chris Wilson	5213701	2018-06-06 22:45:20 +0100	[diff] [blame]	2141	if (!i915_terminally_wedged(&dev_priv->gpu_error))
				2142	return VM_FAULT_SIGBUS;
Gustavo A. R. Silva	f0d759f	2018-06-28 17:35:41 -0500	[diff] [blame]	2143	/* else: fall through */
Chris Wilson	045e769	2010-11-07 09:18:22 +0000	[diff] [blame]	2144	case -EAGAIN:
Daniel Vetter	571c608	2013-09-12 17:57:28 +0200	[diff] [blame]	2145	/*
				2146	* EAGAIN means the gpu is hung and we'll wait for the error
				2147	* handler to reset everything when re-faulting in
				2148	* i915_mutex_lock_interruptible.
Chris Wilson	d9bc7e9	2011-02-07 13:09:31 +0000	[diff] [blame]	2149	*/
Chris Wilson	c715089	2009-09-23 00:43:56 +0100	[diff] [blame]	2150	case 0:
				2151	case -ERESTARTSYS:
Chris Wilson	bed636a	2011-02-11 20:31:19 +0000	[diff] [blame]	2152	case -EINTR:
Dmitry Rogozhkin	e79e0fe	2012-10-03 17:15:26 +0300	[diff] [blame]	2153	case -EBUSY:
				2154	/*
				2155	* EBUSY is ok: this just means that another thread
				2156	* already did the job.
				2157	*/
Chris Wilson	5213701	2018-06-06 22:45:20 +0100	[diff] [blame]	2158	return VM_FAULT_NOPAGE;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2159	case -ENOMEM:
Chris Wilson	5213701	2018-06-06 22:45:20 +0100	[diff] [blame]	2160	return VM_FAULT_OOM;
Daniel Vetter	a7c2e1a	2012-10-17 11:17:16 +0200	[diff] [blame]	2161	case -ENOSPC:
Chris Wilson	45d6781	2014-01-31 11:34:57 +0000	[diff] [blame]	2162	case -EFAULT:
Chris Wilson	5213701	2018-06-06 22:45:20 +0100	[diff] [blame]	2163	return VM_FAULT_SIGBUS;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2164	default:
Daniel Vetter	a7c2e1a	2012-10-17 11:17:16 +0200	[diff] [blame]	2165	WARN_ONCE(ret, "unhandled error in i915_gem_fault: %i\n", ret);
Chris Wilson	5213701	2018-06-06 22:45:20 +0100	[diff] [blame]	2166	return VM_FAULT_SIGBUS;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2167	}
				2168	}
				2169
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2170	static void __i915_gem_object_release_mmap(struct drm_i915_gem_object *obj)
				2171	{
				2172	struct i915_vma *vma;
				2173
				2174	GEM_BUG_ON(!obj->userfault_count);
				2175
				2176	obj->userfault_count = 0;
				2177	list_del(&obj->userfault_link);
				2178	drm_vma_node_unmap(&obj->base.vma_node,
				2179	obj->base.dev->anon_inode->i_mapping);
				2180
Chris Wilson	e2189dd	2017-12-07 21:14:07 +0000	[diff] [blame]	2181	for_each_ggtt_vma(vma, obj)
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2182	i915_vma_unset_userfault(vma);
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2183	}
				2184
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2185	/**
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2186	* i915_gem_release_mmap - remove physical page mappings
				2187	* @obj: obj in question
				2188	*
André Goddard Rosa	af901ca	2009-11-14 13:09:05 -0200	[diff] [blame]	2189	* Preserve the reservation of the mmapping with the DRM core code, but
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2190	* relinquish ownership of the pages back to the system.
				2191	*
				2192	* It is vital that we remove the page mapping if we have mapped a tiled
				2193	* object through the GTT and then lose the fence register due to
				2194	* resource pressure. Similarly if the object has been moved out of the
				2195	* aperture, than pages mapped into userspace must be revoked. Removing the
				2196	* mapping will then trigger a page fault on the next user access, allowing
				2197	* fixup by i915_gem_fault().
				2198	*/
Eric Anholt	d05ca30	2009-07-10 13:02:26 -0700	[diff] [blame]	2199	void
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	2200	i915_gem_release_mmap(struct drm_i915_gem_object *obj)
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2201	{
Chris Wilson	275f039	2016-10-24 13:42:14 +0100	[diff] [blame]	2202	struct drm_i915_private *i915 = to_i915(obj->base.dev);
Chris Wilson	275f039	2016-10-24 13:42:14 +0100	[diff] [blame]	2203
Chris Wilson	349f2cc	2016-04-13 17:35:12 +0100	[diff] [blame]	2204	/* Serialisation between user GTT access and our code depends upon
				2205	* revoking the CPU's PTE whilst the mutex is held. The next user
				2206	* pagefault then has to wait until we release the mutex.
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	2207	*
				2208	* Note that RPM complicates somewhat by adding an additional
				2209	* requirement that operations to the GGTT be made holding the RPM
				2210	* wakeref.
Chris Wilson	349f2cc	2016-04-13 17:35:12 +0100	[diff] [blame]	2211	*/
Chris Wilson	275f039	2016-10-24 13:42:14 +0100	[diff] [blame]	2212	lockdep_assert_held(&i915->drm.struct_mutex);
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	2213	intel_runtime_pm_get(i915);
Chris Wilson	349f2cc	2016-04-13 17:35:12 +0100	[diff] [blame]	2214
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2215	if (!obj->userfault_count)
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	2216	goto out;
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2217
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2218	__i915_gem_object_release_mmap(obj);
Chris Wilson	349f2cc	2016-04-13 17:35:12 +0100	[diff] [blame]	2219
				2220	/* Ensure that the CPU's PTE are revoked and there are no outstanding
				2221	* memory transactions from userspace before we return. The TLB
				2222	* flushing implied above by changing the PTE above should be
				2223	* sufficient, an extra barrier here just provides us with a bit
				2224	* of paranoid documentation about our requirement to serialise
				2225	* memory writes before touching registers / GSM.
				2226	*/
				2227	wmb();
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	2228
				2229	out:
				2230	intel_runtime_pm_put(i915);
Chris Wilson	901782b	2009-07-10 08:18:50 +0100	[diff] [blame]	2231	}
				2232
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2233	void i915_gem_runtime_suspend(struct drm_i915_private *dev_priv)
Chris Wilson	eedd10f	2014-06-16 08:57:44 +0100	[diff] [blame]	2234	{
Chris Wilson	3594a3e	2016-10-24 13:42:16 +0100	[diff] [blame]	2235	struct drm_i915_gem_object *obj, *on;
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2236	int i;
Chris Wilson	eedd10f	2014-06-16 08:57:44 +0100	[diff] [blame]	2237
Chris Wilson	3594a3e	2016-10-24 13:42:16 +0100	[diff] [blame]	2238	/*
				2239	* Only called during RPM suspend. All users of the userfault_list
				2240	* must be holding an RPM wakeref to ensure that this can not
				2241	* run concurrently with themselves (and use the struct_mutex for
				2242	* protection between themselves).
				2243	*/
				2244
				2245	list_for_each_entry_safe(obj, on,
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2246	&dev_priv->mm.userfault_list, userfault_link)
				2247	__i915_gem_object_release_mmap(obj);
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2248
				2249	/* The fence will be lost when the device powers down. If any were
				2250	* in use by hardware (i.e. they are pinned), we should not be powering
				2251	* down! All other fences will be reacquired by the user upon waking.
				2252	*/
				2253	for (i = 0; i < dev_priv->num_fence_regs; i++) {
				2254	struct drm_i915_fence_reg *reg = &dev_priv->fence_regs[i];
				2255
Chris Wilson	e0ec3ec	2017-02-03 12:57:17 +0000	[diff] [blame]	2256	/* Ideally we want to assert that the fence register is not
				2257	* live at this point (i.e. that no piece of code will be
				2258	* trying to write through fence + GTT, as that both violates
				2259	* our tracking of activity and associated locking/barriers,
				2260	* but also is illegal given that the hw is powered down).
				2261	*
				2262	* Previously we used reg->pin_count as a "liveness" indicator.
				2263	* That is not sufficient, and we need a more fine-grained
				2264	* tool if we want to have a sanity check here.
				2265	*/
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2266
				2267	if (!reg->vma)
				2268	continue;
				2269
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	2270	GEM_BUG_ON(i915_vma_has_userfault(reg->vma));
Chris Wilson	7c108fd	2016-10-24 13:42:18 +0100	[diff] [blame]	2271	reg->dirty = true;
				2272	}
Chris Wilson	eedd10f	2014-06-16 08:57:44 +0100	[diff] [blame]	2273	}
				2274
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2275	static int i915_gem_object_create_mmap_offset(struct drm_i915_gem_object *obj)
				2276	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	2277	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2278	int err;
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2279
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2280	err = drm_gem_create_mmap_offset(&obj->base);
Chris Wilson	b42a13d	2017-01-06 15:22:40 +0000	[diff] [blame]	2281	if (likely(!err))
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2282	return 0;
Daniel Vetter	da494d7	2012-12-20 15:11:16 +0100	[diff] [blame]	2283
Chris Wilson	b42a13d	2017-01-06 15:22:40 +0000	[diff] [blame]	2284	/* Attempt to reap some mmap space from dead objects */
				2285	do {
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	2286	err = i915_gem_wait_for_idle(dev_priv,
				2287	I915_WAIT_INTERRUPTIBLE,
				2288	MAX_SCHEDULE_TIMEOUT);
Chris Wilson	b42a13d	2017-01-06 15:22:40 +0000	[diff] [blame]	2289	if (err)
				2290	break;
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2291
Chris Wilson	b42a13d	2017-01-06 15:22:40 +0000	[diff] [blame]	2292	i915_gem_drain_freed_objects(dev_priv);
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2293	err = drm_gem_create_mmap_offset(&obj->base);
Chris Wilson	b42a13d	2017-01-06 15:22:40 +0000	[diff] [blame]	2294	if (!err)
				2295	break;
				2296
				2297	} while (flush_delayed_work(&dev_priv->gt.retire_work));
Daniel Vetter	da494d7	2012-12-20 15:11:16 +0100	[diff] [blame]	2298
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2299	return err;
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2300	}
				2301
				2302	static void i915_gem_object_free_mmap_offset(struct drm_i915_gem_object *obj)
				2303	{
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2304	drm_gem_free_mmap_offset(&obj->base);
				2305	}
				2306
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	2307	int
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	2308	i915_gem_mmap_gtt(struct drm_file *file,
				2309	struct drm_device *dev,
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	2310	uint32_t handle,
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	2311	uint64_t *offset)
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2312	{
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	2313	struct drm_i915_gem_object *obj;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2314	int ret;
				2315
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	2316	obj = i915_gem_object_lookup(file, handle);
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2317	if (!obj)
				2318	return -ENOENT;
Chris Wilson	ab18282	2009-09-22 18:46:17 +0100	[diff] [blame]	2319
Chris Wilson	d8cb508	2012-08-11 15:41:03 +0100	[diff] [blame]	2320	ret = i915_gem_object_create_mmap_offset(obj);
Chris Wilson	f3f6184	2016-08-05 10:14:14 +0100	[diff] [blame]	2321	if (ret == 0)
				2322	*offset = drm_vma_node_offset_addr(&obj->base.vma_node);
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2323
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	2324	i915_gem_object_put(obj);
Chris Wilson	1d7cfea	2010-10-17 09:45:41 +0100	[diff] [blame]	2325	return ret;
Jesse Barnes	de151cf	2008-11-12 10:03:55 -0800	[diff] [blame]	2326	}
				2327
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	2328	/**
				2329	* i915_gem_mmap_gtt_ioctl - prepare an object for GTT mmap'ing
				2330	* @dev: DRM device
				2331	* @data: GTT mapping ioctl data
				2332	* @file: DRM file used to look up the object handle
				2333	*
				2334	* Simply returns the fake offset to userspace so it can mmap it.
				2335	* The mmap call will end up in drm_gem_mmap(), which will set things
				2336	* up so we can get faults in the handler above.
				2337	*
				2338	* The fault handler will take care of binding the object into the GTT
				2339	* (since it may have been evicted to make room for something), allocating
				2340	* a fence register, and mapping the appropriate aperture address into
				2341	* userspace.
				2342	*/
				2343	int
				2344	i915_gem_mmap_gtt_ioctl(struct drm_device *dev, void *data,
				2345	struct drm_file *file)
				2346	{
				2347	struct drm_i915_gem_mmap_gtt *args = data;
				2348
Dave Airlie	da6b51d	2014-12-24 13:11:17 +1000	[diff] [blame]	2349	return i915_gem_mmap_gtt(file, dev, args->handle, &args->offset);
Dave Airlie	ff72145b	2011-02-07 12:16:14 +1000	[diff] [blame]	2350	}
				2351
Daniel Vetter	225067e	2012-08-20 10:23:20 +0200	[diff] [blame]	2352	/* Immediately discard the backing storage */
				2353	static void
				2354	i915_gem_object_truncate(struct drm_i915_gem_object *obj)
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2355	{
Chris Wilson	4d6294bf	2012-08-11 15:41:05 +0100	[diff] [blame]	2356	i915_gem_object_free_mmap_offset(obj);
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	2357
Chris Wilson	4d6294bf	2012-08-11 15:41:05 +0100	[diff] [blame]	2358	if (obj->base.filp == NULL)
				2359	return;
				2360
Daniel Vetter	225067e	2012-08-20 10:23:20 +0200	[diff] [blame]	2361	/* Our goal here is to return as much of the memory as
				2362	* is possible back to the system as we are called from OOM.
				2363	* To do this we must instruct the shmfs to drop all of its
				2364	* backing pages, now.
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2365	*/
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2366	shmem_truncate_range(file_inode(obj->base.filp), 0, (loff_t)-1);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2367	obj->mm.madv = __I915_MADV_PURGED;
Chris Wilson	4e5462e	2017-03-07 13:20:31 +0000	[diff] [blame]	2368	obj->mm.pages = ERR_PTR(-EFAULT);
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2369	}
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2370
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2371	/* Try to discard unwanted pages */
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2372	void __i915_gem_object_invalidate(struct drm_i915_gem_object *obj)
Daniel Vetter	225067e	2012-08-20 10:23:20 +0200	[diff] [blame]	2373	{
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2374	struct address_space *mapping;
				2375
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2376	lockdep_assert_held(&obj->mm.lock);
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2377	GEM_BUG_ON(i915_gem_object_has_pages(obj));
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2378
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2379	switch (obj->mm.madv) {
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2380	case I915_MADV_DONTNEED:
				2381	i915_gem_object_truncate(obj);
				2382	case __I915_MADV_PURGED:
				2383	return;
				2384	}
				2385
				2386	if (obj->base.filp == NULL)
				2387	return;
				2388
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	2389	mapping = obj->base.filp->f_mapping,
Chris Wilson	5537252	2014-03-25 13:23:06 +0000	[diff] [blame]	2390	invalidate_mapping_pages(mapping, 0, (loff_t)-1);
Chris Wilson	e5281cc	2010-10-28 13:45:36 +0100	[diff] [blame]	2391	}
				2392
Chris Wilson	5cdf588	2010-09-27 15:51:07 +0100	[diff] [blame]	2393	static void
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2394	i915_gem_object_put_pages_gtt(struct drm_i915_gem_object *obj,
				2395	struct sg_table *pages)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2396	{
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2397	struct sgt_iter sgt_iter;
				2398	struct page *page;
Daniel Vetter	1286ff7	2012-05-10 15:25:09 +0200	[diff] [blame]	2399
Chris Wilson	e5facdf	2016-12-23 14:57:57 +0000	[diff] [blame]	2400	__i915_gem_object_release_shmem(obj, pages, true);
Eric Anholt	856fa19	2009-03-19 14:10:50 -0700	[diff] [blame]	2401
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2402	i915_gem_gtt_finish_pages(obj, pages);
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2403
Daniel Vetter	6dacfd2	2011-09-12 21:30:02 +0200	[diff] [blame]	2404	if (i915_gem_object_needs_bit17_swizzle(obj))
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2405	i915_gem_object_save_bit_17_swizzle(obj, pages);
Eric Anholt	280b713	2009-03-12 16:56:27 -0700	[diff] [blame]	2406
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2407	for_each_sgt_page(page, sgt_iter, pages) {
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2408	if (obj->mm.dirty)
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2409	set_page_dirty(page);
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	2410
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2411	if (obj->mm.madv == I915_MADV_WILLNEED)
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2412	mark_page_accessed(page);
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	2413
Kirill A. Shutemov	09cbfea	2016-04-01 15:29:47 +0300	[diff] [blame]	2414	put_page(page);
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	2415	}
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2416	obj->mm.dirty = false;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2417
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2418	sg_free_table(pages);
				2419	kfree(pages);
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2420	}
				2421
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	2422	static void __i915_gem_object_reset_page_iter(struct drm_i915_gem_object *obj)
				2423	{
				2424	struct radix_tree_iter iter;
Ville Syrjälä	c23aa71	2017-09-01 20:12:51 +0300	[diff] [blame]	2425	void __rcu **slot;
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	2426
Chris Wilson	bea6e98	2017-10-26 14:00:31 +0100	[diff] [blame]	2427	rcu_read_lock();
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2428	radix_tree_for_each_slot(slot, &obj->mm.get_page.radix, &iter, 0)
				2429	radix_tree_delete(&obj->mm.get_page.radix, iter.index);
Chris Wilson	bea6e98	2017-10-26 14:00:31 +0100	[diff] [blame]	2430	rcu_read_unlock();
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	2431	}
				2432
Chris Wilson	acd1c1e	2018-06-11 08:55:32 +0100	[diff] [blame]	2433	static struct sg_table *
				2434	__i915_gem_object_unset_pages(struct drm_i915_gem_object *obj)
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2435	{
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	2436	struct drm_i915_private *i915 = to_i915(obj->base.dev);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2437	struct sg_table *pages;
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2438
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2439	pages = fetch_and_zero(&obj->mm.pages);
Chris Wilson	acd1c1e	2018-06-11 08:55:32 +0100	[diff] [blame]	2440	if (!pages)
				2441	return NULL;
Chris Wilson	a2165e3	2012-12-03 11:49:00 +0000	[diff] [blame]	2442
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	2443	spin_lock(&i915->mm.obj_lock);
				2444	list_del(&obj->mm.link);
				2445	spin_unlock(&i915->mm.obj_lock);
				2446
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2447	if (obj->mm.mapping) {
Chris Wilson	4b30cb2	2016-08-18 17:16:42 +0100	[diff] [blame]	2448	void *ptr;
				2449
Chris Wilson	0ce8178	2017-05-17 13:09:59 +0100	[diff] [blame]	2450	ptr = page_mask_bits(obj->mm.mapping);
Chris Wilson	4b30cb2	2016-08-18 17:16:42 +0100	[diff] [blame]	2451	if (is_vmalloc_addr(ptr))
				2452	vunmap(ptr);
Chris Wilson	fb8621d	2016-04-08 12:11:14 +0100	[diff] [blame]	2453	else
Chris Wilson	4b30cb2	2016-08-18 17:16:42 +0100	[diff] [blame]	2454	kunmap(kmap_to_page(ptr));
				2455
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2456	obj->mm.mapping = NULL;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2457	}
				2458
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	2459	__i915_gem_object_reset_page_iter(obj);
Chris Wilson	acd1c1e	2018-06-11 08:55:32 +0100	[diff] [blame]	2460	obj->mm.page_sizes.phys = obj->mm.page_sizes.sg = 0;
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	2461
Chris Wilson	acd1c1e	2018-06-11 08:55:32 +0100	[diff] [blame]	2462	return pages;
				2463	}
				2464
				2465	void __i915_gem_object_put_pages(struct drm_i915_gem_object *obj,
				2466	enum i915_mm_subclass subclass)
				2467	{
				2468	struct sg_table *pages;
				2469
				2470	if (i915_gem_object_has_pinned_pages(obj))
				2471	return;
				2472
				2473	GEM_BUG_ON(obj->bind_count);
				2474	if (!i915_gem_object_has_pages(obj))
				2475	return;
				2476
				2477	/* May be called by shrinker from within get_pages() (on another bo) */
				2478	mutex_lock_nested(&obj->mm.lock, subclass);
				2479	if (unlikely(atomic_read(&obj->mm.pages_pin_count)))
				2480	goto unlock;
				2481
				2482	/*
				2483	* ->put_pages might need to allocate memory for the bit17 swizzle
				2484	* array, hence protect them from being reaped by removing them from gtt
				2485	* lists early.
				2486	*/
				2487	pages = __i915_gem_object_unset_pages(obj);
Chris Wilson	4e5462e	2017-03-07 13:20:31 +0000	[diff] [blame]	2488	if (!IS_ERR(pages))
				2489	obj->ops->put_pages(obj, pages);
				2490
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2491	unlock:
				2492	mutex_unlock(&obj->mm.lock);
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2493	}
				2494
Tvrtko Ursulin	f8e5786	2018-09-26 09:03:53 +0100	[diff] [blame]	2495	bool i915_sg_trim(struct sg_table *orig_st)
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2496	{
				2497	struct sg_table new_st;
				2498	struct scatterlist *sg, *new_sg;
				2499	unsigned int i;
				2500
				2501	if (orig_st->nents == orig_st->orig_nents)
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	2502	return false;
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2503
Chris Wilson	8bfc478f	2016-12-23 14:57:58 +0000	[diff] [blame]	2504	if (sg_alloc_table(&new_st, orig_st->nents, GFP_KERNEL | __GFP_NOWARN))
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	2505	return false;
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2506
				2507	new_sg = new_st.sgl;
				2508	for_each_sg(orig_st->sgl, sg, orig_st->nents, i) {
				2509	sg_set_page(new_sg, sg_page(sg), sg->length, 0);
Matthew Auld	c6d22ab	2018-09-20 15:27:06 +0100	[diff] [blame]	2510	sg_dma_address(new_sg) = sg_dma_address(sg);
				2511	sg_dma_len(new_sg) = sg_dma_len(sg);
				2512
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2513	new_sg = sg_next(new_sg);
				2514	}
Chris Wilson	c2dc6cc	2016-12-19 12:43:46 +0000	[diff] [blame]	2515	GEM_BUG_ON(new_sg); /* Should walk exactly nents and hit the end */
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2516
				2517	sg_free_table(orig_st);
				2518
				2519	*orig_st = new_st;
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	2520	return true;
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2521	}
				2522
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2523	static int i915_gem_object_get_pages_gtt(struct drm_i915_gem_object *obj)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2524	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	2525	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
Chris Wilson	d766ef5	2016-12-19 12:43:45 +0000	[diff] [blame]	2526	const unsigned long page_count = obj->base.size / PAGE_SIZE;
				2527	unsigned long i;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2528	struct address_space *mapping;
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2529	struct sg_table *st;
				2530	struct scatterlist *sg;
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2531	struct sgt_iter sgt_iter;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2532	struct page *page;
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2533	unsigned long last_pfn = 0; /* suppress gcc warning */
Tvrtko Ursulin	5602452	2017-08-03 10:14:17 +0100	[diff] [blame]	2534	unsigned int max_segment = i915_sg_segment_size();
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2535	unsigned int sg_page_sizes;
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2536	gfp_t noreclaim;
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2537	int ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2538
Chris Wilson	e0ff7a7	2018-09-03 09:33:36 +0100	[diff] [blame]	2539	/*
				2540	* Assert that the object is not currently in any GPU domain. As it
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2541	* wasn't in the GTT, there shouldn't be any way it could have been in
				2542	* a GPU cache
				2543	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	2544	GEM_BUG_ON(obj->read_domains & I915_GEM_GPU_DOMAINS);
				2545	GEM_BUG_ON(obj->write_domain & I915_GEM_GPU_DOMAINS);
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2546
Chris Wilson	e0ff7a7	2018-09-03 09:33:36 +0100	[diff] [blame]	2547	/*
				2548	* If there's no chance of allocating enough pages for the whole
				2549	* object, bail early.
				2550	*/
				2551	if (page_count > totalram_pages)
				2552	return -ENOMEM;
				2553
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2554	st = kmalloc(sizeof(*st), GFP_KERNEL);
				2555	if (st == NULL)
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2556	return -ENOMEM;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2557
Chris Wilson	d766ef5	2016-12-19 12:43:45 +0000	[diff] [blame]	2558	rebuild_st:
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2559	if (sg_alloc_table(st, page_count, GFP_KERNEL)) {
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2560	kfree(st);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2561	return -ENOMEM;
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2562	}
				2563
Chris Wilson	e0ff7a7	2018-09-03 09:33:36 +0100	[diff] [blame]	2564	/*
				2565	* Get the list of pages out of our struct file. They'll be pinned
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2566	* at this point until we release them.
				2567	*
				2568	* Fail silently without starting the shrinker
				2569	*/
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	2570	mapping = obj->base.filp->f_mapping;
Chris Wilson	0f6ab55	2017-06-09 12:03:48 +0100	[diff] [blame]	2571	noreclaim = mapping_gfp_constraint(mapping, ~__GFP_RECLAIM);
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2572	noreclaim |= __GFP_NORETRY | __GFP_NOWARN;
				2573
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2574	sg = st->sgl;
				2575	st->nents = 0;
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2576	sg_page_sizes = 0;
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2577	for (i = 0; i < page_count; i++) {
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2578	const unsigned int shrink[] = {
				2579	I915_SHRINK_BOUND | I915_SHRINK_UNBOUND | I915_SHRINK_PURGEABLE,
				2580	0,
				2581	}, *s = shrink;
				2582	gfp_t gfp = noreclaim;
				2583
				2584	do {
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2585	page = shmem_read_mapping_page_gfp(mapping, i, gfp);
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2586	if (likely(!IS_ERR(page)))
				2587	break;
				2588
				2589	if (!*s) {
				2590	ret = PTR_ERR(page);
				2591	goto err_sg;
				2592	}
				2593
Chris Wilson	912d572	2017-09-06 16:19:30 -0700	[diff] [blame]	2594	i915_gem_shrink(dev_priv, 2 * page_count, NULL, *s++);
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2595	cond_resched();
Chris Wilson	24f8e00	2017-03-22 11:05:21 +0000	[diff] [blame]	2596
Chris Wilson	e0ff7a7	2018-09-03 09:33:36 +0100	[diff] [blame]	2597	/*
				2598	* We've tried hard to allocate the memory by reaping
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2599	* our own buffer, now let the real VM do its job and
				2600	* go down in flames if truly OOM.
Chris Wilson	24f8e00	2017-03-22 11:05:21 +0000	[diff] [blame]	2601	*
				2602	* However, since graphics tend to be disposable,
				2603	* defer the oom here by reporting the ENOMEM back
				2604	* to userspace.
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	2605	*/
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2606	if (!*s) {
				2607	/* reclaim and warn, but no oom */
				2608	gfp = mapping_gfp_mask(mapping);
Chris Wilson	eaf4180	2017-06-09 12:03:47 +0100	[diff] [blame]	2609
Chris Wilson	e0ff7a7	2018-09-03 09:33:36 +0100	[diff] [blame]	2610	/*
				2611	* Our bo are always dirty and so we require
Chris Wilson	eaf4180	2017-06-09 12:03:47 +0100	[diff] [blame]	2612	* kswapd to reclaim our pages (direct reclaim
				2613	* does not effectively begin pageout of our
				2614	* buffers on its own). However, direct reclaim
				2615	* only waits for kswapd when under allocation
				2616	* congestion. So as a result __GFP_RECLAIM is
				2617	* unreliable and fails to actually reclaim our
				2618	* dirty pages -- unless you try over and over
				2619	* again with !__GFP_NORETRY. However, we still
				2620	* want to fail this allocation rather than
				2621	* trigger the out-of-memory killer and for
Michal Hocko	dbb3295	2017-07-12 14:36:55 -0700	[diff] [blame]	2622	* this we want __GFP_RETRY_MAYFAIL.
Chris Wilson	eaf4180	2017-06-09 12:03:47 +0100	[diff] [blame]	2623	*/
Michal Hocko	dbb3295	2017-07-12 14:36:55 -0700	[diff] [blame]	2624	gfp |= __GFP_RETRY_MAYFAIL;
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2625	}
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	2626	} while (1);
				2627
Chris Wilson	871dfbd	2016-10-11 09:20:21 +0100	[diff] [blame]	2628	if (!i ||
				2629	sg->length >= max_segment ||
				2630	page_to_pfn(page) != last_pfn + 1) {
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2631	if (i) {
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2632	sg_page_sizes |= sg->length;
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2633	sg = sg_next(sg);
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2634	}
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2635	st->nents++;
				2636	sg_set_page(sg, page, PAGE_SIZE, 0);
				2637	} else {
				2638	sg->length += PAGE_SIZE;
				2639	}
				2640	last_pfn = page_to_pfn(page);
Daniel Vetter	3bbbe70	2013-10-07 17:15:45 -0300	[diff] [blame]	2641
				2642	/* Check that the i965g/gm workaround works. */
				2643	WARN_ON((gfp & __GFP_DMA32) && (last_pfn >= 0x00100000UL));
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2644	}
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2645	if (sg) { /* loop terminated early; short sg table */
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2646	sg_page_sizes |= sg->length;
Konrad Rzeszutek Wilk	426729d	2013-06-24 11:47:48 -0400	[diff] [blame]	2647	sg_mark_end(sg);
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2648	}
Chris Wilson	74ce6b6	2012-10-19 15:51:06 +0100	[diff] [blame]	2649
Tvrtko Ursulin	0c40ce1	2016-11-09 15:13:43 +0000	[diff] [blame]	2650	/* Trim unused sg entries to avoid wasting memory. */
				2651	i915_sg_trim(st);
				2652
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2653	ret = i915_gem_gtt_prepare_pages(obj, st);
Chris Wilson	d766ef5	2016-12-19 12:43:45 +0000	[diff] [blame]	2654	if (ret) {
Chris Wilson	e0ff7a7	2018-09-03 09:33:36 +0100	[diff] [blame]	2655	/*
				2656	* DMA remapping failed? One possible cause is that
Chris Wilson	d766ef5	2016-12-19 12:43:45 +0000	[diff] [blame]	2657	* it could not reserve enough large entries, asking
				2658	* for PAGE_SIZE chunks instead may be helpful.
				2659	*/
				2660	if (max_segment > PAGE_SIZE) {
				2661	for_each_sgt_page(page, sgt_iter, st)
				2662	put_page(page);
				2663	sg_free_table(st);
				2664
				2665	max_segment = PAGE_SIZE;
				2666	goto rebuild_st;
				2667	} else {
				2668	dev_warn(&dev_priv->drm.pdev->dev,
				2669	"Failed to DMA remap %lu pages\n",
				2670	page_count);
				2671	goto err_pages;
				2672	}
				2673	}
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2674
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2675	if (i915_gem_object_needs_bit17_swizzle(obj))
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2676	i915_gem_object_do_bit_17_swizzle(obj, st);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2677
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2678	__i915_gem_object_set_pages(obj, st, sg_page_sizes);
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2679
				2680	return 0;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2681
Chris Wilson	b17993b	2016-11-14 11:29:30 +0000	[diff] [blame]	2682	err_sg:
Imre Deak	90797e6	2013-02-18 19:28:03 +0200	[diff] [blame]	2683	sg_mark_end(sg);
Chris Wilson	b17993b	2016-11-14 11:29:30 +0000	[diff] [blame]	2684	err_pages:
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2685	for_each_sgt_page(page, sgt_iter, st)
				2686	put_page(page);
Chris Wilson	9da3da6	2012-06-01 15:20:22 +0100	[diff] [blame]	2687	sg_free_table(st);
				2688	kfree(st);
Chris Wilson	0820baf	2014-03-25 13:23:03 +0000	[diff] [blame]	2689
Chris Wilson	e0ff7a7	2018-09-03 09:33:36 +0100	[diff] [blame]	2690	/*
				2691	* shmemfs first checks if there is enough memory to allocate the page
Chris Wilson	0820baf	2014-03-25 13:23:03 +0000	[diff] [blame]	2692	* and reports ENOSPC should there be insufficient, along with the usual
				2693	* ENOMEM for a genuine allocation failure.
				2694	*
				2695	* We use ENOSPC in our driver to mean that we have run out of aperture
				2696	* space and so want to translate the error from shmemfs back to our
				2697	* usual understanding of ENOMEM.
				2698	*/
Imre Deak	e227330	2015-07-09 12:59:05 +0300	[diff] [blame]	2699	if (ret == -ENOSPC)
				2700	ret = -ENOMEM;
				2701
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2702	return ret;
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2703	}
				2704
				2705	void __i915_gem_object_set_pages(struct drm_i915_gem_object *obj,
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2706	struct sg_table *pages,
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2707	unsigned int sg_page_sizes)
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2708	{
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2709	struct drm_i915_private *i915 = to_i915(obj->base.dev);
				2710	unsigned long supported = INTEL_INFO(i915)->page_sizes;
				2711	int i;
				2712
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2713	lockdep_assert_held(&obj->mm.lock);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2714
				2715	obj->mm.get_page.sg_pos = pages->sgl;
				2716	obj->mm.get_page.sg_idx = 0;
				2717
				2718	obj->mm.pages = pages;
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2719
				2720	if (i915_gem_object_is_tiled(obj) &&
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	2721	i915->quirks & QUIRK_PIN_SWIZZLED_PAGES) {
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2722	GEM_BUG_ON(obj->mm.quirked);
				2723	__i915_gem_object_pin_pages(obj);
				2724	obj->mm.quirked = true;
				2725	}
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2726
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2727	GEM_BUG_ON(!sg_page_sizes);
				2728	obj->mm.page_sizes.phys = sg_page_sizes;
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2729
				2730	/*
Matthew Auld	84e8978	2017-10-09 12:00:24 +0100	[diff] [blame]	2731	* Calculate the supported page-sizes which fit into the given
				2732	* sg_page_sizes. This will give us the page-sizes which we may be able
				2733	* to use opportunistically when later inserting into the GTT. For
				2734	* example if phys=2G, then in theory we should be able to use 1G, 2M,
				2735	* 64K or 4K pages, although in practice this will depend on a number of
				2736	* other factors.
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2737	*/
				2738	obj->mm.page_sizes.sg = 0;
				2739	for_each_set_bit(i, &supported, ilog2(I915_GTT_MAX_PAGE_SIZE) + 1) {
				2740	if (obj->mm.page_sizes.phys & ~0u << i)
				2741	obj->mm.page_sizes.sg \|= BIT(i);
				2742	}
Matthew Auld	a5c08166	2017-10-06 23:18:18 +0100	[diff] [blame]	2743	GEM_BUG_ON(!HAS_PAGE_SIZES(i915, obj->mm.page_sizes.sg));
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	2744
				2745	spin_lock(&i915->mm.obj_lock);
				2746	list_add(&obj->mm.link, &i915->mm.unbound_list);
				2747	spin_unlock(&i915->mm.obj_lock);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2748	}
				2749
				2750	static int ____i915_gem_object_get_pages(struct drm_i915_gem_object *obj)
				2751	{
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2752	int err;
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2753
				2754	if (unlikely(obj->mm.madv != I915_MADV_WILLNEED)) {
				2755	DRM_DEBUG("Attempting to obtain a purgeable object\n");
				2756	return -EFAULT;
				2757	}
				2758
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2759	err = obj->ops->get_pages(obj);
Matthew Auld	b65a9b9	2017-12-18 10:38:55 +0000	[diff] [blame]	2760	GEM_BUG_ON(!err && !i915_gem_object_has_pages(obj));
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2761
Matthew Auld	b91b09e	2017-10-06 23:18:17 +0100	[diff] [blame]	2762	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2763	}
				2764
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2765	/* Ensure that the associated pages are gathered from the backing storage
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2766	* and pinned into our object. i915_gem_object_pin_pages() may be called
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2767	* multiple times before they are released by a single call to
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2768	* i915_gem_object_unpin_pages() - once the pages are no longer referenced
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2769	* either as a result of memory pressure (reaping pages under the shrinker)
				2770	* or as the object is itself released.
				2771	*/
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2772	int __i915_gem_object_get_pages(struct drm_i915_gem_object *obj)
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2773	{
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2774	int err;
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	2775
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2776	err = mutex_lock_interruptible(&obj->mm.lock);
				2777	if (err)
				2778	return err;
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	2779
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2780	if (unlikely(!i915_gem_object_has_pages(obj))) {
Chris Wilson	88c880b	2017-09-06 14:52:20 +0100	[diff] [blame]	2781	GEM_BUG_ON(i915_gem_object_has_pinned_pages(obj));
				2782
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2783	err = ____i915_gem_object_get_pages(obj);
				2784	if (err)
				2785	goto unlock;
				2786
				2787	smp_mb__before_atomic();
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2788	}
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2789	atomic_inc(&obj->mm.pages_pin_count);
Chris Wilson	43e28f0	2013-01-08 10:53:09 +0000	[diff] [blame]	2790
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2791	unlock:
				2792	mutex_unlock(&obj->mm.lock);
Chris Wilson	03ac84f	2016-10-28 13:58:36 +0100	[diff] [blame]	2793	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	2794	}
				2795
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2796	/* The 'mapping' part of i915_gem_object_pin_map() below */
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2797	static void i915_gem_object_map(const struct drm_i915_gem_object obj,
				2798	enum i915_map_type type)
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2799	{
				2800	unsigned long n_pages = obj->base.size >> PAGE_SHIFT;
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2801	struct sg_table *sgt = obj->mm.pages;
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2802	struct sgt_iter sgt_iter;
				2803	struct page *page;
Dave Gordon	b338fa4	2016-05-20 11:54:05 +0100	[diff] [blame]	2804	struct page *stack_pages[32];
				2805	struct page **pages = stack_pages;
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2806	unsigned long i = 0;
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2807	pgprot_t pgprot;
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2808	void *addr;
				2809
				2810	/* A single page can always be kmapped */
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2811	if (n_pages == 1 && type == I915_MAP_WB)
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2812	return kmap(sg_page(sgt->sgl));
				2813
Dave Gordon	b338fa4	2016-05-20 11:54:05 +0100	[diff] [blame]	2814	if (n_pages > ARRAY_SIZE(stack_pages)) {
				2815	/* Too big for stack -- allocate temporary array instead */
Michal Hocko	0ee931c	2017-09-13 16:28:29 -0700	[diff] [blame]	2816	pages = kvmalloc_array(n_pages, sizeof(*pages), GFP_KERNEL);
Dave Gordon	b338fa4	2016-05-20 11:54:05 +0100	[diff] [blame]	2817	if (!pages)
				2818	return NULL;
				2819	}
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2820
Dave Gordon	85d1225	2016-05-20 11:54:06 +0100	[diff] [blame]	2821	for_each_sgt_page(page, sgt_iter, sgt)
				2822	pages[i++] = page;
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2823
				2824	/* Check that we have the expected number of pages */
				2825	GEM_BUG_ON(i != n_pages);
				2826
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2827	switch (type) {
Chris Wilson	a575c67	2017-08-28 11:46:31 +0100	[diff] [blame]	2828	default:
				2829	MISSING_CASE(type);
				2830	/* fallthrough to use PAGE_KERNEL anyway */
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2831	case I915_MAP_WB:
				2832	pgprot = PAGE_KERNEL;
				2833	break;
				2834	case I915_MAP_WC:
				2835	pgprot = pgprot_writecombine(PAGE_KERNEL_IO);
				2836	break;
				2837	}
				2838	addr = vmap(pages, n_pages, 0, pgprot);
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2839
Dave Gordon	b338fa4	2016-05-20 11:54:05 +0100	[diff] [blame]	2840	if (pages != stack_pages)
Michal Hocko	2098105	2017-05-17 14:23:12 +0200	[diff] [blame]	2841	kvfree(pages);
Dave Gordon	dd6034c	2016-05-20 11:54:04 +0100	[diff] [blame]	2842
				2843	return addr;
				2844	}
				2845
				2846	/* get, pin, and map the pages of the object into kernel space */
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2847	void i915_gem_object_pin_map(struct drm_i915_gem_object obj,
				2848	enum i915_map_type type)
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2849	{
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2850	enum i915_map_type has_type;
				2851	bool pinned;
				2852	void *ptr;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2853	int ret;
				2854
Tina Zhang	a03f395	2017-11-14 10:25:13 +0000	[diff] [blame]	2855	if (unlikely(!i915_gem_object_has_struct_page(obj)))
				2856	return ERR_PTR(-ENXIO);
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2857
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2858	ret = mutex_lock_interruptible(&obj->mm.lock);
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2859	if (ret)
				2860	return ERR_PTR(ret);
				2861
Chris Wilson	a575c67	2017-08-28 11:46:31 +0100	[diff] [blame]	2862	pinned = !(type & I915_MAP_OVERRIDE);
				2863	type &= ~I915_MAP_OVERRIDE;
				2864
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2865	if (!atomic_inc_not_zero(&obj->mm.pages_pin_count)) {
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2866	if (unlikely(!i915_gem_object_has_pages(obj))) {
Chris Wilson	88c880b	2017-09-06 14:52:20 +0100	[diff] [blame]	2867	GEM_BUG_ON(i915_gem_object_has_pinned_pages(obj));
				2868
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2869	ret = ____i915_gem_object_get_pages(obj);
				2870	if (ret)
				2871	goto err_unlock;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2872
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	2873	smp_mb__before_atomic();
				2874	}
				2875	atomic_inc(&obj->mm.pages_pin_count);
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2876	pinned = false;
				2877	}
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2878	GEM_BUG_ON(!i915_gem_object_has_pages(obj));
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2879
Chris Wilson	0ce8178	2017-05-17 13:09:59 +0100	[diff] [blame]	2880	ptr = page_unpack_bits(obj->mm.mapping, &has_type);
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2881	if (ptr && has_type != type) {
				2882	if (pinned) {
				2883	ret = -EBUSY;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2884	goto err_unpin;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2885	}
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2886
				2887	if (is_vmalloc_addr(ptr))
				2888	vunmap(ptr);
				2889	else
				2890	kunmap(kmap_to_page(ptr));
				2891
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	2892	ptr = obj->mm.mapping = NULL;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2893	}
				2894
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2895	if (!ptr) {
				2896	ptr = i915_gem_object_map(obj, type);
				2897	if (!ptr) {
				2898	ret = -ENOMEM;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2899	goto err_unpin;
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2900	}
				2901
Chris Wilson	0ce8178	2017-05-17 13:09:59 +0100	[diff] [blame]	2902	obj->mm.mapping = page_pack_bits(ptr, type);
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2903	}
				2904
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2905	out_unlock:
				2906	mutex_unlock(&obj->mm.lock);
Chris Wilson	d31d7cb	2016-08-12 12:39:58 +0100	[diff] [blame]	2907	return ptr;
				2908
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	2909	err_unpin:
				2910	atomic_dec(&obj->mm.pages_pin_count);
				2911	err_unlock:
				2912	ptr = ERR_PTR(ret);
				2913	goto out_unlock;
Chris Wilson	0a798eb	2016-04-08 12:11:11 +0100	[diff] [blame]	2914	}
				2915
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	2916	static int
				2917	i915_gem_object_pwrite_gtt(struct drm_i915_gem_object *obj,
				2918	const struct drm_i915_gem_pwrite *arg)
				2919	{
				2920	struct address_space *mapping = obj->base.filp->f_mapping;
				2921	char __user *user_data = u64_to_user_ptr(arg->data_ptr);
				2922	u64 remain, offset;
				2923	unsigned int pg;
				2924
				2925	/* Before we instantiate/pin the backing store for our use, we
				2926	* can prepopulate the shmemfs filp efficiently using a write into
				2927	* the pagecache. We avoid the penalty of instantiating all the
				2928	* pages, important if the user is just writing to a few and never
				2929	* uses the object on the GPU, and using a direct write into shmemfs
				2930	* allows it to avoid the cost of retrieving a page (either swapin
				2931	* or clearing-before-use) before it is overwritten.
				2932	*/
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	2933	if (i915_gem_object_has_pages(obj))
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	2934	return -ENODEV;
				2935
Chris Wilson	a6d65e4	2017-10-16 21:27:32 +0100	[diff] [blame]	2936	if (obj->mm.madv != I915_MADV_WILLNEED)
				2937	return -EFAULT;
				2938
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	2939	/* Before the pages are instantiated the object is treated as being
				2940	* in the CPU domain. The pages will be clflushed as required before
				2941	* use, and we can freely write into the pages directly. If userspace
				2942	* races pwrite with any other operation; corruption will ensue -
				2943	* that is userspace's prerogative!
				2944	*/
				2945
				2946	remain = arg->size;
				2947	offset = arg->offset;
				2948	pg = offset_in_page(offset);
				2949
				2950	do {
				2951	unsigned int len, unwritten;
				2952	struct page *page;
				2953	void data, vaddr;
				2954	int err;
				2955
				2956	len = PAGE_SIZE - pg;
				2957	if (len > remain)
				2958	len = remain;
				2959
				2960	err = pagecache_write_begin(obj->base.filp, mapping,
				2961	offset, len, 0,
				2962	&page, &data);
				2963	if (err < 0)
				2964	return err;
				2965
				2966	vaddr = kmap(page);
				2967	unwritten = copy_from_user(vaddr + pg, user_data, len);
				2968	kunmap(page);
				2969
				2970	err = pagecache_write_end(obj->base.filp, mapping,
				2971	offset, len, len - unwritten,
				2972	page, data);
				2973	if (err < 0)
				2974	return err;
				2975
				2976	if (unwritten)
				2977	return -EFAULT;
				2978
				2979	remain -= len;
				2980	user_data += len;
				2981	offset += len;
				2982	pg = 0;
				2983	} while (remain);
				2984
				2985	return 0;
				2986	}
				2987
Mika Kuoppala	14921f3	2018-06-15 13:44:29 +0300	[diff] [blame]	2988	static void i915_gem_client_mark_guilty(struct drm_i915_file_private *file_priv,
				2989	const struct i915_gem_context *ctx)
				2990	{
				2991	unsigned int score;
				2992	unsigned long prev_hang;
				2993
				2994	if (i915_gem_context_is_banned(ctx))
				2995	score = I915_CLIENT_SCORE_CONTEXT_BAN;
				2996	else
				2997	score = 0;
				2998
				2999	prev_hang = xchg(&file_priv->hang_timestamp, jiffies);
				3000	if (time_before(jiffies, prev_hang + I915_CLIENT_FAST_HANG_JIFFIES))
				3001	score += I915_CLIENT_SCORE_HANG_FAST;
				3002
				3003	if (score) {
				3004	atomic_add(score, &file_priv->ban_score);
				3005
				3006	DRM_DEBUG_DRIVER("client %s: gained %u ban score, now %u\n",
				3007	ctx->name, score,
				3008	atomic_read(&file_priv->ban_score));
				3009	}
				3010	}
				3011
Mika Kuoppala	e5e1fc4	2016-11-16 17:20:31 +0200	[diff] [blame]	3012	static void i915_gem_context_mark_guilty(struct i915_gem_context *ctx)
Mika Kuoppala	aa60c66	2013-06-12 15:13:20 +0300	[diff] [blame]	3013	{
Mika Kuoppala	14921f3	2018-06-15 13:44:29 +0300	[diff] [blame]	3014	unsigned int score;
				3015	bool banned, bannable;
Mika Kuoppala	b083a08	2016-11-18 15:10:47 +0200	[diff] [blame]	3016
Chris Wilson	77b25a9	2017-07-21 13:32:30 +0100	[diff] [blame]	3017	atomic_inc(&ctx->guilty_count);
				3018
Mika Kuoppala	14921f3	2018-06-15 13:44:29 +0300	[diff] [blame]	3019	bannable = i915_gem_context_is_bannable(ctx);
				3020	score = atomic_add_return(CONTEXT_SCORE_GUILTY, &ctx->ban_score);
				3021	banned = score >= CONTEXT_SCORE_BAN_THRESHOLD;
Chris Wilson	24eae08	2018-02-05 09:22:01 +0000	[diff] [blame]	3022
Mika Kuoppala	14921f3	2018-06-15 13:44:29 +0300	[diff] [blame]	3023	/* Cool contexts don't accumulate client ban score */
				3024	if (!bannable)
Mika Kuoppala	b083a08	2016-11-18 15:10:47 +0200	[diff] [blame]	3025	return;
				3026
Chris Wilson	bcc2661	2018-06-18 08:31:35 +0100	[diff] [blame]	3027	if (banned) {
				3028	DRM_DEBUG_DRIVER("context %s: guilty %d, score %u, banned\n",
				3029	ctx->name, atomic_read(&ctx->guilty_count),
				3030	score);
Mika Kuoppala	14921f3	2018-06-15 13:44:29 +0300	[diff] [blame]	3031	i915_gem_context_set_banned(ctx);
Chris Wilson	bcc2661	2018-06-18 08:31:35 +0100	[diff] [blame]	3032	}
Mika Kuoppala	14921f3	2018-06-15 13:44:29 +0300	[diff] [blame]	3033
				3034	if (!IS_ERR_OR_NULL(ctx->file_priv))
				3035	i915_gem_client_mark_guilty(ctx->file_priv, ctx);
Mika Kuoppala	e5e1fc4	2016-11-16 17:20:31 +0200	[diff] [blame]	3036	}
				3037
				3038	static void i915_gem_context_mark_innocent(struct i915_gem_context *ctx)
				3039	{
Chris Wilson	77b25a9	2017-07-21 13:32:30 +0100	[diff] [blame]	3040	atomic_inc(&ctx->active_count);
Mika Kuoppala	aa60c66	2013-06-12 15:13:20 +0300	[diff] [blame]	3041	}
				3042
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3043	struct i915_request *
Tvrtko Ursulin	0bc40be	2016-03-16 11:00:37 +0000	[diff] [blame]	3044	i915_gem_find_active_request(struct intel_engine_cs *engine)
Chris Wilson	9375e44	2010-09-19 12:21:28 +0100	[diff] [blame]	3045	{
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3046	struct i915_request request, active = NULL;
Chris Wilson	754c9fd	2017-02-23 07:44:14 +0000	[diff] [blame]	3047	unsigned long flags;
Mika Kuoppala	aa60c66	2013-06-12 15:13:20 +0300	[diff] [blame]	3048
Chris Wilson	cc7cc53	2018-05-29 14:29:18 +0100	[diff] [blame]	3049	/*
				3050	* We are called by the error capture, reset and to dump engine
				3051	* state at random points in time. In particular, note that neither is
				3052	* crucially ordered with an interrupt. After a hang, the GPU is dead
				3053	* and we assume that no more writes can happen (we waited long enough
				3054	* for all writes that were in transaction to be flushed) - adding an
Chris Wilson	f69a02c	2016-07-01 17:23:16 +0100	[diff] [blame]	3055	* extra delay for a recent interrupt is pointless. Hence, we do
				3056	* not need an engine->irq_seqno_barrier() before the seqno reads.
Chris Wilson	cc7cc53	2018-05-29 14:29:18 +0100	[diff] [blame]	3057	* At all other times, we must assume the GPU is still running, but
				3058	* we only care about the snapshot of this moment.
Chris Wilson	f69a02c	2016-07-01 17:23:16 +0100	[diff] [blame]	3059	*/
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3060	spin_lock_irqsave(&engine->timeline.lock, flags);
				3061	list_for_each_entry(request, &engine->timeline.requests, link) {
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3062	if (__i915_request_completed(request, request->global_seqno))
Chris Wilson	4db080f	2013-12-04 11:37:09 +0000	[diff] [blame]	3063	continue;
Mika Kuoppala	aa60c66	2013-06-12 15:13:20 +0300	[diff] [blame]	3064
Chris Wilson	754c9fd	2017-02-23 07:44:14 +0000	[diff] [blame]	3065	active = request;
				3066	break;
				3067	}
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3068	spin_unlock_irqrestore(&engine->timeline.lock, flags);
Chris Wilson	754c9fd	2017-02-23 07:44:14 +0000	[diff] [blame]	3069
				3070	return active;
Mika Kuoppala	b6b0fac	2014-01-30 19:04:43 +0200	[diff] [blame]	3071	}
				3072
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3073	/*
				3074	* Ensure irq handler finishes, and not run again.
				3075	* Also return the active request so that we only search for it once.
				3076	*/
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3077	struct i915_request *
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3078	i915_gem_reset_prepare_engine(struct intel_engine_cs *engine)
				3079	{
Chris Wilson	5adfb77	2018-05-16 19:33:51 +0100	[diff] [blame]	3080	struct i915_request *request;
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3081
Chris Wilson	1749d90	2017-10-09 12:02:59 +0100	[diff] [blame]	3082	/*
				3083	* During the reset sequence, we must prevent the engine from
				3084	* entering RC6. As the context state is undefined until we restart
				3085	* the engine, if it does enter RC6 during the reset, the state
				3086	* written to the powercontext is undefined and so we may lose
				3087	* GPU state upon resume, i.e. fail to restart after a reset.
				3088	*/
				3089	intel_uncore_forcewake_get(engine->i915, FORCEWAKE_ALL);
				3090
Chris Wilson	5adfb77	2018-05-16 19:33:51 +0100	[diff] [blame]	3091	request = engine->reset.prepare(engine);
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3092	if (request && request->fence.error == -EIO)
				3093	request = ERR_PTR(-EIO); /* Previous reset failed! */
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3094
				3095	return request;
				3096	}
				3097
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	3098	int i915_gem_reset_prepare(struct drm_i915_private *dev_priv)
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	3099	{
				3100	struct intel_engine_cs *engine;
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3101	struct i915_request *request;
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	3102	enum intel_engine_id id;
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	3103	int err = 0;
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	3104
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	3105	for_each_engine(engine, dev_priv, id) {
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3106	request = i915_gem_reset_prepare_engine(engine);
				3107	if (IS_ERR(request)) {
				3108	err = PTR_ERR(request);
				3109	continue;
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	3110	}
Michel Thierry	c64992e	2017-06-20 10:57:44 +0100	[diff] [blame]	3111
				3112	engine->hangcheck.active_request = request;
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	3113	}
				3114
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	3115	i915_gem_revoke_fences(dev_priv);
Michal Wajdeczko	c37d572	2018-03-12 13:03:07 +0000	[diff] [blame]	3116	intel_uc_sanitize(dev_priv);
Chris Wilson	0e178ae	2017-01-17 17:59:06 +0200	[diff] [blame]	3117
				3118	return err;
Chris Wilson	4c96554	2017-01-17 17:59:01 +0200	[diff] [blame]	3119	}
				3120
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3121	static void engine_skip_context(struct i915_request *request)
Mika Kuoppala	36193ac	2017-01-17 17:59:02 +0200	[diff] [blame]	3122	{
				3123	struct intel_engine_cs *engine = request->engine;
Chris Wilson	4e0d64d	2018-05-17 22:26:30 +0100	[diff] [blame]	3124	struct i915_gem_context *hung_ctx = request->gem_context;
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3125	struct i915_timeline *timeline = request->timeline;
Mika Kuoppala	36193ac	2017-01-17 17:59:02 +0200	[diff] [blame]	3126	unsigned long flags;
				3127
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3128	GEM_BUG_ON(timeline == &engine->timeline);
Mika Kuoppala	36193ac	2017-01-17 17:59:02 +0200	[diff] [blame]	3129
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3130	spin_lock_irqsave(&engine->timeline.lock, flags);
Chris Wilson	890fd18	2018-07-06 22:07:10 +0100	[diff] [blame]	3131	spin_lock(&timeline->lock);
Mika Kuoppala	36193ac	2017-01-17 17:59:02 +0200	[diff] [blame]	3132
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3133	list_for_each_entry_continue(request, &engine->timeline.requests, link)
Chris Wilson	4e0d64d	2018-05-17 22:26:30 +0100	[diff] [blame]	3134	if (request->gem_context == hung_ctx)
Chris Wilson	6dd7526	2018-07-06 11:39:43 +0100	[diff] [blame]	3135	i915_request_skip(request, -EIO);
Mika Kuoppala	36193ac	2017-01-17 17:59:02 +0200	[diff] [blame]	3136
				3137	list_for_each_entry(request, &timeline->requests, link)
Chris Wilson	6dd7526	2018-07-06 11:39:43 +0100	[diff] [blame]	3138	i915_request_skip(request, -EIO);
Mika Kuoppala	36193ac	2017-01-17 17:59:02 +0200	[diff] [blame]	3139
				3140	spin_unlock(&timeline->lock);
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3141	spin_unlock_irqrestore(&engine->timeline.lock, flags);
Mika Kuoppala	36193ac	2017-01-17 17:59:02 +0200	[diff] [blame]	3142	}
				3143
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3144	/* Returns the request if it was guilty of the hang */
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3145	static struct i915_request *
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3146	i915_gem_reset_request(struct intel_engine_cs *engine,
Chris Wilson	bba0869	2018-04-06 23:03:53 +0100	[diff] [blame]	3147	struct i915_request *request,
				3148	bool stalled)
Mika Kuoppala	61da536	2017-01-17 17:59:05 +0200	[diff] [blame]	3149	{
Mika Kuoppala	71895a0	2017-01-17 17:59:07 +0200	[diff] [blame]	3150	/* The guilty request will get skipped on a hung engine.
				3151	*
				3152	* Users of client default contexts do not rely on logical
				3153	* state preserved between batches so it is safe to execute
				3154	* queued requests following the hang. Non default contexts
				3155	* rely on preserved state, so skipping a batch loses the
				3156	* evolution of the state and it needs to be considered corrupted.
				3157	* Executing more queued batches on top of corrupted state is
				3158	* risky. But we take the risk by trying to advance through
				3159	* the queued requests in order to make the client behaviour
				3160	* more predictable around resets, by not throwing away random
				3161	* amount of batches it has prepared for execution. Sophisticated
				3162	* clients can use gem_reset_stats_ioctl and dma fence status
				3163	* (exported via sync_file info ioctl on explicit fences) to observe
				3164	* when it loses the context state and should rebuild accordingly.
				3165	*
				3166	* The context ban, and ultimately the client ban, mechanism are safety
				3167	* valves if client submission ends up resulting in nothing more than
				3168	* subsequent hangs.
				3169	*/
				3170
Chris Wilson	bba0869	2018-04-06 23:03:53 +0100	[diff] [blame]	3171	if (i915_request_completed(request)) {
				3172	GEM_TRACE("%s pardoned global=%d (fence %llx:%d), current %d\n",
				3173	engine->name, request->global_seqno,
				3174	request->fence.context, request->fence.seqno,
				3175	intel_engine_get_seqno(engine));
				3176	stalled = false;
				3177	}
				3178
				3179	if (stalled) {
Chris Wilson	4e0d64d	2018-05-17 22:26:30 +0100	[diff] [blame]	3180	i915_gem_context_mark_guilty(request->gem_context);
Chris Wilson	6dd7526	2018-07-06 11:39:43 +0100	[diff] [blame]	3181	i915_request_skip(request, -EIO);
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3182
				3183	/* If this context is now banned, skip all pending requests. */
Chris Wilson	4e0d64d	2018-05-17 22:26:30 +0100	[diff] [blame]	3184	if (i915_gem_context_is_banned(request->gem_context))
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3185	engine_skip_context(request);
Mika Kuoppala	61da536	2017-01-17 17:59:05 +0200	[diff] [blame]	3186	} else {
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3187	/*
				3188	* Since this is not the hung engine, it may have advanced
				3189	* since the hang declaration. Double check by refinding
				3190	* the active request at the time of the reset.
				3191	*/
				3192	request = i915_gem_find_active_request(engine);
				3193	if (request) {
Chris Wilson	042ed2d	2018-06-15 10:31:36 +0100	[diff] [blame]	3194	unsigned long flags;
				3195
Chris Wilson	4e0d64d	2018-05-17 22:26:30 +0100	[diff] [blame]	3196	i915_gem_context_mark_innocent(request->gem_context);
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3197	dma_fence_set_error(&request->fence, -EAGAIN);
				3198
				3199	/* Rewind the engine to replay the incomplete rq */
Chris Wilson	042ed2d	2018-06-15 10:31:36 +0100	[diff] [blame]	3200	spin_lock_irqsave(&engine->timeline.lock, flags);
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3201	request = list_prev_entry(request, link);
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3202	if (&request->link == &engine->timeline.requests)
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3203	request = NULL;
Chris Wilson	042ed2d	2018-06-15 10:31:36 +0100	[diff] [blame]	3204	spin_unlock_irqrestore(&engine->timeline.lock, flags);
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3205	}
Mika Kuoppala	61da536	2017-01-17 17:59:05 +0200	[diff] [blame]	3206	}
				3207
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3208	return request;
Mika Kuoppala	61da536	2017-01-17 17:59:05 +0200	[diff] [blame]	3209	}
				3210
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3211	void i915_gem_reset_engine(struct intel_engine_cs *engine,
Chris Wilson	bba0869	2018-04-06 23:03:53 +0100	[diff] [blame]	3212	struct i915_request *request,
				3213	bool stalled)
Chris Wilson	4db080f	2013-12-04 11:37:09 +0000	[diff] [blame]	3214	{
Chris Wilson	fcb1de5	2017-12-19 09:01:10 +0000	[diff] [blame]	3215	/*
				3216	* Make sure this write is visible before we re-enable the interrupt
				3217	* handlers on another CPU, as tasklet_enable() resolves to just
				3218	* a compiler barrier which is insufficient for our purpose here.
				3219	*/
				3220	smp_store_mb(engine->irq_posted, 0);
Chris Wilson	ed454f2	2017-07-21 13:32:29 +0100	[diff] [blame]	3221
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3222	if (request)
Chris Wilson	bba0869	2018-04-06 23:03:53 +0100	[diff] [blame]	3223	request = i915_gem_reset_request(engine, request, stalled);
Chris Wilson	d1d1ebf4	2017-07-21 13:32:33 +0100	[diff] [blame]	3224
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3225	/* Setup the CS to resume from the breadcrumb of the hung request */
Chris Wilson	5adfb77	2018-05-16 19:33:51 +0100	[diff] [blame]	3226	engine->reset.reset(engine, request);
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3227	}
				3228
Chris Wilson	d0667e9	2018-04-06 23:03:54 +0100	[diff] [blame]	3229	void i915_gem_reset(struct drm_i915_private *dev_priv,
				3230	unsigned int stalled_mask)
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3231	{
				3232	struct intel_engine_cs *engine;
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	3233	enum intel_engine_id id;
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3234
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	3235	lockdep_assert_held(&dev_priv->drm.struct_mutex);
				3236
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3237	i915_retire_requests(dev_priv);
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3238
Chris Wilson	2ae5573	2017-02-12 17:20:02 +0000	[diff] [blame]	3239	for_each_engine(engine, dev_priv, id) {
Chris Wilson	1fc44d9	2018-05-17 22:26:32 +0100	[diff] [blame]	3240	struct intel_context *ce;
Chris Wilson	2ae5573	2017-02-12 17:20:02 +0000	[diff] [blame]	3241
Chris Wilson	bba0869	2018-04-06 23:03:53 +0100	[diff] [blame]	3242	i915_gem_reset_engine(engine,
				3243	engine->hangcheck.active_request,
Chris Wilson	d0667e9	2018-04-06 23:03:54 +0100	[diff] [blame]	3244	stalled_mask & ENGINE_MASK(id));
Chris Wilson	1fc44d9	2018-05-17 22:26:32 +0100	[diff] [blame]	3245	ce = fetch_and_zero(&engine->last_retired_context);
				3246	if (ce)
				3247	intel_context_unpin(ce);
Chris Wilson	7b6da81	2017-12-16 00:03:34 +0000	[diff] [blame]	3248
				3249	/*
				3250	* Ostensibily, we always want a context loaded for powersaving,
				3251	* so if the engine is idle after the reset, send a request
				3252	* to load our scratch kernel_context.
				3253	*
				3254	* More mysteriously, if we leave the engine idle after a reset,
				3255	* the next userspace batch may hang, with what appears to be
				3256	* an incoherent read by the CS (presumably stale TLB). An
				3257	* empty request appears sufficient to paper over the glitch.
				3258	*/
Chris Wilson	01b8fdc	2018-02-05 15:24:31 +0000	[diff] [blame]	3259	if (intel_engine_is_idle(engine)) {
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3260	struct i915_request *rq;
Chris Wilson	7b6da81	2017-12-16 00:03:34 +0000	[diff] [blame]	3261
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3262	rq = i915_request_alloc(engine,
				3263	dev_priv->kernel_context);
Chris Wilson	7b6da81	2017-12-16 00:03:34 +0000	[diff] [blame]	3264	if (!IS_ERR(rq))
Chris Wilson	697b9a8	2018-06-12 11:51:35 +0100	[diff] [blame]	3265	i915_request_add(rq);
Chris Wilson	7b6da81	2017-12-16 00:03:34 +0000	[diff] [blame]	3266	}
Chris Wilson	2ae5573	2017-02-12 17:20:02 +0000	[diff] [blame]	3267	}
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3268
Tvrtko Ursulin	4362f4f	2016-11-16 08:55:33 +0000	[diff] [blame]	3269	i915_gem_restore_fences(dev_priv);
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3270	}
				3271
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3272	void i915_gem_reset_finish_engine(struct intel_engine_cs *engine)
				3273	{
Chris Wilson	5adfb77	2018-05-16 19:33:51 +0100	[diff] [blame]	3274	engine->reset.finish(engine);
				3275
Chris Wilson	1749d90	2017-10-09 12:02:59 +0100	[diff] [blame]	3276	intel_uncore_forcewake_put(engine->i915, FORCEWAKE_ALL);
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3277	}
				3278
Chris Wilson	d802709	2017-02-08 14:30:32 +0000	[diff] [blame]	3279	void i915_gem_reset_finish(struct drm_i915_private *dev_priv)
				3280	{
Chris Wilson	1f7b847	2017-02-08 14:30:33 +0000	[diff] [blame]	3281	struct intel_engine_cs *engine;
				3282	enum intel_engine_id id;
				3283
Chris Wilson	d802709	2017-02-08 14:30:32 +0000	[diff] [blame]	3284	lockdep_assert_held(&dev_priv->drm.struct_mutex);
Chris Wilson	1f7b847	2017-02-08 14:30:33 +0000	[diff] [blame]	3285
Chris Wilson	fe3288b	2017-02-12 17:20:01 +0000	[diff] [blame]	3286	for_each_engine(engine, dev_priv, id) {
Michel Thierry	c64992e	2017-06-20 10:57:44 +0100	[diff] [blame]	3287	engine->hangcheck.active_request = NULL;
Michel Thierry	a1ef70e	2017-06-20 10:57:47 +0100	[diff] [blame]	3288	i915_gem_reset_finish_engine(engine);
Chris Wilson	fe3288b	2017-02-12 17:20:01 +0000	[diff] [blame]	3289	}
Chris Wilson	d802709	2017-02-08 14:30:32 +0000	[diff] [blame]	3290	}
				3291
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3292	static void nop_submit_request(struct i915_request *request)
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3293	{
Chris Wilson	d9b13c4	2018-03-15 13:14:50 +0000	[diff] [blame]	3294	GEM_TRACE("%s fence %llx:%d -> -EIO\n",
				3295	request->engine->name,
				3296	request->fence.context, request->fence.seqno);
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3297	dma_fence_set_error(&request->fence, -EIO);
				3298
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3299	i915_request_submit(request);
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3300	}
				3301
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3302	static void nop_complete_submit_request(struct i915_request *request)
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3303	{
Chris Wilson	8d55082	2017-10-06 12:56:17 +0100	[diff] [blame]	3304	unsigned long flags;
				3305
Chris Wilson	d9b13c4	2018-03-15 13:14:50 +0000	[diff] [blame]	3306	GEM_TRACE("%s fence %llx:%d -> -EIO\n",
				3307	request->engine->name,
				3308	request->fence.context, request->fence.seqno);
Chris Wilson	3cd9442	2017-01-10 17:22:45 +0000	[diff] [blame]	3309	dma_fence_set_error(&request->fence, -EIO);
Chris Wilson	8d55082	2017-10-06 12:56:17 +0100	[diff] [blame]	3310
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3311	spin_lock_irqsave(&request->engine->timeline.lock, flags);
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3312	__i915_request_submit(request);
Chris Wilson	3dcf93f7	2016-11-22 14:41:20 +0000	[diff] [blame]	3313	intel_engine_init_global_seqno(request->engine, request->global_seqno);
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3314	spin_unlock_irqrestore(&request->engine->timeline.lock, flags);
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3315	}
				3316
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3317	void i915_gem_set_wedged(struct drm_i915_private *i915)
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	3318	{
Tvrtko Ursulin	e2f8039	2016-03-16 11:00:36 +0000	[diff] [blame]	3319	struct intel_engine_cs *engine;
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	3320	enum intel_engine_id id;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3321
Chris Wilson	d9b13c4	2018-03-15 13:14:50 +0000	[diff] [blame]	3322	GEM_TRACE("start\n");
				3323
Chris Wilson	7f961d7	2018-04-26 11:32:19 +0100	[diff] [blame]	3324	if (GEM_SHOW_DEBUG()) {
Chris Wilson	559e040	2018-02-05 09:21:59 +0000	[diff] [blame]	3325	struct drm_printer p = drm_debug_printer(__func__);
				3326
				3327	for_each_engine(engine, i915, id)
				3328	intel_engine_dump(engine, &p, "%s\n", engine->name);
				3329	}
				3330
Chris Wilson	3970c65	2018-07-23 15:53:35 +0100	[diff] [blame]	3331	if (test_and_set_bit(I915_WEDGED, &i915->gpu_error.flags))
				3332	goto out;
Chris Wilson	0d73e7a	2018-02-07 15:13:50 +0000	[diff] [blame]	3333
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3334	/*
				3335	* First, stop submission to hw, but do not yet complete requests by
				3336	* rolling the global seqno forward (since this would complete requests
				3337	* for which we haven't set the fence error to EIO yet).
				3338	*/
Chris Wilson	963ddd6	2018-03-02 11:33:24 +0000	[diff] [blame]	3339	for_each_engine(engine, i915, id) {
				3340	i915_gem_reset_prepare_engine(engine);
Chris Wilson	47650db	2018-03-07 13:42:25 +0000	[diff] [blame]	3341
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3342	engine->submit_request = nop_submit_request;
Chris Wilson	47650db	2018-03-07 13:42:25 +0000	[diff] [blame]	3343	engine->schedule = NULL;
Chris Wilson	963ddd6	2018-03-02 11:33:24 +0000	[diff] [blame]	3344	}
Chris Wilson	47650db	2018-03-07 13:42:25 +0000	[diff] [blame]	3345	i915->caps.scheduler = 0;
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3346
Chris Wilson	ac697ae	2018-03-15 15:10:15 +0000	[diff] [blame]	3347	/* Even if the GPU reset fails, it should still stop the engines */
Chris Wilson	ec5b65a	2018-07-26 09:50:33 +0100	[diff] [blame]	3348	if (INTEL_GEN(i915) >= 5)
				3349	intel_gpu_reset(i915, ALL_ENGINES);
Chris Wilson	ac697ae	2018-03-15 15:10:15 +0000	[diff] [blame]	3350
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3351	/*
				3352	* Make sure no one is running the old callback before we proceed with
				3353	* cancelling requests and resetting the completion tracking. Otherwise
				3354	* we might submit a request to the hardware which never completes.
				3355	*/
				3356	synchronize_rcu();
				3357
				3358	for_each_engine(engine, i915, id) {
				3359	/* Mark all executing requests as skipped */
				3360	engine->cancel_requests(engine);
				3361
				3362	/*
				3363	* Only once we've force-cancelled all in-flight requests can we
				3364	* start to complete all requests.
				3365	*/
				3366	engine->submit_request = nop_complete_submit_request;
				3367	}
				3368
				3369	/*
				3370	* Make sure no request can slip through without getting completed by
				3371	* either this call here to intel_engine_init_global_seqno, or the one
				3372	* in nop_complete_submit_request.
				3373	*/
				3374	synchronize_rcu();
				3375
				3376	for_each_engine(engine, i915, id) {
				3377	unsigned long flags;
				3378
Chris Wilson	0d73e7a	2018-02-07 15:13:50 +0000	[diff] [blame]	3379	/*
				3380	* Mark all pending requests as complete so that any concurrent
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3381	* (lockless) lookup doesn't try and wait upon the request as we
				3382	* reset it.
				3383	*/
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3384	spin_lock_irqsave(&engine->timeline.lock, flags);
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3385	intel_engine_init_global_seqno(engine,
				3386	intel_engine_last_submit(engine));
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3387	spin_unlock_irqrestore(&engine->timeline.lock, flags);
Chris Wilson	963ddd6	2018-03-02 11:33:24 +0000	[diff] [blame]	3388
				3389	i915_gem_reset_finish_engine(engine);
Daniel Vetter	af7a8ff	2017-10-11 11:10:19 +0200	[diff] [blame]	3390	}
Chris Wilson	20e4933	2016-11-22 14:41:21 +0000	[diff] [blame]	3391
Chris Wilson	3970c65	2018-07-23 15:53:35 +0100	[diff] [blame]	3392	out:
Chris Wilson	d9b13c4	2018-03-15 13:14:50 +0000	[diff] [blame]	3393	GEM_TRACE("end\n");
				3394
Chris Wilson	3d7adbb	2017-07-21 13:32:27 +0100	[diff] [blame]	3395	wake_up_all(&i915->gpu_error.reset_queue);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3396	}
				3397
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3398	bool i915_gem_unset_wedged(struct drm_i915_private *i915)
				3399	{
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3400	struct i915_timeline *tl;
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3401
				3402	lockdep_assert_held(&i915->drm.struct_mutex);
				3403	if (!test_bit(I915_WEDGED, &i915->gpu_error.flags))
				3404	return true;
				3405
Chris Wilson	d9b13c4	2018-03-15 13:14:50 +0000	[diff] [blame]	3406	GEM_TRACE("start\n");
				3407
Chris Wilson	2d4ecac	2018-03-07 13:42:21 +0000	[diff] [blame]	3408	/*
				3409	* Before unwedging, make sure that all pending operations
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3410	* are flushed and errored out - we may have requests waiting upon
				3411	* third party fences. We marked all inflight requests as EIO, and
				3412	* every execbuf since returned EIO, for consistency we want all
				3413	* the currently pending requests to also be marked as EIO, which
				3414	* is done inside our nop_submit_request - and so we must wait.
				3415	*
				3416	* No more can be submitted until we reset the wedged bit.
				3417	*/
				3418	list_for_each_entry(tl, &i915->gt.timelines, link) {
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3419	struct i915_request *rq;
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3420
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3421	rq = i915_gem_active_peek(&tl->last_request,
				3422	&i915->drm.struct_mutex);
				3423	if (!rq)
				3424	continue;
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3425
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3426	/*
				3427	* We can't use our normal waiter as we want to
				3428	* avoid recursively trying to handle the current
				3429	* reset. The basic dma_fence_default_wait() installs
				3430	* a callback for dma_fence_signal(), which is
				3431	* triggered by our nop handler (indirectly, the
				3432	* callback enables the signaler thread which is
				3433	* woken by the nop_submit_request() advancing the seqno
				3434	* and when the seqno passes the fence, the signaler
				3435	* then signals the fence waking us up).
				3436	*/
				3437	if (dma_fence_default_wait(&rq->fence, true,
				3438	MAX_SCHEDULE_TIMEOUT) < 0)
				3439	return false;
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3440	}
Chris Wilson	2d4ecac	2018-03-07 13:42:21 +0000	[diff] [blame]	3441	i915_retire_requests(i915);
				3442	GEM_BUG_ON(i915->gt.active_requests);
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3443
Chris Wilson	8db601f	2018-09-14 09:00:17 +0100	[diff] [blame]	3444	if (!intel_gpu_reset(i915, ALL_ENGINES))
				3445	intel_engines_sanitize(i915);
				3446
Chris Wilson	2d4ecac	2018-03-07 13:42:21 +0000	[diff] [blame]	3447	/*
				3448	* Undo nop_submit_request. We prevent all new i915 requests from
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3449	* being queued (by disallowing execbuf whilst wedged) so having
				3450	* waited for all active requests above, we know the system is idle
				3451	* and do not have to worry about a thread being inside
				3452	* engine->submit_request() as we swap over. So unlike installing
				3453	* the nop_submit_request on reset, we can do this from normal
				3454	* context and do not require stop_machine().
				3455	*/
				3456	intel_engines_reset_default_submission(i915);
Chris Wilson	36703e7	2017-06-22 11:56:25 +0100	[diff] [blame]	3457	i915_gem_contexts_lost(i915);
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3458
Chris Wilson	d9b13c4	2018-03-15 13:14:50 +0000	[diff] [blame]	3459	GEM_TRACE("end\n");
				3460
Chris Wilson	2e8f9d3	2017-03-16 17:13:04 +0000	[diff] [blame]	3461	smp_mb__before_atomic(); /* complete takeover before enabling execbuf */
				3462	clear_bit(I915_WEDGED, &i915->gpu_error.flags);
				3463
				3464	return true;
				3465	}
				3466
Daniel Vetter	75ef9da	2010-08-21 00:25:16 +0200	[diff] [blame]	3467	static void
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3468	i915_gem_retire_work_handler(struct work_struct *work)
				3469	{
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3470	struct drm_i915_private *dev_priv =
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3471	container_of(work, typeof(*dev_priv), gt.retire_work.work);
Chris Wilson	91c8a32	2016-07-05 10:40:23 +0100	[diff] [blame]	3472	struct drm_device *dev = &dev_priv->drm;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3473
Chris Wilson	891b48c	2010-09-29 12:26:37 +0100	[diff] [blame]	3474	/* Come back later if the device is busy... */
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3475	if (mutex_trylock(&dev->struct_mutex)) {
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3476	i915_retire_requests(dev_priv);
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3477	mutex_unlock(&dev->struct_mutex);
				3478	}
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3479
Chris Wilson	8892304	2018-01-29 14:41:04 +0000	[diff] [blame]	3480	/*
				3481	* Keep the retire handler running until we are finally idle.
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3482	* We do not need to do this test under locking as in the worst-case
				3483	* we queue the retire worker once too often.
				3484	*/
Chris Wilson	8892304	2018-01-29 14:41:04 +0000	[diff] [blame]	3485	if (READ_ONCE(dev_priv->gt.awake))
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3486	queue_delayed_work(dev_priv->wq,
				3487	&dev_priv->gt.retire_work,
Chris Wilson	bcb4508	2012-10-05 17:02:57 +0100	[diff] [blame]	3488	round_jiffies_up_relative(HZ));
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3489	}
Chris Wilson	891b48c	2010-09-29 12:26:37 +0100	[diff] [blame]	3490
Chris Wilson	84a1074	2018-01-24 11:36:08 +0000	[diff] [blame]	3491	static void shrink_caches(struct drm_i915_private *i915)
				3492	{
				3493	/*
				3494	* kmem_cache_shrink() discards empty slabs and reorders partially
				3495	* filled slabs to prioritise allocating from the mostly full slabs,
				3496	* with the aim of reducing fragmentation.
				3497	*/
				3498	kmem_cache_shrink(i915->priorities);
				3499	kmem_cache_shrink(i915->dependencies);
				3500	kmem_cache_shrink(i915->requests);
				3501	kmem_cache_shrink(i915->luts);
				3502	kmem_cache_shrink(i915->vmas);
				3503	kmem_cache_shrink(i915->objects);
				3504	}
				3505
				3506	struct sleep_rcu_work {
				3507	union {
				3508	struct rcu_head rcu;
				3509	struct work_struct work;
				3510	};
				3511	struct drm_i915_private *i915;
				3512	unsigned int epoch;
				3513	};
				3514
				3515	static inline bool
				3516	same_epoch(struct drm_i915_private *i915, unsigned int epoch)
				3517	{
				3518	/*
				3519	* There is a small chance that the epoch wrapped since we started
				3520	* sleeping. If we assume that epoch is at least a u32, then it will
				3521	* take at least 2^32 * 100ms for it to wrap, or about 326 years.
				3522	*/
				3523	return epoch == READ_ONCE(i915->gt.epoch);
				3524	}
				3525
				3526	static void __sleep_work(struct work_struct *work)
				3527	{
				3528	struct sleep_rcu_work s = container_of(work, typeof(s), work);
				3529	struct drm_i915_private *i915 = s->i915;
				3530	unsigned int epoch = s->epoch;
				3531
				3532	kfree(s);
				3533	if (same_epoch(i915, epoch))
				3534	shrink_caches(i915);
				3535	}
				3536
				3537	static void __sleep_rcu(struct rcu_head *rcu)
				3538	{
				3539	struct sleep_rcu_work s = container_of(rcu, typeof(s), rcu);
				3540	struct drm_i915_private *i915 = s->i915;
				3541
				3542	if (same_epoch(i915, s->epoch)) {
				3543	INIT_WORK(&s->work, __sleep_work);
				3544	queue_work(i915->wq, &s->work);
				3545	} else {
				3546	kfree(s);
				3547	}
				3548	}
				3549
Chris Wilson	5427f20	2017-10-23 22:32:34 +0100	[diff] [blame]	3550	static inline bool
				3551	new_requests_since_last_retire(const struct drm_i915_private *i915)
				3552	{
				3553	return (READ_ONCE(i915->gt.active_requests) \|\|
				3554	work_pending(&i915->gt.idle_work.work));
				3555	}
				3556
Chris Wilson	1934f5de	2018-05-31 23:40:57 +0100	[diff] [blame]	3557	static void assert_kernel_context_is_current(struct drm_i915_private *i915)
				3558	{
				3559	struct intel_engine_cs *engine;
				3560	enum intel_engine_id id;
				3561
				3562	if (i915_terminally_wedged(&i915->gpu_error))
				3563	return;
				3564
				3565	GEM_BUG_ON(i915->gt.active_requests);
				3566	for_each_engine(engine, i915, id) {
				3567	GEM_BUG_ON(__i915_gem_active_peek(&engine->timeline.last_request));
				3568	GEM_BUG_ON(engine->last_retired_context !=
				3569	to_intel_context(i915->kernel_context, engine));
				3570	}
				3571	}
				3572
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	3573	static void
				3574	i915_gem_idle_work_handler(struct work_struct *work)
				3575	{
				3576	struct drm_i915_private *dev_priv =
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3577	container_of(work, typeof(*dev_priv), gt.idle_work.work);
Chris Wilson	84a1074	2018-01-24 11:36:08 +0000	[diff] [blame]	3578	unsigned int epoch = I915_EPOCH_INVALID;
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3579	bool rearm_hangcheck;
				3580
				3581	if (!READ_ONCE(dev_priv->gt.awake))
				3582	return;
				3583
Chris Wilson	4dfacb0	2018-05-31 09:22:43 +0100	[diff] [blame]	3584	if (READ_ONCE(dev_priv->gt.active_requests))
				3585	return;
				3586
				3587	/*
				3588	* Flush out the last user context, leaving only the pinned
				3589	* kernel context resident. When we are idling on the kernel_context,
				3590	* no more new requests (with a context switch) are emitted and we
				3591	* can finally rest. A consequence is that the idle work handler is
				3592	* always called at least twice before idling (and if the system is
				3593	* idle that implies a round trip through the retire worker).
				3594	*/
				3595	mutex_lock(&dev_priv->drm.struct_mutex);
				3596	i915_gem_switch_to_kernel_context(dev_priv);
				3597	mutex_unlock(&dev_priv->drm.struct_mutex);
				3598
				3599	GEM_TRACE("active_requests=%d (after switch-to-kernel-context)\n",
				3600	READ_ONCE(dev_priv->gt.active_requests));
				3601
Imre Deak	0cb5670	2016-11-07 11:20:04 +0200	[diff] [blame]	3602	/*
				3603	* Wait for last execlists context complete, but bail out in case a
Chris Wilson	ffed7bd	2018-03-01 10:33:38 +0000	[diff] [blame]	3604	* new request is submitted. As we don't trust the hardware, we
				3605	* continue on if the wait times out. This is necessary to allow
				3606	* the machine to suspend even if the hardware dies, and we will
				3607	* try to recover in resume (after depriving the hardware of power,
				3608	* it may be in a better mmod).
Imre Deak	0cb5670	2016-11-07 11:20:04 +0200	[diff] [blame]	3609	*/
Chris Wilson	ffed7bd	2018-03-01 10:33:38 +0000	[diff] [blame]	3610	__wait_for(if (new_requests_since_last_retire(dev_priv)) return,
				3611	intel_engines_are_idle(dev_priv),
				3612	I915_IDLE_ENGINES_TIMEOUT * 1000,
				3613	10, 500);
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3614
				3615	rearm_hangcheck =
				3616	cancel_delayed_work_sync(&dev_priv->gpu_error.hangcheck_work);
				3617
Chris Wilson	5427f20	2017-10-23 22:32:34 +0100	[diff] [blame]	3618	if (!mutex_trylock(&dev_priv->drm.struct_mutex)) {
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3619	/* Currently busy, come back later */
				3620	mod_delayed_work(dev_priv->wq,
				3621	&dev_priv->gt.idle_work,
				3622	msecs_to_jiffies(50));
				3623	goto out_rearm;
				3624	}
				3625
Imre Deak	93c97dc	2016-11-07 11:20:03 +0200	[diff] [blame]	3626	/*
				3627	* New request retired after this work handler started, extend active
				3628	* period until next instance of the work.
				3629	*/
Chris Wilson	5427f20	2017-10-23 22:32:34 +0100	[diff] [blame]	3630	if (new_requests_since_last_retire(dev_priv))
Imre Deak	93c97dc	2016-11-07 11:20:03 +0200	[diff] [blame]	3631	goto out_unlock;
				3632
Chris Wilson	e4d2006	2018-04-06 16:51:44 +0100	[diff] [blame]	3633	epoch = __i915_gem_park(dev_priv);
Chris Wilson	ff320d6	2017-10-23 22:32:35 +0100	[diff] [blame]	3634
Chris Wilson	1934f5de	2018-05-31 23:40:57 +0100	[diff] [blame]	3635	assert_kernel_context_is_current(dev_priv);
				3636
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3637	rearm_hangcheck = false;
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3638	out_unlock:
Chris Wilson	5427f20	2017-10-23 22:32:34 +0100	[diff] [blame]	3639	mutex_unlock(&dev_priv->drm.struct_mutex);
Chris Wilson	35c9418	2015-04-07 16:20:37 +0100	[diff] [blame]	3640
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	3641	out_rearm:
				3642	if (rearm_hangcheck) {
				3643	GEM_BUG_ON(!dev_priv->gt.awake);
				3644	i915_queue_hangcheck(dev_priv);
Chris Wilson	35c9418	2015-04-07 16:20:37 +0100	[diff] [blame]	3645	}
Chris Wilson	84a1074	2018-01-24 11:36:08 +0000	[diff] [blame]	3646
				3647	/*
				3648	* When we are idle, it is an opportune time to reap our caches.
				3649	* However, we have many objects that utilise RCU and the ordered
				3650	* i915->wq that this work is executing on. To try and flush any
				3651	* pending frees now we are idle, we first wait for an RCU grace
				3652	* period, and then queue a task (that will run last on the wq) to
				3653	* shrink and re-optimize the caches.
				3654	*/
				3655	if (same_epoch(dev_priv, epoch)) {
				3656	struct sleep_rcu_work s = kmalloc(sizeof(s), GFP_KERNEL);
				3657	if (s) {
				3658	s->i915 = dev_priv;
				3659	s->epoch = epoch;
				3660	call_rcu(&s->rcu, __sleep_rcu);
				3661	}
				3662	}
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	3663	}
				3664
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3665	void i915_gem_close_object(struct drm_gem_object gem, struct drm_file file)
				3666	{
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3667	struct drm_i915_private *i915 = to_i915(gem->dev);
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3668	struct drm_i915_gem_object *obj = to_intel_bo(gem);
				3669	struct drm_i915_file_private *fpriv = file->driver_priv;
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3670	struct i915_lut_handle lut, ln;
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3671
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3672	mutex_lock(&i915->drm.struct_mutex);
				3673
				3674	list_for_each_entry_safe(lut, ln, &obj->lut_list, obj_link) {
				3675	struct i915_gem_context *ctx = lut->ctx;
				3676	struct i915_vma *vma;
				3677
Chris Wilson	432295d	2017-08-22 12:05:15 +0100	[diff] [blame]	3678	GEM_BUG_ON(ctx->file_priv == ERR_PTR(-EBADF));
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3679	if (ctx->file_priv != fpriv)
				3680	continue;
				3681
				3682	vma = radix_tree_delete(&ctx->handles_vma, lut->handle);
Chris Wilson	3ffff01	2017-08-22 12:05:17 +0100	[diff] [blame]	3683	GEM_BUG_ON(vma->obj != obj);
				3684
				3685	/* We allow the process to have multiple handles to the same
				3686	* vma, in the same fd namespace, by virtue of flink/open.
				3687	*/
				3688	GEM_BUG_ON(!vma->open_count);
				3689	if (!--vma->open_count && !i915_vma_is_ggtt(vma))
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3690	i915_vma_close(vma);
Chris Wilson	f8a7fde	2016-10-28 13:58:29 +0100	[diff] [blame]	3691
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3692	list_del(&lut->obj_link);
				3693	list_del(&lut->ctx_link);
Chris Wilson	4ff4b44	2017-06-16 15:05:16 +0100	[diff] [blame]	3694
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3695	kmem_cache_free(i915->luts, lut);
				3696	__i915_gem_object_release_unless_active(obj);
Chris Wilson	f8a7fde	2016-10-28 13:58:29 +0100	[diff] [blame]	3697	}
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	3698
				3699	mutex_unlock(&i915->drm.struct_mutex);
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	3700	}
				3701
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3702	static unsigned long to_wait_timeout(s64 timeout_ns)
				3703	{
				3704	if (timeout_ns < 0)
				3705	return MAX_SCHEDULE_TIMEOUT;
				3706
				3707	if (timeout_ns == 0)
				3708	return 0;
				3709
				3710	return nsecs_to_jiffies_timeout(timeout_ns);
				3711	}
				3712
Ben Widawsky	5816d64	2012-04-11 11:18:19 -0700	[diff] [blame]	3713	/**
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3714	* i915_gem_wait_ioctl - implements DRM_IOCTL_I915_GEM_WAIT
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	3715	* @dev: drm device pointer
				3716	* @data: ioctl data blob
				3717	* @file: drm file pointer
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3718	*
				3719	* Returns 0 if successful, else an error is returned with the remaining time in
				3720	* the timeout parameter.
				3721	* -ETIME: object is still busy after timeout
				3722	* -ERESTARTSYS: signal interrupted the wait
				3723	* -ENONENT: object doesn't exist
				3724	* Also possible, but rare:
Chris Wilson	b805014	2017-08-11 11:57:31 +0100	[diff] [blame]	3725	* -EAGAIN: incomplete, restart syscall
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3726	* -ENOMEM: damn
				3727	* -ENODEV: Internal IRQ fail
				3728	* -E?: The add request failed
				3729	*
				3730	* The wait ioctl with a timeout of 0 reimplements the busy ioctl. With any
				3731	* non-zero timeout parameter the wait ioctl will wait for the given number of
				3732	* nanoseconds on an object becoming unbusy. Since the wait itself does so
				3733	* without holding struct_mutex the object may become re-busied before this
				3734	* function completes. A similar but shorter * race condition exists in the busy
				3735	* ioctl
				3736	*/
				3737	int
				3738	i915_gem_wait_ioctl(struct drm_device dev, void data, struct drm_file *file)
				3739	{
				3740	struct drm_i915_gem_wait *args = data;
				3741	struct drm_i915_gem_object *obj;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3742	ktime_t start;
				3743	long ret;
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3744
Daniel Vetter	11b5d51	2014-09-29 15:31:26 +0200	[diff] [blame]	3745	if (args->flags != 0)
				3746	return -EINVAL;
				3747
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	3748	obj = i915_gem_object_lookup(file, args->bo_handle);
Chris Wilson	033d549	2016-08-05 10:14:17 +0100	[diff] [blame]	3749	if (!obj)
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3750	return -ENOENT;
Chris Wilson	033d549	2016-08-05 10:14:17 +0100	[diff] [blame]	3751
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3752	start = ktime_get();
				3753
				3754	ret = i915_gem_object_wait(obj,
Chris Wilson	e9eaf82	2018-10-01 15:47:55 +0100	[diff] [blame^]	3755	I915_WAIT_INTERRUPTIBLE \|
				3756	I915_WAIT_PRIORITY \|
				3757	I915_WAIT_ALL,
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3758	to_wait_timeout(args->timeout_ns),
				3759	to_rps_client(file));
				3760
				3761	if (args->timeout_ns > 0) {
				3762	args->timeout_ns -= ktime_to_ns(ktime_sub(ktime_get(), start));
				3763	if (args->timeout_ns < 0)
				3764	args->timeout_ns = 0;
Chris Wilson	c1d2061	2017-02-16 12:54:41 +0000	[diff] [blame]	3765
				3766	/*
				3767	* Apparently ktime isn't accurate enough and occasionally has a
				3768	* bit of mismatch in the jiffies<->nsecs<->ktime loop. So patch
				3769	* things up to make the test happy. We allow up to 1 jiffy.
				3770	*
				3771	* This is a regression from the timespec->ktime conversion.
				3772	*/
				3773	if (ret == -ETIME && !nsecs_to_jiffies(args->timeout_ns))
				3774	args->timeout_ns = 0;
Chris Wilson	b805014	2017-08-11 11:57:31 +0100	[diff] [blame]	3775
				3776	/* Asked to wait beyond the jiffie/scheduler precision? */
				3777	if (ret == -ETIME && args->timeout_ns)
				3778	ret = -EAGAIN;
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3779	}
				3780
Chris Wilson	f0cd518	2016-10-28 13:58:43 +0100	[diff] [blame]	3781	i915_gem_object_put(obj);
John Harrison	ff86588	2014-11-24 18:49:28 +0000	[diff] [blame]	3782	return ret;
Ben Widawsky	23ba4fd	2012-05-24 15:03:10 -0700	[diff] [blame]	3783	}
				3784
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	3785	static long wait_for_timeline(struct i915_timeline *tl,
				3786	unsigned int flags, long timeout)
Daniel Vetter	4df2faf	2010-02-19 11:52:00 +0100	[diff] [blame]	3787	{
Chris Wilson	0606035	2018-05-31 09:22:44 +0100	[diff] [blame]	3788	struct i915_request *rq;
Chris Wilson	0606035	2018-05-31 09:22:44 +0100	[diff] [blame]	3789
				3790	rq = i915_gem_active_get_unlocked(&tl->last_request);
				3791	if (!rq)
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	3792	return timeout;
Chris Wilson	0606035	2018-05-31 09:22:44 +0100	[diff] [blame]	3793
				3794	/*
				3795	* "Race-to-idle".
				3796	*
				3797	* Switching to the kernel context is often used a synchronous
				3798	* step prior to idling, e.g. in suspend for flushing all
				3799	* current operations to memory before sleeping. These we
				3800	* want to complete as quickly as possible to avoid prolonged
				3801	* stalls, so allow the gpu to boost to maximum clocks.
				3802	*/
				3803	if (flags & I915_WAIT_FOR_IDLE_BOOST)
				3804	gen6_rps_boost(rq, NULL);
				3805
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	3806	timeout = i915_request_wait(rq, flags, timeout);
Chris Wilson	0606035	2018-05-31 09:22:44 +0100	[diff] [blame]	3807	i915_request_put(rq);
				3808
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	3809	return timeout;
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	3810	}
				3811
Chris Wilson	25112b6	2017-03-30 15:50:39 +0100	[diff] [blame]	3812	static int wait_for_engines(struct drm_i915_private *i915)
				3813	{
Chris Wilson	ee42c00	2017-12-11 19:41:34 +0000	[diff] [blame]	3814	if (wait_for(intel_engines_are_idle(i915), I915_IDLE_ENGINES_TIMEOUT)) {
Chris Wilson	59e4b19	2017-12-11 19:41:35 +0000	[diff] [blame]	3815	dev_err(i915->drm.dev,
				3816	"Failed to idle engines, declaring wedged!\n");
Chris Wilson	629820f	2018-03-09 10:11:14 +0000	[diff] [blame]	3817	GEM_TRACE_DUMP();
Chris Wilson	cad9946	2017-08-26 12:09:33 +0100	[diff] [blame]	3818	i915_gem_set_wedged(i915);
				3819	return -EIO;
Chris Wilson	25112b6	2017-03-30 15:50:39 +0100	[diff] [blame]	3820	}
				3821
				3822	return 0;
				3823	}
				3824
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	3825	int i915_gem_wait_for_idle(struct drm_i915_private *i915,
				3826	unsigned int flags, long timeout)
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	3827	{
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	3828	GEM_TRACE("flags=%x (%s), timeout=%ld%s\n",
				3829	flags, flags & I915_WAIT_LOCKED ? "locked" : "unlocked",
				3830	timeout, timeout == MAX_SCHEDULE_TIMEOUT ? " (forever)" : "");
Chris Wilson	09a4c02	2018-05-24 09:11:35 +0100	[diff] [blame]	3831
Chris Wilson	863e9fd	2017-05-30 13:13:32 +0100	[diff] [blame]	3832	/* If the device is asleep, we have no requests outstanding */
				3833	if (!READ_ONCE(i915->gt.awake))
				3834	return 0;
				3835
Chris Wilson	9caa34a	2016-11-11 14:58:08 +0000	[diff] [blame]	3836	if (flags & I915_WAIT_LOCKED) {
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3837	struct i915_timeline *tl;
				3838	int err;
Chris Wilson	9caa34a	2016-11-11 14:58:08 +0000	[diff] [blame]	3839
				3840	lockdep_assert_held(&i915->drm.struct_mutex);
				3841
				3842	list_for_each_entry(tl, &i915->gt.timelines, link) {
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	3843	timeout = wait_for_timeline(tl, flags, timeout);
				3844	if (timeout < 0)
				3845	return timeout;
Chris Wilson	9caa34a	2016-11-11 14:58:08 +0000	[diff] [blame]	3846	}
Chris Wilson	c1e63f6	2018-08-08 11:50:59 +0100	[diff] [blame]	3847	if (GEM_SHOW_DEBUG() && !timeout) {
				3848	/* Presume that timeout was non-zero to begin with! */
				3849	dev_warn(&i915->drm.pdev->dev,
				3850	"Missed idle-completion interrupt!\n");
				3851	GEM_TRACE_DUMP();
				3852	}
Chris Wilson	a61b47f	2018-06-27 12:53:34 +0100	[diff] [blame]	3853
				3854	err = wait_for_engines(i915);
				3855	if (err)
				3856	return err;
				3857
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	3858	i915_retire_requests(i915);
Chris Wilson	09a4c02	2018-05-24 09:11:35 +0100	[diff] [blame]	3859	GEM_BUG_ON(i915->gt.active_requests);
Chris Wilson	9caa34a	2016-11-11 14:58:08 +0000	[diff] [blame]	3860	} else {
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3861	struct intel_engine_cs *engine;
				3862	enum intel_engine_id id;
Zou Nan hai	d1b851f	2010-05-21 09:08:57 +0800	[diff] [blame]	3863
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3864	for_each_engine(engine, i915, id) {
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	3865	struct i915_timeline *tl = &engine->timeline;
				3866
				3867	timeout = wait_for_timeline(tl, flags, timeout);
				3868	if (timeout < 0)
				3869	return timeout;
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3870	}
Chris Wilson	a89d1f9	2018-05-02 17:38:39 +0100	[diff] [blame]	3871	}
Chris Wilson	a61b47f	2018-06-27 12:53:34 +0100	[diff] [blame]	3872
				3873	return 0;
Daniel Vetter	4df2faf	2010-02-19 11:52:00 +0100	[diff] [blame]	3874	}
				3875
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	3876	static void __i915_gem_object_flush_for_display(struct drm_i915_gem_object *obj)
				3877	{
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	3878	/*
				3879	* We manually flush the CPU domain so that we can override and
				3880	* force the flush for the display, and perform it asyncrhonously.
				3881	*/
				3882	flush_write_domain(obj, ~I915_GEM_DOMAIN_CPU);
				3883	if (obj->cache_dirty)
				3884	i915_gem_clflush_object(obj, I915_CLFLUSH_FORCE);
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3885	obj->write_domain = 0;
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	3886	}
				3887
				3888	void i915_gem_object_flush_if_display(struct drm_i915_gem_object *obj)
				3889	{
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	3890	if (!READ_ONCE(obj->pin_global))
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	3891	return;
				3892
				3893	mutex_lock(&obj->base.dev->struct_mutex);
				3894	__i915_gem_object_flush_for_display(obj);
				3895	mutex_unlock(&obj->base.dev->struct_mutex);
				3896	}
				3897
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3898	/**
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3899	* Moves a single object to the WC read, and possibly write domain.
				3900	* @obj: object to act on
				3901	* @write: ask for write access or read only
				3902	*
				3903	* This function returns when the move is complete, including waiting on
				3904	* flushes to occur.
				3905	*/
				3906	int
				3907	i915_gem_object_set_to_wc_domain(struct drm_i915_gem_object *obj, bool write)
				3908	{
				3909	int ret;
				3910
				3911	lockdep_assert_held(&obj->base.dev->struct_mutex);
				3912
				3913	ret = i915_gem_object_wait(obj,
				3914	I915_WAIT_INTERRUPTIBLE \|
				3915	I915_WAIT_LOCKED \|
				3916	(write ? I915_WAIT_ALL : 0),
				3917	MAX_SCHEDULE_TIMEOUT,
				3918	NULL);
				3919	if (ret)
				3920	return ret;
				3921
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3922	if (obj->write_domain == I915_GEM_DOMAIN_WC)
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3923	return 0;
				3924
				3925	/* Flush and acquire obj->pages so that we are coherent through
				3926	* direct access in memory with previous cached writes through
				3927	* shmemfs and that our cache domain tracking remains valid.
				3928	* For example, if the obj->filp was moved to swap without us
				3929	* being notified and releasing the pages, we would mistakenly
				3930	* continue to assume that the obj remained out of the CPU cached
				3931	* domain.
				3932	*/
				3933	ret = i915_gem_object_pin_pages(obj);
				3934	if (ret)
				3935	return ret;
				3936
				3937	flush_write_domain(obj, ~I915_GEM_DOMAIN_WC);
				3938
				3939	/* Serialise direct access to this object with the barriers for
				3940	* coherent writes from the GPU, by effectively invalidating the
				3941	* WC domain upon first access.
				3942	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3943	if ((obj->read_domains & I915_GEM_DOMAIN_WC) == 0)
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3944	mb();
				3945
				3946	/* It should now be out of any other write domains, and we can update
				3947	* the domain values for our changes.
				3948	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3949	GEM_BUG_ON((obj->write_domain & ~I915_GEM_DOMAIN_WC) != 0);
				3950	obj->read_domains \|= I915_GEM_DOMAIN_WC;
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3951	if (write) {
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3952	obj->read_domains = I915_GEM_DOMAIN_WC;
				3953	obj->write_domain = I915_GEM_DOMAIN_WC;
Chris Wilson	e22d8e3	2017-04-12 12:01:11 +0100	[diff] [blame]	3954	obj->mm.dirty = true;
				3955	}
				3956
				3957	i915_gem_object_unpin_pages(obj);
				3958	return 0;
				3959	}
				3960
				3961	/**
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3962	* Moves a single object to the GTT read, and possibly write domain.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	3963	* @obj: object to act on
				3964	* @write: ask for write access or read only
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3965	*
				3966	* This function returns when the move is complete, including waiting on
				3967	* flushes to occur.
				3968	*/
Jesse Barnes	79e5394	2008-11-07 14:24:08 -0800	[diff] [blame]	3969	int
Chris Wilson	2021746	2010-11-23 15:26:33 +0000	[diff] [blame]	3970	i915_gem_object_set_to_gtt_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3971	{
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	3972	int ret;
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	3973
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3974	lockdep_assert_held(&obj->base.dev->struct_mutex);
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	3975
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	3976	ret = i915_gem_object_wait(obj,
				3977	I915_WAIT_INTERRUPTIBLE \|
				3978	I915_WAIT_LOCKED \|
				3979	(write ? I915_WAIT_ALL : 0),
				3980	MAX_SCHEDULE_TIMEOUT,
				3981	NULL);
Chris Wilson	8824178	2011-01-07 17:09:48 +0000	[diff] [blame]	3982	if (ret)
				3983	return ret;
				3984
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	3985	if (obj->write_domain == I915_GEM_DOMAIN_GTT)
Chris Wilson	c13d87e	2016-07-20 09:21:15 +0100	[diff] [blame]	3986	return 0;
				3987
Chris Wilson	43566de	2015-01-02 16:29:29 +0530	[diff] [blame]	3988	/* Flush and acquire obj->pages so that we are coherent through
				3989	* direct access in memory with previous cached writes through
				3990	* shmemfs and that our cache domain tracking remains valid.
				3991	* For example, if the obj->filp was moved to swap without us
				3992	* being notified and releasing the pages, we would mistakenly
				3993	* continue to assume that the obj remained out of the CPU cached
				3994	* domain.
				3995	*/
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	3996	ret = i915_gem_object_pin_pages(obj);
Chris Wilson	43566de	2015-01-02 16:29:29 +0530	[diff] [blame]	3997	if (ret)
				3998	return ret;
				3999
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	4000	flush_write_domain(obj, ~I915_GEM_DOMAIN_GTT);
Chris Wilson	1c5d22f	2009-08-25 11:15:50 +0100	[diff] [blame]	4001
Chris Wilson	d0a5778	2012-10-09 19:24:37 +0100	[diff] [blame]	4002	/* Serialise direct access to this object with the barriers for
				4003	* coherent writes from the GPU, by effectively invalidating the
				4004	* GTT domain upon first access.
				4005	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4006	if ((obj->read_domains & I915_GEM_DOMAIN_GTT) == 0)
Chris Wilson	d0a5778	2012-10-09 19:24:37 +0100	[diff] [blame]	4007	mb();
				4008
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	4009	/* It should now be out of any other write domains, and we can update
				4010	* the domain values for our changes.
				4011	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4012	GEM_BUG_ON((obj->write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
				4013	obj->read_domains \|= I915_GEM_DOMAIN_GTT;
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4014	if (write) {
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4015	obj->read_domains = I915_GEM_DOMAIN_GTT;
				4016	obj->write_domain = I915_GEM_DOMAIN_GTT;
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4017	obj->mm.dirty = true;
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4018	}
				4019
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4020	i915_gem_object_unpin_pages(obj);
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4021	return 0;
				4022	}
				4023
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4024	/**
				4025	* Changes the cache-level of an object across all VMA.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	4026	* @obj: object to act on
				4027	* @cache_level: new cache level to set for the object
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4028	*
				4029	* After this function returns, the object will be in the new cache-level
				4030	* across all GTT and the contents of the backing storage will be coherent,
				4031	* with respect to the new cache-level. In order to keep the backing storage
				4032	* coherent for all users, we only allow a single cache level to be set
				4033	* globally on the object and prevent it from being changed whilst the
				4034	* hardware is reading from the object. That is if the object is currently
				4035	* on the scanout it will be set to uncached (or equivalent display
				4036	* cache coherency) and all non-MOCS GPU access will also be uncached so
				4037	* that all direct access to the scanout remains coherent.
				4038	*/
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	4039	int i915_gem_object_set_cache_level(struct drm_i915_gem_object *obj,
				4040	enum i915_cache_level cache_level)
				4041	{
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	4042	struct i915_vma *vma;
Chris Wilson	a6a7cc4	2016-11-18 21:17:46 +0000	[diff] [blame]	4043	int ret;
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	4044
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	4045	lockdep_assert_held(&obj->base.dev->struct_mutex);
				4046
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	4047	if (obj->cache_level == cache_level)
Chris Wilson	a6a7cc4	2016-11-18 21:17:46 +0000	[diff] [blame]	4048	return 0;
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	4049
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4050	/* Inspect the list of currently bound VMA and unbind any that would
				4051	* be invalid given the new cache-level. This is principally to
				4052	* catch the issue of the CS prefetch crossing page boundaries and
				4053	* reading an invalid PTE on older architectures.
				4054	*/
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	4055	restart:
				4056	list_for_each_entry(vma, &obj->vma_list, obj_link) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4057	if (!drm_mm_node_allocated(&vma->node))
				4058	continue;
				4059
Chris Wilson	20dfbde	2016-08-04 16:32:30 +0100	[diff] [blame]	4060	if (i915_vma_is_pinned(vma)) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4061	DRM_DEBUG("can not change the cache level of pinned objects\n");
				4062	return -EBUSY;
				4063	}
				4064
Chris Wilson	010e3e6	2017-12-06 12:49:13 +0000	[diff] [blame]	4065	if (!i915_vma_is_closed(vma) &&
				4066	i915_gem_valid_gtt_space(vma, cache_level))
Chris Wilson	aa653a6	2016-08-04 07:52:27 +0100	[diff] [blame]	4067	continue;
				4068
				4069	ret = i915_vma_unbind(vma);
				4070	if (ret)
				4071	return ret;
				4072
				4073	/* As unbinding may affect other elements in the
				4074	* obj->vma_list (due to side-effects from retiring
				4075	* an active vma), play safe and restart the iterator.
				4076	*/
				4077	goto restart;
Chris Wilson	42d6ab4	2012-07-26 11:49:32 +0100	[diff] [blame]	4078	}
				4079
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4080	/* We can reuse the existing drm_mm nodes but need to change the
				4081	* cache-level on the PTE. We could simply unbind them all and
				4082	* rebind with the correct cache-level on next use. However since
				4083	* we already have a valid slot, dma mapping, pages etc, we may as
				4084	* rewrite the PTE in the belief that doing so tramples upon less
				4085	* state and so involves less work.
				4086	*/
Chris Wilson	15717de	2016-08-04 07:52:26 +0100	[diff] [blame]	4087	if (obj->bind_count) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4088	/* Before we change the PTE, the GPU must not be accessing it.
				4089	* If we wait upon the object, we know that all the bound
				4090	* VMA are no longer active.
				4091	*/
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4092	ret = i915_gem_object_wait(obj,
				4093	I915_WAIT_INTERRUPTIBLE \|
				4094	I915_WAIT_LOCKED \|
				4095	I915_WAIT_ALL,
				4096	MAX_SCHEDULE_TIMEOUT,
				4097	NULL);
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	4098	if (ret)
				4099	return ret;
				4100
Tvrtko Ursulin	0031fb9	2016-11-04 14:42:44 +0000	[diff] [blame]	4101	if (!HAS_LLC(to_i915(obj->base.dev)) &&
				4102	cache_level != I915_CACHE_NONE) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4103	/* Access to snoopable pages through the GTT is
				4104	* incoherent and on some machines causes a hard
				4105	* lockup. Relinquish the CPU mmaping to force
				4106	* userspace to refault in the pages and we can
				4107	* then double check if the GTT mapping is still
				4108	* valid for that pointer access.
				4109	*/
				4110	i915_gem_release_mmap(obj);
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	4111
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4112	/* As we no longer need a fence for GTT access,
				4113	* we can relinquish it now (and so prevent having
				4114	* to steal a fence from someone else on the next
				4115	* fence request). Note GPU activity would have
				4116	* dropped the fence as all snoopable access is
				4117	* supposed to be linear.
				4118	*/
Chris Wilson	e2189dd	2017-12-07 21:14:07 +0000	[diff] [blame]	4119	for_each_ggtt_vma(vma, obj) {
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	4120	ret = i915_vma_put_fence(vma);
				4121	if (ret)
				4122	return ret;
				4123	}
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4124	} else {
				4125	/* We either have incoherent backing store and
				4126	* so no GTT access or the architecture is fully
				4127	* coherent. In such cases, existing GTT mmaps
				4128	* ignore the cache bit in the PTE and we can
				4129	* rewrite it without confusing the GPU or having
				4130	* to force userspace to fault back in its mmaps.
				4131	*/
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	4132	}
				4133
Chris Wilson	1c7f4bc	2016-02-26 11:03:19 +0000	[diff] [blame]	4134	list_for_each_entry(vma, &obj->vma_list, obj_link) {
Chris Wilson	ef55f92	2015-10-09 14:11:27 +0100	[diff] [blame]	4135	if (!drm_mm_node_allocated(&vma->node))
				4136	continue;
				4137
				4138	ret = i915_vma_bind(vma, cache_level, PIN_UPDATE);
				4139	if (ret)
				4140	return ret;
				4141	}
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	4142	}
				4143
Chris Wilson	1c7f4bc	2016-02-26 11:03:19 +0000	[diff] [blame]	4144	list_for_each_entry(vma, &obj->vma_list, obj_link)
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	4145	vma->node.color = cache_level;
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	4146	i915_gem_object_set_cache_coherency(obj, cache_level);
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	4147	obj->cache_dirty = true; /* Always invalidate stale cachelines */
Chris Wilson	2c22569	2013-08-09 12:26:45 +0100	[diff] [blame]	4148
Chris Wilson	e4ffd17	2011-04-04 09:44:39 +0100	[diff] [blame]	4149	return 0;
				4150	}
				4151
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4152	int i915_gem_get_caching_ioctl(struct drm_device dev, void data,
				4153	struct drm_file *file)
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4154	{
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4155	struct drm_i915_gem_caching *args = data;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4156	struct drm_i915_gem_object *obj;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4157	int err = 0;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4158
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4159	rcu_read_lock();
				4160	obj = i915_gem_object_lookup_rcu(file, args->handle);
				4161	if (!obj) {
				4162	err = -ENOENT;
				4163	goto out;
				4164	}
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4165
Chris Wilson	651d794	2013-08-08 14:41:10 +0100	[diff] [blame]	4166	switch (obj->cache_level) {
				4167	case I915_CACHE_LLC:
				4168	case I915_CACHE_L3_LLC:
				4169	args->caching = I915_CACHING_CACHED;
				4170	break;
				4171
Chris Wilson	4257d3b	2013-08-08 14:41:11 +0100	[diff] [blame]	4172	case I915_CACHE_WT:
				4173	args->caching = I915_CACHING_DISPLAY;
				4174	break;
				4175
Chris Wilson	651d794	2013-08-08 14:41:10 +0100	[diff] [blame]	4176	default:
				4177	args->caching = I915_CACHING_NONE;
				4178	break;
				4179	}
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4180	out:
				4181	rcu_read_unlock();
				4182	return err;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4183	}
				4184
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4185	int i915_gem_set_caching_ioctl(struct drm_device dev, void data,
				4186	struct drm_file *file)
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4187	{
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	4188	struct drm_i915_private *i915 = to_i915(dev);
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4189	struct drm_i915_gem_caching *args = data;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4190	struct drm_i915_gem_object *obj;
				4191	enum i915_cache_level level;
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4192	int ret = 0;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4193
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4194	switch (args->caching) {
				4195	case I915_CACHING_NONE:
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4196	level = I915_CACHE_NONE;
				4197	break;
Ben Widawsky	199adf4	2012-09-21 17:01:20 -0700	[diff] [blame]	4198	case I915_CACHING_CACHED:
Imre Deak	e5756c1	2015-08-14 18:43:30 +0300	[diff] [blame]	4199	/*
				4200	* Due to a HW issue on BXT A stepping, GPU stores via a
				4201	* snooped mapping may leave stale data in a corresponding CPU
				4202	* cacheline, whereas normally such cachelines would get
				4203	* invalidated.
				4204	*/
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	4205	if (!HAS_LLC(i915) && !HAS_SNOOP(i915))
Imre Deak	e5756c1	2015-08-14 18:43:30 +0300	[diff] [blame]	4206	return -ENODEV;
				4207
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4208	level = I915_CACHE_LLC;
				4209	break;
Chris Wilson	4257d3b	2013-08-08 14:41:11 +0100	[diff] [blame]	4210	case I915_CACHING_DISPLAY:
Chris Wilson	9c870d0	2016-10-24 13:42:15 +0100	[diff] [blame]	4211	level = HAS_WT(i915) ? I915_CACHE_WT : I915_CACHE_NONE;
Chris Wilson	4257d3b	2013-08-08 14:41:11 +0100	[diff] [blame]	4212	break;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4213	default:
				4214	return -EINVAL;
				4215	}
				4216
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4217	obj = i915_gem_object_lookup(file, args->handle);
				4218	if (!obj)
				4219	return -ENOENT;
				4220
Tina Zhang	a03f395	2017-11-14 10:25:13 +0000	[diff] [blame]	4221	/*
				4222	* The caching mode of proxy object is handled by its generator, and
				4223	* not allowed to be changed by userspace.
				4224	*/
				4225	if (i915_gem_object_is_proxy(obj)) {
				4226	ret = -ENXIO;
				4227	goto out;
				4228	}
				4229
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4230	if (obj->cache_level == level)
				4231	goto out;
				4232
				4233	ret = i915_gem_object_wait(obj,
				4234	I915_WAIT_INTERRUPTIBLE,
				4235	MAX_SCHEDULE_TIMEOUT,
				4236	to_rps_client(file));
				4237	if (ret)
				4238	goto out;
				4239
Ben Widawsky	3bc2913	2012-09-26 16:15:20 -0700	[diff] [blame]	4240	ret = i915_mutex_lock_interruptible(dev);
				4241	if (ret)
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4242	goto out;
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4243
				4244	ret = i915_gem_object_set_cache_level(obj, level);
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4245	mutex_unlock(&dev->struct_mutex);
Chris Wilson	d65415d	2017-01-19 08:22:10 +0000	[diff] [blame]	4246
				4247	out:
				4248	i915_gem_object_put(obj);
Chris Wilson	e6994ae	2012-07-10 10:27:08 +0100	[diff] [blame]	4249	return ret;
				4250	}
				4251
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4252	/*
Dhinakaran Pandiyan	07bcd99	2018-03-06 19:34:18 -0800	[diff] [blame]	4253	* Prepare buffer for display plane (scanout, cursors, etc). Can be called from
				4254	* an uninterruptible phase (modesetting) and allows any flushes to be pipelined
				4255	* (for pageflips). We only flush the caches while preparing the buffer for
				4256	* display, the callers are responsible for frontbuffer flush.
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4257	*/
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4258	struct i915_vma *
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4259	i915_gem_object_pin_to_display_plane(struct drm_i915_gem_object *obj,
				4260	u32 alignment,
Chris Wilson	5935485	2018-02-20 13:42:06 +0000	[diff] [blame]	4261	const struct i915_ggtt_view *view,
				4262	unsigned int flags)
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4263	{
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4264	struct i915_vma *vma;
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4265	int ret;
				4266
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	4267	lockdep_assert_held(&obj->base.dev->struct_mutex);
				4268
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4269	/* Mark the global pin early so that we account for the
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4270	* display coherency whilst setting up the cache domains.
				4271	*/
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4272	obj->pin_global++;
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4273
Eric Anholt	a7ef064	2011-03-29 16:59:54 -0700	[diff] [blame]	4274	/* The display engine is not coherent with the LLC cache on gen6. As
				4275	* a result, we make sure that the pinning that is about to occur is
				4276	* done with uncached PTEs. This is lowest common denominator for all
				4277	* chipsets.
				4278	*
				4279	* However for gen6+, we could do better by using the GFDT bit instead
				4280	* of uncaching, which would allow us to flush all the LLC-cached data
				4281	* with that bit in the PTE to main memory with just one PIPE_CONTROL.
				4282	*/
Chris Wilson	651d794	2013-08-08 14:41:10 +0100	[diff] [blame]	4283	ret = i915_gem_object_set_cache_level(obj,
Tvrtko Ursulin	8652744	2016-10-13 11:03:00 +0100	[diff] [blame]	4284	HAS_WT(to_i915(obj->base.dev)) ?
				4285	I915_CACHE_WT : I915_CACHE_NONE);
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4286	if (ret) {
				4287	vma = ERR_PTR(ret);
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4288	goto err_unpin_global;
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4289	}
Eric Anholt	a7ef064	2011-03-29 16:59:54 -0700	[diff] [blame]	4290
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4291	/* As the user may map the buffer once pinned in the display plane
				4292	* (e.g. libkms for the bootup splash), we have to ensure that we
Chris Wilson	2efb813	2016-08-18 17:17:06 +0100	[diff] [blame]	4293	* always use map_and_fenceable for all scanout buffers. However,
				4294	* it may simply be too big to fit into mappable, in which case
				4295	* put it anyway and hope that userspace can cope (but always first
				4296	* try to preserve the existing ABI).
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4297	*/
Chris Wilson	2efb813	2016-08-18 17:17:06 +0100	[diff] [blame]	4298	vma = ERR_PTR(-ENOSPC);
Chris Wilson	5935485	2018-02-20 13:42:06 +0000	[diff] [blame]	4299	if ((flags & PIN_MAPPABLE) == 0 &&
				4300	(!view \|\| view->type == I915_GGTT_VIEW_NORMAL))
Chris Wilson	2efb813	2016-08-18 17:17:06 +0100	[diff] [blame]	4301	vma = i915_gem_object_ggtt_pin(obj, view, 0, alignment,
Chris Wilson	5935485	2018-02-20 13:42:06 +0000	[diff] [blame]	4302	flags \|
				4303	PIN_MAPPABLE \|
				4304	PIN_NONBLOCK);
				4305	if (IS_ERR(vma))
Chris Wilson	767a222	2016-11-07 11:01:28 +0000	[diff] [blame]	4306	vma = i915_gem_object_ggtt_pin(obj, view, 0, alignment, flags);
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4307	if (IS_ERR(vma))
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4308	goto err_unpin_global;
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4309
Chris Wilson	d8923dc	2016-08-18 17:17:07 +0100	[diff] [blame]	4310	vma->display_alignment = max_t(u64, vma->display_alignment, alignment);
				4311
Chris Wilson	5a97bcc	2017-02-22 11:40:46 +0000	[diff] [blame]	4312	__i915_gem_object_flush_for_display(obj);
Chris Wilson	b118c1e	2010-05-27 13:18:14 +0100	[diff] [blame]	4313
Chris Wilson	2da3b9b	2011-04-14 09:41:17 +0100	[diff] [blame]	4314	/* It should now be out of any other write domains, and we can update
				4315	* the domain values for our changes.
				4316	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4317	obj->read_domains \|= I915_GEM_DOMAIN_GTT;
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4318
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4319	return vma;
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4320
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4321	err_unpin_global:
				4322	obj->pin_global--;
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4323	return vma;
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4324	}
				4325
				4326	void
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4327	i915_gem_object_unpin_from_display_plane(struct i915_vma *vma)
Chris Wilson	cc98b41	2013-08-09 12:25:09 +0100	[diff] [blame]	4328	{
Chris Wilson	49d7391	2016-11-29 09:50:08 +0000	[diff] [blame]	4329	lockdep_assert_held(&vma->vm->i915->drm.struct_mutex);
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	4330
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4331	if (WARN_ON(vma->obj->pin_global == 0))
Tvrtko Ursulin	8a0c39b	2015-04-13 11:50:09 +0100	[diff] [blame]	4332	return;
				4333
Chris Wilson	bd3d225	2017-10-13 21:26:14 +0100	[diff] [blame]	4334	if (--vma->obj->pin_global == 0)
Chris Wilson	f51455d	2017-01-10 14:47:34 +0000	[diff] [blame]	4335	vma->display_alignment = I915_GTT_MIN_ALIGNMENT;
Tvrtko Ursulin	e661733	2015-03-23 11:10:33 +0000	[diff] [blame]	4336
Chris Wilson	383d582	2016-08-18 17:17:08 +0100	[diff] [blame]	4337	/* Bump the LRU to try and avoid premature eviction whilst flipping */
Chris Wilson	befedbb	2017-01-19 19:26:55 +0000	[diff] [blame]	4338	i915_gem_object_bump_inactive_ggtt(vma->obj);
Chris Wilson	383d582	2016-08-18 17:17:08 +0100	[diff] [blame]	4339
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4340	i915_vma_unpin(vma);
Zhenyu Wang	b9241ea	2009-11-25 13:09:39 +0800	[diff] [blame]	4341	}
				4342
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4343	/**
				4344	* Moves a single object to the CPU read, and possibly write domain.
Tvrtko Ursulin	14bb2c1	2016-06-03 14:02:17 +0100	[diff] [blame]	4345	* @obj: object to act on
				4346	* @write: requesting write or read-only access
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4347	*
				4348	* This function returns when the move is complete, including waiting on
				4349	* flushes to occur.
				4350	*/
Chris Wilson	dabdfe0	2012-03-26 10:10:27 +0200	[diff] [blame]	4351	int
Chris Wilson	919926a	2010-11-12 13:42:53 +0000	[diff] [blame]	4352	i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4353	{
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4354	int ret;
				4355
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4356	lockdep_assert_held(&obj->base.dev->struct_mutex);
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	4357
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4358	ret = i915_gem_object_wait(obj,
				4359	I915_WAIT_INTERRUPTIBLE \|
				4360	I915_WAIT_LOCKED \|
				4361	(write ? I915_WAIT_ALL : 0),
				4362	MAX_SCHEDULE_TIMEOUT,
				4363	NULL);
Chris Wilson	8824178	2011-01-07 17:09:48 +0000	[diff] [blame]	4364	if (ret)
				4365	return ret;
				4366
Chris Wilson	ef74921	2017-04-12 12:01:10 +0100	[diff] [blame]	4367	flush_write_domain(obj, ~I915_GEM_DOMAIN_CPU);
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4368
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4369	/* Flush the CPU cache if it's still invalid. */
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4370	if ((obj->read_domains & I915_GEM_DOMAIN_CPU) == 0) {
Chris Wilson	57822dc	2017-02-22 11:40:48 +0000	[diff] [blame]	4371	i915_gem_clflush_object(obj, I915_CLFLUSH_SYNC);
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4372	obj->read_domains \|= I915_GEM_DOMAIN_CPU;
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4373	}
				4374
				4375	/* It should now be out of any other write domains, and we can update
				4376	* the domain values for our changes.
				4377	*/
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4378	GEM_BUG_ON(obj->write_domain & ~I915_GEM_DOMAIN_CPU);
Eric Anholt	e47c68e	2008-11-14 13:35:19 -0800	[diff] [blame]	4379
				4380	/* If we're writing through the CPU, then the GPU read domains will
				4381	* need to be invalidated at next use.
				4382	*/
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	4383	if (write)
				4384	__start_cpu_write(obj);
Eric Anholt	2ef7eea	2008-11-10 10:53:25 -0800	[diff] [blame]	4385
				4386	return 0;
				4387	}
				4388
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4389	/* Throttle our rendering by waiting until the ring has completed our requests
				4390	* emitted over 20 msec ago.
				4391	*
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	4392	* Note that if we were to use the current jiffies each time around the loop,
				4393	* we wouldn't escape the function with any frames outstanding if the time to
				4394	* render a frame was over 20ms.
				4395	*
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4396	* This should get us reasonable parallelism between CPU and GPU but also
				4397	* relatively low latency when blocking on a particular request to finish.
				4398	*/
				4399	static int
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	4400	i915_gem_ring_throttle(struct drm_device dev, struct drm_file file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4401	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	4402	struct drm_i915_private *dev_priv = to_i915(dev);
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	4403	struct drm_i915_file_private *file_priv = file->driver_priv;
Chris Wilson	d0bc54f	2015-05-21 21:01:48 +0100	[diff] [blame]	4404	unsigned long recent_enough = jiffies - DRM_I915_THROTTLE_JIFFIES;
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4405	struct i915_request request, target = NULL;
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4406	long ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4407
Chris Wilson	f4457ae	2016-04-13 17:35:08 +0100	[diff] [blame]	4408	/* ABI: return -EIO if already wedged */
				4409	if (i915_terminally_wedged(&dev_priv->gpu_error))
				4410	return -EIO;
Chris Wilson	e110e8d	2011-01-26 15:39:14 +0000	[diff] [blame]	4411
Chris Wilson	1c25595	2010-09-26 11:03:27 +0100	[diff] [blame]	4412	spin_lock(&file_priv->mm.lock);
Chris Wilson	c8659ef	2017-03-02 12:25:25 +0000	[diff] [blame]	4413	list_for_each_entry(request, &file_priv->mm.request_list, client_link) {
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	4414	if (time_after_eq(request->emitted_jiffies, recent_enough))
				4415	break;
				4416
Chris Wilson	c8659ef	2017-03-02 12:25:25 +0000	[diff] [blame]	4417	if (target) {
				4418	list_del(&target->client_link);
				4419	target->file_priv = NULL;
				4420	}
John Harrison	fcfa423c	2015-05-29 17:44:12 +0100	[diff] [blame]	4421
John Harrison	54fb241	2014-11-24 18:49:27 +0000	[diff] [blame]	4422	target = request;
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	4423	}
John Harrison	ff86588	2014-11-24 18:49:28 +0000	[diff] [blame]	4424	if (target)
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4425	i915_request_get(target);
Chris Wilson	1c25595	2010-09-26 11:03:27 +0100	[diff] [blame]	4426	spin_unlock(&file_priv->mm.lock);
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	4427
John Harrison	54fb241	2014-11-24 18:49:27 +0000	[diff] [blame]	4428	if (target == NULL)
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	4429	return 0;
				4430
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4431	ret = i915_request_wait(target,
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4432	I915_WAIT_INTERRUPTIBLE,
				4433	MAX_SCHEDULE_TIMEOUT);
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4434	i915_request_put(target);
John Harrison	ff86588	2014-11-24 18:49:28 +0000	[diff] [blame]	4435
Chris Wilson	e95433c	2016-10-28 13:58:27 +0100	[diff] [blame]	4436	return ret < 0 ? ret : 0;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4437	}
				4438
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4439	struct i915_vma *
Joonas Lahtinen	ec7adb6	2015-03-16 14:11:13 +0200	[diff] [blame]	4440	i915_gem_object_ggtt_pin(struct drm_i915_gem_object *obj,
				4441	const struct i915_ggtt_view *view,
Chris Wilson	91b2db6	2016-08-04 16:32:23 +0100	[diff] [blame]	4442	u64 size,
Chris Wilson	2ffffd0	2016-08-04 16:32:22 +0100	[diff] [blame]	4443	u64 alignment,
				4444	u64 flags)
Joonas Lahtinen	ec7adb6	2015-03-16 14:11:13 +0200	[diff] [blame]	4445	{
Chris Wilson	ad16d2e	2016-10-13 09:55:04 +0100	[diff] [blame]	4446	struct drm_i915_private *dev_priv = to_i915(obj->base.dev);
Chris Wilson	82ad644	2018-06-05 16:37:58 +0100	[diff] [blame]	4447	struct i915_address_space *vm = &dev_priv->ggtt.vm;
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4448	struct i915_vma *vma;
				4449	int ret;
Joonas Lahtinen	72e96d6	2016-03-30 16:57:10 +0300	[diff] [blame]	4450
Chris Wilson	4c7d62c	2016-10-28 13:58:32 +0100	[diff] [blame]	4451	lockdep_assert_held(&obj->base.dev->struct_mutex);
				4452
Chris Wilson	ac87a6fd	2018-02-20 13:42:05 +0000	[diff] [blame]	4453	if (flags & PIN_MAPPABLE &&
				4454	(!view \|\| view->type == I915_GGTT_VIEW_NORMAL)) {
Chris Wilson	43ae70d9	2017-10-09 09:44:01 +0100	[diff] [blame]	4455	/* If the required space is larger than the available
				4456	* aperture, we will not able to find a slot for the
				4457	* object and unbinding the object now will be in
				4458	* vain. Worse, doing so may cause us to ping-pong
				4459	* the object in and out of the Global GTT and
				4460	* waste a lot of cycles under the mutex.
				4461	*/
				4462	if (obj->base.size > dev_priv->ggtt.mappable_end)
				4463	return ERR_PTR(-E2BIG);
				4464
				4465	/* If NONBLOCK is set the caller is optimistically
				4466	* trying to cache the full object within the mappable
				4467	* aperture, and must have a fallback in place for
				4468	* situations where we cannot bind the object. We
				4469	* can be a little more lax here and use the fallback
				4470	* more often to avoid costly migrations of ourselves
				4471	* and other objects within the aperture.
				4472	*
				4473	* Half-the-aperture is used as a simple heuristic.
				4474	* More interesting would to do search for a free
				4475	* block prior to making the commitment to unbind.
				4476	* That caters for the self-harm case, and with a
				4477	* little more heuristics (e.g. NOFAULT, NOEVICT)
				4478	* we could try to minimise harm to others.
				4479	*/
				4480	if (flags & PIN_NONBLOCK &&
				4481	obj->base.size > dev_priv->ggtt.mappable_end / 2)
				4482	return ERR_PTR(-ENOSPC);
				4483	}
				4484
Chris Wilson	718659a	2017-01-16 15:21:28 +0000	[diff] [blame]	4485	vma = i915_vma_instance(obj, vm, view);
Chris Wilson	e0216b7	2017-01-19 19:26:57 +0000	[diff] [blame]	4486	if (unlikely(IS_ERR(vma)))
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4487	return vma;
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4488
				4489	if (i915_vma_misplaced(vma, size, alignment, flags)) {
Chris Wilson	43ae70d9	2017-10-09 09:44:01 +0100	[diff] [blame]	4490	if (flags & PIN_NONBLOCK) {
				4491	if (i915_vma_is_pinned(vma) \|\| i915_vma_is_active(vma))
				4492	return ERR_PTR(-ENOSPC);
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4493
Chris Wilson	43ae70d9	2017-10-09 09:44:01 +0100	[diff] [blame]	4494	if (flags & PIN_MAPPABLE &&
Chris Wilson	944397f	2017-01-09 16:16:11 +0000	[diff] [blame]	4495	vma->fence_size > dev_priv->ggtt.mappable_end / 2)
Chris Wilson	ad16d2e	2016-10-13 09:55:04 +0100	[diff] [blame]	4496	return ERR_PTR(-ENOSPC);
				4497	}
				4498
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4499	WARN(i915_vma_is_pinned(vma),
				4500	"bo is already pinned in ggtt with incorrect alignment:"
Chris Wilson	05a20d0	2016-08-18 17:16:55 +0100	[diff] [blame]	4501	" offset=%08x, req.alignment=%llx,"
				4502	" req.map_and_fenceable=%d, vma->map_and_fenceable=%d\n",
				4503	i915_ggtt_offset(vma), alignment,
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4504	!!(flags & PIN_MAPPABLE),
Chris Wilson	05a20d0	2016-08-18 17:16:55 +0100	[diff] [blame]	4505	i915_vma_is_map_and_fenceable(vma));
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4506	ret = i915_vma_unbind(vma);
				4507	if (ret)
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4508	return ERR_PTR(ret);
Chris Wilson	59bfa12	2016-08-04 16:32:31 +0100	[diff] [blame]	4509	}
				4510
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4511	ret = i915_vma_pin(vma, size, alignment, flags \| PIN_GLOBAL);
				4512	if (ret)
				4513	return ERR_PTR(ret);
Joonas Lahtinen	ec7adb6	2015-03-16 14:11:13 +0200	[diff] [blame]	4514
Chris Wilson	058d88c	2016-08-15 10:49:06 +0100	[diff] [blame]	4515	return vma;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4516	}
				4517
Chris Wilson	edf6b76	2016-08-09 09:23:33 +0100	[diff] [blame]	4518	static __always_inline unsigned int __busy_read_flag(unsigned int id)
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4519	{
				4520	/* Note that we could alias engines in the execbuf API, but
				4521	* that would be very unwise as it prevents userspace from
				4522	* fine control over engine selection. Ahem.
				4523	*
				4524	* This should be something like EXEC_MAX_ENGINE instead of
				4525	* I915_NUM_ENGINES.
				4526	*/
				4527	BUILD_BUG_ON(I915_NUM_ENGINES > 16);
				4528	return 0x10000 << id;
				4529	}
				4530
				4531	static __always_inline unsigned int __busy_write_id(unsigned int id)
				4532	{
Chris Wilson	70cb472	2016-08-09 18:08:25 +0100	[diff] [blame]	4533	/* The uABI guarantees an active writer is also amongst the read
				4534	* engines. This would be true if we accessed the activity tracking
				4535	* under the lock, but as we perform the lookup of the object and
				4536	* its activity locklessly we can not guarantee that the last_write
				4537	* being active implies that we have set the same engine flag from
				4538	* last_read - hence we always set both read and write busy for
				4539	* last_write.
				4540	*/
				4541	return id \| __busy_read_flag(id);
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4542	}
				4543
Chris Wilson	edf6b76	2016-08-09 09:23:33 +0100	[diff] [blame]	4544	static __always_inline unsigned int
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4545	__busy_set_if_active(const struct dma_fence *fence,
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4546	unsigned int (*flag)(unsigned int id))
				4547	{
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4548	struct i915_request *rq;
Chris Wilson	1255501	2016-08-16 09:50:40 +0100	[diff] [blame]	4549
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4550	/* We have to check the current hw status of the fence as the uABI
				4551	* guarantees forward progress. We could rely on the idle worker
				4552	* to eventually flush us, but to minimise latency just ask the
				4553	* hardware.
				4554	*
				4555	* Note we only report on the status of native fences.
				4556	*/
				4557	if (!dma_fence_is_i915(fence))
Chris Wilson	1255501	2016-08-16 09:50:40 +0100	[diff] [blame]	4558	return 0;
				4559
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4560	/* opencode to_request() in order to avoid const warnings */
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4561	rq = container_of(fence, struct i915_request, fence);
				4562	if (i915_request_completed(rq))
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4563	return 0;
				4564
Chris Wilson	1d39f28	2017-04-11 13:43:06 +0100	[diff] [blame]	4565	return flag(rq->engine->uabi_id);
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4566	}
				4567
Chris Wilson	edf6b76	2016-08-09 09:23:33 +0100	[diff] [blame]	4568	static __always_inline unsigned int
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4569	busy_check_reader(const struct dma_fence *fence)
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4570	{
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4571	return __busy_set_if_active(fence, __busy_read_flag);
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4572	}
				4573
Chris Wilson	edf6b76	2016-08-09 09:23:33 +0100	[diff] [blame]	4574	static __always_inline unsigned int
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4575	busy_check_writer(const struct dma_fence *fence)
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4576	{
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4577	if (!fence)
				4578	return 0;
				4579
				4580	return __busy_set_if_active(fence, __busy_write_id);
Chris Wilson	3fdc13c	2016-08-05 10:14:18 +0100	[diff] [blame]	4581	}
				4582
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4583	int
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4584	i915_gem_busy_ioctl(struct drm_device dev, void data,
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	4585	struct drm_file *file)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4586	{
				4587	struct drm_i915_gem_busy *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	4588	struct drm_i915_gem_object *obj;
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4589	struct reservation_object_list *list;
				4590	unsigned int seq;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4591	int err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4592
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4593	err = -ENOENT;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4594	rcu_read_lock();
				4595	obj = i915_gem_object_lookup_rcu(file, args->handle);
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4596	if (!obj)
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4597	goto out;
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4598
				4599	/* A discrepancy here is that we do not report the status of
				4600	* non-i915 fences, i.e. even though we may report the object as idle,
				4601	* a call to set-domain may still stall waiting for foreign rendering.
				4602	* This also means that wait-ioctl may report an object as busy,
				4603	* where busy-ioctl considers it idle.
				4604	*
				4605	* We trade the ability to warn of foreign fences to report on which
				4606	* i915 engines are active for the object.
				4607	*
				4608	* Alternatively, we can trade that extra information on read/write
				4609	* activity with
				4610	* args->busy =
				4611	* !reservation_object_test_signaled_rcu(obj->resv, true);
				4612	* to report the overall busyness. This is what the wait-ioctl does.
				4613	*
				4614	*/
				4615	retry:
				4616	seq = raw_read_seqcount(&obj->resv->seq);
				4617
				4618	/* Translate the exclusive fence to the READ and WRITE engine */
				4619	args->busy = busy_check_writer(rcu_dereference(obj->resv->fence_excl));
				4620
				4621	/* Translate shared fences to READ set of engines */
				4622	list = rcu_dereference(obj->resv->fence);
				4623	if (list) {
				4624	unsigned int shared_count = list->shared_count, i;
				4625
				4626	for (i = 0; i < shared_count; ++i) {
				4627	struct dma_fence *fence =
				4628	rcu_dereference(list->shared[i]);
				4629
				4630	args->busy \|= busy_check_reader(fence);
				4631	}
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4632	}
Zou Nan hai	d1b851f	2010-05-21 09:08:57 +0800	[diff] [blame]	4633
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4634	if (args->busy && read_seqcount_retry(&obj->resv->seq, seq))
				4635	goto retry;
Chris Wilson	426960b	2016-01-15 16:51:46 +0000	[diff] [blame]	4636
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4637	err = 0;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4638	out:
				4639	rcu_read_unlock();
				4640	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4641	}
				4642
				4643	int
				4644	i915_gem_throttle_ioctl(struct drm_device dev, void data,
				4645	struct drm_file *file_priv)
				4646	{
Akshay Joshi	0206e35	2011-08-16 15:34:10 -0400	[diff] [blame]	4647	return i915_gem_ring_throttle(dev, file_priv);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	4648	}
				4649
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4650	int
				4651	i915_gem_madvise_ioctl(struct drm_device dev, void data,
				4652	struct drm_file *file_priv)
				4653	{
Chris Wilson	fac5e23	2016-07-04 11:34:36 +0100	[diff] [blame]	4654	struct drm_i915_private *dev_priv = to_i915(dev);
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4655	struct drm_i915_gem_madvise *args = data;
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	4656	struct drm_i915_gem_object *obj;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4657	int err;
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4658
				4659	switch (args->madv) {
				4660	case I915_MADV_DONTNEED:
				4661	case I915_MADV_WILLNEED:
				4662	break;
				4663	default:
				4664	return -EINVAL;
				4665	}
				4666
Chris Wilson	03ac064	2016-07-20 13:31:51 +0100	[diff] [blame]	4667	obj = i915_gem_object_lookup(file_priv, args->handle);
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4668	if (!obj)
				4669	return -ENOENT;
				4670
				4671	err = mutex_lock_interruptible(&obj->mm.lock);
				4672	if (err)
				4673	goto out;
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4674
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	4675	if (i915_gem_object_has_pages(obj) &&
Chris Wilson	3e510a8	2016-08-05 10:14:23 +0100	[diff] [blame]	4676	i915_gem_object_is_tiled(obj) &&
Daniel Vetter	656bfa3	2014-11-20 09:26:30 +0100	[diff] [blame]	4677	dev_priv->quirks & QUIRK_PIN_SWIZZLED_PAGES) {
Chris Wilson	bc0629a	2016-11-01 10:03:17 +0000	[diff] [blame]	4678	if (obj->mm.madv == I915_MADV_WILLNEED) {
				4679	GEM_BUG_ON(!obj->mm.quirked);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4680	__i915_gem_object_unpin_pages(obj);
Chris Wilson	bc0629a	2016-11-01 10:03:17 +0000	[diff] [blame]	4681	obj->mm.quirked = false;
				4682	}
				4683	if (args->madv == I915_MADV_WILLNEED) {
Chris Wilson	2c3a3f4	2016-11-04 10:30:01 +0000	[diff] [blame]	4684	GEM_BUG_ON(obj->mm.quirked);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4685	__i915_gem_object_pin_pages(obj);
Chris Wilson	bc0629a	2016-11-01 10:03:17 +0000	[diff] [blame]	4686	obj->mm.quirked = true;
				4687	}
Daniel Vetter	656bfa3	2014-11-20 09:26:30 +0100	[diff] [blame]	4688	}
				4689
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4690	if (obj->mm.madv != __I915_MADV_PURGED)
				4691	obj->mm.madv = args->madv;
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4692
Chris Wilson	6c085a7	2012-08-20 11:40:46 +0200	[diff] [blame]	4693	/* if the object is no longer attached, discard its backing storage */
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	4694	if (obj->mm.madv == I915_MADV_DONTNEED &&
				4695	!i915_gem_object_has_pages(obj))
Chris Wilson	2d7ef39	2009-09-20 23:13:10 +0100	[diff] [blame]	4696	i915_gem_object_truncate(obj);
				4697
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4698	args->retained = obj->mm.madv != __I915_MADV_PURGED;
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4699	mutex_unlock(&obj->mm.lock);
Chris Wilson	bb6baf7	2009-09-22 14:24:13 +0100	[diff] [blame]	4700
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4701	out:
Chris Wilson	f8c417c	2016-07-20 13:31:53 +0100	[diff] [blame]	4702	i915_gem_object_put(obj);
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4703	return err;
Chris Wilson	3ef94da	2009-09-14 16:50:29 +0100	[diff] [blame]	4704	}
				4705
Chris Wilson	5b8c8ae	2016-11-16 19:07:04 +0000	[diff] [blame]	4706	static void
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	4707	frontbuffer_retire(struct i915_gem_active active, struct i915_request request)
Chris Wilson	5b8c8ae	2016-11-16 19:07:04 +0000	[diff] [blame]	4708	{
				4709	struct drm_i915_gem_object *obj =
				4710	container_of(active, typeof(*obj), frontbuffer_write);
				4711
Chris Wilson	d59b21e	2017-02-22 11:40:49 +0000	[diff] [blame]	4712	intel_fb_obj_flush(obj, ORIGIN_CS);
Chris Wilson	5b8c8ae	2016-11-16 19:07:04 +0000	[diff] [blame]	4713	}
				4714
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4715	void i915_gem_object_init(struct drm_i915_gem_object *obj,
				4716	const struct drm_i915_gem_object_ops *ops)
Chris Wilson	0327d6b	2012-08-11 15:41:06 +0100	[diff] [blame]	4717	{
Chris Wilson	1233e2d	2016-10-28 13:58:37 +0100	[diff] [blame]	4718	mutex_init(&obj->mm.lock);
				4719
Ben Widawsky	2f63315	2013-07-17 12:19:03 -0700	[diff] [blame]	4720	INIT_LIST_HEAD(&obj->vma_list);
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	4721	INIT_LIST_HEAD(&obj->lut_list);
Chris Wilson	8d9d574	2015-04-07 16:20:38 +0100	[diff] [blame]	4722	INIT_LIST_HEAD(&obj->batch_pool_link);
Chris Wilson	0327d6b	2012-08-11 15:41:06 +0100	[diff] [blame]	4723
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4724	obj->ops = ops;
				4725
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4726	reservation_object_init(&obj->__builtin_resv);
				4727	obj->resv = &obj->__builtin_resv;
				4728
Chris Wilson	5034924	2016-08-18 17:17:04 +0100	[diff] [blame]	4729	obj->frontbuffer_ggtt_origin = ORIGIN_GTT;
Chris Wilson	5b8c8ae	2016-11-16 19:07:04 +0000	[diff] [blame]	4730	init_request_active(&obj->frontbuffer_write, frontbuffer_retire);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4731
				4732	obj->mm.madv = I915_MADV_WILLNEED;
				4733	INIT_RADIX_TREE(&obj->mm.get_page.radix, GFP_KERNEL \| __GFP_NOWARN);
				4734	mutex_init(&obj->mm.get_page.lock);
Chris Wilson	0327d6b	2012-08-11 15:41:06 +0100	[diff] [blame]	4735
Dave Gordon	f19ec8c	2016-07-04 11:34:37 +0100	[diff] [blame]	4736	i915_gem_info_add_obj(to_i915(obj->base.dev), obj->base.size);
Chris Wilson	0327d6b	2012-08-11 15:41:06 +0100	[diff] [blame]	4737	}
				4738
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4739	static const struct drm_i915_gem_object_ops i915_gem_object_ops = {
Tvrtko Ursulin	3599a91	2016-11-01 14:44:10 +0000	[diff] [blame]	4740	.flags = I915_GEM_OBJECT_HAS_STRUCT_PAGE \|
				4741	I915_GEM_OBJECT_IS_SHRINKABLE,
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	4742
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4743	.get_pages = i915_gem_object_get_pages_gtt,
				4744	.put_pages = i915_gem_object_put_pages_gtt,
Chris Wilson	7c55e2c	2017-03-07 12:03:38 +0000	[diff] [blame]	4745
				4746	.pwrite = i915_gem_object_pwrite_gtt,
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4747	};
				4748
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	4749	static int i915_gem_object_create_shmem(struct drm_device *dev,
				4750	struct drm_gem_object *obj,
				4751	size_t size)
				4752	{
				4753	struct drm_i915_private *i915 = to_i915(dev);
				4754	unsigned long flags = VM_NORESERVE;
				4755	struct file *filp;
				4756
				4757	drm_gem_private_object_init(dev, obj, size);
				4758
				4759	if (i915->mm.gemfs)
				4760	filp = shmem_file_setup_with_mnt(i915->mm.gemfs, "i915", size,
				4761	flags);
				4762	else
				4763	filp = shmem_file_setup("i915", size, flags);
				4764
				4765	if (IS_ERR(filp))
				4766	return PTR_ERR(filp);
				4767
				4768	obj->filp = filp;
				4769
				4770	return 0;
				4771	}
				4772
Chris Wilson	b4bcbe2	2016-10-18 13:02:49 +0100	[diff] [blame]	4773	struct drm_i915_gem_object *
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	4774	i915_gem_object_create(struct drm_i915_private *dev_priv, u64 size)
Daniel Vetter	ac52bc5	2010-04-09 19:05:06 +0000	[diff] [blame]	4775	{
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4776	struct drm_i915_gem_object *obj;
Hugh Dickins	5949eac	2011-06-27 16:18:18 -0700	[diff] [blame]	4777	struct address_space *mapping;
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	4778	unsigned int cache_level;
Daniel Vetter	1a240d4	2012-11-29 22:18:51 +0100	[diff] [blame]	4779	gfp_t mask;
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4780	int ret;
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4781
Chris Wilson	b4bcbe2	2016-10-18 13:02:49 +0100	[diff] [blame]	4782	/* There is a prevalence of the assumption that we fit the object's
				4783	* page count inside a 32bit _signed_ variable. Let's document this and
				4784	* catch if we ever need to fix it. In the meantime, if you do spot
				4785	* such a local variable, please consider fixing!
				4786	*/
Tvrtko Ursulin	7a3ee5d	2017-03-30 17:31:30 +0100	[diff] [blame]	4787	if (size >> PAGE_SHIFT > INT_MAX)
Chris Wilson	b4bcbe2	2016-10-18 13:02:49 +0100	[diff] [blame]	4788	return ERR_PTR(-E2BIG);
				4789
				4790	if (overflows_type(size, obj->base.size))
				4791	return ERR_PTR(-E2BIG);
				4792
Tvrtko Ursulin	187685c	2016-12-01 14:16:36 +0000	[diff] [blame]	4793	obj = i915_gem_object_alloc(dev_priv);
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4794	if (obj == NULL)
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4795	return ERR_PTR(-ENOMEM);
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4796
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	4797	ret = i915_gem_object_create_shmem(&dev_priv->drm, &obj->base, size);
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4798	if (ret)
				4799	goto fail;
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4800
Chris Wilson	bed1ea9	2012-05-24 20:48:12 +0100	[diff] [blame]	4801	mask = GFP_HIGHUSER \| __GFP_RECLAIMABLE;
Jani Nikula	c0f8683	2016-12-07 12:13:04 +0200	[diff] [blame]	4802	if (IS_I965GM(dev_priv) \|\| IS_I965G(dev_priv)) {
Chris Wilson	bed1ea9	2012-05-24 20:48:12 +0100	[diff] [blame]	4803	/* 965gm cannot relocate objects above 4GiB. */
				4804	mask &= ~__GFP_HIGHMEM;
				4805	mask \|= __GFP_DMA32;
				4806	}
				4807
Al Viro	93c76a3	2015-12-04 23:45:44 -0500	[diff] [blame]	4808	mapping = obj->base.filp->f_mapping;
Chris Wilson	bed1ea9	2012-05-24 20:48:12 +0100	[diff] [blame]	4809	mapping_set_gfp_mask(mapping, mask);
Chris Wilson	4846bf0	2017-06-09 12:03:46 +0100	[diff] [blame]	4810	GEM_BUG_ON(!(mapping_gfp_mask(mapping) & __GFP_RECLAIM));
Hugh Dickins	5949eac	2011-06-27 16:18:18 -0700	[diff] [blame]	4811
Chris Wilson	37e680a	2012-06-07 15:38:42 +0100	[diff] [blame]	4812	i915_gem_object_init(obj, &i915_gem_object_ops);
Chris Wilson	73aa808	2010-09-30 11:46:12 +0100	[diff] [blame]	4813
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	4814	obj->write_domain = I915_GEM_DOMAIN_CPU;
				4815	obj->read_domains = I915_GEM_DOMAIN_CPU;
Daniel Vetter	c397b90	2010-04-09 19:05:07 +0000	[diff] [blame]	4816
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	4817	if (HAS_LLC(dev_priv))
Eugeni Dodonov	3d29b84	2012-01-17 14:43:53 -0200	[diff] [blame]	4818	/* On some devices, we can have the GPU use the LLC (the CPU
Eric Anholt	a187111	2011-03-29 16:59:55 -0700	[diff] [blame]	4819	* cache) for about a 10% performance improvement
				4820	* compared to uncached. Graphics requests other than
				4821	* display scanout are coherent with the CPU in
				4822	* accessing this cache. This means in this mode we
				4823	* don't need to clflush on the CPU side, and on the
				4824	* GPU side we only need to flush internal caches to
				4825	* get data visible to the CPU.
				4826	*
				4827	* However, we maintain the display planes as UC, and so
				4828	* need to rebind when first used as such.
				4829	*/
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	4830	cache_level = I915_CACHE_LLC;
				4831	else
				4832	cache_level = I915_CACHE_NONE;
Eric Anholt	a187111	2011-03-29 16:59:55 -0700	[diff] [blame]	4833
Chris Wilson	b8f55be	2017-08-11 12:11:16 +0100	[diff] [blame]	4834	i915_gem_object_set_cache_coherency(obj, cache_level);
Chris Wilson	e27ab73	2017-06-15 13:38:49 +0100	[diff] [blame]	4835
Daniel Vetter	d861e33	2013-07-24 23:25:03 +0200	[diff] [blame]	4836	trace_i915_gem_object_create(obj);
				4837
Chris Wilson	05394f3	2010-11-08 19:18:58 +0000	[diff] [blame]	4838	return obj;
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4839
				4840	fail:
				4841	i915_gem_object_free(obj);
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	4842	return ERR_PTR(ret);
Daniel Vetter	ac52bc5	2010-04-09 19:05:06 +0000	[diff] [blame]	4843	}
				4844
Chris Wilson	340fbd8	2014-05-22 09:16:52 +0100	[diff] [blame]	4845	static bool discard_backing_storage(struct drm_i915_gem_object *obj)
				4846	{
				4847	/* If we are the last user of the backing storage (be it shmemfs
				4848	* pages or stolen etc), we know that the pages are going to be
				4849	* immediately released. In this case, we can then skip copying
				4850	* back the contents from the GPU.
				4851	*/
				4852
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	4853	if (obj->mm.madv != I915_MADV_WILLNEED)
Chris Wilson	340fbd8	2014-05-22 09:16:52 +0100	[diff] [blame]	4854	return false;
				4855
				4856	if (obj->base.filp == NULL)
				4857	return true;
				4858
				4859	/* At first glance, this looks racy, but then again so would be
				4860	* userspace racing mmap against close. However, the first external
				4861	* reference to the filp can only be obtained through the
				4862	* i915_gem_mmap_ioctl() which safeguards us against the user
				4863	* acquiring such a reference whilst we are in the middle of
				4864	* freeing the object.
				4865	*/
				4866	return atomic_long_read(&obj->base.filp->f_count) == 1;
				4867	}
				4868
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4869	static void __i915_gem_free_objects(struct drm_i915_private *i915,
				4870	struct llist_node *freed)
Chris Wilson	be72615	2010-07-23 23:18:50 +0100	[diff] [blame]	4871	{
					/*
					 * Release every GEM object on the lock-less list starting at @freed.
					 *
					 * @i915:  device whose objects are being freed
					 * @freed: first llist node of the chain; objects are linked through
					 *         their ->freed member
					 *
					 * A runtime-PM reference is held for the whole walk. For each object
					 * the vma are destroyed and the object is unlinked from mm.link under
					 * struct_mutex; the backing storage and the object itself are then
					 * released outside the mutex, and mm.free_count is decremented.
					 */
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4872	struct drm_i915_gem_object *obj, *on;
Chris Wilson	be72615	2010-07-23 23:18:50 +0100	[diff] [blame]	4873
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4874	intel_runtime_pm_get(i915);
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4875	llist_for_each_entry_safe(obj, on, freed, freed) {
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4876	struct i915_vma *vma, *vn;
Paulo Zanoni	f65c916	2013-11-27 18:20:34 -0200	[diff] [blame]	4877
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4878	trace_i915_gem_object_destroy(obj);
				4879
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4880	mutex_lock(&i915->drm.struct_mutex);
				4881
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4882	GEM_BUG_ON(i915_gem_object_is_active(obj));
				4883	list_for_each_entry_safe(vma, vn,
				4884	&obj->vma_list, obj_link) {
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4885	GEM_BUG_ON(i915_vma_is_active(vma));
					/* Drop any remaining pin bits before destroying the vma. */
				4886	vma->flags &= ~I915_VMA_PIN_MASK;
Chris Wilson	3365e22	2018-05-03 20:51:14 +0100	[diff] [blame]	4887	i915_vma_destroy(vma);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4888	}
Chris Wilson	db6c2b4	2016-11-01 11:54:00 +0000	[diff] [blame]	4889	GEM_BUG_ON(!list_empty(&obj->vma_list));
				4890	GEM_BUG_ON(!RB_EMPTY_ROOT(&obj->vma_tree));
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4891
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	4892	/* This serializes freeing with the shrinker. Since the free
				4893	* is delayed, first by RCU then by the workqueue, we want the
				4894	* shrinker to be able to free pages of unreferenced objects,
				4895	* or else we may oom whilst there are plenty of deferred
				4896	* freed objects.
				4897	*/
				4898	if (i915_gem_object_has_pages(obj)) {
				4899	spin_lock(&i915->mm.obj_lock);
				4900	list_del_init(&obj->mm.link);
				4901	spin_unlock(&i915->mm.obj_lock);
				4902	}
				4903
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4904	mutex_unlock(&i915->drm.struct_mutex);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4905
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4906	GEM_BUG_ON(obj->bind_count);
Chris Wilson	a65adaf	2017-10-09 09:43:57 +0100	[diff] [blame]	4907	GEM_BUG_ON(obj->userfault_count);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4908	GEM_BUG_ON(atomic_read(&obj->frontbuffer_bits));
Chris Wilson	67b4804	2017-08-22 12:05:16 +0100	[diff] [blame]	4909	GEM_BUG_ON(!list_empty(&obj->lut_list));
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4910
				4911	if (obj->ops->release)
				4912	obj->ops->release(obj);
				4913
					/* A leaked page pin is warned about, then forcibly cleared. */
				4914	if (WARN_ON(i915_gem_object_has_pinned_pages(obj)))
				4915	atomic_set(&obj->mm.pages_pin_count, 0);
Chris Wilson	548625e	2016-11-01 12:11:34 +0000	[diff] [blame]	4916	__i915_gem_object_put_pages(obj, I915_MM_NORMAL);
Chris Wilson	f1fa4f4	2017-10-13 21:26:13 +0100	[diff] [blame]	4917	GEM_BUG_ON(i915_gem_object_has_pages(obj));
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4918
				4919	if (obj->base.import_attach)
				4920	drm_prime_gem_destroy(&obj->base, NULL);
				4921
Chris Wilson	d07f0e5	2016-10-28 13:58:44 +0100	[diff] [blame]	4922	reservation_object_fini(&obj->__builtin_resv);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4923	drm_gem_object_release(&obj->base);
				4924	i915_gem_info_remove_obj(i915, obj->base.size);
				4925
				4926	kfree(obj->bit_17);
				4927	i915_gem_object_free(obj);
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4928
Chris Wilson	c9c70471	2018-02-19 22:06:31 +0000	[diff] [blame]	4929	GEM_BUG_ON(!atomic_read(&i915->mm.free_count));
				4930	atomic_dec(&i915->mm.free_count);
				4931
					/* Only offer to reschedule when another object is still queued. */
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4932	if (on)
				4933	cond_resched();
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4934	}
Chris Wilson	cc731f5	2017-10-13 21:26:21 +0100	[diff] [blame]	4935	intel_runtime_pm_put(i915);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4936	}
				4937
				4938	static void i915_gem_flush_free_objects(struct drm_i915_private *i915)
				4939	{
					/*
					 * Free at most one deferred object: pop a single node off
					 * i915->mm.free_list and pass it to __i915_gem_free_objects().
					 * Nothing is done when the list is empty.
					 */
				4940	struct llist_node *freed;
				4941
Chris Wilson	87701b4	2017-10-13 21:26:20 +0100	[diff] [blame]	4942	/* Free the oldest, most stale object to keep the free_list short */
				4943	freed = NULL;
				4944	if (!llist_empty(&i915->mm.free_list)) { /* quick test for hotpath */
				4945	/* Only one consumer of llist_del_first() allowed */
				4946	spin_lock(&i915->mm.free_lock);
				4947	freed = llist_del_first(&i915->mm.free_list);
				4948	spin_unlock(&i915->mm.free_lock);
				4949	}
				4950	if (unlikely(freed)) {
					/* Terminate the chain so the callee's walk stops after this node. */
				4951	freed->next = NULL;
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4952	__i915_gem_free_objects(i915, freed);
Chris Wilson	87701b4	2017-10-13 21:26:20 +0100	[diff] [blame]	4953	}
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4954	}
				4955
				4956	static void __i915_gem_free_work(struct work_struct *work)
				4957	{
					/*
					 * Work handler for i915->mm.free_work: repeatedly take the whole
					 * mm.free_list and free it, until the list is empty or the
					 * scheduler wants the CPU back.
					 */
				4958	struct drm_i915_private *i915 =
				4959	container_of(work, struct drm_i915_private, mm.free_work);
				4960	struct llist_node *freed;
Chris Wilson	26e12f8	2011-03-20 11:20:19 +0000	[diff] [blame]	4961
Chris Wilson	2ef1e72	2018-01-15 20:57:59 +0000	[diff] [blame]	4962	/*
				4963	* All file-owned VMA should have been released by this point through
Chris Wilson	b1f788c	2016-08-04 07:52:45 +0100	[diff] [blame]	4964	* i915_gem_close_object(), or earlier by i915_gem_context_close().
				4965	* However, the object may also be bound into the global GTT (e.g.
				4966	* older GPUs without per-process support, or for direct access through
				4967	* the GTT either for the user or for scanout). Those VMA still need to
				4968	* be unbound now.
				4969	*/
Chris Wilson	1488fc0	2012-04-24 15:47:31 +0100	[diff] [blame]	4970
					/* free_lock is held only around llist_del_all(), never while freeing. */
Chris Wilson	f991c49	2017-11-06 11:15:08 +0000	[diff] [blame]	4971	spin_lock(&i915->mm.free_lock);
Chris Wilson	5ad08be	2017-04-07 11:25:51 +0100	[diff] [blame]	4972	while ((freed = llist_del_all(&i915->mm.free_list))) {
Chris Wilson	f991c49	2017-11-06 11:15:08 +0000	[diff] [blame]	4973	spin_unlock(&i915->mm.free_lock);
				4974
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4975	__i915_gem_free_objects(i915, freed);
					/*
					 * Early exit with free_lock already dropped above.
					 * NOTE(review): objects queued meanwhile are presumably handled by
					 * the queue_work() in __i915_gem_free_object_rcu() - confirm.
					 */
Chris Wilson	5ad08be	2017-04-07 11:25:51 +0100	[diff] [blame]	4976	if (need_resched())
Chris Wilson	f991c49	2017-11-06 11:15:08 +0000	[diff] [blame]	4977	return;
				4978
				4979	spin_lock(&i915->mm.free_lock);
Chris Wilson	5ad08be	2017-04-07 11:25:51 +0100	[diff] [blame]	4980	}
Chris Wilson	f991c49	2017-11-06 11:15:08 +0000	[diff] [blame]	4981	spin_unlock(&i915->mm.free_lock);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4982	}
				4983
				4984	static void __i915_gem_free_object_rcu(struct rcu_head *head)
				4985	{
					/*
					 * RCU callback registered by i915_gem_free_object(): recover the
					 * object from its embedded rcu head, push it onto mm.free_list and
					 * queue mm.free_work when llist_add() returns true.
					 */
				4986	struct drm_i915_gem_object *obj =
				4987	container_of(head, typeof(*obj), rcu);
				4988	struct drm_i915_private *i915 = to_i915(obj->base.dev);
				4989
Chris Wilson	2ef1e72	2018-01-15 20:57:59 +0000	[diff] [blame]	4990	/*
				4991	* Since we require blocking on struct_mutex to unbind the freed
				4992	* object from the GPU before releasing resources back to the
				4993	* system, we can not do that directly from the RCU callback (which may
				4994	* be a softirq context), but must instead then defer that work onto a
				4995	* kthread. We use the RCU callback rather than move the freed object
				4996	* directly onto the work queue so that we can mix between using the
				4997	* worker and performing frees directly from subsequent allocations for
				4998	* crude but effective memory throttling.
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	4999	*/
				5000	if (llist_add(&obj->freed, &i915->mm.free_list))
Chris Wilson	beacbd1	2018-01-15 12:28:45 +0000	[diff] [blame]	5001	queue_work(i915->wq, &i915->mm.free_work);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	5002	}
				5003
				5004	void i915_gem_free_object(struct drm_gem_object *gem_obj)
				5005	{
					/*
					 * Begin the deferred free of @gem_obj. The object is not released
					 * here: mm.free_count is incremented and the teardown is handed to
					 * __i915_gem_free_object_rcu() via call_rcu().
					 */
				5006	struct drm_i915_gem_object *obj = to_intel_bo(gem_obj);
				5007
					/* Drop the page pin held on behalf of a quirked object. */
Chris Wilson	bc0629a	2016-11-01 10:03:17 +0000	[diff] [blame]	5008	if (obj->mm.quirked)
				5009	__i915_gem_object_unpin_pages(obj);
				5010
					/* Mark the pages as not needed when the backing storage can be discarded. */
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	5011	if (discard_backing_storage(obj))
				5012	obj->mm.madv = I915_MADV_DONTNEED;
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	5013
Chris Wilson	2ef1e72	2018-01-15 20:57:59 +0000	[diff] [blame]	5014	/*
				5015	* Before we free the object, make sure any pure RCU-only
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	5016	* read-side critical sections are complete, e.g.
				5017	* i915_gem_busy_ioctl(). For the corresponding synchronized
				5018	* lookup see i915_gem_object_lookup_rcu().
				5019	*/
					/* Balanced by the atomic_dec() in __i915_gem_free_objects(). */
Chris Wilson	c9c70471	2018-02-19 22:06:31 +0000	[diff] [blame]	5020	atomic_inc(&to_i915(obj->base.dev)->mm.free_count);
Chris Wilson	fbbd37b	2016-10-28 13:58:42 +0100	[diff] [blame]	5021	call_rcu(&obj->rcu, __i915_gem_free_object_rcu);
Chris Wilson	be72615	2010-07-23 23:18:50 +0100	[diff] [blame]	5022	}
				5023
Chris Wilson	f8a7fde	2016-10-28 13:58:29 +0100	[diff] [blame]	5024	void __i915_gem_object_release_unless_active(struct drm_i915_gem_object *obj)
				5025	{
					/*
					 * Drop the caller's reference to @obj, unless the object is still
					 * active and has no active reference yet; in that case the
					 * active-reference flag is set and the reference is not dropped here.
					 * NOTE(review): presumably that reference is released once the
					 * object retires - confirm against the retirement path.
					 *
					 * Caller must hold struct_mutex.
					 */
				5026	lockdep_assert_held(&obj->base.dev->struct_mutex);
				5027
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	5028	if (!i915_gem_object_has_active_reference(obj) &&
				5029	i915_gem_object_is_active(obj))
Chris Wilson	f8a7fde	2016-10-28 13:58:29 +0100	[diff] [blame]	5030	i915_gem_object_set_active_reference(obj);
				5031	else
				5032	i915_gem_object_put(obj);
				5033	}
				5034
Chris Wilson	2414551	2017-01-24 11:01:35 +0000	[diff] [blame]	5035	void i915_gem_sanitize(struct drm_i915_private *i915)
				5036	{
					/*
					 * Bring the GPU back to a known state: clear a terminal wedge,
					 * attempt a full GPU reset where supported, sanitize the engines if
					 * that reset succeeded, and mark all contexts as lost. Runs under
					 * struct_mutex with runtime-PM and forcewake held around the HW
					 * access.
					 */
Chris Wilson	4fdd5b4	2018-06-16 21:25:34 +0100	[diff] [blame]	5037	int err;
Chris Wilson	c3160da	2018-05-31 09:22:45 +0100	[diff] [blame]	5038
				5039	GEM_TRACE("\n");
				5040
Chris Wilson	4dfacb0	2018-05-31 09:22:43 +0100	[diff] [blame]	5041	mutex_lock(&i915->drm.struct_mutex);
Chris Wilson	c3160da	2018-05-31 09:22:45 +0100	[diff] [blame]	5042
				5043	intel_runtime_pm_get(i915);
				5044	intel_uncore_forcewake_get(i915, FORCEWAKE_ALL);
				5045
				5046	/*
				5047	* As we have just resumed the machine and woken the device up from
				5048	* deep PCI sleep (presumably D3_cold), assume the HW has been reset
				5049	* back to defaults, recovering from whatever wedged state we left it
				5050	* in and so worth trying to use the device once more.
				5051	*/
Chris Wilson	4dfacb0	2018-05-31 09:22:43 +0100	[diff] [blame]	5052	if (i915_terminally_wedged(&i915->gpu_error))
Chris Wilson	f36325f	2017-08-26 12:09:34 +0100	[diff] [blame]	5053	i915_gem_unset_wedged(i915);
Chris Wilson	f36325f	2017-08-26 12:09:34 +0100	[diff] [blame]	5054
Chris Wilson	2414551	2017-01-24 11:01:35 +0000	[diff] [blame]	5055	/*
				5056	* If we inherit context state from the BIOS or earlier occupants
				5057	* of the GPU, the GPU may be in an inconsistent state when we
				5058	* try to take over. The only way to remove the earlier state
				5059	* is by resetting. However, resetting on earlier gen is tricky as
				5060	* it may impact the display and we are uncertain about the stability
Joonas Lahtinen	ea117b8	2017-04-28 10:53:38 +0300	[diff] [blame]	5061	* of the reset, so this could be applied to even earlier gen.
Chris Wilson	2414551	2017-01-24 11:01:35 +0000	[diff] [blame]	5062	*/
					/*
					 * err stays -ENODEV when no reset is attempted, so the engines are
					 * sanitized only after a reset that was tried and did not fail.
					 */
Chris Wilson	4fdd5b4	2018-06-16 21:25:34 +0100	[diff] [blame]	5063	err = -ENODEV;
Daniele Ceraolo Spurio	ce1599a	2018-02-07 13:24:40 -0800	[diff] [blame]	5064	if (INTEL_GEN(i915) >= 5 && intel_has_gpu_reset(i915))
Chris Wilson	4fdd5b4	2018-06-16 21:25:34 +0100	[diff] [blame]	5065	err = WARN_ON(intel_gpu_reset(i915, ALL_ENGINES));
				5066	if (!err)
				5067	intel_engines_sanitize(i915);
Chris Wilson	c3160da	2018-05-31 09:22:45 +0100	[diff] [blame]	5068
				5069	intel_uncore_forcewake_put(i915, FORCEWAKE_ALL);
				5070	intel_runtime_pm_put(i915);
				5071
Chris Wilson	4dfacb0	2018-05-31 09:22:43 +0100	[diff] [blame]	5072	i915_gem_contexts_lost(i915);
				5073	mutex_unlock(&i915->drm.struct_mutex);
Chris Wilson	2414551	2017-01-24 11:01:35 +0000	[diff] [blame]	5074	}
				5075
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5076	int i915_gem_suspend(struct drm_i915_private *i915)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5077	{
					/*
					 * Quiesce GEM ahead of suspend: switch to the kernel context, wait
					 * for the GPU to idle, retire requests, suspend the uC and flush the
					 * hangcheck/retire/idle workers.
					 *
					 * Returns 0 on success, or the error from switching to the kernel
					 * context or from waiting for idle. -EIO from the wait is tolerated
					 * and suspend continues. A runtime-PM reference is held throughout
					 * and released on every exit path.
					 */
Chris Wilson	dcff85c	2016-08-05 10:14:11 +0100	[diff] [blame]	5078	int ret;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5079
Chris Wilson	09a4c02	2018-05-24 09:11:35 +0100	[diff] [blame]	5080	GEM_TRACE("\n");
				5081
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5082	intel_runtime_pm_get(i915);
				5083	intel_suspend_gt_powersave(i915);
Chris Wilson	54b4f68	2016-07-21 21:16:19 +0100	[diff] [blame]	5084
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5085	mutex_lock(&i915->drm.struct_mutex);
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5086
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5087	/*
				5088	* We have to flush all the executing contexts to main memory so
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5089	* that they can be saved in the hibernation image. To ensure the last
				5090	* context image is coherent, we have to switch away from it. That
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5091	* leaves the i915->kernel_context still active when
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5092	* we actually suspend, and its image in memory may not match the GPU
				5093	* state. Fortunately, the kernel_context is disposable and we do
				5094	* not rely on its state.
				5095	*/
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5096	if (!i915_terminally_wedged(&i915->gpu_error)) {
				5097	ret = i915_gem_switch_to_kernel_context(i915);
Chris Wilson	ecf73eb	2017-11-30 10:29:51 +0000	[diff] [blame]	5098	if (ret)
				5099	goto err_unlock;
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5100
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5101	ret = i915_gem_wait_for_idle(i915,
Chris Wilson	ecf73eb	2017-11-30 10:29:51 +0000	[diff] [blame]	5102	I915_WAIT_INTERRUPTIBLE |
Chris Wilson	0606035	2018-05-31 09:22:44 +0100	[diff] [blame]	5103	I915_WAIT_LOCKED |
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	5104	I915_WAIT_FOR_IDLE_BOOST,
				5105	MAX_SCHEDULE_TIMEOUT);
					/* -EIO is not treated as fatal here; any other error aborts. */
Chris Wilson	ecf73eb	2017-11-30 10:29:51 +0000	[diff] [blame]	5106	if (ret && ret != -EIO)
				5107	goto err_unlock;
Chris Wilson	f740334	2013-09-13 23:57:04 +0100	[diff] [blame]	5108
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5109	assert_kernel_context_is_current(i915);
Chris Wilson	ecf73eb	2017-11-30 10:29:51 +0000	[diff] [blame]	5110	}
Chris Wilson	01f8f33	2018-07-17 09:41:21 +0100	[diff] [blame]	5111	i915_retire_requests(i915); /* ensure we flush after wedging */
				5112
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5113	mutex_unlock(&i915->drm.struct_mutex);
Chris Wilson	45c5f20	2013-10-16 11:50:01 +0100	[diff] [blame]	5114
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5115	intel_uc_suspend(i915);
Sagar Arun Kamble	63987bf	2017-04-05 15:51:50 +0530	[diff] [blame]	5116
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5117	cancel_delayed_work_sync(&i915->gpu_error.hangcheck_work);
				5118	cancel_delayed_work_sync(&i915->gt.retire_work);
Chris Wilson	bdeb978	2016-12-23 14:57:56 +0000	[diff] [blame]	5119
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5120	/*
				5121	* As the idle_work is rearming if it detects a race, play safe and
Chris Wilson	bdeb978	2016-12-23 14:57:56 +0000	[diff] [blame]	5122	* repeat the flush until it is definitely idle.
				5123	*/
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5124	drain_delayed_work(&i915->gt.idle_work);
Chris Wilson	bdeb978	2016-12-23 14:57:56 +0000	[diff] [blame]	5125
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5126	/*
				5127	* Assert that we successfully flushed all the work and
Chris Wilson	bdcf120	2014-11-25 11:56:33 +0000	[diff] [blame]	5128	* reset the GPU back to its idle, low power state.
				5129	*/
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5130	WARN_ON(i915->gt.awake);
				5131	if (WARN_ON(!intel_engines_are_idle(i915)))
				5132	i915_gem_set_wedged(i915); /* no hope, discard everything */
Chris Wilson	bdcf120	2014-11-25 11:56:33 +0000	[diff] [blame]	5133
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5134	intel_runtime_pm_put(i915);
Chris Wilson	ec92ad0	2018-05-31 09:22:46 +0100	[diff] [blame]	5135	return 0;
				5136
				5137	err_unlock:
Chris Wilson	bf06112	2018-07-09 14:02:04 +0100	[diff] [blame]	5138	mutex_unlock(&i915->drm.struct_mutex);
				5139	intel_runtime_pm_put(i915);
Chris Wilson	ec92ad0	2018-05-31 09:22:46 +0100	[diff] [blame]	5140	return ret;
				5141	}
				5142
				5143	void i915_gem_suspend_late(struct drm_i915_private *i915)
				5144	{
					/*
					 * Late suspend step: under struct_mutex, move every object on the
					 * unbound and bound lists to the GTT domain (warning on failure),
					 * then sanitize the uC and the GEM/GPU state.
					 */
Chris Wilson	9776f47	2018-06-01 15:41:24 +0100	[diff] [blame]	5145	struct drm_i915_gem_object *obj;
					/* NULL-terminated so the loop below can stop on *phase == NULL. */
				5146	struct list_head *phases[] = {
				5147	&i915->mm.unbound_list,
				5148	&i915->mm.bound_list,
				5149	NULL
				5150	}, **phase;
				5151
Imre Deak	1c777c5	2016-10-12 17:46:37 +0300	[diff] [blame]	5152	/*
				5153	* Neither the BIOS, ourselves or any other kernel
				5154	* expects the system to be in execlists mode on startup,
				5155	* so we need to reset the GPU back to legacy mode. And the only
				5156	* known way to disable logical contexts is through a GPU reset.
				5157	*
				5158	* So in order to leave the system in a known default configuration,
				5159	* always reset the GPU upon unload and suspend. Afterwards we then
				5160	* clean up the GEM state tracking, flushing off the requests and
				5161	* leaving the system in a known idle state.
				5162	*
				5163	* Note that it is of the utmost importance that the GPU is idle and
				5164	* all stray writes are flushed before we dismantle the backing
				5165	* storage for the pinned objects.
				5166	*
				5167	* However, since we are uncertain that resetting the GPU on older
				5168	* machines is a good idea, we don't - just in case it leaves the
				5169	* machine in an unusable condition.
				5170	*/
Chris Wilson	cad9946	2017-08-26 12:09:33 +0100	[diff] [blame]	5171
Chris Wilson	9776f47	2018-06-01 15:41:24 +0100	[diff] [blame]	5172	mutex_lock(&i915->drm.struct_mutex);
				5173	for (phase = phases; *phase; phase++) {
				5174	list_for_each_entry(obj, *phase, mm.link)
				5175	WARN_ON(i915_gem_object_set_to_gtt_domain(obj, false));
				5176	}
				5177	mutex_unlock(&i915->drm.struct_mutex);
				5178
Chris Wilson	ec92ad0	2018-05-31 09:22:46 +0100	[diff] [blame]	5179	intel_uc_sanitize(i915);
				5180	i915_gem_sanitize(i915);
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5181	}
				5182
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5183	void i915_gem_resume(struct drm_i915_private *i915)
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5184	{
					/*
					 * Restore GEM state after resume: GTT mappings and fences are
					 * restored, the gt.resume() hook is called, the HW is re-initialised
					 * and the kernel context is reloaded. If HW init or the context
					 * switch fails, the GPU is declared wedged (unless already terminally
					 * wedged). Nothing is returned to the caller. Runs under
					 * struct_mutex with forcewake held.
					 */
Chris Wilson	4dfacb0	2018-05-31 09:22:43 +0100	[diff] [blame]	5185	GEM_TRACE("\n");
				5186
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5187	WARN_ON(i915->gt.awake);
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5188
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5189	mutex_lock(&i915->drm.struct_mutex);
				5190	intel_uncore_forcewake_get(i915, FORCEWAKE_ALL);
Imre Deak	31ab49a	2016-11-07 11:20:05 +0200	[diff] [blame]	5191
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5192	i915_gem_restore_gtt_mappings(i915);
				5193	i915_gem_restore_fences(i915);
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5194
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5195	/*
				5196	* As we didn't flush the kernel context before suspend, we cannot
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5197	* guarantee that the context image is complete. So let's just reset
				5198	* it and start again.
				5199	*/
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5200	i915->gt.resume(i915);
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5201
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5202	if (i915_gem_init_hw(i915))
				5203	goto err_wedged;
				5204
Michal Wajdeczko	7cfca4a	2018-03-02 11:15:49 +0000	[diff] [blame]	5205	intel_uc_resume(i915);
Chris Wilson	7469c62	2017-11-14 13:03:00 +0000	[diff] [blame]	5206
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5207	/* Always reload a context for powersaving. */
				5208	if (i915_gem_switch_to_kernel_context(i915))
				5209	goto err_wedged;
				5210
					/* Common exit: reached directly on success and via err_wedged on failure. */
				5211	out_unlock:
				5212	intel_uncore_forcewake_put(i915, FORCEWAKE_ALL);
				5213	mutex_unlock(&i915->drm.struct_mutex);
				5214	return;
				5215
				5216	err_wedged:
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5217	if (!i915_terminally_wedged(&i915->gpu_error)) {
				5218	DRM_ERROR("failed to re-initialize GPU, declaring wedged!\n");
				5219	i915_gem_set_wedged(i915);
				5220	}
Chris Wilson	37cd330	2017-11-12 11:27:38 +0000	[diff] [blame]	5221	goto out_unlock;
Chris Wilson	5ab57c7	2016-07-15 14:56:20 +0100	[diff] [blame]	5222	}
				5223
Tvrtko Ursulin	c6be607	2016-11-16 08:55:31 +0000	[diff] [blame]	5224	void i915_gem_init_swizzling(struct drm_i915_private *dev_priv)
Daniel Vetter	f691e2f	2012-02-02 09:58:12 +0100	[diff] [blame]	5225	{
					/*
					 * Program the tiled-surface swizzling registers. Nothing is written
					 * on gen < 5 or when mm.bit_6_swizzle_x is I915_BIT_6_SWIZZLE_NONE.
					 * Gen5 only sets DISP_ARB_CTL; gen6-gen8 additionally set TILECTL
					 * and the per-generation arbiter swizzle bit. Any other generation
					 * reaching the final else hits BUG().
					 */
Tvrtko Ursulin	c6be607	2016-11-16 08:55:31 +0000	[diff] [blame]	5226	if (INTEL_GEN(dev_priv) < 5 ||
Daniel Vetter	f691e2f	2012-02-02 09:58:12 +0100	[diff] [blame]	5227	dev_priv->mm.bit_6_swizzle_x == I915_BIT_6_SWIZZLE_NONE)
				5228	return;
				5229
				5230	I915_WRITE(DISP_ARB_CTL, I915_READ(DISP_ARB_CTL) |
				5231	DISP_TILE_SURFACE_SWIZZLING);
				5232
Tvrtko Ursulin	5db9401	2016-10-13 11:03:10 +0100	[diff] [blame]	5233	if (IS_GEN5(dev_priv))
Daniel Vetter	11782b0	2012-01-31 16:47:55 +0100	[diff] [blame]	5234	return;
				5235
Daniel Vetter	f691e2f	2012-02-02 09:58:12 +0100	[diff] [blame]	5236	I915_WRITE(TILECTL, I915_READ(TILECTL) | TILECTL_SWZCTL);
Tvrtko Ursulin	5db9401	2016-10-13 11:03:10 +0100	[diff] [blame]	5237	if (IS_GEN6(dev_priv))
Daniel Vetter	6b26c86	2012-04-24 14:04:12 +0200	[diff] [blame]	5238	I915_WRITE(ARB_MODE, _MASKED_BIT_ENABLE(ARB_MODE_SWIZZLE_SNB));
Tvrtko Ursulin	5db9401	2016-10-13 11:03:10 +0100	[diff] [blame]	5239	else if (IS_GEN7(dev_priv))
Daniel Vetter	6b26c86	2012-04-24 14:04:12 +0200	[diff] [blame]	5240	I915_WRITE(ARB_MODE, _MASKED_BIT_ENABLE(ARB_MODE_SWIZZLE_IVB));
Tvrtko Ursulin	5db9401	2016-10-13 11:03:10 +0100	[diff] [blame]	5241	else if (IS_GEN8(dev_priv))
Ben Widawsky	31a5336	2013-11-02 21:07:04 -0700	[diff] [blame]	5242	I915_WRITE(GAMTARBMODE, _MASKED_BIT_ENABLE(ARB_MODE_SWIZZLE_BDW));
Ben Widawsky	8782e26	2012-12-18 10:31:23 -0800	[diff] [blame]	5243	else
				5244	BUG();
Daniel Vetter	f691e2f	2012-02-02 09:58:12 +0100	[diff] [blame]	5245	}
Daniel Vetter	e21af88	2012-02-09 20:53:27 +0100	[diff] [blame]	5246
Tvrtko Ursulin	50a0bc9	2016-10-13 11:02:58 +0100	[diff] [blame]	5247	static void init_unused_ring(struct drm_i915_private *dev_priv, u32 base)
Ville Syrjälä	81e7f20	2014-08-15 01:21:55 +0300	[diff] [blame]	5248	{
					/* Zero the CTL, HEAD, TAIL and START registers of the ring at @base. */
Ville Syrjälä	81e7f20	2014-08-15 01:21:55 +0300	[diff] [blame]	5249	I915_WRITE(RING_CTL(base), 0);
				5250	I915_WRITE(RING_HEAD(base), 0);
				5251	I915_WRITE(RING_TAIL(base), 0);
				5252	I915_WRITE(RING_START(base), 0);
				5253	}
				5254
Tvrtko Ursulin	50a0bc9	2016-10-13 11:02:58 +0100	[diff] [blame]	5255	static void init_unused_rings(struct drm_i915_private *dev_priv)
Ville Syrjälä	81e7f20	2014-08-15 01:21:55 +0300	[diff] [blame]	5256	{
					/*
					 * Clear the registers of a platform-specific set of rings via
					 * init_unused_ring(): one set for i830, one for other gen2 and one
					 * for gen3. Other platforms are left untouched.
					 */
Tvrtko Ursulin	50a0bc9	2016-10-13 11:02:58 +0100	[diff] [blame]	5257	if (IS_I830(dev_priv)) {
				5258	init_unused_ring(dev_priv, PRB1_BASE);
				5259	init_unused_ring(dev_priv, SRB0_BASE);
				5260	init_unused_ring(dev_priv, SRB1_BASE);
				5261	init_unused_ring(dev_priv, SRB2_BASE);
				5262	init_unused_ring(dev_priv, SRB3_BASE);
				5263	} else if (IS_GEN2(dev_priv)) {
				5264	init_unused_ring(dev_priv, SRB0_BASE);
				5265	init_unused_ring(dev_priv, SRB1_BASE);
				5266	} else if (IS_GEN3(dev_priv)) {
				5267	init_unused_ring(dev_priv, PRB1_BASE);
				5268	init_unused_ring(dev_priv, PRB2_BASE);
Ville Syrjälä	81e7f20	2014-08-15 01:21:55 +0300	[diff] [blame]	5269	}
				5270	}
				5271
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5272	static int __i915_gem_restart_engines(void *data)
Ben Widawsky	4fc7c97	2013-02-08 11:49:24 -0800	[diff] [blame]	5273	{
					/*
					 * Call ->init_hw() on every engine of the device passed in @data
					 * (a struct drm_i915_private pointer). Stops at the first failure,
					 * logs it and returns that error; returns 0 if all engines succeed.
					 */
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5274	struct drm_i915_private *i915 = data;
Tvrtko Ursulin	e2f8039	2016-03-16 11:00:36 +0000	[diff] [blame]	5275	struct intel_engine_cs *engine;
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	5276	enum intel_engine_id id;
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5277	int err;
				5278
				5279	for_each_engine(engine, i915, id) {
				5280	err = engine->init_hw(engine);
Chris Wilson	8177e11	2018-02-07 11:15:45 +0000	[diff] [blame]	5281	if (err) {
				5282	DRM_ERROR("Failed to restart %s (%d)\n",
				5283	engine->name, err);
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5284	return err;
Chris Wilson	8177e11	2018-02-07 11:15:45 +0000	[diff] [blame]	5285	}
Chris Wilson	20a8a74	2017-02-08 14:30:31 +0000	[diff] [blame]	5286	}
				5287
				5288	return 0;
				5289	}
				5290
				5291	int i915_gem_init_hw(struct drm_i915_private *dev_priv)
				5292	{
					/*
					 * (Re)initialise the GT hardware: platform register setup,
					 * workarounds, swizzling, unused rings, then PPGTT, WOPCM, uC, the
					 * MOCS L3CC table and finally every engine.
					 *
					 * Returns 0 on success, -EIO if the GPU is terminally wedged, or the
					 * error from the first init step that failed. FORCEWAKE_ALL is held
					 * for the duration and released on every exit path.
					 */
Chris Wilson	d200cda	2016-04-28 09:56:44 +0100	[diff] [blame]	5293	int ret;
Ben Widawsky	4fc7c97	2013-02-08 11:49:24 -0800	[diff] [blame]	5294
Chris Wilson	de867c2	2016-10-25 13:16:02 +0100	[diff] [blame]	5295	dev_priv->gt.last_init_time = ktime_get();
				5296
Chris Wilson	5e4f518	2015-02-13 14:35:59 +0000	[diff] [blame]	5297	/* Double layer security blanket, see i915_gem_init() */
				5298	intel_uncore_forcewake_get(dev_priv, FORCEWAKE_ALL);
				5299
Tvrtko Ursulin	0031fb9	2016-11-04 14:42:44 +0000	[diff] [blame]	5300	if (HAS_EDRAM(dev_priv) && INTEL_GEN(dev_priv) < 9)
Ben Widawsky	05e21cc	2013-07-04 11:02:04 -0700	[diff] [blame]	5301	I915_WRITE(HSW_IDICR, I915_READ(HSW_IDICR) | IDIHASHMSK(0xf));
Ben Widawsky	4fc7c97	2013-02-08 11:49:24 -0800	[diff] [blame]	5302
Tvrtko Ursulin	772c2a5	2016-10-13 11:03:01 +0100	[diff] [blame]	5303	if (IS_HASWELL(dev_priv))
Tvrtko Ursulin	50a0bc9	2016-10-13 11:02:58 +0100	[diff] [blame]	5304	I915_WRITE(MI_PREDICATE_RESULT_2, IS_HSW_GT3(dev_priv) ?
Ville Syrjälä	0bf2134	2013-11-29 14:56:12 +0200	[diff] [blame]	5305	LOWER_SLICE_ENABLED : LOWER_SLICE_DISABLED);
Rodrigo Vivi	9435373	2013-08-28 16:45:46 -0300	[diff] [blame]	5306
Oscar Mateo	59b449d	2018-04-10 09:12:47 -0700	[diff] [blame]	5307	intel_gt_workarounds_apply(dev_priv);
				5308
Tvrtko Ursulin	c6be607	2016-11-16 08:55:31 +0000	[diff] [blame]	5309	i915_gem_init_swizzling(dev_priv);
Ben Widawsky	4fc7c97	2013-02-08 11:49:24 -0800	[diff] [blame]	5310
Daniel Vetter	d5abdfd	2014-11-20 09:45:19 +0100	[diff] [blame]	5311	/*
				5312	* At least 830 can leave some of the unused rings
				5313	* "active" (ie. head != tail) after resume which
				5314	* will prevent c3 entry. Makes sure all unused rings
				5315	* are totally idle.
				5316	*/
Tvrtko Ursulin	50a0bc9	2016-10-13 11:02:58 +0100	[diff] [blame]	5317	init_unused_rings(dev_priv);
Daniel Vetter	d5abdfd	2014-11-20 09:45:19 +0100	[diff] [blame]	5318
Dave Gordon	ed54c1a	2016-01-19 19:02:54 +0000	[diff] [blame]	5319	BUG_ON(!dev_priv->kernel_context);
					/* The register setup above still ran; only the remaining steps are skipped. */
Chris Wilson	6f74b36	2017-10-15 15:37:25 +0100	[diff] [blame]	5320	if (i915_terminally_wedged(&dev_priv->gpu_error)) {
				5321	ret = -EIO;
				5322	goto out;
				5323	}
John Harrison	90638cc	2015-05-29 17:43:37 +0100	[diff] [blame]	5324
Tvrtko Ursulin	c6be607	2016-11-16 08:55:31 +0000	[diff] [blame]	5325	ret = i915_ppgtt_init_hw(dev_priv);
John Harrison	4ad2fd8	2015-06-18 13:11:20 +0100	[diff] [blame]	5326	if (ret) {
Chris Wilson	8177e11	2018-02-07 11:15:45 +0000	[diff] [blame]	5327	DRM_ERROR("Enabling PPGTT failed (%d)\n", ret);
John Harrison	4ad2fd8	2015-06-18 13:11:20 +0100	[diff] [blame]	5328	goto out;
				5329	}
				5330
Jackie Li	f08e203	2018-03-13 17:32:53 -0700	[diff] [blame]	5331	ret = intel_wopcm_init_hw(&dev_priv->wopcm);
				5332	if (ret) {
				5333	DRM_ERROR("Enabling WOPCM failed (%d)\n", ret);
				5334	goto out;
				5335	}
				5336
Michał Winiarski	9bdc357	2017-10-25 18:25:19 +0100	[diff] [blame]	5337	/* We can't enable contexts until all firmware is loaded */
				5338	ret = intel_uc_init_hw(dev_priv);
Chris Wilson	8177e11	2018-02-07 11:15:45 +0000	[diff] [blame]	5339	if (ret) {
				5340	DRM_ERROR("Enabling uc failed (%d)\n", ret);
Michał Winiarski	9bdc357	2017-10-25 18:25:19 +0100	[diff] [blame]	5341	goto out;
Chris Wilson	8177e11	2018-02-07 11:15:45 +0000	[diff] [blame]	5342	}
Michał Winiarski	9bdc357	2017-10-25 18:25:19 +0100	[diff] [blame]	5343
Tvrtko Ursulin	bf9e842	2016-12-01 14:16:38 +0000	[diff] [blame]	5344	intel_mocs_init_l3cc_table(dev_priv);
Peter Antoine	0ccdacf	2016-04-13 15:03:25 +0100	[diff] [blame]	5345
Chris Wilson	136109c	2017-11-02 13:14:30 +0000	[diff] [blame]	5346	/* Only when the HW is re-initialised, can we replay the requests */
				5347	ret = __i915_gem_restart_engines(dev_priv);
Michal Wajdeczko	b96f6eb	2018-06-05 12:24:43 +0000	[diff] [blame]	5348	if (ret)
				5349	goto cleanup_uc;
Michał Winiarski	60c0a66	2018-07-12 14:48:10 +0200	[diff] [blame]	5350
Chris Wilson	5e4f518	2015-02-13 14:35:59 +0000	[diff] [blame]	5351	intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL);
Michał Winiarski	60c0a66	2018-07-12 14:48:10 +0200	[diff] [blame]	5352
				5353	return 0;
Michal Wajdeczko	b96f6eb	2018-06-05 12:24:43 +0000	[diff] [blame]	5354
					/* Undo intel_uc_init_hw(), then fall through to the common exit. */
				5355	cleanup_uc:
				5356	intel_uc_fini_hw(dev_priv);
Michał Winiarski	60c0a66	2018-07-12 14:48:10 +0200	[diff] [blame]	5357	out:
				5358	intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL);
				5359
				5360	return ret;
Zou Nan hai	8187a2b	2010-05-21 09:08:55 +0800	[diff] [blame]	5361	}
				5362
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5363	static int __intel_engines_record_defaults(struct drm_i915_private *i915)
				5364	{
				5365	struct i915_gem_context *ctx;
				5366	struct intel_engine_cs *engine;
				5367	enum intel_engine_id id;
				5368	int err;
				5369
				5370	/*
				5371	* As we reset the gpu during very early sanitisation, the current
				5372	* register state on the GPU should reflect its defaults values.
				5373	* We load a context onto the hw (with restore-inhibit), then switch
				5374	* over to a second context to save that default register state. We
				5375	* can then prime every new context with that state so they all start
				5376	* from the same default HW values.
				5377	*/
				5378
				5379	ctx = i915_gem_context_create_kernel(i915, 0);
				5380	if (IS_ERR(ctx))
				5381	return PTR_ERR(ctx);
				5382
				5383	for_each_engine(engine, i915, id) {
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	5384	struct i915_request *rq;
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5385
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	5386	rq = i915_request_alloc(engine, ctx);
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5387	if (IS_ERR(rq)) {
				5388	err = PTR_ERR(rq);
				5389	goto out_ctx;
				5390	}
				5391
Chris Wilson	3fef5cd	2017-11-20 10:20:02 +0000	[diff] [blame]	5392	err = 0;
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5393	if (engine->init_context)
				5394	err = engine->init_context(rq);
				5395
Chris Wilson	697b9a8	2018-06-12 11:51:35 +0100	[diff] [blame]	5396	i915_request_add(rq);
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5397	if (err)
				5398	goto err_active;
				5399	}
				5400
				5401	err = i915_gem_switch_to_kernel_context(i915);
				5402	if (err)
				5403	goto err_active;
				5404
Chris Wilson	2621cef	2018-07-09 13:20:43 +0100	[diff] [blame]	5405	if (i915_gem_wait_for_idle(i915, I915_WAIT_LOCKED, HZ / 5)) {
				5406	i915_gem_set_wedged(i915);
				5407	err = -EIO; /* Caller will declare us wedged */
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5408	goto err_active;
Chris Wilson	2621cef	2018-07-09 13:20:43 +0100	[diff] [blame]	5409	}
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5410
				5411	assert_kernel_context_is_current(i915);
				5412
Chris Wilson	8e1cb32	2018-09-20 17:13:43 +0100	[diff] [blame]	5413	/*
				5414	* Immediately park the GPU so that we enable powersaving and
				5415	* treat it as idle. The next time we issue a request, we will
				5416	* unpark and start using the engine->pinned_default_state, otherwise
				5417	* it is in limbo and an early reset may fail.
				5418	*/
				5419	__i915_gem_park(i915);
				5420
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5421	for_each_engine(engine, i915, id) {
				5422	struct i915_vma *state;
Chris Wilson	37d7c9c	2018-09-14 13:35:03 +0100	[diff] [blame]	5423	void *vaddr;
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5424
Chris Wilson	666424a	2018-09-14 13:35:04 +0100	[diff] [blame]	5425	GEM_BUG_ON(to_intel_context(ctx, engine)->pin_count);
				5426
Chris Wilson	ab82a06	2018-04-30 14:15:01 +0100	[diff] [blame]	5427	state = to_intel_context(ctx, engine)->state;
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5428	if (!state)
				5429	continue;
				5430
				5431	/*
				5432	* As we will hold a reference to the logical state, it will
				5433	* not be torn down with the context, and importantly the
				5434	* object will hold onto its vma (making it possible for a
				5435	* stray GTT write to corrupt our defaults). Unmap the vma
				5436	* from the GTT to prevent such accidents and reclaim the
				5437	* space.
				5438	*/
				5439	err = i915_vma_unbind(state);
				5440	if (err)
				5441	goto err_active;
				5442
				5443	err = i915_gem_object_set_to_cpu_domain(state->obj, false);
				5444	if (err)
				5445	goto err_active;
				5446
				5447	engine->default_state = i915_gem_object_get(state->obj);
Chris Wilson	37d7c9c	2018-09-14 13:35:03 +0100	[diff] [blame]	5448
				5449	/* Check we can acquire the image of the context state */
				5450	vaddr = i915_gem_object_pin_map(engine->default_state,
Chris Wilson	666424a	2018-09-14 13:35:04 +0100	[diff] [blame]	5451	I915_MAP_FORCE_WB);
Chris Wilson	37d7c9c	2018-09-14 13:35:03 +0100	[diff] [blame]	5452	if (IS_ERR(vaddr)) {
				5453	err = PTR_ERR(vaddr);
				5454	goto err_active;
				5455	}
				5456
				5457	i915_gem_object_unpin_map(engine->default_state);
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5458	}
				5459
				5460	if (IS_ENABLED(CONFIG_DRM_I915_DEBUG_GEM)) {
				5461	unsigned int found = intel_engines_has_context_isolation(i915);
				5462
				5463	/*
				5464	* Make sure that classes with multiple engine instances all
				5465	* share the same basic configuration.
				5466	*/
				5467	for_each_engine(engine, i915, id) {
				5468	unsigned int bit = BIT(engine->uabi_class);
				5469	unsigned int expected = engine->default_state ? bit : 0;
				5470
				5471	if ((found & bit) != expected) {
				5472	DRM_ERROR("mismatching default context state for class %d on engine %s\n",
				5473	engine->uabi_class, engine->name);
				5474	}
				5475	}
				5476	}
				5477
				5478	out_ctx:
				5479	i915_gem_context_set_closed(ctx);
				5480	i915_gem_context_put(ctx);
				5481	return err;
				5482
				5483	err_active:
				5484	/*
				5485	* If we have to abandon now, we expect the engines to be idle
				5486	* and ready to be torn-down. First try to flush any remaining
				5487	* request, ensure we are pointing at the kernel context and
				5488	* then remove it.
				5489	*/
				5490	if (WARN_ON(i915_gem_switch_to_kernel_context(i915)))
				5491	goto out_ctx;
				5492
Chris Wilson	ec625fb	2018-07-09 13:20:42 +0100	[diff] [blame]	5493	if (WARN_ON(i915_gem_wait_for_idle(i915,
				5494	I915_WAIT_LOCKED,
				5495	MAX_SCHEDULE_TIMEOUT)))
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5496	goto out_ctx;
				5497
				5498	i915_gem_contexts_lost(i915);
				5499	goto out_ctx;
				5500	}
				5501
Tvrtko Ursulin	bf9e842	2016-12-01 14:16:38 +0000	[diff] [blame]	5502	int i915_gem_init(struct drm_i915_private *dev_priv)
Chris Wilson	1070a42	2012-04-24 15:47:41 +0100	[diff] [blame]	5503	{
Chris Wilson	1070a42	2012-04-24 15:47:41 +0100	[diff] [blame]	5504	int ret;
				5505
Changbin Du	52b2416	2018-05-08 17:07:05 +0800	[diff] [blame]	5506	/* We need to fallback to 4K pages if host doesn't support huge gtt. */
				5507	if (intel_vgpu_active(dev_priv) && !intel_vgpu_has_huge_gtt(dev_priv))
Matthew Auld	da9fe3f3	2017-10-06 23:18:31 +0100	[diff] [blame]	5508	mkwrite_device_info(dev_priv)->page_sizes =
				5509	I915_GTT_PAGE_SIZE_4K;
				5510
Chris Wilson	9431282	2017-05-03 10:39:18 +0100	[diff] [blame]	5511	dev_priv->mm.unordered_timeline = dma_fence_context_alloc(1);
Chris Wilson	57822dc	2017-02-22 11:40:48 +0000	[diff] [blame]	5512
Chris Wilson	fb5c551	2017-11-20 20:55:00 +0000	[diff] [blame]	5513	if (HAS_LOGICAL_RING_CONTEXTS(dev_priv)) {
Chris Wilson	821ed7d	2016-09-09 14:11:53 +0100	[diff] [blame]	5514	dev_priv->gt.resume = intel_lr_context_resume;
Tvrtko Ursulin	117897f	2016-03-16 11:00:40 +0000	[diff] [blame]	5515	dev_priv->gt.cleanup_engine = intel_logical_ring_cleanup;
Chris Wilson	fb5c551	2017-11-20 20:55:00 +0000	[diff] [blame]	5516	} else {
				5517	dev_priv->gt.resume = intel_legacy_submission_resume;
				5518	dev_priv->gt.cleanup_engine = intel_engine_cleanup;
Oscar Mateo	a83014d	2014-07-24 17:04:21 +0100	[diff] [blame]	5519	}
				5520
Chris Wilson	ee48700	2017-11-22 17:26:21 +0000	[diff] [blame]	5521	ret = i915_gem_init_userptr(dev_priv);
				5522	if (ret)
				5523	return ret;
				5524
Sagar Arun Kamble	70deead	2018-01-24 21:16:58 +0530	[diff] [blame]	5525	ret = intel_uc_init_misc(dev_priv);
Michał Winiarski	3176ff4	2017-12-13 23:13:47 +0100	[diff] [blame]	5526	if (ret)
				5527	return ret;
				5528
Michal Wajdeczko	f7dc015	2018-06-28 14:15:21 +0000	[diff] [blame]	5529	ret = intel_wopcm_init(&dev_priv->wopcm);
				5530	if (ret)
				5531	goto err_uc_misc;
				5532
Chris Wilson	5e4f518	2015-02-13 14:35:59 +0000	[diff] [blame]	5533	/* This is just a security blanket to placate dragons.
				5534	* On some systems, we very sporadically observe that the first TLBs
				5535	* used by the CS may be stale, despite us poking the TLB reset. If
				5536	* we hold the forcewake during initialisation these problems
				5537	* just magically go away.
				5538	*/
Chris Wilson	ee48700	2017-11-22 17:26:21 +0000	[diff] [blame]	5539	mutex_lock(&dev_priv->drm.struct_mutex);
Chris Wilson	5e4f518	2015-02-13 14:35:59 +0000	[diff] [blame]	5540	intel_uncore_forcewake_get(dev_priv, FORCEWAKE_ALL);
				5541
Chris Wilson	f6b9d5c	2016-08-04 07:52:23 +0100	[diff] [blame]	5542	ret = i915_gem_init_ggtt(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5543	if (ret) {
				5544	GEM_BUG_ON(ret == -EIO);
				5545	goto err_unlock;
				5546	}
Jesse Barnes	d62b489	2013-03-08 10:45:53 -0800	[diff] [blame]	5547
Chris Wilson	829a0af	2017-06-20 12:05:45 +0100	[diff] [blame]	5548	ret = i915_gem_contexts_init(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5549	if (ret) {
				5550	GEM_BUG_ON(ret == -EIO);
				5551	goto err_ggtt;
				5552	}
Ben Widawsky	2fa48d8	2013-12-06 14:11:04 -0800	[diff] [blame]	5553
Tvrtko Ursulin	bf9e842	2016-12-01 14:16:38 +0000	[diff] [blame]	5554	ret = intel_engines_init(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5555	if (ret) {
				5556	GEM_BUG_ON(ret == -EIO);
				5557	goto err_context;
				5558	}
Daniel Vetter	53ca26c	2012-04-26 23:28:03 +0200	[diff] [blame]	5559
Chris Wilson	f58d13d	2017-11-10 14:26:29 +0000	[diff] [blame]	5560	intel_init_gt_powersave(dev_priv);
				5561
Michał Winiarski	61b5c15	2017-12-13 23:13:48 +0100	[diff] [blame]	5562	ret = intel_uc_init(dev_priv);
Chris Wilson	cc6a818	2017-11-10 14:26:30 +0000	[diff] [blame]	5563	if (ret)
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5564	goto err_pm;
Chris Wilson	cc6a818	2017-11-10 14:26:30 +0000	[diff] [blame]	5565
Michał Winiarski	61b5c15	2017-12-13 23:13:48 +0100	[diff] [blame]	5566	ret = i915_gem_init_hw(dev_priv);
				5567	if (ret)
				5568	goto err_uc_init;
				5569
Chris Wilson	cc6a818	2017-11-10 14:26:30 +0000	[diff] [blame]	5570	/*
				5571	* Despite its name intel_init_clock_gating applies both display
				5572	* clock gating workarounds; GT mmio workarounds and the occasional
				5573	* GT power context workaround. Worse, sometimes it includes a context
				5574	* register workaround which we need to apply before we record the
				5575	* default HW state for all contexts.
				5576	*
				5577	* FIXME: break up the workarounds and apply them at the right time!
				5578	*/
				5579	intel_init_clock_gating(dev_priv);
				5580
Chris Wilson	d2b4b97	2017-11-10 14:26:33 +0000	[diff] [blame]	5581	ret = __intel_engines_record_defaults(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5582	if (ret)
				5583	goto err_init_hw;
				5584
				5585	if (i915_inject_load_failure()) {
				5586	ret = -ENODEV;
				5587	goto err_init_hw;
				5588	}
				5589
				5590	if (i915_inject_load_failure()) {
				5591	ret = -EIO;
				5592	goto err_init_hw;
				5593	}
				5594
				5595	intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL);
				5596	mutex_unlock(&dev_priv->drm.struct_mutex);
				5597
				5598	return 0;
				5599
				5600	/*
				5601	* Unwinding is complicated by that we want to handle -EIO to mean
				5602	* disable GPU submission but keep KMS alive. We want to mark the
				5603	* HW as irrevisibly wedged, but keep enough state around that the
				5604	* driver doesn't explode during runtime.
				5605	*/
				5606	err_init_hw:
Chris Wilson	8571a05	2018-06-06 15:54:41 +0100	[diff] [blame]	5607	mutex_unlock(&dev_priv->drm.struct_mutex);
				5608
				5609	WARN_ON(i915_gem_suspend(dev_priv));
				5610	i915_gem_suspend_late(dev_priv);
				5611
Chris Wilson	8bcf9f7	2018-07-10 10:44:20 +0100	[diff] [blame]	5612	i915_gem_drain_workqueue(dev_priv);
				5613
Chris Wilson	8571a05	2018-06-06 15:54:41 +0100	[diff] [blame]	5614	mutex_lock(&dev_priv->drm.struct_mutex);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5615	intel_uc_fini_hw(dev_priv);
Michał Winiarski	61b5c15	2017-12-13 23:13:48 +0100	[diff] [blame]	5616	err_uc_init:
				5617	intel_uc_fini(dev_priv);
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5618	err_pm:
				5619	if (ret != -EIO) {
				5620	intel_cleanup_gt_powersave(dev_priv);
				5621	i915_gem_cleanup_engines(dev_priv);
				5622	}
				5623	err_context:
				5624	if (ret != -EIO)
				5625	i915_gem_contexts_fini(dev_priv);
				5626	err_ggtt:
				5627	err_unlock:
				5628	intel_uncore_forcewake_put(dev_priv, FORCEWAKE_ALL);
				5629	mutex_unlock(&dev_priv->drm.struct_mutex);
				5630
Michal Wajdeczko	f7dc015	2018-06-28 14:15:21 +0000	[diff] [blame]	5631	err_uc_misc:
Sagar Arun Kamble	70deead	2018-01-24 21:16:58 +0530	[diff] [blame]	5632	intel_uc_fini_misc(dev_priv);
Sagar Arun Kamble	da943b5	2018-01-10 18:24:16 +0530	[diff] [blame]	5633
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5634	if (ret != -EIO)
				5635	i915_gem_cleanup_userptr(dev_priv);
				5636
Chris Wilson	6099032	2014-04-09 09:19:42 +0100	[diff] [blame]	5637	if (ret == -EIO) {
Chris Wilson	7ed43df	2018-07-26 09:50:32 +0100	[diff] [blame]	5638	mutex_lock(&dev_priv->drm.struct_mutex);
				5639
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5640	/*
				5641	* Allow engine initialisation to fail by marking the GPU as
Chris Wilson	6099032	2014-04-09 09:19:42 +0100	[diff] [blame]	5642	* wedged. But we only want to do this where the GPU is angry,
				5643	* for all other failure, such as an allocation failure, bail.
				5644	*/
Chris Wilson	6f74b36	2017-10-15 15:37:25 +0100	[diff] [blame]	5645	if (!i915_terminally_wedged(&dev_priv->gpu_error)) {
Chris Wilson	51c18bf	2018-06-09 12:10:58 +0100	[diff] [blame]	5646	i915_load_error(dev_priv,
				5647	"Failed to initialize GPU, declaring it wedged!\n");
Chris Wilson	6f74b36	2017-10-15 15:37:25 +0100	[diff] [blame]	5648	i915_gem_set_wedged(dev_priv);
				5649	}
Chris Wilson	7ed43df	2018-07-26 09:50:32 +0100	[diff] [blame]	5650
				5651	/* Minimal basic recovery for KMS */
				5652	ret = i915_ggtt_enable_hw(dev_priv);
				5653	i915_gem_restore_gtt_mappings(dev_priv);
				5654	i915_gem_restore_fences(dev_priv);
				5655	intel_init_clock_gating(dev_priv);
				5656
				5657	mutex_unlock(&dev_priv->drm.struct_mutex);
Chris Wilson	1070a42	2012-04-24 15:47:41 +0100	[diff] [blame]	5658	}
				5659
Chris Wilson	6ca9a2b	2017-12-13 13:43:47 +0000	[diff] [blame]	5660	i915_gem_drain_freed_objects(dev_priv);
Chris Wilson	6099032	2014-04-09 09:19:42 +0100	[diff] [blame]	5661	return ret;
Chris Wilson	1070a42	2012-04-24 15:47:41 +0100	[diff] [blame]	5662	}
				5663
Michal Wajdeczko	8979187a	2018-06-04 09:00:32 +0000	[diff] [blame]	5664	void i915_gem_fini(struct drm_i915_private *dev_priv)
				5665	{
				5666	i915_gem_suspend_late(dev_priv);
Chris Wilson	30b71084	2018-08-12 23:36:29 +0100	[diff] [blame]	5667	intel_disable_gt_powersave(dev_priv);
Michal Wajdeczko	8979187a	2018-06-04 09:00:32 +0000	[diff] [blame]	5668
				5669	/* Flush any outstanding unpin_work. */
				5670	i915_gem_drain_workqueue(dev_priv);
				5671
				5672	mutex_lock(&dev_priv->drm.struct_mutex);
				5673	intel_uc_fini_hw(dev_priv);
				5674	intel_uc_fini(dev_priv);
				5675	i915_gem_cleanup_engines(dev_priv);
				5676	i915_gem_contexts_fini(dev_priv);
				5677	mutex_unlock(&dev_priv->drm.struct_mutex);
				5678
Chris Wilson	30b71084	2018-08-12 23:36:29 +0100	[diff] [blame]	5679	intel_cleanup_gt_powersave(dev_priv);
				5680
Michal Wajdeczko	8979187a	2018-06-04 09:00:32 +0000	[diff] [blame]	5681	intel_uc_fini_misc(dev_priv);
				5682	i915_gem_cleanup_userptr(dev_priv);
				5683
				5684	i915_gem_drain_freed_objects(dev_priv);
				5685
				5686	WARN_ON(!list_empty(&dev_priv->contexts.list));
				5687	}
				5688
/*
 * i915_gem_init_mmio - GEM hook for the mmio initialisation stage.
 *
 * Currently this only forwards to i915_gem_sanitize().
 */
void i915_gem_init_mmio(struct drm_i915_private *i915)
{
	i915_gem_sanitize(i915);
}
				5693
Zou Nan hai	8187a2b	2010-05-21 09:08:55 +0800	[diff] [blame]	5694	void
Tvrtko Ursulin	cb15d9f	2016-12-01 14:16:39 +0000	[diff] [blame]	5695	i915_gem_cleanup_engines(struct drm_i915_private *dev_priv)
Zou Nan hai	8187a2b	2010-05-21 09:08:55 +0800	[diff] [blame]	5696	{
Tvrtko Ursulin	e2f8039	2016-03-16 11:00:36 +0000	[diff] [blame]	5697	struct intel_engine_cs *engine;
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	5698	enum intel_engine_id id;
Zou Nan hai	8187a2b	2010-05-21 09:08:55 +0800	[diff] [blame]	5699
Akash Goel	3b3f165	2016-10-13 22:44:48 +0530	[diff] [blame]	5700	for_each_engine(engine, dev_priv, id)
Tvrtko Ursulin	117897f	2016-03-16 11:00:40 +0000	[diff] [blame]	5701	dev_priv->gt.cleanup_engine(engine);
Zou Nan hai	8187a2b	2010-05-21 09:08:55 +0800	[diff] [blame]	5702	}
				5703
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5704	void
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5705	i915_gem_load_init_fences(struct drm_i915_private *dev_priv)
				5706	{
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	5707	int i;
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5708
Tvrtko Ursulin	c56b89f	2018-02-09 21:58:46 +0000	[diff] [blame]	5709	if (INTEL_GEN(dev_priv) >= 7 && !IS_VALLEYVIEW(dev_priv) &&
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5710	!IS_CHERRYVIEW(dev_priv))
				5711	dev_priv->num_fence_regs = 32;
Tvrtko Ursulin	c56b89f	2018-02-09 21:58:46 +0000	[diff] [blame]	5712	else if (INTEL_GEN(dev_priv) >= 4 \|\|
Jani Nikula	73f67aa	2016-12-07 22:48:09 +0200	[diff] [blame]	5713	IS_I945G(dev_priv) \|\| IS_I945GM(dev_priv) \|\|
				5714	IS_G33(dev_priv) \|\| IS_PINEVIEW(dev_priv))
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5715	dev_priv->num_fence_regs = 16;
				5716	else
				5717	dev_priv->num_fence_regs = 8;
				5718
Chris Wilson	c033666	2016-05-06 15:40:21 +0100	[diff] [blame]	5719	if (intel_vgpu_active(dev_priv))
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5720	dev_priv->num_fence_regs =
				5721	I915_READ(vgtif_reg(avail_rs.fence_num));
				5722
				5723	/* Initialize fence registers to zero */
Chris Wilson	49ef529	2016-08-18 17:17:00 +0100	[diff] [blame]	5724	for (i = 0; i < dev_priv->num_fence_regs; i++) {
				5725	struct drm_i915_fence_reg *fence = &dev_priv->fence_regs[i];
				5726
				5727	fence->i915 = dev_priv;
				5728	fence->id = i;
				5729	list_add_tail(&fence->link, &dev_priv->mm.fence_list);
				5730	}
Tvrtko Ursulin	4362f4f	2016-11-16 08:55:33 +0000	[diff] [blame]	5731	i915_gem_restore_fences(dev_priv);
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5732
Tvrtko Ursulin	4362f4f	2016-11-16 08:55:33 +0000	[diff] [blame]	5733	i915_gem_detect_bit_6_swizzle(dev_priv);
Imre Deak	40ae4e1	2016-03-16 14:54:03 +0200	[diff] [blame]	5734	}
				5735
Chris Wilson	9c52d1c	2017-11-10 23:24:47 +0000	[diff] [blame]	5736	static void i915_gem_init__mm(struct drm_i915_private *i915)
				5737	{
				5738	spin_lock_init(&i915->mm.object_stat_lock);
				5739	spin_lock_init(&i915->mm.obj_lock);
				5740	spin_lock_init(&i915->mm.free_lock);
				5741
				5742	init_llist_head(&i915->mm.free_list);
				5743
				5744	INIT_LIST_HEAD(&i915->mm.unbound_list);
				5745	INIT_LIST_HEAD(&i915->mm.bound_list);
				5746	INIT_LIST_HEAD(&i915->mm.fence_list);
				5747	INIT_LIST_HEAD(&i915->mm.userfault_list);
				5748
				5749	INIT_WORK(&i915->mm.free_work, __i915_gem_free_work);
				5750	}
				5751
Michal Wajdeczko	a0de908	2018-03-23 12:34:49 +0000	[diff] [blame]	5752	int i915_gem_init_early(struct drm_i915_private *dev_priv)
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5753	{
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5754	int err = -ENOMEM;
Chris Wilson	42dcedd	2012-11-15 11:32:30 +0000	[diff] [blame]	5755
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5756	dev_priv->objects = KMEM_CACHE(drm_i915_gem_object, SLAB_HWCACHE_ALIGN);
				5757	if (!dev_priv->objects)
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5758	goto err_out;
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5759
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5760	dev_priv->vmas = KMEM_CACHE(i915_vma, SLAB_HWCACHE_ALIGN);
				5761	if (!dev_priv->vmas)
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5762	goto err_objects;
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5763
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	5764	dev_priv->luts = KMEM_CACHE(i915_lut_handle, 0);
				5765	if (!dev_priv->luts)
				5766	goto err_vmas;
				5767
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	5768	dev_priv->requests = KMEM_CACHE(i915_request,
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5769	SLAB_HWCACHE_ALIGN \|
				5770	SLAB_RECLAIM_ACCOUNT \|
Paul E. McKenney	5f0d5a3	2017-01-18 02:53:44 -0800	[diff] [blame]	5771	SLAB_TYPESAFE_BY_RCU);
Tvrtko Ursulin	a933568	2016-11-02 15:14:59 +0000	[diff] [blame]	5772	if (!dev_priv->requests)
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	5773	goto err_luts;
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5774
Chris Wilson	52e5420	2016-11-14 20:41:02 +0000	[diff] [blame]	5775	dev_priv->dependencies = KMEM_CACHE(i915_dependency,
				5776	SLAB_HWCACHE_ALIGN \|
				5777	SLAB_RECLAIM_ACCOUNT);
				5778	if (!dev_priv->dependencies)
				5779	goto err_requests;
				5780
Chris Wilson	c5cf9a9	2017-05-17 13:10:04 +0100	[diff] [blame]	5781	dev_priv->priorities = KMEM_CACHE(i915_priolist, SLAB_HWCACHE_ALIGN);
				5782	if (!dev_priv->priorities)
				5783	goto err_dependencies;
				5784
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5785	INIT_LIST_HEAD(&dev_priv->gt.timelines);
Chris Wilson	643b450	2018-04-30 14:15:03 +0100	[diff] [blame]	5786	INIT_LIST_HEAD(&dev_priv->gt.active_rings);
Chris Wilson	3365e22	2018-05-03 20:51:14 +0100	[diff] [blame]	5787	INIT_LIST_HEAD(&dev_priv->gt.closed_vma);
Chris Wilson	643b450	2018-04-30 14:15:03 +0100	[diff] [blame]	5788
Chris Wilson	9c52d1c	2017-11-10 23:24:47 +0000	[diff] [blame]	5789	i915_gem_init__mm(dev_priv);
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	5790
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	5791	INIT_DELAYED_WORK(&dev_priv->gt.retire_work,
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5792	i915_gem_retire_work_handler);
Chris Wilson	67d97da	2016-07-04 08:08:31 +0100	[diff] [blame]	5793	INIT_DELAYED_WORK(&dev_priv->gt.idle_work,
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5794	i915_gem_idle_work_handler);
Chris Wilson	1f15b76	2016-07-01 17:23:14 +0100	[diff] [blame]	5795	init_waitqueue_head(&dev_priv->gpu_error.wait_queue);
Daniel Vetter	1f83fee	2012-11-15 17:17:22 +0100	[diff] [blame]	5796	init_waitqueue_head(&dev_priv->gpu_error.reset_queue);
Chris Wilson	3116971	2009-09-14 16:50:28 +0100	[diff] [blame]	5797
Joonas Lahtinen	6f63340	2016-09-01 14:58:21 +0300	[diff] [blame]	5798	atomic_set(&dev_priv->mm.bsd_engine_dispatch_index, 0);
				5799
Chris Wilson	b5add95	2016-08-04 16:32:36 +0100	[diff] [blame]	5800	spin_lock_init(&dev_priv->fb_tracking.lock);
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5801
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	5802	err = i915_gemfs_init(dev_priv);
				5803	if (err)
				5804	DRM_NOTE("Unable to create a private tmpfs mount, hugepage support will be disabled(%d).\n", err);
				5805
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5806	return 0;
				5807
Chris Wilson	52e5420	2016-11-14 20:41:02 +0000	[diff] [blame]	5808	err_dependencies:
				5809	kmem_cache_destroy(dev_priv->dependencies);
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5810	err_requests:
				5811	kmem_cache_destroy(dev_priv->requests);
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	5812	err_luts:
				5813	kmem_cache_destroy(dev_priv->luts);
Chris Wilson	73cb970	2016-10-28 13:58:46 +0100	[diff] [blame]	5814	err_vmas:
				5815	kmem_cache_destroy(dev_priv->vmas);
				5816	err_objects:
				5817	kmem_cache_destroy(dev_priv->objects);
				5818	err_out:
				5819	return err;
Eric Anholt	673a394	2008-07-30 12:06:12 -0700	[diff] [blame]	5820	}
Dave Airlie	71acb5e	2008-12-30 20:31:46 +1000	[diff] [blame]	5821
Michal Wajdeczko	a0de908	2018-03-23 12:34:49 +0000	[diff] [blame]	5822	void i915_gem_cleanup_early(struct drm_i915_private *dev_priv)
Imre Deak	d64aa09	2016-01-19 15:26:29 +0200	[diff] [blame]	5823	{
Chris Wilson	c4d4c1c	2017-02-10 16:35:23 +0000	[diff] [blame]	5824	i915_gem_drain_freed_objects(dev_priv);
Chris Wilson	c9c70471	2018-02-19 22:06:31 +0000	[diff] [blame]	5825	GEM_BUG_ON(!llist_empty(&dev_priv->mm.free_list));
				5826	GEM_BUG_ON(atomic_read(&dev_priv->mm.free_count));
Chris Wilson	c4d4c1c	2017-02-10 16:35:23 +0000	[diff] [blame]	5827	WARN_ON(dev_priv->mm.object_count);
Matthew Auld	ea84aa7	2016-11-17 21:04:11 +0000	[diff] [blame]	5828	WARN_ON(!list_empty(&dev_priv->gt.timelines));
Matthew Auld	ea84aa7	2016-11-17 21:04:11 +0000	[diff] [blame]	5829
Chris Wilson	c5cf9a9	2017-05-17 13:10:04 +0100	[diff] [blame]	5830	kmem_cache_destroy(dev_priv->priorities);
Chris Wilson	52e5420	2016-11-14 20:41:02 +0000	[diff] [blame]	5831	kmem_cache_destroy(dev_priv->dependencies);
Imre Deak	d64aa09	2016-01-19 15:26:29 +0200	[diff] [blame]	5832	kmem_cache_destroy(dev_priv->requests);
Chris Wilson	d1b48c1	2017-08-16 09:52:08 +0100	[diff] [blame]	5833	kmem_cache_destroy(dev_priv->luts);
Imre Deak	d64aa09	2016-01-19 15:26:29 +0200	[diff] [blame]	5834	kmem_cache_destroy(dev_priv->vmas);
				5835	kmem_cache_destroy(dev_priv->objects);
Chris Wilson	0eafec6	2016-08-04 16:32:41 +0100	[diff] [blame]	5836
				5837	/* And ensure that our DESTROY_BY_RCU slabs are truly destroyed */
				5838	rcu_barrier();
Matthew Auld	465c403	2017-10-06 23:18:14 +0100	[diff] [blame]	5839
				5840	i915_gemfs_fini(dev_priv);
Imre Deak	d64aa09	2016-01-19 15:26:29 +0200	[diff] [blame]	5841	}
				5842
/*
 * i915_gem_freeze - shrink GEM ahead of hibernation.
 *
 * All purgeable objects are discarded here; userspace is expected to
 * recover them as required after resuming. Always returns 0.
 */
int i915_gem_freeze(struct drm_i915_private *dev_priv)
{
	i915_gem_shrink_all(dev_priv);

	return 0;
}
				5852
Chris Wilson	95c778d	2018-06-01 15:41:25 +0100	[diff] [blame]	5853	int i915_gem_freeze_late(struct drm_i915_private *i915)
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5854	{
				5855	struct drm_i915_gem_object *obj;
Chris Wilson	7aab2d5	2016-09-09 20:02:18 +0100	[diff] [blame]	5856	struct list_head *phases[] = {
Chris Wilson	95c778d	2018-06-01 15:41:25 +0100	[diff] [blame]	5857	&i915->mm.unbound_list,
				5858	&i915->mm.bound_list,
Chris Wilson	7aab2d5	2016-09-09 20:02:18 +0100	[diff] [blame]	5859	NULL
Chris Wilson	95c778d	2018-06-01 15:41:25 +0100	[diff] [blame]	5860	}, **phase;
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5861
Chris Wilson	95c778d	2018-06-01 15:41:25 +0100	[diff] [blame]	5862	/*
				5863	* Called just before we write the hibernation image.
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5864	*
				5865	* We need to update the domain tracking to reflect that the CPU
				5866	* will be accessing all the pages to create and restore from the
				5867	* hibernation, and so upon restoration those pages will be in the
				5868	* CPU domain.
				5869	*
				5870	* To make sure the hibernation image contains the latest state,
				5871	* we update that state just before writing out the image.
Chris Wilson	7aab2d5	2016-09-09 20:02:18 +0100	[diff] [blame]	5872	*
				5873	* To try and reduce the hibernation image, we manually shrink
Chris Wilson	d0aa301	2017-04-07 11:25:49 +0100	[diff] [blame]	5874	* the objects as well, see i915_gem_freeze()
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5875	*/
				5876
Chris Wilson	95c778d	2018-06-01 15:41:25 +0100	[diff] [blame]	5877	i915_gem_shrink(i915, -1UL, NULL, I915_SHRINK_UNBOUND);
				5878	i915_gem_drain_freed_objects(i915);
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5879
Chris Wilson	95c778d	2018-06-01 15:41:25 +0100	[diff] [blame]	5880	mutex_lock(&i915->drm.struct_mutex);
				5881	for (phase = phases; *phase; phase++) {
				5882	list_for_each_entry(obj, *phase, mm.link)
				5883	WARN_ON(i915_gem_object_set_to_cpu_domain(obj, true));
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5884	}
Chris Wilson	95c778d	2018-06-01 15:41:25 +0100	[diff] [blame]	5885	mutex_unlock(&i915->drm.struct_mutex);
Chris Wilson	461fb99	2016-05-14 07:26:33 +0100	[diff] [blame]	5886
				5887	return 0;
				5888	}
				5889
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	5890	void i915_gem_release(struct drm_device dev, struct drm_file file)
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	5891	{
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	5892	struct drm_i915_file_private *file_priv = file->driver_priv;
Chris Wilson	e61e0f5	2018-02-21 09:56:36 +0000	[diff] [blame]	5893	struct i915_request *request;
Eric Anholt	b962442	2009-06-03 07:27:35 +0000	[diff] [blame]	5894
				5895	/* Clean up our request list when the client is going away, so that
				5896	* later retire_requests won't dereference our soon-to-be-gone
				5897	* file_priv.
				5898	*/
Chris Wilson	1c25595	2010-09-26 11:03:27 +0100	[diff] [blame]	5899	spin_lock(&file_priv->mm.lock);
Chris Wilson	c8659ef	2017-03-02 12:25:25 +0000	[diff] [blame]	5900	list_for_each_entry(request, &file_priv->mm.request_list, client_link)
Chris Wilson	f787a5f	2010-09-24 16:02:42 +0100	[diff] [blame]	5901	request->file_priv = NULL;
Chris Wilson	1c25595	2010-09-26 11:03:27 +0100	[diff] [blame]	5902	spin_unlock(&file_priv->mm.lock);
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5903	}
				5904
Chris Wilson	829a0af	2017-06-20 12:05:45 +0100	[diff] [blame]	5905	int i915_gem_open(struct drm_i915_private i915, struct drm_file file)
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5906	{
				5907	struct drm_i915_file_private *file_priv;
Ben Widawsky	e422b88	2013-12-06 14:10:58 -0800	[diff] [blame]	5908	int ret;
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5909
Chris Wilson	c4c29d7	2016-11-09 10:45:07 +0000	[diff] [blame]	5910	DRM_DEBUG("\n");
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5911
				5912	file_priv = kzalloc(sizeof(*file_priv), GFP_KERNEL);
				5913	if (!file_priv)
				5914	return -ENOMEM;
				5915
				5916	file->driver_priv = file_priv;
Chris Wilson	829a0af	2017-06-20 12:05:45 +0100	[diff] [blame]	5917	file_priv->dev_priv = i915;
Chris Wilson	ab0e7ff	2014-02-25 17:11:24 +0200	[diff] [blame]	5918	file_priv->file = file;
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5919
				5920	spin_lock_init(&file_priv->mm.lock);
				5921	INIT_LIST_HEAD(&file_priv->mm.request_list);
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5922
Chris Wilson	c80ff16	2016-07-27 09:07:27 +0100	[diff] [blame]	5923	file_priv->bsd_engine = -1;
Mika Kuoppala	14921f3	2018-06-15 13:44:29 +0300	[diff] [blame]	5924	file_priv->hang_timestamp = jiffies;
Tvrtko Ursulin	de1add3	2016-01-15 15:12:50 +0000	[diff] [blame]	5925
Chris Wilson	829a0af	2017-06-20 12:05:45 +0100	[diff] [blame]	5926	ret = i915_gem_context_open(i915, file);
Ben Widawsky	e422b88	2013-12-06 14:10:58 -0800	[diff] [blame]	5927	if (ret)
				5928	kfree(file_priv);
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5929
Ben Widawsky	e422b88	2013-12-06 14:10:58 -0800	[diff] [blame]	5930	return ret;
Chris Wilson	b29c19b	2013-09-25 17:34:56 +0100	[diff] [blame]	5931	}
				5932
Daniel Vetter	b680c37	2014-09-19 18:27:27 +0200	[diff] [blame]	5933	/**
				5934	* i915_gem_track_fb - update frontbuffer tracking
Geliang Tang	d9072a3	2015-09-15 05:58:44 -0700	[diff] [blame]	5935	* @old: current GEM buffer for the frontbuffer slots
				5936	* @new: new GEM buffer for the frontbuffer slots
				5937	* @frontbuffer_bits: bitmask of frontbuffer slots
Daniel Vetter	b680c37	2014-09-19 18:27:27 +0200	[diff] [blame]	5938	*
				5939	* This updates the frontbuffer tracking bits @frontbuffer_bits by clearing them
				5940	* from @old and setting them in @new. Both @old and @new can be NULL.
				5941	*/
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	5942	void i915_gem_track_fb(struct drm_i915_gem_object *old,
				5943	struct drm_i915_gem_object *new,
				5944	unsigned frontbuffer_bits)
				5945	{
Chris Wilson	faf5bf0	2016-08-04 16:32:37 +0100	[diff] [blame]	5946	/* Control of individual bits within the mask are guarded by
				5947	* the owning plane->mutex, i.e. we can never see concurrent
				5948	* manipulation of individual bits. But since the bitfield as a whole
				5949	* is updated using RMW, we need to use atomics in order to update
				5950	* the bits.
				5951	*/
				5952	BUILD_BUG_ON(INTEL_FRONTBUFFER_BITS_PER_PIPE * I915_MAX_PIPES >
Chris Wilson	74f6e18	2018-09-26 11:47:07 +0100	[diff] [blame]	5953	BITS_PER_TYPE(atomic_t));
Chris Wilson	faf5bf0	2016-08-04 16:32:37 +0100	[diff] [blame]	5954
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	5955	if (old) {
Chris Wilson	faf5bf0	2016-08-04 16:32:37 +0100	[diff] [blame]	5956	WARN_ON(!(atomic_read(&old->frontbuffer_bits) & frontbuffer_bits));
				5957	atomic_andnot(frontbuffer_bits, &old->frontbuffer_bits);
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	5958	}
				5959
				5960	if (new) {
Chris Wilson	faf5bf0	2016-08-04 16:32:37 +0100	[diff] [blame]	5961	WARN_ON(atomic_read(&new->frontbuffer_bits) & frontbuffer_bits);
				5962	atomic_or(frontbuffer_bits, &new->frontbuffer_bits);
Daniel Vetter	a071fa0	2014-06-18 23:28:09 +0200	[diff] [blame]	5963	}
				5964	}
				5965
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5966	/* Allocate a new GEM object and fill it with the supplied data */
				5967	struct drm_i915_gem_object *
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	5968	i915_gem_object_create_from_data(struct drm_i915_private *dev_priv,
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5969	const void *data, size_t size)
				5970	{
				5971	struct drm_i915_gem_object *obj;
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	5972	struct file *file;
				5973	size_t offset;
				5974	int err;
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5975
Tvrtko Ursulin	12d79d7	2016-12-01 14:16:37 +0000	[diff] [blame]	5976	obj = i915_gem_object_create(dev_priv, round_up(size, PAGE_SIZE));
Chris Wilson	fe3db79	2016-04-25 13:32:13 +0100	[diff] [blame]	5977	if (IS_ERR(obj))
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5978	return obj;
				5979
Christian König	c0a51fd	2018-02-16 13:43:38 +0100	[diff] [blame]	5980	GEM_BUG_ON(obj->write_domain != I915_GEM_DOMAIN_CPU);
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5981
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	5982	file = obj->base.filp;
				5983	offset = 0;
				5984	do {
				5985	unsigned int len = min_t(typeof(size), size, PAGE_SIZE);
				5986	struct page *page;
				5987	void pgdata, vaddr;
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5988
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	5989	err = pagecache_write_begin(file, file->f_mapping,
				5990	offset, len, 0,
				5991	&page, &pgdata);
				5992	if (err < 0)
				5993	goto fail;
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	5994
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	5995	vaddr = kmap(page);
				5996	memcpy(vaddr, data, len);
				5997	kunmap(page);
				5998
				5999	err = pagecache_write_end(file, file->f_mapping,
				6000	offset, len, len,
				6001	page, pgdata);
				6002	if (err < 0)
				6003	goto fail;
				6004
				6005	size -= len;
				6006	data += len;
				6007	offset += len;
				6008	} while (size);
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	6009
				6010	return obj;
				6011
				6012	fail:
Chris Wilson	f8c417c	2016-07-20 13:31:53 +0100	[diff] [blame]	6013	i915_gem_object_put(obj);
Chris Wilson	be062fa	2017-03-17 19:46:48 +0000	[diff] [blame]	6014	return ERR_PTR(err);
Dave Gordon	ea70299	2015-07-09 19:29:02 +0100	[diff] [blame]	6015	}
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	6016
				6017	struct scatterlist *
				6018	i915_gem_object_get_sg(struct drm_i915_gem_object *obj,
				6019	unsigned int n,
				6020	unsigned int *offset)
				6021	{
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	6022	struct i915_gem_object_page_iter *iter = &obj->mm.get_page;
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	6023	struct scatterlist *sg;
				6024	unsigned int idx, count;
				6025
				6026	might_sleep();
				6027	GEM_BUG_ON(n >= obj->base.size >> PAGE_SHIFT);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	6028	GEM_BUG_ON(!i915_gem_object_has_pinned_pages(obj));
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	6029
				6030	/* As we iterate forward through the sg, we record each entry in a
				6031	* radixtree for quick repeated (backwards) lookups. If we have seen
				6032	* this index previously, we will have an entry for it.
				6033	*
				6034	* Initial lookup is O(N), but this is amortized to O(1) for
				6035	* sequential page access (where each new request is consecutive
				6036	* to the previous one). Repeated lookups are O(lg(obj->base.size)),
				6037	* i.e. O(1) with a large constant!
				6038	*/
				6039	if (n < READ_ONCE(iter->sg_idx))
				6040	goto lookup;
				6041
				6042	mutex_lock(&iter->lock);
				6043
				6044	/* We prefer to reuse the last sg so that repeated lookup of this
				6045	* (or the subsequent) sg are fast - comparing against the last
				6046	* sg is faster than going through the radixtree.
				6047	*/
				6048
				6049	sg = iter->sg_pos;
				6050	idx = iter->sg_idx;
				6051	count = __sg_page_count(sg);
				6052
				6053	while (idx + count <= n) {
				6054	unsigned long exception, i;
				6055	int ret;
				6056
				6057	/* If we cannot allocate and insert this entry, or the
				6058	* individual pages from this range, cancel updating the
				6059	* sg_idx so that on this lookup we are forced to linearly
				6060	* scan onwards, but on future lookups we will try the
				6061	* insertion again (in which case we need to be careful of
				6062	* the error return reporting that we have already inserted
				6063	* this index).
				6064	*/
				6065	ret = radix_tree_insert(&iter->radix, idx, sg);
				6066	if (ret && ret != -EEXIST)
				6067	goto scan;
				6068
				6069	exception =
				6070	RADIX_TREE_EXCEPTIONAL_ENTRY \|
				6071	idx << RADIX_TREE_EXCEPTIONAL_SHIFT;
				6072	for (i = 1; i < count; i++) {
				6073	ret = radix_tree_insert(&iter->radix, idx + i,
				6074	(void *)exception);
				6075	if (ret && ret != -EEXIST)
				6076	goto scan;
				6077	}
				6078
				6079	idx += count;
				6080	sg = ____sg_next(sg);
				6081	count = __sg_page_count(sg);
				6082	}
				6083
				6084	scan:
				6085	iter->sg_pos = sg;
				6086	iter->sg_idx = idx;
				6087
				6088	mutex_unlock(&iter->lock);
				6089
				6090	if (unlikely(n < idx)) /* insertion completed by another thread */
				6091	goto lookup;
				6092
				6093	/* In case we failed to insert the entry into the radixtree, we need
				6094	* to look beyond the current sg.
				6095	*/
				6096	while (idx + count <= n) {
				6097	idx += count;
				6098	sg = ____sg_next(sg);
				6099	count = __sg_page_count(sg);
				6100	}
				6101
				6102	*offset = n - idx;
				6103	return sg;
				6104
				6105	lookup:
				6106	rcu_read_lock();
				6107
				6108	sg = radix_tree_lookup(&iter->radix, n);
				6109	GEM_BUG_ON(!sg);
				6110
				6111	/* If this index is in the middle of multi-page sg entry,
				6112	* the radixtree will contain an exceptional entry that points
				6113	* to the start of that range. We will return the pointer to
				6114	* the base page and the offset of this page within the
				6115	* sg entry's range.
				6116	*/
				6117	*offset = 0;
				6118	if (unlikely(radix_tree_exception(sg))) {
				6119	unsigned long base =
				6120	(unsigned long)sg >> RADIX_TREE_EXCEPTIONAL_SHIFT;
				6121
				6122	sg = radix_tree_lookup(&iter->radix, base);
				6123	GEM_BUG_ON(!sg);
				6124
				6125	*offset = n - base;
				6126	}
				6127
				6128	rcu_read_unlock();
				6129
				6130	return sg;
				6131	}
				6132
				6133	struct page *
				6134	i915_gem_object_get_page(struct drm_i915_gem_object *obj, unsigned int n)
				6135	{
				6136	struct scatterlist *sg;
				6137	unsigned int offset;
				6138
				6139	GEM_BUG_ON(!i915_gem_object_has_struct_page(obj));
				6140
				6141	sg = i915_gem_object_get_sg(obj, n, &offset);
				6142	return nth_page(sg_page(sg), offset);
				6143	}
				6144
				6145	/* Like i915_gem_object_get_page(), but mark the returned page dirty */
				6146	struct page *
				6147	i915_gem_object_get_dirty_page(struct drm_i915_gem_object *obj,
				6148	unsigned int n)
				6149	{
				6150	struct page *page;
				6151
				6152	page = i915_gem_object_get_page(obj, n);
Chris Wilson	a4f5ea6	2016-10-28 13:58:35 +0100	[diff] [blame]	6153	if (!obj->mm.dirty)
Chris Wilson	96d7763	2016-10-28 13:58:33 +0100	[diff] [blame]	6154	set_page_dirty(page);
				6155
				6156	return page;
				6157	}
				6158
				6159	dma_addr_t
				6160	i915_gem_object_get_dma_address(struct drm_i915_gem_object *obj,
				6161	unsigned long n)
				6162	{
				6163	struct scatterlist *sg;
				6164	unsigned int offset;
				6165
				6166	sg = i915_gem_object_get_sg(obj, n, &offset);
				6167	return sg_dma_address(sg) + (offset << PAGE_SHIFT);
				6168	}
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	6169
Chris Wilson	8eeb790	2017-07-26 19:16:01 +0100	[diff] [blame]	6170	int i915_gem_object_attach_phys(struct drm_i915_gem_object *obj, int align)
				6171	{
				6172	struct sg_table *pages;
				6173	int err;
				6174
				6175	if (align > obj->base.size)
				6176	return -EINVAL;
				6177
				6178	if (obj->ops == &i915_gem_phys_ops)
				6179	return 0;
				6180
				6181	if (obj->ops != &i915_gem_object_ops)
				6182	return -EINVAL;
				6183
				6184	err = i915_gem_object_unbind(obj);
				6185	if (err)
				6186	return err;
				6187
				6188	mutex_lock(&obj->mm.lock);
				6189
				6190	if (obj->mm.madv != I915_MADV_WILLNEED) {
				6191	err = -EFAULT;
				6192	goto err_unlock;
				6193	}
				6194
				6195	if (obj->mm.quirked) {
				6196	err = -EFAULT;
				6197	goto err_unlock;
				6198	}
				6199
				6200	if (obj->mm.mapping) {
				6201	err = -EBUSY;
				6202	goto err_unlock;
				6203	}
				6204
Chris Wilson	acd1c1e	2018-06-11 08:55:32 +0100	[diff] [blame]	6205	pages = __i915_gem_object_unset_pages(obj);
Chris Wilson	f212381	2017-10-16 12:40:37 +0100	[diff] [blame]	6206
Chris Wilson	8eeb790	2017-07-26 19:16:01 +0100	[diff] [blame]	6207	obj->ops = &i915_gem_phys_ops;
				6208
Chris Wilson	8fb6a5d	2017-07-26 19:16:02 +0100	[diff] [blame]	6209	err = ____i915_gem_object_get_pages(obj);
Chris Wilson	8eeb790	2017-07-26 19:16:01 +0100	[diff] [blame]	6210	if (err)
				6211	goto err_xfer;
				6212
				6213	/* Perma-pin (until release) the physical set of pages */
				6214	__i915_gem_object_pin_pages(obj);
				6215
				6216	if (!IS_ERR_OR_NULL(pages))
				6217	i915_gem_object_ops.put_pages(obj, pages);
				6218	mutex_unlock(&obj->mm.lock);
				6219	return 0;
				6220
				6221	err_xfer:
				6222	obj->ops = &i915_gem_object_ops;
Chris Wilson	acd1c1e	2018-06-11 08:55:32 +0100	[diff] [blame]	6223	if (!IS_ERR_OR_NULL(pages)) {
				6224	unsigned int sg_page_sizes = i915_sg_page_sizes(pages->sgl);
				6225
				6226	__i915_gem_object_set_pages(obj, pages, sg_page_sizes);
				6227	}
Chris Wilson	8eeb790	2017-07-26 19:16:01 +0100	[diff] [blame]	6228	err_unlock:
				6229	mutex_unlock(&obj->mm.lock);
				6230	return err;
				6231	}
				6232
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	6233	#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
				6234	#include "selftests/scatterlist.c"
Chris Wilson	66d9cb5	2017-02-13 17:15:17 +0000	[diff] [blame]	6235	#include "selftests/mock_gem_device.c"
Chris Wilson	4465398	2017-02-13 17:15:20 +0000	[diff] [blame]	6236	#include "selftests/huge_gem_object.c"
Matthew Auld	4049866	2017-10-06 23:18:29 +0100	[diff] [blame]	6237	#include "selftests/huge_pages.c"
Chris Wilson	8335fd6	2017-02-13 17:15:28 +0000	[diff] [blame]	6238	#include "selftests/i915_gem_object.c"
Chris Wilson	1705945	2017-02-13 17:15:32 +0000	[diff] [blame]	6239	#include "selftests/i915_gem_coherency.c"
Chris Wilson	3f51b7e1	2018-08-30 14:48:06 +0100	[diff] [blame]	6240	#include "selftests/i915_gem.c"
Chris Wilson	935a2f7	2017-02-13 17:15:13 +0000	[diff] [blame]	6241	#endif