blob: f0f8c6ff684f4d19ee0497c3174e1a599cdcbbea [file] [log] [blame]
Eric Anholt673a3942008-07-30 12:06:12 -07001/*
2 * Copyright © 2008 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 * Authors:
24 * Eric Anholt <eric@anholt.net>
25 *
26 */
27
28#include "drmP.h"
29#include "drm.h"
30#include "i915_drm.h"
31#include "i915_drv.h"
Chris Wilson1c5d22f2009-08-25 11:15:50 +010032#include "i915_trace.h"
Jesse Barnes652c3932009-08-17 13:31:43 -070033#include "intel_drv.h"
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090034#include <linux/slab.h>
Eric Anholt673a3942008-07-30 12:06:12 -070035#include <linux/swap.h>
Jesse Barnes79e53942008-11-07 14:24:08 -080036#include <linux/pci.h>
Eric Anholt673a3942008-07-30 12:06:12 -070037
Chris Wilson88241782011-01-07 17:09:48 +000038static __must_check int i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *obj);
Chris Wilson05394f32010-11-08 19:18:58 +000039static void i915_gem_object_flush_gtt_write_domain(struct drm_i915_gem_object *obj);
40static void i915_gem_object_flush_cpu_write_domain(struct drm_i915_gem_object *obj);
Chris Wilson88241782011-01-07 17:09:48 +000041static __must_check int i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj,
42 bool write);
43static __must_check int i915_gem_object_set_cpu_read_domain_range(struct drm_i915_gem_object *obj,
44 uint64_t offset,
45 uint64_t size);
Chris Wilson05394f32010-11-08 19:18:58 +000046static void i915_gem_object_set_to_full_cpu_read_domain(struct drm_i915_gem_object *obj);
Chris Wilson88241782011-01-07 17:09:48 +000047static __must_check int i915_gem_object_bind_to_gtt(struct drm_i915_gem_object *obj,
48 unsigned alignment,
49 bool map_and_fenceable);
Chris Wilsond9e86c02010-11-10 16:40:20 +000050static void i915_gem_clear_fence_reg(struct drm_device *dev,
51 struct drm_i915_fence_reg *reg);
Chris Wilson05394f32010-11-08 19:18:58 +000052static int i915_gem_phys_pwrite(struct drm_device *dev,
53 struct drm_i915_gem_object *obj,
Dave Airlie71acb5e2008-12-30 20:31:46 +100054 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +000055 struct drm_file *file);
56static void i915_gem_free_object_tail(struct drm_i915_gem_object *obj);
Eric Anholt673a3942008-07-30 12:06:12 -070057
Chris Wilson17250b72010-10-28 12:51:39 +010058static int i915_gem_inactive_shrink(struct shrinker *shrinker,
59 int nr_to_scan,
60 gfp_t gfp_mask);
61
Chris Wilson31169712009-09-14 16:50:28 +010062
Chris Wilson73aa8082010-09-30 11:46:12 +010063/* some bookkeeping */
64static void i915_gem_info_add_obj(struct drm_i915_private *dev_priv,
65 size_t size)
66{
67 dev_priv->mm.object_count++;
68 dev_priv->mm.object_memory += size;
69}
70
71static void i915_gem_info_remove_obj(struct drm_i915_private *dev_priv,
72 size_t size)
73{
74 dev_priv->mm.object_count--;
75 dev_priv->mm.object_memory -= size;
76}
77
Chris Wilson21dd3732011-01-26 15:55:56 +000078static int
79i915_gem_wait_for_error(struct drm_device *dev)
Chris Wilson30dbf0c2010-09-25 10:19:17 +010080{
81 struct drm_i915_private *dev_priv = dev->dev_private;
82 struct completion *x = &dev_priv->error_completion;
83 unsigned long flags;
84 int ret;
85
86 if (!atomic_read(&dev_priv->mm.wedged))
87 return 0;
88
89 ret = wait_for_completion_interruptible(x);
90 if (ret)
91 return ret;
92
Chris Wilson21dd3732011-01-26 15:55:56 +000093 if (atomic_read(&dev_priv->mm.wedged)) {
94 /* GPU is hung, bump the completion count to account for
95 * the token we just consumed so that we never hit zero and
96 * end up waiting upon a subsequent completion event that
97 * will never happen.
98 */
99 spin_lock_irqsave(&x->wait.lock, flags);
100 x->done++;
101 spin_unlock_irqrestore(&x->wait.lock, flags);
102 }
103 return 0;
Chris Wilson30dbf0c2010-09-25 10:19:17 +0100104}
105
Chris Wilson54cf91d2010-11-25 18:00:26 +0000106int i915_mutex_lock_interruptible(struct drm_device *dev)
Chris Wilson76c1dec2010-09-25 11:22:51 +0100107{
Chris Wilson76c1dec2010-09-25 11:22:51 +0100108 int ret;
109
Chris Wilson21dd3732011-01-26 15:55:56 +0000110 ret = i915_gem_wait_for_error(dev);
Chris Wilson76c1dec2010-09-25 11:22:51 +0100111 if (ret)
112 return ret;
113
114 ret = mutex_lock_interruptible(&dev->struct_mutex);
115 if (ret)
116 return ret;
117
Chris Wilson23bc5982010-09-29 16:10:57 +0100118 WARN_ON(i915_verify_lists(dev));
Chris Wilson76c1dec2010-09-25 11:22:51 +0100119 return 0;
120}
Chris Wilson30dbf0c2010-09-25 10:19:17 +0100121
Chris Wilson7d1c4802010-08-07 21:45:03 +0100122static inline bool
Chris Wilson05394f32010-11-08 19:18:58 +0000123i915_gem_object_is_inactive(struct drm_i915_gem_object *obj)
Chris Wilson7d1c4802010-08-07 21:45:03 +0100124{
Chris Wilson05394f32010-11-08 19:18:58 +0000125 return obj->gtt_space && !obj->active && obj->pin_count == 0;
Chris Wilson7d1c4802010-08-07 21:45:03 +0100126}
127
Chris Wilson20217462010-11-23 15:26:33 +0000128void i915_gem_do_init(struct drm_device *dev,
129 unsigned long start,
130 unsigned long mappable_end,
131 unsigned long end)
Jesse Barnes79e53942008-11-07 14:24:08 -0800132{
133 drm_i915_private_t *dev_priv = dev->dev_private;
134
Chris Wilsonbee4a182011-01-21 10:54:32 +0000135 drm_mm_init(&dev_priv->mm.gtt_space, start, end - start);
Jesse Barnes79e53942008-11-07 14:24:08 -0800136
Chris Wilsonbee4a182011-01-21 10:54:32 +0000137 dev_priv->mm.gtt_start = start;
138 dev_priv->mm.gtt_mappable_end = mappable_end;
139 dev_priv->mm.gtt_end = end;
Chris Wilson73aa8082010-09-30 11:46:12 +0100140 dev_priv->mm.gtt_total = end - start;
Daniel Vetterfb7d5162010-10-01 22:05:20 +0200141 dev_priv->mm.mappable_gtt_total = min(end, mappable_end) - start;
Chris Wilsonbee4a182011-01-21 10:54:32 +0000142
143 /* Take over this portion of the GTT */
144 intel_gtt_clear_range(start / PAGE_SIZE, (end-start) / PAGE_SIZE);
Jesse Barnes79e53942008-11-07 14:24:08 -0800145}
Keith Packard6dbe2772008-10-14 21:41:13 -0700146
Eric Anholt673a3942008-07-30 12:06:12 -0700147int
148i915_gem_init_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +0000149 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700150{
Eric Anholt673a3942008-07-30 12:06:12 -0700151 struct drm_i915_gem_init *args = data;
Chris Wilson20217462010-11-23 15:26:33 +0000152
153 if (args->gtt_start >= args->gtt_end ||
154 (args->gtt_end | args->gtt_start) & (PAGE_SIZE - 1))
155 return -EINVAL;
Eric Anholt673a3942008-07-30 12:06:12 -0700156
157 mutex_lock(&dev->struct_mutex);
Chris Wilson20217462010-11-23 15:26:33 +0000158 i915_gem_do_init(dev, args->gtt_start, args->gtt_end, args->gtt_end);
Eric Anholt673a3942008-07-30 12:06:12 -0700159 mutex_unlock(&dev->struct_mutex);
160
Chris Wilson20217462010-11-23 15:26:33 +0000161 return 0;
Eric Anholt673a3942008-07-30 12:06:12 -0700162}
163
Eric Anholt5a125c32008-10-22 21:40:13 -0700164int
165i915_gem_get_aperture_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +0000166 struct drm_file *file)
Eric Anholt5a125c32008-10-22 21:40:13 -0700167{
Chris Wilson73aa8082010-09-30 11:46:12 +0100168 struct drm_i915_private *dev_priv = dev->dev_private;
Eric Anholt5a125c32008-10-22 21:40:13 -0700169 struct drm_i915_gem_get_aperture *args = data;
Chris Wilson6299f992010-11-24 12:23:44 +0000170 struct drm_i915_gem_object *obj;
171 size_t pinned;
Eric Anholt5a125c32008-10-22 21:40:13 -0700172
173 if (!(dev->driver->driver_features & DRIVER_GEM))
174 return -ENODEV;
175
Chris Wilson6299f992010-11-24 12:23:44 +0000176 pinned = 0;
Chris Wilson73aa8082010-09-30 11:46:12 +0100177 mutex_lock(&dev->struct_mutex);
Chris Wilson6299f992010-11-24 12:23:44 +0000178 list_for_each_entry(obj, &dev_priv->mm.pinned_list, mm_list)
179 pinned += obj->gtt_space->size;
Chris Wilson73aa8082010-09-30 11:46:12 +0100180 mutex_unlock(&dev->struct_mutex);
Eric Anholt5a125c32008-10-22 21:40:13 -0700181
Chris Wilson6299f992010-11-24 12:23:44 +0000182 args->aper_size = dev_priv->mm.gtt_total;
183 args->aper_available_size = args->aper_size -pinned;
184
Eric Anholt5a125c32008-10-22 21:40:13 -0700185 return 0;
186}
187
Eric Anholt673a3942008-07-30 12:06:12 -0700188/**
189 * Creates a new mm object and returns a handle to it.
190 */
191int
192i915_gem_create_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +0000193 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700194{
195 struct drm_i915_gem_create *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +0000196 struct drm_i915_gem_object *obj;
Pekka Paalanena1a2d1d2009-08-23 12:40:55 +0300197 int ret;
198 u32 handle;
Eric Anholt673a3942008-07-30 12:06:12 -0700199
200 args->size = roundup(args->size, PAGE_SIZE);
201
202 /* Allocate the new object */
Daniel Vetterac52bc52010-04-09 19:05:06 +0000203 obj = i915_gem_alloc_object(dev, args->size);
Eric Anholt673a3942008-07-30 12:06:12 -0700204 if (obj == NULL)
205 return -ENOMEM;
206
Chris Wilson05394f32010-11-08 19:18:58 +0000207 ret = drm_gem_handle_create(file, &obj->base, &handle);
Chris Wilson1dfd9752010-09-06 14:44:14 +0100208 if (ret) {
Chris Wilson05394f32010-11-08 19:18:58 +0000209 drm_gem_object_release(&obj->base);
210 i915_gem_info_remove_obj(dev->dev_private, obj->base.size);
Chris Wilson202f2fe2010-10-14 13:20:40 +0100211 kfree(obj);
Eric Anholt673a3942008-07-30 12:06:12 -0700212 return ret;
Chris Wilson1dfd9752010-09-06 14:44:14 +0100213 }
214
Chris Wilson202f2fe2010-10-14 13:20:40 +0100215 /* drop reference from allocate - handle holds it now */
Chris Wilson05394f32010-11-08 19:18:58 +0000216 drm_gem_object_unreference(&obj->base);
Chris Wilson202f2fe2010-10-14 13:20:40 +0100217 trace_i915_gem_object_create(obj);
218
Eric Anholt673a3942008-07-30 12:06:12 -0700219 args->handle = handle;
Eric Anholt673a3942008-07-30 12:06:12 -0700220 return 0;
221}
222
Chris Wilson05394f32010-11-08 19:18:58 +0000223static int i915_gem_object_needs_bit17_swizzle(struct drm_i915_gem_object *obj)
Eric Anholt280b7132009-03-12 16:56:27 -0700224{
Chris Wilson05394f32010-11-08 19:18:58 +0000225 drm_i915_private_t *dev_priv = obj->base.dev->dev_private;
Eric Anholt280b7132009-03-12 16:56:27 -0700226
227 return dev_priv->mm.bit_6_swizzle_x == I915_BIT_6_SWIZZLE_9_10_17 &&
Chris Wilson05394f32010-11-08 19:18:58 +0000228 obj->tiling_mode != I915_TILING_NONE;
Eric Anholt280b7132009-03-12 16:56:27 -0700229}
230
Chris Wilson99a03df2010-05-27 14:15:34 +0100231static inline void
Eric Anholt40123c12009-03-09 13:42:30 -0700232slow_shmem_copy(struct page *dst_page,
233 int dst_offset,
234 struct page *src_page,
235 int src_offset,
236 int length)
237{
238 char *dst_vaddr, *src_vaddr;
239
Chris Wilson99a03df2010-05-27 14:15:34 +0100240 dst_vaddr = kmap(dst_page);
241 src_vaddr = kmap(src_page);
Eric Anholt40123c12009-03-09 13:42:30 -0700242
243 memcpy(dst_vaddr + dst_offset, src_vaddr + src_offset, length);
244
Chris Wilson99a03df2010-05-27 14:15:34 +0100245 kunmap(src_page);
246 kunmap(dst_page);
Eric Anholt40123c12009-03-09 13:42:30 -0700247}
248
Chris Wilson99a03df2010-05-27 14:15:34 +0100249static inline void
Eric Anholt280b7132009-03-12 16:56:27 -0700250slow_shmem_bit17_copy(struct page *gpu_page,
251 int gpu_offset,
252 struct page *cpu_page,
253 int cpu_offset,
254 int length,
255 int is_read)
256{
257 char *gpu_vaddr, *cpu_vaddr;
258
259 /* Use the unswizzled path if this page isn't affected. */
260 if ((page_to_phys(gpu_page) & (1 << 17)) == 0) {
261 if (is_read)
262 return slow_shmem_copy(cpu_page, cpu_offset,
263 gpu_page, gpu_offset, length);
264 else
265 return slow_shmem_copy(gpu_page, gpu_offset,
266 cpu_page, cpu_offset, length);
267 }
268
Chris Wilson99a03df2010-05-27 14:15:34 +0100269 gpu_vaddr = kmap(gpu_page);
270 cpu_vaddr = kmap(cpu_page);
Eric Anholt280b7132009-03-12 16:56:27 -0700271
272 /* Copy the data, XORing A6 with A17 (1). The user already knows he's
273 * XORing with the other bits (A9 for Y, A9 and A10 for X)
274 */
275 while (length > 0) {
276 int cacheline_end = ALIGN(gpu_offset + 1, 64);
277 int this_length = min(cacheline_end - gpu_offset, length);
278 int swizzled_gpu_offset = gpu_offset ^ 64;
279
280 if (is_read) {
281 memcpy(cpu_vaddr + cpu_offset,
282 gpu_vaddr + swizzled_gpu_offset,
283 this_length);
284 } else {
285 memcpy(gpu_vaddr + swizzled_gpu_offset,
286 cpu_vaddr + cpu_offset,
287 this_length);
288 }
289 cpu_offset += this_length;
290 gpu_offset += this_length;
291 length -= this_length;
292 }
293
Chris Wilson99a03df2010-05-27 14:15:34 +0100294 kunmap(cpu_page);
295 kunmap(gpu_page);
Eric Anholt280b7132009-03-12 16:56:27 -0700296}
297
Eric Anholt673a3942008-07-30 12:06:12 -0700298/**
Eric Anholteb014592009-03-10 11:44:52 -0700299 * This is the fast shmem pread path, which attempts to copy_from_user directly
300 * from the backing pages of the object to the user's address space. On a
301 * fault, it fails so we can fall back to i915_gem_shmem_pwrite_slow().
302 */
303static int
Chris Wilson05394f32010-11-08 19:18:58 +0000304i915_gem_shmem_pread_fast(struct drm_device *dev,
305 struct drm_i915_gem_object *obj,
Eric Anholteb014592009-03-10 11:44:52 -0700306 struct drm_i915_gem_pread *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000307 struct drm_file *file)
Eric Anholteb014592009-03-10 11:44:52 -0700308{
Chris Wilson05394f32010-11-08 19:18:58 +0000309 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Eric Anholteb014592009-03-10 11:44:52 -0700310 ssize_t remain;
Chris Wilsone5281cc2010-10-28 13:45:36 +0100311 loff_t offset;
Eric Anholteb014592009-03-10 11:44:52 -0700312 char __user *user_data;
313 int page_offset, page_length;
Eric Anholteb014592009-03-10 11:44:52 -0700314
315 user_data = (char __user *) (uintptr_t) args->data_ptr;
316 remain = args->size;
317
Eric Anholteb014592009-03-10 11:44:52 -0700318 offset = args->offset;
319
320 while (remain > 0) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100321 struct page *page;
322 char *vaddr;
323 int ret;
324
Eric Anholteb014592009-03-10 11:44:52 -0700325 /* Operation in this page
326 *
Eric Anholteb014592009-03-10 11:44:52 -0700327 * page_offset = offset within page
328 * page_length = bytes to copy for this page
329 */
Eric Anholteb014592009-03-10 11:44:52 -0700330 page_offset = offset & (PAGE_SIZE-1);
331 page_length = remain;
332 if ((page_offset + remain) > PAGE_SIZE)
333 page_length = PAGE_SIZE - page_offset;
334
Chris Wilsone5281cc2010-10-28 13:45:36 +0100335 page = read_cache_page_gfp(mapping, offset >> PAGE_SHIFT,
336 GFP_HIGHUSER | __GFP_RECLAIMABLE);
337 if (IS_ERR(page))
338 return PTR_ERR(page);
339
340 vaddr = kmap_atomic(page);
341 ret = __copy_to_user_inatomic(user_data,
342 vaddr + page_offset,
343 page_length);
344 kunmap_atomic(vaddr);
345
346 mark_page_accessed(page);
347 page_cache_release(page);
348 if (ret)
Chris Wilson4f27b752010-10-14 15:26:45 +0100349 return -EFAULT;
Eric Anholteb014592009-03-10 11:44:52 -0700350
351 remain -= page_length;
352 user_data += page_length;
353 offset += page_length;
354 }
355
Chris Wilson4f27b752010-10-14 15:26:45 +0100356 return 0;
Eric Anholteb014592009-03-10 11:44:52 -0700357}
358
359/**
360 * This is the fallback shmem pread path, which allocates temporary storage
361 * in kernel space to copy_to_user into outside of the struct_mutex, so we
362 * can copy out of the object's backing pages while holding the struct mutex
363 * and not take page faults.
364 */
365static int
Chris Wilson05394f32010-11-08 19:18:58 +0000366i915_gem_shmem_pread_slow(struct drm_device *dev,
367 struct drm_i915_gem_object *obj,
Eric Anholteb014592009-03-10 11:44:52 -0700368 struct drm_i915_gem_pread *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000369 struct drm_file *file)
Eric Anholteb014592009-03-10 11:44:52 -0700370{
Chris Wilson05394f32010-11-08 19:18:58 +0000371 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Eric Anholteb014592009-03-10 11:44:52 -0700372 struct mm_struct *mm = current->mm;
373 struct page **user_pages;
374 ssize_t remain;
375 loff_t offset, pinned_pages, i;
376 loff_t first_data_page, last_data_page, num_pages;
Chris Wilsone5281cc2010-10-28 13:45:36 +0100377 int shmem_page_offset;
378 int data_page_index, data_page_offset;
Eric Anholteb014592009-03-10 11:44:52 -0700379 int page_length;
380 int ret;
381 uint64_t data_ptr = args->data_ptr;
Eric Anholt280b7132009-03-12 16:56:27 -0700382 int do_bit17_swizzling;
Eric Anholteb014592009-03-10 11:44:52 -0700383
384 remain = args->size;
385
386 /* Pin the user pages containing the data. We can't fault while
387 * holding the struct mutex, yet we want to hold it while
388 * dereferencing the user data.
389 */
390 first_data_page = data_ptr / PAGE_SIZE;
391 last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
392 num_pages = last_data_page - first_data_page + 1;
393
Chris Wilson4f27b752010-10-14 15:26:45 +0100394 user_pages = drm_malloc_ab(num_pages, sizeof(struct page *));
Eric Anholteb014592009-03-10 11:44:52 -0700395 if (user_pages == NULL)
396 return -ENOMEM;
397
Chris Wilson4f27b752010-10-14 15:26:45 +0100398 mutex_unlock(&dev->struct_mutex);
Eric Anholteb014592009-03-10 11:44:52 -0700399 down_read(&mm->mmap_sem);
400 pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
Eric Anholte5e9ecd2009-04-07 16:01:22 -0700401 num_pages, 1, 0, user_pages, NULL);
Eric Anholteb014592009-03-10 11:44:52 -0700402 up_read(&mm->mmap_sem);
Chris Wilson4f27b752010-10-14 15:26:45 +0100403 mutex_lock(&dev->struct_mutex);
Eric Anholteb014592009-03-10 11:44:52 -0700404 if (pinned_pages < num_pages) {
405 ret = -EFAULT;
Chris Wilson4f27b752010-10-14 15:26:45 +0100406 goto out;
Eric Anholteb014592009-03-10 11:44:52 -0700407 }
408
Chris Wilson4f27b752010-10-14 15:26:45 +0100409 ret = i915_gem_object_set_cpu_read_domain_range(obj,
410 args->offset,
Eric Anholteb014592009-03-10 11:44:52 -0700411 args->size);
Chris Wilson4f27b752010-10-14 15:26:45 +0100412 if (ret)
413 goto out;
414
415 do_bit17_swizzling = i915_gem_object_needs_bit17_swizzle(obj);
Eric Anholteb014592009-03-10 11:44:52 -0700416
Eric Anholteb014592009-03-10 11:44:52 -0700417 offset = args->offset;
418
419 while (remain > 0) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100420 struct page *page;
421
Eric Anholteb014592009-03-10 11:44:52 -0700422 /* Operation in this page
423 *
Eric Anholteb014592009-03-10 11:44:52 -0700424 * shmem_page_offset = offset within page in shmem file
425 * data_page_index = page number in get_user_pages return
426 * data_page_offset = offset with data_page_index page.
427 * page_length = bytes to copy for this page
428 */
Eric Anholteb014592009-03-10 11:44:52 -0700429 shmem_page_offset = offset & ~PAGE_MASK;
430 data_page_index = data_ptr / PAGE_SIZE - first_data_page;
431 data_page_offset = data_ptr & ~PAGE_MASK;
432
433 page_length = remain;
434 if ((shmem_page_offset + page_length) > PAGE_SIZE)
435 page_length = PAGE_SIZE - shmem_page_offset;
436 if ((data_page_offset + page_length) > PAGE_SIZE)
437 page_length = PAGE_SIZE - data_page_offset;
438
Chris Wilsone5281cc2010-10-28 13:45:36 +0100439 page = read_cache_page_gfp(mapping, offset >> PAGE_SHIFT,
440 GFP_HIGHUSER | __GFP_RECLAIMABLE);
441 if (IS_ERR(page))
442 return PTR_ERR(page);
443
Eric Anholt280b7132009-03-12 16:56:27 -0700444 if (do_bit17_swizzling) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100445 slow_shmem_bit17_copy(page,
Eric Anholt280b7132009-03-12 16:56:27 -0700446 shmem_page_offset,
Chris Wilson99a03df2010-05-27 14:15:34 +0100447 user_pages[data_page_index],
448 data_page_offset,
449 page_length,
450 1);
451 } else {
452 slow_shmem_copy(user_pages[data_page_index],
453 data_page_offset,
Chris Wilsone5281cc2010-10-28 13:45:36 +0100454 page,
Chris Wilson99a03df2010-05-27 14:15:34 +0100455 shmem_page_offset,
456 page_length);
Eric Anholt280b7132009-03-12 16:56:27 -0700457 }
Eric Anholteb014592009-03-10 11:44:52 -0700458
Chris Wilsone5281cc2010-10-28 13:45:36 +0100459 mark_page_accessed(page);
460 page_cache_release(page);
461
Eric Anholteb014592009-03-10 11:44:52 -0700462 remain -= page_length;
463 data_ptr += page_length;
464 offset += page_length;
465 }
466
Chris Wilson4f27b752010-10-14 15:26:45 +0100467out:
Eric Anholteb014592009-03-10 11:44:52 -0700468 for (i = 0; i < pinned_pages; i++) {
469 SetPageDirty(user_pages[i]);
Chris Wilsone5281cc2010-10-28 13:45:36 +0100470 mark_page_accessed(user_pages[i]);
Eric Anholteb014592009-03-10 11:44:52 -0700471 page_cache_release(user_pages[i]);
472 }
Jesse Barnes8e7d2b22009-05-08 16:13:25 -0700473 drm_free_large(user_pages);
Eric Anholteb014592009-03-10 11:44:52 -0700474
475 return ret;
476}
477
Eric Anholt673a3942008-07-30 12:06:12 -0700478/**
479 * Reads data from the object referenced by handle.
480 *
481 * On error, the contents of *data are undefined.
482 */
483int
484i915_gem_pread_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +0000485 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700486{
487 struct drm_i915_gem_pread *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +0000488 struct drm_i915_gem_object *obj;
Chris Wilson35b62a82010-09-26 20:23:38 +0100489 int ret = 0;
Eric Anholt673a3942008-07-30 12:06:12 -0700490
Chris Wilson51311d02010-11-17 09:10:42 +0000491 if (args->size == 0)
492 return 0;
493
494 if (!access_ok(VERIFY_WRITE,
495 (char __user *)(uintptr_t)args->data_ptr,
496 args->size))
497 return -EFAULT;
498
499 ret = fault_in_pages_writeable((char __user *)(uintptr_t)args->data_ptr,
500 args->size);
501 if (ret)
502 return -EFAULT;
503
Chris Wilson4f27b752010-10-14 15:26:45 +0100504 ret = i915_mutex_lock_interruptible(dev);
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100505 if (ret)
Chris Wilson4f27b752010-10-14 15:26:45 +0100506 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -0700507
Chris Wilson05394f32010-11-08 19:18:58 +0000508 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100509 if (obj == NULL) {
510 ret = -ENOENT;
511 goto unlock;
Chris Wilson4f27b752010-10-14 15:26:45 +0100512 }
Eric Anholt673a3942008-07-30 12:06:12 -0700513
Chris Wilson7dcd2492010-09-26 20:21:44 +0100514 /* Bounds check source. */
Chris Wilson05394f32010-11-08 19:18:58 +0000515 if (args->offset > obj->base.size ||
516 args->size > obj->base.size - args->offset) {
Chris Wilsonce9d4192010-09-26 20:50:05 +0100517 ret = -EINVAL;
Chris Wilson35b62a82010-09-26 20:23:38 +0100518 goto out;
Chris Wilsonce9d4192010-09-26 20:50:05 +0100519 }
520
Chris Wilsondb53a302011-02-03 11:57:46 +0000521 trace_i915_gem_object_pread(obj, args->offset, args->size);
522
Chris Wilson4f27b752010-10-14 15:26:45 +0100523 ret = i915_gem_object_set_cpu_read_domain_range(obj,
524 args->offset,
525 args->size);
526 if (ret)
Chris Wilsone5281cc2010-10-28 13:45:36 +0100527 goto out;
Chris Wilson4f27b752010-10-14 15:26:45 +0100528
529 ret = -EFAULT;
530 if (!i915_gem_object_needs_bit17_swizzle(obj))
Chris Wilson05394f32010-11-08 19:18:58 +0000531 ret = i915_gem_shmem_pread_fast(dev, obj, args, file);
Chris Wilson4f27b752010-10-14 15:26:45 +0100532 if (ret == -EFAULT)
Chris Wilson05394f32010-11-08 19:18:58 +0000533 ret = i915_gem_shmem_pread_slow(dev, obj, args, file);
Eric Anholt673a3942008-07-30 12:06:12 -0700534
Chris Wilson35b62a82010-09-26 20:23:38 +0100535out:
Chris Wilson05394f32010-11-08 19:18:58 +0000536 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100537unlock:
Chris Wilson4f27b752010-10-14 15:26:45 +0100538 mutex_unlock(&dev->struct_mutex);
Eric Anholteb014592009-03-10 11:44:52 -0700539 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -0700540}
541
Keith Packard0839ccb2008-10-30 19:38:48 -0700542/* This is the fast write path which cannot handle
543 * page faults in the source data
Linus Torvalds9b7530cc2008-10-20 14:16:43 -0700544 */
Linus Torvalds9b7530cc2008-10-20 14:16:43 -0700545
Keith Packard0839ccb2008-10-30 19:38:48 -0700546static inline int
547fast_user_write(struct io_mapping *mapping,
548 loff_t page_base, int page_offset,
549 char __user *user_data,
550 int length)
551{
552 char *vaddr_atomic;
553 unsigned long unwritten;
554
Peter Zijlstra3e4d3af2010-10-26 14:21:51 -0700555 vaddr_atomic = io_mapping_map_atomic_wc(mapping, page_base);
Keith Packard0839ccb2008-10-30 19:38:48 -0700556 unwritten = __copy_from_user_inatomic_nocache(vaddr_atomic + page_offset,
557 user_data, length);
Peter Zijlstra3e4d3af2010-10-26 14:21:51 -0700558 io_mapping_unmap_atomic(vaddr_atomic);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100559 return unwritten;
Keith Packard0839ccb2008-10-30 19:38:48 -0700560}
561
562/* Here's the write path which can sleep for
563 * page faults
564 */
565
Chris Wilsonab34c222010-05-27 14:15:35 +0100566static inline void
Eric Anholt3de09aa2009-03-09 09:42:23 -0700567slow_kernel_write(struct io_mapping *mapping,
568 loff_t gtt_base, int gtt_offset,
569 struct page *user_page, int user_offset,
570 int length)
Keith Packard0839ccb2008-10-30 19:38:48 -0700571{
Chris Wilsonab34c222010-05-27 14:15:35 +0100572 char __iomem *dst_vaddr;
573 char *src_vaddr;
Keith Packard0839ccb2008-10-30 19:38:48 -0700574
Chris Wilsonab34c222010-05-27 14:15:35 +0100575 dst_vaddr = io_mapping_map_wc(mapping, gtt_base);
576 src_vaddr = kmap(user_page);
577
578 memcpy_toio(dst_vaddr + gtt_offset,
579 src_vaddr + user_offset,
580 length);
581
582 kunmap(user_page);
583 io_mapping_unmap(dst_vaddr);
Linus Torvalds9b7530cc2008-10-20 14:16:43 -0700584}
585
Eric Anholt3de09aa2009-03-09 09:42:23 -0700586/**
587 * This is the fast pwrite path, where we copy the data directly from the
588 * user into the GTT, uncached.
589 */
Eric Anholt673a3942008-07-30 12:06:12 -0700590static int
Chris Wilson05394f32010-11-08 19:18:58 +0000591i915_gem_gtt_pwrite_fast(struct drm_device *dev,
592 struct drm_i915_gem_object *obj,
Eric Anholt3de09aa2009-03-09 09:42:23 -0700593 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000594 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700595{
Keith Packard0839ccb2008-10-30 19:38:48 -0700596 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -0700597 ssize_t remain;
Keith Packard0839ccb2008-10-30 19:38:48 -0700598 loff_t offset, page_base;
Eric Anholt673a3942008-07-30 12:06:12 -0700599 char __user *user_data;
Keith Packard0839ccb2008-10-30 19:38:48 -0700600 int page_offset, page_length;
Eric Anholt673a3942008-07-30 12:06:12 -0700601
602 user_data = (char __user *) (uintptr_t) args->data_ptr;
603 remain = args->size;
Eric Anholt673a3942008-07-30 12:06:12 -0700604
Chris Wilson05394f32010-11-08 19:18:58 +0000605 offset = obj->gtt_offset + args->offset;
Eric Anholt673a3942008-07-30 12:06:12 -0700606
607 while (remain > 0) {
608 /* Operation in this page
609 *
Keith Packard0839ccb2008-10-30 19:38:48 -0700610 * page_base = page offset within aperture
611 * page_offset = offset within page
612 * page_length = bytes to copy for this page
Eric Anholt673a3942008-07-30 12:06:12 -0700613 */
Keith Packard0839ccb2008-10-30 19:38:48 -0700614 page_base = (offset & ~(PAGE_SIZE-1));
615 page_offset = offset & (PAGE_SIZE-1);
616 page_length = remain;
617 if ((page_offset + remain) > PAGE_SIZE)
618 page_length = PAGE_SIZE - page_offset;
Eric Anholt673a3942008-07-30 12:06:12 -0700619
Keith Packard0839ccb2008-10-30 19:38:48 -0700620 /* If we get a fault while copying data, then (presumably) our
Eric Anholt3de09aa2009-03-09 09:42:23 -0700621 * source page isn't available. Return the error and we'll
622 * retry in the slow path.
Keith Packard0839ccb2008-10-30 19:38:48 -0700623 */
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100624 if (fast_user_write(dev_priv->mm.gtt_mapping, page_base,
625 page_offset, user_data, page_length))
626
627 return -EFAULT;
Eric Anholt673a3942008-07-30 12:06:12 -0700628
Keith Packard0839ccb2008-10-30 19:38:48 -0700629 remain -= page_length;
630 user_data += page_length;
631 offset += page_length;
Eric Anholt673a3942008-07-30 12:06:12 -0700632 }
Eric Anholt673a3942008-07-30 12:06:12 -0700633
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100634 return 0;
Eric Anholt673a3942008-07-30 12:06:12 -0700635}
636
Eric Anholt3de09aa2009-03-09 09:42:23 -0700637/**
638 * This is the fallback GTT pwrite path, which uses get_user_pages to pin
639 * the memory and maps it using kmap_atomic for copying.
640 *
641 * This code resulted in x11perf -rgb10text consuming about 10% more CPU
642 * than using i915_gem_gtt_pwrite_fast on a G45 (32-bit).
643 */
Eric Anholt3043c602008-10-02 12:24:47 -0700644static int
Chris Wilson05394f32010-11-08 19:18:58 +0000645i915_gem_gtt_pwrite_slow(struct drm_device *dev,
646 struct drm_i915_gem_object *obj,
Eric Anholt3de09aa2009-03-09 09:42:23 -0700647 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000648 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700649{
Eric Anholt3de09aa2009-03-09 09:42:23 -0700650 drm_i915_private_t *dev_priv = dev->dev_private;
651 ssize_t remain;
652 loff_t gtt_page_base, offset;
653 loff_t first_data_page, last_data_page, num_pages;
654 loff_t pinned_pages, i;
655 struct page **user_pages;
656 struct mm_struct *mm = current->mm;
657 int gtt_page_offset, data_page_offset, data_page_index, page_length;
Eric Anholt673a3942008-07-30 12:06:12 -0700658 int ret;
Eric Anholt3de09aa2009-03-09 09:42:23 -0700659 uint64_t data_ptr = args->data_ptr;
660
661 remain = args->size;
662
663 /* Pin the user pages containing the data. We can't fault while
664 * holding the struct mutex, and all of the pwrite implementations
665 * want to hold it while dereferencing the user data.
666 */
667 first_data_page = data_ptr / PAGE_SIZE;
668 last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
669 num_pages = last_data_page - first_data_page + 1;
670
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100671 user_pages = drm_malloc_ab(num_pages, sizeof(struct page *));
Eric Anholt3de09aa2009-03-09 09:42:23 -0700672 if (user_pages == NULL)
673 return -ENOMEM;
674
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100675 mutex_unlock(&dev->struct_mutex);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700676 down_read(&mm->mmap_sem);
677 pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
678 num_pages, 0, 0, user_pages, NULL);
679 up_read(&mm->mmap_sem);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100680 mutex_lock(&dev->struct_mutex);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700681 if (pinned_pages < num_pages) {
682 ret = -EFAULT;
683 goto out_unpin_pages;
684 }
685
Chris Wilsond9e86c02010-11-10 16:40:20 +0000686 ret = i915_gem_object_set_to_gtt_domain(obj, true);
687 if (ret)
688 goto out_unpin_pages;
689
690 ret = i915_gem_object_put_fence(obj);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700691 if (ret)
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100692 goto out_unpin_pages;
Eric Anholt3de09aa2009-03-09 09:42:23 -0700693
Chris Wilson05394f32010-11-08 19:18:58 +0000694 offset = obj->gtt_offset + args->offset;
Eric Anholt3de09aa2009-03-09 09:42:23 -0700695
696 while (remain > 0) {
697 /* Operation in this page
698 *
699 * gtt_page_base = page offset within aperture
700 * gtt_page_offset = offset within page in aperture
701 * data_page_index = page number in get_user_pages return
702 * data_page_offset = offset with data_page_index page.
703 * page_length = bytes to copy for this page
704 */
705 gtt_page_base = offset & PAGE_MASK;
706 gtt_page_offset = offset & ~PAGE_MASK;
707 data_page_index = data_ptr / PAGE_SIZE - first_data_page;
708 data_page_offset = data_ptr & ~PAGE_MASK;
709
710 page_length = remain;
711 if ((gtt_page_offset + page_length) > PAGE_SIZE)
712 page_length = PAGE_SIZE - gtt_page_offset;
713 if ((data_page_offset + page_length) > PAGE_SIZE)
714 page_length = PAGE_SIZE - data_page_offset;
715
Chris Wilsonab34c222010-05-27 14:15:35 +0100716 slow_kernel_write(dev_priv->mm.gtt_mapping,
717 gtt_page_base, gtt_page_offset,
718 user_pages[data_page_index],
719 data_page_offset,
720 page_length);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700721
722 remain -= page_length;
723 offset += page_length;
724 data_ptr += page_length;
725 }
726
Eric Anholt3de09aa2009-03-09 09:42:23 -0700727out_unpin_pages:
728 for (i = 0; i < pinned_pages; i++)
729 page_cache_release(user_pages[i]);
Jesse Barnes8e7d2b22009-05-08 16:13:25 -0700730 drm_free_large(user_pages);
Eric Anholt3de09aa2009-03-09 09:42:23 -0700731
732 return ret;
733}
734
Eric Anholt40123c12009-03-09 13:42:30 -0700735/**
736 * This is the fast shmem pwrite path, which attempts to directly
737 * copy_from_user into the kmapped pages backing the object.
738 */
Eric Anholt673a3942008-07-30 12:06:12 -0700739static int
Chris Wilson05394f32010-11-08 19:18:58 +0000740i915_gem_shmem_pwrite_fast(struct drm_device *dev,
741 struct drm_i915_gem_object *obj,
Eric Anholt40123c12009-03-09 13:42:30 -0700742 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000743 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700744{
Chris Wilson05394f32010-11-08 19:18:58 +0000745 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Eric Anholt40123c12009-03-09 13:42:30 -0700746 ssize_t remain;
Chris Wilsone5281cc2010-10-28 13:45:36 +0100747 loff_t offset;
Eric Anholt40123c12009-03-09 13:42:30 -0700748 char __user *user_data;
749 int page_offset, page_length;
Eric Anholt40123c12009-03-09 13:42:30 -0700750
751 user_data = (char __user *) (uintptr_t) args->data_ptr;
752 remain = args->size;
Eric Anholt673a3942008-07-30 12:06:12 -0700753
Eric Anholt673a3942008-07-30 12:06:12 -0700754 offset = args->offset;
Chris Wilson05394f32010-11-08 19:18:58 +0000755 obj->dirty = 1;
Eric Anholt673a3942008-07-30 12:06:12 -0700756
Eric Anholt40123c12009-03-09 13:42:30 -0700757 while (remain > 0) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100758 struct page *page;
759 char *vaddr;
760 int ret;
761
Eric Anholt40123c12009-03-09 13:42:30 -0700762 /* Operation in this page
763 *
Eric Anholt40123c12009-03-09 13:42:30 -0700764 * page_offset = offset within page
765 * page_length = bytes to copy for this page
766 */
Eric Anholt40123c12009-03-09 13:42:30 -0700767 page_offset = offset & (PAGE_SIZE-1);
768 page_length = remain;
769 if ((page_offset + remain) > PAGE_SIZE)
770 page_length = PAGE_SIZE - page_offset;
771
Chris Wilsone5281cc2010-10-28 13:45:36 +0100772 page = read_cache_page_gfp(mapping, offset >> PAGE_SHIFT,
773 GFP_HIGHUSER | __GFP_RECLAIMABLE);
774 if (IS_ERR(page))
775 return PTR_ERR(page);
776
777 vaddr = kmap_atomic(page, KM_USER0);
778 ret = __copy_from_user_inatomic(vaddr + page_offset,
779 user_data,
780 page_length);
781 kunmap_atomic(vaddr, KM_USER0);
782
783 set_page_dirty(page);
784 mark_page_accessed(page);
785 page_cache_release(page);
786
787 /* If we get a fault while copying data, then (presumably) our
788 * source page isn't available. Return the error and we'll
789 * retry in the slow path.
790 */
791 if (ret)
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100792 return -EFAULT;
Eric Anholt40123c12009-03-09 13:42:30 -0700793
794 remain -= page_length;
795 user_data += page_length;
796 offset += page_length;
Eric Anholt673a3942008-07-30 12:06:12 -0700797 }
798
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100799 return 0;
Eric Anholt40123c12009-03-09 13:42:30 -0700800}
801
802/**
803 * This is the fallback shmem pwrite path, which uses get_user_pages to pin
804 * the memory and maps it using kmap_atomic for copying.
805 *
806 * This avoids taking mmap_sem for faulting on the user's address while the
807 * struct_mutex is held.
808 */
809static int
Chris Wilson05394f32010-11-08 19:18:58 +0000810i915_gem_shmem_pwrite_slow(struct drm_device *dev,
811 struct drm_i915_gem_object *obj,
Eric Anholt40123c12009-03-09 13:42:30 -0700812 struct drm_i915_gem_pwrite *args,
Chris Wilson05394f32010-11-08 19:18:58 +0000813 struct drm_file *file)
Eric Anholt40123c12009-03-09 13:42:30 -0700814{
Chris Wilson05394f32010-11-08 19:18:58 +0000815 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Eric Anholt40123c12009-03-09 13:42:30 -0700816 struct mm_struct *mm = current->mm;
817 struct page **user_pages;
818 ssize_t remain;
819 loff_t offset, pinned_pages, i;
820 loff_t first_data_page, last_data_page, num_pages;
Chris Wilsone5281cc2010-10-28 13:45:36 +0100821 int shmem_page_offset;
Eric Anholt40123c12009-03-09 13:42:30 -0700822 int data_page_index, data_page_offset;
823 int page_length;
824 int ret;
825 uint64_t data_ptr = args->data_ptr;
Eric Anholt280b7132009-03-12 16:56:27 -0700826 int do_bit17_swizzling;
Eric Anholt40123c12009-03-09 13:42:30 -0700827
828 remain = args->size;
829
830 /* Pin the user pages containing the data. We can't fault while
831 * holding the struct mutex, and all of the pwrite implementations
832 * want to hold it while dereferencing the user data.
833 */
834 first_data_page = data_ptr / PAGE_SIZE;
835 last_data_page = (data_ptr + args->size - 1) / PAGE_SIZE;
836 num_pages = last_data_page - first_data_page + 1;
837
Chris Wilson4f27b752010-10-14 15:26:45 +0100838 user_pages = drm_malloc_ab(num_pages, sizeof(struct page *));
Eric Anholt40123c12009-03-09 13:42:30 -0700839 if (user_pages == NULL)
840 return -ENOMEM;
841
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100842 mutex_unlock(&dev->struct_mutex);
Eric Anholt40123c12009-03-09 13:42:30 -0700843 down_read(&mm->mmap_sem);
844 pinned_pages = get_user_pages(current, mm, (uintptr_t)args->data_ptr,
845 num_pages, 0, 0, user_pages, NULL);
846 up_read(&mm->mmap_sem);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100847 mutex_lock(&dev->struct_mutex);
Eric Anholt40123c12009-03-09 13:42:30 -0700848 if (pinned_pages < num_pages) {
849 ret = -EFAULT;
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100850 goto out;
Eric Anholt40123c12009-03-09 13:42:30 -0700851 }
852
Eric Anholt40123c12009-03-09 13:42:30 -0700853 ret = i915_gem_object_set_to_cpu_domain(obj, 1);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100854 if (ret)
855 goto out;
856
857 do_bit17_swizzling = i915_gem_object_needs_bit17_swizzle(obj);
Eric Anholt40123c12009-03-09 13:42:30 -0700858
Eric Anholt40123c12009-03-09 13:42:30 -0700859 offset = args->offset;
Chris Wilson05394f32010-11-08 19:18:58 +0000860 obj->dirty = 1;
Eric Anholt40123c12009-03-09 13:42:30 -0700861
862 while (remain > 0) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100863 struct page *page;
864
Eric Anholt40123c12009-03-09 13:42:30 -0700865 /* Operation in this page
866 *
Eric Anholt40123c12009-03-09 13:42:30 -0700867 * shmem_page_offset = offset within page in shmem file
868 * data_page_index = page number in get_user_pages return
869 * data_page_offset = offset with data_page_index page.
870 * page_length = bytes to copy for this page
871 */
Eric Anholt40123c12009-03-09 13:42:30 -0700872 shmem_page_offset = offset & ~PAGE_MASK;
873 data_page_index = data_ptr / PAGE_SIZE - first_data_page;
874 data_page_offset = data_ptr & ~PAGE_MASK;
875
876 page_length = remain;
877 if ((shmem_page_offset + page_length) > PAGE_SIZE)
878 page_length = PAGE_SIZE - shmem_page_offset;
879 if ((data_page_offset + page_length) > PAGE_SIZE)
880 page_length = PAGE_SIZE - data_page_offset;
881
Chris Wilsone5281cc2010-10-28 13:45:36 +0100882 page = read_cache_page_gfp(mapping, offset >> PAGE_SHIFT,
883 GFP_HIGHUSER | __GFP_RECLAIMABLE);
884 if (IS_ERR(page)) {
885 ret = PTR_ERR(page);
886 goto out;
887 }
888
Eric Anholt280b7132009-03-12 16:56:27 -0700889 if (do_bit17_swizzling) {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100890 slow_shmem_bit17_copy(page,
Eric Anholt280b7132009-03-12 16:56:27 -0700891 shmem_page_offset,
892 user_pages[data_page_index],
893 data_page_offset,
Chris Wilson99a03df2010-05-27 14:15:34 +0100894 page_length,
895 0);
896 } else {
Chris Wilsone5281cc2010-10-28 13:45:36 +0100897 slow_shmem_copy(page,
Chris Wilson99a03df2010-05-27 14:15:34 +0100898 shmem_page_offset,
899 user_pages[data_page_index],
900 data_page_offset,
901 page_length);
Eric Anholt280b7132009-03-12 16:56:27 -0700902 }
Eric Anholt40123c12009-03-09 13:42:30 -0700903
Chris Wilsone5281cc2010-10-28 13:45:36 +0100904 set_page_dirty(page);
905 mark_page_accessed(page);
906 page_cache_release(page);
907
Eric Anholt40123c12009-03-09 13:42:30 -0700908 remain -= page_length;
909 data_ptr += page_length;
910 offset += page_length;
911 }
912
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100913out:
Eric Anholt40123c12009-03-09 13:42:30 -0700914 for (i = 0; i < pinned_pages; i++)
915 page_cache_release(user_pages[i]);
Jesse Barnes8e7d2b22009-05-08 16:13:25 -0700916 drm_free_large(user_pages);
Eric Anholt40123c12009-03-09 13:42:30 -0700917
918 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -0700919}
920
921/**
922 * Writes data to the object referenced by handle.
923 *
924 * On error, the contents of the buffer that were to be modified are undefined.
925 */
926int
927i915_gem_pwrite_ioctl(struct drm_device *dev, void *data,
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100928 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -0700929{
930 struct drm_i915_gem_pwrite *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +0000931 struct drm_i915_gem_object *obj;
Chris Wilson51311d02010-11-17 09:10:42 +0000932 int ret;
933
934 if (args->size == 0)
935 return 0;
936
937 if (!access_ok(VERIFY_READ,
938 (char __user *)(uintptr_t)args->data_ptr,
939 args->size))
940 return -EFAULT;
941
942 ret = fault_in_pages_readable((char __user *)(uintptr_t)args->data_ptr,
943 args->size);
944 if (ret)
945 return -EFAULT;
Eric Anholt673a3942008-07-30 12:06:12 -0700946
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100947 ret = i915_mutex_lock_interruptible(dev);
948 if (ret)
949 return ret;
950
Chris Wilson05394f32010-11-08 19:18:58 +0000951 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilson1d7cfea2010-10-17 09:45:41 +0100952 if (obj == NULL) {
953 ret = -ENOENT;
954 goto unlock;
955 }
Eric Anholt673a3942008-07-30 12:06:12 -0700956
Chris Wilson7dcd2492010-09-26 20:21:44 +0100957 /* Bounds check destination. */
Chris Wilson05394f32010-11-08 19:18:58 +0000958 if (args->offset > obj->base.size ||
959 args->size > obj->base.size - args->offset) {
Chris Wilsonce9d4192010-09-26 20:50:05 +0100960 ret = -EINVAL;
Chris Wilson35b62a82010-09-26 20:23:38 +0100961 goto out;
Chris Wilsonce9d4192010-09-26 20:50:05 +0100962 }
963
Chris Wilsondb53a302011-02-03 11:57:46 +0000964 trace_i915_gem_object_pwrite(obj, args->offset, args->size);
965
Eric Anholt673a3942008-07-30 12:06:12 -0700966 /* We can only do the GTT pwrite on untiled buffers, as otherwise
967 * it would end up going through the fenced access, and we'll get
968 * different detiling behavior between reading and writing.
969 * pread/pwrite currently are reading and writing from the CPU
970 * perspective, requiring manual detiling by the client.
971 */
Chris Wilson05394f32010-11-08 19:18:58 +0000972 if (obj->phys_obj)
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100973 ret = i915_gem_phys_pwrite(dev, obj, args, file);
Chris Wilsond9e86c02010-11-10 16:40:20 +0000974 else if (obj->gtt_space &&
Chris Wilson05394f32010-11-08 19:18:58 +0000975 obj->base.write_domain != I915_GEM_DOMAIN_CPU) {
Daniel Vetter75e9e912010-11-04 17:11:09 +0100976 ret = i915_gem_object_pin(obj, 0, true);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100977 if (ret)
978 goto out;
979
Chris Wilsond9e86c02010-11-10 16:40:20 +0000980 ret = i915_gem_object_set_to_gtt_domain(obj, true);
981 if (ret)
982 goto out_unpin;
983
984 ret = i915_gem_object_put_fence(obj);
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100985 if (ret)
986 goto out_unpin;
987
988 ret = i915_gem_gtt_pwrite_fast(dev, obj, args, file);
989 if (ret == -EFAULT)
990 ret = i915_gem_gtt_pwrite_slow(dev, obj, args, file);
991
992out_unpin:
993 i915_gem_object_unpin(obj);
Eric Anholt40123c12009-03-09 13:42:30 -0700994 } else {
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100995 ret = i915_gem_object_set_to_cpu_domain(obj, 1);
996 if (ret)
Chris Wilsone5281cc2010-10-28 13:45:36 +0100997 goto out;
Chris Wilsonfbd5a262010-10-14 15:03:58 +0100998
999 ret = -EFAULT;
1000 if (!i915_gem_object_needs_bit17_swizzle(obj))
1001 ret = i915_gem_shmem_pwrite_fast(dev, obj, args, file);
1002 if (ret == -EFAULT)
1003 ret = i915_gem_shmem_pwrite_slow(dev, obj, args, file);
Eric Anholt40123c12009-03-09 13:42:30 -07001004 }
Eric Anholt673a3942008-07-30 12:06:12 -07001005
Chris Wilson35b62a82010-09-26 20:23:38 +01001006out:
Chris Wilson05394f32010-11-08 19:18:58 +00001007 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001008unlock:
Chris Wilsonfbd5a262010-10-14 15:03:58 +01001009 mutex_unlock(&dev->struct_mutex);
Eric Anholt673a3942008-07-30 12:06:12 -07001010 return ret;
1011}
1012
1013/**
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001014 * Called when user space prepares to use an object with the CPU, either
1015 * through the mmap ioctl's mapping or a GTT mapping.
Eric Anholt673a3942008-07-30 12:06:12 -07001016 */
1017int
1018i915_gem_set_domain_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00001019 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07001020{
1021 struct drm_i915_gem_set_domain *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00001022 struct drm_i915_gem_object *obj;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001023 uint32_t read_domains = args->read_domains;
1024 uint32_t write_domain = args->write_domain;
Eric Anholt673a3942008-07-30 12:06:12 -07001025 int ret;
1026
1027 if (!(dev->driver->driver_features & DRIVER_GEM))
1028 return -ENODEV;
1029
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001030 /* Only handle setting domains to types used by the CPU. */
Chris Wilson21d509e2009-06-06 09:46:02 +01001031 if (write_domain & I915_GEM_GPU_DOMAINS)
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001032 return -EINVAL;
1033
Chris Wilson21d509e2009-06-06 09:46:02 +01001034 if (read_domains & I915_GEM_GPU_DOMAINS)
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001035 return -EINVAL;
1036
1037 /* Having something in the write domain implies it's in the read
1038 * domain, and only that read domain. Enforce that in the request.
1039 */
1040 if (write_domain != 0 && read_domains != write_domain)
1041 return -EINVAL;
1042
Chris Wilson76c1dec2010-09-25 11:22:51 +01001043 ret = i915_mutex_lock_interruptible(dev);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001044 if (ret)
Chris Wilson76c1dec2010-09-25 11:22:51 +01001045 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07001046
Chris Wilson05394f32010-11-08 19:18:58 +00001047 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001048 if (obj == NULL) {
1049 ret = -ENOENT;
1050 goto unlock;
Chris Wilson76c1dec2010-09-25 11:22:51 +01001051 }
Jesse Barnes652c3932009-08-17 13:31:43 -07001052
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001053 if (read_domains & I915_GEM_DOMAIN_GTT) {
1054 ret = i915_gem_object_set_to_gtt_domain(obj, write_domain != 0);
Eric Anholt02354392008-11-26 13:58:13 -08001055
1056 /* Silently promote "you're not bound, there was nothing to do"
1057 * to success, since the client was just asking us to
1058 * make sure everything was done.
1059 */
1060 if (ret == -EINVAL)
1061 ret = 0;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001062 } else {
Eric Anholte47c68e2008-11-14 13:35:19 -08001063 ret = i915_gem_object_set_to_cpu_domain(obj, write_domain != 0);
Eric Anholt2ef7eea2008-11-10 10:53:25 -08001064 }
1065
Chris Wilson05394f32010-11-08 19:18:58 +00001066 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001067unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07001068 mutex_unlock(&dev->struct_mutex);
1069 return ret;
1070}
1071
1072/**
1073 * Called when user space has done writes to this buffer
1074 */
1075int
1076i915_gem_sw_finish_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00001077 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07001078{
1079 struct drm_i915_gem_sw_finish *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00001080 struct drm_i915_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07001081 int ret = 0;
1082
1083 if (!(dev->driver->driver_features & DRIVER_GEM))
1084 return -ENODEV;
1085
Chris Wilson76c1dec2010-09-25 11:22:51 +01001086 ret = i915_mutex_lock_interruptible(dev);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001087 if (ret)
Chris Wilson76c1dec2010-09-25 11:22:51 +01001088 return ret;
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001089
Chris Wilson05394f32010-11-08 19:18:58 +00001090 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Eric Anholt673a3942008-07-30 12:06:12 -07001091 if (obj == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001092 ret = -ENOENT;
1093 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07001094 }
1095
Eric Anholt673a3942008-07-30 12:06:12 -07001096 /* Pinned buffers may be scanout, so flush the cache */
Chris Wilson05394f32010-11-08 19:18:58 +00001097 if (obj->pin_count)
Eric Anholte47c68e2008-11-14 13:35:19 -08001098 i915_gem_object_flush_cpu_write_domain(obj);
1099
Chris Wilson05394f32010-11-08 19:18:58 +00001100 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001101unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07001102 mutex_unlock(&dev->struct_mutex);
1103 return ret;
1104}
1105
1106/**
1107 * Maps the contents of an object, returning the address it is mapped
1108 * into.
1109 *
1110 * While the mapping holds a reference on the contents of the object, it doesn't
1111 * imply a ref on the object itself.
1112 */
1113int
1114i915_gem_mmap_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00001115 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07001116{
Chris Wilsonda761a62010-10-27 17:37:08 +01001117 struct drm_i915_private *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07001118 struct drm_i915_gem_mmap *args = data;
1119 struct drm_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07001120 unsigned long addr;
1121
1122 if (!(dev->driver->driver_features & DRIVER_GEM))
1123 return -ENODEV;
1124
Chris Wilson05394f32010-11-08 19:18:58 +00001125 obj = drm_gem_object_lookup(dev, file, args->handle);
Eric Anholt673a3942008-07-30 12:06:12 -07001126 if (obj == NULL)
Chris Wilsonbf79cb92010-08-04 14:19:46 +01001127 return -ENOENT;
Eric Anholt673a3942008-07-30 12:06:12 -07001128
Chris Wilsonda761a62010-10-27 17:37:08 +01001129 if (obj->size > dev_priv->mm.gtt_mappable_end) {
1130 drm_gem_object_unreference_unlocked(obj);
1131 return -E2BIG;
1132 }
1133
Eric Anholt673a3942008-07-30 12:06:12 -07001134 down_write(&current->mm->mmap_sem);
1135 addr = do_mmap(obj->filp, 0, args->size,
1136 PROT_READ | PROT_WRITE, MAP_SHARED,
1137 args->offset);
1138 up_write(&current->mm->mmap_sem);
Luca Barbieribc9025b2010-02-09 05:49:12 +00001139 drm_gem_object_unreference_unlocked(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001140 if (IS_ERR((void *)addr))
1141 return addr;
1142
1143 args->addr_ptr = (uint64_t) addr;
1144
1145 return 0;
1146}
1147
Jesse Barnesde151cf2008-11-12 10:03:55 -08001148/**
1149 * i915_gem_fault - fault a page into the GTT
1150 * vma: VMA in question
1151 * vmf: fault info
1152 *
1153 * The fault handler is set up by drm_gem_mmap() when a object is GTT mapped
1154 * from userspace. The fault handler takes care of binding the object to
1155 * the GTT (if needed), allocating and programming a fence register (again,
1156 * only if needed based on whether the old reg is still valid or the object
1157 * is tiled) and inserting a new PTE into the faulting process.
1158 *
1159 * Note that the faulting process may involve evicting existing objects
1160 * from the GTT and/or fence registers to make room. So performance may
1161 * suffer if the GTT working set is large or there are few fence registers
1162 * left.
1163 */
1164int i915_gem_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
1165{
Chris Wilson05394f32010-11-08 19:18:58 +00001166 struct drm_i915_gem_object *obj = to_intel_bo(vma->vm_private_data);
1167 struct drm_device *dev = obj->base.dev;
Chris Wilson7d1c4802010-08-07 21:45:03 +01001168 drm_i915_private_t *dev_priv = dev->dev_private;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001169 pgoff_t page_offset;
1170 unsigned long pfn;
1171 int ret = 0;
Jesse Barnes0f973f22009-01-26 17:10:45 -08001172 bool write = !!(vmf->flags & FAULT_FLAG_WRITE);
Jesse Barnesde151cf2008-11-12 10:03:55 -08001173
1174 /* We don't use vmf->pgoff since that has the fake offset */
1175 page_offset = ((unsigned long)vmf->virtual_address - vma->vm_start) >>
1176 PAGE_SHIFT;
1177
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001178 ret = i915_mutex_lock_interruptible(dev);
1179 if (ret)
1180 goto out;
Chris Wilsona00b10c2010-09-24 21:15:47 +01001181
Chris Wilsondb53a302011-02-03 11:57:46 +00001182 trace_i915_gem_object_fault(obj, page_offset, true, write);
1183
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001184 /* Now bind it into the GTT if needed */
Chris Wilson919926a2010-11-12 13:42:53 +00001185 if (!obj->map_and_fenceable) {
1186 ret = i915_gem_object_unbind(obj);
1187 if (ret)
1188 goto unlock;
Chris Wilsona00b10c2010-09-24 21:15:47 +01001189 }
Chris Wilson05394f32010-11-08 19:18:58 +00001190 if (!obj->gtt_space) {
Daniel Vetter75e9e912010-11-04 17:11:09 +01001191 ret = i915_gem_object_bind_to_gtt(obj, 0, true);
Chris Wilsonc7150892009-09-23 00:43:56 +01001192 if (ret)
1193 goto unlock;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001194 }
1195
Chris Wilson4a684a42010-10-28 14:44:08 +01001196 ret = i915_gem_object_set_to_gtt_domain(obj, write);
1197 if (ret)
1198 goto unlock;
1199
Chris Wilsond9e86c02010-11-10 16:40:20 +00001200 if (obj->tiling_mode == I915_TILING_NONE)
1201 ret = i915_gem_object_put_fence(obj);
1202 else
1203 ret = i915_gem_object_get_fence(obj, NULL, true);
1204 if (ret)
1205 goto unlock;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001206
Chris Wilson05394f32010-11-08 19:18:58 +00001207 if (i915_gem_object_is_inactive(obj))
1208 list_move_tail(&obj->mm_list, &dev_priv->mm.inactive_list);
Chris Wilson7d1c4802010-08-07 21:45:03 +01001209
Chris Wilson6299f992010-11-24 12:23:44 +00001210 obj->fault_mappable = true;
1211
Chris Wilson05394f32010-11-08 19:18:58 +00001212 pfn = ((dev->agp->base + obj->gtt_offset) >> PAGE_SHIFT) +
Jesse Barnesde151cf2008-11-12 10:03:55 -08001213 page_offset;
1214
1215 /* Finally, remap it using the new GTT offset */
1216 ret = vm_insert_pfn(vma, (unsigned long)vmf->virtual_address, pfn);
Chris Wilsonc7150892009-09-23 00:43:56 +01001217unlock:
Jesse Barnesde151cf2008-11-12 10:03:55 -08001218 mutex_unlock(&dev->struct_mutex);
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001219out:
Jesse Barnesde151cf2008-11-12 10:03:55 -08001220 switch (ret) {
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001221 case -EIO:
Chris Wilson045e7692010-11-07 09:18:22 +00001222 case -EAGAIN:
Chris Wilsond9bc7e92011-02-07 13:09:31 +00001223 /* Give the error handler a chance to run and move the
1224 * objects off the GPU active list. Next time we service the
1225 * fault, we should be able to transition the page into the
1226 * GTT without touching the GPU (and so avoid further
1227 * EIO/EGAIN). If the GPU is wedged, then there is no issue
1228 * with coherency, just lost writes.
1229 */
Chris Wilson045e7692010-11-07 09:18:22 +00001230 set_need_resched();
Chris Wilsonc7150892009-09-23 00:43:56 +01001231 case 0:
1232 case -ERESTARTSYS:
1233 return VM_FAULT_NOPAGE;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001234 case -ENOMEM:
Jesse Barnesde151cf2008-11-12 10:03:55 -08001235 return VM_FAULT_OOM;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001236 default:
Chris Wilsonc7150892009-09-23 00:43:56 +01001237 return VM_FAULT_SIGBUS;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001238 }
1239}
1240
1241/**
1242 * i915_gem_create_mmap_offset - create a fake mmap offset for an object
1243 * @obj: obj in question
1244 *
1245 * GEM memory mapping works by handing back to userspace a fake mmap offset
1246 * it can use in a subsequent mmap(2) call. The DRM core code then looks
1247 * up the object based on the offset and sets up the various memory mapping
1248 * structures.
1249 *
1250 * This routine allocates and attaches a fake offset for @obj.
1251 */
1252static int
Chris Wilson05394f32010-11-08 19:18:58 +00001253i915_gem_create_mmap_offset(struct drm_i915_gem_object *obj)
Jesse Barnesde151cf2008-11-12 10:03:55 -08001254{
Chris Wilson05394f32010-11-08 19:18:58 +00001255 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001256 struct drm_gem_mm *mm = dev->mm_private;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001257 struct drm_map_list *list;
Benjamin Herrenschmidtf77d3902009-02-02 16:55:46 +11001258 struct drm_local_map *map;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001259 int ret = 0;
1260
1261 /* Set the object up for mmap'ing */
Chris Wilson05394f32010-11-08 19:18:58 +00001262 list = &obj->base.map_list;
Eric Anholt9a298b22009-03-24 12:23:04 -07001263 list->map = kzalloc(sizeof(struct drm_map_list), GFP_KERNEL);
Jesse Barnesde151cf2008-11-12 10:03:55 -08001264 if (!list->map)
1265 return -ENOMEM;
1266
1267 map = list->map;
1268 map->type = _DRM_GEM;
Chris Wilson05394f32010-11-08 19:18:58 +00001269 map->size = obj->base.size;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001270 map->handle = obj;
1271
1272 /* Get a DRM GEM mmap offset allocated... */
1273 list->file_offset_node = drm_mm_search_free(&mm->offset_manager,
Chris Wilson05394f32010-11-08 19:18:58 +00001274 obj->base.size / PAGE_SIZE,
1275 0, 0);
Jesse Barnesde151cf2008-11-12 10:03:55 -08001276 if (!list->file_offset_node) {
Chris Wilson05394f32010-11-08 19:18:58 +00001277 DRM_ERROR("failed to allocate offset for bo %d\n",
1278 obj->base.name);
Chris Wilson9e0ae5342010-09-21 15:05:24 +01001279 ret = -ENOSPC;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001280 goto out_free_list;
1281 }
1282
1283 list->file_offset_node = drm_mm_get_block(list->file_offset_node,
Chris Wilson05394f32010-11-08 19:18:58 +00001284 obj->base.size / PAGE_SIZE,
1285 0);
Jesse Barnesde151cf2008-11-12 10:03:55 -08001286 if (!list->file_offset_node) {
1287 ret = -ENOMEM;
1288 goto out_free_list;
1289 }
1290
1291 list->hash.key = list->file_offset_node->start;
Chris Wilson9e0ae5342010-09-21 15:05:24 +01001292 ret = drm_ht_insert_item(&mm->offset_hash, &list->hash);
1293 if (ret) {
Jesse Barnesde151cf2008-11-12 10:03:55 -08001294 DRM_ERROR("failed to add to map hash\n");
1295 goto out_free_mm;
1296 }
1297
Jesse Barnesde151cf2008-11-12 10:03:55 -08001298 return 0;
1299
1300out_free_mm:
1301 drm_mm_put_block(list->file_offset_node);
1302out_free_list:
Eric Anholt9a298b22009-03-24 12:23:04 -07001303 kfree(list->map);
Chris Wilson39a01d12010-10-28 13:03:06 +01001304 list->map = NULL;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001305
1306 return ret;
1307}
1308
Chris Wilson901782b2009-07-10 08:18:50 +01001309/**
1310 * i915_gem_release_mmap - remove physical page mappings
1311 * @obj: obj in question
1312 *
André Goddard Rosaaf901ca2009-11-14 13:09:05 -02001313 * Preserve the reservation of the mmapping with the DRM core code, but
Chris Wilson901782b2009-07-10 08:18:50 +01001314 * relinquish ownership of the pages back to the system.
1315 *
1316 * It is vital that we remove the page mapping if we have mapped a tiled
1317 * object through the GTT and then lose the fence register due to
1318 * resource pressure. Similarly if the object has been moved out of the
1319 * aperture, than pages mapped into userspace must be revoked. Removing the
1320 * mapping will then trigger a page fault on the next user access, allowing
1321 * fixup by i915_gem_fault().
1322 */
Eric Anholtd05ca302009-07-10 13:02:26 -07001323void
Chris Wilson05394f32010-11-08 19:18:58 +00001324i915_gem_release_mmap(struct drm_i915_gem_object *obj)
Chris Wilson901782b2009-07-10 08:18:50 +01001325{
Chris Wilson6299f992010-11-24 12:23:44 +00001326 if (!obj->fault_mappable)
1327 return;
Chris Wilson901782b2009-07-10 08:18:50 +01001328
Chris Wilson6299f992010-11-24 12:23:44 +00001329 unmap_mapping_range(obj->base.dev->dev_mapping,
1330 (loff_t)obj->base.map_list.hash.key<<PAGE_SHIFT,
1331 obj->base.size, 1);
Daniel Vetterfb7d5162010-10-01 22:05:20 +02001332
Chris Wilson6299f992010-11-24 12:23:44 +00001333 obj->fault_mappable = false;
Chris Wilson901782b2009-07-10 08:18:50 +01001334}
1335
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001336static void
Chris Wilson05394f32010-11-08 19:18:58 +00001337i915_gem_free_mmap_offset(struct drm_i915_gem_object *obj)
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001338{
Chris Wilson05394f32010-11-08 19:18:58 +00001339 struct drm_device *dev = obj->base.dev;
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001340 struct drm_gem_mm *mm = dev->mm_private;
Chris Wilson05394f32010-11-08 19:18:58 +00001341 struct drm_map_list *list = &obj->base.map_list;
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001342
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001343 drm_ht_remove_item(&mm->offset_hash, &list->hash);
Chris Wilson39a01d12010-10-28 13:03:06 +01001344 drm_mm_put_block(list->file_offset_node);
1345 kfree(list->map);
1346 list->map = NULL;
Jesse Barnesab00b3e2009-02-11 14:01:46 -08001347}
1348
Chris Wilson92b88ae2010-11-09 11:47:32 +00001349static uint32_t
1350i915_gem_get_gtt_size(struct drm_i915_gem_object *obj)
1351{
1352 struct drm_device *dev = obj->base.dev;
1353 uint32_t size;
1354
1355 if (INTEL_INFO(dev)->gen >= 4 ||
1356 obj->tiling_mode == I915_TILING_NONE)
1357 return obj->base.size;
1358
1359 /* Previous chips need a power-of-two fence region when tiling */
1360 if (INTEL_INFO(dev)->gen == 3)
1361 size = 1024*1024;
1362 else
1363 size = 512*1024;
1364
1365 while (size < obj->base.size)
1366 size <<= 1;
1367
1368 return size;
1369}
1370
Jesse Barnesde151cf2008-11-12 10:03:55 -08001371/**
1372 * i915_gem_get_gtt_alignment - return required GTT alignment for an object
1373 * @obj: object to check
1374 *
1375 * Return the required GTT alignment for an object, taking into account
Daniel Vetter5e783302010-11-14 22:32:36 +01001376 * potential fence register mapping.
Jesse Barnesde151cf2008-11-12 10:03:55 -08001377 */
1378static uint32_t
Chris Wilson05394f32010-11-08 19:18:58 +00001379i915_gem_get_gtt_alignment(struct drm_i915_gem_object *obj)
Jesse Barnesde151cf2008-11-12 10:03:55 -08001380{
Chris Wilson05394f32010-11-08 19:18:58 +00001381 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001382
1383 /*
1384 * Minimum alignment is 4k (GTT page size), but might be greater
1385 * if a fence register is needed for the object.
1386 */
Chris Wilsona00b10c2010-09-24 21:15:47 +01001387 if (INTEL_INFO(dev)->gen >= 4 ||
Chris Wilson05394f32010-11-08 19:18:58 +00001388 obj->tiling_mode == I915_TILING_NONE)
Jesse Barnesde151cf2008-11-12 10:03:55 -08001389 return 4096;
1390
1391 /*
1392 * Previous chips need to be aligned to the size of the smallest
1393 * fence register that can contain the object.
1394 */
Chris Wilson05394f32010-11-08 19:18:58 +00001395 return i915_gem_get_gtt_size(obj);
Chris Wilsona00b10c2010-09-24 21:15:47 +01001396}
1397
Daniel Vetter5e783302010-11-14 22:32:36 +01001398/**
1399 * i915_gem_get_unfenced_gtt_alignment - return required GTT alignment for an
1400 * unfenced object
1401 * @obj: object to check
1402 *
1403 * Return the required GTT alignment for an object, only taking into account
1404 * unfenced tiled surface requirements.
1405 */
1406static uint32_t
Chris Wilson05394f32010-11-08 19:18:58 +00001407i915_gem_get_unfenced_gtt_alignment(struct drm_i915_gem_object *obj)
Daniel Vetter5e783302010-11-14 22:32:36 +01001408{
Chris Wilson05394f32010-11-08 19:18:58 +00001409 struct drm_device *dev = obj->base.dev;
Daniel Vetter5e783302010-11-14 22:32:36 +01001410 int tile_height;
1411
1412 /*
1413 * Minimum alignment is 4k (GTT page size) for sane hw.
1414 */
1415 if (INTEL_INFO(dev)->gen >= 4 || IS_G33(dev) ||
Chris Wilson05394f32010-11-08 19:18:58 +00001416 obj->tiling_mode == I915_TILING_NONE)
Daniel Vetter5e783302010-11-14 22:32:36 +01001417 return 4096;
1418
1419 /*
1420 * Older chips need unfenced tiled buffers to be aligned to the left
1421 * edge of an even tile row (where tile rows are counted as if the bo is
1422 * placed in a fenced gtt region).
1423 */
1424 if (IS_GEN2(dev) ||
Chris Wilson05394f32010-11-08 19:18:58 +00001425 (obj->tiling_mode == I915_TILING_Y && HAS_128_BYTE_Y_TILING(dev)))
Daniel Vetter5e783302010-11-14 22:32:36 +01001426 tile_height = 32;
1427 else
1428 tile_height = 8;
1429
Chris Wilson05394f32010-11-08 19:18:58 +00001430 return tile_height * obj->stride * 2;
Daniel Vetter5e783302010-11-14 22:32:36 +01001431}
1432
Jesse Barnesde151cf2008-11-12 10:03:55 -08001433/**
1434 * i915_gem_mmap_gtt_ioctl - prepare an object for GTT mmap'ing
1435 * @dev: DRM device
1436 * @data: GTT mapping ioctl data
Chris Wilson05394f32010-11-08 19:18:58 +00001437 * @file: GEM object info
Jesse Barnesde151cf2008-11-12 10:03:55 -08001438 *
1439 * Simply returns the fake offset to userspace so it can mmap it.
1440 * The mmap call will end up in drm_gem_mmap(), which will set things
1441 * up so we can get faults in the handler above.
1442 *
1443 * The fault handler will take care of binding the object into the GTT
1444 * (since it may have been evicted to make room for something), allocating
1445 * a fence register, and mapping the appropriate aperture address into
1446 * userspace.
1447 */
1448int
1449i915_gem_mmap_gtt_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00001450 struct drm_file *file)
Jesse Barnesde151cf2008-11-12 10:03:55 -08001451{
Chris Wilsonda761a62010-10-27 17:37:08 +01001452 struct drm_i915_private *dev_priv = dev->dev_private;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001453 struct drm_i915_gem_mmap_gtt *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00001454 struct drm_i915_gem_object *obj;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001455 int ret;
1456
1457 if (!(dev->driver->driver_features & DRIVER_GEM))
1458 return -ENODEV;
1459
Chris Wilson76c1dec2010-09-25 11:22:51 +01001460 ret = i915_mutex_lock_interruptible(dev);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001461 if (ret)
Chris Wilson76c1dec2010-09-25 11:22:51 +01001462 return ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001463
Chris Wilson05394f32010-11-08 19:18:58 +00001464 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001465 if (obj == NULL) {
1466 ret = -ENOENT;
1467 goto unlock;
1468 }
Jesse Barnesde151cf2008-11-12 10:03:55 -08001469
Chris Wilson05394f32010-11-08 19:18:58 +00001470 if (obj->base.size > dev_priv->mm.gtt_mappable_end) {
Chris Wilsonda761a62010-10-27 17:37:08 +01001471 ret = -E2BIG;
1472 goto unlock;
1473 }
1474
Chris Wilson05394f32010-11-08 19:18:58 +00001475 if (obj->madv != I915_MADV_WILLNEED) {
Chris Wilsonab182822009-09-22 18:46:17 +01001476 DRM_ERROR("Attempting to mmap a purgeable buffer\n");
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001477 ret = -EINVAL;
1478 goto out;
Chris Wilsonab182822009-09-22 18:46:17 +01001479 }
1480
Chris Wilson05394f32010-11-08 19:18:58 +00001481 if (!obj->base.map_list.map) {
Jesse Barnesde151cf2008-11-12 10:03:55 -08001482 ret = i915_gem_create_mmap_offset(obj);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001483 if (ret)
1484 goto out;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001485 }
1486
Chris Wilson05394f32010-11-08 19:18:58 +00001487 args->offset = (u64)obj->base.map_list.hash.key << PAGE_SHIFT;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001488
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001489out:
Chris Wilson05394f32010-11-08 19:18:58 +00001490 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001491unlock:
Jesse Barnesde151cf2008-11-12 10:03:55 -08001492 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01001493 return ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08001494}
1495
Chris Wilsone5281cc2010-10-28 13:45:36 +01001496static int
Chris Wilson05394f32010-11-08 19:18:58 +00001497i915_gem_object_get_pages_gtt(struct drm_i915_gem_object *obj,
Chris Wilsone5281cc2010-10-28 13:45:36 +01001498 gfp_t gfpmask)
1499{
Chris Wilsone5281cc2010-10-28 13:45:36 +01001500 int page_count, i;
1501 struct address_space *mapping;
1502 struct inode *inode;
1503 struct page *page;
1504
1505 /* Get the list of pages out of our struct file. They'll be pinned
1506 * at this point until we release them.
1507 */
Chris Wilson05394f32010-11-08 19:18:58 +00001508 page_count = obj->base.size / PAGE_SIZE;
1509 BUG_ON(obj->pages != NULL);
1510 obj->pages = drm_malloc_ab(page_count, sizeof(struct page *));
1511 if (obj->pages == NULL)
Chris Wilsone5281cc2010-10-28 13:45:36 +01001512 return -ENOMEM;
1513
Chris Wilson05394f32010-11-08 19:18:58 +00001514 inode = obj->base.filp->f_path.dentry->d_inode;
Chris Wilsone5281cc2010-10-28 13:45:36 +01001515 mapping = inode->i_mapping;
1516 for (i = 0; i < page_count; i++) {
1517 page = read_cache_page_gfp(mapping, i,
1518 GFP_HIGHUSER |
1519 __GFP_COLD |
1520 __GFP_RECLAIMABLE |
1521 gfpmask);
1522 if (IS_ERR(page))
1523 goto err_pages;
1524
Chris Wilson05394f32010-11-08 19:18:58 +00001525 obj->pages[i] = page;
Chris Wilsone5281cc2010-10-28 13:45:36 +01001526 }
1527
Chris Wilson05394f32010-11-08 19:18:58 +00001528 if (obj->tiling_mode != I915_TILING_NONE)
Chris Wilsone5281cc2010-10-28 13:45:36 +01001529 i915_gem_object_do_bit_17_swizzle(obj);
1530
1531 return 0;
1532
1533err_pages:
1534 while (i--)
Chris Wilson05394f32010-11-08 19:18:58 +00001535 page_cache_release(obj->pages[i]);
Chris Wilsone5281cc2010-10-28 13:45:36 +01001536
Chris Wilson05394f32010-11-08 19:18:58 +00001537 drm_free_large(obj->pages);
1538 obj->pages = NULL;
Chris Wilsone5281cc2010-10-28 13:45:36 +01001539 return PTR_ERR(page);
1540}
1541
Chris Wilson5cdf5882010-09-27 15:51:07 +01001542static void
Chris Wilson05394f32010-11-08 19:18:58 +00001543i915_gem_object_put_pages_gtt(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07001544{
Chris Wilson05394f32010-11-08 19:18:58 +00001545 int page_count = obj->base.size / PAGE_SIZE;
Eric Anholt673a3942008-07-30 12:06:12 -07001546 int i;
1547
Chris Wilson05394f32010-11-08 19:18:58 +00001548 BUG_ON(obj->madv == __I915_MADV_PURGED);
Eric Anholt856fa192009-03-19 14:10:50 -07001549
Chris Wilson05394f32010-11-08 19:18:58 +00001550 if (obj->tiling_mode != I915_TILING_NONE)
Eric Anholt280b7132009-03-12 16:56:27 -07001551 i915_gem_object_save_bit_17_swizzle(obj);
1552
Chris Wilson05394f32010-11-08 19:18:58 +00001553 if (obj->madv == I915_MADV_DONTNEED)
1554 obj->dirty = 0;
Chris Wilson3ef94da2009-09-14 16:50:29 +01001555
1556 for (i = 0; i < page_count; i++) {
Chris Wilson05394f32010-11-08 19:18:58 +00001557 if (obj->dirty)
1558 set_page_dirty(obj->pages[i]);
Chris Wilson3ef94da2009-09-14 16:50:29 +01001559
Chris Wilson05394f32010-11-08 19:18:58 +00001560 if (obj->madv == I915_MADV_WILLNEED)
1561 mark_page_accessed(obj->pages[i]);
Chris Wilson3ef94da2009-09-14 16:50:29 +01001562
Chris Wilson05394f32010-11-08 19:18:58 +00001563 page_cache_release(obj->pages[i]);
Chris Wilson3ef94da2009-09-14 16:50:29 +01001564 }
Chris Wilson05394f32010-11-08 19:18:58 +00001565 obj->dirty = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001566
Chris Wilson05394f32010-11-08 19:18:58 +00001567 drm_free_large(obj->pages);
1568 obj->pages = NULL;
Eric Anholt673a3942008-07-30 12:06:12 -07001569}
1570
Chris Wilson54cf91d2010-11-25 18:00:26 +00001571void
Chris Wilson05394f32010-11-08 19:18:58 +00001572i915_gem_object_move_to_active(struct drm_i915_gem_object *obj,
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001573 struct intel_ring_buffer *ring,
1574 u32 seqno)
Eric Anholt673a3942008-07-30 12:06:12 -07001575{
Chris Wilson05394f32010-11-08 19:18:58 +00001576 struct drm_device *dev = obj->base.dev;
Chris Wilson69dc4982010-10-19 10:36:51 +01001577 struct drm_i915_private *dev_priv = dev->dev_private;
Daniel Vetter617dbe22010-02-11 22:16:02 +01001578
Zou Nan hai852835f2010-05-21 09:08:56 +08001579 BUG_ON(ring == NULL);
Chris Wilson05394f32010-11-08 19:18:58 +00001580 obj->ring = ring;
Eric Anholt673a3942008-07-30 12:06:12 -07001581
1582 /* Add a reference if we're newly entering the active list. */
Chris Wilson05394f32010-11-08 19:18:58 +00001583 if (!obj->active) {
1584 drm_gem_object_reference(&obj->base);
1585 obj->active = 1;
Eric Anholt673a3942008-07-30 12:06:12 -07001586 }
Daniel Vettere35a41d2010-02-11 22:13:59 +01001587
Eric Anholt673a3942008-07-30 12:06:12 -07001588 /* Move from whatever list we were on to the tail of execution. */
Chris Wilson05394f32010-11-08 19:18:58 +00001589 list_move_tail(&obj->mm_list, &dev_priv->mm.active_list);
1590 list_move_tail(&obj->ring_list, &ring->active_list);
Chris Wilsoncaea7472010-11-12 13:53:37 +00001591
Chris Wilson05394f32010-11-08 19:18:58 +00001592 obj->last_rendering_seqno = seqno;
Chris Wilsoncaea7472010-11-12 13:53:37 +00001593 if (obj->fenced_gpu_access) {
1594 struct drm_i915_fence_reg *reg;
1595
1596 BUG_ON(obj->fence_reg == I915_FENCE_REG_NONE);
1597
1598 obj->last_fenced_seqno = seqno;
1599 obj->last_fenced_ring = ring;
1600
1601 reg = &dev_priv->fence_regs[obj->fence_reg];
1602 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
1603 }
1604}
1605
1606static void
1607i915_gem_object_move_off_active(struct drm_i915_gem_object *obj)
1608{
1609 list_del_init(&obj->ring_list);
1610 obj->last_rendering_seqno = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001611}
1612
Eric Anholtce44b0e2008-11-06 16:00:31 -08001613static void
Chris Wilson05394f32010-11-08 19:18:58 +00001614i915_gem_object_move_to_flushing(struct drm_i915_gem_object *obj)
Eric Anholtce44b0e2008-11-06 16:00:31 -08001615{
Chris Wilson05394f32010-11-08 19:18:58 +00001616 struct drm_device *dev = obj->base.dev;
Eric Anholtce44b0e2008-11-06 16:00:31 -08001617 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholtce44b0e2008-11-06 16:00:31 -08001618
Chris Wilson05394f32010-11-08 19:18:58 +00001619 BUG_ON(!obj->active);
1620 list_move_tail(&obj->mm_list, &dev_priv->mm.flushing_list);
Chris Wilsoncaea7472010-11-12 13:53:37 +00001621
1622 i915_gem_object_move_off_active(obj);
1623}
1624
1625static void
1626i915_gem_object_move_to_inactive(struct drm_i915_gem_object *obj)
1627{
1628 struct drm_device *dev = obj->base.dev;
1629 struct drm_i915_private *dev_priv = dev->dev_private;
1630
1631 if (obj->pin_count != 0)
1632 list_move_tail(&obj->mm_list, &dev_priv->mm.pinned_list);
1633 else
1634 list_move_tail(&obj->mm_list, &dev_priv->mm.inactive_list);
1635
1636 BUG_ON(!list_empty(&obj->gpu_write_list));
1637 BUG_ON(!obj->active);
1638 obj->ring = NULL;
1639
1640 i915_gem_object_move_off_active(obj);
1641 obj->fenced_gpu_access = false;
Chris Wilsoncaea7472010-11-12 13:53:37 +00001642
1643 obj->active = 0;
Chris Wilson87ca9c82010-12-02 09:42:56 +00001644 obj->pending_gpu_write = false;
Chris Wilsoncaea7472010-11-12 13:53:37 +00001645 drm_gem_object_unreference(&obj->base);
1646
1647 WARN_ON(i915_verify_lists(dev));
Eric Anholtce44b0e2008-11-06 16:00:31 -08001648}
Eric Anholt673a3942008-07-30 12:06:12 -07001649
Chris Wilson963b4832009-09-20 23:03:54 +01001650/* Immediately discard the backing storage */
1651static void
Chris Wilson05394f32010-11-08 19:18:58 +00001652i915_gem_object_truncate(struct drm_i915_gem_object *obj)
Chris Wilson963b4832009-09-20 23:03:54 +01001653{
Chris Wilsonbb6baf72009-09-22 14:24:13 +01001654 struct inode *inode;
Chris Wilson963b4832009-09-20 23:03:54 +01001655
Chris Wilsonae9fed62010-08-07 11:01:30 +01001656 /* Our goal here is to return as much of the memory as
1657 * is possible back to the system as we are called from OOM.
1658 * To do this we must instruct the shmfs to drop all of its
1659 * backing pages, *now*. Here we mirror the actions taken
1660 * when by shmem_delete_inode() to release the backing store.
1661 */
Chris Wilson05394f32010-11-08 19:18:58 +00001662 inode = obj->base.filp->f_path.dentry->d_inode;
Chris Wilsonae9fed62010-08-07 11:01:30 +01001663 truncate_inode_pages(inode->i_mapping, 0);
1664 if (inode->i_op->truncate_range)
1665 inode->i_op->truncate_range(inode, 0, (loff_t)-1);
Chris Wilsonbb6baf72009-09-22 14:24:13 +01001666
Chris Wilson05394f32010-11-08 19:18:58 +00001667 obj->madv = __I915_MADV_PURGED;
Chris Wilson963b4832009-09-20 23:03:54 +01001668}
1669
1670static inline int
Chris Wilson05394f32010-11-08 19:18:58 +00001671i915_gem_object_is_purgeable(struct drm_i915_gem_object *obj)
Chris Wilson963b4832009-09-20 23:03:54 +01001672{
Chris Wilson05394f32010-11-08 19:18:58 +00001673 return obj->madv == I915_MADV_DONTNEED;
Chris Wilson963b4832009-09-20 23:03:54 +01001674}
1675
Eric Anholt673a3942008-07-30 12:06:12 -07001676static void
Chris Wilsondb53a302011-02-03 11:57:46 +00001677i915_gem_process_flushing_list(struct intel_ring_buffer *ring,
1678 uint32_t flush_domains)
Daniel Vetter63560392010-02-19 11:51:59 +01001679{
Chris Wilson05394f32010-11-08 19:18:58 +00001680 struct drm_i915_gem_object *obj, *next;
Daniel Vetter63560392010-02-19 11:51:59 +01001681
Chris Wilson05394f32010-11-08 19:18:58 +00001682 list_for_each_entry_safe(obj, next,
Chris Wilson64193402010-10-24 12:38:05 +01001683 &ring->gpu_write_list,
Daniel Vetter63560392010-02-19 11:51:59 +01001684 gpu_write_list) {
Chris Wilson05394f32010-11-08 19:18:58 +00001685 if (obj->base.write_domain & flush_domains) {
1686 uint32_t old_write_domain = obj->base.write_domain;
Daniel Vetter63560392010-02-19 11:51:59 +01001687
Chris Wilson05394f32010-11-08 19:18:58 +00001688 obj->base.write_domain = 0;
1689 list_del_init(&obj->gpu_write_list);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001690 i915_gem_object_move_to_active(obj, ring,
Chris Wilsondb53a302011-02-03 11:57:46 +00001691 i915_gem_next_request_seqno(ring));
Daniel Vetter63560392010-02-19 11:51:59 +01001692
Daniel Vetter63560392010-02-19 11:51:59 +01001693 trace_i915_gem_object_change_domain(obj,
Chris Wilson05394f32010-11-08 19:18:58 +00001694 obj->base.read_domains,
Daniel Vetter63560392010-02-19 11:51:59 +01001695 old_write_domain);
1696 }
1697 }
1698}
Zou Nan hai8187a2b2010-05-21 09:08:55 +08001699
Chris Wilson3cce4692010-10-27 16:11:02 +01001700int
Chris Wilsondb53a302011-02-03 11:57:46 +00001701i915_add_request(struct intel_ring_buffer *ring,
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001702 struct drm_file *file,
Chris Wilsondb53a302011-02-03 11:57:46 +00001703 struct drm_i915_gem_request *request)
Eric Anholt673a3942008-07-30 12:06:12 -07001704{
Chris Wilsondb53a302011-02-03 11:57:46 +00001705 drm_i915_private_t *dev_priv = ring->dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07001706 uint32_t seqno;
1707 int was_empty;
Chris Wilson3cce4692010-10-27 16:11:02 +01001708 int ret;
1709
1710 BUG_ON(request == NULL);
Eric Anholt673a3942008-07-30 12:06:12 -07001711
Chris Wilson3cce4692010-10-27 16:11:02 +01001712 ret = ring->add_request(ring, &seqno);
1713 if (ret)
1714 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07001715
Chris Wilsondb53a302011-02-03 11:57:46 +00001716 trace_i915_gem_request_add(ring, seqno);
Eric Anholt673a3942008-07-30 12:06:12 -07001717
1718 request->seqno = seqno;
Zou Nan hai852835f2010-05-21 09:08:56 +08001719 request->ring = ring;
Eric Anholt673a3942008-07-30 12:06:12 -07001720 request->emitted_jiffies = jiffies;
Zou Nan hai852835f2010-05-21 09:08:56 +08001721 was_empty = list_empty(&ring->request_list);
1722 list_add_tail(&request->list, &ring->request_list);
1723
Chris Wilsondb53a302011-02-03 11:57:46 +00001724 if (file) {
1725 struct drm_i915_file_private *file_priv = file->driver_priv;
1726
Chris Wilson1c255952010-09-26 11:03:27 +01001727 spin_lock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001728 request->file_priv = file_priv;
Eric Anholtb9624422009-06-03 07:27:35 +00001729 list_add_tail(&request->client_list,
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001730 &file_priv->mm.request_list);
Chris Wilson1c255952010-09-26 11:03:27 +01001731 spin_unlock(&file_priv->mm.lock);
Eric Anholtb9624422009-06-03 07:27:35 +00001732 }
Eric Anholt673a3942008-07-30 12:06:12 -07001733
Chris Wilsondb53a302011-02-03 11:57:46 +00001734 ring->outstanding_lazy_request = false;
1735
Ben Gamarif65d9422009-09-14 17:48:44 -04001736 if (!dev_priv->mm.suspended) {
Chris Wilsonb3b079d2010-09-13 23:44:34 +01001737 mod_timer(&dev_priv->hangcheck_timer,
1738 jiffies + msecs_to_jiffies(DRM_I915_HANGCHECK_PERIOD));
Ben Gamarif65d9422009-09-14 17:48:44 -04001739 if (was_empty)
Chris Wilsonb3b079d2010-09-13 23:44:34 +01001740 queue_delayed_work(dev_priv->wq,
1741 &dev_priv->mm.retire_work, HZ);
Ben Gamarif65d9422009-09-14 17:48:44 -04001742 }
Chris Wilson3cce4692010-10-27 16:11:02 +01001743 return 0;
Eric Anholt673a3942008-07-30 12:06:12 -07001744}
1745
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001746static inline void
1747i915_gem_request_remove_from_client(struct drm_i915_gem_request *request)
Eric Anholt673a3942008-07-30 12:06:12 -07001748{
Chris Wilson1c255952010-09-26 11:03:27 +01001749 struct drm_i915_file_private *file_priv = request->file_priv;
Eric Anholt673a3942008-07-30 12:06:12 -07001750
Chris Wilson1c255952010-09-26 11:03:27 +01001751 if (!file_priv)
1752 return;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01001753
Chris Wilson1c255952010-09-26 11:03:27 +01001754 spin_lock(&file_priv->mm.lock);
1755 list_del(&request->client_list);
1756 request->file_priv = NULL;
1757 spin_unlock(&file_priv->mm.lock);
Eric Anholt673a3942008-07-30 12:06:12 -07001758}
1759
Chris Wilsondfaae392010-09-22 10:31:52 +01001760static void i915_gem_reset_ring_lists(struct drm_i915_private *dev_priv,
1761 struct intel_ring_buffer *ring)
Chris Wilson9375e442010-09-19 12:21:28 +01001762{
Chris Wilsondfaae392010-09-22 10:31:52 +01001763 while (!list_empty(&ring->request_list)) {
1764 struct drm_i915_gem_request *request;
Chris Wilson9375e442010-09-19 12:21:28 +01001765
Chris Wilsondfaae392010-09-22 10:31:52 +01001766 request = list_first_entry(&ring->request_list,
1767 struct drm_i915_gem_request,
1768 list);
1769
1770 list_del(&request->list);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001771 i915_gem_request_remove_from_client(request);
Chris Wilsondfaae392010-09-22 10:31:52 +01001772 kfree(request);
1773 }
1774
1775 while (!list_empty(&ring->active_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001776 struct drm_i915_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07001777
Chris Wilson05394f32010-11-08 19:18:58 +00001778 obj = list_first_entry(&ring->active_list,
1779 struct drm_i915_gem_object,
1780 ring_list);
Eric Anholt673a3942008-07-30 12:06:12 -07001781
Chris Wilson05394f32010-11-08 19:18:58 +00001782 obj->base.write_domain = 0;
1783 list_del_init(&obj->gpu_write_list);
1784 i915_gem_object_move_to_inactive(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001785 }
Eric Anholt673a3942008-07-30 12:06:12 -07001786}
1787
Chris Wilson312817a2010-11-22 11:50:11 +00001788static void i915_gem_reset_fences(struct drm_device *dev)
1789{
1790 struct drm_i915_private *dev_priv = dev->dev_private;
1791 int i;
1792
1793 for (i = 0; i < 16; i++) {
1794 struct drm_i915_fence_reg *reg = &dev_priv->fence_regs[i];
Chris Wilson7d2cb392010-11-27 17:38:29 +00001795 struct drm_i915_gem_object *obj = reg->obj;
1796
1797 if (!obj)
1798 continue;
1799
1800 if (obj->tiling_mode)
1801 i915_gem_release_mmap(obj);
1802
Chris Wilsond9e86c02010-11-10 16:40:20 +00001803 reg->obj->fence_reg = I915_FENCE_REG_NONE;
1804 reg->obj->fenced_gpu_access = false;
1805 reg->obj->last_fenced_seqno = 0;
1806 reg->obj->last_fenced_ring = NULL;
1807 i915_gem_clear_fence_reg(dev, reg);
Chris Wilson312817a2010-11-22 11:50:11 +00001808 }
1809}
1810
Chris Wilson069efc12010-09-30 16:53:18 +01001811void i915_gem_reset(struct drm_device *dev)
Eric Anholt673a3942008-07-30 12:06:12 -07001812{
Chris Wilsondfaae392010-09-22 10:31:52 +01001813 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00001814 struct drm_i915_gem_object *obj;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001815 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07001816
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001817 for (i = 0; i < I915_NUM_RINGS; i++)
1818 i915_gem_reset_ring_lists(dev_priv, &dev_priv->ring[i]);
Chris Wilsondfaae392010-09-22 10:31:52 +01001819
1820 /* Remove anything from the flushing lists. The GPU cache is likely
1821 * to be lost on reset along with the data, so simply move the
1822 * lost bo to the inactive list.
1823 */
1824 while (!list_empty(&dev_priv->mm.flushing_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001825 obj= list_first_entry(&dev_priv->mm.flushing_list,
1826 struct drm_i915_gem_object,
1827 mm_list);
Chris Wilson9375e442010-09-19 12:21:28 +01001828
Chris Wilson05394f32010-11-08 19:18:58 +00001829 obj->base.write_domain = 0;
1830 list_del_init(&obj->gpu_write_list);
1831 i915_gem_object_move_to_inactive(obj);
Chris Wilson9375e442010-09-19 12:21:28 +01001832 }
Chris Wilson9375e442010-09-19 12:21:28 +01001833
Chris Wilsondfaae392010-09-22 10:31:52 +01001834 /* Move everything out of the GPU domains to ensure we do any
1835 * necessary invalidation upon reuse.
1836 */
Chris Wilson05394f32010-11-08 19:18:58 +00001837 list_for_each_entry(obj,
Chris Wilson77f01232010-09-19 12:31:36 +01001838 &dev_priv->mm.inactive_list,
Chris Wilson69dc4982010-10-19 10:36:51 +01001839 mm_list)
Chris Wilson77f01232010-09-19 12:31:36 +01001840 {
Chris Wilson05394f32010-11-08 19:18:58 +00001841 obj->base.read_domains &= ~I915_GEM_GPU_DOMAINS;
Chris Wilson77f01232010-09-19 12:31:36 +01001842 }
Chris Wilson069efc12010-09-30 16:53:18 +01001843
1844 /* The fence registers are invalidated so clear them out */
Chris Wilson312817a2010-11-22 11:50:11 +00001845 i915_gem_reset_fences(dev);
Eric Anholt673a3942008-07-30 12:06:12 -07001846}
1847
1848/**
1849 * This function clears the request list as sequence numbers are passed.
1850 */
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001851static void
Chris Wilsondb53a302011-02-03 11:57:46 +00001852i915_gem_retire_requests_ring(struct intel_ring_buffer *ring)
Eric Anholt673a3942008-07-30 12:06:12 -07001853{
Eric Anholt673a3942008-07-30 12:06:12 -07001854 uint32_t seqno;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001855 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07001856
Chris Wilsondb53a302011-02-03 11:57:46 +00001857 if (list_empty(&ring->request_list))
Karsten Wiese6c0594a2009-02-23 15:07:57 +01001858 return;
1859
Chris Wilsondb53a302011-02-03 11:57:46 +00001860 WARN_ON(i915_verify_lists(ring->dev));
Eric Anholt673a3942008-07-30 12:06:12 -07001861
Chris Wilson78501ea2010-10-27 12:18:21 +01001862 seqno = ring->get_seqno(ring);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001863
Chris Wilson076e2c02011-01-21 10:07:18 +00001864 for (i = 0; i < ARRAY_SIZE(ring->sync_seqno); i++)
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001865 if (seqno >= ring->sync_seqno[i])
1866 ring->sync_seqno[i] = 0;
1867
Zou Nan hai852835f2010-05-21 09:08:56 +08001868 while (!list_empty(&ring->request_list)) {
Eric Anholt673a3942008-07-30 12:06:12 -07001869 struct drm_i915_gem_request *request;
Eric Anholt673a3942008-07-30 12:06:12 -07001870
Zou Nan hai852835f2010-05-21 09:08:56 +08001871 request = list_first_entry(&ring->request_list,
Eric Anholt673a3942008-07-30 12:06:12 -07001872 struct drm_i915_gem_request,
1873 list);
Eric Anholt673a3942008-07-30 12:06:12 -07001874
Chris Wilsondfaae392010-09-22 10:31:52 +01001875 if (!i915_seqno_passed(seqno, request->seqno))
Eric Anholt673a3942008-07-30 12:06:12 -07001876 break;
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001877
Chris Wilsondb53a302011-02-03 11:57:46 +00001878 trace_i915_gem_request_retire(ring, request->seqno);
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001879
1880 list_del(&request->list);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01001881 i915_gem_request_remove_from_client(request);
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001882 kfree(request);
1883 }
1884
1885 /* Move any buffers on the active list that are no longer referenced
1886 * by the ringbuffer to the flushing/inactive lists as appropriate.
1887 */
1888 while (!list_empty(&ring->active_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001889 struct drm_i915_gem_object *obj;
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001890
Chris Wilson05394f32010-11-08 19:18:58 +00001891 obj= list_first_entry(&ring->active_list,
1892 struct drm_i915_gem_object,
1893 ring_list);
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001894
Chris Wilson05394f32010-11-08 19:18:58 +00001895 if (!i915_seqno_passed(seqno, obj->last_rendering_seqno))
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001896 break;
1897
Chris Wilson05394f32010-11-08 19:18:58 +00001898 if (obj->base.write_domain != 0)
Chris Wilsonb84d5f02010-09-18 01:38:04 +01001899 i915_gem_object_move_to_flushing(obj);
1900 else
1901 i915_gem_object_move_to_inactive(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07001902 }
Chris Wilson9d34e5d2009-09-24 05:26:06 +01001903
Chris Wilsondb53a302011-02-03 11:57:46 +00001904 if (unlikely(ring->trace_irq_seqno &&
1905 i915_seqno_passed(seqno, ring->trace_irq_seqno))) {
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001906 ring->irq_put(ring);
Chris Wilsondb53a302011-02-03 11:57:46 +00001907 ring->trace_irq_seqno = 0;
Chris Wilson9d34e5d2009-09-24 05:26:06 +01001908 }
Chris Wilson23bc5982010-09-29 16:10:57 +01001909
Chris Wilsondb53a302011-02-03 11:57:46 +00001910 WARN_ON(i915_verify_lists(ring->dev));
Eric Anholt673a3942008-07-30 12:06:12 -07001911}
1912
1913void
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001914i915_gem_retire_requests(struct drm_device *dev)
1915{
1916 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001917 int i;
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001918
Chris Wilsonbe726152010-07-23 23:18:50 +01001919 if (!list_empty(&dev_priv->mm.deferred_free_list)) {
Chris Wilson05394f32010-11-08 19:18:58 +00001920 struct drm_i915_gem_object *obj, *next;
Chris Wilsonbe726152010-07-23 23:18:50 +01001921
1922 /* We must be careful that during unbind() we do not
1923 * accidentally infinitely recurse into retire requests.
1924 * Currently:
1925 * retire -> free -> unbind -> wait -> retire_ring
1926 */
Chris Wilson05394f32010-11-08 19:18:58 +00001927 list_for_each_entry_safe(obj, next,
Chris Wilsonbe726152010-07-23 23:18:50 +01001928 &dev_priv->mm.deferred_free_list,
Chris Wilson69dc4982010-10-19 10:36:51 +01001929 mm_list)
Chris Wilson05394f32010-11-08 19:18:58 +00001930 i915_gem_free_object_tail(obj);
Chris Wilsonbe726152010-07-23 23:18:50 +01001931 }
1932
Chris Wilson1ec14ad2010-12-04 11:30:53 +00001933 for (i = 0; i < I915_NUM_RINGS; i++)
Chris Wilsondb53a302011-02-03 11:57:46 +00001934 i915_gem_retire_requests_ring(&dev_priv->ring[i]);
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001935}
1936
Daniel Vetter75ef9da2010-08-21 00:25:16 +02001937static void
Eric Anholt673a3942008-07-30 12:06:12 -07001938i915_gem_retire_work_handler(struct work_struct *work)
1939{
1940 drm_i915_private_t *dev_priv;
1941 struct drm_device *dev;
Chris Wilson0a587052011-01-09 21:05:44 +00001942 bool idle;
1943 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07001944
1945 dev_priv = container_of(work, drm_i915_private_t,
1946 mm.retire_work.work);
1947 dev = dev_priv->dev;
1948
Chris Wilson891b48c2010-09-29 12:26:37 +01001949 /* Come back later if the device is busy... */
1950 if (!mutex_trylock(&dev->struct_mutex)) {
1951 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, HZ);
1952 return;
1953 }
1954
Chris Wilsonb09a1fe2010-07-23 23:18:49 +01001955 i915_gem_retire_requests(dev);
Zou Nan haid1b851f2010-05-21 09:08:57 +08001956
Chris Wilson0a587052011-01-09 21:05:44 +00001957 /* Send a periodic flush down the ring so we don't hold onto GEM
1958 * objects indefinitely.
1959 */
1960 idle = true;
1961 for (i = 0; i < I915_NUM_RINGS; i++) {
1962 struct intel_ring_buffer *ring = &dev_priv->ring[i];
1963
1964 if (!list_empty(&ring->gpu_write_list)) {
1965 struct drm_i915_gem_request *request;
1966 int ret;
1967
Chris Wilsondb53a302011-02-03 11:57:46 +00001968 ret = i915_gem_flush_ring(ring,
1969 0, I915_GEM_GPU_DOMAINS);
Chris Wilson0a587052011-01-09 21:05:44 +00001970 request = kzalloc(sizeof(*request), GFP_KERNEL);
1971 if (ret || request == NULL ||
Chris Wilsondb53a302011-02-03 11:57:46 +00001972 i915_add_request(ring, NULL, request))
Chris Wilson0a587052011-01-09 21:05:44 +00001973 kfree(request);
1974 }
1975
1976 idle &= list_empty(&ring->request_list);
1977 }
1978
1979 if (!dev_priv->mm.suspended && !idle)
Eric Anholt9c9fe1f2009-08-03 16:09:16 -07001980 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, HZ);
Chris Wilson0a587052011-01-09 21:05:44 +00001981
Eric Anholt673a3942008-07-30 12:06:12 -07001982 mutex_unlock(&dev->struct_mutex);
1983}
1984
Chris Wilsondb53a302011-02-03 11:57:46 +00001985/**
1986 * Waits for a sequence number to be signaled, and cleans up the
1987 * request and object lists appropriately for that event.
1988 */
Daniel Vetter5a5a0c62009-09-15 22:57:36 +02001989int
Chris Wilsondb53a302011-02-03 11:57:46 +00001990i915_wait_request(struct intel_ring_buffer *ring,
1991 uint32_t seqno,
1992 bool interruptible)
Eric Anholt673a3942008-07-30 12:06:12 -07001993{
Chris Wilsondb53a302011-02-03 11:57:46 +00001994 drm_i915_private_t *dev_priv = ring->dev->dev_private;
Jesse Barnes802c7eb2009-05-05 16:03:48 -07001995 u32 ier;
Eric Anholt673a3942008-07-30 12:06:12 -07001996 int ret = 0;
1997
1998 BUG_ON(seqno == 0);
1999
Chris Wilsond9bc7e92011-02-07 13:09:31 +00002000 if (atomic_read(&dev_priv->mm.wedged)) {
2001 struct completion *x = &dev_priv->error_completion;
2002 bool recovery_complete;
2003 unsigned long flags;
2004
2005 /* Give the error handler a chance to run. */
2006 spin_lock_irqsave(&x->wait.lock, flags);
2007 recovery_complete = x->done > 0;
2008 spin_unlock_irqrestore(&x->wait.lock, flags);
2009
2010 return recovery_complete ? -EIO : -EAGAIN;
2011 }
Ben Gamariffed1d02009-09-14 17:48:41 -04002012
Chris Wilson5d97eb62010-11-10 20:40:02 +00002013 if (seqno == ring->outstanding_lazy_request) {
Chris Wilson3cce4692010-10-27 16:11:02 +01002014 struct drm_i915_gem_request *request;
2015
2016 request = kzalloc(sizeof(*request), GFP_KERNEL);
2017 if (request == NULL)
Daniel Vettere35a41d2010-02-11 22:13:59 +01002018 return -ENOMEM;
Chris Wilson3cce4692010-10-27 16:11:02 +01002019
Chris Wilsondb53a302011-02-03 11:57:46 +00002020 ret = i915_add_request(ring, NULL, request);
Chris Wilson3cce4692010-10-27 16:11:02 +01002021 if (ret) {
2022 kfree(request);
2023 return ret;
2024 }
2025
2026 seqno = request->seqno;
Daniel Vettere35a41d2010-02-11 22:13:59 +01002027 }
2028
Chris Wilson78501ea2010-10-27 12:18:21 +01002029 if (!i915_seqno_passed(ring->get_seqno(ring), seqno)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002030 if (HAS_PCH_SPLIT(ring->dev))
Zhenyu Wang036a4a72009-06-08 14:40:19 +08002031 ier = I915_READ(DEIER) | I915_READ(GTIER);
2032 else
2033 ier = I915_READ(IER);
Jesse Barnes802c7eb2009-05-05 16:03:48 -07002034 if (!ier) {
2035 DRM_ERROR("something (likely vbetool) disabled "
2036 "interrupts, re-enabling\n");
Chris Wilsondb53a302011-02-03 11:57:46 +00002037 i915_driver_irq_preinstall(ring->dev);
2038 i915_driver_irq_postinstall(ring->dev);
Jesse Barnes802c7eb2009-05-05 16:03:48 -07002039 }
2040
Chris Wilsondb53a302011-02-03 11:57:46 +00002041 trace_i915_gem_request_wait_begin(ring, seqno);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002042
Chris Wilsonb2223492010-10-27 15:27:33 +01002043 ring->waiting_seqno = seqno;
Chris Wilsonb13c2b92010-12-13 16:54:50 +00002044 if (ring->irq_get(ring)) {
2045 if (interruptible)
2046 ret = wait_event_interruptible(ring->irq_queue,
2047 i915_seqno_passed(ring->get_seqno(ring), seqno)
2048 || atomic_read(&dev_priv->mm.wedged));
2049 else
2050 wait_event(ring->irq_queue,
2051 i915_seqno_passed(ring->get_seqno(ring), seqno)
2052 || atomic_read(&dev_priv->mm.wedged));
Daniel Vetter48764bf2009-09-15 22:57:32 +02002053
Chris Wilsonb13c2b92010-12-13 16:54:50 +00002054 ring->irq_put(ring);
Chris Wilsonb5ba1772010-12-14 12:17:15 +00002055 } else if (wait_for(i915_seqno_passed(ring->get_seqno(ring),
2056 seqno) ||
2057 atomic_read(&dev_priv->mm.wedged), 3000))
2058 ret = -EBUSY;
Chris Wilsonb2223492010-10-27 15:27:33 +01002059 ring->waiting_seqno = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002060
Chris Wilsondb53a302011-02-03 11:57:46 +00002061 trace_i915_gem_request_wait_end(ring, seqno);
Eric Anholt673a3942008-07-30 12:06:12 -07002062 }
Ben Gamariba1234d2009-09-14 17:48:47 -04002063 if (atomic_read(&dev_priv->mm.wedged))
Chris Wilson30dbf0c2010-09-25 10:19:17 +01002064 ret = -EAGAIN;
Eric Anholt673a3942008-07-30 12:06:12 -07002065
2066 if (ret && ret != -ERESTARTSYS)
Daniel Vetter8bff9172010-02-11 22:19:40 +01002067 DRM_ERROR("%s returns %d (awaiting %d at %d, next %d)\n",
Chris Wilson78501ea2010-10-27 12:18:21 +01002068 __func__, ret, seqno, ring->get_seqno(ring),
Daniel Vetter8bff9172010-02-11 22:19:40 +01002069 dev_priv->next_seqno);
Eric Anholt673a3942008-07-30 12:06:12 -07002070
2071 /* Directly dispatch request retiring. While we have the work queue
2072 * to handle this, the waiter on a request often wants an associated
2073 * buffer to have made it to the inactive list, and we would need
2074 * a separate wait queue to handle that.
2075 */
2076 if (ret == 0)
Chris Wilsondb53a302011-02-03 11:57:46 +00002077 i915_gem_retire_requests_ring(ring);
Eric Anholt673a3942008-07-30 12:06:12 -07002078
2079 return ret;
2080}
2081
Daniel Vetter48764bf2009-09-15 22:57:32 +02002082/**
Eric Anholt673a3942008-07-30 12:06:12 -07002083 * Ensures that all rendering to the object has completed and the object is
2084 * safe to unbind from the GTT or access from the CPU.
2085 */
Chris Wilson54cf91d2010-11-25 18:00:26 +00002086int
Chris Wilson05394f32010-11-08 19:18:58 +00002087i915_gem_object_wait_rendering(struct drm_i915_gem_object *obj,
Chris Wilson2cf34d72010-09-14 13:03:28 +01002088 bool interruptible)
Eric Anholt673a3942008-07-30 12:06:12 -07002089{
Eric Anholt673a3942008-07-30 12:06:12 -07002090 int ret;
2091
Eric Anholte47c68e2008-11-14 13:35:19 -08002092 /* This function only exists to support waiting for existing rendering,
2093 * not for emitting required flushes.
Eric Anholt673a3942008-07-30 12:06:12 -07002094 */
Chris Wilson05394f32010-11-08 19:18:58 +00002095 BUG_ON((obj->base.write_domain & I915_GEM_GPU_DOMAINS) != 0);
Eric Anholt673a3942008-07-30 12:06:12 -07002096
2097 /* If there is rendering queued on the buffer being evicted, wait for
2098 * it.
2099 */
Chris Wilson05394f32010-11-08 19:18:58 +00002100 if (obj->active) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002101 ret = i915_wait_request(obj->ring,
2102 obj->last_rendering_seqno,
2103 interruptible);
Chris Wilson2cf34d72010-09-14 13:03:28 +01002104 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07002105 return ret;
2106 }
2107
2108 return 0;
2109}
2110
2111/**
2112 * Unbinds an object from the GTT aperture.
2113 */
Jesse Barnes0f973f22009-01-26 17:10:45 -08002114int
Chris Wilson05394f32010-11-08 19:18:58 +00002115i915_gem_object_unbind(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07002116{
Eric Anholt673a3942008-07-30 12:06:12 -07002117 int ret = 0;
2118
Chris Wilson05394f32010-11-08 19:18:58 +00002119 if (obj->gtt_space == NULL)
Eric Anholt673a3942008-07-30 12:06:12 -07002120 return 0;
2121
Chris Wilson05394f32010-11-08 19:18:58 +00002122 if (obj->pin_count != 0) {
Eric Anholt673a3942008-07-30 12:06:12 -07002123 DRM_ERROR("Attempting to unbind pinned buffer\n");
2124 return -EINVAL;
2125 }
2126
Eric Anholt5323fd02009-09-09 11:50:45 -07002127 /* blow away mappings if mapped through GTT */
2128 i915_gem_release_mmap(obj);
2129
Eric Anholt673a3942008-07-30 12:06:12 -07002130 /* Move the object to the CPU domain to ensure that
2131 * any possible CPU writes while it's not in the GTT
2132 * are flushed when we go to remap it. This will
2133 * also ensure that all pending GPU writes are finished
2134 * before we unbind.
2135 */
Eric Anholte47c68e2008-11-14 13:35:19 -08002136 ret = i915_gem_object_set_to_cpu_domain(obj, 1);
Chris Wilson8dc17752010-07-23 23:18:51 +01002137 if (ret == -ERESTARTSYS)
Eric Anholt673a3942008-07-30 12:06:12 -07002138 return ret;
Chris Wilson8dc17752010-07-23 23:18:51 +01002139 /* Continue on if we fail due to EIO, the GPU is hung so we
2140 * should be safe and we need to cleanup or else we might
2141 * cause memory corruption through use-after-free.
2142 */
Chris Wilson812ed4922010-09-30 15:08:57 +01002143 if (ret) {
2144 i915_gem_clflush_object(obj);
Chris Wilson05394f32010-11-08 19:18:58 +00002145 obj->base.read_domains = obj->base.write_domain = I915_GEM_DOMAIN_CPU;
Chris Wilson812ed4922010-09-30 15:08:57 +01002146 }
Eric Anholt673a3942008-07-30 12:06:12 -07002147
Daniel Vetter96b47b62009-12-15 17:50:00 +01002148 /* release the fence reg _after_ flushing */
Chris Wilsond9e86c02010-11-10 16:40:20 +00002149 ret = i915_gem_object_put_fence(obj);
2150 if (ret == -ERESTARTSYS)
2151 return ret;
Daniel Vetter96b47b62009-12-15 17:50:00 +01002152
Chris Wilsondb53a302011-02-03 11:57:46 +00002153 trace_i915_gem_object_unbind(obj);
2154
Daniel Vetter7c2e6fd2010-11-06 10:10:47 +01002155 i915_gem_gtt_unbind_object(obj);
Chris Wilsone5281cc2010-10-28 13:45:36 +01002156 i915_gem_object_put_pages_gtt(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07002157
Chris Wilson6299f992010-11-24 12:23:44 +00002158 list_del_init(&obj->gtt_list);
Chris Wilson05394f32010-11-08 19:18:58 +00002159 list_del_init(&obj->mm_list);
Daniel Vetter75e9e912010-11-04 17:11:09 +01002160 /* Avoid an unnecessary call to unbind on rebind. */
Chris Wilson05394f32010-11-08 19:18:58 +00002161 obj->map_and_fenceable = true;
Eric Anholt673a3942008-07-30 12:06:12 -07002162
Chris Wilson05394f32010-11-08 19:18:58 +00002163 drm_mm_put_block(obj->gtt_space);
2164 obj->gtt_space = NULL;
2165 obj->gtt_offset = 0;
Eric Anholt673a3942008-07-30 12:06:12 -07002166
Chris Wilson05394f32010-11-08 19:18:58 +00002167 if (i915_gem_object_is_purgeable(obj))
Chris Wilson963b4832009-09-20 23:03:54 +01002168 i915_gem_object_truncate(obj);
2169
Chris Wilson8dc17752010-07-23 23:18:51 +01002170 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07002171}
2172
Chris Wilson88241782011-01-07 17:09:48 +00002173int
Chris Wilsondb53a302011-02-03 11:57:46 +00002174i915_gem_flush_ring(struct intel_ring_buffer *ring,
Chris Wilson54cf91d2010-11-25 18:00:26 +00002175 uint32_t invalidate_domains,
2176 uint32_t flush_domains)
2177{
Chris Wilson88241782011-01-07 17:09:48 +00002178 int ret;
2179
Chris Wilsondb53a302011-02-03 11:57:46 +00002180 trace_i915_gem_ring_flush(ring, invalidate_domains, flush_domains);
2181
Chris Wilson88241782011-01-07 17:09:48 +00002182 ret = ring->flush(ring, invalidate_domains, flush_domains);
2183 if (ret)
2184 return ret;
2185
Chris Wilsondb53a302011-02-03 11:57:46 +00002186 i915_gem_process_flushing_list(ring, flush_domains);
Chris Wilson88241782011-01-07 17:09:48 +00002187 return 0;
Chris Wilson54cf91d2010-11-25 18:00:26 +00002188}
2189
Chris Wilsondb53a302011-02-03 11:57:46 +00002190static int i915_ring_idle(struct intel_ring_buffer *ring)
Chris Wilsona56ba562010-09-28 10:07:56 +01002191{
Chris Wilson88241782011-01-07 17:09:48 +00002192 int ret;
2193
Chris Wilson395b70b2010-10-28 21:28:46 +01002194 if (list_empty(&ring->gpu_write_list) && list_empty(&ring->active_list))
Chris Wilson64193402010-10-24 12:38:05 +01002195 return 0;
2196
Chris Wilson88241782011-01-07 17:09:48 +00002197 if (!list_empty(&ring->gpu_write_list)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002198 ret = i915_gem_flush_ring(ring,
Chris Wilson0ac74c62010-12-06 14:36:02 +00002199 I915_GEM_GPU_DOMAINS, I915_GEM_GPU_DOMAINS);
Chris Wilson88241782011-01-07 17:09:48 +00002200 if (ret)
2201 return ret;
2202 }
2203
Chris Wilsondb53a302011-02-03 11:57:46 +00002204 return i915_wait_request(ring,
2205 i915_gem_next_request_seqno(ring),
2206 true);
Chris Wilsona56ba562010-09-28 10:07:56 +01002207}
2208
Chris Wilsonb47eb4a2010-08-07 11:01:23 +01002209int
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002210i915_gpu_idle(struct drm_device *dev)
2211{
2212 drm_i915_private_t *dev_priv = dev->dev_private;
2213 bool lists_empty;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00002214 int ret, i;
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002215
Zou Nan haid1b851f2010-05-21 09:08:57 +08002216 lists_empty = (list_empty(&dev_priv->mm.flushing_list) &&
Chris Wilson395b70b2010-10-28 21:28:46 +01002217 list_empty(&dev_priv->mm.active_list));
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002218 if (lists_empty)
2219 return 0;
2220
2221 /* Flush everything onto the inactive list. */
Chris Wilson1ec14ad2010-12-04 11:30:53 +00002222 for (i = 0; i < I915_NUM_RINGS; i++) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002223 ret = i915_ring_idle(&dev_priv->ring[i]);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00002224 if (ret)
2225 return ret;
2226 }
Zou Nan haid1b851f2010-05-21 09:08:57 +08002227
Daniel Vetter8a1a49f2010-02-11 22:29:04 +01002228 return 0;
Daniel Vetter4df2faf2010-02-19 11:52:00 +01002229}
2230
Daniel Vetterc6642782010-11-12 13:46:18 +00002231static int sandybridge_write_fence_reg(struct drm_i915_gem_object *obj,
2232 struct intel_ring_buffer *pipelined)
Eric Anholt4e901fd2009-10-26 16:44:17 -07002233{
Chris Wilson05394f32010-11-08 19:18:58 +00002234 struct drm_device *dev = obj->base.dev;
Eric Anholt4e901fd2009-10-26 16:44:17 -07002235 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002236 u32 size = obj->gtt_space->size;
2237 int regnum = obj->fence_reg;
Eric Anholt4e901fd2009-10-26 16:44:17 -07002238 uint64_t val;
2239
Chris Wilson05394f32010-11-08 19:18:58 +00002240 val = (uint64_t)((obj->gtt_offset + size - 4096) &
Daniel Vetterc6642782010-11-12 13:46:18 +00002241 0xfffff000) << 32;
Chris Wilson05394f32010-11-08 19:18:58 +00002242 val |= obj->gtt_offset & 0xfffff000;
2243 val |= (uint64_t)((obj->stride / 128) - 1) <<
Eric Anholt4e901fd2009-10-26 16:44:17 -07002244 SANDYBRIDGE_FENCE_PITCH_SHIFT;
2245
Chris Wilson05394f32010-11-08 19:18:58 +00002246 if (obj->tiling_mode == I915_TILING_Y)
Eric Anholt4e901fd2009-10-26 16:44:17 -07002247 val |= 1 << I965_FENCE_TILING_Y_SHIFT;
2248 val |= I965_FENCE_REG_VALID;
2249
Daniel Vetterc6642782010-11-12 13:46:18 +00002250 if (pipelined) {
2251 int ret = intel_ring_begin(pipelined, 6);
2252 if (ret)
2253 return ret;
2254
2255 intel_ring_emit(pipelined, MI_NOOP);
2256 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(2));
2257 intel_ring_emit(pipelined, FENCE_REG_SANDYBRIDGE_0 + regnum*8);
2258 intel_ring_emit(pipelined, (u32)val);
2259 intel_ring_emit(pipelined, FENCE_REG_SANDYBRIDGE_0 + regnum*8 + 4);
2260 intel_ring_emit(pipelined, (u32)(val >> 32));
2261 intel_ring_advance(pipelined);
2262 } else
2263 I915_WRITE64(FENCE_REG_SANDYBRIDGE_0 + regnum * 8, val);
2264
2265 return 0;
Eric Anholt4e901fd2009-10-26 16:44:17 -07002266}
2267
Daniel Vetterc6642782010-11-12 13:46:18 +00002268static int i965_write_fence_reg(struct drm_i915_gem_object *obj,
2269 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002270{
Chris Wilson05394f32010-11-08 19:18:58 +00002271 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002272 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002273 u32 size = obj->gtt_space->size;
2274 int regnum = obj->fence_reg;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002275 uint64_t val;
2276
Chris Wilson05394f32010-11-08 19:18:58 +00002277 val = (uint64_t)((obj->gtt_offset + size - 4096) &
Jesse Barnesde151cf2008-11-12 10:03:55 -08002278 0xfffff000) << 32;
Chris Wilson05394f32010-11-08 19:18:58 +00002279 val |= obj->gtt_offset & 0xfffff000;
2280 val |= ((obj->stride / 128) - 1) << I965_FENCE_PITCH_SHIFT;
2281 if (obj->tiling_mode == I915_TILING_Y)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002282 val |= 1 << I965_FENCE_TILING_Y_SHIFT;
2283 val |= I965_FENCE_REG_VALID;
2284
Daniel Vetterc6642782010-11-12 13:46:18 +00002285 if (pipelined) {
2286 int ret = intel_ring_begin(pipelined, 6);
2287 if (ret)
2288 return ret;
2289
2290 intel_ring_emit(pipelined, MI_NOOP);
2291 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(2));
2292 intel_ring_emit(pipelined, FENCE_REG_965_0 + regnum*8);
2293 intel_ring_emit(pipelined, (u32)val);
2294 intel_ring_emit(pipelined, FENCE_REG_965_0 + regnum*8 + 4);
2295 intel_ring_emit(pipelined, (u32)(val >> 32));
2296 intel_ring_advance(pipelined);
2297 } else
2298 I915_WRITE64(FENCE_REG_965_0 + regnum * 8, val);
2299
2300 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002301}
2302
Daniel Vetterc6642782010-11-12 13:46:18 +00002303static int i915_write_fence_reg(struct drm_i915_gem_object *obj,
2304 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002305{
Chris Wilson05394f32010-11-08 19:18:58 +00002306 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002307 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002308 u32 size = obj->gtt_space->size;
Daniel Vetterc6642782010-11-12 13:46:18 +00002309 u32 fence_reg, val, pitch_val;
Jesse Barnes0f973f22009-01-26 17:10:45 -08002310 int tile_width;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002311
Daniel Vetterc6642782010-11-12 13:46:18 +00002312 if (WARN((obj->gtt_offset & ~I915_FENCE_START_MASK) ||
2313 (size & -size) != size ||
2314 (obj->gtt_offset & (size - 1)),
2315 "object 0x%08x [fenceable? %d] not 1M or pot-size (0x%08x) aligned\n",
2316 obj->gtt_offset, obj->map_and_fenceable, size))
2317 return -EINVAL;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002318
Daniel Vetterc6642782010-11-12 13:46:18 +00002319 if (obj->tiling_mode == I915_TILING_Y && HAS_128_BYTE_Y_TILING(dev))
Jesse Barnes0f973f22009-01-26 17:10:45 -08002320 tile_width = 128;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002321 else
Jesse Barnes0f973f22009-01-26 17:10:45 -08002322 tile_width = 512;
2323
2324 /* Note: pitch better be a power of two tile widths */
Chris Wilson05394f32010-11-08 19:18:58 +00002325 pitch_val = obj->stride / tile_width;
Jesse Barnes0f973f22009-01-26 17:10:45 -08002326 pitch_val = ffs(pitch_val) - 1;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002327
Chris Wilson05394f32010-11-08 19:18:58 +00002328 val = obj->gtt_offset;
2329 if (obj->tiling_mode == I915_TILING_Y)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002330 val |= 1 << I830_FENCE_TILING_Y_SHIFT;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002331 val |= I915_FENCE_SIZE_BITS(size);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002332 val |= pitch_val << I830_FENCE_PITCH_SHIFT;
2333 val |= I830_FENCE_REG_VALID;
2334
Chris Wilson05394f32010-11-08 19:18:58 +00002335 fence_reg = obj->fence_reg;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002336 if (fence_reg < 8)
2337 fence_reg = FENCE_REG_830_0 + fence_reg * 4;
Eric Anholtdc529a42009-03-10 22:34:49 -07002338 else
Chris Wilsona00b10c2010-09-24 21:15:47 +01002339 fence_reg = FENCE_REG_945_8 + (fence_reg - 8) * 4;
Daniel Vetterc6642782010-11-12 13:46:18 +00002340
2341 if (pipelined) {
2342 int ret = intel_ring_begin(pipelined, 4);
2343 if (ret)
2344 return ret;
2345
2346 intel_ring_emit(pipelined, MI_NOOP);
2347 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(1));
2348 intel_ring_emit(pipelined, fence_reg);
2349 intel_ring_emit(pipelined, val);
2350 intel_ring_advance(pipelined);
2351 } else
2352 I915_WRITE(fence_reg, val);
2353
2354 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002355}
2356
Daniel Vetterc6642782010-11-12 13:46:18 +00002357static int i830_write_fence_reg(struct drm_i915_gem_object *obj,
2358 struct intel_ring_buffer *pipelined)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002359{
Chris Wilson05394f32010-11-08 19:18:58 +00002360 struct drm_device *dev = obj->base.dev;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002361 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson05394f32010-11-08 19:18:58 +00002362 u32 size = obj->gtt_space->size;
2363 int regnum = obj->fence_reg;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002364 uint32_t val;
2365 uint32_t pitch_val;
2366
Daniel Vetterc6642782010-11-12 13:46:18 +00002367 if (WARN((obj->gtt_offset & ~I830_FENCE_START_MASK) ||
2368 (size & -size) != size ||
2369 (obj->gtt_offset & (size - 1)),
2370 "object 0x%08x not 512K or pot-size 0x%08x aligned\n",
2371 obj->gtt_offset, size))
2372 return -EINVAL;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002373
Chris Wilson05394f32010-11-08 19:18:58 +00002374 pitch_val = obj->stride / 128;
Eric Anholte76a16d2009-05-26 17:44:56 -07002375 pitch_val = ffs(pitch_val) - 1;
Eric Anholte76a16d2009-05-26 17:44:56 -07002376
Chris Wilson05394f32010-11-08 19:18:58 +00002377 val = obj->gtt_offset;
2378 if (obj->tiling_mode == I915_TILING_Y)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002379 val |= 1 << I830_FENCE_TILING_Y_SHIFT;
Daniel Vetterc6642782010-11-12 13:46:18 +00002380 val |= I830_FENCE_SIZE_BITS(size);
Jesse Barnesde151cf2008-11-12 10:03:55 -08002381 val |= pitch_val << I830_FENCE_PITCH_SHIFT;
2382 val |= I830_FENCE_REG_VALID;
2383
Daniel Vetterc6642782010-11-12 13:46:18 +00002384 if (pipelined) {
2385 int ret = intel_ring_begin(pipelined, 4);
2386 if (ret)
2387 return ret;
2388
2389 intel_ring_emit(pipelined, MI_NOOP);
2390 intel_ring_emit(pipelined, MI_LOAD_REGISTER_IMM(1));
2391 intel_ring_emit(pipelined, FENCE_REG_830_0 + regnum*4);
2392 intel_ring_emit(pipelined, val);
2393 intel_ring_advance(pipelined);
2394 } else
2395 I915_WRITE(FENCE_REG_830_0 + regnum * 4, val);
2396
2397 return 0;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002398}
2399
Chris Wilsond9e86c02010-11-10 16:40:20 +00002400static bool ring_passed_seqno(struct intel_ring_buffer *ring, u32 seqno)
2401{
2402 return i915_seqno_passed(ring->get_seqno(ring), seqno);
2403}
2404
2405static int
2406i915_gem_object_flush_fence(struct drm_i915_gem_object *obj,
2407 struct intel_ring_buffer *pipelined,
2408 bool interruptible)
2409{
2410 int ret;
2411
2412 if (obj->fenced_gpu_access) {
Chris Wilson88241782011-01-07 17:09:48 +00002413 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002414 ret = i915_gem_flush_ring(obj->last_fenced_ring,
Chris Wilson88241782011-01-07 17:09:48 +00002415 0, obj->base.write_domain);
2416 if (ret)
2417 return ret;
2418 }
Chris Wilsond9e86c02010-11-10 16:40:20 +00002419
2420 obj->fenced_gpu_access = false;
2421 }
2422
2423 if (obj->last_fenced_seqno && pipelined != obj->last_fenced_ring) {
2424 if (!ring_passed_seqno(obj->last_fenced_ring,
2425 obj->last_fenced_seqno)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002426 ret = i915_wait_request(obj->last_fenced_ring,
2427 obj->last_fenced_seqno,
2428 interruptible);
2429
Chris Wilsond9e86c02010-11-10 16:40:20 +00002430 if (ret)
2431 return ret;
2432 }
2433
2434 obj->last_fenced_seqno = 0;
2435 obj->last_fenced_ring = NULL;
2436 }
2437
Chris Wilson63256ec2011-01-04 18:42:07 +00002438 /* Ensure that all CPU reads are completed before installing a fence
2439 * and all writes before removing the fence.
2440 */
2441 if (obj->base.read_domains & I915_GEM_DOMAIN_GTT)
2442 mb();
2443
Chris Wilsond9e86c02010-11-10 16:40:20 +00002444 return 0;
2445}
2446
2447int
2448i915_gem_object_put_fence(struct drm_i915_gem_object *obj)
2449{
2450 int ret;
2451
2452 if (obj->tiling_mode)
2453 i915_gem_release_mmap(obj);
2454
2455 ret = i915_gem_object_flush_fence(obj, NULL, true);
2456 if (ret)
2457 return ret;
2458
2459 if (obj->fence_reg != I915_FENCE_REG_NONE) {
2460 struct drm_i915_private *dev_priv = obj->base.dev->dev_private;
2461 i915_gem_clear_fence_reg(obj->base.dev,
2462 &dev_priv->fence_regs[obj->fence_reg]);
2463
2464 obj->fence_reg = I915_FENCE_REG_NONE;
2465 }
2466
2467 return 0;
2468}
2469
2470static struct drm_i915_fence_reg *
2471i915_find_fence_reg(struct drm_device *dev,
2472 struct intel_ring_buffer *pipelined)
Daniel Vetterae3db242010-02-19 11:51:58 +01002473{
Daniel Vetterae3db242010-02-19 11:51:58 +01002474 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002475 struct drm_i915_fence_reg *reg, *first, *avail;
2476 int i;
Daniel Vetterae3db242010-02-19 11:51:58 +01002477
2478 /* First try to find a free reg */
Chris Wilsond9e86c02010-11-10 16:40:20 +00002479 avail = NULL;
Daniel Vetterae3db242010-02-19 11:51:58 +01002480 for (i = dev_priv->fence_reg_start; i < dev_priv->num_fence_regs; i++) {
2481 reg = &dev_priv->fence_regs[i];
2482 if (!reg->obj)
Chris Wilsond9e86c02010-11-10 16:40:20 +00002483 return reg;
Daniel Vetterae3db242010-02-19 11:51:58 +01002484
Chris Wilson05394f32010-11-08 19:18:58 +00002485 if (!reg->obj->pin_count)
Chris Wilsond9e86c02010-11-10 16:40:20 +00002486 avail = reg;
Daniel Vetterae3db242010-02-19 11:51:58 +01002487 }
2488
Chris Wilsond9e86c02010-11-10 16:40:20 +00002489 if (avail == NULL)
2490 return NULL;
Daniel Vetterae3db242010-02-19 11:51:58 +01002491
2492 /* None available, try to steal one or wait for a user to finish */
Chris Wilsond9e86c02010-11-10 16:40:20 +00002493 avail = first = NULL;
2494 list_for_each_entry(reg, &dev_priv->mm.fence_list, lru_list) {
2495 if (reg->obj->pin_count)
Daniel Vetterae3db242010-02-19 11:51:58 +01002496 continue;
2497
Chris Wilsond9e86c02010-11-10 16:40:20 +00002498 if (first == NULL)
2499 first = reg;
2500
2501 if (!pipelined ||
2502 !reg->obj->last_fenced_ring ||
2503 reg->obj->last_fenced_ring == pipelined) {
2504 avail = reg;
2505 break;
2506 }
Daniel Vetterae3db242010-02-19 11:51:58 +01002507 }
2508
Chris Wilsond9e86c02010-11-10 16:40:20 +00002509 if (avail == NULL)
2510 avail = first;
Daniel Vetterae3db242010-02-19 11:51:58 +01002511
Chris Wilsona00b10c2010-09-24 21:15:47 +01002512 return avail;
Daniel Vetterae3db242010-02-19 11:51:58 +01002513}
2514
Jesse Barnesde151cf2008-11-12 10:03:55 -08002515/**
Chris Wilsond9e86c02010-11-10 16:40:20 +00002516 * i915_gem_object_get_fence - set up a fence reg for an object
Jesse Barnesde151cf2008-11-12 10:03:55 -08002517 * @obj: object to map through a fence reg
Chris Wilsond9e86c02010-11-10 16:40:20 +00002518 * @pipelined: ring on which to queue the change, or NULL for CPU access
2519 * @interruptible: must we wait uninterruptibly for the register to retire?
Jesse Barnesde151cf2008-11-12 10:03:55 -08002520 *
2521 * When mapping objects through the GTT, userspace wants to be able to write
2522 * to them without having to worry about swizzling if the object is tiled.
2523 *
2524 * This function walks the fence regs looking for a free one for @obj,
2525 * stealing one if it can't find any.
2526 *
2527 * It then sets up the reg based on the object's properties: address, pitch
2528 * and tiling format.
2529 */
Chris Wilson8c4b8c32009-06-17 22:08:52 +01002530int
Chris Wilsond9e86c02010-11-10 16:40:20 +00002531i915_gem_object_get_fence(struct drm_i915_gem_object *obj,
2532 struct intel_ring_buffer *pipelined,
2533 bool interruptible)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002534{
Chris Wilson05394f32010-11-08 19:18:58 +00002535 struct drm_device *dev = obj->base.dev;
Jesse Barnes79e53942008-11-07 14:24:08 -08002536 struct drm_i915_private *dev_priv = dev->dev_private;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002537 struct drm_i915_fence_reg *reg;
Daniel Vetterae3db242010-02-19 11:51:58 +01002538 int ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002539
Chris Wilson6bda10d2010-12-05 21:04:18 +00002540 /* XXX disable pipelining. There are bugs. Shocking. */
2541 pipelined = NULL;
2542
Chris Wilsond9e86c02010-11-10 16:40:20 +00002543 /* Just update our place in the LRU if our fence is getting reused. */
Chris Wilson05394f32010-11-08 19:18:58 +00002544 if (obj->fence_reg != I915_FENCE_REG_NONE) {
2545 reg = &dev_priv->fence_regs[obj->fence_reg];
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002546 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002547
2548 if (!obj->fenced_gpu_access && !obj->last_fenced_seqno)
2549 pipelined = NULL;
2550
2551 if (!pipelined) {
2552 if (reg->setup_seqno) {
2553 if (!ring_passed_seqno(obj->last_fenced_ring,
2554 reg->setup_seqno)) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002555 ret = i915_wait_request(obj->last_fenced_ring,
2556 reg->setup_seqno,
2557 interruptible);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002558 if (ret)
2559 return ret;
2560 }
2561
2562 reg->setup_seqno = 0;
2563 }
2564 } else if (obj->last_fenced_ring &&
2565 obj->last_fenced_ring != pipelined) {
2566 ret = i915_gem_object_flush_fence(obj,
2567 pipelined,
2568 interruptible);
2569 if (ret)
2570 return ret;
2571 } else if (obj->tiling_changed) {
2572 if (obj->fenced_gpu_access) {
Chris Wilson88241782011-01-07 17:09:48 +00002573 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00002574 ret = i915_gem_flush_ring(obj->ring,
Chris Wilson88241782011-01-07 17:09:48 +00002575 0, obj->base.write_domain);
2576 if (ret)
2577 return ret;
2578 }
Chris Wilsond9e86c02010-11-10 16:40:20 +00002579
2580 obj->fenced_gpu_access = false;
2581 }
2582 }
2583
2584 if (!obj->fenced_gpu_access && !obj->last_fenced_seqno)
2585 pipelined = NULL;
2586 BUG_ON(!pipelined && reg->setup_seqno);
2587
2588 if (obj->tiling_changed) {
2589 if (pipelined) {
2590 reg->setup_seqno =
Chris Wilsondb53a302011-02-03 11:57:46 +00002591 i915_gem_next_request_seqno(pipelined);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002592 obj->last_fenced_seqno = reg->setup_seqno;
2593 obj->last_fenced_ring = pipelined;
2594 }
2595 goto update;
2596 }
2597
Eric Anholta09ba7f2009-08-29 12:49:51 -07002598 return 0;
2599 }
2600
Chris Wilsond9e86c02010-11-10 16:40:20 +00002601 reg = i915_find_fence_reg(dev, pipelined);
2602 if (reg == NULL)
2603 return -ENOSPC;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002604
Chris Wilsond9e86c02010-11-10 16:40:20 +00002605 ret = i915_gem_object_flush_fence(obj, pipelined, interruptible);
2606 if (ret)
Daniel Vetterae3db242010-02-19 11:51:58 +01002607 return ret;
Chris Wilsonfc7170b2009-02-11 14:26:46 +00002608
Chris Wilsond9e86c02010-11-10 16:40:20 +00002609 if (reg->obj) {
2610 struct drm_i915_gem_object *old = reg->obj;
2611
2612 drm_gem_object_reference(&old->base);
2613
2614 if (old->tiling_mode)
2615 i915_gem_release_mmap(old);
2616
Chris Wilsond9e86c02010-11-10 16:40:20 +00002617 ret = i915_gem_object_flush_fence(old,
Chris Wilson6bda10d2010-12-05 21:04:18 +00002618 pipelined,
Chris Wilsond9e86c02010-11-10 16:40:20 +00002619 interruptible);
2620 if (ret) {
2621 drm_gem_object_unreference(&old->base);
2622 return ret;
2623 }
2624
2625 if (old->last_fenced_seqno == 0 && obj->last_fenced_seqno == 0)
2626 pipelined = NULL;
2627
2628 old->fence_reg = I915_FENCE_REG_NONE;
2629 old->last_fenced_ring = pipelined;
2630 old->last_fenced_seqno =
Chris Wilsondb53a302011-02-03 11:57:46 +00002631 pipelined ? i915_gem_next_request_seqno(pipelined) : 0;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002632
2633 drm_gem_object_unreference(&old->base);
2634 } else if (obj->last_fenced_seqno == 0)
2635 pipelined = NULL;
Eric Anholta09ba7f2009-08-29 12:49:51 -07002636
Jesse Barnesde151cf2008-11-12 10:03:55 -08002637 reg->obj = obj;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002638 list_move_tail(&reg->lru_list, &dev_priv->mm.fence_list);
2639 obj->fence_reg = reg - dev_priv->fence_regs;
2640 obj->last_fenced_ring = pipelined;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002641
Chris Wilsond9e86c02010-11-10 16:40:20 +00002642 reg->setup_seqno =
Chris Wilsondb53a302011-02-03 11:57:46 +00002643 pipelined ? i915_gem_next_request_seqno(pipelined) : 0;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002644 obj->last_fenced_seqno = reg->setup_seqno;
2645
2646update:
2647 obj->tiling_changed = false;
Chris Wilsone259bef2010-09-17 00:32:02 +01002648 switch (INTEL_INFO(dev)->gen) {
2649 case 6:
Daniel Vetterc6642782010-11-12 13:46:18 +00002650 ret = sandybridge_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002651 break;
2652 case 5:
2653 case 4:
Daniel Vetterc6642782010-11-12 13:46:18 +00002654 ret = i965_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002655 break;
2656 case 3:
Daniel Vetterc6642782010-11-12 13:46:18 +00002657 ret = i915_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002658 break;
2659 case 2:
Daniel Vetterc6642782010-11-12 13:46:18 +00002660 ret = i830_write_fence_reg(obj, pipelined);
Chris Wilsone259bef2010-09-17 00:32:02 +01002661 break;
2662 }
Eric Anholtd9ddcb92009-01-27 10:33:49 -08002663
Daniel Vetterc6642782010-11-12 13:46:18 +00002664 return ret;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002665}
2666
2667/**
2668 * i915_gem_clear_fence_reg - clear out fence register info
2669 * @obj: object to clear
2670 *
2671 * Zeroes out the fence register itself and clears out the associated
Chris Wilson05394f32010-11-08 19:18:58 +00002672 * data structures in dev_priv and obj.
Jesse Barnesde151cf2008-11-12 10:03:55 -08002673 */
2674static void
Chris Wilsond9e86c02010-11-10 16:40:20 +00002675i915_gem_clear_fence_reg(struct drm_device *dev,
2676 struct drm_i915_fence_reg *reg)
Jesse Barnesde151cf2008-11-12 10:03:55 -08002677{
Jesse Barnes79e53942008-11-07 14:24:08 -08002678 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilsond9e86c02010-11-10 16:40:20 +00002679 uint32_t fence_reg = reg - dev_priv->fence_regs;
Jesse Barnesde151cf2008-11-12 10:03:55 -08002680
Chris Wilsone259bef2010-09-17 00:32:02 +01002681 switch (INTEL_INFO(dev)->gen) {
2682 case 6:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002683 I915_WRITE64(FENCE_REG_SANDYBRIDGE_0 + fence_reg*8, 0);
Chris Wilsone259bef2010-09-17 00:32:02 +01002684 break;
2685 case 5:
2686 case 4:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002687 I915_WRITE64(FENCE_REG_965_0 + fence_reg*8, 0);
Chris Wilsone259bef2010-09-17 00:32:02 +01002688 break;
2689 case 3:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002690 if (fence_reg >= 8)
2691 fence_reg = FENCE_REG_945_8 + (fence_reg - 8) * 4;
Eric Anholtdc529a42009-03-10 22:34:49 -07002692 else
Chris Wilsone259bef2010-09-17 00:32:02 +01002693 case 2:
Chris Wilsond9e86c02010-11-10 16:40:20 +00002694 fence_reg = FENCE_REG_830_0 + fence_reg * 4;
Eric Anholtdc529a42009-03-10 22:34:49 -07002695
2696 I915_WRITE(fence_reg, 0);
Chris Wilsone259bef2010-09-17 00:32:02 +01002697 break;
Eric Anholtdc529a42009-03-10 22:34:49 -07002698 }
Jesse Barnesde151cf2008-11-12 10:03:55 -08002699
Daniel Vetter007cc8a2010-04-28 11:02:31 +02002700 list_del_init(&reg->lru_list);
Chris Wilsond9e86c02010-11-10 16:40:20 +00002701 reg->obj = NULL;
2702 reg->setup_seqno = 0;
Chris Wilson52dc7d32009-06-06 09:46:01 +01002703}
2704
2705/**
Eric Anholt673a3942008-07-30 12:06:12 -07002706 * Finds free space in the GTT aperture and binds the object there.
2707 */
2708static int
Chris Wilson05394f32010-11-08 19:18:58 +00002709i915_gem_object_bind_to_gtt(struct drm_i915_gem_object *obj,
Daniel Vetter920afa72010-09-16 17:54:23 +02002710 unsigned alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01002711 bool map_and_fenceable)
Eric Anholt673a3942008-07-30 12:06:12 -07002712{
Chris Wilson05394f32010-11-08 19:18:58 +00002713 struct drm_device *dev = obj->base.dev;
Eric Anholt673a3942008-07-30 12:06:12 -07002714 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07002715 struct drm_mm_node *free_space;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002716 gfp_t gfpmask = __GFP_NORETRY | __GFP_NOWARN;
Daniel Vetter5e783302010-11-14 22:32:36 +01002717 u32 size, fence_size, fence_alignment, unfenced_alignment;
Daniel Vetter75e9e912010-11-04 17:11:09 +01002718 bool mappable, fenceable;
Chris Wilson07f73f62009-09-14 16:50:30 +01002719 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07002720
Chris Wilson05394f32010-11-08 19:18:58 +00002721 if (obj->madv != I915_MADV_WILLNEED) {
Chris Wilson3ef94da2009-09-14 16:50:29 +01002722 DRM_ERROR("Attempting to bind a purgeable object\n");
2723 return -EINVAL;
2724 }
2725
Chris Wilson05394f32010-11-08 19:18:58 +00002726 fence_size = i915_gem_get_gtt_size(obj);
2727 fence_alignment = i915_gem_get_gtt_alignment(obj);
2728 unfenced_alignment = i915_gem_get_unfenced_gtt_alignment(obj);
Chris Wilsona00b10c2010-09-24 21:15:47 +01002729
Eric Anholt673a3942008-07-30 12:06:12 -07002730 if (alignment == 0)
Daniel Vetter5e783302010-11-14 22:32:36 +01002731 alignment = map_and_fenceable ? fence_alignment :
2732 unfenced_alignment;
Daniel Vetter75e9e912010-11-04 17:11:09 +01002733 if (map_and_fenceable && alignment & (fence_alignment - 1)) {
Eric Anholt673a3942008-07-30 12:06:12 -07002734 DRM_ERROR("Invalid object alignment requested %u\n", alignment);
2735 return -EINVAL;
2736 }
2737
Chris Wilson05394f32010-11-08 19:18:58 +00002738 size = map_and_fenceable ? fence_size : obj->base.size;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002739
Chris Wilson654fc602010-05-27 13:18:21 +01002740 /* If the object is bigger than the entire aperture, reject it early
2741 * before evicting everything in a vain attempt to find space.
2742 */
Chris Wilson05394f32010-11-08 19:18:58 +00002743 if (obj->base.size >
Daniel Vetter75e9e912010-11-04 17:11:09 +01002744 (map_and_fenceable ? dev_priv->mm.gtt_mappable_end : dev_priv->mm.gtt_total)) {
Chris Wilson654fc602010-05-27 13:18:21 +01002745 DRM_ERROR("Attempting to bind an object larger than the aperture\n");
2746 return -E2BIG;
2747 }
2748
Eric Anholt673a3942008-07-30 12:06:12 -07002749 search_free:
Daniel Vetter75e9e912010-11-04 17:11:09 +01002750 if (map_and_fenceable)
Daniel Vetter920afa72010-09-16 17:54:23 +02002751 free_space =
2752 drm_mm_search_free_in_range(&dev_priv->mm.gtt_space,
Chris Wilsona00b10c2010-09-24 21:15:47 +01002753 size, alignment, 0,
Daniel Vetter920afa72010-09-16 17:54:23 +02002754 dev_priv->mm.gtt_mappable_end,
2755 0);
2756 else
2757 free_space = drm_mm_search_free(&dev_priv->mm.gtt_space,
Chris Wilsona00b10c2010-09-24 21:15:47 +01002758 size, alignment, 0);
Daniel Vetter920afa72010-09-16 17:54:23 +02002759
2760 if (free_space != NULL) {
Daniel Vetter75e9e912010-11-04 17:11:09 +01002761 if (map_and_fenceable)
Chris Wilson05394f32010-11-08 19:18:58 +00002762 obj->gtt_space =
Daniel Vetter920afa72010-09-16 17:54:23 +02002763 drm_mm_get_block_range_generic(free_space,
Chris Wilsona00b10c2010-09-24 21:15:47 +01002764 size, alignment, 0,
Daniel Vetter920afa72010-09-16 17:54:23 +02002765 dev_priv->mm.gtt_mappable_end,
2766 0);
2767 else
Chris Wilson05394f32010-11-08 19:18:58 +00002768 obj->gtt_space =
Chris Wilsona00b10c2010-09-24 21:15:47 +01002769 drm_mm_get_block(free_space, size, alignment);
Daniel Vetter920afa72010-09-16 17:54:23 +02002770 }
Chris Wilson05394f32010-11-08 19:18:58 +00002771 if (obj->gtt_space == NULL) {
Eric Anholt673a3942008-07-30 12:06:12 -07002772 /* If the gtt is empty and we're still having trouble
2773 * fitting our object in, we're out of memory.
2774 */
Daniel Vetter75e9e912010-11-04 17:11:09 +01002775 ret = i915_gem_evict_something(dev, size, alignment,
2776 map_and_fenceable);
Chris Wilson97311292009-09-21 00:22:34 +01002777 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07002778 return ret;
Chris Wilson97311292009-09-21 00:22:34 +01002779
Eric Anholt673a3942008-07-30 12:06:12 -07002780 goto search_free;
2781 }
2782
Chris Wilsone5281cc2010-10-28 13:45:36 +01002783 ret = i915_gem_object_get_pages_gtt(obj, gfpmask);
Eric Anholt673a3942008-07-30 12:06:12 -07002784 if (ret) {
Chris Wilson05394f32010-11-08 19:18:58 +00002785 drm_mm_put_block(obj->gtt_space);
2786 obj->gtt_space = NULL;
Chris Wilson07f73f62009-09-14 16:50:30 +01002787
2788 if (ret == -ENOMEM) {
Chris Wilson809b6332011-01-10 17:33:15 +00002789 /* first try to reclaim some memory by clearing the GTT */
2790 ret = i915_gem_evict_everything(dev, false);
Chris Wilson07f73f62009-09-14 16:50:30 +01002791 if (ret) {
Chris Wilson07f73f62009-09-14 16:50:30 +01002792 /* now try to shrink everyone else */
Chris Wilson4bdadb92010-01-27 13:36:32 +00002793 if (gfpmask) {
2794 gfpmask = 0;
2795 goto search_free;
Chris Wilson07f73f62009-09-14 16:50:30 +01002796 }
2797
Chris Wilson809b6332011-01-10 17:33:15 +00002798 return -ENOMEM;
Chris Wilson07f73f62009-09-14 16:50:30 +01002799 }
2800
2801 goto search_free;
2802 }
2803
Eric Anholt673a3942008-07-30 12:06:12 -07002804 return ret;
2805 }
2806
Daniel Vetter7c2e6fd2010-11-06 10:10:47 +01002807 ret = i915_gem_gtt_bind_object(obj);
2808 if (ret) {
Chris Wilsone5281cc2010-10-28 13:45:36 +01002809 i915_gem_object_put_pages_gtt(obj);
Chris Wilson05394f32010-11-08 19:18:58 +00002810 drm_mm_put_block(obj->gtt_space);
2811 obj->gtt_space = NULL;
Chris Wilson07f73f62009-09-14 16:50:30 +01002812
Chris Wilson809b6332011-01-10 17:33:15 +00002813 if (i915_gem_evict_everything(dev, false))
Chris Wilson07f73f62009-09-14 16:50:30 +01002814 return ret;
Chris Wilson07f73f62009-09-14 16:50:30 +01002815
2816 goto search_free;
Eric Anholt673a3942008-07-30 12:06:12 -07002817 }
Eric Anholt673a3942008-07-30 12:06:12 -07002818
Chris Wilson6299f992010-11-24 12:23:44 +00002819 list_add_tail(&obj->gtt_list, &dev_priv->mm.gtt_list);
Chris Wilson05394f32010-11-08 19:18:58 +00002820 list_add_tail(&obj->mm_list, &dev_priv->mm.inactive_list);
Chris Wilsonbf1a1092010-08-07 11:01:20 +01002821
Eric Anholt673a3942008-07-30 12:06:12 -07002822 /* Assert that the object is not currently in any GPU domain. As it
2823 * wasn't in the GTT, there shouldn't be any way it could have been in
2824 * a GPU cache
2825 */
Chris Wilson05394f32010-11-08 19:18:58 +00002826 BUG_ON(obj->base.read_domains & I915_GEM_GPU_DOMAINS);
2827 BUG_ON(obj->base.write_domain & I915_GEM_GPU_DOMAINS);
Eric Anholt673a3942008-07-30 12:06:12 -07002828
Chris Wilson6299f992010-11-24 12:23:44 +00002829 obj->gtt_offset = obj->gtt_space->start;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002830
Daniel Vetter75e9e912010-11-04 17:11:09 +01002831 fenceable =
Chris Wilson05394f32010-11-08 19:18:58 +00002832 obj->gtt_space->size == fence_size &&
2833 (obj->gtt_space->start & (fence_alignment -1)) == 0;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002834
Daniel Vetter75e9e912010-11-04 17:11:09 +01002835 mappable =
Chris Wilson05394f32010-11-08 19:18:58 +00002836 obj->gtt_offset + obj->base.size <= dev_priv->mm.gtt_mappable_end;
Chris Wilsona00b10c2010-09-24 21:15:47 +01002837
Chris Wilson05394f32010-11-08 19:18:58 +00002838 obj->map_and_fenceable = mappable && fenceable;
Daniel Vetter75e9e912010-11-04 17:11:09 +01002839
Chris Wilsondb53a302011-02-03 11:57:46 +00002840 trace_i915_gem_object_bind(obj, map_and_fenceable);
Eric Anholt673a3942008-07-30 12:06:12 -07002841 return 0;
2842}
2843
2844void
Chris Wilson05394f32010-11-08 19:18:58 +00002845i915_gem_clflush_object(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07002846{
Eric Anholt673a3942008-07-30 12:06:12 -07002847 /* If we don't have a page list set up, then we're not pinned
2848 * to GPU, and we can ignore the cache flush because it'll happen
2849 * again at bind time.
2850 */
Chris Wilson05394f32010-11-08 19:18:58 +00002851 if (obj->pages == NULL)
Eric Anholt673a3942008-07-30 12:06:12 -07002852 return;
2853
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002854 trace_i915_gem_object_clflush(obj);
Eric Anholtcfa16a02009-05-26 18:46:16 -07002855
Chris Wilson05394f32010-11-08 19:18:58 +00002856 drm_clflush_pages(obj->pages, obj->base.size / PAGE_SIZE);
Eric Anholt673a3942008-07-30 12:06:12 -07002857}
2858
Eric Anholte47c68e2008-11-14 13:35:19 -08002859/** Flushes any GPU write domain for the object if it's dirty. */
Chris Wilson88241782011-01-07 17:09:48 +00002860static int
Chris Wilson3619df02010-11-28 15:37:17 +00002861i915_gem_object_flush_gpu_write_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08002862{
Chris Wilson05394f32010-11-08 19:18:58 +00002863 if ((obj->base.write_domain & I915_GEM_GPU_DOMAINS) == 0)
Chris Wilson88241782011-01-07 17:09:48 +00002864 return 0;
Eric Anholte47c68e2008-11-14 13:35:19 -08002865
2866 /* Queue the GPU write cache flushing we need. */
Chris Wilsondb53a302011-02-03 11:57:46 +00002867 return i915_gem_flush_ring(obj->ring, 0, obj->base.write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002868}
2869
2870/** Flushes the GTT write domain for the object if it's dirty. */
2871static void
Chris Wilson05394f32010-11-08 19:18:58 +00002872i915_gem_object_flush_gtt_write_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08002873{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002874 uint32_t old_write_domain;
2875
Chris Wilson05394f32010-11-08 19:18:58 +00002876 if (obj->base.write_domain != I915_GEM_DOMAIN_GTT)
Eric Anholte47c68e2008-11-14 13:35:19 -08002877 return;
2878
Chris Wilson63256ec2011-01-04 18:42:07 +00002879 /* No actual flushing is required for the GTT write domain. Writes
Eric Anholte47c68e2008-11-14 13:35:19 -08002880 * to it immediately go to main memory as far as we know, so there's
2881 * no chipset flush. It also doesn't land in render cache.
Chris Wilson63256ec2011-01-04 18:42:07 +00002882 *
2883 * However, we do have to enforce the order so that all writes through
2884 * the GTT land before any writes to the device, such as updates to
2885 * the GATT itself.
Eric Anholte47c68e2008-11-14 13:35:19 -08002886 */
Chris Wilson63256ec2011-01-04 18:42:07 +00002887 wmb();
2888
Chris Wilson4a684a42010-10-28 14:44:08 +01002889 i915_gem_release_mmap(obj);
2890
Chris Wilson05394f32010-11-08 19:18:58 +00002891 old_write_domain = obj->base.write_domain;
2892 obj->base.write_domain = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002893
2894 trace_i915_gem_object_change_domain(obj,
Chris Wilson05394f32010-11-08 19:18:58 +00002895 obj->base.read_domains,
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002896 old_write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002897}
2898
2899/** Flushes the CPU write domain for the object if it's dirty. */
2900static void
Chris Wilson05394f32010-11-08 19:18:58 +00002901i915_gem_object_flush_cpu_write_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08002902{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002903 uint32_t old_write_domain;
Eric Anholte47c68e2008-11-14 13:35:19 -08002904
Chris Wilson05394f32010-11-08 19:18:58 +00002905 if (obj->base.write_domain != I915_GEM_DOMAIN_CPU)
Eric Anholte47c68e2008-11-14 13:35:19 -08002906 return;
2907
2908 i915_gem_clflush_object(obj);
Daniel Vetter40ce6572010-11-05 18:12:18 +01002909 intel_gtt_chipset_flush();
Chris Wilson05394f32010-11-08 19:18:58 +00002910 old_write_domain = obj->base.write_domain;
2911 obj->base.write_domain = 0;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002912
2913 trace_i915_gem_object_change_domain(obj,
Chris Wilson05394f32010-11-08 19:18:58 +00002914 obj->base.read_domains,
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002915 old_write_domain);
Eric Anholte47c68e2008-11-14 13:35:19 -08002916}
2917
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002918/**
2919 * Moves a single object to the GTT read, and possibly write domain.
2920 *
2921 * This function returns when the move is complete, including waiting on
2922 * flushes to occur.
2923 */
Jesse Barnes79e53942008-11-07 14:24:08 -08002924int
Chris Wilson20217462010-11-23 15:26:33 +00002925i915_gem_object_set_to_gtt_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002926{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002927 uint32_t old_write_domain, old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08002928 int ret;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002929
Eric Anholt02354392008-11-26 13:58:13 -08002930 /* Not valid to be called on unbound objects. */
Chris Wilson05394f32010-11-08 19:18:58 +00002931 if (obj->gtt_space == NULL)
Eric Anholt02354392008-11-26 13:58:13 -08002932 return -EINVAL;
2933
Chris Wilson88241782011-01-07 17:09:48 +00002934 ret = i915_gem_object_flush_gpu_write_domain(obj);
2935 if (ret)
2936 return ret;
2937
Chris Wilson87ca9c82010-12-02 09:42:56 +00002938 if (obj->pending_gpu_write || write) {
2939 ret = i915_gem_object_wait_rendering(obj, true);
2940 if (ret)
2941 return ret;
2942 }
Chris Wilson2dafb1e2010-06-07 14:03:05 +01002943
Chris Wilson72133422010-09-13 23:56:38 +01002944 i915_gem_object_flush_cpu_write_domain(obj);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002945
Chris Wilson05394f32010-11-08 19:18:58 +00002946 old_write_domain = obj->base.write_domain;
2947 old_read_domains = obj->base.read_domains;
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002948
Eric Anholt2ef7eea2008-11-10 10:53:25 -08002949 /* It should now be out of any other write domains, and we can update
2950 * the domain values for our changes.
2951 */
Chris Wilson05394f32010-11-08 19:18:58 +00002952 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_GTT) != 0);
2953 obj->base.read_domains |= I915_GEM_DOMAIN_GTT;
Eric Anholte47c68e2008-11-14 13:35:19 -08002954 if (write) {
Chris Wilson05394f32010-11-08 19:18:58 +00002955 obj->base.read_domains = I915_GEM_DOMAIN_GTT;
2956 obj->base.write_domain = I915_GEM_DOMAIN_GTT;
2957 obj->dirty = 1;
Eric Anholte47c68e2008-11-14 13:35:19 -08002958 }
2959
Chris Wilson1c5d22f2009-08-25 11:15:50 +01002960 trace_i915_gem_object_change_domain(obj,
2961 old_read_domains,
2962 old_write_domain);
2963
Eric Anholte47c68e2008-11-14 13:35:19 -08002964 return 0;
2965}
2966
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002967/*
2968 * Prepare buffer for display plane. Use uninterruptible for possible flush
2969 * wait, as in modesetting process we're not supposed to be interrupted.
2970 */
2971int
Chris Wilson05394f32010-11-08 19:18:58 +00002972i915_gem_object_set_to_display_plane(struct drm_i915_gem_object *obj,
Chris Wilson919926a2010-11-12 13:42:53 +00002973 struct intel_ring_buffer *pipelined)
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002974{
Daniel Vetterba3d8d72010-02-11 22:37:04 +01002975 uint32_t old_read_domains;
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002976 int ret;
2977
2978 /* Not valid to be called on unbound objects. */
Chris Wilson05394f32010-11-08 19:18:58 +00002979 if (obj->gtt_space == NULL)
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002980 return -EINVAL;
2981
Chris Wilson88241782011-01-07 17:09:48 +00002982 ret = i915_gem_object_flush_gpu_write_domain(obj);
2983 if (ret)
2984 return ret;
2985
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002986
Chris Wilsonced270f2010-09-26 22:47:46 +01002987 /* Currently, we are always called from an non-interruptible context. */
Chris Wilson0be73282010-12-06 14:36:27 +00002988 if (pipelined != obj->ring) {
Chris Wilsonced270f2010-09-26 22:47:46 +01002989 ret = i915_gem_object_wait_rendering(obj, false);
2990 if (ret)
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002991 return ret;
2992 }
2993
Chris Wilsonb118c1e2010-05-27 13:18:14 +01002994 i915_gem_object_flush_cpu_write_domain(obj);
2995
Chris Wilson05394f32010-11-08 19:18:58 +00002996 old_read_domains = obj->base.read_domains;
2997 obj->base.read_domains |= I915_GEM_DOMAIN_GTT;
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08002998
2999 trace_i915_gem_object_change_domain(obj,
3000 old_read_domains,
Chris Wilson05394f32010-11-08 19:18:58 +00003001 obj->base.write_domain);
Zhenyu Wangb9241ea2009-11-25 13:09:39 +08003002
3003 return 0;
3004}
3005
Chris Wilson85345512010-11-13 09:49:11 +00003006int
3007i915_gem_object_flush_gpu(struct drm_i915_gem_object *obj,
3008 bool interruptible)
3009{
Chris Wilson88241782011-01-07 17:09:48 +00003010 int ret;
3011
Chris Wilson85345512010-11-13 09:49:11 +00003012 if (!obj->active)
3013 return 0;
3014
Chris Wilson88241782011-01-07 17:09:48 +00003015 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00003016 ret = i915_gem_flush_ring(obj->ring, 0, obj->base.write_domain);
Chris Wilson88241782011-01-07 17:09:48 +00003017 if (ret)
3018 return ret;
3019 }
Chris Wilson85345512010-11-13 09:49:11 +00003020
Chris Wilson05394f32010-11-08 19:18:58 +00003021 return i915_gem_object_wait_rendering(obj, interruptible);
Chris Wilson85345512010-11-13 09:49:11 +00003022}
3023
Eric Anholte47c68e2008-11-14 13:35:19 -08003024/**
3025 * Moves a single object to the CPU read, and possibly write domain.
3026 *
3027 * This function returns when the move is complete, including waiting on
3028 * flushes to occur.
3029 */
3030static int
Chris Wilson919926a2010-11-12 13:42:53 +00003031i915_gem_object_set_to_cpu_domain(struct drm_i915_gem_object *obj, bool write)
Eric Anholte47c68e2008-11-14 13:35:19 -08003032{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003033 uint32_t old_write_domain, old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08003034 int ret;
3035
Chris Wilson88241782011-01-07 17:09:48 +00003036 ret = i915_gem_object_flush_gpu_write_domain(obj);
3037 if (ret)
3038 return ret;
3039
Daniel Vetterde18a292010-11-27 22:30:41 +01003040 ret = i915_gem_object_wait_rendering(obj, true);
3041 if (ret)
Eric Anholte47c68e2008-11-14 13:35:19 -08003042 return ret;
3043
3044 i915_gem_object_flush_gtt_write_domain(obj);
3045
3046 /* If we have a partially-valid cache of the object in the CPU,
3047 * finish invalidating it and free the per-page flags.
3048 */
3049 i915_gem_object_set_to_full_cpu_read_domain(obj);
3050
Chris Wilson05394f32010-11-08 19:18:58 +00003051 old_write_domain = obj->base.write_domain;
3052 old_read_domains = obj->base.read_domains;
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003053
Eric Anholte47c68e2008-11-14 13:35:19 -08003054 /* Flush the CPU cache if it's still invalid. */
Chris Wilson05394f32010-11-08 19:18:58 +00003055 if ((obj->base.read_domains & I915_GEM_DOMAIN_CPU) == 0) {
Eric Anholte47c68e2008-11-14 13:35:19 -08003056 i915_gem_clflush_object(obj);
Eric Anholte47c68e2008-11-14 13:35:19 -08003057
Chris Wilson05394f32010-11-08 19:18:58 +00003058 obj->base.read_domains |= I915_GEM_DOMAIN_CPU;
Eric Anholte47c68e2008-11-14 13:35:19 -08003059 }
3060
3061 /* It should now be out of any other write domains, and we can update
3062 * the domain values for our changes.
3063 */
Chris Wilson05394f32010-11-08 19:18:58 +00003064 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_CPU) != 0);
Eric Anholte47c68e2008-11-14 13:35:19 -08003065
3066 /* If we're writing through the CPU, then the GPU read domains will
3067 * need to be invalidated at next use.
3068 */
3069 if (write) {
Chris Wilson05394f32010-11-08 19:18:58 +00003070 obj->base.read_domains = I915_GEM_DOMAIN_CPU;
3071 obj->base.write_domain = I915_GEM_DOMAIN_CPU;
Eric Anholte47c68e2008-11-14 13:35:19 -08003072 }
Eric Anholt2ef7eea2008-11-10 10:53:25 -08003073
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003074 trace_i915_gem_object_change_domain(obj,
3075 old_read_domains,
3076 old_write_domain);
3077
Eric Anholt2ef7eea2008-11-10 10:53:25 -08003078 return 0;
3079}
3080
Eric Anholt673a3942008-07-30 12:06:12 -07003081/**
Eric Anholte47c68e2008-11-14 13:35:19 -08003082 * Moves the object from a partially CPU read to a full one.
Eric Anholt673a3942008-07-30 12:06:12 -07003083 *
Eric Anholte47c68e2008-11-14 13:35:19 -08003084 * Note that this only resolves i915_gem_object_set_cpu_read_domain_range(),
3085 * and doesn't handle transitioning from !(read_domains & I915_GEM_DOMAIN_CPU).
3086 */
3087static void
Chris Wilson05394f32010-11-08 19:18:58 +00003088i915_gem_object_set_to_full_cpu_read_domain(struct drm_i915_gem_object *obj)
Eric Anholte47c68e2008-11-14 13:35:19 -08003089{
Chris Wilson05394f32010-11-08 19:18:58 +00003090 if (!obj->page_cpu_valid)
Eric Anholte47c68e2008-11-14 13:35:19 -08003091 return;
3092
3093 /* If we're partially in the CPU read domain, finish moving it in.
3094 */
Chris Wilson05394f32010-11-08 19:18:58 +00003095 if (obj->base.read_domains & I915_GEM_DOMAIN_CPU) {
Eric Anholte47c68e2008-11-14 13:35:19 -08003096 int i;
3097
Chris Wilson05394f32010-11-08 19:18:58 +00003098 for (i = 0; i <= (obj->base.size - 1) / PAGE_SIZE; i++) {
3099 if (obj->page_cpu_valid[i])
Eric Anholte47c68e2008-11-14 13:35:19 -08003100 continue;
Chris Wilson05394f32010-11-08 19:18:58 +00003101 drm_clflush_pages(obj->pages + i, 1);
Eric Anholte47c68e2008-11-14 13:35:19 -08003102 }
Eric Anholte47c68e2008-11-14 13:35:19 -08003103 }
3104
3105 /* Free the page_cpu_valid mappings which are now stale, whether
3106 * or not we've got I915_GEM_DOMAIN_CPU.
3107 */
Chris Wilson05394f32010-11-08 19:18:58 +00003108 kfree(obj->page_cpu_valid);
3109 obj->page_cpu_valid = NULL;
Eric Anholte47c68e2008-11-14 13:35:19 -08003110}
3111
3112/**
3113 * Set the CPU read domain on a range of the object.
3114 *
3115 * The object ends up with I915_GEM_DOMAIN_CPU in its read flags although it's
3116 * not entirely valid. The page_cpu_valid member of the object flags which
3117 * pages have been flushed, and will be respected by
3118 * i915_gem_object_set_to_cpu_domain() if it's called on to get a valid mapping
3119 * of the whole object.
3120 *
3121 * This function returns when the move is complete, including waiting on
3122 * flushes to occur.
Eric Anholt673a3942008-07-30 12:06:12 -07003123 */
3124static int
Chris Wilson05394f32010-11-08 19:18:58 +00003125i915_gem_object_set_cpu_read_domain_range(struct drm_i915_gem_object *obj,
Eric Anholte47c68e2008-11-14 13:35:19 -08003126 uint64_t offset, uint64_t size)
Eric Anholt673a3942008-07-30 12:06:12 -07003127{
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003128 uint32_t old_read_domains;
Eric Anholte47c68e2008-11-14 13:35:19 -08003129 int i, ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003130
Chris Wilson05394f32010-11-08 19:18:58 +00003131 if (offset == 0 && size == obj->base.size)
Eric Anholte47c68e2008-11-14 13:35:19 -08003132 return i915_gem_object_set_to_cpu_domain(obj, 0);
3133
Chris Wilson88241782011-01-07 17:09:48 +00003134 ret = i915_gem_object_flush_gpu_write_domain(obj);
3135 if (ret)
3136 return ret;
3137
Daniel Vetterde18a292010-11-27 22:30:41 +01003138 ret = i915_gem_object_wait_rendering(obj, true);
3139 if (ret)
Eric Anholte47c68e2008-11-14 13:35:19 -08003140 return ret;
Daniel Vetterde18a292010-11-27 22:30:41 +01003141
Eric Anholte47c68e2008-11-14 13:35:19 -08003142 i915_gem_object_flush_gtt_write_domain(obj);
3143
3144 /* If we're already fully in the CPU read domain, we're done. */
Chris Wilson05394f32010-11-08 19:18:58 +00003145 if (obj->page_cpu_valid == NULL &&
3146 (obj->base.read_domains & I915_GEM_DOMAIN_CPU) != 0)
Eric Anholt673a3942008-07-30 12:06:12 -07003147 return 0;
3148
Eric Anholte47c68e2008-11-14 13:35:19 -08003149 /* Otherwise, create/clear the per-page CPU read domain flag if we're
3150 * newly adding I915_GEM_DOMAIN_CPU
3151 */
Chris Wilson05394f32010-11-08 19:18:58 +00003152 if (obj->page_cpu_valid == NULL) {
3153 obj->page_cpu_valid = kzalloc(obj->base.size / PAGE_SIZE,
3154 GFP_KERNEL);
3155 if (obj->page_cpu_valid == NULL)
Eric Anholte47c68e2008-11-14 13:35:19 -08003156 return -ENOMEM;
Chris Wilson05394f32010-11-08 19:18:58 +00003157 } else if ((obj->base.read_domains & I915_GEM_DOMAIN_CPU) == 0)
3158 memset(obj->page_cpu_valid, 0, obj->base.size / PAGE_SIZE);
Eric Anholt673a3942008-07-30 12:06:12 -07003159
3160 /* Flush the cache on any pages that are still invalid from the CPU's
3161 * perspective.
3162 */
Eric Anholte47c68e2008-11-14 13:35:19 -08003163 for (i = offset / PAGE_SIZE; i <= (offset + size - 1) / PAGE_SIZE;
3164 i++) {
Chris Wilson05394f32010-11-08 19:18:58 +00003165 if (obj->page_cpu_valid[i])
Eric Anholt673a3942008-07-30 12:06:12 -07003166 continue;
3167
Chris Wilson05394f32010-11-08 19:18:58 +00003168 drm_clflush_pages(obj->pages + i, 1);
Eric Anholt673a3942008-07-30 12:06:12 -07003169
Chris Wilson05394f32010-11-08 19:18:58 +00003170 obj->page_cpu_valid[i] = 1;
Eric Anholt673a3942008-07-30 12:06:12 -07003171 }
3172
Eric Anholte47c68e2008-11-14 13:35:19 -08003173 /* It should now be out of any other write domains, and we can update
3174 * the domain values for our changes.
3175 */
Chris Wilson05394f32010-11-08 19:18:58 +00003176 BUG_ON((obj->base.write_domain & ~I915_GEM_DOMAIN_CPU) != 0);
Eric Anholte47c68e2008-11-14 13:35:19 -08003177
Chris Wilson05394f32010-11-08 19:18:58 +00003178 old_read_domains = obj->base.read_domains;
3179 obj->base.read_domains |= I915_GEM_DOMAIN_CPU;
Eric Anholte47c68e2008-11-14 13:35:19 -08003180
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003181 trace_i915_gem_object_change_domain(obj,
3182 old_read_domains,
Chris Wilson05394f32010-11-08 19:18:58 +00003183 obj->base.write_domain);
Chris Wilson1c5d22f2009-08-25 11:15:50 +01003184
Eric Anholt673a3942008-07-30 12:06:12 -07003185 return 0;
3186}
3187
Eric Anholt673a3942008-07-30 12:06:12 -07003188/* Throttle our rendering by waiting until the ring has completed our requests
3189 * emitted over 20 msec ago.
3190 *
Eric Anholtb9624422009-06-03 07:27:35 +00003191 * Note that if we were to use the current jiffies each time around the loop,
3192 * we wouldn't escape the function with any frames outstanding if the time to
3193 * render a frame was over 20ms.
3194 *
Eric Anholt673a3942008-07-30 12:06:12 -07003195 * This should get us reasonable parallelism between CPU and GPU but also
3196 * relatively low latency when blocking on a particular request to finish.
3197 */
3198static int
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003199i915_gem_ring_throttle(struct drm_device *dev, struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003200{
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003201 struct drm_i915_private *dev_priv = dev->dev_private;
3202 struct drm_i915_file_private *file_priv = file->driver_priv;
Eric Anholtb9624422009-06-03 07:27:35 +00003203 unsigned long recent_enough = jiffies - msecs_to_jiffies(20);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003204 struct drm_i915_gem_request *request;
3205 struct intel_ring_buffer *ring = NULL;
3206 u32 seqno = 0;
3207 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003208
Chris Wilsone110e8d2011-01-26 15:39:14 +00003209 if (atomic_read(&dev_priv->mm.wedged))
3210 return -EIO;
3211
Chris Wilson1c255952010-09-26 11:03:27 +01003212 spin_lock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003213 list_for_each_entry(request, &file_priv->mm.request_list, client_list) {
Eric Anholtb9624422009-06-03 07:27:35 +00003214 if (time_after_eq(request->emitted_jiffies, recent_enough))
3215 break;
3216
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003217 ring = request->ring;
3218 seqno = request->seqno;
Eric Anholtb9624422009-06-03 07:27:35 +00003219 }
Chris Wilson1c255952010-09-26 11:03:27 +01003220 spin_unlock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003221
3222 if (seqno == 0)
3223 return 0;
3224
3225 ret = 0;
Chris Wilson78501ea2010-10-27 12:18:21 +01003226 if (!i915_seqno_passed(ring->get_seqno(ring), seqno)) {
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003227 /* And wait for the seqno passing without holding any locks and
3228 * causing extra latency for others. This is safe as the irq
3229 * generation is designed to be run atomically and so is
3230 * lockless.
3231 */
Chris Wilsonb13c2b92010-12-13 16:54:50 +00003232 if (ring->irq_get(ring)) {
3233 ret = wait_event_interruptible(ring->irq_queue,
3234 i915_seqno_passed(ring->get_seqno(ring), seqno)
3235 || atomic_read(&dev_priv->mm.wedged));
3236 ring->irq_put(ring);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003237
Chris Wilsonb13c2b92010-12-13 16:54:50 +00003238 if (ret == 0 && atomic_read(&dev_priv->mm.wedged))
3239 ret = -EIO;
3240 }
Chris Wilsonf787a5f2010-09-24 16:02:42 +01003241 }
3242
3243 if (ret == 0)
3244 queue_delayed_work(dev_priv->wq, &dev_priv->mm.retire_work, 0);
Eric Anholtb9624422009-06-03 07:27:35 +00003245
Eric Anholt673a3942008-07-30 12:06:12 -07003246 return ret;
3247}
3248
Eric Anholt673a3942008-07-30 12:06:12 -07003249int
Chris Wilson05394f32010-11-08 19:18:58 +00003250i915_gem_object_pin(struct drm_i915_gem_object *obj,
3251 uint32_t alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01003252 bool map_and_fenceable)
Eric Anholt673a3942008-07-30 12:06:12 -07003253{
Chris Wilson05394f32010-11-08 19:18:58 +00003254 struct drm_device *dev = obj->base.dev;
Chris Wilsonf13d3f72010-09-20 17:36:15 +01003255 struct drm_i915_private *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07003256 int ret;
3257
Chris Wilson05394f32010-11-08 19:18:58 +00003258 BUG_ON(obj->pin_count == DRM_I915_GEM_OBJECT_MAX_PIN_COUNT);
Chris Wilson23bc5982010-09-29 16:10:57 +01003259 WARN_ON(i915_verify_lists(dev));
Chris Wilsonac0c6b52010-05-27 13:18:18 +01003260
Chris Wilson05394f32010-11-08 19:18:58 +00003261 if (obj->gtt_space != NULL) {
3262 if ((alignment && obj->gtt_offset & (alignment - 1)) ||
3263 (map_and_fenceable && !obj->map_and_fenceable)) {
3264 WARN(obj->pin_count,
Chris Wilsonae7d49d2010-08-04 12:37:41 +01003265 "bo is already pinned with incorrect alignment:"
Daniel Vetter75e9e912010-11-04 17:11:09 +01003266 " offset=%x, req.alignment=%x, req.map_and_fenceable=%d,"
3267 " obj->map_and_fenceable=%d\n",
Chris Wilson05394f32010-11-08 19:18:58 +00003268 obj->gtt_offset, alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01003269 map_and_fenceable,
Chris Wilson05394f32010-11-08 19:18:58 +00003270 obj->map_and_fenceable);
Chris Wilsonac0c6b52010-05-27 13:18:18 +01003271 ret = i915_gem_object_unbind(obj);
3272 if (ret)
3273 return ret;
3274 }
3275 }
3276
Chris Wilson05394f32010-11-08 19:18:58 +00003277 if (obj->gtt_space == NULL) {
Chris Wilsona00b10c2010-09-24 21:15:47 +01003278 ret = i915_gem_object_bind_to_gtt(obj, alignment,
Daniel Vetter75e9e912010-11-04 17:11:09 +01003279 map_and_fenceable);
Chris Wilson97311292009-09-21 00:22:34 +01003280 if (ret)
Eric Anholt673a3942008-07-30 12:06:12 -07003281 return ret;
Chris Wilson22c344e2009-02-11 14:26:45 +00003282 }
Jesse Barnes76446ca2009-12-17 22:05:42 -05003283
Chris Wilson05394f32010-11-08 19:18:58 +00003284 if (obj->pin_count++ == 0) {
Chris Wilson05394f32010-11-08 19:18:58 +00003285 if (!obj->active)
3286 list_move_tail(&obj->mm_list,
Chris Wilsonf13d3f72010-09-20 17:36:15 +01003287 &dev_priv->mm.pinned_list);
Eric Anholt673a3942008-07-30 12:06:12 -07003288 }
Chris Wilson6299f992010-11-24 12:23:44 +00003289 obj->pin_mappable |= map_and_fenceable;
Eric Anholt673a3942008-07-30 12:06:12 -07003290
Chris Wilson23bc5982010-09-29 16:10:57 +01003291 WARN_ON(i915_verify_lists(dev));
Eric Anholt673a3942008-07-30 12:06:12 -07003292 return 0;
3293}
3294
3295void
Chris Wilson05394f32010-11-08 19:18:58 +00003296i915_gem_object_unpin(struct drm_i915_gem_object *obj)
Eric Anholt673a3942008-07-30 12:06:12 -07003297{
Chris Wilson05394f32010-11-08 19:18:58 +00003298 struct drm_device *dev = obj->base.dev;
Eric Anholt673a3942008-07-30 12:06:12 -07003299 drm_i915_private_t *dev_priv = dev->dev_private;
Eric Anholt673a3942008-07-30 12:06:12 -07003300
Chris Wilson23bc5982010-09-29 16:10:57 +01003301 WARN_ON(i915_verify_lists(dev));
Chris Wilson05394f32010-11-08 19:18:58 +00003302 BUG_ON(obj->pin_count == 0);
3303 BUG_ON(obj->gtt_space == NULL);
Eric Anholt673a3942008-07-30 12:06:12 -07003304
Chris Wilson05394f32010-11-08 19:18:58 +00003305 if (--obj->pin_count == 0) {
3306 if (!obj->active)
3307 list_move_tail(&obj->mm_list,
Eric Anholt673a3942008-07-30 12:06:12 -07003308 &dev_priv->mm.inactive_list);
Chris Wilson6299f992010-11-24 12:23:44 +00003309 obj->pin_mappable = false;
Eric Anholt673a3942008-07-30 12:06:12 -07003310 }
Chris Wilson23bc5982010-09-29 16:10:57 +01003311 WARN_ON(i915_verify_lists(dev));
Eric Anholt673a3942008-07-30 12:06:12 -07003312}
3313
3314int
3315i915_gem_pin_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00003316 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003317{
3318 struct drm_i915_gem_pin *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003319 struct drm_i915_gem_object *obj;
Eric Anholt673a3942008-07-30 12:06:12 -07003320 int ret;
3321
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003322 ret = i915_mutex_lock_interruptible(dev);
3323 if (ret)
3324 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003325
Chris Wilson05394f32010-11-08 19:18:58 +00003326 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Eric Anholt673a3942008-07-30 12:06:12 -07003327 if (obj == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003328 ret = -ENOENT;
3329 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07003330 }
Eric Anholt673a3942008-07-30 12:06:12 -07003331
Chris Wilson05394f32010-11-08 19:18:58 +00003332 if (obj->madv != I915_MADV_WILLNEED) {
Chris Wilsonbb6baf72009-09-22 14:24:13 +01003333 DRM_ERROR("Attempting to pin a purgeable buffer\n");
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003334 ret = -EINVAL;
3335 goto out;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003336 }
3337
Chris Wilson05394f32010-11-08 19:18:58 +00003338 if (obj->pin_filp != NULL && obj->pin_filp != file) {
Jesse Barnes79e53942008-11-07 14:24:08 -08003339 DRM_ERROR("Already pinned in i915_gem_pin_ioctl(): %d\n",
3340 args->handle);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003341 ret = -EINVAL;
3342 goto out;
Jesse Barnes79e53942008-11-07 14:24:08 -08003343 }
3344
Chris Wilson05394f32010-11-08 19:18:58 +00003345 obj->user_pin_count++;
3346 obj->pin_filp = file;
3347 if (obj->user_pin_count == 1) {
Daniel Vetter75e9e912010-11-04 17:11:09 +01003348 ret = i915_gem_object_pin(obj, args->alignment, true);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003349 if (ret)
3350 goto out;
Eric Anholt673a3942008-07-30 12:06:12 -07003351 }
3352
3353 /* XXX - flush the CPU caches for pinned objects
3354 * as the X server doesn't manage domains yet
3355 */
Eric Anholte47c68e2008-11-14 13:35:19 -08003356 i915_gem_object_flush_cpu_write_domain(obj);
Chris Wilson05394f32010-11-08 19:18:58 +00003357 args->offset = obj->gtt_offset;
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003358out:
Chris Wilson05394f32010-11-08 19:18:58 +00003359 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003360unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07003361 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003362 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003363}
3364
3365int
3366i915_gem_unpin_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00003367 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003368{
3369 struct drm_i915_gem_pin *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003370 struct drm_i915_gem_object *obj;
Chris Wilson76c1dec2010-09-25 11:22:51 +01003371 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003372
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003373 ret = i915_mutex_lock_interruptible(dev);
3374 if (ret)
3375 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003376
Chris Wilson05394f32010-11-08 19:18:58 +00003377 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Eric Anholt673a3942008-07-30 12:06:12 -07003378 if (obj == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003379 ret = -ENOENT;
3380 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07003381 }
Chris Wilson76c1dec2010-09-25 11:22:51 +01003382
Chris Wilson05394f32010-11-08 19:18:58 +00003383 if (obj->pin_filp != file) {
Jesse Barnes79e53942008-11-07 14:24:08 -08003384 DRM_ERROR("Not pinned by caller in i915_gem_pin_ioctl(): %d\n",
3385 args->handle);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003386 ret = -EINVAL;
3387 goto out;
Jesse Barnes79e53942008-11-07 14:24:08 -08003388 }
Chris Wilson05394f32010-11-08 19:18:58 +00003389 obj->user_pin_count--;
3390 if (obj->user_pin_count == 0) {
3391 obj->pin_filp = NULL;
Jesse Barnes79e53942008-11-07 14:24:08 -08003392 i915_gem_object_unpin(obj);
3393 }
Eric Anholt673a3942008-07-30 12:06:12 -07003394
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003395out:
Chris Wilson05394f32010-11-08 19:18:58 +00003396 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003397unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07003398 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003399 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003400}
3401
3402int
3403i915_gem_busy_ioctl(struct drm_device *dev, void *data,
Chris Wilson05394f32010-11-08 19:18:58 +00003404 struct drm_file *file)
Eric Anholt673a3942008-07-30 12:06:12 -07003405{
3406 struct drm_i915_gem_busy *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003407 struct drm_i915_gem_object *obj;
Chris Wilson30dbf0c2010-09-25 10:19:17 +01003408 int ret;
3409
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003410 ret = i915_mutex_lock_interruptible(dev);
3411 if (ret)
3412 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003413
Chris Wilson05394f32010-11-08 19:18:58 +00003414 obj = to_intel_bo(drm_gem_object_lookup(dev, file, args->handle));
Eric Anholt673a3942008-07-30 12:06:12 -07003415 if (obj == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003416 ret = -ENOENT;
3417 goto unlock;
Eric Anholt673a3942008-07-30 12:06:12 -07003418 }
Zou Nan haid1b851f2010-05-21 09:08:57 +08003419
Chris Wilson0be555b2010-08-04 15:36:30 +01003420 /* Count all active objects as busy, even if they are currently not used
3421 * by the gpu. Users of this interface expect objects to eventually
3422 * become non-busy without any further actions, therefore emit any
3423 * necessary flushes here.
Eric Anholtc4de0a52008-12-14 19:05:04 -08003424 */
Chris Wilson05394f32010-11-08 19:18:58 +00003425 args->busy = obj->active;
Chris Wilson0be555b2010-08-04 15:36:30 +01003426 if (args->busy) {
3427 /* Unconditionally flush objects, even when the gpu still uses this
3428 * object. Userspace calling this function indicates that it wants to
3429 * use this buffer rather sooner than later, so issuing the required
3430 * flush earlier is beneficial.
3431 */
Chris Wilson1a1c6972010-12-07 23:00:20 +00003432 if (obj->base.write_domain & I915_GEM_GPU_DOMAINS) {
Chris Wilsondb53a302011-02-03 11:57:46 +00003433 ret = i915_gem_flush_ring(obj->ring,
Chris Wilson88241782011-01-07 17:09:48 +00003434 0, obj->base.write_domain);
Chris Wilson1a1c6972010-12-07 23:00:20 +00003435 } else if (obj->ring->outstanding_lazy_request ==
3436 obj->last_rendering_seqno) {
3437 struct drm_i915_gem_request *request;
3438
Chris Wilson7a194872010-12-07 10:38:40 +00003439 /* This ring is not being cleared by active usage,
3440 * so emit a request to do so.
3441 */
Chris Wilson1a1c6972010-12-07 23:00:20 +00003442 request = kzalloc(sizeof(*request), GFP_KERNEL);
3443 if (request)
Chris Wilsondb53a302011-02-03 11:57:46 +00003444 ret = i915_add_request(obj->ring, NULL,request);
Chris Wilson1a1c6972010-12-07 23:00:20 +00003445 else
Chris Wilson7a194872010-12-07 10:38:40 +00003446 ret = -ENOMEM;
3447 }
Chris Wilson0be555b2010-08-04 15:36:30 +01003448
3449 /* Update the active list for the hardware's current position.
3450 * Otherwise this only updates on a delayed timer or when irqs
3451 * are actually unmasked, and our working set ends up being
3452 * larger than required.
3453 */
Chris Wilsondb53a302011-02-03 11:57:46 +00003454 i915_gem_retire_requests_ring(obj->ring);
Chris Wilson0be555b2010-08-04 15:36:30 +01003455
Chris Wilson05394f32010-11-08 19:18:58 +00003456 args->busy = obj->active;
Chris Wilson0be555b2010-08-04 15:36:30 +01003457 }
Eric Anholt673a3942008-07-30 12:06:12 -07003458
Chris Wilson05394f32010-11-08 19:18:58 +00003459 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003460unlock:
Eric Anholt673a3942008-07-30 12:06:12 -07003461 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003462 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003463}
3464
3465int
3466i915_gem_throttle_ioctl(struct drm_device *dev, void *data,
3467 struct drm_file *file_priv)
3468{
3469 return i915_gem_ring_throttle(dev, file_priv);
3470}
3471
Chris Wilson3ef94da2009-09-14 16:50:29 +01003472int
3473i915_gem_madvise_ioctl(struct drm_device *dev, void *data,
3474 struct drm_file *file_priv)
3475{
3476 struct drm_i915_gem_madvise *args = data;
Chris Wilson05394f32010-11-08 19:18:58 +00003477 struct drm_i915_gem_object *obj;
Chris Wilson76c1dec2010-09-25 11:22:51 +01003478 int ret;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003479
3480 switch (args->madv) {
3481 case I915_MADV_DONTNEED:
3482 case I915_MADV_WILLNEED:
3483 break;
3484 default:
3485 return -EINVAL;
3486 }
3487
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003488 ret = i915_mutex_lock_interruptible(dev);
3489 if (ret)
3490 return ret;
3491
Chris Wilson05394f32010-11-08 19:18:58 +00003492 obj = to_intel_bo(drm_gem_object_lookup(dev, file_priv, args->handle));
Chris Wilson3ef94da2009-09-14 16:50:29 +01003493 if (obj == NULL) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003494 ret = -ENOENT;
3495 goto unlock;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003496 }
Chris Wilson3ef94da2009-09-14 16:50:29 +01003497
Chris Wilson05394f32010-11-08 19:18:58 +00003498 if (obj->pin_count) {
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003499 ret = -EINVAL;
3500 goto out;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003501 }
3502
Chris Wilson05394f32010-11-08 19:18:58 +00003503 if (obj->madv != __I915_MADV_PURGED)
3504 obj->madv = args->madv;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003505
Chris Wilson2d7ef392009-09-20 23:13:10 +01003506 /* if the object is no longer bound, discard its backing storage */
Chris Wilson05394f32010-11-08 19:18:58 +00003507 if (i915_gem_object_is_purgeable(obj) &&
3508 obj->gtt_space == NULL)
Chris Wilson2d7ef392009-09-20 23:13:10 +01003509 i915_gem_object_truncate(obj);
3510
Chris Wilson05394f32010-11-08 19:18:58 +00003511 args->retained = obj->madv != __I915_MADV_PURGED;
Chris Wilsonbb6baf72009-09-22 14:24:13 +01003512
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003513out:
Chris Wilson05394f32010-11-08 19:18:58 +00003514 drm_gem_object_unreference(&obj->base);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003515unlock:
Chris Wilson3ef94da2009-09-14 16:50:29 +01003516 mutex_unlock(&dev->struct_mutex);
Chris Wilson1d7cfea2010-10-17 09:45:41 +01003517 return ret;
Chris Wilson3ef94da2009-09-14 16:50:29 +01003518}
3519
Chris Wilson05394f32010-11-08 19:18:58 +00003520struct drm_i915_gem_object *i915_gem_alloc_object(struct drm_device *dev,
3521 size_t size)
Daniel Vetterac52bc52010-04-09 19:05:06 +00003522{
Chris Wilson73aa8082010-09-30 11:46:12 +01003523 struct drm_i915_private *dev_priv = dev->dev_private;
Daniel Vetterc397b902010-04-09 19:05:07 +00003524 struct drm_i915_gem_object *obj;
3525
3526 obj = kzalloc(sizeof(*obj), GFP_KERNEL);
3527 if (obj == NULL)
3528 return NULL;
3529
3530 if (drm_gem_object_init(dev, &obj->base, size) != 0) {
3531 kfree(obj);
3532 return NULL;
3533 }
3534
Chris Wilson73aa8082010-09-30 11:46:12 +01003535 i915_gem_info_add_obj(dev_priv, size);
3536
Daniel Vetterc397b902010-04-09 19:05:07 +00003537 obj->base.write_domain = I915_GEM_DOMAIN_CPU;
3538 obj->base.read_domains = I915_GEM_DOMAIN_CPU;
3539
3540 obj->agp_type = AGP_USER_MEMORY;
Daniel Vetter62b8b212010-04-09 19:05:08 +00003541 obj->base.driver_private = NULL;
Daniel Vetterc397b902010-04-09 19:05:07 +00003542 obj->fence_reg = I915_FENCE_REG_NONE;
Chris Wilson69dc4982010-10-19 10:36:51 +01003543 INIT_LIST_HEAD(&obj->mm_list);
Daniel Vetter93a37f22010-11-05 20:24:53 +01003544 INIT_LIST_HEAD(&obj->gtt_list);
Chris Wilson69dc4982010-10-19 10:36:51 +01003545 INIT_LIST_HEAD(&obj->ring_list);
Chris Wilson432e58e2010-11-25 19:32:06 +00003546 INIT_LIST_HEAD(&obj->exec_list);
Daniel Vetterc397b902010-04-09 19:05:07 +00003547 INIT_LIST_HEAD(&obj->gpu_write_list);
Daniel Vetterc397b902010-04-09 19:05:07 +00003548 obj->madv = I915_MADV_WILLNEED;
Daniel Vetter75e9e912010-11-04 17:11:09 +01003549 /* Avoid an unnecessary call to unbind on the first bind. */
3550 obj->map_and_fenceable = true;
Daniel Vetterc397b902010-04-09 19:05:07 +00003551
Chris Wilson05394f32010-11-08 19:18:58 +00003552 return obj;
Daniel Vetterac52bc52010-04-09 19:05:06 +00003553}
3554
Eric Anholt673a3942008-07-30 12:06:12 -07003555int i915_gem_init_object(struct drm_gem_object *obj)
3556{
Daniel Vetterc397b902010-04-09 19:05:07 +00003557 BUG();
Jesse Barnesde151cf2008-11-12 10:03:55 -08003558
Eric Anholt673a3942008-07-30 12:06:12 -07003559 return 0;
3560}
3561
Chris Wilson05394f32010-11-08 19:18:58 +00003562static void i915_gem_free_object_tail(struct drm_i915_gem_object *obj)
Chris Wilsonbe726152010-07-23 23:18:50 +01003563{
Chris Wilson05394f32010-11-08 19:18:58 +00003564 struct drm_device *dev = obj->base.dev;
Chris Wilsonbe726152010-07-23 23:18:50 +01003565 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilsonbe726152010-07-23 23:18:50 +01003566 int ret;
3567
3568 ret = i915_gem_object_unbind(obj);
3569 if (ret == -ERESTARTSYS) {
Chris Wilson05394f32010-11-08 19:18:58 +00003570 list_move(&obj->mm_list,
Chris Wilsonbe726152010-07-23 23:18:50 +01003571 &dev_priv->mm.deferred_free_list);
3572 return;
3573 }
3574
Chris Wilson05394f32010-11-08 19:18:58 +00003575 if (obj->base.map_list.map)
Chris Wilsonbe726152010-07-23 23:18:50 +01003576 i915_gem_free_mmap_offset(obj);
3577
Chris Wilson05394f32010-11-08 19:18:58 +00003578 drm_gem_object_release(&obj->base);
3579 i915_gem_info_remove_obj(dev_priv, obj->base.size);
Chris Wilsonbe726152010-07-23 23:18:50 +01003580
Chris Wilson05394f32010-11-08 19:18:58 +00003581 kfree(obj->page_cpu_valid);
3582 kfree(obj->bit_17);
3583 kfree(obj);
Chris Wilsondb53a302011-02-03 11:57:46 +00003584
3585 trace_i915_gem_object_destroy(obj);
Chris Wilsonbe726152010-07-23 23:18:50 +01003586}
3587
Chris Wilson05394f32010-11-08 19:18:58 +00003588void i915_gem_free_object(struct drm_gem_object *gem_obj)
Eric Anholt673a3942008-07-30 12:06:12 -07003589{
Chris Wilson05394f32010-11-08 19:18:58 +00003590 struct drm_i915_gem_object *obj = to_intel_bo(gem_obj);
3591 struct drm_device *dev = obj->base.dev;
Eric Anholt673a3942008-07-30 12:06:12 -07003592
Chris Wilson05394f32010-11-08 19:18:58 +00003593 while (obj->pin_count > 0)
Eric Anholt673a3942008-07-30 12:06:12 -07003594 i915_gem_object_unpin(obj);
3595
Chris Wilson05394f32010-11-08 19:18:58 +00003596 if (obj->phys_obj)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003597 i915_gem_detach_phys_object(dev, obj);
3598
Chris Wilsonbe726152010-07-23 23:18:50 +01003599 i915_gem_free_object_tail(obj);
Eric Anholt673a3942008-07-30 12:06:12 -07003600}
3601
Jesse Barnes5669fca2009-02-17 15:13:31 -08003602int
Eric Anholt673a3942008-07-30 12:06:12 -07003603i915_gem_idle(struct drm_device *dev)
3604{
3605 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson29105cc2010-01-07 10:39:13 +00003606 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003607
Keith Packard6dbe2772008-10-14 21:41:13 -07003608 mutex_lock(&dev->struct_mutex);
3609
Chris Wilson87acb0a2010-10-19 10:13:00 +01003610 if (dev_priv->mm.suspended) {
Keith Packard6dbe2772008-10-14 21:41:13 -07003611 mutex_unlock(&dev->struct_mutex);
Eric Anholt673a3942008-07-30 12:06:12 -07003612 return 0;
Keith Packard6dbe2772008-10-14 21:41:13 -07003613 }
Eric Anholt673a3942008-07-30 12:06:12 -07003614
Chris Wilson29105cc2010-01-07 10:39:13 +00003615 ret = i915_gpu_idle(dev);
Keith Packard6dbe2772008-10-14 21:41:13 -07003616 if (ret) {
3617 mutex_unlock(&dev->struct_mutex);
Eric Anholt673a3942008-07-30 12:06:12 -07003618 return ret;
Keith Packard6dbe2772008-10-14 21:41:13 -07003619 }
Eric Anholt673a3942008-07-30 12:06:12 -07003620
Chris Wilson29105cc2010-01-07 10:39:13 +00003621 /* Under UMS, be paranoid and evict. */
3622 if (!drm_core_check_feature(dev, DRIVER_MODESET)) {
Chris Wilson5eac3ab2010-10-31 08:49:47 +00003623 ret = i915_gem_evict_inactive(dev, false);
Chris Wilson29105cc2010-01-07 10:39:13 +00003624 if (ret) {
3625 mutex_unlock(&dev->struct_mutex);
3626 return ret;
3627 }
3628 }
3629
Chris Wilson312817a2010-11-22 11:50:11 +00003630 i915_gem_reset_fences(dev);
3631
Chris Wilson29105cc2010-01-07 10:39:13 +00003632 /* Hack! Don't let anybody do execbuf while we don't control the chip.
3633 * We need to replace this with a semaphore, or something.
3634 * And not confound mm.suspended!
3635 */
3636 dev_priv->mm.suspended = 1;
Daniel Vetterbc0c7f12010-08-20 18:18:48 +02003637 del_timer_sync(&dev_priv->hangcheck_timer);
Chris Wilson29105cc2010-01-07 10:39:13 +00003638
3639 i915_kernel_lost_context(dev);
Keith Packard6dbe2772008-10-14 21:41:13 -07003640 i915_gem_cleanup_ringbuffer(dev);
Chris Wilson29105cc2010-01-07 10:39:13 +00003641
Keith Packard6dbe2772008-10-14 21:41:13 -07003642 mutex_unlock(&dev->struct_mutex);
3643
Chris Wilson29105cc2010-01-07 10:39:13 +00003644 /* Cancel the retire work handler, which should be idle now. */
3645 cancel_delayed_work_sync(&dev_priv->mm.retire_work);
3646
Eric Anholt673a3942008-07-30 12:06:12 -07003647 return 0;
3648}
3649
Eric Anholt673a3942008-07-30 12:06:12 -07003650int
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003651i915_gem_init_ringbuffer(struct drm_device *dev)
3652{
3653 drm_i915_private_t *dev_priv = dev->dev_private;
3654 int ret;
Chris Wilson68f95ba2010-05-27 13:18:22 +01003655
Xiang, Haihao5c1143b2010-09-16 10:43:11 +08003656 ret = intel_init_render_ring_buffer(dev);
Chris Wilson68f95ba2010-05-27 13:18:22 +01003657 if (ret)
Chris Wilsonb6913e42010-11-12 10:46:37 +00003658 return ret;
Chris Wilson68f95ba2010-05-27 13:18:22 +01003659
3660 if (HAS_BSD(dev)) {
Xiang, Haihao5c1143b2010-09-16 10:43:11 +08003661 ret = intel_init_bsd_ring_buffer(dev);
Chris Wilson68f95ba2010-05-27 13:18:22 +01003662 if (ret)
3663 goto cleanup_render_ring;
Zou Nan haid1b851f2010-05-21 09:08:57 +08003664 }
Chris Wilson68f95ba2010-05-27 13:18:22 +01003665
Chris Wilson549f7362010-10-19 11:19:32 +01003666 if (HAS_BLT(dev)) {
3667 ret = intel_init_blt_ring_buffer(dev);
3668 if (ret)
3669 goto cleanup_bsd_ring;
3670 }
3671
Chris Wilson6f392d52010-08-07 11:01:22 +01003672 dev_priv->next_seqno = 1;
3673
Chris Wilson68f95ba2010-05-27 13:18:22 +01003674 return 0;
3675
Chris Wilson549f7362010-10-19 11:19:32 +01003676cleanup_bsd_ring:
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003677 intel_cleanup_ring_buffer(&dev_priv->ring[VCS]);
Chris Wilson68f95ba2010-05-27 13:18:22 +01003678cleanup_render_ring:
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003679 intel_cleanup_ring_buffer(&dev_priv->ring[RCS]);
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003680 return ret;
3681}
3682
3683void
3684i915_gem_cleanup_ringbuffer(struct drm_device *dev)
3685{
3686 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003687 int i;
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003688
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003689 for (i = 0; i < I915_NUM_RINGS; i++)
3690 intel_cleanup_ring_buffer(&dev_priv->ring[i]);
Zou Nan hai8187a2b2010-05-21 09:08:55 +08003691}
3692
3693int
Eric Anholt673a3942008-07-30 12:06:12 -07003694i915_gem_entervt_ioctl(struct drm_device *dev, void *data,
3695 struct drm_file *file_priv)
3696{
3697 drm_i915_private_t *dev_priv = dev->dev_private;
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003698 int ret, i;
Eric Anholt673a3942008-07-30 12:06:12 -07003699
Jesse Barnes79e53942008-11-07 14:24:08 -08003700 if (drm_core_check_feature(dev, DRIVER_MODESET))
3701 return 0;
3702
Ben Gamariba1234d2009-09-14 17:48:47 -04003703 if (atomic_read(&dev_priv->mm.wedged)) {
Eric Anholt673a3942008-07-30 12:06:12 -07003704 DRM_ERROR("Reenabling wedged hardware, good luck\n");
Ben Gamariba1234d2009-09-14 17:48:47 -04003705 atomic_set(&dev_priv->mm.wedged, 0);
Eric Anholt673a3942008-07-30 12:06:12 -07003706 }
3707
Eric Anholt673a3942008-07-30 12:06:12 -07003708 mutex_lock(&dev->struct_mutex);
Eric Anholt9bb2d6f2008-12-23 18:42:32 -08003709 dev_priv->mm.suspended = 0;
3710
3711 ret = i915_gem_init_ringbuffer(dev);
Wu Fengguangd816f6a2009-04-18 10:43:32 +08003712 if (ret != 0) {
3713 mutex_unlock(&dev->struct_mutex);
Eric Anholt9bb2d6f2008-12-23 18:42:32 -08003714 return ret;
Wu Fengguangd816f6a2009-04-18 10:43:32 +08003715 }
Eric Anholt9bb2d6f2008-12-23 18:42:32 -08003716
Chris Wilson69dc4982010-10-19 10:36:51 +01003717 BUG_ON(!list_empty(&dev_priv->mm.active_list));
Eric Anholt673a3942008-07-30 12:06:12 -07003718 BUG_ON(!list_empty(&dev_priv->mm.flushing_list));
3719 BUG_ON(!list_empty(&dev_priv->mm.inactive_list));
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003720 for (i = 0; i < I915_NUM_RINGS; i++) {
3721 BUG_ON(!list_empty(&dev_priv->ring[i].active_list));
3722 BUG_ON(!list_empty(&dev_priv->ring[i].request_list));
3723 }
Eric Anholt673a3942008-07-30 12:06:12 -07003724 mutex_unlock(&dev->struct_mutex);
Kristian Høgsbergdbb19d32008-08-20 11:04:27 -04003725
Chris Wilson5f353082010-06-07 14:03:03 +01003726 ret = drm_irq_install(dev);
3727 if (ret)
3728 goto cleanup_ringbuffer;
Kristian Høgsbergdbb19d32008-08-20 11:04:27 -04003729
Eric Anholt673a3942008-07-30 12:06:12 -07003730 return 0;
Chris Wilson5f353082010-06-07 14:03:03 +01003731
3732cleanup_ringbuffer:
3733 mutex_lock(&dev->struct_mutex);
3734 i915_gem_cleanup_ringbuffer(dev);
3735 dev_priv->mm.suspended = 1;
3736 mutex_unlock(&dev->struct_mutex);
3737
3738 return ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003739}
3740
3741int
3742i915_gem_leavevt_ioctl(struct drm_device *dev, void *data,
3743 struct drm_file *file_priv)
3744{
Jesse Barnes79e53942008-11-07 14:24:08 -08003745 if (drm_core_check_feature(dev, DRIVER_MODESET))
3746 return 0;
3747
Kristian Høgsbergdbb19d32008-08-20 11:04:27 -04003748 drm_irq_uninstall(dev);
Linus Torvaldse6890f62009-09-08 17:09:24 -07003749 return i915_gem_idle(dev);
Eric Anholt673a3942008-07-30 12:06:12 -07003750}
3751
3752void
3753i915_gem_lastclose(struct drm_device *dev)
3754{
3755 int ret;
Eric Anholt673a3942008-07-30 12:06:12 -07003756
Eric Anholte806b492009-01-22 09:56:58 -08003757 if (drm_core_check_feature(dev, DRIVER_MODESET))
3758 return;
3759
Keith Packard6dbe2772008-10-14 21:41:13 -07003760 ret = i915_gem_idle(dev);
3761 if (ret)
3762 DRM_ERROR("failed to idle hardware: %d\n", ret);
Eric Anholt673a3942008-07-30 12:06:12 -07003763}
3764
Chris Wilson64193402010-10-24 12:38:05 +01003765static void
3766init_ring_lists(struct intel_ring_buffer *ring)
3767{
3768 INIT_LIST_HEAD(&ring->active_list);
3769 INIT_LIST_HEAD(&ring->request_list);
3770 INIT_LIST_HEAD(&ring->gpu_write_list);
3771}
3772
Eric Anholt673a3942008-07-30 12:06:12 -07003773void
3774i915_gem_load(struct drm_device *dev)
3775{
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003776 int i;
Eric Anholt673a3942008-07-30 12:06:12 -07003777 drm_i915_private_t *dev_priv = dev->dev_private;
3778
Chris Wilson69dc4982010-10-19 10:36:51 +01003779 INIT_LIST_HEAD(&dev_priv->mm.active_list);
Eric Anholt673a3942008-07-30 12:06:12 -07003780 INIT_LIST_HEAD(&dev_priv->mm.flushing_list);
3781 INIT_LIST_HEAD(&dev_priv->mm.inactive_list);
Chris Wilsonf13d3f72010-09-20 17:36:15 +01003782 INIT_LIST_HEAD(&dev_priv->mm.pinned_list);
Eric Anholta09ba7f2009-08-29 12:49:51 -07003783 INIT_LIST_HEAD(&dev_priv->mm.fence_list);
Chris Wilsonbe726152010-07-23 23:18:50 +01003784 INIT_LIST_HEAD(&dev_priv->mm.deferred_free_list);
Daniel Vetter93a37f22010-11-05 20:24:53 +01003785 INIT_LIST_HEAD(&dev_priv->mm.gtt_list);
Chris Wilson1ec14ad2010-12-04 11:30:53 +00003786 for (i = 0; i < I915_NUM_RINGS; i++)
3787 init_ring_lists(&dev_priv->ring[i]);
Daniel Vetter007cc8a2010-04-28 11:02:31 +02003788 for (i = 0; i < 16; i++)
3789 INIT_LIST_HEAD(&dev_priv->fence_regs[i].lru_list);
Eric Anholt673a3942008-07-30 12:06:12 -07003790 INIT_DELAYED_WORK(&dev_priv->mm.retire_work,
3791 i915_gem_retire_work_handler);
Chris Wilson30dbf0c2010-09-25 10:19:17 +01003792 init_completion(&dev_priv->error_completion);
Chris Wilson31169712009-09-14 16:50:28 +01003793
Dave Airlie94400122010-07-20 13:15:31 +10003794 /* On GEN3 we really need to make sure the ARB C3 LP bit is set */
3795 if (IS_GEN3(dev)) {
3796 u32 tmp = I915_READ(MI_ARB_STATE);
3797 if (!(tmp & MI_ARB_C3_LP_WRITE_ENABLE)) {
3798 /* arb state is a masked write, so set bit + bit in mask */
3799 tmp = MI_ARB_C3_LP_WRITE_ENABLE | (MI_ARB_C3_LP_WRITE_ENABLE << MI_ARB_MASK_SHIFT);
3800 I915_WRITE(MI_ARB_STATE, tmp);
3801 }
3802 }
3803
Chris Wilson72bfa192010-12-19 11:42:05 +00003804 dev_priv->relative_constants_mode = I915_EXEC_CONSTANTS_REL_GENERAL;
3805
Jesse Barnesde151cf2008-11-12 10:03:55 -08003806 /* Old X drivers will take 0-2 for front, back, depth buffers */
Eric Anholtb397c832010-01-26 09:43:10 -08003807 if (!drm_core_check_feature(dev, DRIVER_MODESET))
3808 dev_priv->fence_reg_start = 3;
Jesse Barnesde151cf2008-11-12 10:03:55 -08003809
Chris Wilsona6c45cf2010-09-17 00:32:17 +01003810 if (INTEL_INFO(dev)->gen >= 4 || IS_I945G(dev) || IS_I945GM(dev) || IS_G33(dev))
Jesse Barnesde151cf2008-11-12 10:03:55 -08003811 dev_priv->num_fence_regs = 16;
3812 else
3813 dev_priv->num_fence_regs = 8;
3814
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003815 /* Initialize fence registers to zero */
Chris Wilsona6c45cf2010-09-17 00:32:17 +01003816 switch (INTEL_INFO(dev)->gen) {
3817 case 6:
3818 for (i = 0; i < 16; i++)
3819 I915_WRITE64(FENCE_REG_SANDYBRIDGE_0 + (i * 8), 0);
3820 break;
3821 case 5:
3822 case 4:
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003823 for (i = 0; i < 16; i++)
3824 I915_WRITE64(FENCE_REG_965_0 + (i * 8), 0);
Chris Wilsona6c45cf2010-09-17 00:32:17 +01003825 break;
3826 case 3:
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003827 if (IS_I945G(dev) || IS_I945GM(dev) || IS_G33(dev))
3828 for (i = 0; i < 8; i++)
3829 I915_WRITE(FENCE_REG_945_8 + (i * 4), 0);
Chris Wilsona6c45cf2010-09-17 00:32:17 +01003830 case 2:
3831 for (i = 0; i < 8; i++)
3832 I915_WRITE(FENCE_REG_830_0 + (i * 4), 0);
3833 break;
Grégoire Henryb5aa8a02009-06-23 15:41:02 +02003834 }
Eric Anholt673a3942008-07-30 12:06:12 -07003835 i915_gem_detect_bit_6_swizzle(dev);
Kristian Høgsberg6b95a202009-11-18 11:25:18 -05003836 init_waitqueue_head(&dev_priv->pending_flip_queue);
Chris Wilson17250b72010-10-28 12:51:39 +01003837
3838 dev_priv->mm.inactive_shrinker.shrink = i915_gem_inactive_shrink;
3839 dev_priv->mm.inactive_shrinker.seeks = DEFAULT_SEEKS;
3840 register_shrinker(&dev_priv->mm.inactive_shrinker);
Eric Anholt673a3942008-07-30 12:06:12 -07003841}
Dave Airlie71acb5e2008-12-30 20:31:46 +10003842
3843/*
3844 * Create a physically contiguous memory object for this object
3845 * e.g. for cursor + overlay regs
3846 */
Chris Wilson995b6762010-08-20 13:23:26 +01003847static int i915_gem_init_phys_object(struct drm_device *dev,
3848 int id, int size, int align)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003849{
3850 drm_i915_private_t *dev_priv = dev->dev_private;
3851 struct drm_i915_gem_phys_object *phys_obj;
3852 int ret;
3853
3854 if (dev_priv->mm.phys_objs[id - 1] || !size)
3855 return 0;
3856
Eric Anholt9a298b22009-03-24 12:23:04 -07003857 phys_obj = kzalloc(sizeof(struct drm_i915_gem_phys_object), GFP_KERNEL);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003858 if (!phys_obj)
3859 return -ENOMEM;
3860
3861 phys_obj->id = id;
3862
Chris Wilson6eeefaf2010-08-07 11:01:39 +01003863 phys_obj->handle = drm_pci_alloc(dev, size, align);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003864 if (!phys_obj->handle) {
3865 ret = -ENOMEM;
3866 goto kfree_obj;
3867 }
3868#ifdef CONFIG_X86
3869 set_memory_wc((unsigned long)phys_obj->handle->vaddr, phys_obj->handle->size / PAGE_SIZE);
3870#endif
3871
3872 dev_priv->mm.phys_objs[id - 1] = phys_obj;
3873
3874 return 0;
3875kfree_obj:
Eric Anholt9a298b22009-03-24 12:23:04 -07003876 kfree(phys_obj);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003877 return ret;
3878}
3879
Chris Wilson995b6762010-08-20 13:23:26 +01003880static void i915_gem_free_phys_object(struct drm_device *dev, int id)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003881{
3882 drm_i915_private_t *dev_priv = dev->dev_private;
3883 struct drm_i915_gem_phys_object *phys_obj;
3884
3885 if (!dev_priv->mm.phys_objs[id - 1])
3886 return;
3887
3888 phys_obj = dev_priv->mm.phys_objs[id - 1];
3889 if (phys_obj->cur_obj) {
3890 i915_gem_detach_phys_object(dev, phys_obj->cur_obj);
3891 }
3892
3893#ifdef CONFIG_X86
3894 set_memory_wb((unsigned long)phys_obj->handle->vaddr, phys_obj->handle->size / PAGE_SIZE);
3895#endif
3896 drm_pci_free(dev, phys_obj->handle);
3897 kfree(phys_obj);
3898 dev_priv->mm.phys_objs[id - 1] = NULL;
3899}
3900
3901void i915_gem_free_all_phys_object(struct drm_device *dev)
3902{
3903 int i;
3904
Dave Airlie260883c2009-01-22 17:58:49 +10003905 for (i = I915_GEM_PHYS_CURSOR_0; i <= I915_MAX_PHYS_OBJECT; i++)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003906 i915_gem_free_phys_object(dev, i);
3907}
3908
3909void i915_gem_detach_phys_object(struct drm_device *dev,
Chris Wilson05394f32010-11-08 19:18:58 +00003910 struct drm_i915_gem_object *obj)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003911{
Chris Wilson05394f32010-11-08 19:18:58 +00003912 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Chris Wilsone5281cc2010-10-28 13:45:36 +01003913 char *vaddr;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003914 int i;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003915 int page_count;
3916
Chris Wilson05394f32010-11-08 19:18:58 +00003917 if (!obj->phys_obj)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003918 return;
Chris Wilson05394f32010-11-08 19:18:58 +00003919 vaddr = obj->phys_obj->handle->vaddr;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003920
Chris Wilson05394f32010-11-08 19:18:58 +00003921 page_count = obj->base.size / PAGE_SIZE;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003922 for (i = 0; i < page_count; i++) {
Chris Wilsone5281cc2010-10-28 13:45:36 +01003923 struct page *page = read_cache_page_gfp(mapping, i,
3924 GFP_HIGHUSER | __GFP_RECLAIMABLE);
3925 if (!IS_ERR(page)) {
3926 char *dst = kmap_atomic(page);
3927 memcpy(dst, vaddr + i*PAGE_SIZE, PAGE_SIZE);
3928 kunmap_atomic(dst);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003929
Chris Wilsone5281cc2010-10-28 13:45:36 +01003930 drm_clflush_pages(&page, 1);
3931
3932 set_page_dirty(page);
3933 mark_page_accessed(page);
3934 page_cache_release(page);
3935 }
Dave Airlie71acb5e2008-12-30 20:31:46 +10003936 }
Daniel Vetter40ce6572010-11-05 18:12:18 +01003937 intel_gtt_chipset_flush();
Chris Wilsond78b47b2009-06-17 21:52:49 +01003938
Chris Wilson05394f32010-11-08 19:18:58 +00003939 obj->phys_obj->cur_obj = NULL;
3940 obj->phys_obj = NULL;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003941}
3942
3943int
3944i915_gem_attach_phys_object(struct drm_device *dev,
Chris Wilson05394f32010-11-08 19:18:58 +00003945 struct drm_i915_gem_object *obj,
Chris Wilson6eeefaf2010-08-07 11:01:39 +01003946 int id,
3947 int align)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003948{
Chris Wilson05394f32010-11-08 19:18:58 +00003949 struct address_space *mapping = obj->base.filp->f_path.dentry->d_inode->i_mapping;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003950 drm_i915_private_t *dev_priv = dev->dev_private;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003951 int ret = 0;
3952 int page_count;
3953 int i;
3954
3955 if (id > I915_MAX_PHYS_OBJECT)
3956 return -EINVAL;
3957
Chris Wilson05394f32010-11-08 19:18:58 +00003958 if (obj->phys_obj) {
3959 if (obj->phys_obj->id == id)
Dave Airlie71acb5e2008-12-30 20:31:46 +10003960 return 0;
3961 i915_gem_detach_phys_object(dev, obj);
3962 }
3963
Dave Airlie71acb5e2008-12-30 20:31:46 +10003964 /* create a new object */
3965 if (!dev_priv->mm.phys_objs[id - 1]) {
3966 ret = i915_gem_init_phys_object(dev, id,
Chris Wilson05394f32010-11-08 19:18:58 +00003967 obj->base.size, align);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003968 if (ret) {
Chris Wilson05394f32010-11-08 19:18:58 +00003969 DRM_ERROR("failed to init phys object %d size: %zu\n",
3970 id, obj->base.size);
Chris Wilsone5281cc2010-10-28 13:45:36 +01003971 return ret;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003972 }
3973 }
3974
3975 /* bind to the object */
Chris Wilson05394f32010-11-08 19:18:58 +00003976 obj->phys_obj = dev_priv->mm.phys_objs[id - 1];
3977 obj->phys_obj->cur_obj = obj;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003978
Chris Wilson05394f32010-11-08 19:18:58 +00003979 page_count = obj->base.size / PAGE_SIZE;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003980
3981 for (i = 0; i < page_count; i++) {
Chris Wilsone5281cc2010-10-28 13:45:36 +01003982 struct page *page;
3983 char *dst, *src;
Dave Airlie71acb5e2008-12-30 20:31:46 +10003984
Chris Wilsone5281cc2010-10-28 13:45:36 +01003985 page = read_cache_page_gfp(mapping, i,
3986 GFP_HIGHUSER | __GFP_RECLAIMABLE);
3987 if (IS_ERR(page))
3988 return PTR_ERR(page);
3989
Chris Wilsonff75b9b2010-10-30 22:52:31 +01003990 src = kmap_atomic(page);
Chris Wilson05394f32010-11-08 19:18:58 +00003991 dst = obj->phys_obj->handle->vaddr + (i * PAGE_SIZE);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003992 memcpy(dst, src, PAGE_SIZE);
Peter Zijlstra3e4d3af2010-10-26 14:21:51 -07003993 kunmap_atomic(src);
Chris Wilsone5281cc2010-10-28 13:45:36 +01003994
3995 mark_page_accessed(page);
3996 page_cache_release(page);
Dave Airlie71acb5e2008-12-30 20:31:46 +10003997 }
3998
3999 return 0;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004000}
4001
4002static int
Chris Wilson05394f32010-11-08 19:18:58 +00004003i915_gem_phys_pwrite(struct drm_device *dev,
4004 struct drm_i915_gem_object *obj,
Dave Airlie71acb5e2008-12-30 20:31:46 +10004005 struct drm_i915_gem_pwrite *args,
4006 struct drm_file *file_priv)
4007{
Chris Wilson05394f32010-11-08 19:18:58 +00004008 void *vaddr = obj->phys_obj->handle->vaddr + args->offset;
Chris Wilsonb47b30c2010-11-08 01:12:29 +00004009 char __user *user_data = (char __user *) (uintptr_t) args->data_ptr;
Dave Airlie71acb5e2008-12-30 20:31:46 +10004010
Chris Wilsonb47b30c2010-11-08 01:12:29 +00004011 if (__copy_from_user_inatomic_nocache(vaddr, user_data, args->size)) {
4012 unsigned long unwritten;
4013
4014 /* The physical object once assigned is fixed for the lifetime
4015 * of the obj, so we can safely drop the lock and continue
4016 * to access vaddr.
4017 */
4018 mutex_unlock(&dev->struct_mutex);
4019 unwritten = copy_from_user(vaddr, user_data, args->size);
4020 mutex_lock(&dev->struct_mutex);
4021 if (unwritten)
4022 return -EFAULT;
4023 }
Dave Airlie71acb5e2008-12-30 20:31:46 +10004024
Daniel Vetter40ce6572010-11-05 18:12:18 +01004025 intel_gtt_chipset_flush();
Dave Airlie71acb5e2008-12-30 20:31:46 +10004026 return 0;
4027}
Eric Anholtb9624422009-06-03 07:27:35 +00004028
Chris Wilsonf787a5f2010-09-24 16:02:42 +01004029void i915_gem_release(struct drm_device *dev, struct drm_file *file)
Eric Anholtb9624422009-06-03 07:27:35 +00004030{
Chris Wilsonf787a5f2010-09-24 16:02:42 +01004031 struct drm_i915_file_private *file_priv = file->driver_priv;
Eric Anholtb9624422009-06-03 07:27:35 +00004032
4033 /* Clean up our request list when the client is going away, so that
4034 * later retire_requests won't dereference our soon-to-be-gone
4035 * file_priv.
4036 */
Chris Wilson1c255952010-09-26 11:03:27 +01004037 spin_lock(&file_priv->mm.lock);
Chris Wilsonf787a5f2010-09-24 16:02:42 +01004038 while (!list_empty(&file_priv->mm.request_list)) {
4039 struct drm_i915_gem_request *request;
4040
4041 request = list_first_entry(&file_priv->mm.request_list,
4042 struct drm_i915_gem_request,
4043 client_list);
4044 list_del(&request->client_list);
4045 request->file_priv = NULL;
4046 }
Chris Wilson1c255952010-09-26 11:03:27 +01004047 spin_unlock(&file_priv->mm.lock);
Eric Anholtb9624422009-06-03 07:27:35 +00004048}
Chris Wilson31169712009-09-14 16:50:28 +01004049
Chris Wilson31169712009-09-14 16:50:28 +01004050static int
Chris Wilson1637ef42010-04-20 17:10:35 +01004051i915_gpu_is_active(struct drm_device *dev)
4052{
4053 drm_i915_private_t *dev_priv = dev->dev_private;
4054 int lists_empty;
4055
Chris Wilson1637ef42010-04-20 17:10:35 +01004056 lists_empty = list_empty(&dev_priv->mm.flushing_list) &&
Chris Wilson17250b72010-10-28 12:51:39 +01004057 list_empty(&dev_priv->mm.active_list);
Chris Wilson1637ef42010-04-20 17:10:35 +01004058
4059 return !lists_empty;
4060}
4061
4062static int
Chris Wilson17250b72010-10-28 12:51:39 +01004063i915_gem_inactive_shrink(struct shrinker *shrinker,
4064 int nr_to_scan,
4065 gfp_t gfp_mask)
Chris Wilson31169712009-09-14 16:50:28 +01004066{
Chris Wilson17250b72010-10-28 12:51:39 +01004067 struct drm_i915_private *dev_priv =
4068 container_of(shrinker,
4069 struct drm_i915_private,
4070 mm.inactive_shrinker);
4071 struct drm_device *dev = dev_priv->dev;
4072 struct drm_i915_gem_object *obj, *next;
4073 int cnt;
4074
4075 if (!mutex_trylock(&dev->struct_mutex))
Chris Wilsonbbe2e112010-10-28 22:35:07 +01004076 return 0;
Chris Wilson31169712009-09-14 16:50:28 +01004077
4078 /* "fast-path" to count number of available objects */
4079 if (nr_to_scan == 0) {
Chris Wilson17250b72010-10-28 12:51:39 +01004080 cnt = 0;
4081 list_for_each_entry(obj,
4082 &dev_priv->mm.inactive_list,
4083 mm_list)
4084 cnt++;
4085 mutex_unlock(&dev->struct_mutex);
4086 return cnt / 100 * sysctl_vfs_cache_pressure;
Chris Wilson31169712009-09-14 16:50:28 +01004087 }
4088
Chris Wilson1637ef42010-04-20 17:10:35 +01004089rescan:
Chris Wilson31169712009-09-14 16:50:28 +01004090 /* first scan for clean buffers */
Chris Wilson17250b72010-10-28 12:51:39 +01004091 i915_gem_retire_requests(dev);
Chris Wilson31169712009-09-14 16:50:28 +01004092
Chris Wilson17250b72010-10-28 12:51:39 +01004093 list_for_each_entry_safe(obj, next,
4094 &dev_priv->mm.inactive_list,
4095 mm_list) {
4096 if (i915_gem_object_is_purgeable(obj)) {
Chris Wilson20217462010-11-23 15:26:33 +00004097 if (i915_gem_object_unbind(obj) == 0 &&
4098 --nr_to_scan == 0)
Chris Wilson17250b72010-10-28 12:51:39 +01004099 break;
Chris Wilson31169712009-09-14 16:50:28 +01004100 }
Chris Wilson31169712009-09-14 16:50:28 +01004101 }
4102
4103 /* second pass, evict/count anything still on the inactive list */
Chris Wilson17250b72010-10-28 12:51:39 +01004104 cnt = 0;
4105 list_for_each_entry_safe(obj, next,
4106 &dev_priv->mm.inactive_list,
4107 mm_list) {
Chris Wilson20217462010-11-23 15:26:33 +00004108 if (nr_to_scan &&
4109 i915_gem_object_unbind(obj) == 0)
Chris Wilson17250b72010-10-28 12:51:39 +01004110 nr_to_scan--;
Chris Wilson20217462010-11-23 15:26:33 +00004111 else
Chris Wilson17250b72010-10-28 12:51:39 +01004112 cnt++;
Chris Wilson31169712009-09-14 16:50:28 +01004113 }
4114
Chris Wilson17250b72010-10-28 12:51:39 +01004115 if (nr_to_scan && i915_gpu_is_active(dev)) {
Chris Wilson1637ef42010-04-20 17:10:35 +01004116 /*
4117 * We are desperate for pages, so as a last resort, wait
4118 * for the GPU to finish and discard whatever we can.
4119 * This has a dramatic impact to reduce the number of
4120 * OOM-killer events whilst running the GPU aggressively.
4121 */
Chris Wilson17250b72010-10-28 12:51:39 +01004122 if (i915_gpu_idle(dev) == 0)
Chris Wilson1637ef42010-04-20 17:10:35 +01004123 goto rescan;
4124 }
Chris Wilson17250b72010-10-28 12:51:39 +01004125 mutex_unlock(&dev->struct_mutex);
4126 return cnt / 100 * sysctl_vfs_cache_pressure;
Chris Wilson31169712009-09-14 16:50:28 +01004127}