Merge branch 'perf-urgent-for-linus' of git://git.kernel.org/pub/scm/linux/kernel...
[sfrench/cifs-2.6.git] / drivers / gpu / drm / i915 / selftests / i915_gem_object.c
1 /*
2  * Copyright © 2016 Intel Corporation
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  *
23  */
24
25 #include "../i915_selftest.h"
26
27 #include "mock_gem_device.h"
28 #include "huge_gem_object.h"
29
30 static int igt_gem_object(void *arg)
31 {
32         struct drm_i915_private *i915 = arg;
33         struct drm_i915_gem_object *obj;
34         int err = -ENOMEM;
35
36         /* Basic test to ensure we can create an object */
37
38         obj = i915_gem_object_create(i915, PAGE_SIZE);
39         if (IS_ERR(obj)) {
40                 err = PTR_ERR(obj);
41                 pr_err("i915_gem_object_create failed, err=%d\n", err);
42                 goto out;
43         }
44
45         err = 0;
46         i915_gem_object_put(obj);
47 out:
48         return err;
49 }
50
51 static int igt_phys_object(void *arg)
52 {
53         struct drm_i915_private *i915 = arg;
54         struct drm_i915_gem_object *obj;
55         int err;
56
57         /* Create an object and bind it to a contiguous set of physical pages,
58          * i.e. exercise the i915_gem_object_phys API.
59          */
60
61         obj = i915_gem_object_create(i915, PAGE_SIZE);
62         if (IS_ERR(obj)) {
63                 err = PTR_ERR(obj);
64                 pr_err("i915_gem_object_create failed, err=%d\n", err);
65                 goto out;
66         }
67
68         mutex_lock(&i915->drm.struct_mutex);
69         err = i915_gem_object_attach_phys(obj, PAGE_SIZE);
70         mutex_unlock(&i915->drm.struct_mutex);
71         if (err) {
72                 pr_err("i915_gem_object_attach_phys failed, err=%d\n", err);
73                 goto out_obj;
74         }
75
76         if (obj->ops != &i915_gem_phys_ops) {
77                 pr_err("i915_gem_object_attach_phys did not create a phys object\n");
78                 err = -EINVAL;
79                 goto out_obj;
80         }
81
82         if (!atomic_read(&obj->mm.pages_pin_count)) {
83                 pr_err("i915_gem_object_attach_phys did not pin its phys pages\n");
84                 err = -EINVAL;
85                 goto out_obj;
86         }
87
88         /* Make the object dirty so that put_pages must do copy back the data */
89         mutex_lock(&i915->drm.struct_mutex);
90         err = i915_gem_object_set_to_gtt_domain(obj, true);
91         mutex_unlock(&i915->drm.struct_mutex);
92         if (err) {
93                 pr_err("i915_gem_object_set_to_gtt_domain failed with err=%d\n",
94                        err);
95                 goto out_obj;
96         }
97
98 out_obj:
99         i915_gem_object_put(obj);
100 out:
101         return err;
102 }
103
104 static int igt_gem_huge(void *arg)
105 {
106         const unsigned int nreal = 509; /* just to be awkward */
107         struct drm_i915_private *i915 = arg;
108         struct drm_i915_gem_object *obj;
109         unsigned int n;
110         int err;
111
112         /* Basic sanitycheck of our huge fake object allocation */
113
114         obj = huge_gem_object(i915,
115                               nreal * PAGE_SIZE,
116                               i915->ggtt.base.total + PAGE_SIZE);
117         if (IS_ERR(obj))
118                 return PTR_ERR(obj);
119
120         err = i915_gem_object_pin_pages(obj);
121         if (err) {
122                 pr_err("Failed to allocate %u pages (%lu total), err=%d\n",
123                        nreal, obj->base.size / PAGE_SIZE, err);
124                 goto out;
125         }
126
127         for (n = 0; n < obj->base.size / PAGE_SIZE; n++) {
128                 if (i915_gem_object_get_page(obj, n) !=
129                     i915_gem_object_get_page(obj, n % nreal)) {
130                         pr_err("Page lookup mismatch at index %u [%u]\n",
131                                n, n % nreal);
132                         err = -EINVAL;
133                         goto out_unpin;
134                 }
135         }
136
137 out_unpin:
138         i915_gem_object_unpin_pages(obj);
139 out:
140         i915_gem_object_put(obj);
141         return err;
142 }
143
144 struct tile {
145         unsigned int width;
146         unsigned int height;
147         unsigned int stride;
148         unsigned int size;
149         unsigned int tiling;
150         unsigned int swizzle;
151 };
152
153 static u64 swizzle_bit(unsigned int bit, u64 offset)
154 {
155         return (offset & BIT_ULL(bit)) >> (bit - 6);
156 }
157
158 static u64 tiled_offset(const struct tile *tile, u64 v)
159 {
160         u64 x, y;
161
162         if (tile->tiling == I915_TILING_NONE)
163                 return v;
164
165         y = div64_u64_rem(v, tile->stride, &x);
166         v = div64_u64_rem(y, tile->height, &y) * tile->stride * tile->height;
167
168         if (tile->tiling == I915_TILING_X) {
169                 v += y * tile->width;
170                 v += div64_u64_rem(x, tile->width, &x) << tile->size;
171                 v += x;
172         } else {
173                 const unsigned int ytile_span = 16;
174                 const unsigned int ytile_height = 32 * ytile_span;
175
176                 v += y * ytile_span;
177                 v += div64_u64_rem(x, ytile_span, &x) * ytile_height;
178                 v += x;
179         }
180
181         switch (tile->swizzle) {
182         case I915_BIT_6_SWIZZLE_9:
183                 v ^= swizzle_bit(9, v);
184                 break;
185         case I915_BIT_6_SWIZZLE_9_10:
186                 v ^= swizzle_bit(9, v) ^ swizzle_bit(10, v);
187                 break;
188         case I915_BIT_6_SWIZZLE_9_11:
189                 v ^= swizzle_bit(9, v) ^ swizzle_bit(11, v);
190                 break;
191         case I915_BIT_6_SWIZZLE_9_10_11:
192                 v ^= swizzle_bit(9, v) ^ swizzle_bit(10, v) ^ swizzle_bit(11, v);
193                 break;
194         }
195
196         return v;
197 }
198
199 static int check_partial_mapping(struct drm_i915_gem_object *obj,
200                                  const struct tile *tile,
201                                  unsigned long end_time)
202 {
203         const unsigned int nreal = obj->scratch / PAGE_SIZE;
204         const unsigned long npages = obj->base.size / PAGE_SIZE;
205         struct i915_vma *vma;
206         unsigned long page;
207         int err;
208
209         if (igt_timeout(end_time,
210                         "%s: timed out before tiling=%d stride=%d\n",
211                         __func__, tile->tiling, tile->stride))
212                 return -EINTR;
213
214         err = i915_gem_object_set_tiling(obj, tile->tiling, tile->stride);
215         if (err)
216                 return err;
217
218         GEM_BUG_ON(i915_gem_object_get_tiling(obj) != tile->tiling);
219         GEM_BUG_ON(i915_gem_object_get_stride(obj) != tile->stride);
220
221         for_each_prime_number_from(page, 1, npages) {
222                 struct i915_ggtt_view view =
223                         compute_partial_view(obj, page, MIN_CHUNK_PAGES);
224                 u32 __iomem *io;
225                 struct page *p;
226                 unsigned int n;
227                 u64 offset;
228                 u32 *cpu;
229
230                 GEM_BUG_ON(view.partial.size > nreal);
231
232                 err = i915_gem_object_set_to_gtt_domain(obj, true);
233                 if (err)
234                         return err;
235
236                 vma = i915_gem_object_ggtt_pin(obj, &view, 0, 0, PIN_MAPPABLE);
237                 if (IS_ERR(vma)) {
238                         pr_err("Failed to pin partial view: offset=%lu\n",
239                                page);
240                         return PTR_ERR(vma);
241                 }
242
243                 n = page - view.partial.offset;
244                 GEM_BUG_ON(n >= view.partial.size);
245
246                 io = i915_vma_pin_iomap(vma);
247                 i915_vma_unpin(vma);
248                 if (IS_ERR(io)) {
249                         pr_err("Failed to iomap partial view: offset=%lu\n",
250                                page);
251                         return PTR_ERR(io);
252                 }
253
254                 err = i915_vma_get_fence(vma);
255                 if (err) {
256                         pr_err("Failed to get fence for partial view: offset=%lu\n",
257                                page);
258                         i915_vma_unpin_iomap(vma);
259                         return err;
260                 }
261
262                 iowrite32(page, io + n * PAGE_SIZE/sizeof(*io));
263                 i915_vma_unpin_iomap(vma);
264
265                 offset = tiled_offset(tile, page << PAGE_SHIFT);
266                 if (offset >= obj->base.size)
267                         continue;
268
269                 flush_write_domain(obj, ~I915_GEM_DOMAIN_CPU);
270
271                 p = i915_gem_object_get_page(obj, offset >> PAGE_SHIFT);
272                 cpu = kmap(p) + offset_in_page(offset);
273                 drm_clflush_virt_range(cpu, sizeof(*cpu));
274                 if (*cpu != (u32)page) {
275                         pr_err("Partial view for %lu [%u] (offset=%llu, size=%u [%llu, row size %u], fence=%d, tiling=%d, stride=%d) misalignment, expected write to page (%llu + %u [0x%llx]) of 0x%x, found 0x%x\n",
276                                page, n,
277                                view.partial.offset,
278                                view.partial.size,
279                                vma->size >> PAGE_SHIFT,
280                                tile_row_pages(obj),
281                                vma->fence ? vma->fence->id : -1, tile->tiling, tile->stride,
282                                offset >> PAGE_SHIFT,
283                                (unsigned int)offset_in_page(offset),
284                                offset,
285                                (u32)page, *cpu);
286                         err = -EINVAL;
287                 }
288                 *cpu = 0;
289                 drm_clflush_virt_range(cpu, sizeof(*cpu));
290                 kunmap(p);
291                 if (err)
292                         return err;
293         }
294
295         return 0;
296 }
297
298 static int igt_partial_tiling(void *arg)
299 {
300         const unsigned int nreal = 1 << 12; /* largest tile row x2 */
301         struct drm_i915_private *i915 = arg;
302         struct drm_i915_gem_object *obj;
303         int tiling;
304         int err;
305
306         /* We want to check the page mapping and fencing of a large object
307          * mmapped through the GTT. The object we create is larger than can
308          * possibly be mmaped as a whole, and so we must use partial GGTT vma.
309          * We then check that a write through each partial GGTT vma ends up
310          * in the right set of pages within the object, and with the expected
311          * tiling, which we verify by manual swizzling.
312          */
313
314         obj = huge_gem_object(i915,
315                               nreal << PAGE_SHIFT,
316                               (1 + next_prime_number(i915->ggtt.base.total >> PAGE_SHIFT)) << PAGE_SHIFT);
317         if (IS_ERR(obj))
318                 return PTR_ERR(obj);
319
320         err = i915_gem_object_pin_pages(obj);
321         if (err) {
322                 pr_err("Failed to allocate %u pages (%lu total), err=%d\n",
323                        nreal, obj->base.size / PAGE_SIZE, err);
324                 goto out;
325         }
326
327         mutex_lock(&i915->drm.struct_mutex);
328
329         if (1) {
330                 IGT_TIMEOUT(end);
331                 struct tile tile;
332
333                 tile.height = 1;
334                 tile.width = 1;
335                 tile.size = 0;
336                 tile.stride = 0;
337                 tile.swizzle = I915_BIT_6_SWIZZLE_NONE;
338                 tile.tiling = I915_TILING_NONE;
339
340                 err = check_partial_mapping(obj, &tile, end);
341                 if (err && err != -EINTR)
342                         goto out_unlock;
343         }
344
345         for (tiling = I915_TILING_X; tiling <= I915_TILING_Y; tiling++) {
346                 IGT_TIMEOUT(end);
347                 unsigned int max_pitch;
348                 unsigned int pitch;
349                 struct tile tile;
350
351                 tile.tiling = tiling;
352                 switch (tiling) {
353                 case I915_TILING_X:
354                         tile.swizzle = i915->mm.bit_6_swizzle_x;
355                         break;
356                 case I915_TILING_Y:
357                         tile.swizzle = i915->mm.bit_6_swizzle_y;
358                         break;
359                 }
360
361                 if (tile.swizzle == I915_BIT_6_SWIZZLE_UNKNOWN ||
362                     tile.swizzle == I915_BIT_6_SWIZZLE_9_10_17)
363                         continue;
364
365                 if (INTEL_GEN(i915) <= 2) {
366                         tile.height = 16;
367                         tile.width = 128;
368                         tile.size = 11;
369                 } else if (tile.tiling == I915_TILING_Y &&
370                            HAS_128_BYTE_Y_TILING(i915)) {
371                         tile.height = 32;
372                         tile.width = 128;
373                         tile.size = 12;
374                 } else {
375                         tile.height = 8;
376                         tile.width = 512;
377                         tile.size = 12;
378                 }
379
380                 if (INTEL_GEN(i915) < 4)
381                         max_pitch = 8192 / tile.width;
382                 else if (INTEL_GEN(i915) < 7)
383                         max_pitch = 128 * I965_FENCE_MAX_PITCH_VAL / tile.width;
384                 else
385                         max_pitch = 128 * GEN7_FENCE_MAX_PITCH_VAL / tile.width;
386
387                 for (pitch = max_pitch; pitch; pitch >>= 1) {
388                         tile.stride = tile.width * pitch;
389                         err = check_partial_mapping(obj, &tile, end);
390                         if (err == -EINTR)
391                                 goto next_tiling;
392                         if (err)
393                                 goto out_unlock;
394
395                         if (pitch > 2 && INTEL_GEN(i915) >= 4) {
396                                 tile.stride = tile.width * (pitch - 1);
397                                 err = check_partial_mapping(obj, &tile, end);
398                                 if (err == -EINTR)
399                                         goto next_tiling;
400                                 if (err)
401                                         goto out_unlock;
402                         }
403
404                         if (pitch < max_pitch && INTEL_GEN(i915) >= 4) {
405                                 tile.stride = tile.width * (pitch + 1);
406                                 err = check_partial_mapping(obj, &tile, end);
407                                 if (err == -EINTR)
408                                         goto next_tiling;
409                                 if (err)
410                                         goto out_unlock;
411                         }
412                 }
413
414                 if (INTEL_GEN(i915) >= 4) {
415                         for_each_prime_number(pitch, max_pitch) {
416                                 tile.stride = tile.width * pitch;
417                                 err = check_partial_mapping(obj, &tile, end);
418                                 if (err == -EINTR)
419                                         goto next_tiling;
420                                 if (err)
421                                         goto out_unlock;
422                         }
423                 }
424
425 next_tiling: ;
426         }
427
428 out_unlock:
429         mutex_unlock(&i915->drm.struct_mutex);
430         i915_gem_object_unpin_pages(obj);
431 out:
432         i915_gem_object_put(obj);
433         return err;
434 }
435
436 static int make_obj_busy(struct drm_i915_gem_object *obj)
437 {
438         struct drm_i915_private *i915 = to_i915(obj->base.dev);
439         struct drm_i915_gem_request *rq;
440         struct i915_vma *vma;
441         int err;
442
443         vma = i915_vma_instance(obj, &i915->ggtt.base, NULL);
444         if (IS_ERR(vma))
445                 return PTR_ERR(vma);
446
447         err = i915_vma_pin(vma, 0, 0, PIN_USER);
448         if (err)
449                 return err;
450
451         rq = i915_gem_request_alloc(i915->engine[RCS], i915->kernel_context);
452         if (IS_ERR(rq)) {
453                 i915_vma_unpin(vma);
454                 return PTR_ERR(rq);
455         }
456
457         i915_vma_move_to_active(vma, rq, 0);
458         i915_add_request(rq);
459
460         i915_gem_object_set_active_reference(obj);
461         i915_vma_unpin(vma);
462         return 0;
463 }
464
465 static bool assert_mmap_offset(struct drm_i915_private *i915,
466                                unsigned long size,
467                                int expected)
468 {
469         struct drm_i915_gem_object *obj;
470         int err;
471
472         obj = i915_gem_object_create_internal(i915, size);
473         if (IS_ERR(obj))
474                 return PTR_ERR(obj);
475
476         err = i915_gem_object_create_mmap_offset(obj);
477         i915_gem_object_put(obj);
478
479         return err == expected;
480 }
481
482 static int igt_mmap_offset_exhaustion(void *arg)
483 {
484         struct drm_i915_private *i915 = arg;
485         struct drm_mm *mm = &i915->drm.vma_offset_manager->vm_addr_space_mm;
486         struct drm_i915_gem_object *obj;
487         struct drm_mm_node resv, *hole;
488         u64 hole_start, hole_end;
489         int loop, err;
490
491         /* Trim the device mmap space to only a page */
492         memset(&resv, 0, sizeof(resv));
493         drm_mm_for_each_hole(hole, mm, hole_start, hole_end) {
494                 resv.start = hole_start;
495                 resv.size = hole_end - hole_start - 1; /* PAGE_SIZE units */
496                 err = drm_mm_reserve_node(mm, &resv);
497                 if (err) {
498                         pr_err("Failed to trim VMA manager, err=%d\n", err);
499                         return err;
500                 }
501                 break;
502         }
503
504         /* Just fits! */
505         if (!assert_mmap_offset(i915, PAGE_SIZE, 0)) {
506                 pr_err("Unable to insert object into single page hole\n");
507                 err = -EINVAL;
508                 goto out;
509         }
510
511         /* Too large */
512         if (!assert_mmap_offset(i915, 2*PAGE_SIZE, -ENOSPC)) {
513                 pr_err("Unexpectedly succeeded in inserting too large object into single page hole\n");
514                 err = -EINVAL;
515                 goto out;
516         }
517
518         /* Fill the hole, further allocation attempts should then fail */
519         obj = i915_gem_object_create_internal(i915, PAGE_SIZE);
520         if (IS_ERR(obj)) {
521                 err = PTR_ERR(obj);
522                 goto out;
523         }
524
525         err = i915_gem_object_create_mmap_offset(obj);
526         if (err) {
527                 pr_err("Unable to insert object into reclaimed hole\n");
528                 goto err_obj;
529         }
530
531         if (!assert_mmap_offset(i915, PAGE_SIZE, -ENOSPC)) {
532                 pr_err("Unexpectedly succeeded in inserting object into no holes!\n");
533                 err = -EINVAL;
534                 goto err_obj;
535         }
536
537         i915_gem_object_put(obj);
538
539         /* Now fill with busy dead objects that we expect to reap */
540         for (loop = 0; loop < 3; loop++) {
541                 obj = i915_gem_object_create_internal(i915, PAGE_SIZE);
542                 if (IS_ERR(obj)) {
543                         err = PTR_ERR(obj);
544                         goto out;
545                 }
546
547                 mutex_lock(&i915->drm.struct_mutex);
548                 intel_runtime_pm_get(i915);
549                 err = make_obj_busy(obj);
550                 intel_runtime_pm_put(i915);
551                 mutex_unlock(&i915->drm.struct_mutex);
552                 if (err) {
553                         pr_err("[loop %d] Failed to busy the object\n", loop);
554                         goto err_obj;
555                 }
556
557                 GEM_BUG_ON(!i915_gem_object_is_active(obj));
558                 err = i915_gem_object_create_mmap_offset(obj);
559                 if (err) {
560                         pr_err("[loop %d] i915_gem_object_create_mmap_offset failed with err=%d\n",
561                                loop, err);
562                         goto out;
563                 }
564         }
565
566 out:
567         drm_mm_remove_node(&resv);
568         return err;
569 err_obj:
570         i915_gem_object_put(obj);
571         goto out;
572 }
573
574 int i915_gem_object_mock_selftests(void)
575 {
576         static const struct i915_subtest tests[] = {
577                 SUBTEST(igt_gem_object),
578                 SUBTEST(igt_phys_object),
579         };
580         struct drm_i915_private *i915;
581         int err;
582
583         i915 = mock_gem_device();
584         if (!i915)
585                 return -ENOMEM;
586
587         err = i915_subtests(tests, i915);
588
589         drm_dev_unref(&i915->drm);
590         return err;
591 }
592
593 int i915_gem_object_live_selftests(struct drm_i915_private *i915)
594 {
595         static const struct i915_subtest tests[] = {
596                 SUBTEST(igt_gem_huge),
597                 SUBTEST(igt_partial_tiling),
598                 SUBTEST(igt_mmap_offset_exhaustion),
599         };
600
601         return i915_subtests(tests, i915);
602 }