Merge tag 'for-linus-4.8-rc0-tag' of git://git.kernel.org/pub/scm/linux/kernel/git...
[sfrench/cifs-2.6.git] / drivers / gpu / drm / ttm / ttm_bo.c
1 /**************************************************************************
2  *
3  * Copyright (c) 2006-2009 VMware, Inc., Palo Alto, CA., USA
4  * All Rights Reserved.
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the
8  * "Software"), to deal in the Software without restriction, including
9  * without limitation the rights to use, copy, modify, merge, publish,
10  * distribute, sub license, and/or sell copies of the Software, and to
11  * permit persons to whom the Software is furnished to do so, subject to
12  * the following conditions:
13  *
14  * The above copyright notice and this permission notice (including the
15  * next paragraph) shall be included in all copies or substantial portions
16  * of the Software.
17  *
18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
21  * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
22  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
23  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
24  * USE OR OTHER DEALINGS IN THE SOFTWARE.
25  *
26  **************************************************************************/
27 /*
28  * Authors: Thomas Hellstrom <thellstrom-at-vmware-dot-com>
29  */
30
31 #define pr_fmt(fmt) "[TTM] " fmt
32
33 #include <drm/ttm/ttm_module.h>
34 #include <drm/ttm/ttm_bo_driver.h>
35 #include <drm/ttm/ttm_placement.h>
36 #include <linux/jiffies.h>
37 #include <linux/slab.h>
38 #include <linux/sched.h>
39 #include <linux/mm.h>
40 #include <linux/file.h>
41 #include <linux/module.h>
42 #include <linux/atomic.h>
43 #include <linux/reservation.h>
44
/*
 * TTM_ASSERT_LOCKED() and TTM_DEBUG() are defined with empty replacement
 * lists, so every use of them in this file compiles to nothing.
 */
45 #define TTM_ASSERT_LOCKED(param)
46 #define TTM_DEBUG(fmt, arg...)
47 #define TTM_BO_HASH_ORDER 13
48
49 static int ttm_bo_swapout(struct ttm_mem_shrink *shrink);
50 static void ttm_bo_global_kobj_release(struct kobject *kobj);
51
/* sysfs attribute "bo_count"; S_IRUGO makes it read-only for everyone. */
52 static struct attribute ttm_bo_count = {
53         .name = "bo_count",
54         .mode = S_IRUGO
55 };
56
57 static inline int ttm_mem_type_from_place(const struct ttm_place *place,
58                                           uint32_t *mem_type)
59 {
60         int i;
61
62         for (i = 0; i <= TTM_PL_PRIV5; i++)
63                 if (place->flags & (1 << i)) {
64                         *mem_type = i;
65                         return 0;
66                 }
67         return -EINVAL;
68 }
69
70 static void ttm_mem_type_debug(struct ttm_bo_device *bdev, int mem_type)
71 {
72         struct ttm_mem_type_manager *man = &bdev->man[mem_type];
73
74         pr_err("    has_type: %d\n", man->has_type);
75         pr_err("    use_type: %d\n", man->use_type);
76         pr_err("    flags: 0x%08X\n", man->flags);
77         pr_err("    gpu_offset: 0x%08llX\n", man->gpu_offset);
78         pr_err("    size: %llu\n", man->size);
79         pr_err("    available_caching: 0x%08X\n", man->available_caching);
80         pr_err("    default_caching: 0x%08X\n", man->default_caching);
81         if (mem_type != TTM_PL_SYSTEM)
82                 (*man->func->debug)(man, TTM_PFX);
83 }
84
85 static void ttm_bo_mem_space_debug(struct ttm_buffer_object *bo,
86                                         struct ttm_placement *placement)
87 {
88         int i, ret, mem_type;
89
90         pr_err("No space for %p (%lu pages, %luK, %luM)\n",
91                bo, bo->mem.num_pages, bo->mem.size >> 10,
92                bo->mem.size >> 20);
93         for (i = 0; i < placement->num_placement; i++) {
94                 ret = ttm_mem_type_from_place(&placement->placement[i],
95                                                 &mem_type);
96                 if (ret)
97                         return;
98                 pr_err("  placement[%d]=0x%08X (%d)\n",
99                        i, placement->placement[i].flags, mem_type);
100                 ttm_mem_type_debug(bo->bdev, mem_type);
101         }
102 }
103
104 static ssize_t ttm_bo_global_show(struct kobject *kobj,
105                                   struct attribute *attr,
106                                   char *buffer)
107 {
108         struct ttm_bo_global *glob =
109                 container_of(kobj, struct ttm_bo_global, kobj);
110
111         return snprintf(buffer, PAGE_SIZE, "%lu\n",
112                         (unsigned long) atomic_read(&glob->bo_count));
113 }
114
/* NULL-terminated attribute list used as the kobj_type's default_attrs. */
115 static struct attribute *ttm_bo_global_attrs[] = {
116         &ttm_bo_count,
117         NULL
118 };
119
/* Only a show callback is provided; no store callback is set. */
120 static const struct sysfs_ops ttm_bo_global_ops = {
121         .show = &ttm_bo_global_show
122 };
123
/*
 * kobject type tying together the release handler, the sysfs operations and
 * the default attribute list defined in this file.
 */
124 static struct kobj_type ttm_bo_glob_kobj_type  = {
125         .release = &ttm_bo_global_kobj_release,
126         .sysfs_ops = &ttm_bo_global_ops,
127         .default_attrs = ttm_bo_global_attrs
128 };
129
130
/**
 * ttm_bo_type_flags - placement flag bit for a memory type index
 * @type: memory type index (must be below 32)
 *
 * The shift is done on an unsigned 32-bit one so that index 31 is well
 * defined; shifting a signed int into its sign bit is undefined behaviour.
 *
 * Returns a mask with only bit @type set.
 */
static inline uint32_t ttm_bo_type_flags(unsigned type)
{
	return (uint32_t)1 << type;
}
135
136 static void ttm_bo_release_list(struct kref *list_kref)
137 {
138         struct ttm_buffer_object *bo =
139             container_of(list_kref, struct ttm_buffer_object, list_kref);
140         struct ttm_bo_device *bdev = bo->bdev;
141         size_t acc_size = bo->acc_size;
142
143         BUG_ON(atomic_read(&bo->list_kref.refcount));
144         BUG_ON(atomic_read(&bo->kref.refcount));
145         BUG_ON(atomic_read(&bo->cpu_writers));
146         BUG_ON(bo->mem.mm_node != NULL);
147         BUG_ON(!list_empty(&bo->lru));
148         BUG_ON(!list_empty(&bo->ddestroy));
149
150         if (bo->ttm)
151                 ttm_tt_destroy(bo->ttm);
152         atomic_dec(&bo->glob->bo_count);
153         if (bo->resv == &bo->ttm_resv)
154                 reservation_object_fini(&bo->ttm_resv);
155         mutex_destroy(&bo->wu_mutex);
156         if (bo->destroy)
157                 bo->destroy(bo);
158         else {
159                 kfree(bo);
160         }
161         ttm_mem_global_free(bdev->glob->mem_glob, acc_size);
162 }
163
164 void ttm_bo_add_to_lru(struct ttm_buffer_object *bo)
165 {
166         struct ttm_bo_device *bdev = bo->bdev;
167
168         lockdep_assert_held(&bo->resv->lock.base);
169
170         if (!(bo->mem.placement & TTM_PL_FLAG_NO_EVICT)) {
171
172                 BUG_ON(!list_empty(&bo->lru));
173
174                 list_add(&bo->lru, bdev->driver->lru_tail(bo));
175                 kref_get(&bo->list_kref);
176
177                 if (bo->ttm && !(bo->ttm->page_flags & TTM_PAGE_FLAG_SG)) {
178                         list_add(&bo->swap, bdev->driver->swap_lru_tail(bo));
179                         kref_get(&bo->list_kref);
180                 }
181         }
182 }
183 EXPORT_SYMBOL(ttm_bo_add_to_lru);
184
185 int ttm_bo_del_from_lru(struct ttm_buffer_object *bo)
186 {
187         struct ttm_bo_device *bdev = bo->bdev;
188         int put_count = 0;
189
190         if (bdev->driver->lru_removal)
191                 bdev->driver->lru_removal(bo);
192
193         if (!list_empty(&bo->swap)) {
194                 list_del_init(&bo->swap);
195                 ++put_count;
196         }
197         if (!list_empty(&bo->lru)) {
198                 list_del_init(&bo->lru);
199                 ++put_count;
200         }
201
202         return put_count;
203 }
204
/*
 * kref release callback that must never run: ttm_bo_list_ref_sub() installs
 * it when the caller states the reference count cannot reach zero.
 */
205 static void ttm_bo_ref_bug(struct kref *list_kref)
206 {
207         BUG();
208 }
209
210 void ttm_bo_list_ref_sub(struct ttm_buffer_object *bo, int count,
211                          bool never_free)
212 {
213         kref_sub(&bo->list_kref, count,
214                  (never_free) ? ttm_bo_ref_bug : ttm_bo_release_list);
215 }
216
217 void ttm_bo_del_sub_from_lru(struct ttm_buffer_object *bo)
218 {
219         int put_count;
220
221         spin_lock(&bo->glob->lru_lock);
222         put_count = ttm_bo_del_from_lru(bo);
223         spin_unlock(&bo->glob->lru_lock);
224         ttm_bo_list_ref_sub(bo, put_count, true);
225 }
226 EXPORT_SYMBOL(ttm_bo_del_sub_from_lru);
227
228 void ttm_bo_move_to_lru_tail(struct ttm_buffer_object *bo)
229 {
230         struct ttm_bo_device *bdev = bo->bdev;
231         int put_count = 0;
232
233         lockdep_assert_held(&bo->resv->lock.base);
234
235         if (bdev->driver->lru_removal)
236                 bdev->driver->lru_removal(bo);
237
238         put_count = ttm_bo_del_from_lru(bo);
239         ttm_bo_list_ref_sub(bo, put_count, true);
240         ttm_bo_add_to_lru(bo);
241 }
242 EXPORT_SYMBOL(ttm_bo_move_to_lru_tail);
243
244 struct list_head *ttm_bo_default_lru_tail(struct ttm_buffer_object *bo)
245 {
246         return bo->bdev->man[bo->mem.mem_type].lru.prev;
247 }
248 EXPORT_SYMBOL(ttm_bo_default_lru_tail);
249
250 struct list_head *ttm_bo_default_swap_lru_tail(struct ttm_buffer_object *bo)
251 {
252         return bo->glob->swap_lru.prev;
253 }
254 EXPORT_SYMBOL(ttm_bo_default_swap_lru_tail);
255
256 /*
257  * Call bo->mutex locked.
258  */
259 static int ttm_bo_add_ttm(struct ttm_buffer_object *bo, bool zero_alloc)
260 {
261         struct ttm_bo_device *bdev = bo->bdev;
262         struct ttm_bo_global *glob = bo->glob;
263         int ret = 0;
264         uint32_t page_flags = 0;
265
266         TTM_ASSERT_LOCKED(&bo->mutex);
267         bo->ttm = NULL;
268
269         if (bdev->need_dma32)
270                 page_flags |= TTM_PAGE_FLAG_DMA32;
271
272         switch (bo->type) {
273         case ttm_bo_type_device:
274                 if (zero_alloc)
275                         page_flags |= TTM_PAGE_FLAG_ZERO_ALLOC;
276         case ttm_bo_type_kernel:
277                 bo->ttm = bdev->driver->ttm_tt_create(bdev, bo->num_pages << PAGE_SHIFT,
278                                                       page_flags, glob->dummy_read_page);
279                 if (unlikely(bo->ttm == NULL))
280                         ret = -ENOMEM;
281                 break;
282         case ttm_bo_type_sg:
283                 bo->ttm = bdev->driver->ttm_tt_create(bdev, bo->num_pages << PAGE_SHIFT,
284                                                       page_flags | TTM_PAGE_FLAG_SG,
285                                                       glob->dummy_read_page);
286                 if (unlikely(bo->ttm == NULL)) {
287                         ret = -ENOMEM;
288                         break;
289                 }
290                 bo->ttm->sg = bo->sg;
291                 break;
292         default:
293                 pr_err("Illegal buffer object type\n");
294                 ret = -EINVAL;
295                 break;
296         }
297
298         return ret;
299 }
300
/*
 * ttm_bo_handle_move_mem - move a buffer object into a new memory region
 * @bo:            buffer object to move
 * @mem:           destination region; on success of the system-memory
 *                 shortcut below its mm_node is handed over to bo->mem
 * @evict:         forwarded to the move implementation
 * @interruptible: forwarded to the driver's move callback
 * @no_wait_gpu:   forwarded to the move implementation
 *
 * Creates and binds a ttm when the destination memory type is not FIXED,
 * notifies the driver through move_notify, performs the move with the
 * appropriate helper and finally refreshes bo->offset / bo->cur_placement.
 *
 * Returns 0 on success or the error code of the step that failed.
 */
301 static int ttm_bo_handle_move_mem(struct ttm_buffer_object *bo,
302                                   struct ttm_mem_reg *mem,
303                                   bool evict, bool interruptible,
304                                   bool no_wait_gpu)
305 {
306         struct ttm_bo_device *bdev = bo->bdev;
307         bool old_is_pci = ttm_mem_reg_is_pci(bdev, &bo->mem);
308         bool new_is_pci = ttm_mem_reg_is_pci(bdev, mem);
309         struct ttm_mem_type_manager *old_man = &bdev->man[bo->mem.mem_type];
310         struct ttm_mem_type_manager *new_man = &bdev->man[mem->mem_type];
311         int ret = 0;
312
        /*
         * Virtual mappings are torn down when either side is PCI memory or
         * when the old and new placements share no caching flag.
         */
313         if (old_is_pci || new_is_pci ||
314             ((mem->placement & bo->mem.placement & TTM_PL_MASK_CACHING) == 0)) {
315                 ret = ttm_mem_io_lock(old_man, true);
316                 if (unlikely(ret != 0))
317                         goto out_err;
318                 ttm_bo_unmap_virtual_locked(bo);
319                 ttm_mem_io_unlock(old_man);
320         }
321
322         /*
323          * Create and bind a ttm if required.
324          */
325
326         if (!(new_man->flags & TTM_MEMTYPE_FLAG_FIXED)) {
327                 if (bo->ttm == NULL) {
                        /* Zeroed pages are only requested when the old type is not FIXED. */
328                         bool zero = !(old_man->flags & TTM_MEMTYPE_FLAG_FIXED);
329                         ret = ttm_bo_add_ttm(bo, zero);
330                         if (ret)
331                                 goto out_err;
332                 }
333
334                 ret = ttm_tt_set_placement_caching(bo->ttm, mem->placement);
335                 if (ret)
336                         goto out_err;
337
338                 if (mem->mem_type != TTM_PL_SYSTEM) {
339                         ret = ttm_tt_bind(bo->ttm, mem);
340                         if (ret)
341                                 goto out_err;
342                 }
343
                /*
                 * Shortcut: coming from system memory no move helper is
                 * called.  bo->mem simply adopts *mem, and mem->mm_node is
                 * cleared so @mem no longer refers to the node bo->mem now
                 * holds.
                 */
344                 if (bo->mem.mem_type == TTM_PL_SYSTEM) {
345                         if (bdev->driver->move_notify)
346                                 bdev->driver->move_notify(bo, mem);
347                         bo->mem = *mem;
348                         mem->mm_node = NULL;
349                         goto moved;
350                 }
351         }
352
353         if (bdev->driver->move_notify)
354                 bdev->driver->move_notify(bo, mem);
355
        /*
         * Pick the move implementation: ttm-to-ttm when neither side is
         * FIXED, otherwise the driver's move hook if it has one, otherwise
         * the memcpy fallback.
         */
356         if (!(old_man->flags & TTM_MEMTYPE_FLAG_FIXED) &&
357             !(new_man->flags & TTM_MEMTYPE_FLAG_FIXED))
358                 ret = ttm_bo_move_ttm(bo, evict, no_wait_gpu, mem);
359         else if (bdev->driver->move)
360                 ret = bdev->driver->move(bo, evict, interruptible,
361                                          no_wait_gpu, mem);
362         else
363                 ret = ttm_bo_move_memcpy(bo, evict, no_wait_gpu, mem);
364
365         if (ret) {
                /*
                 * The driver was already told about the move.  Undo that by
                 * temporarily swapping bo->mem and *mem, notifying again (so
                 * the callback sees the reverse transition) and then
                 * restoring both to their original contents.
                 */
366                 if (bdev->driver->move_notify) {
367                         struct ttm_mem_reg tmp_mem = *mem;
368                         *mem = bo->mem;
369                         bo->mem = tmp_mem;
370                         bdev->driver->move_notify(bo, mem);
371                         bo->mem = *mem;
372                         *mem = tmp_mem;
373                 }
374
375                 goto out_err;
376         }
377
378 moved:
379         if (bo->evicted) {
380                 if (bdev->driver->invalidate_caches) {
                        /* A failure here is only logged; the function still returns 0. */
381                         ret = bdev->driver->invalidate_caches(bdev, bo->mem.placement);
382                         if (ret)
383                                 pr_err("Can not flush read caches\n");
384                 }
385                 bo->evicted = false;
386         }
387
        /* bo->mem.start is a page number; convert to a byte offset. */
388         if (bo->mem.mm_node) {
389                 bo->offset = (bo->mem.start << PAGE_SHIFT) +
390                     bdev->man[bo->mem.mem_type].gpu_offset;
391                 bo->cur_placement = bo->mem.placement;
392         } else
393                 bo->offset = 0;
394
395         return 0;
396
397 out_err:
        /*
         * new_man is re-pointed at the manager of the memory type the buffer
         * is in now.  If that type is FIXED, any ttm still attached is
         * unbound and destroyed.
         */
398         new_man = &bdev->man[bo->mem.mem_type];
399         if ((new_man->flags & TTM_MEMTYPE_FLAG_FIXED) && bo->ttm) {
400                 ttm_tt_unbind(bo->ttm);
401                 ttm_tt_destroy(bo->ttm);
402                 bo->ttm = NULL;
403         }
404
405         return ret;
406 }
407
408 /**
409  * Call bo::reserved.
410  * Will release GPU memory type usage on destruction.
411  * This is the place to put in driver specific hooks to release
412  * driver private resources.
413  * Will release the bo::reserved lock.
414  */
415
416 static void ttm_bo_cleanup_memtype_use(struct ttm_buffer_object *bo)
417 {
418         if (bo->bdev->driver->move_notify)
419                 bo->bdev->driver->move_notify(bo, NULL);
420
421         if (bo->ttm) {
422                 ttm_tt_unbind(bo->ttm);
423                 ttm_tt_destroy(bo->ttm);
424                 bo->ttm = NULL;
425         }
426         ttm_bo_mem_put(bo, &bo->mem);
427
428         ww_mutex_unlock (&bo->resv->lock);
429 }
430
431 static void ttm_bo_flush_all_fences(struct ttm_buffer_object *bo)
432 {
433         struct reservation_object_list *fobj;
434         struct fence *fence;
435         int i;
436
437         fobj = reservation_object_get_list(bo->resv);
438         fence = reservation_object_get_excl(bo->resv);
439         if (fence && !fence->ops->signaled)
440                 fence_enable_sw_signaling(fence);
441
442         for (i = 0; fobj && i < fobj->shared_count; ++i) {
443                 fence = rcu_dereference_protected(fobj->shared[i],
444                                         reservation_object_held(bo->resv));
445
446                 if (!fence->ops->signaled)
447                         fence_enable_sw_signaling(fence);
448         }
449 }
450
451 static void ttm_bo_cleanup_refs_or_queue(struct ttm_buffer_object *bo)
452 {
453         struct ttm_bo_device *bdev = bo->bdev;
454         struct ttm_bo_global *glob = bo->glob;
455         int put_count;
456         int ret;
457
458         spin_lock(&glob->lru_lock);
459         ret = __ttm_bo_reserve(bo, false, true, NULL);
460
461         if (!ret) {
462                 if (!ttm_bo_wait(bo, false, true)) {
463                         put_count = ttm_bo_del_from_lru(bo);
464
465                         spin_unlock(&glob->lru_lock);
466                         ttm_bo_cleanup_memtype_use(bo);
467
468                         ttm_bo_list_ref_sub(bo, put_count, true);
469
470                         return;
471                 } else
472                         ttm_bo_flush_all_fences(bo);
473
474                 /*
475                  * Make NO_EVICT bos immediately available to
476                  * shrinkers, now that they are queued for
477                  * destruction.
478                  */
479                 if (bo->mem.placement & TTM_PL_FLAG_NO_EVICT) {
480                         bo->mem.placement &= ~TTM_PL_FLAG_NO_EVICT;
481                         ttm_bo_add_to_lru(bo);
482                 }
483
484                 __ttm_bo_unreserve(bo);
485         }
486
487         kref_get(&bo->list_kref);
488         list_add_tail(&bo->ddestroy, &bdev->ddestroy);
489         spin_unlock(&glob->lru_lock);
490
491         schedule_delayed_work(&bdev->wq,
492                               ((HZ / 100) < 1) ? 1 : HZ / 100);
493 }
494
495 /**
496  * function ttm_bo_cleanup_refs_and_unlock
497  * If bo idle, remove from delayed- and lru lists, and unref.
498  * If not idle, do nothing.
499  *
500  * Must be called with lru_lock and reservation held, this function
501  * will drop both before returning.
502  *
503  * @interruptible         Any sleeps should occur interruptibly.
504  * @no_wait_gpu           Never wait for gpu. Return -EBUSY instead.
 *
 * Returns 0 when the buffer was cleaned up (or when another thread took the
 * reservation while this one was waiting), -EBUSY when the 30 second wait
 * timed out, a negative error code from the wait, or the result of the
 * non-blocking ttm_bo_wait() when the buffer is still busy.
505  */
506
507 static int ttm_bo_cleanup_refs_and_unlock(struct ttm_buffer_object *bo,
508                                           bool interruptible,
509                                           bool no_wait_gpu)
510 {
511         struct ttm_bo_global *glob = bo->glob;
512         int put_count;
513         int ret;
514
        /* Non-blocking idle check first (no_wait_gpu == true). */
515         ret = ttm_bo_wait(bo, false, true);
516
517         if (ret && !no_wait_gpu) {
518                 long lret;
                /* Both locks are dropped before sleeping on the fences. */
519                 ww_mutex_unlock(&bo->resv->lock);
520                 spin_unlock(&glob->lru_lock);
521
522                 lret = reservation_object_wait_timeout_rcu(bo->resv,
523                                                            true,
524                                                            interruptible,
525                                                            30 * HZ);
526
                /* On these two returns neither lock is held any more. */
527                 if (lret < 0)
528                         return lret;
529                 else if (lret == 0)
530                         return -EBUSY;
531
532                 spin_lock(&glob->lru_lock);
533                 ret = __ttm_bo_reserve(bo, false, true, NULL);
534
535                 /*
536                  * We raced, and lost, someone else holds the reservation now,
537                  * and is probably busy in ttm_bo_cleanup_memtype_use.
538                  *
539                  * Even if it's not the case, because we finished waiting any
540                  * delayed destruction would succeed, so just return success
541                  * here.
542                  */
543                 if (ret) {
544                         spin_unlock(&glob->lru_lock);
545                         return 0;
546                 }
547
548                 /*
549                  * remove sync_obj with ttm_bo_wait, the wait should be
550                  * finished, and no new wait object should have been added.
551                  */
552                 ret = ttm_bo_wait(bo, false, true);
553                 WARN_ON(ret);
554         }
555
        /*
         * Still busy, or no longer on the ddestroy list: just release the
         * reservation and the lru_lock.
         */
556         if (ret || unlikely(list_empty(&bo->ddestroy))) {
557                 __ttm_bo_unreserve(bo);
558                 spin_unlock(&glob->lru_lock);
559                 return ret;
560         }
561
562         put_count = ttm_bo_del_from_lru(bo);
563         list_del_init(&bo->ddestroy);
        /* One more reference to drop: the one taken when queued on ddestroy. */
564         ++put_count;
565
566         spin_unlock(&glob->lru_lock);
        /* ttm_bo_cleanup_memtype_use() also releases the reservation. */
567         ttm_bo_cleanup_memtype_use(bo);
568
569         ttm_bo_list_ref_sub(bo, put_count, true);
570
571         return 0;
572 }
573
574 /**
575  * Traverse the delayed list, and call ttm_bo_cleanup_refs_and_unlock on all
576  * encountered buffers.
 *
 * @bdev:        device whose ddestroy list is walked
 * @remove_all:  when true, a failed non-blocking reserve is retried with a
 *               blocking one, and the cleanup is allowed to wait for the GPU
 *
 * Returns 0 when the walk ended without error, otherwise the first non-zero
 * result of a reserve or cleanup attempt, at which point the walk stops.
577  */
578
579 static int ttm_bo_delayed_delete(struct ttm_bo_device *bdev, bool remove_all)
580 {
581         struct ttm_bo_global *glob = bdev->glob;
582         struct ttm_buffer_object *entry = NULL;
583         int ret = 0;
584
585         spin_lock(&glob->lru_lock);
586         if (list_empty(&bdev->ddestroy))
587                 goto out_unlock;
588
589         entry = list_first_entry(&bdev->ddestroy,
590                 struct ttm_buffer_object, ddestroy);
        /* Pin the entry so it stays valid while lru_lock is dropped. */
591         kref_get(&entry->list_kref);
592
593         for (;;) {
594                 struct ttm_buffer_object *nentry = NULL;
595
                /* Pin the successor as well before the lock can be released. */
596                 if (entry->ddestroy.next != &bdev->ddestroy) {
597                         nentry = list_first_entry(&entry->ddestroy,
598                                 struct ttm_buffer_object, ddestroy);
599                         kref_get(&nentry->list_kref);
600                 }
601
602                 ret = __ttm_bo_reserve(entry, false, true, NULL);
603                 if (remove_all && ret) {
                        /* Retry with a blocking reserve, outside lru_lock. */
604                         spin_unlock(&glob->lru_lock);
605                         ret = __ttm_bo_reserve(entry, false, false, NULL);
606                         spin_lock(&glob->lru_lock);
607                 }
608
                /*
                 * Either branch leaves lru_lock released; the cleanup helper
                 * drops it (and the reservation) itself.
                 */
609                 if (!ret)
610                         ret = ttm_bo_cleanup_refs_and_unlock(entry, false,
611                                                              !remove_all);
612                 else
613                         spin_unlock(&glob->lru_lock);
614
615                 kref_put(&entry->list_kref, ttm_bo_release_list);
616                 entry = nentry;
617
                /* lru_lock is not held here, hence the jump past out_unlock. */
618                 if (ret || !entry)
619                         goto out;
620
621                 spin_lock(&glob->lru_lock);
                /* The pinned successor was unlinked from ddestroy meanwhile: stop. */
622                 if (list_empty(&entry->ddestroy))
623                         break;
624         }
625
626 out_unlock:
627         spin_unlock(&glob->lru_lock);
628 out:
        /* Drop the pin on whichever entry is still held, if any. */
629         if (entry)
630                 kref_put(&entry->list_kref, ttm_bo_release_list);
631         return ret;
632 }
633
634 static void ttm_bo_delayed_workqueue(struct work_struct *work)
635 {
636         struct ttm_bo_device *bdev =
637             container_of(work, struct ttm_bo_device, wq.work);
638
639         if (ttm_bo_delayed_delete(bdev, false)) {
640                 schedule_delayed_work(&bdev->wq,
641                                       ((HZ / 100) < 1) ? 1 : HZ / 100);
642         }
643 }
644
645 static void ttm_bo_release(struct kref *kref)
646 {
647         struct ttm_buffer_object *bo =
648             container_of(kref, struct ttm_buffer_object, kref);
649         struct ttm_bo_device *bdev = bo->bdev;
650         struct ttm_mem_type_manager *man = &bdev->man[bo->mem.mem_type];
651
652         drm_vma_offset_remove(&bdev->vma_manager, &bo->vma_node);
653         ttm_mem_io_lock(man, false);
654         ttm_mem_io_free_vm(bo);
655         ttm_mem_io_unlock(man);
656         ttm_bo_cleanup_refs_or_queue(bo);
657         kref_put(&bo->list_kref, ttm_bo_release_list);
658 }
659
660 void ttm_bo_unref(struct ttm_buffer_object **p_bo)
661 {
662         struct ttm_buffer_object *bo = *p_bo;
663
664         *p_bo = NULL;
665         kref_put(&bo->kref, ttm_bo_release);
666 }
667 EXPORT_SYMBOL(ttm_bo_unref);
668
669 int ttm_bo_lock_delayed_workqueue(struct ttm_bo_device *bdev)
670 {
671         return cancel_delayed_work_sync(&bdev->wq);
672 }
673 EXPORT_SYMBOL(ttm_bo_lock_delayed_workqueue);
674
675 void ttm_bo_unlock_delayed_workqueue(struct ttm_bo_device *bdev, int resched)
676 {
677         if (resched)
678                 schedule_delayed_work(&bdev->wq,
679                                       ((HZ / 100) < 1) ? 1 : HZ / 100);
680 }
681 EXPORT_SYMBOL(ttm_bo_unlock_delayed_workqueue);
682
683 static int ttm_bo_evict(struct ttm_buffer_object *bo, bool interruptible,
684                         bool no_wait_gpu)
685 {
686         struct ttm_bo_device *bdev = bo->bdev;
687         struct ttm_mem_reg evict_mem;
688         struct ttm_placement placement;
689         int ret = 0;
690
691         ret = ttm_bo_wait(bo, interruptible, no_wait_gpu);
692
693         if (unlikely(ret != 0)) {
694                 if (ret != -ERESTARTSYS) {
695                         pr_err("Failed to expire sync object before buffer eviction\n");
696                 }
697                 goto out;
698         }
699
700         lockdep_assert_held(&bo->resv->lock.base);
701
702         evict_mem = bo->mem;
703         evict_mem.mm_node = NULL;
704         evict_mem.bus.io_reserved_vm = false;
705         evict_mem.bus.io_reserved_count = 0;
706
707         placement.num_placement = 0;
708         placement.num_busy_placement = 0;
709         bdev->driver->evict_flags(bo, &placement);
710         ret = ttm_bo_mem_space(bo, &placement, &evict_mem, interruptible,
711                                 no_wait_gpu);
712         if (ret) {
713                 if (ret != -ERESTARTSYS) {
714                         pr_err("Failed to find memory space for buffer 0x%p eviction\n",
715                                bo);
716                         ttm_bo_mem_space_debug(bo, &placement);
717                 }
718                 goto out;
719         }
720
721         ret = ttm_bo_handle_move_mem(bo, &evict_mem, true, interruptible,
722                                      no_wait_gpu);
723         if (ret) {
724                 if (ret != -ERESTARTSYS)
725                         pr_err("Buffer eviction failed\n");
726                 ttm_bo_mem_put(bo, &evict_mem);
727                 goto out;
728         }
729         bo->evicted = true;
730 out:
731         return ret;
732 }
733
734 static int ttm_mem_evict_first(struct ttm_bo_device *bdev,
735                                 uint32_t mem_type,
736                                 const struct ttm_place *place,
737                                 bool interruptible,
738                                 bool no_wait_gpu)
739 {
740         struct ttm_bo_global *glob = bdev->glob;
741         struct ttm_mem_type_manager *man = &bdev->man[mem_type];
742         struct ttm_buffer_object *bo;
743         int ret = -EBUSY, put_count;
744
745         spin_lock(&glob->lru_lock);
746         list_for_each_entry(bo, &man->lru, lru) {
747                 ret = __ttm_bo_reserve(bo, false, true, NULL);
748                 if (!ret) {
749                         if (place && (place->fpfn || place->lpfn)) {
750                                 /* Don't evict this BO if it's outside of the
751                                  * requested placement range
752                                  */
753                                 if (place->fpfn >= (bo->mem.start + bo->mem.size) ||
754                                     (place->lpfn && place->lpfn <= bo->mem.start)) {
755                                         __ttm_bo_unreserve(bo);
756                                         ret = -EBUSY;
757                                         continue;
758                                 }
759                         }
760
761                         break;
762                 }
763         }
764
765         if (ret) {
766                 spin_unlock(&glob->lru_lock);
767                 return ret;
768         }
769
770         kref_get(&bo->list_kref);
771
772         if (!list_empty(&bo->ddestroy)) {
773                 ret = ttm_bo_cleanup_refs_and_unlock(bo, interruptible,
774                                                      no_wait_gpu);
775                 kref_put(&bo->list_kref, ttm_bo_release_list);
776                 return ret;
777         }
778
779         put_count = ttm_bo_del_from_lru(bo);
780         spin_unlock(&glob->lru_lock);
781
782         BUG_ON(ret != 0);
783
784         ttm_bo_list_ref_sub(bo, put_count, true);
785
786         ret = ttm_bo_evict(bo, interruptible, no_wait_gpu);
787         ttm_bo_unreserve(bo);
788
789         kref_put(&bo->list_kref, ttm_bo_release_list);
790         return ret;
791 }
792
793 void ttm_bo_mem_put(struct ttm_buffer_object *bo, struct ttm_mem_reg *mem)
794 {
795         struct ttm_mem_type_manager *man = &bo->bdev->man[mem->mem_type];
796
797         if (mem->mm_node)
798                 (*man->func->put_node)(man, mem);
799 }
800 EXPORT_SYMBOL(ttm_bo_mem_put);
801
802 /**
803  * Repeatedly evict memory from the LRU for @mem_type until we create enough
804  * space, or we've evicted everything and there isn't enough space.
805  */
806 static int ttm_bo_mem_force_space(struct ttm_buffer_object *bo,
807                                         uint32_t mem_type,
808                                         const struct ttm_place *place,
809                                         struct ttm_mem_reg *mem,
810                                         bool interruptible,
811                                         bool no_wait_gpu)
812 {
813         struct ttm_bo_device *bdev = bo->bdev;
814         struct ttm_mem_type_manager *man = &bdev->man[mem_type];
815         int ret;
816
817         do {
818                 ret = (*man->func->get_node)(man, bo, place, mem);
819                 if (unlikely(ret != 0))
820                         return ret;
821                 if (mem->mm_node)
822                         break;
823                 ret = ttm_mem_evict_first(bdev, mem_type, place,
824                                           interruptible, no_wait_gpu);
825                 if (unlikely(ret != 0))
826                         return ret;
827         } while (1);
828         if (mem->mm_node == NULL)
829                 return -ENOMEM;
830         mem->mem_type = mem_type;
831         return 0;
832 }
833
834 static uint32_t ttm_bo_select_caching(struct ttm_mem_type_manager *man,
835                                       uint32_t cur_placement,
836                                       uint32_t proposed_placement)
837 {
838         uint32_t caching = proposed_placement & TTM_PL_MASK_CACHING;
839         uint32_t result = proposed_placement & ~TTM_PL_MASK_CACHING;
840
841         /**
842          * Keep current caching if possible.
843          */
844
845         if ((cur_placement & caching) != 0)
846                 result |= (cur_placement & caching);
847         else if ((man->default_caching & caching) != 0)
848                 result |= man->default_caching;
849         else if ((TTM_PL_FLAG_CACHED & caching) != 0)
850                 result |= TTM_PL_FLAG_CACHED;
851         else if ((TTM_PL_FLAG_WC & caching) != 0)
852                 result |= TTM_PL_FLAG_WC;
853         else if ((TTM_PL_FLAG_UNCACHED & caching) != 0)
854                 result |= TTM_PL_FLAG_UNCACHED;
855
856         return result;
857 }
858
859 static bool ttm_bo_mt_compatible(struct ttm_mem_type_manager *man,
860                                  uint32_t mem_type,
861                                  const struct ttm_place *place,
862                                  uint32_t *masked_placement)
863 {
864         uint32_t cur_flags = ttm_bo_type_flags(mem_type);
865
866         if ((cur_flags & place->flags & TTM_PL_MASK_MEM) == 0)
867                 return false;
868
869         if ((place->flags & man->available_caching) == 0)
870                 return false;
871
872         cur_flags |= (place->flags & man->available_caching);
873
874         *masked_placement = cur_flags;
875         return true;
876 }
877
878 /**
879  * Creates space for memory region @mem according to its type.
880  *
881  * This function first searches for free space in compatible memory types in
882  * the priority order defined by the driver.  If free space isn't found, then
883  * ttm_bo_mem_force_space is attempted in priority order to evict and find
884  * space.
885  */
886 int ttm_bo_mem_space(struct ttm_buffer_object *bo,
887                         struct ttm_placement *placement,
888                         struct ttm_mem_reg *mem,
889                         bool interruptible,
890                         bool no_wait_gpu)
891 {
892         struct ttm_bo_device *bdev = bo->bdev;
893         struct ttm_mem_type_manager *man;
894         uint32_t mem_type = TTM_PL_SYSTEM;
895         uint32_t cur_flags = 0;
896         bool type_found = false;
897         bool type_ok = false;
898         bool has_erestartsys = false;
899         int i, ret;
900
901         mem->mm_node = NULL;
902         for (i = 0; i < placement->num_placement; ++i) {
903                 const struct ttm_place *place = &placement->placement[i];
904
905                 ret = ttm_mem_type_from_place(place, &mem_type);
906                 if (ret)
907                         return ret;
908                 man = &bdev->man[mem_type];
909                 if (!man->has_type || !man->use_type)
910                         continue;
911
912                 type_ok = ttm_bo_mt_compatible(man, mem_type, place,
913                                                 &cur_flags);
914
915                 if (!type_ok)
916                         continue;
917
918                 type_found = true;
919                 cur_flags = ttm_bo_select_caching(man, bo->mem.placement,
920                                                   cur_flags);
921                 /*
922                  * Use the access and other non-mapping-related flag bits from
923                  * the memory placement flags to the current flags
924                  */
925                 ttm_flag_masked(&cur_flags, place->flags,
926                                 ~TTM_PL_MASK_MEMTYPE);
927
928                 if (mem_type == TTM_PL_SYSTEM)
929                         break;
930
931                 ret = (*man->func->get_node)(man, bo, place, mem);
932                 if (unlikely(ret))
933                         return ret;
934                 
935                 if (mem->mm_node)
936                         break;
937         }
938
939         if ((type_ok && (mem_type == TTM_PL_SYSTEM)) || mem->mm_node) {
940                 mem->mem_type = mem_type;
941                 mem->placement = cur_flags;
942                 return 0;
943         }
944
945         for (i = 0; i < placement->num_busy_placement; ++i) {
946                 const struct ttm_place *place = &placement->busy_placement[i];
947
948                 ret = ttm_mem_type_from_place(place, &mem_type);
949                 if (ret)
950                         return ret;
951                 man = &bdev->man[mem_type];
952                 if (!man->has_type || !man->use_type)
953                         continue;
954                 if (!ttm_bo_mt_compatible(man, mem_type, place, &cur_flags))
955                         continue;
956
957                 type_found = true;
958                 cur_flags = ttm_bo_select_caching(man, bo->mem.placement,
959                                                   cur_flags);
960                 /*
961                  * Use the access and other non-mapping-related flag bits from
962                  * the memory placement flags to the current flags
963                  */
964                 ttm_flag_masked(&cur_flags, place->flags,
965                                 ~TTM_PL_MASK_MEMTYPE);
966
967                 if (mem_type == TTM_PL_SYSTEM) {
968                         mem->mem_type = mem_type;
969                         mem->placement = cur_flags;
970                         mem->mm_node = NULL;
971                         return 0;
972                 }
973
974                 ret = ttm_bo_mem_force_space(bo, mem_type, place, mem,
975                                                 interruptible, no_wait_gpu);
976                 if (ret == 0 && mem->mm_node) {
977                         mem->placement = cur_flags;
978                         return 0;
979                 }
980                 if (ret == -ERESTARTSYS)
981                         has_erestartsys = true;
982         }
983
984         if (!type_found) {
985                 printk(KERN_ERR TTM_PFX "No compatible memory type found.\n");
986                 return -EINVAL;
987         }
988
989         return (has_erestartsys) ? -ERESTARTSYS : -ENOMEM;
990 }
991 EXPORT_SYMBOL(ttm_bo_mem_space);
992
993 static int ttm_bo_move_buffer(struct ttm_buffer_object *bo,
994                         struct ttm_placement *placement,
995                         bool interruptible,
996                         bool no_wait_gpu)
997 {
998         int ret = 0;
999         struct ttm_mem_reg mem;
1000
1001         lockdep_assert_held(&bo->resv->lock.base);
1002
1003         /*
1004          * Don't wait for the BO on initial allocation. This is important when
1005          * the BO has an imported reservation object.
1006          */
1007         if (bo->mem.mem_type != TTM_PL_SYSTEM || bo->ttm != NULL) {
1008                 /*
1009                  * FIXME: It's possible to pipeline buffer moves.
1010                  * Have the driver move function wait for idle when necessary,
1011                  * instead of doing it here.
1012                  */
1013                 ret = ttm_bo_wait(bo, interruptible, no_wait_gpu);
1014                 if (ret)
1015                         return ret;
1016         }
1017         mem.num_pages = bo->num_pages;
1018         mem.size = mem.num_pages << PAGE_SHIFT;
1019         mem.page_alignment = bo->mem.page_alignment;
1020         mem.bus.io_reserved_vm = false;
1021         mem.bus.io_reserved_count = 0;
1022         /*
1023          * Determine where to move the buffer.
1024          */
1025         ret = ttm_bo_mem_space(bo, placement, &mem,
1026                                interruptible, no_wait_gpu);
1027         if (ret)
1028                 goto out_unlock;
1029         ret = ttm_bo_handle_move_mem(bo, &mem, false,
1030                                      interruptible, no_wait_gpu);
1031 out_unlock:
1032         if (ret && mem.mm_node)
1033                 ttm_bo_mem_put(bo, &mem);
1034         return ret;
1035 }
1036
1037 bool ttm_bo_mem_compat(struct ttm_placement *placement,
1038                        struct ttm_mem_reg *mem,
1039                        uint32_t *new_flags)
1040 {
1041         int i;
1042
1043         for (i = 0; i < placement->num_placement; i++) {
1044                 const struct ttm_place *heap = &placement->placement[i];
1045                 if (mem->mm_node &&
1046                     (mem->start < heap->fpfn ||
1047                      (heap->lpfn != 0 && (mem->start + mem->num_pages) > heap->lpfn)))
1048                         continue;
1049
1050                 *new_flags = heap->flags;
1051                 if ((*new_flags & mem->placement & TTM_PL_MASK_CACHING) &&
1052                     (*new_flags & mem->placement & TTM_PL_MASK_MEM))
1053                         return true;
1054         }
1055
1056         for (i = 0; i < placement->num_busy_placement; i++) {
1057                 const struct ttm_place *heap = &placement->busy_placement[i];
1058                 if (mem->mm_node &&
1059                     (mem->start < heap->fpfn ||
1060                      (heap->lpfn != 0 && (mem->start + mem->num_pages) > heap->lpfn)))
1061                         continue;
1062
1063                 *new_flags = heap->flags;
1064                 if ((*new_flags & mem->placement & TTM_PL_MASK_CACHING) &&
1065                     (*new_flags & mem->placement & TTM_PL_MASK_MEM))
1066                         return true;
1067         }
1068
1069         return false;
1070 }
1071 EXPORT_SYMBOL(ttm_bo_mem_compat);
1072
1073 int ttm_bo_validate(struct ttm_buffer_object *bo,
1074                         struct ttm_placement *placement,
1075                         bool interruptible,
1076                         bool no_wait_gpu)
1077 {
1078         int ret;
1079         uint32_t new_flags;
1080
1081         lockdep_assert_held(&bo->resv->lock.base);
1082         /*
1083          * Check whether we need to move buffer.
1084          */
1085         if (!ttm_bo_mem_compat(placement, &bo->mem, &new_flags)) {
1086                 ret = ttm_bo_move_buffer(bo, placement, interruptible,
1087                                          no_wait_gpu);
1088                 if (ret)
1089                         return ret;
1090         } else {
1091                 /*
1092                  * Use the access and other non-mapping-related flag bits from
1093                  * the compatible memory placement flags to the active flags
1094                  */
1095                 ttm_flag_masked(&bo->mem.placement, new_flags,
1096                                 ~TTM_PL_MASK_MEMTYPE);
1097         }
1098         /*
1099          * We might need to add a TTM.
1100          */
1101         if (bo->mem.mem_type == TTM_PL_SYSTEM && bo->ttm == NULL) {
1102                 ret = ttm_bo_add_ttm(bo, true);
1103                 if (ret)
1104                         return ret;
1105         }
1106         return 0;
1107 }
1108 EXPORT_SYMBOL(ttm_bo_validate);
1109
1110 int ttm_bo_init(struct ttm_bo_device *bdev,
1111                 struct ttm_buffer_object *bo,
1112                 unsigned long size,
1113                 enum ttm_bo_type type,
1114                 struct ttm_placement *placement,
1115                 uint32_t page_alignment,
1116                 bool interruptible,
1117                 struct file *persistent_swap_storage,
1118                 size_t acc_size,
1119                 struct sg_table *sg,
1120                 struct reservation_object *resv,
1121                 void (*destroy) (struct ttm_buffer_object *))
1122 {
1123         int ret = 0;
1124         unsigned long num_pages;
1125         struct ttm_mem_global *mem_glob = bdev->glob->mem_glob;
1126         bool locked;
1127
1128         ret = ttm_mem_global_alloc(mem_glob, acc_size, false, false);
1129         if (ret) {
1130                 pr_err("Out of kernel memory\n");
1131                 if (destroy)
1132                         (*destroy)(bo);
1133                 else
1134                         kfree(bo);
1135                 return -ENOMEM;
1136         }
1137
1138         num_pages = (size + PAGE_SIZE - 1) >> PAGE_SHIFT;
1139         if (num_pages == 0) {
1140                 pr_err("Illegal buffer object size\n");
1141                 if (destroy)
1142                         (*destroy)(bo);
1143                 else
1144                         kfree(bo);
1145                 ttm_mem_global_free(mem_glob, acc_size);
1146                 return -EINVAL;
1147         }
1148         bo->destroy = destroy;
1149
1150         kref_init(&bo->kref);
1151         kref_init(&bo->list_kref);
1152         atomic_set(&bo->cpu_writers, 0);
1153         INIT_LIST_HEAD(&bo->lru);
1154         INIT_LIST_HEAD(&bo->ddestroy);
1155         INIT_LIST_HEAD(&bo->swap);
1156         INIT_LIST_HEAD(&bo->io_reserve_lru);
1157         mutex_init(&bo->wu_mutex);
1158         bo->bdev = bdev;
1159         bo->glob = bdev->glob;
1160         bo->type = type;
1161         bo->num_pages = num_pages;
1162         bo->mem.size = num_pages << PAGE_SHIFT;
1163         bo->mem.mem_type = TTM_PL_SYSTEM;
1164         bo->mem.num_pages = bo->num_pages;
1165         bo->mem.mm_node = NULL;
1166         bo->mem.page_alignment = page_alignment;
1167         bo->mem.bus.io_reserved_vm = false;
1168         bo->mem.bus.io_reserved_count = 0;
1169         bo->priv_flags = 0;
1170         bo->mem.placement = (TTM_PL_FLAG_SYSTEM | TTM_PL_FLAG_CACHED);
1171         bo->persistent_swap_storage = persistent_swap_storage;
1172         bo->acc_size = acc_size;
1173         bo->sg = sg;
1174         if (resv) {
1175                 bo->resv = resv;
1176                 lockdep_assert_held(&bo->resv->lock.base);
1177         } else {
1178                 bo->resv = &bo->ttm_resv;
1179                 reservation_object_init(&bo->ttm_resv);
1180         }
1181         atomic_inc(&bo->glob->bo_count);
1182         drm_vma_node_reset(&bo->vma_node);
1183
1184         /*
1185          * For ttm_bo_type_device buffers, allocate
1186          * address space from the device.
1187          */
1188         if (bo->type == ttm_bo_type_device ||
1189             bo->type == ttm_bo_type_sg)
1190                 ret = drm_vma_offset_add(&bdev->vma_manager, &bo->vma_node,
1191                                          bo->mem.num_pages);
1192
1193         /* passed reservation objects should already be locked,
1194          * since otherwise lockdep will be angered in radeon.
1195          */
1196         if (!resv) {
1197                 locked = ww_mutex_trylock(&bo->resv->lock);
1198                 WARN_ON(!locked);
1199         }
1200
1201         if (likely(!ret))
1202                 ret = ttm_bo_validate(bo, placement, interruptible, false);
1203
1204         if (!resv) {
1205                 ttm_bo_unreserve(bo);
1206
1207         } else if (!(bo->mem.placement & TTM_PL_FLAG_NO_EVICT)) {
1208                 spin_lock(&bo->glob->lru_lock);
1209                 ttm_bo_add_to_lru(bo);
1210                 spin_unlock(&bo->glob->lru_lock);
1211         }
1212
1213         if (unlikely(ret))
1214                 ttm_bo_unref(&bo);
1215
1216         return ret;
1217 }
1218 EXPORT_SYMBOL(ttm_bo_init);
1219
1220 size_t ttm_bo_acc_size(struct ttm_bo_device *bdev,
1221                        unsigned long bo_size,
1222                        unsigned struct_size)
1223 {
1224         unsigned npages = (PAGE_ALIGN(bo_size)) >> PAGE_SHIFT;
1225         size_t size = 0;
1226
1227         size += ttm_round_pot(struct_size);
1228         size += ttm_round_pot(npages * sizeof(void *));
1229         size += ttm_round_pot(sizeof(struct ttm_tt));
1230         return size;
1231 }
1232 EXPORT_SYMBOL(ttm_bo_acc_size);
1233
1234 size_t ttm_bo_dma_acc_size(struct ttm_bo_device *bdev,
1235                            unsigned long bo_size,
1236                            unsigned struct_size)
1237 {
1238         unsigned npages = (PAGE_ALIGN(bo_size)) >> PAGE_SHIFT;
1239         size_t size = 0;
1240
1241         size += ttm_round_pot(struct_size);
1242         size += ttm_round_pot(npages * (2*sizeof(void *) + sizeof(dma_addr_t)));
1243         size += ttm_round_pot(sizeof(struct ttm_dma_tt));
1244         return size;
1245 }
1246 EXPORT_SYMBOL(ttm_bo_dma_acc_size);
1247
1248 int ttm_bo_create(struct ttm_bo_device *bdev,
1249                         unsigned long size,
1250                         enum ttm_bo_type type,
1251                         struct ttm_placement *placement,
1252                         uint32_t page_alignment,
1253                         bool interruptible,
1254                         struct file *persistent_swap_storage,
1255                         struct ttm_buffer_object **p_bo)
1256 {
1257         struct ttm_buffer_object *bo;
1258         size_t acc_size;
1259         int ret;
1260
1261         bo = kzalloc(sizeof(*bo), GFP_KERNEL);
1262         if (unlikely(bo == NULL))
1263                 return -ENOMEM;
1264
1265         acc_size = ttm_bo_acc_size(bdev, size, sizeof(struct ttm_buffer_object));
1266         ret = ttm_bo_init(bdev, bo, size, type, placement, page_alignment,
1267                           interruptible, persistent_swap_storage, acc_size,
1268                           NULL, NULL, NULL);
1269         if (likely(ret == 0))
1270                 *p_bo = bo;
1271
1272         return ret;
1273 }
1274 EXPORT_SYMBOL(ttm_bo_create);
1275
1276 static int ttm_bo_force_list_clean(struct ttm_bo_device *bdev,
1277                                         unsigned mem_type, bool allow_errors)
1278 {
1279         struct ttm_mem_type_manager *man = &bdev->man[mem_type];
1280         struct ttm_bo_global *glob = bdev->glob;
1281         int ret;
1282
1283         /*
1284          * Can't use standard list traversal since we're unlocking.
1285          */
1286
1287         spin_lock(&glob->lru_lock);
1288         while (!list_empty(&man->lru)) {
1289                 spin_unlock(&glob->lru_lock);
1290                 ret = ttm_mem_evict_first(bdev, mem_type, NULL, false, false);
1291                 if (ret) {
1292                         if (allow_errors) {
1293                                 return ret;
1294                         } else {
1295                                 pr_err("Cleanup eviction failed\n");
1296                         }
1297                 }
1298                 spin_lock(&glob->lru_lock);
1299         }
1300         spin_unlock(&glob->lru_lock);
1301         return 0;
1302 }
1303
1304 int ttm_bo_clean_mm(struct ttm_bo_device *bdev, unsigned mem_type)
1305 {
1306         struct ttm_mem_type_manager *man;
1307         int ret = -EINVAL;
1308
1309         if (mem_type >= TTM_NUM_MEM_TYPES) {
1310                 pr_err("Illegal memory type %d\n", mem_type);
1311                 return ret;
1312         }
1313         man = &bdev->man[mem_type];
1314
1315         if (!man->has_type) {
1316                 pr_err("Trying to take down uninitialized memory manager type %u\n",
1317                        mem_type);
1318                 return ret;
1319         }
1320
1321         man->use_type = false;
1322         man->has_type = false;
1323
1324         ret = 0;
1325         if (mem_type > 0) {
1326                 ttm_bo_force_list_clean(bdev, mem_type, false);
1327
1328                 ret = (*man->func->takedown)(man);
1329         }
1330
1331         return ret;
1332 }
1333 EXPORT_SYMBOL(ttm_bo_clean_mm);
1334
1335 int ttm_bo_evict_mm(struct ttm_bo_device *bdev, unsigned mem_type)
1336 {
1337         struct ttm_mem_type_manager *man = &bdev->man[mem_type];
1338
1339         if (mem_type == 0 || mem_type >= TTM_NUM_MEM_TYPES) {
1340                 pr_err("Illegal memory manager memory type %u\n", mem_type);
1341                 return -EINVAL;
1342         }
1343
1344         if (!man->has_type) {
1345                 pr_err("Memory type %u has not been initialized\n", mem_type);
1346                 return 0;
1347         }
1348
1349         return ttm_bo_force_list_clean(bdev, mem_type, true);
1350 }
1351 EXPORT_SYMBOL(ttm_bo_evict_mm);
1352
1353 int ttm_bo_init_mm(struct ttm_bo_device *bdev, unsigned type,
1354                         unsigned long p_size)
1355 {
1356         int ret = -EINVAL;
1357         struct ttm_mem_type_manager *man;
1358
1359         BUG_ON(type >= TTM_NUM_MEM_TYPES);
1360         man = &bdev->man[type];
1361         BUG_ON(man->has_type);
1362         man->io_reserve_fastpath = true;
1363         man->use_io_reserve_lru = false;
1364         mutex_init(&man->io_reserve_mutex);
1365         INIT_LIST_HEAD(&man->io_reserve_lru);
1366
1367         ret = bdev->driver->init_mem_type(bdev, type, man);
1368         if (ret)
1369                 return ret;
1370         man->bdev = bdev;
1371
1372         ret = 0;
1373         if (type != TTM_PL_SYSTEM) {
1374                 ret = (*man->func->init)(man, p_size);
1375                 if (ret)
1376                         return ret;
1377         }
1378         man->has_type = true;
1379         man->use_type = true;
1380         man->size = p_size;
1381
1382         INIT_LIST_HEAD(&man->lru);
1383
1384         return 0;
1385 }
1386 EXPORT_SYMBOL(ttm_bo_init_mm);
1387
1388 static void ttm_bo_global_kobj_release(struct kobject *kobj)
1389 {
1390         struct ttm_bo_global *glob =
1391                 container_of(kobj, struct ttm_bo_global, kobj);
1392
1393         ttm_mem_unregister_shrink(glob->mem_glob, &glob->shrink);
1394         __free_page(glob->dummy_read_page);
1395         kfree(glob);
1396 }
1397
1398 void ttm_bo_global_release(struct drm_global_reference *ref)
1399 {
1400         struct ttm_bo_global *glob = ref->object;
1401
1402         kobject_del(&glob->kobj);
1403         kobject_put(&glob->kobj);
1404 }
1405 EXPORT_SYMBOL(ttm_bo_global_release);
1406
1407 int ttm_bo_global_init(struct drm_global_reference *ref)
1408 {
1409         struct ttm_bo_global_ref *bo_ref =
1410                 container_of(ref, struct ttm_bo_global_ref, ref);
1411         struct ttm_bo_global *glob = ref->object;
1412         int ret;
1413
1414         mutex_init(&glob->device_list_mutex);
1415         spin_lock_init(&glob->lru_lock);
1416         glob->mem_glob = bo_ref->mem_glob;
1417         glob->dummy_read_page = alloc_page(__GFP_ZERO | GFP_DMA32);
1418
1419         if (unlikely(glob->dummy_read_page == NULL)) {
1420                 ret = -ENOMEM;
1421                 goto out_no_drp;
1422         }
1423
1424         INIT_LIST_HEAD(&glob->swap_lru);
1425         INIT_LIST_HEAD(&glob->device_list);
1426
1427         ttm_mem_init_shrink(&glob->shrink, ttm_bo_swapout);
1428         ret = ttm_mem_register_shrink(glob->mem_glob, &glob->shrink);
1429         if (unlikely(ret != 0)) {
1430                 pr_err("Could not register buffer object swapout\n");
1431                 goto out_no_shrink;
1432         }
1433
1434         atomic_set(&glob->bo_count, 0);
1435
1436         ret = kobject_init_and_add(
1437                 &glob->kobj, &ttm_bo_glob_kobj_type, ttm_get_kobj(), "buffer_objects");
1438         if (unlikely(ret != 0))
1439                 kobject_put(&glob->kobj);
1440         return ret;
1441 out_no_shrink:
1442         __free_page(glob->dummy_read_page);
1443 out_no_drp:
1444         kfree(glob);
1445         return ret;
1446 }
1447 EXPORT_SYMBOL(ttm_bo_global_init);
1448
1449
1450 int ttm_bo_device_release(struct ttm_bo_device *bdev)
1451 {
1452         int ret = 0;
1453         unsigned i = TTM_NUM_MEM_TYPES;
1454         struct ttm_mem_type_manager *man;
1455         struct ttm_bo_global *glob = bdev->glob;
1456
1457         while (i--) {
1458                 man = &bdev->man[i];
1459                 if (man->has_type) {
1460                         man->use_type = false;
1461                         if ((i != TTM_PL_SYSTEM) && ttm_bo_clean_mm(bdev, i)) {
1462                                 ret = -EBUSY;
1463                                 pr_err("DRM memory manager type %d is not clean\n",
1464                                        i);
1465                         }
1466                         man->has_type = false;
1467                 }
1468         }
1469
1470         mutex_lock(&glob->device_list_mutex);
1471         list_del(&bdev->device_list);
1472         mutex_unlock(&glob->device_list_mutex);
1473
1474         cancel_delayed_work_sync(&bdev->wq);
1475
1476         while (ttm_bo_delayed_delete(bdev, true))
1477                 ;
1478
1479         spin_lock(&glob->lru_lock);
1480         if (list_empty(&bdev->ddestroy))
1481                 TTM_DEBUG("Delayed destroy list was clean\n");
1482
1483         if (list_empty(&bdev->man[0].lru))
1484                 TTM_DEBUG("Swap list was clean\n");
1485         spin_unlock(&glob->lru_lock);
1486
1487         drm_vma_offset_manager_destroy(&bdev->vma_manager);
1488
1489         return ret;
1490 }
1491 EXPORT_SYMBOL(ttm_bo_device_release);
1492
1493 int ttm_bo_device_init(struct ttm_bo_device *bdev,
1494                        struct ttm_bo_global *glob,
1495                        struct ttm_bo_driver *driver,
1496                        struct address_space *mapping,
1497                        uint64_t file_page_offset,
1498                        bool need_dma32)
1499 {
1500         int ret = -EINVAL;
1501
1502         bdev->driver = driver;
1503
1504         memset(bdev->man, 0, sizeof(bdev->man));
1505
1506         /*
1507          * Initialize the system memory buffer type.
1508          * Other types need to be driver / IOCTL initialized.
1509          */
1510         ret = ttm_bo_init_mm(bdev, TTM_PL_SYSTEM, 0);
1511         if (unlikely(ret != 0))
1512                 goto out_no_sys;
1513
1514         drm_vma_offset_manager_init(&bdev->vma_manager, file_page_offset,
1515                                     0x10000000);
1516         INIT_DELAYED_WORK(&bdev->wq, ttm_bo_delayed_workqueue);
1517         INIT_LIST_HEAD(&bdev->ddestroy);
1518         bdev->dev_mapping = mapping;
1519         bdev->glob = glob;
1520         bdev->need_dma32 = need_dma32;
1521         mutex_lock(&glob->device_list_mutex);
1522         list_add_tail(&bdev->device_list, &glob->device_list);
1523         mutex_unlock(&glob->device_list_mutex);
1524
1525         return 0;
1526 out_no_sys:
1527         return ret;
1528 }
1529 EXPORT_SYMBOL(ttm_bo_device_init);
1530
1531 /*
1532  * buffer object vm functions.
1533  */
1534
1535 bool ttm_mem_reg_is_pci(struct ttm_bo_device *bdev, struct ttm_mem_reg *mem)
1536 {
1537         struct ttm_mem_type_manager *man = &bdev->man[mem->mem_type];
1538
1539         if (!(man->flags & TTM_MEMTYPE_FLAG_FIXED)) {
1540                 if (mem->mem_type == TTM_PL_SYSTEM)
1541                         return false;
1542
1543                 if (man->flags & TTM_MEMTYPE_FLAG_CMA)
1544                         return false;
1545
1546                 if (mem->placement & TTM_PL_FLAG_CACHED)
1547                         return false;
1548         }
1549         return true;
1550 }
1551
1552 void ttm_bo_unmap_virtual_locked(struct ttm_buffer_object *bo)
1553 {
1554         struct ttm_bo_device *bdev = bo->bdev;
1555
1556         drm_vma_node_unmap(&bo->vma_node, bdev->dev_mapping);
1557         ttm_mem_io_free_vm(bo);
1558 }
1559
1560 void ttm_bo_unmap_virtual(struct ttm_buffer_object *bo)
1561 {
1562         struct ttm_bo_device *bdev = bo->bdev;
1563         struct ttm_mem_type_manager *man = &bdev->man[bo->mem.mem_type];
1564
1565         ttm_mem_io_lock(man, false);
1566         ttm_bo_unmap_virtual_locked(bo);
1567         ttm_mem_io_unlock(man);
1568 }
1569
1570
1571 EXPORT_SYMBOL(ttm_bo_unmap_virtual);
1572
1573 int ttm_bo_wait(struct ttm_buffer_object *bo,
1574                 bool interruptible, bool no_wait)
1575 {
1576         struct reservation_object_list *fobj;
1577         struct reservation_object *resv;
1578         struct fence *excl;
1579         long timeout = 15 * HZ;
1580         int i;
1581
1582         resv = bo->resv;
1583         fobj = reservation_object_get_list(resv);
1584         excl = reservation_object_get_excl(resv);
1585         if (excl) {
1586                 if (!fence_is_signaled(excl)) {
1587                         if (no_wait)
1588                                 return -EBUSY;
1589
1590                         timeout = fence_wait_timeout(excl,
1591                                                      interruptible, timeout);
1592                 }
1593         }
1594
1595         for (i = 0; fobj && timeout > 0 && i < fobj->shared_count; ++i) {
1596                 struct fence *fence;
1597                 fence = rcu_dereference_protected(fobj->shared[i],
1598                                                 reservation_object_held(resv));
1599
1600                 if (!fence_is_signaled(fence)) {
1601                         if (no_wait)
1602                                 return -EBUSY;
1603
1604                         timeout = fence_wait_timeout(fence,
1605                                                      interruptible, timeout);
1606                 }
1607         }
1608
1609         if (timeout < 0)
1610                 return timeout;
1611
1612         if (timeout == 0)
1613                 return -EBUSY;
1614
1615         reservation_object_add_excl_fence(resv, NULL);
1616         clear_bit(TTM_BO_PRIV_FLAG_MOVING, &bo->priv_flags);
1617         return 0;
1618 }
1619 EXPORT_SYMBOL(ttm_bo_wait);
1620
1621 int ttm_bo_synccpu_write_grab(struct ttm_buffer_object *bo, bool no_wait)
1622 {
1623         int ret = 0;
1624
1625         /*
1626          * Using ttm_bo_reserve makes sure the lru lists are updated.
1627          */
1628
1629         ret = ttm_bo_reserve(bo, true, no_wait, NULL);
1630         if (unlikely(ret != 0))
1631                 return ret;
1632         ret = ttm_bo_wait(bo, true, no_wait);
1633         if (likely(ret == 0))
1634                 atomic_inc(&bo->cpu_writers);
1635         ttm_bo_unreserve(bo);
1636         return ret;
1637 }
1638 EXPORT_SYMBOL(ttm_bo_synccpu_write_grab);
1639
1640 void ttm_bo_synccpu_write_release(struct ttm_buffer_object *bo)
1641 {
1642         atomic_dec(&bo->cpu_writers);
1643 }
1644 EXPORT_SYMBOL(ttm_bo_synccpu_write_release);
1645
1646 /**
1647  * A buffer object shrink method that tries to swap out the first
1648  * buffer object on the bo_global::swap_lru list.
1649  */
1650
1651 static int ttm_bo_swapout(struct ttm_mem_shrink *shrink)
1652 {
1653         struct ttm_bo_global *glob =
1654             container_of(shrink, struct ttm_bo_global, shrink);
1655         struct ttm_buffer_object *bo;
1656         int ret = -EBUSY;
1657         int put_count;
1658         uint32_t swap_placement = (TTM_PL_FLAG_CACHED | TTM_PL_FLAG_SYSTEM);
1659
1660         spin_lock(&glob->lru_lock);
1661         list_for_each_entry(bo, &glob->swap_lru, swap) {
1662                 ret = __ttm_bo_reserve(bo, false, true, NULL);
1663                 if (!ret)
1664                         break;
1665         }
1666
1667         if (ret) {
1668                 spin_unlock(&glob->lru_lock);
1669                 return ret;
1670         }
1671
1672         kref_get(&bo->list_kref);
1673
1674         if (!list_empty(&bo->ddestroy)) {
1675                 ret = ttm_bo_cleanup_refs_and_unlock(bo, false, false);
1676                 kref_put(&bo->list_kref, ttm_bo_release_list);
1677                 return ret;
1678         }
1679
1680         put_count = ttm_bo_del_from_lru(bo);
1681         spin_unlock(&glob->lru_lock);
1682
1683         ttm_bo_list_ref_sub(bo, put_count, true);
1684
1685         /**
1686          * Wait for GPU, then move to system cached.
1687          */
1688
1689         ret = ttm_bo_wait(bo, false, false);
1690
1691         if (unlikely(ret != 0))
1692                 goto out;
1693
1694         if ((bo->mem.placement & swap_placement) != swap_placement) {
1695                 struct ttm_mem_reg evict_mem;
1696
1697                 evict_mem = bo->mem;
1698                 evict_mem.mm_node = NULL;
1699                 evict_mem.placement = TTM_PL_FLAG_SYSTEM | TTM_PL_FLAG_CACHED;
1700                 evict_mem.mem_type = TTM_PL_SYSTEM;
1701
1702                 ret = ttm_bo_handle_move_mem(bo, &evict_mem, true,
1703                                              false, false);
1704                 if (unlikely(ret != 0))
1705                         goto out;
1706         }
1707
1708         ttm_bo_unmap_virtual(bo);
1709
1710         /**
1711          * Swap out. Buffer will be swapped in again as soon as
1712          * anyone tries to access a ttm page.
1713          */
1714
1715         if (bo->bdev->driver->swap_notify)
1716                 bo->bdev->driver->swap_notify(bo);
1717
1718         ret = ttm_tt_swapout(bo->ttm, bo->persistent_swap_storage);
1719 out:
1720
1721         /**
1722          *
1723          * Unreserve without putting on LRU to avoid swapping out an
1724          * already swapped buffer.
1725          */
1726
1727         __ttm_bo_unreserve(bo);
1728         kref_put(&bo->list_kref, ttm_bo_release_list);
1729         return ret;
1730 }
1731
1732 void ttm_bo_swapout_all(struct ttm_bo_device *bdev)
1733 {
1734         while (ttm_bo_swapout(&bdev->glob->shrink) == 0)
1735                 ;
1736 }
1737 EXPORT_SYMBOL(ttm_bo_swapout_all);
1738
1739 /**
1740  * ttm_bo_wait_unreserved - interruptible wait for a buffer object to become
1741  * unreserved
1742  *
1743  * @bo: Pointer to buffer
1744  */
1745 int ttm_bo_wait_unreserved(struct ttm_buffer_object *bo)
1746 {
1747         int ret;
1748
1749         /*
1750          * In the absense of a wait_unlocked API,
1751          * Use the bo::wu_mutex to avoid triggering livelocks due to
1752          * concurrent use of this function. Note that this use of
1753          * bo::wu_mutex can go away if we change locking order to
1754          * mmap_sem -> bo::reserve.
1755          */
1756         ret = mutex_lock_interruptible(&bo->wu_mutex);
1757         if (unlikely(ret != 0))
1758                 return -ERESTARTSYS;
1759         if (!ww_mutex_is_locked(&bo->resv->lock))
1760                 goto out_unlock;
1761         ret = __ttm_bo_reserve(bo, true, false, NULL);
1762         if (unlikely(ret != 0))
1763                 goto out_unlock;
1764         __ttm_bo_unreserve(bo);
1765
1766 out_unlock:
1767         mutex_unlock(&bo->wu_mutex);
1768         return ret;
1769 }