/*	$NetBSD: amdgpu_object.c,v 1.2 2018/08/27 04:58:19 riastradh Exp $	*/

/*
 * Copyright 2009 Jerome Glisse.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 */
/*
 * Authors:
 *    Jerome Glisse <glisse@freedesktop.org>
 *    Thomas Hellstrom <thomas-at-tungstengraphics-dot-com>
 *    Dave Airlie
 */
#include <sys/cdefs.h>
__KERNEL_RCSID(0, "$NetBSD: amdgpu_object.c,v 1.2 2018/08/27 04:58:19 riastradh Exp $");

#include <linux/list.h>
#include <linux/slab.h>
#include <drm/drmP.h>
#include <drm/amdgpu_drm.h>
#include <drm/drm_cache.h>
#include "amdgpu.h"
#include "amdgpu_trace.h"

int amdgpu_ttm_init(struct amdgpu_device *adev);
void amdgpu_ttm_fini(struct amdgpu_device *adev);

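/*
 * Return how many bytes of @mem fall within CPU-visible VRAM, i.e. the
 * part of the region below adev->mc.visible_vram_size; 0 if the region
 * starts entirely beyond the visible window.
 */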
static u64 amdgpu_get_vis_part_size(struct amdgpu_device *adev,
						struct ttm_mem_reg *mem)
{
	u64 ret = 0;
	if (mem->start << PAGE_SHIFT < adev->mc.visible_vram_size) {
		ret = (u64)((mem->start << PAGE_SHIFT) + mem->size) >
			   adev->mc.visible_vram_size ?
			   adev->mc.visible_vram_size - (mem->start << PAGE_SHIFT) :
			   mem->size;
	}
	return ret;
}

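/*
 * Adjust the device-wide GTT/VRAM usage counters when a buffer moves:
 * charge @new_mem and credit @old_mem (either may be NULL).
 */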
static void amdgpu_update_memory_usage(struct amdgpu_device *adev,
		       struct ttm_mem_reg *old_mem,
		       struct ttm_mem_reg *new_mem)
{
	u64 vis_size;
	if (!adev)
		return;

	if (new_mem) {
		switch (new_mem->mem_type) {
		case TTM_PL_TT:
			atomic64_add(new_mem->size, &adev->gtt_usage);
			break;
		case TTM_PL_VRAM:
			atomic64_add(new_mem->size, &adev->vram_usage);
			vis_size = amdgpu_get_vis_part_size(adev, new_mem);
			atomic64_add(vis_size, &adev->vram_vis_usage);
			break;
		}
	}

	if (old_mem) {
		switch (old_mem->mem_type) {
		case TTM_PL_TT:
			atomic64_sub(old_mem->size, &adev->gtt_usage);
			break;
		case TTM_PL_VRAM:
			atomic64_sub(old_mem->size, &adev->vram_usage);
			vis_size = amdgpu_get_vis_part_size(adev, old_mem);
			atomic64_sub(vis_size, &adev->vram_vis_usage);
			break;
		}
	}
}

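/*
 * TTM destroy callback: drop the BO from the device's GEM object list
 * and release the GEM object, the parent reference, and the metadata.
 */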
static void amdgpu_ttm_bo_destroy(struct ttm_buffer_object *tbo)
{
	struct amdgpu_bo *bo;

	bo = container_of(tbo, struct amdgpu_bo, tbo);

	amdgpu_update_memory_usage(bo->adev, &bo->tbo.mem, NULL);

	mutex_lock(&bo->adev->gem.mutex);
	list_del_init(&bo->list);
	mutex_unlock(&bo->adev->gem.mutex);
	drm_gem_object_release(&bo->gem_base);
	amdgpu_bo_unref(&bo->parent);
	kfree(bo->metadata);
	kfree(bo);
}

bool amdgpu_ttm_bo_is_amdgpu_bo(struct ttm_buffer_object *bo)
{
	return bo->destroy == &amdgpu_ttm_bo_destroy;
}

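/*
 * Translate an AMDGPU_GEM_DOMAIN_* mask and AMDGPU_GEM_CREATE_* flags
 * into a TTM placement list.  VRAM placements may be pushed beyond the
 * CPU-visible window (NO_CPU_ACCESS) or limited to it
 * (CPU_ACCESS_REQUIRED); with no domain bit set, fall back to cached
 * system memory.
 */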
static void amdgpu_ttm_placement_init(struct amdgpu_device *adev,
				      struct ttm_placement *placement,
				      struct ttm_place *placements,
				      u32 domain, u64 flags)
{
	u32 c = 0, i;

	placement->placement = placements;
	placement->busy_placement = placements;

	if (domain & AMDGPU_GEM_DOMAIN_VRAM) {
		if (flags & AMDGPU_GEM_CREATE_NO_CPU_ACCESS &&
			adev->mc.visible_vram_size < adev->mc.real_vram_size) {
			placements[c].fpfn =
				adev->mc.visible_vram_size >> PAGE_SHIFT;
			placements[c++].flags = TTM_PL_FLAG_WC | TTM_PL_FLAG_UNCACHED |
				TTM_PL_FLAG_VRAM | TTM_PL_FLAG_TOPDOWN;
		}
		placements[c].fpfn = 0;
		placements[c++].flags = TTM_PL_FLAG_WC | TTM_PL_FLAG_UNCACHED |
			TTM_PL_FLAG_VRAM;
		if (!(flags & AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED))
			placements[c - 1].flags |= TTM_PL_FLAG_TOPDOWN;
	}

	if (domain & AMDGPU_GEM_DOMAIN_GTT) {
		if (flags & AMDGPU_GEM_CREATE_CPU_GTT_USWC) {
			placements[c].fpfn = 0;
			placements[c++].flags = TTM_PL_FLAG_WC | TTM_PL_FLAG_TT |
				TTM_PL_FLAG_UNCACHED;
		} else {
			placements[c].fpfn = 0;
			placements[c++].flags = TTM_PL_FLAG_CACHED | TTM_PL_FLAG_TT;
		}
	}

	if (domain & AMDGPU_GEM_DOMAIN_CPU) {
		if (flags & AMDGPU_GEM_CREATE_CPU_GTT_USWC) {
			placements[c].fpfn = 0;
			placements[c++].flags = TTM_PL_FLAG_WC | TTM_PL_FLAG_SYSTEM |
				TTM_PL_FLAG_UNCACHED;
		} else {
			placements[c].fpfn = 0;
			placements[c++].flags = TTM_PL_FLAG_CACHED | TTM_PL_FLAG_SYSTEM;
		}
	}

	if (domain & AMDGPU_GEM_DOMAIN_GDS) {
		placements[c].fpfn = 0;
		placements[c++].flags = TTM_PL_FLAG_UNCACHED |
			AMDGPU_PL_FLAG_GDS;
	}
	if (domain & AMDGPU_GEM_DOMAIN_GWS) {
		placements[c].fpfn = 0;
		placements[c++].flags = TTM_PL_FLAG_UNCACHED |
			AMDGPU_PL_FLAG_GWS;
	}
	if (domain & AMDGPU_GEM_DOMAIN_OA) {
		placements[c].fpfn = 0;
		placements[c++].flags = TTM_PL_FLAG_UNCACHED |
			AMDGPU_PL_FLAG_OA;
	}

	if (!c) {
		placements[c].fpfn = 0;
		placements[c++].flags = TTM_PL_MASK_CACHING |
			TTM_PL_FLAG_SYSTEM;
	}
	placement->num_placement = c;
	placement->num_busy_placement = c;

	for (i = 0; i < c; i++) {
		if ((flags & AMDGPU_GEM_CREATE_CPU_ACCESS_REQUIRED) &&
			(placements[i].flags & TTM_PL_FLAG_VRAM) &&
			!placements[i].fpfn)
			placements[i].lpfn =
				adev->mc.visible_vram_size >> PAGE_SHIFT;
		else
			placements[i].lpfn = 0;
	}
}

void amdgpu_ttm_placement_from_domain(struct amdgpu_bo *rbo, u32 domain)
{
	amdgpu_ttm_placement_init(rbo->adev, &rbo->placement,
				  rbo->placements, domain, rbo->flags);
}

static void amdgpu_fill_placement_to_bo(struct amdgpu_bo *bo,
					struct ttm_placement *placement)
{
	BUG_ON(placement->num_placement > (AMDGPU_GEM_DOMAIN_MAX + 1));

	memcpy(bo->placements, placement->placement,
	       placement->num_placement * sizeof(struct ttm_place));
	bo->placement.num_placement = placement->num_placement;
	bo->placement.num_busy_placement = placement->num_busy_placement;
	bo->placement.placement = bo->placements;
	bo->placement.busy_placement = bo->placements;
}

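/**
 * amdgpu_bo_create_restricted - create a BO with a caller-built placement
 *
 * @adev: amdgpu device
 * @size: size in bytes, rounded up to page size
 * @byte_align: alignment in bytes
 * @kernel: true for a kernel allocation (uninterruptible validation)
 * @domain: allowed AMDGPU_GEM_DOMAIN_* mask, recorded as initial domain
 * @flags: AMDGPU_GEM_CREATE_* flags
 * @sg: optional scatter/gather table to back the BO
 * @placement: TTM placement prepared by the caller
 * @resv: optional reservation object to share
 * @bo_ptr: where the new BO is stored on success
 *
 * Returns 0 on success or a negative error code.
 */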
int amdgpu_bo_create_restricted(struct amdgpu_device *adev,
				unsigned long size, int byte_align,
				bool kernel, u32 domain, u64 flags,
				struct sg_table *sg,
				struct ttm_placement *placement,
				struct reservation_object *resv,
				struct amdgpu_bo **bo_ptr)
{
	struct amdgpu_bo *bo;
	enum ttm_bo_type type;
	unsigned long page_align;
	size_t acc_size;
	int r;

	page_align = roundup(byte_align, PAGE_SIZE) >> PAGE_SHIFT;
	size = ALIGN(size, PAGE_SIZE);

	if (kernel) {
		type = ttm_bo_type_kernel;
	} else if (sg) {
		type = ttm_bo_type_sg;
	} else {
		type = ttm_bo_type_device;
	}
	*bo_ptr = NULL;

	acc_size = ttm_bo_dma_acc_size(&adev->mman.bdev, size,
				       sizeof(struct amdgpu_bo));

	bo = kzalloc(sizeof(struct amdgpu_bo), GFP_KERNEL);
	if (bo == NULL)
		return -ENOMEM;
	r = drm_gem_object_init(adev->ddev, &bo->gem_base, size);
	if (unlikely(r)) {
		kfree(bo);
		return r;
	}
	bo->adev = adev;
	INIT_LIST_HEAD(&bo->list);
	INIT_LIST_HEAD(&bo->va);
	bo->initial_domain = domain & (AMDGPU_GEM_DOMAIN_VRAM |
				       AMDGPU_GEM_DOMAIN_GTT |
				       AMDGPU_GEM_DOMAIN_CPU |
				       AMDGPU_GEM_DOMAIN_GDS |
				       AMDGPU_GEM_DOMAIN_GWS |
				       AMDGPU_GEM_DOMAIN_OA);

	bo->flags = flags;

	/* For architectures that don't support WC memory,
	 * mask out the WC flag from the BO
	 */
	if (!drm_arch_can_wc_memory())
		bo->flags &= ~AMDGPU_GEM_CREATE_CPU_GTT_USWC;

	amdgpu_fill_placement_to_bo(bo, placement);
	/* Kernel allocations are uninterruptible */
	r = ttm_bo_init(&adev->mman.bdev, &bo->tbo, size, type,
			&bo->placement, page_align, !kernel, NULL,
			acc_size, sg, resv, &amdgpu_ttm_bo_destroy);
	if (unlikely(r != 0)) {
		return r;
	}
	*bo_ptr = bo;

	trace_amdgpu_bo_create(bo);

	return 0;
}

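/**
 * amdgpu_bo_create - create a BO using the default placement for @domain
 *
 * Convenience wrapper around amdgpu_bo_create_restricted() that builds
 * the TTM placement list from @domain and @flags itself.
 *
 * A minimal usage sketch (a hypothetical 4 KiB kernel BO in GTT):
 *
 *	struct amdgpu_bo *bo;
 *	int r = amdgpu_bo_create(adev, 4096, PAGE_SIZE, true,
 *				 AMDGPU_GEM_DOMAIN_GTT, 0, NULL, NULL, &bo);
 */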
int amdgpu_bo_create(struct amdgpu_device *adev,
		     unsigned long size, int byte_align,
		     bool kernel, u32 domain, u64 flags,
		     struct sg_table *sg,
		     struct reservation_object *resv,
		     struct amdgpu_bo **bo_ptr)
{
	struct ttm_placement placement = {0};
	struct ttm_place placements[AMDGPU_GEM_DOMAIN_MAX + 1];

	memset(&placements, 0,
	       (AMDGPU_GEM_DOMAIN_MAX + 1) * sizeof(struct ttm_place));

	amdgpu_ttm_placement_init(adev, &placement,
				  placements, domain, flags);

	return amdgpu_bo_create_restricted(adev, size, byte_align, kernel,
					   domain, flags, sg, &placement,
					   resv, bo_ptr);
}

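/**
 * amdgpu_bo_kmap - map a BO into kernel address space
 *
 * Maps the whole object and caches the pointer in bo->kptr; repeated
 * calls return the cached mapping.  Fails with -EPERM if the BO was
 * created with AMDGPU_GEM_CREATE_NO_CPU_ACCESS.
 */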
int amdgpu_bo_kmap(struct amdgpu_bo *bo, void **ptr)
{
	bool is_iomem;
	int r;

	if (bo->flags & AMDGPU_GEM_CREATE_NO_CPU_ACCESS)
		return -EPERM;

	if (bo->kptr) {
		if (ptr) {
			*ptr = bo->kptr;
		}
		return 0;
	}
	r = ttm_bo_kmap(&bo->tbo, 0, bo->tbo.num_pages, &bo->kmap);
	if (r) {
		return r;
	}
	bo->kptr = ttm_kmap_obj_virtual(&bo->kmap, &is_iomem);
	if (ptr) {
		*ptr = bo->kptr;
	}
	return 0;
}

void amdgpu_bo_kunmap(struct amdgpu_bo *bo)
{
	if (bo->kptr == NULL)
		return;
	bo->kptr = NULL;
	ttm_bo_kunmap(&bo->kmap);
}

struct amdgpu_bo *amdgpu_bo_ref(struct amdgpu_bo *bo)
{
	if (bo == NULL)
		return NULL;

	ttm_bo_reference(&bo->tbo);
	return bo;
}

void amdgpu_bo_unref(struct amdgpu_bo **bo)
{
	struct ttm_buffer_object *tbo;

	if ((*bo) == NULL)
		return;

	tbo = &((*bo)->tbo);
	ttm_bo_unref(&tbo);
	if (tbo == NULL)
		*bo = NULL;
}

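/**
 * amdgpu_bo_pin_restricted - pin a BO within a GPU address range
 *
 * Pins @bo into @domain between @min_offset and @max_offset (0 means
 * unrestricted) and optionally returns the GPU address.  If the BO is
 * already pinned, only the pin count is bumped and the existing offset
 * is checked against @max_offset.
 */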
int amdgpu_bo_pin_restricted(struct amdgpu_bo *bo, u32 domain,
			     u64 min_offset, u64 max_offset,
			     u64 *gpu_addr)
{
	int r, i;
	unsigned fpfn, lpfn;

	if (amdgpu_ttm_tt_has_userptr(bo->tbo.ttm))
		return -EPERM;

	if (WARN_ON_ONCE(min_offset > max_offset))
		return -EINVAL;

	if (bo->pin_count) {
		bo->pin_count++;
		if (gpu_addr)
			*gpu_addr = amdgpu_bo_gpu_offset(bo);

		if (max_offset != 0) {
			u64 domain_start;
			if (domain == AMDGPU_GEM_DOMAIN_VRAM)
				domain_start = bo->adev->mc.vram_start;
			else
				domain_start = bo->adev->mc.gtt_start;
			WARN_ON_ONCE(max_offset <
				     (amdgpu_bo_gpu_offset(bo) - domain_start));
		}

		return 0;
	}
	amdgpu_ttm_placement_from_domain(bo, domain);
	for (i = 0; i < bo->placement.num_placement; i++) {
		/* force to pin into visible video ram */
		if ((bo->placements[i].flags & TTM_PL_FLAG_VRAM) &&
		    !(bo->flags & AMDGPU_GEM_CREATE_NO_CPU_ACCESS) &&
		    (!max_offset || max_offset > bo->adev->mc.visible_vram_size)) {
			if (WARN_ON_ONCE(min_offset >
					 bo->adev->mc.visible_vram_size))
				return -EINVAL;
			fpfn = min_offset >> PAGE_SHIFT;
			lpfn = bo->adev->mc.visible_vram_size >> PAGE_SHIFT;
		} else {
			fpfn = min_offset >> PAGE_SHIFT;
			lpfn = max_offset >> PAGE_SHIFT;
		}
		if (fpfn > bo->placements[i].fpfn)
			bo->placements[i].fpfn = fpfn;
		if (!bo->placements[i].lpfn ||
		    (lpfn && lpfn < bo->placements[i].lpfn))
			bo->placements[i].lpfn = lpfn;
		bo->placements[i].flags |= TTM_PL_FLAG_NO_EVICT;
	}

	r = ttm_bo_validate(&bo->tbo, &bo->placement, false, false);
	if (likely(r == 0)) {
		bo->pin_count = 1;
		if (gpu_addr != NULL)
			*gpu_addr = amdgpu_bo_gpu_offset(bo);
		if (domain == AMDGPU_GEM_DOMAIN_VRAM)
			bo->adev->vram_pin_size += amdgpu_bo_size(bo);
		else
			bo->adev->gart_pin_size += amdgpu_bo_size(bo);
	} else {
		dev_err(bo->adev->dev, "%p pin failed\n", bo);
	}
	return r;
}

int amdgpu_bo_pin(struct amdgpu_bo *bo, u32 domain, u64 *gpu_addr)
{
	return amdgpu_bo_pin_restricted(bo, domain, 0, 0, gpu_addr);
}

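/**
 * amdgpu_bo_unpin - drop one pin reference
 *
 * Once the pin count reaches zero, clears TTM_PL_FLAG_NO_EVICT and
 * revalidates, making the BO evictable again.
 */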
int amdgpu_bo_unpin(struct amdgpu_bo *bo)
{
	int r, i;

	if (!bo->pin_count) {
		dev_warn(bo->adev->dev, "%p unpin not necessary\n", bo);
		return 0;
	}
	bo->pin_count--;
	if (bo->pin_count)
		return 0;
	for (i = 0; i < bo->placement.num_placement; i++) {
		bo->placements[i].lpfn = 0;
		bo->placements[i].flags &= ~TTM_PL_FLAG_NO_EVICT;
	}
	r = ttm_bo_validate(&bo->tbo, &bo->placement, false, false);
	if (likely(r == 0)) {
		if (bo->tbo.mem.mem_type == TTM_PL_VRAM)
			bo->adev->vram_pin_size -= amdgpu_bo_size(bo);
		else
			bo->adev->gart_pin_size -= amdgpu_bo_size(bo);
	} else {
		dev_err(bo->adev->dev, "%p validate failed for unpin\n", bo);
	}
	return r;
}

int amdgpu_bo_evict_vram(struct amdgpu_device *adev)
{
	/* late 2.6.33 fix IGP hibernate - we need pm ops to do this correctly */
	if (0 && (adev->flags & AMD_IS_APU)) {
		/* Useless to evict on IGP chips */
		return 0;
	}
	return ttm_bo_evict_mm(&adev->mman.bdev, TTM_PL_VRAM);
}

void amdgpu_bo_force_delete(struct amdgpu_device *adev)
{
	struct amdgpu_bo *bo, *n;

	if (list_empty(&adev->gem.objects)) {
		return;
	}
	dev_err(adev->dev, "Userspace still has active objects!\n");
	list_for_each_entry_safe(bo, n, &adev->gem.objects, list) {
		dev_err(adev->dev, "%p %p %lu %lu force free\n",
			&bo->gem_base, bo, (unsigned long)bo->gem_base.size,
			*((unsigned long *)&bo->gem_base.refcount));
		mutex_lock(&bo->adev->gem.mutex);
		list_del_init(&bo->list);
		mutex_unlock(&bo->adev->gem.mutex);
		/* this should unref the ttm bo */
		drm_gem_object_unreference_unlocked(&bo->gem_base);
	}
}

int amdgpu_bo_init(struct amdgpu_device *adev)
{
	/* Add an MTRR for the VRAM */
	adev->mc.vram_mtrr = arch_phys_wc_add(adev->mc.aper_base,
					      adev->mc.aper_size);
	DRM_INFO("Detected VRAM RAM=%lluM, BAR=%lluM\n",
		adev->mc.mc_vram_size >> 20,
		(unsigned long long)adev->mc.aper_size >> 20);
	DRM_INFO("RAM width %dbits DDR\n",
			adev->mc.vram_width);
	return amdgpu_ttm_init(adev);
}

void amdgpu_bo_fini(struct amdgpu_device *adev)
{
	amdgpu_ttm_fini(adev);
	arch_phys_wc_del(adev->mc.vram_mtrr);
}

int amdgpu_bo_fbdev_mmap(struct amdgpu_bo *bo,
			     struct vm_area_struct *vma)
{
	return ttm_fbdev_mmap(vma, &bo->tbo);
}

int amdgpu_bo_set_tiling_flags(struct amdgpu_bo *bo, u64 tiling_flags)
{
	if (AMDGPU_TILING_GET(tiling_flags, TILE_SPLIT) > 6)
		return -EINVAL;

	bo->tiling_flags = tiling_flags;
	return 0;
}

void amdgpu_bo_get_tiling_flags(struct amdgpu_bo *bo, u64 *tiling_flags)
{
	lockdep_assert_held(&bo->tbo.resv->lock.base);

	if (tiling_flags)
		*tiling_flags = bo->tiling_flags;
}

int amdgpu_bo_set_metadata(struct amdgpu_bo *bo, void *metadata,
			    uint32_t metadata_size, uint64_t flags)
{
	void *buffer;

	if (!metadata_size) {
		if (bo->metadata_size) {
			kfree(bo->metadata);
			bo->metadata = NULL;
			bo->metadata_size = 0;
		}
		return 0;
	}

	if (metadata == NULL)
		return -EINVAL;

	buffer = kmemdup(metadata, metadata_size, GFP_KERNEL);
	if (buffer == NULL)
		return -ENOMEM;

	kfree(bo->metadata);
	bo->metadata_flags = flags;
	bo->metadata = buffer;
	bo->metadata_size = metadata_size;

	return 0;
}

int amdgpu_bo_get_metadata(struct amdgpu_bo *bo, void *buffer,
			   size_t buffer_size, uint32_t *metadata_size,
			   uint64_t *flags)
{
	if (!buffer && !metadata_size)
		return -EINVAL;

	if (buffer) {
		if (buffer_size < bo->metadata_size)
			return -EINVAL;

		if (bo->metadata_size)
			memcpy(buffer, bo->metadata, bo->metadata_size);
	}

	if (metadata_size)
		*metadata_size = bo->metadata_size;
	if (flags)
		*flags = bo->metadata_flags;

	return 0;
}

void amdgpu_bo_move_notify(struct ttm_buffer_object *bo,
			   struct ttm_mem_reg *new_mem)
{
	struct amdgpu_bo *rbo;

	if (!amdgpu_ttm_bo_is_amdgpu_bo(bo))
		return;

	rbo = container_of(bo, struct amdgpu_bo, tbo);
	amdgpu_vm_bo_invalidate(rbo->adev, rbo);

	/* update statistics */
	if (!new_mem)
		return;

	/* move_notify is called before move happens */
	amdgpu_update_memory_usage(rbo->adev, &bo->mem, new_mem);
}

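/*
 * CPU fault handler callback: if the faulting BO lives in VRAM beyond
 * the CPU-visible window, try to move it into visible VRAM, falling
 * back to GTT when that fails with -ENOMEM.
 */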
int amdgpu_bo_fault_reserve_notify(struct ttm_buffer_object *bo)
{
	struct amdgpu_device *adev;
	struct amdgpu_bo *abo;
	unsigned long offset, size, lpfn;
	int i, r;

	if (!amdgpu_ttm_bo_is_amdgpu_bo(bo))
		return 0;

	abo = container_of(bo, struct amdgpu_bo, tbo);
	adev = abo->adev;
	if (bo->mem.mem_type != TTM_PL_VRAM)
		return 0;

	size = bo->mem.num_pages << PAGE_SHIFT;
	offset = bo->mem.start << PAGE_SHIFT;
	if ((offset + size) <= adev->mc.visible_vram_size)
		return 0;

	/* hurrah, the memory is not visible! */
	amdgpu_ttm_placement_from_domain(abo, AMDGPU_GEM_DOMAIN_VRAM);
	lpfn = adev->mc.visible_vram_size >> PAGE_SHIFT;
	for (i = 0; i < abo->placement.num_placement; i++) {
		/* Force into visible VRAM */
		if ((abo->placements[i].flags & TTM_PL_FLAG_VRAM) &&
		    (!abo->placements[i].lpfn || abo->placements[i].lpfn > lpfn))
			abo->placements[i].lpfn = lpfn;
	}
	r = ttm_bo_validate(bo, &abo->placement, false, false);
	if (unlikely(r == -ENOMEM)) {
		amdgpu_ttm_placement_from_domain(abo, AMDGPU_GEM_DOMAIN_GTT);
		return ttm_bo_validate(bo, &abo->placement, false, false);
	} else if (unlikely(r != 0)) {
		return r;
	}

	offset = bo->mem.start << PAGE_SHIFT;
	/* this should never happen */
	if ((offset + size) > adev->mc.visible_vram_size)
		return -EINVAL;

	return 0;
}

/**
 * amdgpu_bo_fence - add fence to buffer object
 *
 * @bo: buffer object in question
 * @fence: fence to add
 * @shared: true if fence should be added shared
 */
void amdgpu_bo_fence(struct amdgpu_bo *bo, struct fence *fence,
		     bool shared)
{
	struct reservation_object *resv = bo->tbo.resv;

	if (shared)
		reservation_object_add_shared_fence(resv, fence);
	else
		reservation_object_add_excl_fence(resv, fence);
}
    674