amdgpu_bo.c revision 3f012e29
13f012e29Smrg/*
23f012e29Smrg * Copyright © 2014 Advanced Micro Devices, Inc.
33f012e29Smrg * All Rights Reserved.
43f012e29Smrg *
53f012e29Smrg * Permission is hereby granted, free of charge, to any person obtaining a
63f012e29Smrg * copy of this software and associated documentation files (the "Software"),
73f012e29Smrg * to deal in the Software without restriction, including without limitation
83f012e29Smrg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
93f012e29Smrg * and/or sell copies of the Software, and to permit persons to whom the
103f012e29Smrg * Software is furnished to do so, subject to the following conditions:
113f012e29Smrg *
123f012e29Smrg * The above copyright notice and this permission notice shall be included in
133f012e29Smrg * all copies or substantial portions of the Software.
143f012e29Smrg *
153f012e29Smrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
163f012e29Smrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
173f012e29Smrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
183f012e29Smrg * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
193f012e29Smrg * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
203f012e29Smrg * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
213f012e29Smrg * OTHER DEALINGS IN THE SOFTWARE.
223f012e29Smrg *
233f012e29Smrg */
243f012e29Smrg
253f012e29Smrg#ifdef HAVE_CONFIG_H
263f012e29Smrg#include "config.h"
273f012e29Smrg#endif
283f012e29Smrg
293f012e29Smrg#include <stdlib.h>
303f012e29Smrg#include <stdio.h>
313f012e29Smrg#include <stdint.h>
323f012e29Smrg#include <string.h>
333f012e29Smrg#include <errno.h>
343f012e29Smrg#include <fcntl.h>
353f012e29Smrg#include <unistd.h>
363f012e29Smrg#include <sys/ioctl.h>
373f012e29Smrg#include <sys/mman.h>
383f012e29Smrg#include <sys/time.h>
393f012e29Smrg
403f012e29Smrg#include "libdrm_macros.h"
413f012e29Smrg#include "xf86drm.h"
423f012e29Smrg#include "amdgpu_drm.h"
433f012e29Smrg#include "amdgpu_internal.h"
443f012e29Smrg#include "util_hash_table.h"
453f012e29Smrg#include "util_math.h"
463f012e29Smrg
473f012e29Smrgstatic void amdgpu_close_kms_handle(amdgpu_device_handle dev,
483f012e29Smrg				     uint32_t handle)
493f012e29Smrg{
503f012e29Smrg	struct drm_gem_close args = {};
513f012e29Smrg
523f012e29Smrg	args.handle = handle;
533f012e29Smrg	drmIoctl(dev->fd, DRM_IOCTL_GEM_CLOSE, &args);
543f012e29Smrg}
553f012e29Smrg
563f012e29Smrgdrm_private void amdgpu_bo_free_internal(amdgpu_bo_handle bo)
573f012e29Smrg{
583f012e29Smrg	/* Remove the buffer from the hash tables. */
593f012e29Smrg	pthread_mutex_lock(&bo->dev->bo_table_mutex);
603f012e29Smrg	util_hash_table_remove(bo->dev->bo_handles,
613f012e29Smrg			       (void*)(uintptr_t)bo->handle);
623f012e29Smrg	if (bo->flink_name) {
633f012e29Smrg		util_hash_table_remove(bo->dev->bo_flink_names,
643f012e29Smrg				       (void*)(uintptr_t)bo->flink_name);
653f012e29Smrg	}
663f012e29Smrg	pthread_mutex_unlock(&bo->dev->bo_table_mutex);
673f012e29Smrg
683f012e29Smrg	/* Release CPU access. */
693f012e29Smrg	if (bo->cpu_map_count > 0) {
703f012e29Smrg		bo->cpu_map_count = 1;
713f012e29Smrg		amdgpu_bo_cpu_unmap(bo);
723f012e29Smrg	}
733f012e29Smrg
743f012e29Smrg	amdgpu_close_kms_handle(bo->dev, bo->handle);
753f012e29Smrg	pthread_mutex_destroy(&bo->cpu_access_mutex);
763f012e29Smrg	free(bo);
773f012e29Smrg}
783f012e29Smrg
793f012e29Smrgint amdgpu_bo_alloc(amdgpu_device_handle dev,
803f012e29Smrg		    struct amdgpu_bo_alloc_request *alloc_buffer,
813f012e29Smrg		    amdgpu_bo_handle *buf_handle)
823f012e29Smrg{
833f012e29Smrg	struct amdgpu_bo *bo;
843f012e29Smrg	union drm_amdgpu_gem_create args;
853f012e29Smrg	unsigned heap = alloc_buffer->preferred_heap;
863f012e29Smrg	int r = 0;
873f012e29Smrg
883f012e29Smrg	/* It's an error if the heap is not specified */
893f012e29Smrg	if (!(heap & (AMDGPU_GEM_DOMAIN_GTT | AMDGPU_GEM_DOMAIN_VRAM)))
903f012e29Smrg		return -EINVAL;
913f012e29Smrg
923f012e29Smrg	bo = calloc(1, sizeof(struct amdgpu_bo));
933f012e29Smrg	if (!bo)
943f012e29Smrg		return -ENOMEM;
953f012e29Smrg
963f012e29Smrg	atomic_set(&bo->refcount, 1);
973f012e29Smrg	bo->dev = dev;
983f012e29Smrg	bo->alloc_size = alloc_buffer->alloc_size;
993f012e29Smrg
1003f012e29Smrg	memset(&args, 0, sizeof(args));
1013f012e29Smrg	args.in.bo_size = alloc_buffer->alloc_size;
1023f012e29Smrg	args.in.alignment = alloc_buffer->phys_alignment;
1033f012e29Smrg
1043f012e29Smrg	/* Set the placement. */
1053f012e29Smrg	args.in.domains = heap;
1063f012e29Smrg	args.in.domain_flags = alloc_buffer->flags;
1073f012e29Smrg
1083f012e29Smrg	/* Allocate the buffer with the preferred heap. */
1093f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_GEM_CREATE,
1103f012e29Smrg				&args, sizeof(args));
1113f012e29Smrg	if (r) {
1123f012e29Smrg		free(bo);
1133f012e29Smrg		return r;
1143f012e29Smrg	}
1153f012e29Smrg
1163f012e29Smrg	bo->handle = args.out.handle;
1173f012e29Smrg
1183f012e29Smrg	pthread_mutex_init(&bo->cpu_access_mutex, NULL);
1193f012e29Smrg
1203f012e29Smrg	*buf_handle = bo;
1213f012e29Smrg	return 0;
1223f012e29Smrg}
1233f012e29Smrg
1243f012e29Smrgint amdgpu_bo_set_metadata(amdgpu_bo_handle bo,
1253f012e29Smrg			   struct amdgpu_bo_metadata *info)
1263f012e29Smrg{
1273f012e29Smrg	struct drm_amdgpu_gem_metadata args = {};
1283f012e29Smrg
1293f012e29Smrg	args.handle = bo->handle;
1303f012e29Smrg	args.op = AMDGPU_GEM_METADATA_OP_SET_METADATA;
1313f012e29Smrg	args.data.flags = info->flags;
1323f012e29Smrg	args.data.tiling_info = info->tiling_info;
1333f012e29Smrg
1343f012e29Smrg	if (info->size_metadata > sizeof(args.data.data))
1353f012e29Smrg		return -EINVAL;
1363f012e29Smrg
1373f012e29Smrg	if (info->size_metadata) {
1383f012e29Smrg		args.data.data_size_bytes = info->size_metadata;
1393f012e29Smrg		memcpy(args.data.data, info->umd_metadata, info->size_metadata);
1403f012e29Smrg	}
1413f012e29Smrg
1423f012e29Smrg	return drmCommandWriteRead(bo->dev->fd,
1433f012e29Smrg				   DRM_AMDGPU_GEM_METADATA,
1443f012e29Smrg				   &args, sizeof(args));
1453f012e29Smrg}
1463f012e29Smrg
1473f012e29Smrgint amdgpu_bo_query_info(amdgpu_bo_handle bo,
1483f012e29Smrg			 struct amdgpu_bo_info *info)
1493f012e29Smrg{
1503f012e29Smrg	struct drm_amdgpu_gem_metadata metadata = {};
1513f012e29Smrg	struct drm_amdgpu_gem_create_in bo_info = {};
1523f012e29Smrg	struct drm_amdgpu_gem_op gem_op = {};
1533f012e29Smrg	int r;
1543f012e29Smrg
1553f012e29Smrg	/* Validate the BO passed in */
1563f012e29Smrg	if (!bo->handle)
1573f012e29Smrg		return -EINVAL;
1583f012e29Smrg
1593f012e29Smrg	/* Query metadata. */
1603f012e29Smrg	metadata.handle = bo->handle;
1613f012e29Smrg	metadata.op = AMDGPU_GEM_METADATA_OP_GET_METADATA;
1623f012e29Smrg
1633f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_METADATA,
1643f012e29Smrg				&metadata, sizeof(metadata));
1653f012e29Smrg	if (r)
1663f012e29Smrg		return r;
1673f012e29Smrg
1683f012e29Smrg	if (metadata.data.data_size_bytes >
1693f012e29Smrg	    sizeof(info->metadata.umd_metadata))
1703f012e29Smrg		return -EINVAL;
1713f012e29Smrg
1723f012e29Smrg	/* Query buffer info. */
1733f012e29Smrg	gem_op.handle = bo->handle;
1743f012e29Smrg	gem_op.op = AMDGPU_GEM_OP_GET_GEM_CREATE_INFO;
1753f012e29Smrg	gem_op.value = (uintptr_t)&bo_info;
1763f012e29Smrg
1773f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_OP,
1783f012e29Smrg				&gem_op, sizeof(gem_op));
1793f012e29Smrg	if (r)
1803f012e29Smrg		return r;
1813f012e29Smrg
1823f012e29Smrg	memset(info, 0, sizeof(*info));
1833f012e29Smrg	info->alloc_size = bo_info.bo_size;
1843f012e29Smrg	info->phys_alignment = bo_info.alignment;
1853f012e29Smrg	info->preferred_heap = bo_info.domains;
1863f012e29Smrg	info->alloc_flags = bo_info.domain_flags;
1873f012e29Smrg	info->metadata.flags = metadata.data.flags;
1883f012e29Smrg	info->metadata.tiling_info = metadata.data.tiling_info;
1893f012e29Smrg
1903f012e29Smrg	info->metadata.size_metadata = metadata.data.data_size_bytes;
1913f012e29Smrg	if (metadata.data.data_size_bytes > 0)
1923f012e29Smrg		memcpy(info->metadata.umd_metadata, metadata.data.data,
1933f012e29Smrg		       metadata.data.data_size_bytes);
1943f012e29Smrg
1953f012e29Smrg	return 0;
1963f012e29Smrg}
1973f012e29Smrg
1983f012e29Smrgstatic void amdgpu_add_handle_to_table(amdgpu_bo_handle bo)
1993f012e29Smrg{
2003f012e29Smrg	pthread_mutex_lock(&bo->dev->bo_table_mutex);
2013f012e29Smrg	util_hash_table_set(bo->dev->bo_handles,
2023f012e29Smrg			    (void*)(uintptr_t)bo->handle, bo);
2033f012e29Smrg	pthread_mutex_unlock(&bo->dev->bo_table_mutex);
2043f012e29Smrg}
2053f012e29Smrg
2063f012e29Smrgstatic int amdgpu_bo_export_flink(amdgpu_bo_handle bo)
2073f012e29Smrg{
2083f012e29Smrg	struct drm_gem_flink flink;
2093f012e29Smrg	int fd, dma_fd;
2103f012e29Smrg	uint32_t handle;
2113f012e29Smrg	int r;
2123f012e29Smrg
2133f012e29Smrg	fd = bo->dev->fd;
2143f012e29Smrg	handle = bo->handle;
2153f012e29Smrg	if (bo->flink_name)
2163f012e29Smrg		return 0;
2173f012e29Smrg
2183f012e29Smrg
2193f012e29Smrg	if (bo->dev->flink_fd != bo->dev->fd) {
2203f012e29Smrg		r = drmPrimeHandleToFD(bo->dev->fd, bo->handle, DRM_CLOEXEC,
2213f012e29Smrg				       &dma_fd);
2223f012e29Smrg		if (!r) {
2233f012e29Smrg			r = drmPrimeFDToHandle(bo->dev->flink_fd, dma_fd, &handle);
2243f012e29Smrg			close(dma_fd);
2253f012e29Smrg		}
2263f012e29Smrg		if (r)
2273f012e29Smrg			return r;
2283f012e29Smrg		fd = bo->dev->flink_fd;
2293f012e29Smrg	}
2303f012e29Smrg	memset(&flink, 0, sizeof(flink));
2313f012e29Smrg	flink.handle = handle;
2323f012e29Smrg
2333f012e29Smrg	r = drmIoctl(fd, DRM_IOCTL_GEM_FLINK, &flink);
2343f012e29Smrg	if (r)
2353f012e29Smrg		return r;
2363f012e29Smrg
2373f012e29Smrg	bo->flink_name = flink.name;
2383f012e29Smrg
2393f012e29Smrg	if (bo->dev->flink_fd != bo->dev->fd) {
2403f012e29Smrg		struct drm_gem_close args = {};
2413f012e29Smrg		args.handle = handle;
2423f012e29Smrg		drmIoctl(bo->dev->flink_fd, DRM_IOCTL_GEM_CLOSE, &args);
2433f012e29Smrg	}
2443f012e29Smrg
2453f012e29Smrg	pthread_mutex_lock(&bo->dev->bo_table_mutex);
2463f012e29Smrg	util_hash_table_set(bo->dev->bo_flink_names,
2473f012e29Smrg			    (void*)(uintptr_t)bo->flink_name,
2483f012e29Smrg			    bo);
2493f012e29Smrg	pthread_mutex_unlock(&bo->dev->bo_table_mutex);
2503f012e29Smrg
2513f012e29Smrg	return 0;
2523f012e29Smrg}
2533f012e29Smrg
2543f012e29Smrgint amdgpu_bo_export(amdgpu_bo_handle bo,
2553f012e29Smrg		     enum amdgpu_bo_handle_type type,
2563f012e29Smrg		     uint32_t *shared_handle)
2573f012e29Smrg{
2583f012e29Smrg	int r;
2593f012e29Smrg
2603f012e29Smrg	switch (type) {
2613f012e29Smrg	case amdgpu_bo_handle_type_gem_flink_name:
2623f012e29Smrg		r = amdgpu_bo_export_flink(bo);
2633f012e29Smrg		if (r)
2643f012e29Smrg			return r;
2653f012e29Smrg
2663f012e29Smrg		*shared_handle = bo->flink_name;
2673f012e29Smrg		return 0;
2683f012e29Smrg
2693f012e29Smrg	case amdgpu_bo_handle_type_kms:
2703f012e29Smrg		amdgpu_add_handle_to_table(bo);
2713f012e29Smrg		*shared_handle = bo->handle;
2723f012e29Smrg		return 0;
2733f012e29Smrg
2743f012e29Smrg	case amdgpu_bo_handle_type_dma_buf_fd:
2753f012e29Smrg		amdgpu_add_handle_to_table(bo);
2763f012e29Smrg		return drmPrimeHandleToFD(bo->dev->fd, bo->handle, DRM_CLOEXEC,
2773f012e29Smrg				       (int*)shared_handle);
2783f012e29Smrg	}
2793f012e29Smrg	return -EINVAL;
2803f012e29Smrg}
2813f012e29Smrg
2823f012e29Smrgint amdgpu_bo_import(amdgpu_device_handle dev,
2833f012e29Smrg		     enum amdgpu_bo_handle_type type,
2843f012e29Smrg		     uint32_t shared_handle,
2853f012e29Smrg		     struct amdgpu_bo_import_result *output)
2863f012e29Smrg{
2873f012e29Smrg	struct drm_gem_open open_arg = {};
2883f012e29Smrg	struct amdgpu_bo *bo = NULL;
2893f012e29Smrg	int r;
2903f012e29Smrg	int dma_fd;
2913f012e29Smrg	uint64_t dma_buf_size = 0;
2923f012e29Smrg
2933f012e29Smrg	/* We must maintain a list of pairs <handle, bo>, so that we always
2943f012e29Smrg	 * return the same amdgpu_bo instance for the same handle. */
2953f012e29Smrg	pthread_mutex_lock(&dev->bo_table_mutex);
2963f012e29Smrg
2973f012e29Smrg	/* Convert a DMA buf handle to a KMS handle now. */
2983f012e29Smrg	if (type == amdgpu_bo_handle_type_dma_buf_fd) {
2993f012e29Smrg		uint32_t handle;
3003f012e29Smrg		off_t size;
3013f012e29Smrg
3023f012e29Smrg		/* Get a KMS handle. */
3033f012e29Smrg		r = drmPrimeFDToHandle(dev->fd, shared_handle, &handle);
3043f012e29Smrg		if (r) {
3053f012e29Smrg			return r;
3063f012e29Smrg		}
3073f012e29Smrg
3083f012e29Smrg		/* Query the buffer size. */
3093f012e29Smrg		size = lseek(shared_handle, 0, SEEK_END);
3103f012e29Smrg		if (size == (off_t)-1) {
3113f012e29Smrg			pthread_mutex_unlock(&dev->bo_table_mutex);
3123f012e29Smrg			amdgpu_close_kms_handle(dev, handle);
3133f012e29Smrg			return -errno;
3143f012e29Smrg		}
3153f012e29Smrg		lseek(shared_handle, 0, SEEK_SET);
3163f012e29Smrg
3173f012e29Smrg		dma_buf_size = size;
3183f012e29Smrg		shared_handle = handle;
3193f012e29Smrg	}
3203f012e29Smrg
3213f012e29Smrg	/* If we have already created a buffer with this handle, find it. */
3223f012e29Smrg	switch (type) {
3233f012e29Smrg	case amdgpu_bo_handle_type_gem_flink_name:
3243f012e29Smrg		bo = util_hash_table_get(dev->bo_flink_names,
3253f012e29Smrg					 (void*)(uintptr_t)shared_handle);
3263f012e29Smrg		break;
3273f012e29Smrg
3283f012e29Smrg	case amdgpu_bo_handle_type_dma_buf_fd:
3293f012e29Smrg		bo = util_hash_table_get(dev->bo_handles,
3303f012e29Smrg					 (void*)(uintptr_t)shared_handle);
3313f012e29Smrg		break;
3323f012e29Smrg
3333f012e29Smrg	case amdgpu_bo_handle_type_kms:
3343f012e29Smrg		/* Importing a KMS handle in not allowed. */
3353f012e29Smrg		pthread_mutex_unlock(&dev->bo_table_mutex);
3363f012e29Smrg		return -EPERM;
3373f012e29Smrg
3383f012e29Smrg	default:
3393f012e29Smrg		pthread_mutex_unlock(&dev->bo_table_mutex);
3403f012e29Smrg		return -EINVAL;
3413f012e29Smrg	}
3423f012e29Smrg
3433f012e29Smrg	if (bo) {
3443f012e29Smrg		pthread_mutex_unlock(&dev->bo_table_mutex);
3453f012e29Smrg
3463f012e29Smrg		/* The buffer already exists, just bump the refcount. */
3473f012e29Smrg		atomic_inc(&bo->refcount);
3483f012e29Smrg
3493f012e29Smrg		output->buf_handle = bo;
3503f012e29Smrg		output->alloc_size = bo->alloc_size;
3513f012e29Smrg		return 0;
3523f012e29Smrg	}
3533f012e29Smrg
3543f012e29Smrg	bo = calloc(1, sizeof(struct amdgpu_bo));
3553f012e29Smrg	if (!bo) {
3563f012e29Smrg		pthread_mutex_unlock(&dev->bo_table_mutex);
3573f012e29Smrg		if (type == amdgpu_bo_handle_type_dma_buf_fd) {
3583f012e29Smrg			amdgpu_close_kms_handle(dev, shared_handle);
3593f012e29Smrg		}
3603f012e29Smrg		return -ENOMEM;
3613f012e29Smrg	}
3623f012e29Smrg
3633f012e29Smrg	/* Open the handle. */
3643f012e29Smrg	switch (type) {
3653f012e29Smrg	case amdgpu_bo_handle_type_gem_flink_name:
3663f012e29Smrg		open_arg.name = shared_handle;
3673f012e29Smrg		r = drmIoctl(dev->flink_fd, DRM_IOCTL_GEM_OPEN, &open_arg);
3683f012e29Smrg		if (r) {
3693f012e29Smrg			free(bo);
3703f012e29Smrg			pthread_mutex_unlock(&dev->bo_table_mutex);
3713f012e29Smrg			return r;
3723f012e29Smrg		}
3733f012e29Smrg
3743f012e29Smrg		bo->handle = open_arg.handle;
3753f012e29Smrg		if (dev->flink_fd != dev->fd) {
3763f012e29Smrg			r = drmPrimeHandleToFD(dev->flink_fd, bo->handle, DRM_CLOEXEC, &dma_fd);
3773f012e29Smrg			if (r) {
3783f012e29Smrg				free(bo);
3793f012e29Smrg				pthread_mutex_unlock(&dev->bo_table_mutex);
3803f012e29Smrg				return r;
3813f012e29Smrg			}
3823f012e29Smrg			r = drmPrimeFDToHandle(dev->fd, dma_fd, &bo->handle );
3833f012e29Smrg
3843f012e29Smrg			close(dma_fd);
3853f012e29Smrg
3863f012e29Smrg			if (r) {
3873f012e29Smrg				free(bo);
3883f012e29Smrg				pthread_mutex_unlock(&dev->bo_table_mutex);
3893f012e29Smrg				return r;
3903f012e29Smrg			}
3913f012e29Smrg		}
3923f012e29Smrg		bo->flink_name = shared_handle;
3933f012e29Smrg		bo->alloc_size = open_arg.size;
3943f012e29Smrg		util_hash_table_set(dev->bo_flink_names,
3953f012e29Smrg				    (void*)(uintptr_t)bo->flink_name, bo);
3963f012e29Smrg		break;
3973f012e29Smrg
3983f012e29Smrg	case amdgpu_bo_handle_type_dma_buf_fd:
3993f012e29Smrg		bo->handle = shared_handle;
4003f012e29Smrg		bo->alloc_size = dma_buf_size;
4013f012e29Smrg		break;
4023f012e29Smrg
4033f012e29Smrg	case amdgpu_bo_handle_type_kms:
4043f012e29Smrg		assert(0); /* unreachable */
4053f012e29Smrg	}
4063f012e29Smrg
4073f012e29Smrg	/* Initialize it. */
4083f012e29Smrg	atomic_set(&bo->refcount, 1);
4093f012e29Smrg	bo->dev = dev;
4103f012e29Smrg	pthread_mutex_init(&bo->cpu_access_mutex, NULL);
4113f012e29Smrg
4123f012e29Smrg	util_hash_table_set(dev->bo_handles, (void*)(uintptr_t)bo->handle, bo);
4133f012e29Smrg	pthread_mutex_unlock(&dev->bo_table_mutex);
4143f012e29Smrg
4153f012e29Smrg	output->buf_handle = bo;
4163f012e29Smrg	output->alloc_size = bo->alloc_size;
4173f012e29Smrg	return 0;
4183f012e29Smrg}
4193f012e29Smrg
4203f012e29Smrgint amdgpu_bo_free(amdgpu_bo_handle buf_handle)
4213f012e29Smrg{
4223f012e29Smrg	/* Just drop the reference. */
4233f012e29Smrg	amdgpu_bo_reference(&buf_handle, NULL);
4243f012e29Smrg	return 0;
4253f012e29Smrg}
4263f012e29Smrg
4273f012e29Smrgint amdgpu_bo_cpu_map(amdgpu_bo_handle bo, void **cpu)
4283f012e29Smrg{
4293f012e29Smrg	union drm_amdgpu_gem_mmap args;
4303f012e29Smrg	void *ptr;
4313f012e29Smrg	int r;
4323f012e29Smrg
4333f012e29Smrg	pthread_mutex_lock(&bo->cpu_access_mutex);
4343f012e29Smrg
4353f012e29Smrg	if (bo->cpu_ptr) {
4363f012e29Smrg		/* already mapped */
4373f012e29Smrg		assert(bo->cpu_map_count > 0);
4383f012e29Smrg		bo->cpu_map_count++;
4393f012e29Smrg		*cpu = bo->cpu_ptr;
4403f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4413f012e29Smrg		return 0;
4423f012e29Smrg	}
4433f012e29Smrg
4443f012e29Smrg	assert(bo->cpu_map_count == 0);
4453f012e29Smrg
4463f012e29Smrg	memset(&args, 0, sizeof(args));
4473f012e29Smrg
4483f012e29Smrg	/* Query the buffer address (args.addr_ptr).
4493f012e29Smrg	 * The kernel driver ignores the offset and size parameters. */
4503f012e29Smrg	args.in.handle = bo->handle;
4513f012e29Smrg
4523f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_MMAP, &args,
4533f012e29Smrg				sizeof(args));
4543f012e29Smrg	if (r) {
4553f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4563f012e29Smrg		return r;
4573f012e29Smrg	}
4583f012e29Smrg
4593f012e29Smrg	/* Map the buffer. */
4603f012e29Smrg	ptr = drm_mmap(NULL, bo->alloc_size, PROT_READ | PROT_WRITE, MAP_SHARED,
4613f012e29Smrg		       bo->dev->fd, args.out.addr_ptr);
4623f012e29Smrg	if (ptr == MAP_FAILED) {
4633f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4643f012e29Smrg		return -errno;
4653f012e29Smrg	}
4663f012e29Smrg
4673f012e29Smrg	bo->cpu_ptr = ptr;
4683f012e29Smrg	bo->cpu_map_count = 1;
4693f012e29Smrg	pthread_mutex_unlock(&bo->cpu_access_mutex);
4703f012e29Smrg
4713f012e29Smrg	*cpu = ptr;
4723f012e29Smrg	return 0;
4733f012e29Smrg}
4743f012e29Smrg
4753f012e29Smrgint amdgpu_bo_cpu_unmap(amdgpu_bo_handle bo)
4763f012e29Smrg{
4773f012e29Smrg	int r;
4783f012e29Smrg
4793f012e29Smrg	pthread_mutex_lock(&bo->cpu_access_mutex);
4803f012e29Smrg	assert(bo->cpu_map_count >= 0);
4813f012e29Smrg
4823f012e29Smrg	if (bo->cpu_map_count == 0) {
4833f012e29Smrg		/* not mapped */
4843f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4853f012e29Smrg		return -EINVAL;
4863f012e29Smrg	}
4873f012e29Smrg
4883f012e29Smrg	bo->cpu_map_count--;
4893f012e29Smrg	if (bo->cpu_map_count > 0) {
4903f012e29Smrg		/* mapped multiple times */
4913f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4923f012e29Smrg		return 0;
4933f012e29Smrg	}
4943f012e29Smrg
4953f012e29Smrg	r = drm_munmap(bo->cpu_ptr, bo->alloc_size) == 0 ? 0 : -errno;
4963f012e29Smrg	bo->cpu_ptr = NULL;
4973f012e29Smrg	pthread_mutex_unlock(&bo->cpu_access_mutex);
4983f012e29Smrg	return r;
4993f012e29Smrg}
5003f012e29Smrg
5013f012e29Smrgint amdgpu_query_buffer_size_alignment(amdgpu_device_handle dev,
5023f012e29Smrg				struct amdgpu_buffer_size_alignments *info)
5033f012e29Smrg{
5043f012e29Smrg	info->size_local = dev->dev_info.pte_fragment_size;
5053f012e29Smrg	info->size_remote = dev->dev_info.gart_page_size;
5063f012e29Smrg	return 0;
5073f012e29Smrg}
5083f012e29Smrg
5093f012e29Smrgint amdgpu_bo_wait_for_idle(amdgpu_bo_handle bo,
5103f012e29Smrg			    uint64_t timeout_ns,
5113f012e29Smrg			    bool *busy)
5123f012e29Smrg{
5133f012e29Smrg	union drm_amdgpu_gem_wait_idle args;
5143f012e29Smrg	int r;
5153f012e29Smrg
5163f012e29Smrg	memset(&args, 0, sizeof(args));
5173f012e29Smrg	args.in.handle = bo->handle;
5183f012e29Smrg	args.in.timeout = amdgpu_cs_calculate_timeout(timeout_ns);
5193f012e29Smrg
5203f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_WAIT_IDLE,
5213f012e29Smrg				&args, sizeof(args));
5223f012e29Smrg
5233f012e29Smrg	if (r == 0) {
5243f012e29Smrg		*busy = args.out.status;
5253f012e29Smrg		return 0;
5263f012e29Smrg	} else {
5273f012e29Smrg		fprintf(stderr, "amdgpu: GEM_WAIT_IDLE failed with %i\n", r);
5283f012e29Smrg		return r;
5293f012e29Smrg	}
5303f012e29Smrg}
5313f012e29Smrg
5323f012e29Smrgint amdgpu_create_bo_from_user_mem(amdgpu_device_handle dev,
5333f012e29Smrg				    void *cpu,
5343f012e29Smrg				    uint64_t size,
5353f012e29Smrg				    amdgpu_bo_handle *buf_handle)
5363f012e29Smrg{
5373f012e29Smrg	int r;
5383f012e29Smrg	struct amdgpu_bo *bo;
5393f012e29Smrg	struct drm_amdgpu_gem_userptr args;
5403f012e29Smrg
5413f012e29Smrg	args.addr = (uintptr_t)cpu;
5423f012e29Smrg	args.flags = AMDGPU_GEM_USERPTR_ANONONLY | AMDGPU_GEM_USERPTR_REGISTER |
5433f012e29Smrg		AMDGPU_GEM_USERPTR_VALIDATE;
5443f012e29Smrg	args.size = size;
5453f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_GEM_USERPTR,
5463f012e29Smrg				&args, sizeof(args));
5473f012e29Smrg	if (r)
5483f012e29Smrg		return r;
5493f012e29Smrg
5503f012e29Smrg	bo = calloc(1, sizeof(struct amdgpu_bo));
5513f012e29Smrg	if (!bo)
5523f012e29Smrg		return -ENOMEM;
5533f012e29Smrg
5543f012e29Smrg	atomic_set(&bo->refcount, 1);
5553f012e29Smrg	bo->dev = dev;
5563f012e29Smrg	bo->alloc_size = size;
5573f012e29Smrg	bo->handle = args.handle;
5583f012e29Smrg
5593f012e29Smrg	*buf_handle = bo;
5603f012e29Smrg
5613f012e29Smrg	return r;
5623f012e29Smrg}
5633f012e29Smrg
5643f012e29Smrgint amdgpu_bo_list_create(amdgpu_device_handle dev,
5653f012e29Smrg			  uint32_t number_of_resources,
5663f012e29Smrg			  amdgpu_bo_handle *resources,
5673f012e29Smrg			  uint8_t *resource_prios,
5683f012e29Smrg			  amdgpu_bo_list_handle *result)
5693f012e29Smrg{
5703f012e29Smrg	struct drm_amdgpu_bo_list_entry *list;
5713f012e29Smrg	union drm_amdgpu_bo_list args;
5723f012e29Smrg	unsigned i;
5733f012e29Smrg	int r;
5743f012e29Smrg
5753f012e29Smrg	if (!number_of_resources)
5763f012e29Smrg		return -EINVAL;
5773f012e29Smrg
5783f012e29Smrg	/* overflow check for multiplication */
5793f012e29Smrg	if (number_of_resources > UINT32_MAX / sizeof(struct drm_amdgpu_bo_list_entry))
5803f012e29Smrg		return -EINVAL;
5813f012e29Smrg
5823f012e29Smrg	list = malloc(number_of_resources * sizeof(struct drm_amdgpu_bo_list_entry));
5833f012e29Smrg	if (!list)
5843f012e29Smrg		return -ENOMEM;
5853f012e29Smrg
5863f012e29Smrg	*result = malloc(sizeof(struct amdgpu_bo_list));
5873f012e29Smrg	if (!*result) {
5883f012e29Smrg		free(list);
5893f012e29Smrg		return -ENOMEM;
5903f012e29Smrg	}
5913f012e29Smrg
5923f012e29Smrg	memset(&args, 0, sizeof(args));
5933f012e29Smrg	args.in.operation = AMDGPU_BO_LIST_OP_CREATE;
5943f012e29Smrg	args.in.bo_number = number_of_resources;
5953f012e29Smrg	args.in.bo_info_size = sizeof(struct drm_amdgpu_bo_list_entry);
5963f012e29Smrg	args.in.bo_info_ptr = (uint64_t)(uintptr_t)list;
5973f012e29Smrg
5983f012e29Smrg	for (i = 0; i < number_of_resources; i++) {
5993f012e29Smrg		list[i].bo_handle = resources[i]->handle;
6003f012e29Smrg		if (resource_prios)
6013f012e29Smrg			list[i].bo_priority = resource_prios[i];
6023f012e29Smrg		else
6033f012e29Smrg			list[i].bo_priority = 0;
6043f012e29Smrg	}
6053f012e29Smrg
6063f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_BO_LIST,
6073f012e29Smrg				&args, sizeof(args));
6083f012e29Smrg	free(list);
6093f012e29Smrg	if (r) {
6103f012e29Smrg		free(*result);
6113f012e29Smrg		return r;
6123f012e29Smrg	}
6133f012e29Smrg
6143f012e29Smrg	(*result)->dev = dev;
6153f012e29Smrg	(*result)->handle = args.out.list_handle;
6163f012e29Smrg	return 0;
6173f012e29Smrg}
6183f012e29Smrg
6193f012e29Smrgint amdgpu_bo_list_destroy(amdgpu_bo_list_handle list)
6203f012e29Smrg{
6213f012e29Smrg	union drm_amdgpu_bo_list args;
6223f012e29Smrg	int r;
6233f012e29Smrg
6243f012e29Smrg	memset(&args, 0, sizeof(args));
6253f012e29Smrg	args.in.operation = AMDGPU_BO_LIST_OP_DESTROY;
6263f012e29Smrg	args.in.list_handle = list->handle;
6273f012e29Smrg
6283f012e29Smrg	r = drmCommandWriteRead(list->dev->fd, DRM_AMDGPU_BO_LIST,
6293f012e29Smrg				&args, sizeof(args));
6303f012e29Smrg
6313f012e29Smrg	if (!r)
6323f012e29Smrg		free(list);
6333f012e29Smrg
6343f012e29Smrg	return r;
6353f012e29Smrg}
6363f012e29Smrg
6373f012e29Smrgint amdgpu_bo_list_update(amdgpu_bo_list_handle handle,
6383f012e29Smrg			  uint32_t number_of_resources,
6393f012e29Smrg			  amdgpu_bo_handle *resources,
6403f012e29Smrg			  uint8_t *resource_prios)
6413f012e29Smrg{
6423f012e29Smrg	struct drm_amdgpu_bo_list_entry *list;
6433f012e29Smrg	union drm_amdgpu_bo_list args;
6443f012e29Smrg	unsigned i;
6453f012e29Smrg	int r;
6463f012e29Smrg
6473f012e29Smrg	if (!number_of_resources)
6483f012e29Smrg		return -EINVAL;
6493f012e29Smrg
6503f012e29Smrg	/* overflow check for multiplication */
6513f012e29Smrg	if (number_of_resources > UINT32_MAX / sizeof(struct drm_amdgpu_bo_list_entry))
6523f012e29Smrg		return -EINVAL;
6533f012e29Smrg
6543f012e29Smrg	list = malloc(number_of_resources * sizeof(struct drm_amdgpu_bo_list_entry));
6553f012e29Smrg	if (list == NULL)
6563f012e29Smrg		return -ENOMEM;
6573f012e29Smrg
6583f012e29Smrg	args.in.operation = AMDGPU_BO_LIST_OP_UPDATE;
6593f012e29Smrg	args.in.list_handle = handle->handle;
6603f012e29Smrg	args.in.bo_number = number_of_resources;
6613f012e29Smrg	args.in.bo_info_size = sizeof(struct drm_amdgpu_bo_list_entry);
6623f012e29Smrg	args.in.bo_info_ptr = (uintptr_t)list;
6633f012e29Smrg
6643f012e29Smrg	for (i = 0; i < number_of_resources; i++) {
6653f012e29Smrg		list[i].bo_handle = resources[i]->handle;
6663f012e29Smrg		if (resource_prios)
6673f012e29Smrg			list[i].bo_priority = resource_prios[i];
6683f012e29Smrg		else
6693f012e29Smrg			list[i].bo_priority = 0;
6703f012e29Smrg	}
6713f012e29Smrg
6723f012e29Smrg	r = drmCommandWriteRead(handle->dev->fd, DRM_AMDGPU_BO_LIST,
6733f012e29Smrg				&args, sizeof(args));
6743f012e29Smrg	free(list);
6753f012e29Smrg	return r;
6763f012e29Smrg}
6773f012e29Smrg
6783f012e29Smrgint amdgpu_bo_va_op(amdgpu_bo_handle bo,
6793f012e29Smrg		     uint64_t offset,
6803f012e29Smrg		     uint64_t size,
6813f012e29Smrg		     uint64_t addr,
6823f012e29Smrg		     uint64_t flags,
6833f012e29Smrg		     uint32_t ops)
6843f012e29Smrg{
6853f012e29Smrg	amdgpu_device_handle dev = bo->dev;
6863f012e29Smrg	struct drm_amdgpu_gem_va va;
6873f012e29Smrg	int r;
6883f012e29Smrg
6893f012e29Smrg	if (ops != AMDGPU_VA_OP_MAP && ops != AMDGPU_VA_OP_UNMAP)
6903f012e29Smrg		return -EINVAL;
6913f012e29Smrg
6923f012e29Smrg	memset(&va, 0, sizeof(va));
6933f012e29Smrg	va.handle = bo->handle;
6943f012e29Smrg	va.operation = ops;
6953f012e29Smrg	va.flags = AMDGPU_VM_PAGE_READABLE |
6963f012e29Smrg		   AMDGPU_VM_PAGE_WRITEABLE |
6973f012e29Smrg		   AMDGPU_VM_PAGE_EXECUTABLE;
6983f012e29Smrg	va.va_address = addr;
6993f012e29Smrg	va.offset_in_bo = offset;
7003f012e29Smrg	va.map_size = ALIGN(size, getpagesize());
7013f012e29Smrg
7023f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_GEM_VA, &va, sizeof(va));
7033f012e29Smrg
7043f012e29Smrg	return r;
7053f012e29Smrg}
706