amdgpu_bo.c revision d8807b2f
13f012e29Smrg/*
23f012e29Smrg * Copyright © 2014 Advanced Micro Devices, Inc.
33f012e29Smrg * All Rights Reserved.
43f012e29Smrg *
53f012e29Smrg * Permission is hereby granted, free of charge, to any person obtaining a
63f012e29Smrg * copy of this software and associated documentation files (the "Software"),
73f012e29Smrg * to deal in the Software without restriction, including without limitation
83f012e29Smrg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
93f012e29Smrg * and/or sell copies of the Software, and to permit persons to whom the
103f012e29Smrg * Software is furnished to do so, subject to the following conditions:
113f012e29Smrg *
123f012e29Smrg * The above copyright notice and this permission notice shall be included in
133f012e29Smrg * all copies or substantial portions of the Software.
143f012e29Smrg *
153f012e29Smrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
163f012e29Smrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
173f012e29Smrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
183f012e29Smrg * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
193f012e29Smrg * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
203f012e29Smrg * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
213f012e29Smrg * OTHER DEALINGS IN THE SOFTWARE.
223f012e29Smrg *
233f012e29Smrg */
243f012e29Smrg
253f012e29Smrg#ifdef HAVE_CONFIG_H
263f012e29Smrg#include "config.h"
273f012e29Smrg#endif
283f012e29Smrg
293f012e29Smrg#include <stdlib.h>
303f012e29Smrg#include <stdio.h>
313f012e29Smrg#include <stdint.h>
323f012e29Smrg#include <string.h>
333f012e29Smrg#include <errno.h>
343f012e29Smrg#include <fcntl.h>
353f012e29Smrg#include <unistd.h>
363f012e29Smrg#include <sys/ioctl.h>
373f012e29Smrg#include <sys/mman.h>
383f012e29Smrg#include <sys/time.h>
393f012e29Smrg
403f012e29Smrg#include "libdrm_macros.h"
413f012e29Smrg#include "xf86drm.h"
423f012e29Smrg#include "amdgpu_drm.h"
433f012e29Smrg#include "amdgpu_internal.h"
443f012e29Smrg#include "util_hash_table.h"
453f012e29Smrg#include "util_math.h"
463f012e29Smrg
473f012e29Smrgstatic void amdgpu_close_kms_handle(amdgpu_device_handle dev,
483f012e29Smrg				     uint32_t handle)
493f012e29Smrg{
503f012e29Smrg	struct drm_gem_close args = {};
513f012e29Smrg
523f012e29Smrg	args.handle = handle;
533f012e29Smrg	drmIoctl(dev->fd, DRM_IOCTL_GEM_CLOSE, &args);
543f012e29Smrg}
553f012e29Smrg
563f012e29Smrgint amdgpu_bo_alloc(amdgpu_device_handle dev,
573f012e29Smrg		    struct amdgpu_bo_alloc_request *alloc_buffer,
583f012e29Smrg		    amdgpu_bo_handle *buf_handle)
593f012e29Smrg{
603f012e29Smrg	struct amdgpu_bo *bo;
613f012e29Smrg	union drm_amdgpu_gem_create args;
623f012e29Smrg	unsigned heap = alloc_buffer->preferred_heap;
633f012e29Smrg	int r = 0;
643f012e29Smrg
653f012e29Smrg	/* It's an error if the heap is not specified */
663f012e29Smrg	if (!(heap & (AMDGPU_GEM_DOMAIN_GTT | AMDGPU_GEM_DOMAIN_VRAM)))
673f012e29Smrg		return -EINVAL;
683f012e29Smrg
693f012e29Smrg	bo = calloc(1, sizeof(struct amdgpu_bo));
703f012e29Smrg	if (!bo)
713f012e29Smrg		return -ENOMEM;
723f012e29Smrg
733f012e29Smrg	atomic_set(&bo->refcount, 1);
743f012e29Smrg	bo->dev = dev;
753f012e29Smrg	bo->alloc_size = alloc_buffer->alloc_size;
763f012e29Smrg
773f012e29Smrg	memset(&args, 0, sizeof(args));
783f012e29Smrg	args.in.bo_size = alloc_buffer->alloc_size;
793f012e29Smrg	args.in.alignment = alloc_buffer->phys_alignment;
803f012e29Smrg
813f012e29Smrg	/* Set the placement. */
823f012e29Smrg	args.in.domains = heap;
833f012e29Smrg	args.in.domain_flags = alloc_buffer->flags;
843f012e29Smrg
853f012e29Smrg	/* Allocate the buffer with the preferred heap. */
863f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_GEM_CREATE,
873f012e29Smrg				&args, sizeof(args));
883f012e29Smrg	if (r) {
893f012e29Smrg		free(bo);
903f012e29Smrg		return r;
913f012e29Smrg	}
923f012e29Smrg
933f012e29Smrg	bo->handle = args.out.handle;
943f012e29Smrg
953f012e29Smrg	pthread_mutex_init(&bo->cpu_access_mutex, NULL);
963f012e29Smrg
973f012e29Smrg	*buf_handle = bo;
983f012e29Smrg	return 0;
993f012e29Smrg}
1003f012e29Smrg
1013f012e29Smrgint amdgpu_bo_set_metadata(amdgpu_bo_handle bo,
1023f012e29Smrg			   struct amdgpu_bo_metadata *info)
1033f012e29Smrg{
1043f012e29Smrg	struct drm_amdgpu_gem_metadata args = {};
1053f012e29Smrg
1063f012e29Smrg	args.handle = bo->handle;
1073f012e29Smrg	args.op = AMDGPU_GEM_METADATA_OP_SET_METADATA;
1083f012e29Smrg	args.data.flags = info->flags;
1093f012e29Smrg	args.data.tiling_info = info->tiling_info;
1103f012e29Smrg
1113f012e29Smrg	if (info->size_metadata > sizeof(args.data.data))
1123f012e29Smrg		return -EINVAL;
1133f012e29Smrg
1143f012e29Smrg	if (info->size_metadata) {
1153f012e29Smrg		args.data.data_size_bytes = info->size_metadata;
1163f012e29Smrg		memcpy(args.data.data, info->umd_metadata, info->size_metadata);
1173f012e29Smrg	}
1183f012e29Smrg
1193f012e29Smrg	return drmCommandWriteRead(bo->dev->fd,
1203f012e29Smrg				   DRM_AMDGPU_GEM_METADATA,
1213f012e29Smrg				   &args, sizeof(args));
1223f012e29Smrg}
1233f012e29Smrg
1243f012e29Smrgint amdgpu_bo_query_info(amdgpu_bo_handle bo,
1253f012e29Smrg			 struct amdgpu_bo_info *info)
1263f012e29Smrg{
1273f012e29Smrg	struct drm_amdgpu_gem_metadata metadata = {};
1283f012e29Smrg	struct drm_amdgpu_gem_create_in bo_info = {};
1293f012e29Smrg	struct drm_amdgpu_gem_op gem_op = {};
1303f012e29Smrg	int r;
1313f012e29Smrg
1323f012e29Smrg	/* Validate the BO passed in */
1333f012e29Smrg	if (!bo->handle)
1343f012e29Smrg		return -EINVAL;
1353f012e29Smrg
1363f012e29Smrg	/* Query metadata. */
1373f012e29Smrg	metadata.handle = bo->handle;
1383f012e29Smrg	metadata.op = AMDGPU_GEM_METADATA_OP_GET_METADATA;
1393f012e29Smrg
1403f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_METADATA,
1413f012e29Smrg				&metadata, sizeof(metadata));
1423f012e29Smrg	if (r)
1433f012e29Smrg		return r;
1443f012e29Smrg
1453f012e29Smrg	if (metadata.data.data_size_bytes >
1463f012e29Smrg	    sizeof(info->metadata.umd_metadata))
1473f012e29Smrg		return -EINVAL;
1483f012e29Smrg
1493f012e29Smrg	/* Query buffer info. */
1503f012e29Smrg	gem_op.handle = bo->handle;
1513f012e29Smrg	gem_op.op = AMDGPU_GEM_OP_GET_GEM_CREATE_INFO;
1523f012e29Smrg	gem_op.value = (uintptr_t)&bo_info;
1533f012e29Smrg
1543f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_OP,
1553f012e29Smrg				&gem_op, sizeof(gem_op));
1563f012e29Smrg	if (r)
1573f012e29Smrg		return r;
1583f012e29Smrg
1593f012e29Smrg	memset(info, 0, sizeof(*info));
1603f012e29Smrg	info->alloc_size = bo_info.bo_size;
1613f012e29Smrg	info->phys_alignment = bo_info.alignment;
1623f012e29Smrg	info->preferred_heap = bo_info.domains;
1633f012e29Smrg	info->alloc_flags = bo_info.domain_flags;
1643f012e29Smrg	info->metadata.flags = metadata.data.flags;
1653f012e29Smrg	info->metadata.tiling_info = metadata.data.tiling_info;
1663f012e29Smrg
1673f012e29Smrg	info->metadata.size_metadata = metadata.data.data_size_bytes;
1683f012e29Smrg	if (metadata.data.data_size_bytes > 0)
1693f012e29Smrg		memcpy(info->metadata.umd_metadata, metadata.data.data,
1703f012e29Smrg		       metadata.data.data_size_bytes);
1713f012e29Smrg
1723f012e29Smrg	return 0;
1733f012e29Smrg}
1743f012e29Smrg
1753f012e29Smrgstatic void amdgpu_add_handle_to_table(amdgpu_bo_handle bo)
1763f012e29Smrg{
1773f012e29Smrg	pthread_mutex_lock(&bo->dev->bo_table_mutex);
1783f012e29Smrg	util_hash_table_set(bo->dev->bo_handles,
1793f012e29Smrg			    (void*)(uintptr_t)bo->handle, bo);
1803f012e29Smrg	pthread_mutex_unlock(&bo->dev->bo_table_mutex);
1813f012e29Smrg}
1823f012e29Smrg
1833f012e29Smrgstatic int amdgpu_bo_export_flink(amdgpu_bo_handle bo)
1843f012e29Smrg{
1853f012e29Smrg	struct drm_gem_flink flink;
1863f012e29Smrg	int fd, dma_fd;
1873f012e29Smrg	uint32_t handle;
1883f012e29Smrg	int r;
1893f012e29Smrg
1903f012e29Smrg	fd = bo->dev->fd;
1913f012e29Smrg	handle = bo->handle;
1923f012e29Smrg	if (bo->flink_name)
1933f012e29Smrg		return 0;
1943f012e29Smrg
1953f012e29Smrg
1963f012e29Smrg	if (bo->dev->flink_fd != bo->dev->fd) {
1973f012e29Smrg		r = drmPrimeHandleToFD(bo->dev->fd, bo->handle, DRM_CLOEXEC,
1983f012e29Smrg				       &dma_fd);
1993f012e29Smrg		if (!r) {
2003f012e29Smrg			r = drmPrimeFDToHandle(bo->dev->flink_fd, dma_fd, &handle);
2013f012e29Smrg			close(dma_fd);
2023f012e29Smrg		}
2033f012e29Smrg		if (r)
2043f012e29Smrg			return r;
2053f012e29Smrg		fd = bo->dev->flink_fd;
2063f012e29Smrg	}
2073f012e29Smrg	memset(&flink, 0, sizeof(flink));
2083f012e29Smrg	flink.handle = handle;
2093f012e29Smrg
2103f012e29Smrg	r = drmIoctl(fd, DRM_IOCTL_GEM_FLINK, &flink);
2113f012e29Smrg	if (r)
2123f012e29Smrg		return r;
2133f012e29Smrg
2143f012e29Smrg	bo->flink_name = flink.name;
2153f012e29Smrg
2163f012e29Smrg	if (bo->dev->flink_fd != bo->dev->fd) {
2173f012e29Smrg		struct drm_gem_close args = {};
2183f012e29Smrg		args.handle = handle;
2193f012e29Smrg		drmIoctl(bo->dev->flink_fd, DRM_IOCTL_GEM_CLOSE, &args);
2203f012e29Smrg	}
2213f012e29Smrg
2223f012e29Smrg	pthread_mutex_lock(&bo->dev->bo_table_mutex);
2233f012e29Smrg	util_hash_table_set(bo->dev->bo_flink_names,
2243f012e29Smrg			    (void*)(uintptr_t)bo->flink_name,
2253f012e29Smrg			    bo);
2263f012e29Smrg	pthread_mutex_unlock(&bo->dev->bo_table_mutex);
2273f012e29Smrg
2283f012e29Smrg	return 0;
2293f012e29Smrg}
2303f012e29Smrg
2313f012e29Smrgint amdgpu_bo_export(amdgpu_bo_handle bo,
2323f012e29Smrg		     enum amdgpu_bo_handle_type type,
2333f012e29Smrg		     uint32_t *shared_handle)
2343f012e29Smrg{
2353f012e29Smrg	int r;
2363f012e29Smrg
2373f012e29Smrg	switch (type) {
2383f012e29Smrg	case amdgpu_bo_handle_type_gem_flink_name:
2393f012e29Smrg		r = amdgpu_bo_export_flink(bo);
2403f012e29Smrg		if (r)
2413f012e29Smrg			return r;
2423f012e29Smrg
2433f012e29Smrg		*shared_handle = bo->flink_name;
2443f012e29Smrg		return 0;
2453f012e29Smrg
2463f012e29Smrg	case amdgpu_bo_handle_type_kms:
2473f012e29Smrg		amdgpu_add_handle_to_table(bo);
2483f012e29Smrg		*shared_handle = bo->handle;
2493f012e29Smrg		return 0;
2503f012e29Smrg
2513f012e29Smrg	case amdgpu_bo_handle_type_dma_buf_fd:
2523f012e29Smrg		amdgpu_add_handle_to_table(bo);
2533f012e29Smrg		return drmPrimeHandleToFD(bo->dev->fd, bo->handle, DRM_CLOEXEC,
2543f012e29Smrg				       (int*)shared_handle);
2553f012e29Smrg	}
2563f012e29Smrg	return -EINVAL;
2573f012e29Smrg}
2583f012e29Smrg
2593f012e29Smrgint amdgpu_bo_import(amdgpu_device_handle dev,
2603f012e29Smrg		     enum amdgpu_bo_handle_type type,
2613f012e29Smrg		     uint32_t shared_handle,
2623f012e29Smrg		     struct amdgpu_bo_import_result *output)
2633f012e29Smrg{
2643f012e29Smrg	struct drm_gem_open open_arg = {};
2653f012e29Smrg	struct amdgpu_bo *bo = NULL;
2663f012e29Smrg	int r;
2673f012e29Smrg	int dma_fd;
2683f012e29Smrg	uint64_t dma_buf_size = 0;
2693f012e29Smrg
2703f012e29Smrg	/* We must maintain a list of pairs <handle, bo>, so that we always
2713f012e29Smrg	 * return the same amdgpu_bo instance for the same handle. */
2723f012e29Smrg	pthread_mutex_lock(&dev->bo_table_mutex);
2733f012e29Smrg
2743f012e29Smrg	/* Convert a DMA buf handle to a KMS handle now. */
2753f012e29Smrg	if (type == amdgpu_bo_handle_type_dma_buf_fd) {
2763f012e29Smrg		uint32_t handle;
2773f012e29Smrg		off_t size;
2783f012e29Smrg
2793f012e29Smrg		/* Get a KMS handle. */
2803f012e29Smrg		r = drmPrimeFDToHandle(dev->fd, shared_handle, &handle);
2813f012e29Smrg		if (r) {
282d8807b2fSmrg			pthread_mutex_unlock(&dev->bo_table_mutex);
2833f012e29Smrg			return r;
2843f012e29Smrg		}
2853f012e29Smrg
2863f012e29Smrg		/* Query the buffer size. */
2873f012e29Smrg		size = lseek(shared_handle, 0, SEEK_END);
2883f012e29Smrg		if (size == (off_t)-1) {
2893f012e29Smrg			pthread_mutex_unlock(&dev->bo_table_mutex);
2903f012e29Smrg			amdgpu_close_kms_handle(dev, handle);
2913f012e29Smrg			return -errno;
2923f012e29Smrg		}
2933f012e29Smrg		lseek(shared_handle, 0, SEEK_SET);
2943f012e29Smrg
2953f012e29Smrg		dma_buf_size = size;
2963f012e29Smrg		shared_handle = handle;
2973f012e29Smrg	}
2983f012e29Smrg
2993f012e29Smrg	/* If we have already created a buffer with this handle, find it. */
3003f012e29Smrg	switch (type) {
3013f012e29Smrg	case amdgpu_bo_handle_type_gem_flink_name:
3023f012e29Smrg		bo = util_hash_table_get(dev->bo_flink_names,
3033f012e29Smrg					 (void*)(uintptr_t)shared_handle);
3043f012e29Smrg		break;
3053f012e29Smrg
3063f012e29Smrg	case amdgpu_bo_handle_type_dma_buf_fd:
3073f012e29Smrg		bo = util_hash_table_get(dev->bo_handles,
3083f012e29Smrg					 (void*)(uintptr_t)shared_handle);
3093f012e29Smrg		break;
3103f012e29Smrg
3113f012e29Smrg	case amdgpu_bo_handle_type_kms:
3123f012e29Smrg		/* Importing a KMS handle in not allowed. */
3133f012e29Smrg		pthread_mutex_unlock(&dev->bo_table_mutex);
3143f012e29Smrg		return -EPERM;
3153f012e29Smrg
3163f012e29Smrg	default:
3173f012e29Smrg		pthread_mutex_unlock(&dev->bo_table_mutex);
3183f012e29Smrg		return -EINVAL;
3193f012e29Smrg	}
3203f012e29Smrg
3213f012e29Smrg	if (bo) {
3223f012e29Smrg		/* The buffer already exists, just bump the refcount. */
3233f012e29Smrg		atomic_inc(&bo->refcount);
324d8807b2fSmrg		pthread_mutex_unlock(&dev->bo_table_mutex);
3253f012e29Smrg
3263f012e29Smrg		output->buf_handle = bo;
3273f012e29Smrg		output->alloc_size = bo->alloc_size;
3283f012e29Smrg		return 0;
3293f012e29Smrg	}
3303f012e29Smrg
3313f012e29Smrg	bo = calloc(1, sizeof(struct amdgpu_bo));
3323f012e29Smrg	if (!bo) {
3333f012e29Smrg		pthread_mutex_unlock(&dev->bo_table_mutex);
3343f012e29Smrg		if (type == amdgpu_bo_handle_type_dma_buf_fd) {
3353f012e29Smrg			amdgpu_close_kms_handle(dev, shared_handle);
3363f012e29Smrg		}
3373f012e29Smrg		return -ENOMEM;
3383f012e29Smrg	}
3393f012e29Smrg
3403f012e29Smrg	/* Open the handle. */
3413f012e29Smrg	switch (type) {
3423f012e29Smrg	case amdgpu_bo_handle_type_gem_flink_name:
3433f012e29Smrg		open_arg.name = shared_handle;
3443f012e29Smrg		r = drmIoctl(dev->flink_fd, DRM_IOCTL_GEM_OPEN, &open_arg);
3453f012e29Smrg		if (r) {
3463f012e29Smrg			free(bo);
3473f012e29Smrg			pthread_mutex_unlock(&dev->bo_table_mutex);
3483f012e29Smrg			return r;
3493f012e29Smrg		}
3503f012e29Smrg
3513f012e29Smrg		bo->handle = open_arg.handle;
3523f012e29Smrg		if (dev->flink_fd != dev->fd) {
3533f012e29Smrg			r = drmPrimeHandleToFD(dev->flink_fd, bo->handle, DRM_CLOEXEC, &dma_fd);
3543f012e29Smrg			if (r) {
3553f012e29Smrg				free(bo);
3563f012e29Smrg				pthread_mutex_unlock(&dev->bo_table_mutex);
3573f012e29Smrg				return r;
3583f012e29Smrg			}
3593f012e29Smrg			r = drmPrimeFDToHandle(dev->fd, dma_fd, &bo->handle );
3603f012e29Smrg
3613f012e29Smrg			close(dma_fd);
3623f012e29Smrg
3633f012e29Smrg			if (r) {
3643f012e29Smrg				free(bo);
3653f012e29Smrg				pthread_mutex_unlock(&dev->bo_table_mutex);
3663f012e29Smrg				return r;
3673f012e29Smrg			}
3683f012e29Smrg		}
3693f012e29Smrg		bo->flink_name = shared_handle;
3703f012e29Smrg		bo->alloc_size = open_arg.size;
3713f012e29Smrg		util_hash_table_set(dev->bo_flink_names,
3723f012e29Smrg				    (void*)(uintptr_t)bo->flink_name, bo);
3733f012e29Smrg		break;
3743f012e29Smrg
3753f012e29Smrg	case amdgpu_bo_handle_type_dma_buf_fd:
3763f012e29Smrg		bo->handle = shared_handle;
3773f012e29Smrg		bo->alloc_size = dma_buf_size;
3783f012e29Smrg		break;
3793f012e29Smrg
3803f012e29Smrg	case amdgpu_bo_handle_type_kms:
3813f012e29Smrg		assert(0); /* unreachable */
3823f012e29Smrg	}
3833f012e29Smrg
3843f012e29Smrg	/* Initialize it. */
3853f012e29Smrg	atomic_set(&bo->refcount, 1);
3863f012e29Smrg	bo->dev = dev;
3873f012e29Smrg	pthread_mutex_init(&bo->cpu_access_mutex, NULL);
3883f012e29Smrg
3893f012e29Smrg	util_hash_table_set(dev->bo_handles, (void*)(uintptr_t)bo->handle, bo);
3903f012e29Smrg	pthread_mutex_unlock(&dev->bo_table_mutex);
3913f012e29Smrg
3923f012e29Smrg	output->buf_handle = bo;
3933f012e29Smrg	output->alloc_size = bo->alloc_size;
3943f012e29Smrg	return 0;
3953f012e29Smrg}
3963f012e29Smrg
3973f012e29Smrgint amdgpu_bo_free(amdgpu_bo_handle buf_handle)
3983f012e29Smrg{
399d8807b2fSmrg	struct amdgpu_device *dev;
400d8807b2fSmrg	struct amdgpu_bo *bo = buf_handle;
401d8807b2fSmrg
402d8807b2fSmrg	assert(bo != NULL);
403d8807b2fSmrg	dev = bo->dev;
404d8807b2fSmrg	pthread_mutex_lock(&dev->bo_table_mutex);
405d8807b2fSmrg
406d8807b2fSmrg	if (update_references(&bo->refcount, NULL)) {
407d8807b2fSmrg		/* Remove the buffer from the hash tables. */
408d8807b2fSmrg		util_hash_table_remove(dev->bo_handles,
409d8807b2fSmrg					(void*)(uintptr_t)bo->handle);
410d8807b2fSmrg
411d8807b2fSmrg		if (bo->flink_name) {
412d8807b2fSmrg			util_hash_table_remove(dev->bo_flink_names,
413d8807b2fSmrg						(void*)(uintptr_t)bo->flink_name);
414d8807b2fSmrg		}
415d8807b2fSmrg
416d8807b2fSmrg		/* Release CPU access. */
417d8807b2fSmrg		if (bo->cpu_map_count > 0) {
418d8807b2fSmrg			bo->cpu_map_count = 1;
419d8807b2fSmrg			amdgpu_bo_cpu_unmap(bo);
420d8807b2fSmrg		}
421d8807b2fSmrg
422d8807b2fSmrg		amdgpu_close_kms_handle(dev, bo->handle);
423d8807b2fSmrg		pthread_mutex_destroy(&bo->cpu_access_mutex);
424d8807b2fSmrg		free(bo);
425d8807b2fSmrg	}
426d8807b2fSmrg
427d8807b2fSmrg	pthread_mutex_unlock(&dev->bo_table_mutex);
4283f012e29Smrg	return 0;
4293f012e29Smrg}
4303f012e29Smrg
4313f012e29Smrgint amdgpu_bo_cpu_map(amdgpu_bo_handle bo, void **cpu)
4323f012e29Smrg{
4333f012e29Smrg	union drm_amdgpu_gem_mmap args;
4343f012e29Smrg	void *ptr;
4353f012e29Smrg	int r;
4363f012e29Smrg
4373f012e29Smrg	pthread_mutex_lock(&bo->cpu_access_mutex);
4383f012e29Smrg
4393f012e29Smrg	if (bo->cpu_ptr) {
4403f012e29Smrg		/* already mapped */
4413f012e29Smrg		assert(bo->cpu_map_count > 0);
4423f012e29Smrg		bo->cpu_map_count++;
4433f012e29Smrg		*cpu = bo->cpu_ptr;
4443f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4453f012e29Smrg		return 0;
4463f012e29Smrg	}
4473f012e29Smrg
4483f012e29Smrg	assert(bo->cpu_map_count == 0);
4493f012e29Smrg
4503f012e29Smrg	memset(&args, 0, sizeof(args));
4513f012e29Smrg
4523f012e29Smrg	/* Query the buffer address (args.addr_ptr).
4533f012e29Smrg	 * The kernel driver ignores the offset and size parameters. */
4543f012e29Smrg	args.in.handle = bo->handle;
4553f012e29Smrg
4563f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_MMAP, &args,
4573f012e29Smrg				sizeof(args));
4583f012e29Smrg	if (r) {
4593f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4603f012e29Smrg		return r;
4613f012e29Smrg	}
4623f012e29Smrg
4633f012e29Smrg	/* Map the buffer. */
4643f012e29Smrg	ptr = drm_mmap(NULL, bo->alloc_size, PROT_READ | PROT_WRITE, MAP_SHARED,
4653f012e29Smrg		       bo->dev->fd, args.out.addr_ptr);
4663f012e29Smrg	if (ptr == MAP_FAILED) {
4673f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4683f012e29Smrg		return -errno;
4693f012e29Smrg	}
4703f012e29Smrg
4713f012e29Smrg	bo->cpu_ptr = ptr;
4723f012e29Smrg	bo->cpu_map_count = 1;
4733f012e29Smrg	pthread_mutex_unlock(&bo->cpu_access_mutex);
4743f012e29Smrg
4753f012e29Smrg	*cpu = ptr;
4763f012e29Smrg	return 0;
4773f012e29Smrg}
4783f012e29Smrg
4793f012e29Smrgint amdgpu_bo_cpu_unmap(amdgpu_bo_handle bo)
4803f012e29Smrg{
4813f012e29Smrg	int r;
4823f012e29Smrg
4833f012e29Smrg	pthread_mutex_lock(&bo->cpu_access_mutex);
4843f012e29Smrg	assert(bo->cpu_map_count >= 0);
4853f012e29Smrg
4863f012e29Smrg	if (bo->cpu_map_count == 0) {
4873f012e29Smrg		/* not mapped */
4883f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4893f012e29Smrg		return -EINVAL;
4903f012e29Smrg	}
4913f012e29Smrg
4923f012e29Smrg	bo->cpu_map_count--;
4933f012e29Smrg	if (bo->cpu_map_count > 0) {
4943f012e29Smrg		/* mapped multiple times */
4953f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4963f012e29Smrg		return 0;
4973f012e29Smrg	}
4983f012e29Smrg
4993f012e29Smrg	r = drm_munmap(bo->cpu_ptr, bo->alloc_size) == 0 ? 0 : -errno;
5003f012e29Smrg	bo->cpu_ptr = NULL;
5013f012e29Smrg	pthread_mutex_unlock(&bo->cpu_access_mutex);
5023f012e29Smrg	return r;
5033f012e29Smrg}
5043f012e29Smrg
5053f012e29Smrgint amdgpu_query_buffer_size_alignment(amdgpu_device_handle dev,
5063f012e29Smrg				struct amdgpu_buffer_size_alignments *info)
5073f012e29Smrg{
5083f012e29Smrg	info->size_local = dev->dev_info.pte_fragment_size;
5093f012e29Smrg	info->size_remote = dev->dev_info.gart_page_size;
5103f012e29Smrg	return 0;
5113f012e29Smrg}
5123f012e29Smrg
5133f012e29Smrgint amdgpu_bo_wait_for_idle(amdgpu_bo_handle bo,
5143f012e29Smrg			    uint64_t timeout_ns,
5153f012e29Smrg			    bool *busy)
5163f012e29Smrg{
5173f012e29Smrg	union drm_amdgpu_gem_wait_idle args;
5183f012e29Smrg	int r;
5193f012e29Smrg
5203f012e29Smrg	memset(&args, 0, sizeof(args));
5213f012e29Smrg	args.in.handle = bo->handle;
5223f012e29Smrg	args.in.timeout = amdgpu_cs_calculate_timeout(timeout_ns);
5233f012e29Smrg
5243f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_WAIT_IDLE,
5253f012e29Smrg				&args, sizeof(args));
5263f012e29Smrg
5273f012e29Smrg	if (r == 0) {
5283f012e29Smrg		*busy = args.out.status;
5293f012e29Smrg		return 0;
5303f012e29Smrg	} else {
5313f012e29Smrg		fprintf(stderr, "amdgpu: GEM_WAIT_IDLE failed with %i\n", r);
5323f012e29Smrg		return r;
5333f012e29Smrg	}
5343f012e29Smrg}
5353f012e29Smrg
5363f012e29Smrgint amdgpu_create_bo_from_user_mem(amdgpu_device_handle dev,
5373f012e29Smrg				    void *cpu,
5383f012e29Smrg				    uint64_t size,
5393f012e29Smrg				    amdgpu_bo_handle *buf_handle)
5403f012e29Smrg{
5413f012e29Smrg	int r;
5423f012e29Smrg	struct amdgpu_bo *bo;
5433f012e29Smrg	struct drm_amdgpu_gem_userptr args;
5443f012e29Smrg
5453f012e29Smrg	args.addr = (uintptr_t)cpu;
5463f012e29Smrg	args.flags = AMDGPU_GEM_USERPTR_ANONONLY | AMDGPU_GEM_USERPTR_REGISTER |
5473f012e29Smrg		AMDGPU_GEM_USERPTR_VALIDATE;
5483f012e29Smrg	args.size = size;
5493f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_GEM_USERPTR,
5503f012e29Smrg				&args, sizeof(args));
5513f012e29Smrg	if (r)
5523f012e29Smrg		return r;
5533f012e29Smrg
5543f012e29Smrg	bo = calloc(1, sizeof(struct amdgpu_bo));
5553f012e29Smrg	if (!bo)
5563f012e29Smrg		return -ENOMEM;
5573f012e29Smrg
5583f012e29Smrg	atomic_set(&bo->refcount, 1);
5593f012e29Smrg	bo->dev = dev;
5603f012e29Smrg	bo->alloc_size = size;
5613f012e29Smrg	bo->handle = args.handle;
5623f012e29Smrg
5633f012e29Smrg	*buf_handle = bo;
5643f012e29Smrg
5653f012e29Smrg	return r;
5663f012e29Smrg}
5673f012e29Smrg
5683f012e29Smrgint amdgpu_bo_list_create(amdgpu_device_handle dev,
5693f012e29Smrg			  uint32_t number_of_resources,
5703f012e29Smrg			  amdgpu_bo_handle *resources,
5713f012e29Smrg			  uint8_t *resource_prios,
5723f012e29Smrg			  amdgpu_bo_list_handle *result)
5733f012e29Smrg{
5743f012e29Smrg	struct drm_amdgpu_bo_list_entry *list;
5753f012e29Smrg	union drm_amdgpu_bo_list args;
5763f012e29Smrg	unsigned i;
5773f012e29Smrg	int r;
5783f012e29Smrg
5793f012e29Smrg	if (!number_of_resources)
5803f012e29Smrg		return -EINVAL;
5813f012e29Smrg
5823f012e29Smrg	/* overflow check for multiplication */
5833f012e29Smrg	if (number_of_resources > UINT32_MAX / sizeof(struct drm_amdgpu_bo_list_entry))
5843f012e29Smrg		return -EINVAL;
5853f012e29Smrg
5863f012e29Smrg	list = malloc(number_of_resources * sizeof(struct drm_amdgpu_bo_list_entry));
5873f012e29Smrg	if (!list)
5883f012e29Smrg		return -ENOMEM;
5893f012e29Smrg
5903f012e29Smrg	*result = malloc(sizeof(struct amdgpu_bo_list));
5913f012e29Smrg	if (!*result) {
5923f012e29Smrg		free(list);
5933f012e29Smrg		return -ENOMEM;
5943f012e29Smrg	}
5953f012e29Smrg
5963f012e29Smrg	memset(&args, 0, sizeof(args));
5973f012e29Smrg	args.in.operation = AMDGPU_BO_LIST_OP_CREATE;
5983f012e29Smrg	args.in.bo_number = number_of_resources;
5993f012e29Smrg	args.in.bo_info_size = sizeof(struct drm_amdgpu_bo_list_entry);
6003f012e29Smrg	args.in.bo_info_ptr = (uint64_t)(uintptr_t)list;
6013f012e29Smrg
6023f012e29Smrg	for (i = 0; i < number_of_resources; i++) {
6033f012e29Smrg		list[i].bo_handle = resources[i]->handle;
6043f012e29Smrg		if (resource_prios)
6053f012e29Smrg			list[i].bo_priority = resource_prios[i];
6063f012e29Smrg		else
6073f012e29Smrg			list[i].bo_priority = 0;
6083f012e29Smrg	}
6093f012e29Smrg
6103f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_BO_LIST,
6113f012e29Smrg				&args, sizeof(args));
6123f012e29Smrg	free(list);
6133f012e29Smrg	if (r) {
6143f012e29Smrg		free(*result);
6153f012e29Smrg		return r;
6163f012e29Smrg	}
6173f012e29Smrg
6183f012e29Smrg	(*result)->dev = dev;
6193f012e29Smrg	(*result)->handle = args.out.list_handle;
6203f012e29Smrg	return 0;
6213f012e29Smrg}
6223f012e29Smrg
6233f012e29Smrgint amdgpu_bo_list_destroy(amdgpu_bo_list_handle list)
6243f012e29Smrg{
6253f012e29Smrg	union drm_amdgpu_bo_list args;
6263f012e29Smrg	int r;
6273f012e29Smrg
6283f012e29Smrg	memset(&args, 0, sizeof(args));
6293f012e29Smrg	args.in.operation = AMDGPU_BO_LIST_OP_DESTROY;
6303f012e29Smrg	args.in.list_handle = list->handle;
6313f012e29Smrg
6323f012e29Smrg	r = drmCommandWriteRead(list->dev->fd, DRM_AMDGPU_BO_LIST,
6333f012e29Smrg				&args, sizeof(args));
6343f012e29Smrg
6353f012e29Smrg	if (!r)
6363f012e29Smrg		free(list);
6373f012e29Smrg
6383f012e29Smrg	return r;
6393f012e29Smrg}
6403f012e29Smrg
6413f012e29Smrgint amdgpu_bo_list_update(amdgpu_bo_list_handle handle,
6423f012e29Smrg			  uint32_t number_of_resources,
6433f012e29Smrg			  amdgpu_bo_handle *resources,
6443f012e29Smrg			  uint8_t *resource_prios)
6453f012e29Smrg{
6463f012e29Smrg	struct drm_amdgpu_bo_list_entry *list;
6473f012e29Smrg	union drm_amdgpu_bo_list args;
6483f012e29Smrg	unsigned i;
6493f012e29Smrg	int r;
6503f012e29Smrg
6513f012e29Smrg	if (!number_of_resources)
6523f012e29Smrg		return -EINVAL;
6533f012e29Smrg
6543f012e29Smrg	/* overflow check for multiplication */
6553f012e29Smrg	if (number_of_resources > UINT32_MAX / sizeof(struct drm_amdgpu_bo_list_entry))
6563f012e29Smrg		return -EINVAL;
6573f012e29Smrg
6583f012e29Smrg	list = malloc(number_of_resources * sizeof(struct drm_amdgpu_bo_list_entry));
659d8807b2fSmrg	if (!list)
6603f012e29Smrg		return -ENOMEM;
6613f012e29Smrg
6623f012e29Smrg	args.in.operation = AMDGPU_BO_LIST_OP_UPDATE;
6633f012e29Smrg	args.in.list_handle = handle->handle;
6643f012e29Smrg	args.in.bo_number = number_of_resources;
6653f012e29Smrg	args.in.bo_info_size = sizeof(struct drm_amdgpu_bo_list_entry);
6663f012e29Smrg	args.in.bo_info_ptr = (uintptr_t)list;
6673f012e29Smrg
6683f012e29Smrg	for (i = 0; i < number_of_resources; i++) {
6693f012e29Smrg		list[i].bo_handle = resources[i]->handle;
6703f012e29Smrg		if (resource_prios)
6713f012e29Smrg			list[i].bo_priority = resource_prios[i];
6723f012e29Smrg		else
6733f012e29Smrg			list[i].bo_priority = 0;
6743f012e29Smrg	}
6753f012e29Smrg
6763f012e29Smrg	r = drmCommandWriteRead(handle->dev->fd, DRM_AMDGPU_BO_LIST,
6773f012e29Smrg				&args, sizeof(args));
6783f012e29Smrg	free(list);
6793f012e29Smrg	return r;
6803f012e29Smrg}
6813f012e29Smrg
6823f012e29Smrgint amdgpu_bo_va_op(amdgpu_bo_handle bo,
6833f012e29Smrg		     uint64_t offset,
6843f012e29Smrg		     uint64_t size,
6853f012e29Smrg		     uint64_t addr,
6863f012e29Smrg		     uint64_t flags,
6873f012e29Smrg		     uint32_t ops)
6883f012e29Smrg{
6893f012e29Smrg	amdgpu_device_handle dev = bo->dev;
690d8807b2fSmrg
691d8807b2fSmrg	size = ALIGN(size, getpagesize());
692d8807b2fSmrg
693d8807b2fSmrg	return amdgpu_bo_va_op_raw(dev, bo, offset, size, addr,
694d8807b2fSmrg				   AMDGPU_VM_PAGE_READABLE |
695d8807b2fSmrg				   AMDGPU_VM_PAGE_WRITEABLE |
696d8807b2fSmrg				   AMDGPU_VM_PAGE_EXECUTABLE, ops);
697d8807b2fSmrg}
698d8807b2fSmrg
699d8807b2fSmrgint amdgpu_bo_va_op_raw(amdgpu_device_handle dev,
700d8807b2fSmrg			amdgpu_bo_handle bo,
701d8807b2fSmrg			uint64_t offset,
702d8807b2fSmrg			uint64_t size,
703d8807b2fSmrg			uint64_t addr,
704d8807b2fSmrg			uint64_t flags,
705d8807b2fSmrg			uint32_t ops)
706d8807b2fSmrg{
7073f012e29Smrg	struct drm_amdgpu_gem_va va;
7083f012e29Smrg	int r;
7093f012e29Smrg
710d8807b2fSmrg	if (ops != AMDGPU_VA_OP_MAP && ops != AMDGPU_VA_OP_UNMAP &&
711d8807b2fSmrg	    ops != AMDGPU_VA_OP_REPLACE && ops != AMDGPU_VA_OP_CLEAR)
7123f012e29Smrg		return -EINVAL;
7133f012e29Smrg
7143f012e29Smrg	memset(&va, 0, sizeof(va));
715d8807b2fSmrg	va.handle = bo ? bo->handle : 0;
7163f012e29Smrg	va.operation = ops;
717d8807b2fSmrg	va.flags = flags;
7183f012e29Smrg	va.va_address = addr;
7193f012e29Smrg	va.offset_in_bo = offset;
720d8807b2fSmrg	va.map_size = size;
7213f012e29Smrg
7223f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_GEM_VA, &va, sizeof(va));
7233f012e29Smrg
7243f012e29Smrg	return r;
7253f012e29Smrg}
726