13f012e29Smrg/*
23f012e29Smrg * Copyright © 2014 Advanced Micro Devices, Inc.
33f012e29Smrg * All Rights Reserved.
43f012e29Smrg *
53f012e29Smrg * Permission is hereby granted, free of charge, to any person obtaining a
63f012e29Smrg * copy of this software and associated documentation files (the "Software"),
73f012e29Smrg * to deal in the Software without restriction, including without limitation
83f012e29Smrg * the rights to use, copy, modify, merge, publish, distribute, sublicense,
93f012e29Smrg * and/or sell copies of the Software, and to permit persons to whom the
103f012e29Smrg * Software is furnished to do so, subject to the following conditions:
113f012e29Smrg *
123f012e29Smrg * The above copyright notice and this permission notice shall be included in
133f012e29Smrg * all copies or substantial portions of the Software.
143f012e29Smrg *
153f012e29Smrg * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
163f012e29Smrg * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
173f012e29Smrg * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
183f012e29Smrg * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
193f012e29Smrg * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
203f012e29Smrg * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
213f012e29Smrg * OTHER DEALINGS IN THE SOFTWARE.
223f012e29Smrg *
233f012e29Smrg */
243f012e29Smrg
253f012e29Smrg#include <stdlib.h>
263f012e29Smrg#include <stdio.h>
273f012e29Smrg#include <stdint.h>
283f012e29Smrg#include <string.h>
293f012e29Smrg#include <errno.h>
303f012e29Smrg#include <fcntl.h>
313f012e29Smrg#include <unistd.h>
323f012e29Smrg#include <sys/ioctl.h>
333f012e29Smrg#include <sys/mman.h>
343f012e29Smrg#include <sys/time.h>
353f012e29Smrg
363f012e29Smrg#include "libdrm_macros.h"
373f012e29Smrg#include "xf86drm.h"
383f012e29Smrg#include "amdgpu_drm.h"
393f012e29Smrg#include "amdgpu_internal.h"
403f012e29Smrg#include "util_math.h"
413f012e29Smrg
427cdc0497Smrgstatic int amdgpu_bo_create(amdgpu_device_handle dev,
437cdc0497Smrg			    uint64_t size,
447cdc0497Smrg			    uint32_t handle,
457cdc0497Smrg			    amdgpu_bo_handle *buf_handle)
463f012e29Smrg{
473f012e29Smrg	struct amdgpu_bo *bo;
48bf6cc7dcSmrg	int r;
493f012e29Smrg
503f012e29Smrg	bo = calloc(1, sizeof(struct amdgpu_bo));
513f012e29Smrg	if (!bo)
523f012e29Smrg		return -ENOMEM;
533f012e29Smrg
54bf6cc7dcSmrg	r = handle_table_insert(&dev->bo_handles, handle, bo);
55bf6cc7dcSmrg	if (r) {
56bf6cc7dcSmrg		free(bo);
57bf6cc7dcSmrg		return r;
58bf6cc7dcSmrg	}
59bf6cc7dcSmrg
603f012e29Smrg	atomic_set(&bo->refcount, 1);
613f012e29Smrg	bo->dev = dev;
627cdc0497Smrg	bo->alloc_size = size;
637cdc0497Smrg	bo->handle = handle;
647cdc0497Smrg	pthread_mutex_init(&bo->cpu_access_mutex, NULL);
657cdc0497Smrg
667cdc0497Smrg	*buf_handle = bo;
677cdc0497Smrg	return 0;
687cdc0497Smrg}
697cdc0497Smrg
707cdc0497Smrgdrm_public int amdgpu_bo_alloc(amdgpu_device_handle dev,
717cdc0497Smrg			       struct amdgpu_bo_alloc_request *alloc_buffer,
727cdc0497Smrg			       amdgpu_bo_handle *buf_handle)
737cdc0497Smrg{
747cdc0497Smrg	union drm_amdgpu_gem_create args;
757cdc0497Smrg	int r;
763f012e29Smrg
773f012e29Smrg	memset(&args, 0, sizeof(args));
783f012e29Smrg	args.in.bo_size = alloc_buffer->alloc_size;
793f012e29Smrg	args.in.alignment = alloc_buffer->phys_alignment;
803f012e29Smrg
813f012e29Smrg	/* Set the placement. */
827cdc0497Smrg	args.in.domains = alloc_buffer->preferred_heap;
833f012e29Smrg	args.in.domain_flags = alloc_buffer->flags;
843f012e29Smrg
853f012e29Smrg	/* Allocate the buffer with the preferred heap. */
863f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_GEM_CREATE,
873f012e29Smrg				&args, sizeof(args));
887cdc0497Smrg	if (r)
897cdc0497Smrg		goto out;
907cdc0497Smrg
91bf6cc7dcSmrg	pthread_mutex_lock(&dev->bo_table_mutex);
927cdc0497Smrg	r = amdgpu_bo_create(dev, alloc_buffer->alloc_size, args.out.handle,
937cdc0497Smrg			     buf_handle);
94bf6cc7dcSmrg	pthread_mutex_unlock(&dev->bo_table_mutex);
953f012e29Smrg	if (r) {
96adfa0b0cSmrg		drmCloseBufferHandle(dev->fd, args.out.handle);
973f012e29Smrg	}
983f012e29Smrg
997cdc0497Smrgout:
1007cdc0497Smrg	return r;
1013f012e29Smrg}
1023f012e29Smrg
1037cdc0497Smrgdrm_public int amdgpu_bo_set_metadata(amdgpu_bo_handle bo,
1047cdc0497Smrg				      struct amdgpu_bo_metadata *info)
1053f012e29Smrg{
1063f012e29Smrg	struct drm_amdgpu_gem_metadata args = {};
1073f012e29Smrg
1083f012e29Smrg	args.handle = bo->handle;
1093f012e29Smrg	args.op = AMDGPU_GEM_METADATA_OP_SET_METADATA;
1103f012e29Smrg	args.data.flags = info->flags;
1113f012e29Smrg	args.data.tiling_info = info->tiling_info;
1123f012e29Smrg
1133f012e29Smrg	if (info->size_metadata > sizeof(args.data.data))
1143f012e29Smrg		return -EINVAL;
1153f012e29Smrg
1163f012e29Smrg	if (info->size_metadata) {
1173f012e29Smrg		args.data.data_size_bytes = info->size_metadata;
1183f012e29Smrg		memcpy(args.data.data, info->umd_metadata, info->size_metadata);
1193f012e29Smrg	}
1203f012e29Smrg
1213f012e29Smrg	return drmCommandWriteRead(bo->dev->fd,
1223f012e29Smrg				   DRM_AMDGPU_GEM_METADATA,
1233f012e29Smrg				   &args, sizeof(args));
1243f012e29Smrg}
1253f012e29Smrg
1267cdc0497Smrgdrm_public int amdgpu_bo_query_info(amdgpu_bo_handle bo,
1277cdc0497Smrg				    struct amdgpu_bo_info *info)
1283f012e29Smrg{
1293f012e29Smrg	struct drm_amdgpu_gem_metadata metadata = {};
1303f012e29Smrg	struct drm_amdgpu_gem_create_in bo_info = {};
1313f012e29Smrg	struct drm_amdgpu_gem_op gem_op = {};
1323f012e29Smrg	int r;
1333f012e29Smrg
1343f012e29Smrg	/* Validate the BO passed in */
1353f012e29Smrg	if (!bo->handle)
1363f012e29Smrg		return -EINVAL;
1373f012e29Smrg
1383f012e29Smrg	/* Query metadata. */
1393f012e29Smrg	metadata.handle = bo->handle;
1403f012e29Smrg	metadata.op = AMDGPU_GEM_METADATA_OP_GET_METADATA;
1413f012e29Smrg
1423f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_METADATA,
1433f012e29Smrg				&metadata, sizeof(metadata));
1443f012e29Smrg	if (r)
1453f012e29Smrg		return r;
1463f012e29Smrg
1473f012e29Smrg	if (metadata.data.data_size_bytes >
1483f012e29Smrg	    sizeof(info->metadata.umd_metadata))
1493f012e29Smrg		return -EINVAL;
1503f012e29Smrg
1513f012e29Smrg	/* Query buffer info. */
1523f012e29Smrg	gem_op.handle = bo->handle;
1533f012e29Smrg	gem_op.op = AMDGPU_GEM_OP_GET_GEM_CREATE_INFO;
1543f012e29Smrg	gem_op.value = (uintptr_t)&bo_info;
1553f012e29Smrg
1563f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_OP,
1573f012e29Smrg				&gem_op, sizeof(gem_op));
1583f012e29Smrg	if (r)
1593f012e29Smrg		return r;
1603f012e29Smrg
1613f012e29Smrg	memset(info, 0, sizeof(*info));
1623f012e29Smrg	info->alloc_size = bo_info.bo_size;
1633f012e29Smrg	info->phys_alignment = bo_info.alignment;
1643f012e29Smrg	info->preferred_heap = bo_info.domains;
1653f012e29Smrg	info->alloc_flags = bo_info.domain_flags;
1663f012e29Smrg	info->metadata.flags = metadata.data.flags;
1673f012e29Smrg	info->metadata.tiling_info = metadata.data.tiling_info;
1683f012e29Smrg
1693f012e29Smrg	info->metadata.size_metadata = metadata.data.data_size_bytes;
1703f012e29Smrg	if (metadata.data.data_size_bytes > 0)
1713f012e29Smrg		memcpy(info->metadata.umd_metadata, metadata.data.data,
1723f012e29Smrg		       metadata.data.data_size_bytes);
1733f012e29Smrg
1743f012e29Smrg	return 0;
1753f012e29Smrg}
1763f012e29Smrg
1773f012e29Smrgstatic int amdgpu_bo_export_flink(amdgpu_bo_handle bo)
1783f012e29Smrg{
1793f012e29Smrg	struct drm_gem_flink flink;
1803f012e29Smrg	int fd, dma_fd;
1813f012e29Smrg	uint32_t handle;
1823f012e29Smrg	int r;
1833f012e29Smrg
1843f012e29Smrg	fd = bo->dev->fd;
1853f012e29Smrg	handle = bo->handle;
1863f012e29Smrg	if (bo->flink_name)
1873f012e29Smrg		return 0;
1883f012e29Smrg
1893f012e29Smrg
1903f012e29Smrg	if (bo->dev->flink_fd != bo->dev->fd) {
1913f012e29Smrg		r = drmPrimeHandleToFD(bo->dev->fd, bo->handle, DRM_CLOEXEC,
1923f012e29Smrg				       &dma_fd);
1933f012e29Smrg		if (!r) {
1943f012e29Smrg			r = drmPrimeFDToHandle(bo->dev->flink_fd, dma_fd, &handle);
1953f012e29Smrg			close(dma_fd);
1963f012e29Smrg		}
1973f012e29Smrg		if (r)
1983f012e29Smrg			return r;
1993f012e29Smrg		fd = bo->dev->flink_fd;
2003f012e29Smrg	}
2013f012e29Smrg	memset(&flink, 0, sizeof(flink));
2023f012e29Smrg	flink.handle = handle;
2033f012e29Smrg
2043f012e29Smrg	r = drmIoctl(fd, DRM_IOCTL_GEM_FLINK, &flink);
2053f012e29Smrg	if (r)
2063f012e29Smrg		return r;
2073f012e29Smrg
2083f012e29Smrg	bo->flink_name = flink.name;
2093f012e29Smrg
210bf6cc7dcSmrg	if (bo->dev->flink_fd != bo->dev->fd)
211adfa0b0cSmrg		drmCloseBufferHandle(bo->dev->flink_fd, handle);
2123f012e29Smrg
2133f012e29Smrg	pthread_mutex_lock(&bo->dev->bo_table_mutex);
2147cdc0497Smrg	r = handle_table_insert(&bo->dev->bo_flink_names, bo->flink_name, bo);
2153f012e29Smrg	pthread_mutex_unlock(&bo->dev->bo_table_mutex);
2163f012e29Smrg
2177cdc0497Smrg	return r;
2183f012e29Smrg}
2193f012e29Smrg
2207cdc0497Smrgdrm_public int amdgpu_bo_export(amdgpu_bo_handle bo,
2217cdc0497Smrg				enum amdgpu_bo_handle_type type,
2227cdc0497Smrg				uint32_t *shared_handle)
2233f012e29Smrg{
2243f012e29Smrg	int r;
2253f012e29Smrg
2263f012e29Smrg	switch (type) {
2273f012e29Smrg	case amdgpu_bo_handle_type_gem_flink_name:
2283f012e29Smrg		r = amdgpu_bo_export_flink(bo);
2293f012e29Smrg		if (r)
2303f012e29Smrg			return r;
2313f012e29Smrg
2323f012e29Smrg		*shared_handle = bo->flink_name;
2333f012e29Smrg		return 0;
2343f012e29Smrg
2353f012e29Smrg	case amdgpu_bo_handle_type_kms:
2367cdc0497Smrg	case amdgpu_bo_handle_type_kms_noimport:
2373f012e29Smrg		*shared_handle = bo->handle;
2383f012e29Smrg		return 0;
2393f012e29Smrg
2403f012e29Smrg	case amdgpu_bo_handle_type_dma_buf_fd:
2417cdc0497Smrg		return drmPrimeHandleToFD(bo->dev->fd, bo->handle,
2427cdc0497Smrg					  DRM_CLOEXEC | DRM_RDWR,
2437cdc0497Smrg					  (int*)shared_handle);
2443f012e29Smrg	}
2453f012e29Smrg	return -EINVAL;
2463f012e29Smrg}
2473f012e29Smrg
2487cdc0497Smrgdrm_public int amdgpu_bo_import(amdgpu_device_handle dev,
2497cdc0497Smrg				enum amdgpu_bo_handle_type type,
2507cdc0497Smrg				uint32_t shared_handle,
2513f012e29Smrg		     struct amdgpu_bo_import_result *output)
2523f012e29Smrg{
2533f012e29Smrg	struct drm_gem_open open_arg = {};
2543f012e29Smrg	struct amdgpu_bo *bo = NULL;
2557cdc0497Smrg	uint32_t handle = 0, flink_name = 0;
2567cdc0497Smrg	uint64_t alloc_size = 0;
2577cdc0497Smrg	int r = 0;
2583f012e29Smrg	int dma_fd;
2593f012e29Smrg	uint64_t dma_buf_size = 0;
2603f012e29Smrg
2613f012e29Smrg	/* We must maintain a list of pairs <handle, bo>, so that we always
2623f012e29Smrg	 * return the same amdgpu_bo instance for the same handle. */
2633f012e29Smrg	pthread_mutex_lock(&dev->bo_table_mutex);
2643f012e29Smrg
2653f012e29Smrg	/* Convert a DMA buf handle to a KMS handle now. */
2663f012e29Smrg	if (type == amdgpu_bo_handle_type_dma_buf_fd) {
2673f012e29Smrg		off_t size;
2683f012e29Smrg
2693f012e29Smrg		/* Get a KMS handle. */
2703f012e29Smrg		r = drmPrimeFDToHandle(dev->fd, shared_handle, &handle);
2717cdc0497Smrg		if (r)
2727cdc0497Smrg			goto unlock;
2733f012e29Smrg
2743f012e29Smrg		/* Query the buffer size. */
2753f012e29Smrg		size = lseek(shared_handle, 0, SEEK_END);
2763f012e29Smrg		if (size == (off_t)-1) {
2777cdc0497Smrg			r = -errno;
2787cdc0497Smrg			goto free_bo_handle;
2793f012e29Smrg		}
2803f012e29Smrg		lseek(shared_handle, 0, SEEK_SET);
2813f012e29Smrg
2823f012e29Smrg		dma_buf_size = size;
2833f012e29Smrg		shared_handle = handle;
2843f012e29Smrg	}
2853f012e29Smrg
2863f012e29Smrg	/* If we have already created a buffer with this handle, find it. */
2873f012e29Smrg	switch (type) {
2883f012e29Smrg	case amdgpu_bo_handle_type_gem_flink_name:
2897cdc0497Smrg		bo = handle_table_lookup(&dev->bo_flink_names, shared_handle);
2903f012e29Smrg		break;
2913f012e29Smrg
2923f012e29Smrg	case amdgpu_bo_handle_type_dma_buf_fd:
2937cdc0497Smrg		bo = handle_table_lookup(&dev->bo_handles, shared_handle);
2943f012e29Smrg		break;
2953f012e29Smrg
2963f012e29Smrg	case amdgpu_bo_handle_type_kms:
2977cdc0497Smrg	case amdgpu_bo_handle_type_kms_noimport:
2983f012e29Smrg		/* Importing a KMS handle in not allowed. */
2997cdc0497Smrg		r = -EPERM;
3007cdc0497Smrg		goto unlock;
3013f012e29Smrg
3023f012e29Smrg	default:
3037cdc0497Smrg		r = -EINVAL;
3047cdc0497Smrg		goto unlock;
3053f012e29Smrg	}
3063f012e29Smrg
3073f012e29Smrg	if (bo) {
3083f012e29Smrg		/* The buffer already exists, just bump the refcount. */
3093f012e29Smrg		atomic_inc(&bo->refcount);
310d8807b2fSmrg		pthread_mutex_unlock(&dev->bo_table_mutex);
3113f012e29Smrg
3123f012e29Smrg		output->buf_handle = bo;
3133f012e29Smrg		output->alloc_size = bo->alloc_size;
3143f012e29Smrg		return 0;
3153f012e29Smrg	}
3163f012e29Smrg
3173f012e29Smrg	/* Open the handle. */
3183f012e29Smrg	switch (type) {
3193f012e29Smrg	case amdgpu_bo_handle_type_gem_flink_name:
3203f012e29Smrg		open_arg.name = shared_handle;
3213f012e29Smrg		r = drmIoctl(dev->flink_fd, DRM_IOCTL_GEM_OPEN, &open_arg);
3227cdc0497Smrg		if (r)
3237cdc0497Smrg			goto unlock;
3243f012e29Smrg
3257cdc0497Smrg		flink_name = shared_handle;
3267cdc0497Smrg		handle = open_arg.handle;
3277cdc0497Smrg		alloc_size = open_arg.size;
3283f012e29Smrg		if (dev->flink_fd != dev->fd) {
3297cdc0497Smrg			r = drmPrimeHandleToFD(dev->flink_fd, handle,
3307cdc0497Smrg					       DRM_CLOEXEC, &dma_fd);
3317cdc0497Smrg			if (r)
3327cdc0497Smrg				goto free_bo_handle;
3337cdc0497Smrg			r = drmPrimeFDToHandle(dev->fd, dma_fd, &handle);
3343f012e29Smrg			close(dma_fd);
3357cdc0497Smrg			if (r)
3367cdc0497Smrg				goto free_bo_handle;
337adfa0b0cSmrg			r = drmCloseBufferHandle(dev->flink_fd,
338adfa0b0cSmrg						 open_arg.handle);
3397cdc0497Smrg			if (r)
3407cdc0497Smrg				goto free_bo_handle;
3413f012e29Smrg		}
342bf6cc7dcSmrg		open_arg.handle = 0;
3433f012e29Smrg		break;
3443f012e29Smrg
3453f012e29Smrg	case amdgpu_bo_handle_type_dma_buf_fd:
3467cdc0497Smrg		handle = shared_handle;
3477cdc0497Smrg		alloc_size = dma_buf_size;
3483f012e29Smrg		break;
3493f012e29Smrg
3503f012e29Smrg	case amdgpu_bo_handle_type_kms:
3517cdc0497Smrg	case amdgpu_bo_handle_type_kms_noimport:
3523f012e29Smrg		assert(0); /* unreachable */
3533f012e29Smrg	}
3543f012e29Smrg
3553f012e29Smrg	/* Initialize it. */
3567cdc0497Smrg	r = amdgpu_bo_create(dev, alloc_size, handle, &bo);
3577cdc0497Smrg	if (r)
3587cdc0497Smrg		goto free_bo_handle;
3593f012e29Smrg
3607cdc0497Smrg	if (flink_name) {
3617cdc0497Smrg		bo->flink_name = flink_name;
3627cdc0497Smrg		r = handle_table_insert(&dev->bo_flink_names, flink_name,
3637cdc0497Smrg					bo);
3647cdc0497Smrg		if (r)
365bf6cc7dcSmrg			goto free_bo_handle;
3667cdc0497Smrg
3677cdc0497Smrg	}
3683f012e29Smrg
3693f012e29Smrg	output->buf_handle = bo;
3703f012e29Smrg	output->alloc_size = bo->alloc_size;
3717cdc0497Smrg	pthread_mutex_unlock(&dev->bo_table_mutex);
3723f012e29Smrg	return 0;
3737cdc0497Smrg
3747cdc0497Smrgfree_bo_handle:
375bf6cc7dcSmrg	if (flink_name && open_arg.handle)
376adfa0b0cSmrg		drmCloseBufferHandle(dev->flink_fd, open_arg.handle);
377bf6cc7dcSmrg
3787cdc0497Smrg	if (bo)
3797cdc0497Smrg		amdgpu_bo_free(bo);
3807cdc0497Smrg	else
381adfa0b0cSmrg		drmCloseBufferHandle(dev->fd, handle);
3827cdc0497Smrgunlock:
3837cdc0497Smrg	pthread_mutex_unlock(&dev->bo_table_mutex);
3847cdc0497Smrg	return r;
3853f012e29Smrg}
3863f012e29Smrg
3877cdc0497Smrgdrm_public int amdgpu_bo_free(amdgpu_bo_handle buf_handle)
3883f012e29Smrg{
389d8807b2fSmrg	struct amdgpu_device *dev;
390d8807b2fSmrg	struct amdgpu_bo *bo = buf_handle;
391d8807b2fSmrg
392d8807b2fSmrg	assert(bo != NULL);
393d8807b2fSmrg	dev = bo->dev;
394d8807b2fSmrg	pthread_mutex_lock(&dev->bo_table_mutex);
395d8807b2fSmrg
396d8807b2fSmrg	if (update_references(&bo->refcount, NULL)) {
397d8807b2fSmrg		/* Remove the buffer from the hash tables. */
3987cdc0497Smrg		handle_table_remove(&dev->bo_handles, bo->handle);
399d8807b2fSmrg
4007cdc0497Smrg		if (bo->flink_name)
4017cdc0497Smrg			handle_table_remove(&dev->bo_flink_names,
4027cdc0497Smrg					    bo->flink_name);
403d8807b2fSmrg
404d8807b2fSmrg		/* Release CPU access. */
405d8807b2fSmrg		if (bo->cpu_map_count > 0) {
406d8807b2fSmrg			bo->cpu_map_count = 1;
407d8807b2fSmrg			amdgpu_bo_cpu_unmap(bo);
408d8807b2fSmrg		}
409d8807b2fSmrg
410adfa0b0cSmrg		drmCloseBufferHandle(dev->fd, bo->handle);
411d8807b2fSmrg		pthread_mutex_destroy(&bo->cpu_access_mutex);
412d8807b2fSmrg		free(bo);
413d8807b2fSmrg	}
414d8807b2fSmrg
415d8807b2fSmrg	pthread_mutex_unlock(&dev->bo_table_mutex);
416bf6cc7dcSmrg
4173f012e29Smrg	return 0;
4183f012e29Smrg}
4193f012e29Smrg
4207cdc0497Smrgdrm_public void amdgpu_bo_inc_ref(amdgpu_bo_handle bo)
4217cdc0497Smrg{
4227cdc0497Smrg	atomic_inc(&bo->refcount);
4237cdc0497Smrg}
4247cdc0497Smrg
4257cdc0497Smrgdrm_public int amdgpu_bo_cpu_map(amdgpu_bo_handle bo, void **cpu)
4263f012e29Smrg{
4273f012e29Smrg	union drm_amdgpu_gem_mmap args;
4283f012e29Smrg	void *ptr;
4293f012e29Smrg	int r;
4303f012e29Smrg
4313f012e29Smrg	pthread_mutex_lock(&bo->cpu_access_mutex);
4323f012e29Smrg
4333f012e29Smrg	if (bo->cpu_ptr) {
4343f012e29Smrg		/* already mapped */
4353f012e29Smrg		assert(bo->cpu_map_count > 0);
4363f012e29Smrg		bo->cpu_map_count++;
4373f012e29Smrg		*cpu = bo->cpu_ptr;
4383f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4393f012e29Smrg		return 0;
4403f012e29Smrg	}
4413f012e29Smrg
4423f012e29Smrg	assert(bo->cpu_map_count == 0);
4433f012e29Smrg
4443f012e29Smrg	memset(&args, 0, sizeof(args));
4453f012e29Smrg
4463f012e29Smrg	/* Query the buffer address (args.addr_ptr).
4473f012e29Smrg	 * The kernel driver ignores the offset and size parameters. */
4483f012e29Smrg	args.in.handle = bo->handle;
4493f012e29Smrg
4503f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_MMAP, &args,
4513f012e29Smrg				sizeof(args));
4523f012e29Smrg	if (r) {
4533f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4543f012e29Smrg		return r;
4553f012e29Smrg	}
4563f012e29Smrg
4573f012e29Smrg	/* Map the buffer. */
4583f012e29Smrg	ptr = drm_mmap(NULL, bo->alloc_size, PROT_READ | PROT_WRITE, MAP_SHARED,
4593f012e29Smrg		       bo->dev->fd, args.out.addr_ptr);
4603f012e29Smrg	if (ptr == MAP_FAILED) {
4613f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4623f012e29Smrg		return -errno;
4633f012e29Smrg	}
4643f012e29Smrg
4653f012e29Smrg	bo->cpu_ptr = ptr;
4663f012e29Smrg	bo->cpu_map_count = 1;
4673f012e29Smrg	pthread_mutex_unlock(&bo->cpu_access_mutex);
4683f012e29Smrg
4693f012e29Smrg	*cpu = ptr;
4703f012e29Smrg	return 0;
4713f012e29Smrg}
4723f012e29Smrg
4737cdc0497Smrgdrm_public int amdgpu_bo_cpu_unmap(amdgpu_bo_handle bo)
4743f012e29Smrg{
4753f012e29Smrg	int r;
4763f012e29Smrg
4773f012e29Smrg	pthread_mutex_lock(&bo->cpu_access_mutex);
4783f012e29Smrg	assert(bo->cpu_map_count >= 0);
4793f012e29Smrg
4803f012e29Smrg	if (bo->cpu_map_count == 0) {
4813f012e29Smrg		/* not mapped */
4823f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4833f012e29Smrg		return -EINVAL;
4843f012e29Smrg	}
4853f012e29Smrg
4863f012e29Smrg	bo->cpu_map_count--;
4873f012e29Smrg	if (bo->cpu_map_count > 0) {
4883f012e29Smrg		/* mapped multiple times */
4893f012e29Smrg		pthread_mutex_unlock(&bo->cpu_access_mutex);
4903f012e29Smrg		return 0;
4913f012e29Smrg	}
4923f012e29Smrg
4933f012e29Smrg	r = drm_munmap(bo->cpu_ptr, bo->alloc_size) == 0 ? 0 : -errno;
4943f012e29Smrg	bo->cpu_ptr = NULL;
4953f012e29Smrg	pthread_mutex_unlock(&bo->cpu_access_mutex);
4963f012e29Smrg	return r;
4973f012e29Smrg}
4983f012e29Smrg
4997cdc0497Smrgdrm_public int amdgpu_query_buffer_size_alignment(amdgpu_device_handle dev,
5003f012e29Smrg				struct amdgpu_buffer_size_alignments *info)
5013f012e29Smrg{
5023f012e29Smrg	info->size_local = dev->dev_info.pte_fragment_size;
5033f012e29Smrg	info->size_remote = dev->dev_info.gart_page_size;
5043f012e29Smrg	return 0;
5053f012e29Smrg}
5063f012e29Smrg
5077cdc0497Smrgdrm_public int amdgpu_bo_wait_for_idle(amdgpu_bo_handle bo,
5087cdc0497Smrg				       uint64_t timeout_ns,
5093f012e29Smrg			    bool *busy)
5103f012e29Smrg{
5113f012e29Smrg	union drm_amdgpu_gem_wait_idle args;
5123f012e29Smrg	int r;
5133f012e29Smrg
5143f012e29Smrg	memset(&args, 0, sizeof(args));
5153f012e29Smrg	args.in.handle = bo->handle;
5163f012e29Smrg	args.in.timeout = amdgpu_cs_calculate_timeout(timeout_ns);
5173f012e29Smrg
5183f012e29Smrg	r = drmCommandWriteRead(bo->dev->fd, DRM_AMDGPU_GEM_WAIT_IDLE,
5193f012e29Smrg				&args, sizeof(args));
5203f012e29Smrg
5213f012e29Smrg	if (r == 0) {
5223f012e29Smrg		*busy = args.out.status;
5233f012e29Smrg		return 0;
5243f012e29Smrg	} else {
5253f012e29Smrg		fprintf(stderr, "amdgpu: GEM_WAIT_IDLE failed with %i\n", r);
5263f012e29Smrg		return r;
5273f012e29Smrg	}
5283f012e29Smrg}
5293f012e29Smrg
5307cdc0497Smrgdrm_public int amdgpu_find_bo_by_cpu_mapping(amdgpu_device_handle dev,
5317cdc0497Smrg					     void *cpu,
5327cdc0497Smrg					     uint64_t size,
5337cdc0497Smrg					     amdgpu_bo_handle *buf_handle,
5347cdc0497Smrg					     uint64_t *offset_in_bo)
5353f012e29Smrg{
5363b115362Smrg	struct amdgpu_bo *bo = NULL;
5377cdc0497Smrg	uint32_t i;
5387cdc0497Smrg	int r = 0;
5397cdc0497Smrg
5407cdc0497Smrg	if (cpu == NULL || size == 0)
5417cdc0497Smrg		return -EINVAL;
5427cdc0497Smrg
5437cdc0497Smrg	/*
5447cdc0497Smrg	 * Workaround for a buggy application which tries to import previously
5457cdc0497Smrg	 * exposed CPU pointers. If we find a real world use case we should
5467cdc0497Smrg	 * improve that by asking the kernel for the right handle.
5477cdc0497Smrg	 */
5487cdc0497Smrg	pthread_mutex_lock(&dev->bo_table_mutex);
5497cdc0497Smrg	for (i = 0; i < dev->bo_handles.max_key; i++) {
5507cdc0497Smrg		bo = handle_table_lookup(&dev->bo_handles, i);
5517cdc0497Smrg		if (!bo || !bo->cpu_ptr || size > bo->alloc_size)
5527cdc0497Smrg			continue;
5537cdc0497Smrg		if (cpu >= bo->cpu_ptr &&
55448246ce7Smrg		    cpu < (void*)((uintptr_t)bo->cpu_ptr + (size_t)bo->alloc_size))
5557cdc0497Smrg			break;
5567cdc0497Smrg	}
5577cdc0497Smrg
5587cdc0497Smrg	if (i < dev->bo_handles.max_key) {
5597cdc0497Smrg		atomic_inc(&bo->refcount);
5607cdc0497Smrg		*buf_handle = bo;
5617cdc0497Smrg		*offset_in_bo = (uintptr_t)cpu - (uintptr_t)bo->cpu_ptr;
5627cdc0497Smrg	} else {
5637cdc0497Smrg		*buf_handle = NULL;
5647cdc0497Smrg		*offset_in_bo = 0;
5657cdc0497Smrg		r = -ENXIO;
5667cdc0497Smrg	}
5677cdc0497Smrg	pthread_mutex_unlock(&dev->bo_table_mutex);
5687cdc0497Smrg
5697cdc0497Smrg	return r;
5707cdc0497Smrg}
5717cdc0497Smrg
5727cdc0497Smrgdrm_public int amdgpu_create_bo_from_user_mem(amdgpu_device_handle dev,
5737cdc0497Smrg					      void *cpu,
5747cdc0497Smrg					      uint64_t size,
5757cdc0497Smrg					      amdgpu_bo_handle *buf_handle)
5767cdc0497Smrg{
5777cdc0497Smrg	int r;
5783f012e29Smrg	struct drm_amdgpu_gem_userptr args;
5793f012e29Smrg
5803f012e29Smrg	args.addr = (uintptr_t)cpu;
5813f012e29Smrg	args.flags = AMDGPU_GEM_USERPTR_ANONONLY | AMDGPU_GEM_USERPTR_REGISTER |
5823f012e29Smrg		AMDGPU_GEM_USERPTR_VALIDATE;
5833f012e29Smrg	args.size = size;
5843f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_GEM_USERPTR,
5853f012e29Smrg				&args, sizeof(args));
5863f012e29Smrg	if (r)
5877cdc0497Smrg		goto out;
5883f012e29Smrg
589bf6cc7dcSmrg	pthread_mutex_lock(&dev->bo_table_mutex);
5907cdc0497Smrg	r = amdgpu_bo_create(dev, size, args.handle, buf_handle);
591bf6cc7dcSmrg	pthread_mutex_unlock(&dev->bo_table_mutex);
5927cdc0497Smrg	if (r) {
593adfa0b0cSmrg		drmCloseBufferHandle(dev->fd, args.handle);
5947cdc0497Smrg	}
5953f012e29Smrg
5967cdc0497Smrgout:
5973f012e29Smrg	return r;
5983f012e29Smrg}
5993f012e29Smrg
6004545e80cSmrgdrm_public int amdgpu_bo_list_create_raw(amdgpu_device_handle dev,
6014545e80cSmrg					 uint32_t number_of_buffers,
6024545e80cSmrg					 struct drm_amdgpu_bo_list_entry *buffers,
6034545e80cSmrg					 uint32_t *result)
6044545e80cSmrg{
6054545e80cSmrg	union drm_amdgpu_bo_list args;
6064545e80cSmrg	int r;
6074545e80cSmrg
6084545e80cSmrg	memset(&args, 0, sizeof(args));
6094545e80cSmrg	args.in.operation = AMDGPU_BO_LIST_OP_CREATE;
6104545e80cSmrg	args.in.bo_number = number_of_buffers;
6114545e80cSmrg	args.in.bo_info_size = sizeof(struct drm_amdgpu_bo_list_entry);
6124545e80cSmrg	args.in.bo_info_ptr = (uint64_t)(uintptr_t)buffers;
6134545e80cSmrg
6144545e80cSmrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_BO_LIST,
6154545e80cSmrg				&args, sizeof(args));
6164545e80cSmrg	if (!r)
6174545e80cSmrg		*result = args.out.list_handle;
6184545e80cSmrg	return r;
6194545e80cSmrg}
6204545e80cSmrg
6214545e80cSmrgdrm_public int amdgpu_bo_list_destroy_raw(amdgpu_device_handle dev,
6224545e80cSmrg					  uint32_t bo_list)
6234545e80cSmrg{
6244545e80cSmrg	union drm_amdgpu_bo_list args;
6254545e80cSmrg
6264545e80cSmrg	memset(&args, 0, sizeof(args));
6274545e80cSmrg	args.in.operation = AMDGPU_BO_LIST_OP_DESTROY;
6284545e80cSmrg	args.in.list_handle = bo_list;
6294545e80cSmrg
6304545e80cSmrg	return drmCommandWriteRead(dev->fd, DRM_AMDGPU_BO_LIST,
6314545e80cSmrg				   &args, sizeof(args));
6324545e80cSmrg}
6334545e80cSmrg
6347cdc0497Smrgdrm_public int amdgpu_bo_list_create(amdgpu_device_handle dev,
6357cdc0497Smrg				     uint32_t number_of_resources,
6367cdc0497Smrg				     amdgpu_bo_handle *resources,
6377cdc0497Smrg				     uint8_t *resource_prios,
6387cdc0497Smrg				     amdgpu_bo_list_handle *result)
6393f012e29Smrg{
6403f012e29Smrg	struct drm_amdgpu_bo_list_entry *list;
6413f012e29Smrg	union drm_amdgpu_bo_list args;
6423f012e29Smrg	unsigned i;
6433f012e29Smrg	int r;
6443f012e29Smrg
6453f012e29Smrg	if (!number_of_resources)
6463f012e29Smrg		return -EINVAL;
6473f012e29Smrg
6483f012e29Smrg	/* overflow check for multiplication */
6493f012e29Smrg	if (number_of_resources > UINT32_MAX / sizeof(struct drm_amdgpu_bo_list_entry))
6503f012e29Smrg		return -EINVAL;
6513f012e29Smrg
6523f012e29Smrg	list = malloc(number_of_resources * sizeof(struct drm_amdgpu_bo_list_entry));
6533f012e29Smrg	if (!list)
6543f012e29Smrg		return -ENOMEM;
6553f012e29Smrg
6563f012e29Smrg	*result = malloc(sizeof(struct amdgpu_bo_list));
6573f012e29Smrg	if (!*result) {
6583f012e29Smrg		free(list);
6593f012e29Smrg		return -ENOMEM;
6603f012e29Smrg	}
6613f012e29Smrg
6623f012e29Smrg	memset(&args, 0, sizeof(args));
6633f012e29Smrg	args.in.operation = AMDGPU_BO_LIST_OP_CREATE;
6643f012e29Smrg	args.in.bo_number = number_of_resources;
6653f012e29Smrg	args.in.bo_info_size = sizeof(struct drm_amdgpu_bo_list_entry);
6663f012e29Smrg	args.in.bo_info_ptr = (uint64_t)(uintptr_t)list;
6673f012e29Smrg
6683f012e29Smrg	for (i = 0; i < number_of_resources; i++) {
6693f012e29Smrg		list[i].bo_handle = resources[i]->handle;
6703f012e29Smrg		if (resource_prios)
6713f012e29Smrg			list[i].bo_priority = resource_prios[i];
6723f012e29Smrg		else
6733f012e29Smrg			list[i].bo_priority = 0;
6743f012e29Smrg	}
6753f012e29Smrg
6763f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_BO_LIST,
6773f012e29Smrg				&args, sizeof(args));
6783f012e29Smrg	free(list);
6793f012e29Smrg	if (r) {
6803f012e29Smrg		free(*result);
6813f012e29Smrg		return r;
6823f012e29Smrg	}
6833f012e29Smrg
6843f012e29Smrg	(*result)->dev = dev;
6853f012e29Smrg	(*result)->handle = args.out.list_handle;
6863f012e29Smrg	return 0;
6873f012e29Smrg}
6883f012e29Smrg
6897cdc0497Smrgdrm_public int amdgpu_bo_list_destroy(amdgpu_bo_list_handle list)
6903f012e29Smrg{
6913f012e29Smrg	union drm_amdgpu_bo_list args;
6923f012e29Smrg	int r;
6933f012e29Smrg
6943f012e29Smrg	memset(&args, 0, sizeof(args));
6953f012e29Smrg	args.in.operation = AMDGPU_BO_LIST_OP_DESTROY;
6963f012e29Smrg	args.in.list_handle = list->handle;
6973f012e29Smrg
6983f012e29Smrg	r = drmCommandWriteRead(list->dev->fd, DRM_AMDGPU_BO_LIST,
6993f012e29Smrg				&args, sizeof(args));
7003f012e29Smrg
7013f012e29Smrg	if (!r)
7023f012e29Smrg		free(list);
7033f012e29Smrg
7043f012e29Smrg	return r;
7053f012e29Smrg}
7063f012e29Smrg
7077cdc0497Smrgdrm_public int amdgpu_bo_list_update(amdgpu_bo_list_handle handle,
7087cdc0497Smrg				     uint32_t number_of_resources,
7097cdc0497Smrg				     amdgpu_bo_handle *resources,
7107cdc0497Smrg				     uint8_t *resource_prios)
7113f012e29Smrg{
7123f012e29Smrg	struct drm_amdgpu_bo_list_entry *list;
7133f012e29Smrg	union drm_amdgpu_bo_list args;
7143f012e29Smrg	unsigned i;
7153f012e29Smrg	int r;
7163f012e29Smrg
7173f012e29Smrg	if (!number_of_resources)
7183f012e29Smrg		return -EINVAL;
7193f012e29Smrg
7203f012e29Smrg	/* overflow check for multiplication */
7213f012e29Smrg	if (number_of_resources > UINT32_MAX / sizeof(struct drm_amdgpu_bo_list_entry))
7223f012e29Smrg		return -EINVAL;
7233f012e29Smrg
7243f012e29Smrg	list = malloc(number_of_resources * sizeof(struct drm_amdgpu_bo_list_entry));
725d8807b2fSmrg	if (!list)
7263f012e29Smrg		return -ENOMEM;
7273f012e29Smrg
7283f012e29Smrg	args.in.operation = AMDGPU_BO_LIST_OP_UPDATE;
7293f012e29Smrg	args.in.list_handle = handle->handle;
7303f012e29Smrg	args.in.bo_number = number_of_resources;
7313f012e29Smrg	args.in.bo_info_size = sizeof(struct drm_amdgpu_bo_list_entry);
7323f012e29Smrg	args.in.bo_info_ptr = (uintptr_t)list;
7333f012e29Smrg
7343f012e29Smrg	for (i = 0; i < number_of_resources; i++) {
7353f012e29Smrg		list[i].bo_handle = resources[i]->handle;
7363f012e29Smrg		if (resource_prios)
7373f012e29Smrg			list[i].bo_priority = resource_prios[i];
7383f012e29Smrg		else
7393f012e29Smrg			list[i].bo_priority = 0;
7403f012e29Smrg	}
7413f012e29Smrg
7423f012e29Smrg	r = drmCommandWriteRead(handle->dev->fd, DRM_AMDGPU_BO_LIST,
7433f012e29Smrg				&args, sizeof(args));
7443f012e29Smrg	free(list);
7453f012e29Smrg	return r;
7463f012e29Smrg}
7473f012e29Smrg
7487cdc0497Smrgdrm_public int amdgpu_bo_va_op(amdgpu_bo_handle bo,
7497cdc0497Smrg			       uint64_t offset,
7507cdc0497Smrg			       uint64_t size,
7517cdc0497Smrg			       uint64_t addr,
7527cdc0497Smrg			       uint64_t flags,
7537cdc0497Smrg			       uint32_t ops)
7543f012e29Smrg{
7553f012e29Smrg	amdgpu_device_handle dev = bo->dev;
756d8807b2fSmrg
757d8807b2fSmrg	size = ALIGN(size, getpagesize());
758d8807b2fSmrg
759d8807b2fSmrg	return amdgpu_bo_va_op_raw(dev, bo, offset, size, addr,
760d8807b2fSmrg				   AMDGPU_VM_PAGE_READABLE |
761d8807b2fSmrg				   AMDGPU_VM_PAGE_WRITEABLE |
762d8807b2fSmrg				   AMDGPU_VM_PAGE_EXECUTABLE, ops);
763d8807b2fSmrg}
764d8807b2fSmrg
7657cdc0497Smrgdrm_public int amdgpu_bo_va_op_raw(amdgpu_device_handle dev,
7667cdc0497Smrg				   amdgpu_bo_handle bo,
7677cdc0497Smrg				   uint64_t offset,
7687cdc0497Smrg				   uint64_t size,
7697cdc0497Smrg				   uint64_t addr,
7707cdc0497Smrg				   uint64_t flags,
7717cdc0497Smrg				   uint32_t ops)
772d8807b2fSmrg{
7733f012e29Smrg	struct drm_amdgpu_gem_va va;
7743f012e29Smrg	int r;
7753f012e29Smrg
776d8807b2fSmrg	if (ops != AMDGPU_VA_OP_MAP && ops != AMDGPU_VA_OP_UNMAP &&
777d8807b2fSmrg	    ops != AMDGPU_VA_OP_REPLACE && ops != AMDGPU_VA_OP_CLEAR)
7783f012e29Smrg		return -EINVAL;
7793f012e29Smrg
7803f012e29Smrg	memset(&va, 0, sizeof(va));
781d8807b2fSmrg	va.handle = bo ? bo->handle : 0;
7823f012e29Smrg	va.operation = ops;
783d8807b2fSmrg	va.flags = flags;
7843f012e29Smrg	va.va_address = addr;
7853f012e29Smrg	va.offset_in_bo = offset;
786d8807b2fSmrg	va.map_size = size;
7873f012e29Smrg
7883f012e29Smrg	r = drmCommandWriteRead(dev->fd, DRM_AMDGPU_GEM_VA, &va, sizeof(va));
7893f012e29Smrg
7903f012e29Smrg	return r;
7913f012e29Smrg}
792